Skip to content

Commit e9c443b

Browse files
committed
adding tiny-llama to the bling catalog
1 parent 470a894 commit e9c443b

File tree

2 files changed

+12
-4
lines changed

2 files changed

+12
-4
lines changed

examples/Models/bling_fast_start.py

Lines changed: 6 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -352,7 +352,7 @@ def hello_world_questions():
352352

353353

354354
# this is the main script to be run
355-
def bling_meets_llmware_hello_world (model_name, from_hf=False):
355+
def bling_meets_llmware_hello_world (model_name):
356356

357357
t0 = time.time()
358358
test_list = hello_world_questions()
@@ -361,7 +361,7 @@ def bling_meets_llmware_hello_world (model_name, from_hf=False):
361361
# Note: Some newer models use local custom code in their HF repos which is not trusted by default
362362
# For now, you can pass in a dummy api_key and we'll set the right config to trust that code
363363
# This will likely be changing in the future
364-
prompter = Prompt().load_model(model_name, from_hf=from_hf, api_key="dummy_not_used_by_hf")
364+
prompter = Prompt().load_model(model_name)
365365

366366
t1 = time.time()
367367
print(f"\n > Model {model_name} load time: {t1-t0} seconds")
@@ -386,8 +386,9 @@ def bling_meets_llmware_hello_world (model_name, from_hf=False):
386386

387387
if __name__ == "__main__":
388388

389-
# list of 8 available 'rag-instruct' bling models on HuggingFace
389+
# list of 'rag-instruct' laptop-ready bling models on HuggingFace
390390
model_list = ["llmware/bling-1b-0.1",
391+
"llmware/bling-tiny-llama-v0",
391392
"llmware/bling-1.4b-0.1",
392393
"llmware/bling-falcon-1b-0.1",
393394
"llmware/bling-cerebras-1.3b-0.1",
@@ -397,5 +398,6 @@ def bling_meets_llmware_hello_world (model_name, from_hf=False):
397398
"llmware/bling-stable-lm-3b-4e1t-v0"
398399
]
399400

400-
bling_meets_llmware_hello_world(model_list[0], from_hf=True)
401+
# try the newest bling model - 'tiny-llama'
402+
bling_meets_llmware_hello_world(model_list[1])
401403

llmware/models.py

Lines changed: 6 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -239,6 +239,12 @@
239239
"temperature": 0.3, "trailing_space": "", "link": "https://huggingface.co/llmware/bling-cerebras-1.3b-0.1",
240240
"custom_model_files": [], "custom_model_repo": ""},
241241

242+
{"model_name": "llmware/bling-tiny-llama-v0", "display_name": "Bling-Tiny-Llama-v0",
243+
"model_family": "HFGenerativeModel", "model_category": "generative_local", "model_location": "hf_repo",
244+
"context_window": 2048, "instruction_following": False, "prompt_wrapper": "human_bot",
245+
"temperature": 0.3, "trailing_space": "", "link": "https://huggingface.co/llmware/bling-tiny-llama-v0",
246+
"custom_model_files": [], "custom_model_repo": ""},
247+
242248
# create dragon models
243249
{"model_name": "llmware/dragon-yi-6b-v0", "display_name": "Dragon-Yi-6B",
244250
"model_family": "HFGenerativeModel", "model_category": "generative_local", "model_location": "hf_repo",

0 commit comments

Comments
 (0)