@@ -352,7 +352,7 @@ def hello_world_questions():
352352
353353
354354# this is the main script to be run
355- def bling_meets_llmware_hello_world (model_name , from_hf = False ):
355+ def bling_meets_llmware_hello_world (model_name ):
356356
357357 t0 = time .time ()
358358 test_list = hello_world_questions ()
@@ -361,7 +361,7 @@ def bling_meets_llmware_hello_world (model_name, from_hf=False):
361361 # Note: Some newer models use local custom code in their HF repos, which is not trusted by default.
362362 # For now, you can pass in a dummy api_key and we'll set the right config to trust that code.
363363 # This will likely change in the future.
364- prompter = Prompt ().load_model (model_name , from_hf = from_hf , api_key = "dummy_not_used_by_hf" )
364+ prompter = Prompt ().load_model (model_name )
365365
366366 t1 = time .time ()
367367 print (f"\n > Model { model_name } load time: { t1 - t0 } seconds" )
@@ -386,8 +386,9 @@ def bling_meets_llmware_hello_world (model_name, from_hf=False):
386386
387387if __name__ == "__main__" :
388388
389- # list of 8 available 'rag-instruct' bling models on HuggingFace
389+ # list of 'rag-instruct' laptop-ready bling models on HuggingFace
390390 model_list = ["llmware/bling-1b-0.1" ,
391+ "llmware/bling-tiny-llama-v0" ,
391392 "llmware/bling-1.4b-0.1" ,
392393 "llmware/bling-falcon-1b-0.1" ,
393394 "llmware/bling-cerebras-1.3b-0.1" ,
@@ -397,5 +398,6 @@ def bling_meets_llmware_hello_world (model_name, from_hf=False):
397398 "llmware/bling-stable-lm-3b-4e1t-v0"
398399 ]
399400
400- bling_meets_llmware_hello_world (model_list [0 ], from_hf = True )
401+ # try the newest bling model - 'tiny-llama'
402+ bling_meets_llmware_hello_world (model_list [1 ])
401403
0 commit comments