diff --git a/src/embeddedllm/backend/onnxruntime_engine.py b/src/embeddedllm/backend/onnxruntime_engine.py index 7fcc15b..fbd3ff5 100644 --- a/src/embeddedllm/backend/onnxruntime_engine.py +++ b/src/embeddedllm/backend/onnxruntime_engine.py @@ -70,7 +70,7 @@ def __init__(self, model_path: str, vision: bool, device: str = "cpu"): logger.info("Attempt to load slower tokenizer") self.tokenizer = PreTrainedTokenizer.from_pretrained(self.model_path) - self.model = og.Model(model_path) + self.model = og.Model(self.model_path) logger.info("Model loaded") self.onnx_tokenizer = og.Tokenizer(self.model) self.onnx_tokenizer_stream = self.onnx_tokenizer.create_stream()