fixed bug with token size
TORlN committed Nov 24, 2023
1 parent 586268f commit 94fd681
Showing 1 changed file with 10 additions and 7 deletions.
17 changes: 10 additions & 7 deletions aicodebot/lm.py
@@ -119,6 +119,7 @@ def get_ollama_model(
         return Ollama(
             model=model_name,
             # NOTE: num_ctx is similar, but not exactly the same as response_token_size
+            # num_ctx is the number of tokens in the context window, whereas response_token_size is the number of tokens in the response
             num_ctx=response_token_size,
             temperature=temperature,
             callbacks=callbacks,
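For orientation, here is a minimal sketch of the call this hunk touches, assuming the langchain Ollama wrapper the file appears to use; the model name and values are illustrative, not from the repo:

    from langchain_community.llms import Ollama  # older releases: langchain.llms

    # Illustrative values only. Note the mismatch the new comment describes:
    # num_ctx sizes the whole context window (prompt + completion), so passing
    # a response-sized budget here can silently shrink the usable prompt.
    llm = Ollama(
        model="codellama",
        num_ctx=2048,
        temperature=0.1,
    )
    print(llm.invoke("Write a haiku about tokens"))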
@@ -205,7 +206,15 @@ def get_model_token_limit(self, model_name):
 
     def get_token_size(self, text):
         """Get the number of tokens in a string using the tiktoken library."""
-        encoding = tiktoken.encoding_for_model(self.tiktoken_model_name)
+
+        try:
+            encoding = tiktoken.encoding_for_model(self.tiktoken_model_name)
+        except KeyError:
+            # NOTE: This falls back to a default token size for Ollama.
+            # tiktoken doesn't seem to support Ollama-based models.
+            # Local models will not work as intended without dynamically setting the token size.
+            # TODO: Dynamically set the token size for Ollama-based models.
+            return 2048
         tokens = encoding.encode(text)
         return len(tokens)
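For context on the fallback: tiktoken's encoding_for_model raises KeyError for model names it does not recognize, which is what happens for Ollama-served local models. A hedged alternative to returning a constant, not what this commit does, would be to approximate with a known encoding so the count still scales with the text:

    import tiktoken

    def approximate_token_size(text, model_name):
        """Count tokens, approximating with cl100k_base for unknown models."""
        try:
            encoding = tiktoken.encoding_for_model(model_name)
        except KeyError:
            # cl100k_base is the gpt-3.5/gpt-4 encoding; counts for local
            # models are only approximate, but unlike a hard-coded 2048 they
            # grow and shrink with the actual input.
            encoding = tiktoken.get_encoding("cl100k_base")
        return len(encoding.encode(text))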

@@ -301,12 +310,6 @@ def use_appropriate_sized_model(self, chain, token_size):
 
 def token_size(text):
     # Shortcut
-    # NOTE: This sets the token size to default value for Ollama.
-    # TikToken doesn't seem to support Ollama-based models.
-    # Local models will not work as intended without dynamically setting the token size.
-    # TODO: Dynamically set token size for Ollama-based models.
-    if LanguageModelManager.DEFAULT_PROVIDER == LanguageModelManager.OLLAMA:
-        return 2048
     return LanguageModelManager().get_token_size(text)
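With the provider shortcut removed, the module-level helper always delegates to the manager, so the Ollama fallback now lives in exactly one place (get_token_size). A hypothetical smoke test of that equivalence:

    # Both paths should agree for any configured provider, since token_size()
    # is now a thin wrapper around the manager method.
    lmm = LanguageModelManager()
    assert token_size("hello world") == lmm.get_token_size("hello world")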

