refactor: moved openai model metadata into a separate file, added `make update-models` to use gptme to update it

ErikBjare · ErikBjare · commit 11221dbc772c · 2024-09-18T16:53:41.000+02:00
diff --git a/Makefile b/Makefile
@@ -41,6 +41,12 @@ format:
 	poetry run pyupgrade --py310-plus --exit-zero-even-if-changed ${SRCFILES}
 	poetry run black ${SRCDIRS}
 
+# Ask gptme to refresh the model metadata from the closest Wayback Machine snapshot of OpenAI's pricing page.
+# curl -f and jq -e make the lookup fail (so gptme is never started) on an HTTP error or when no snapshot URL is returned.
+update-models:
+	wayback_url=$$(curl -fsSL "https://archive.org/wayback/available?url=openai.com/api/pricing/" | jq -er '.archived_snapshots.closest.url') && \
+		gptme 'update the model metadata from this page' gptme/models.py gptme/llm_openai_models.py "$${wayback_url}" --non-interactive
+
 precommit: format lint typecheck test
 
 docs/.clean: docs/conf.py
diff --git a/gptme/llm_openai.py b/gptme/llm_openai.py
@@ -4,6 +4,7 @@
 
 from .constants import TEMPERATURE, TOP_P
 from .message import Message, msgs2dicts
+from .models import ModelMeta
 
 if TYPE_CHECKING:
     from openai import OpenAI
diff --git a/gptme/llm_openai_models.py b/gptme/llm_openai_models.py
@@ -0,0 +1,169 @@
+"""OpenAI model metadata, used by gptme/models.py as MODELS["openai"].
+
+Refresh with "make update-models".
+"""
+
+from typing import TypedDict
+
+from typing_extensions import NotRequired
+
+
+class _ModelDictMeta(TypedDict):
+    """Metadata for a single model.
+
+    Same name as the TypedDict in gptme/models.py; importing it from there
+    would be circular, since that module imports this one.
+    """
+
+    # context window size (presumably in tokens)
+    context: int
+    # output limit, where known
+    max_output: NotRequired[int]
+    # prices; presumably USD per 1M tokens -- TODO confirm
+    price_input: NotRequired[float]
+    price_output: NotRequired[float]
+
+
+OPENAI_MODELS: dict[str, _ModelDictMeta] = {
+    # GPT-4o
+    "gpt-4o": {
+        "context": 128_000,
+        "price_input": 5,
+        "price_output": 15,
+    },
+    "gpt-4o-2024-08-06": {
+        "context": 128_000,
+        "price_input": 2.5,
+        "price_output": 10,
+    },
+    "gpt-4o-2024-05-13": {
+        "context": 128_000,
+        "price_input": 5,
+        "price_output": 15,
+    },
+    # GPT-4o mini
+    "gpt-4o-mini": {
+        "context": 128_000,
+        "price_input": 0.15,
+        "price_output": 0.6,
+    },
+    "gpt-4o-mini-2024-07-18": {
+        "context": 128_000,
+        "price_input": 0.15,
+        "price_output": 0.6,
+    },
+    # OpenAI o1-preview
+    "o1-preview": {
+        "context": 128_000,
+        "max_output": 32768,
+        "price_input": 15,
+        "price_output": 60,
+    },
+    "o1-preview-2024-09-12": {
+        "context": 128_000,
+        "max_output": 32768,
+        "price_input": 15,
+        "price_output": 60,
+    },
+    # OpenAI o1-mini
+    "o1-mini": {
+        "context": 128_000,
+        "max_output": 65536,
+        "price_input": 3,
+        "price_output": 12,
+    },
+    "o1-mini-2024-09-12": {
+        "context": 128_000,
+        "max_output": 65536,
+        "price_input": 3,
+        "price_output": 12,
+    },
+    # GPT-4 Turbo
+    "gpt-4-turbo": {
+        "context": 128_000,
+        "price_input": 10,
+        "price_output": 30,
+    },
+    "gpt-4-turbo-2024-04-09": {
+        "context": 128_000,
+        "price_input": 10,
+        "price_output": 30,
+    },
+    "gpt-4-0125-preview": {
+        "context": 128_000,
+        "price_input": 10,
+        "price_output": 30,
+    },
+    "gpt-4-1106-preview": {
+        "context": 128_000,
+        "price_input": 10,
+        "price_output": 30,
+    },
+    "gpt-4-vision-preview": {
+        "context": 128_000,
+        "price_input": 10,
+        "price_output": 30,
+    },
+    # GPT-4
+    "gpt-4": {
+        "context": 8192,
+        "price_input": 30,
+        "price_output": 60,
+    },
+    "gpt-4-32k": {
+        "context": 32768,
+        "price_input": 60,
+        "price_output": 120,
+    },
+    # GPT-3.5 Turbo
+    "gpt-3.5-turbo-0125": {
+        "context": 16385,
+        "price_input": 0.5,
+        "price_output": 1.5,
+    },
+    "gpt-3.5-turbo": {
+        "context": 16385,
+        "price_input": 0.5,
+        "price_output": 1.5,
+    },
+    "gpt-3.5-turbo-instruct": {
+        "context": 4096,
+        "price_input": 1.5,
+        "price_output": 2,
+    },
+    # Deprecated models (kept for reference)
+    "gpt-3.5-turbo-1106": {
+        "context": 16385,
+        "price_input": 1,
+        "price_output": 2,
+    },
+    "gpt-3.5-turbo-0613": {
+        "context": 4096,
+        "price_input": 1.5,
+        "price_output": 2,
+    },
+    "gpt-3.5-turbo-16k": {
+        "context": 16385,
+    },
+    "gpt-3.5-turbo-16k-0613": {
+        "context": 16385,
+        "price_input": 3,
+        "price_output": 4,
+    },
+    "gpt-3.5-turbo-0301": {
+        "context": 4096,
+        "price_input": 1.5,
+        "price_output": 2,
+    },
+    # Other models
+    "davinci-002": {
+        "context": 4096,  # Assuming default context size
+        "price_input": 2,
+        "price_output": 2,
+    },
+    "babbage-002": {
+        "context": 4096,  # Assuming default context size
+        "price_input": 0.4,
+        "price_output": 0.4,
+    },
+}
diff --git a/gptme/models.py b/gptme/models.py
@@ -4,6 +4,8 @@
 
 from typing_extensions import NotRequired
 
+from .llm_openai_models import OPENAI_MODELS
+
 logger = logging.getLogger(__name__)
 
 
@@ -38,71 +40,7 @@ class _ModelDictMeta(TypedDict):
 # known models metadata
 # TODO: can we get this from the API?
 MODELS: dict[str, dict[str, _ModelDictMeta]] = {
-    "openai": {
-        # gpt-3.5
-        "gpt-3.5-turbo": {
-            "context": 4097,
-            "price_input": 1,
-            "price_output": 2,
-        },
-        "gpt-3.5-turbo-16k": {
-            "context": 16385,
-        },
-        "gpt-3.5-turbo-1106": {
-            "context": 16385,
-        },
-        # gpt-4
-        "gpt-4": {
-            "context": 8193,
-            "price_input": 30,
-            "price_output": 60,
-        },
-        "gpt-4-32k": {
-            "context": 32769,
-            "price_input": 60,
-            "price_output": 120,
-        },
-        # gpt-4-turbo
-        # https://openai.com/blog/new-models-and-developer-products-announced-at-devday
-        "gpt-4-1106-preview": {
-            "context": 128_000,
-        },
-        "gpt-4-vision-preview": {
-            "context": 128_000,
-        },
-        "gpt-4-turbo": {
-            "context": 128_000,
-            "price_input": 10,
-            "price_output": 30,
-        },
-        "gpt-4o": {
-            "context": 128_000,
-            "price_input": 5,
-            "price_output": 15,
-        },
-        "gpt-4o-2024-08-06": {
-            "context": 128_000,
-            "price_input": 2.5,
-            "price_output": 10,
-        },
-        "gpt-4o-mini": {
-            "context": 128_000,
-            "price_input": 0.15,
-            "price_output": 0.6,
-        },
-        "o1-mini": {
-            "context": 128_000,
-            "max_output": 65536,
-            "price_input": 3,
-            "price_output": 12,
-        },
-        "o1-preview": {
-            "context": 128_000,
-            "max_output": 32768,
-            "price_input": 15,
-            "price_output": 60,
-        },
-    },
+    "openai": OPENAI_MODELS,
     "anthropic": {
         "claude-3-opus-20240229": {
             "context": 200_000,