Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

feat(instructor): introduce ANTHROPIC_JSON mode #542

Merged
merged 9 commits into from
Mar 29, 2024
Merged
Show file tree
Hide file tree
Changes from 2 commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
4 changes: 2 additions & 2 deletions docs/blog/posts/anthropic.md
Original file line number Diff line number Diff line change
Expand Up @@ -9,7 +9,7 @@ authors:

A special shoutout to [Shreya](https://twitter.com/shreyaw_) for her contributions to the anthropic support. As of now, all features are operational with the exception of streaming support.

For those eager to experiment, simply patch the client with `ANTHROPIC_TOOLS`, which will enable you to leverage the `anthropic` client for making requests.
For those eager to experiment, simply patch the client with `ANTHROPIC_JSON`, which will enable you to leverage the `anthropic` client for making requests.

```
pip install instructor[anthropic]
Expand All @@ -28,7 +28,7 @@ import instructor
# Patching the Anthropics client with the instructor for enhanced capabilities
anthropic_client = instructor.patch(
create=anthropic.Anthropic().messages.create,
mode=instructor.Mode.ANTHROPIC_TOOLS
mode=instructor.Mode.ANTHROPIC_JSON
)

class Properties(BaseModel):
Expand Down
30 changes: 30 additions & 0 deletions docs/concepts/patching.md
Original file line number Diff line number Diff line change
Expand Up @@ -77,3 +77,33 @@ from openai import OpenAI

client = instructor.patch(OpenAI(), mode=instructor.Mode.MD_JSON)
```

## Anthropic JSON Mode

Anthropic JSON mode instructs the Anthropic client to return responses as JSON; enable it by setting the `mode` parameter to `instructor.Mode.ANTHROPIC_JSON` when patching the client.

```python
import instructor
from anthropic import Anthropic
from pydantic import BaseModel

create = instructor.patch(
    create=Anthropic().messages.create,
    mode=instructor.Mode.ANTHROPIC_JSON
)

class User(BaseModel):
    name: str
    age: int

resp = create(
model="claude-3-haiku-20240307",
max_tokens=1024,
messages=[
{
"role": "user",
"content": "Create a user",
}
],
response_model=User,
)
```
32 changes: 0 additions & 32 deletions examples/classification/test_run.py

This file was deleted.

8 changes: 7 additions & 1 deletion instructor/function_calls.py
Original file line number Diff line number Diff line change
Expand Up @@ -99,7 +99,13 @@ def from_response(
assert hasattr(completion, "content")
return xml_to_model(cls, extract_xml(completion.content[0].text)) # type:ignore

assert hasattr(completion, "choices")
if mode == Mode.ANTHROPIC_JSON:
assert hasattr(completion, "content")
text = completion.content[0].text # type: ignore
extra_text = extract_json_from_codeblock(text)
return cls.model_validate_json(extra_text)

assert hasattr(completion, "choices"), "No choices in completion"

if completion.choices[0].finish_reason == "length":
logger.error("Incomplete output detected, should increase max_tokens")
Expand Down
1 change: 1 addition & 0 deletions instructor/mode.py
Original file line number Diff line number Diff line change
Expand Up @@ -13,6 +13,7 @@ class Mode(enum.Enum):
MD_JSON = "markdown_json_mode"
JSON_SCHEMA = "json_schema_mode"
ANTHROPIC_TOOLS = "anthropic_tools"
ANTHROPIC_JSON = "anthropic_json"

def __new__(cls, value: str) -> "Mode":
member = object.__new__(cls)
Expand Down
32 changes: 30 additions & 2 deletions instructor/process_response.py
Original file line number Diff line number Diff line change
Expand Up @@ -11,7 +11,7 @@
from openai.types.chat import ChatCompletion
from pydantic import BaseModel


import json
import inspect
import logging
from typing import (
Expand Down Expand Up @@ -245,7 +245,7 @@ def handle_response_model(
As a genius expert, your task is to understand the content and provide
the parsed objects in json that match the following json_schema:\n

{response_model.model_json_schema()}
{json.dumps(response_model.model_json_schema(), indent=2)}

Make sure to return an instance of the JSON, not the schema itself
"""
Expand Down Expand Up @@ -305,6 +305,34 @@ def handle_response_model(
new_kwargs["system"] = f"{system_prompt}\n{new_kwargs['system']}"
else:
new_kwargs["system"] = system_prompt
elif mode == Mode.ANTHROPIC_JSON:
# Anthropic expects the system message to be a string, so we first extract any system messages
openai_system_messages = [
message["content"]
for message in new_kwargs.get("messages", [])
if message["role"] == "system"
]

new_kwargs["system"] = (
new_kwargs.get("system", "")
+ "\n\n"
+ "\n\n".join(openai_system_messages)
)

new_kwargs["system"] += f"""
You must only respond in JSON format that adheres to the following schema:

<JSON_SCHEMA>
{json.dumps(response_model.model_json_schema(), indent=2)}
</JSON_SCHEMA>
"""
new_kwargs["system"] = dedent(new_kwargs["system"])

new_kwargs["messages"] = [
message
for message in new_kwargs.get("messages", [])
if message["role"] != "system"
]
else:
raise ValueError(f"Invalid patch mode: {mode}")

Expand Down
67 changes: 0 additions & 67 deletions tests/anthropic/test_anthropic.py

This file was deleted.

82 changes: 77 additions & 5 deletions tests/anthropic/test_simple.py
Original file line number Diff line number Diff line change
@@ -1,10 +1,11 @@
import anthropic
import instructor
from pydantic import BaseModel
from typing import List
from typing import List, Literal
from enum import Enum

create = instructor.patch(
create=anthropic.Anthropic().messages.create, mode=instructor.Mode.ANTHROPIC_TOOLS
create=anthropic.Anthropic().messages.create, mode=instructor.Mode.ANTHROPIC_JSON
)


Expand Down Expand Up @@ -63,14 +64,14 @@ class User(BaseModel):
assert resp.address.street_name == "First Avenue"


def test_list():
def test_list_str():
class User(BaseModel):
name: str
age: int
family: List[str]

resp = create(
model="claude-3-opus-20240229", # Fails with claude-3-haiku-20240307
model="claude-3-haiku-20240307",
max_tokens=1024,
max_retries=0,
messages=[
Expand All @@ -88,6 +89,54 @@ class User(BaseModel):
assert isinstance(member, str)


def test_enum():
class Role(str, Enum):
ADMIN = "admin"
USER = "user"

class User(BaseModel):
name: str
role: Role

resp = create(
model="claude-3-haiku-20240307",
max_tokens=1024,
max_retries=0,
messages=[
{
"role": "user",
"content": "Create a user for a model with a name and role of admin.",
}
],
response_model=User,
) # type: ignore

assert isinstance(resp, User)
assert resp.role == Role.ADMIN


def test_literal():
class User(BaseModel):
name: str
role: Literal["admin", "user"]

resp = create(
model="claude-3-haiku-20240307",
max_tokens=1024,
max_retries=0,
messages=[
{
"role": "user",
"content": "Create a admin user for a model with a name and role.",
}
],
response_model=User,
) # type: ignore

assert isinstance(resp, User)
assert resp.role == "admin"


def test_nested_list():
class Properties(BaseModel):
key: str
Expand All @@ -99,7 +148,7 @@ class User(BaseModel):
properties: List[Properties]

resp = create(
model="claude-3-opus-20240229", # Fails with claude-3-haiku-20240307
model="claude-3-haiku-20240307",
max_tokens=1024,
max_retries=0,
messages=[
Expand All @@ -114,3 +163,26 @@ class User(BaseModel):
assert isinstance(resp, User)
for property in resp.properties:
assert isinstance(property, Properties)


def test_system_messages_allcaps():
class User(BaseModel):
name: str
age: int

resp = create(
model="claude-3-haiku-20240307",
max_tokens=1024,
max_retries=0,
messages=[
{"role": "system", "content": "EVERYTHING MUST BE IN ALL CAPS"},
{
"role": "user",
"content": "Create a user for a model with a name and age.",
},
],
response_model=User,
) # type: ignore

assert isinstance(resp, User)
assert resp.name.isupper()
Loading