In [None]:
#|default_exp core

# Claudette's source

This is the 'literate' source code for Claudette. You can view the fully rendered version of the notebook [here](https://claudette.answer.ai/core.html), or you can clone the git repo and run the [interactive notebook](https://github.com/AnswerDotAI/claudette/blob/main/00_core.ipynb) in Jupyter. The notebook is converted to the [Python module claudette/core.py](https://github.com/AnswerDotAI/claudette/blob/main/claudette/core.py) using [nbdev](https://nbdev.fast.ai/). The goal of this source code is to both create the Python module, and also to teach the reader *how* it is created, without assuming much existing knowledge about Claude's API.

Most of the time you'll see that we write some source code *first*, and then a description or discussion of it *afterwards*.

## Setup

In [None]:
import os
# os.environ['ANTHROPIC_LOG'] = 'debug'

To print every HTTP request and response in full, uncomment the above line. This functionality is provided by Anthropic's SDK.

In [None]:
#| export
import inspect, typing, json
from collections import abc
try: from IPython import display
except: display=None
from typing import get_type_hints
from functools import wraps

from anthropic import Anthropic, AnthropicBedrock, AnthropicVertex
from anthropic.types import (Usage, TextBlock, ServerToolUseBlock,
                             WebSearchToolResultBlock, Message, ToolUseBlock,
                             ThinkingBlock, ServerToolUsage)
from anthropic.resources import messages

import toolslm
from toolslm.funccall import *

from fastcore.meta import delegates
from fastcore.utils import *
from msglm import mk_msg_anthropic as mk_msg, mk_msgs_anthropic as mk_msgs

In [None]:
#| hide
from nbdev import show_doc

# Used to show available models from the anthropic SDK
from anthropic.types import Model
from claudette.text_editor import *
from typing import get_args
from datetime import datetime
from pprint import pprint

import warnings

warnings.filterwarnings("ignore", message="Pydantic serializer warnings")

In [None]:
#| export
_all_ = ['mk_msg', 'mk_msgs']

In [None]:
#| export
empty = inspect.Parameter.empty

:::{.callout-tip}

If you're reading the rendered version of this notebook, you'll see an "Exported source" collapsible widget below. If you're reading the source notebook directly, you'll see `#| exports` at the top of the cell. These show that this piece of code will be exported into the python module that this notebook creates. No other code will be included -- any other code in this notebook is just for demonstration, documentation, and testing.

You can toggle expanding/collapsing the source code of all exported sections by using the `</> Code` menu in the top right of the rendered notebook page.

:::

In [None]:
#| exports

# Maps every supported model id to a short "model type" name.
# `Client.cost` and `get_costs` use that name as the key into `pricing`.
model_types = {
    # Anthropic
    'claude-opus-4-20250514': 'opus',
    'claude-sonnet-4-20250514': 'sonnet',
    'claude-3-opus-20240229': 'opus-3',
    'claude-3-7-sonnet-20250219': 'sonnet-3-7',
    'claude-3-5-sonnet-20241022': 'sonnet-3-5',
    'claude-3-haiku-20240307': 'haiku-3',
    'claude-3-5-haiku-20241022': 'haiku-3-5',
    # AWS
    'anthropic.claude-3-opus-20240229-v1:0': 'opus',
    'anthropic.claude-3-5-sonnet-20241022-v2:0': 'sonnet',
    'anthropic.claude-3-sonnet-20240229-v1:0': 'sonnet',
    'anthropic.claude-3-haiku-20240307-v1:0': 'haiku',
    # Google
    'claude-3-opus@20240229': 'opus',
    'claude-3-5-sonnet-v2@20241022': 'sonnet',
    'claude-3-sonnet@20240229': 'sonnet',
    'claude-3-haiku@20240307': 'haiku',
}

# Every known model id, in the order declared above (Anthropic, then AWS, then Google)
all_models = list(model_types)

In [None]:
#|hide

# Full list of models via the anthropic SDK for reference. Not all models are surfaced by Claudette.
Model

typing.Union[typing.Literal['claude-3-7-sonnet-latest', 'claude-3-7-sonnet-20250219', 'claude-3-5-haiku-latest', 'claude-3-5-haiku-20241022', 'claude-sonnet-4-20250514', 'claude-sonnet-4-0', 'claude-4-sonnet-20250514', 'claude-3-5-sonnet-latest', 'claude-3-5-sonnet-20241022', 'claude-3-5-sonnet-20240620', 'claude-opus-4-0', 'claude-opus-4-20250514', 'claude-4-opus-20250514', 'claude-3-opus-latest', 'claude-3-opus-20240229', 'claude-3-sonnet-20240229', 'claude-3-haiku-20240307', 'claude-2.1', 'claude-2.0'], str]

In [None]:
#| export
models = all_models[:5]

In [None]:
models

['claude-opus-4-20250514',
 'claude-sonnet-4-20250514',
 'claude-3-opus-20240229',
 'claude-3-7-sonnet-20250219',
 'claude-3-5-sonnet-20241022']

In [None]:
#| export
# Model ids as exposed through AWS Bedrock, i.e. the `anthropic.*` keys of `model_types`.
# (Plain Anthropic-API ids do not belong here.)
models_aws = ['anthropic.claude-3-opus-20240229-v1:0',
 'anthropic.claude-3-5-sonnet-20241022-v2:0',
 'anthropic.claude-3-sonnet-20240229-v1:0',
 'anthropic.claude-3-haiku-20240307-v1:0']

In [None]:
#| export
# Model ids as exposed through Google Vertex AI, i.e. the `name@date` keys of `model_types`.
# (AWS Bedrock `anthropic.*` ids do not belong here.)
models_goog = ['claude-3-opus@20240229',
 'claude-3-5-sonnet-v2@20241022',
 'claude-3-sonnet@20240229',
 'claude-3-haiku@20240307']

In [None]:
#| exports
text_only_models = ('claude-3-5-haiku-20241022',)

In [None]:
#| exports
has_streaming_models = set(all_models)
has_system_prompt_models = set(all_models)
has_temperature_models = set(all_models)
has_extended_thinking_models = {'claude-opus-4-20250514', 'claude-sonnet-4-20250514', 'claude-3-7-sonnet-20250219'}

In [None]:
has_extended_thinking_models

{'claude-3-7-sonnet-20250219',
 'claude-opus-4-20250514',
 'claude-sonnet-4-20250514'}

In [None]:
#| exports

def can_stream(m):
    "Whether model id `m` is listed in `has_streaming_models`."
    return m in has_streaming_models

def can_set_system_prompt(m):
    "Whether model id `m` is listed in `has_system_prompt_models`."
    return m in has_system_prompt_models

def can_set_temperature(m):
    "Whether model id `m` is listed in `has_temperature_models`."
    return m in has_temperature_models

def can_use_extended_thinking(m):
    "Whether model id `m` is listed in `has_extended_thinking_models`."
    return m in has_extended_thinking_models

We include these functions to provide a uniform library interface with cosette since openai models such as o1 do not have many of these capabilities.

In [None]:
assert can_stream('claude-3-5-sonnet-20241022') and can_set_system_prompt('claude-3-5-sonnet-20241022') and can_set_temperature('claude-3-5-sonnet-20241022')

These are the current versions and [prices](https://www.anthropic.com/pricing#anthropic-api) of Anthropic's models at the time of writing.

In [None]:
model = models[1]; model

'claude-sonnet-4-20250514'

For examples, we'll use the latest Sonnet, since it's awesome.

## Anthropic SDK

In [None]:
cli = Anthropic()

This is the client that Anthropic's Python SDK provides for interacting with Claude. To use it, pass it a list of *messages*, with *content* and a *role*. The roles should alternate between *user* and *assistant*.

:::{.callout-tip}

After the code below you'll see an indented section with an orange vertical line on the left. This is used to show the *result* of running the code above. Because the code is running in a Jupyter Notebook, we don't have to use `print` to display results, we can just type the expression directly, as we do with `r` here.

:::

In [None]:
m = {'role': 'user', 'content': "I'm Jeremy"}
r = cli.messages.create(messages=[m], model=model, max_tokens=100)
r

Hello Jeremy! Nice to meet you. How are you doing today?

<details>

- id: `msg_01QeJQQgvbTUVuj1veGPxVJm`
- content: `[{'citations': None, 'text': 'Hello Jeremy! Nice to meet you. How are you doing today?', 'type': 'text'}]`
- model: `claude-sonnet-4-20250514`
- role: `assistant`
- stop_reason: `end_turn`
- stop_sequence: `None`
- type: `message`
- usage: `{'cache_creation_input_tokens': 0, 'cache_read_input_tokens': 0, 'input_tokens': 10, 'output_tokens': 17, 'server_tool_use': None, 'service_tier': 'standard'}`

</details>

### Formatting output

That output is pretty long and hard to read, so let's clean it up. We'll start by pulling out the `Content` part of the message.
To do that, we're going to write our first function which will be included in the `claudette/core.py` module.

:::{.callout-tip}

This is the first exported public function or class we're creating (the previous export was of a variable). In the rendered version of the notebook for these you'll see 4 things, in this order (unless the symbol starts with a single `_`, which indicates it's *private*):

- The signature (with the symbol name as a heading, with a horizontal rule above)
- A table of parameter docs (if provided)
- The doc string (in italics).
- The source code (in a collapsible "Exported source" block)

After that, we generally provide a bit more detail on what we've created, and why, along with a sample usage.

:::

In [None]:
#| exports
def _type(x):
    try: return x.type
    except AttributeError: return x.get('type')

def find_block(r:abc.Mapping, # The message to look in
               blk_type:type|str=TextBlock  # The type of block to find
              ):
    "Return the first item of `r.content` matching `blk_type` (a class, or a `type` string)."
    # A string is compared against each block's `type`; anything else is used as an `isinstance` check
    if isinstance(blk_type,str): matches = lambda blk: _type(blk)==blk_type
    else: matches = lambda blk: isinstance(blk,blk_type)
    return first(filter(matches, r.content))

This makes it easier to grab the needed parts of Claude's responses, which can include multiple pieces of content. By default, we look for the first text block. That will generally have the content we want to display.

In [None]:
find_block(r)

TextBlock(citations=None, text='Hello Jeremy! Nice to meet you. How are you doing today?', type='text')

In [None]:
#| exports
def contents(r):
    "Helper to get the contents from Claude response `r`."
    # NB: this cell must be exported, since the exported `_repr_markdown_` methods call `contents`
    blk = find_block(r)
    # No text block found: fall back to whatever the first content block is
    if not blk and r.content: blk = r.content[0]
    # Blocks without a `text` attribute are shown via their `str` representation
    return blk.text.strip() if hasattr(blk,'text') else str(blk)

For display purposes, we often just want to show the text itself.

In [None]:
contents(r)

'Hello Jeremy! Nice to meet you. How are you doing today?'

In [None]:
#| exports
@patch
def _repr_markdown_(self:(Message)):
    "Markdown repr: the message text, followed by every dumped field in a collapsible `<details>` list."
    fields = [f'{k}: `{v}`' for k,v in self.model_dump().items()]
    # escape `$` for jupyter latex
    body = contents(self).replace('$', '&#36;')
    bullets = '- ' + '\n- '.join(fields)
    return '\n\n'.join([body, '<details>', bullets, '</details>'])

Jupyter looks for a `_repr_markdown_` method in displayed objects; we add this in order to display just the content text, and collapse full details into a hideable section. Note that `patch` is from [fastcore](https://fastcore.fast.ai/), and is used to add (or replace) functionality in an existing class. We pass the class(es) that we want to patch as type annotations to `self`. In this case, `_repr_markdown_` is being added to Anthropic's `Message` class, so when we display the message now we just see the contents, and the details are hidden away in a collapsible details block.

In [None]:
r

Hello Jeremy! Nice to meet you. How are you doing today?

<details>

- id: `msg_01QeJQQgvbTUVuj1veGPxVJm`
- content: `[{'citations': None, 'text': 'Hello Jeremy! Nice to meet you. How are you doing today?', 'type': 'text'}]`
- model: `claude-sonnet-4-20250514`
- role: `assistant`
- stop_reason: `end_turn`
- stop_sequence: `None`
- type: `message`
- usage: `{'cache_creation_input_tokens': 0, 'cache_read_input_tokens': 0, 'input_tokens': 10, 'output_tokens': 17, 'server_tool_use': None, 'service_tier': 'standard'}`

</details>

One key part of the response is the `usage` key, which tells us how many tokens we used by returning a `Usage` object.

We'll add some helpers to make things a bit cleaner for creating and formatting these objects.

In [None]:
r.usage

In: 10; Out: 17; Cache create: 0; Cache read: 0; Total Tokens: 27; Server tool use (web search requests): 0

In [None]:
#| exports
def server_tool_usage(web_search_requests=0):
    "Build a `ServerToolUsage` holding the given number of web search requests."
    counts = dict(web_search_requests=web_search_requests)
    return ServerToolUsage(**counts)

In [None]:
#| exports
def usage(inp=0, # input tokens
          out=0,  # Output tokens
          cache_create=0, # Cache creation tokens
          cache_read=0, # Cache read tokens
          server_tool_use=server_tool_usage() # server tool use
         ):
    "Shorthand constructor for `Usage` using brief parameter names."
    # Translate the short names into the field names `Usage` expects
    fields = dict(input_tokens=inp,
                  output_tokens=out,
                  cache_creation_input_tokens=cache_create,
                  cache_read_input_tokens=cache_read,
                  server_tool_use=server_tool_use)
    return Usage(**fields)

The constructor provided by Anthropic is rather verbose, so we clean it up a bit, using a lowercase version of the name.

In [None]:
usage(5)

In: 5; Out: 0; Cache create: 0; Cache read: 0; Total Tokens: 5; Server tool use (web search requests): 0

In [None]:
#| exports
def _dgetattr(o,s,d): 
    "Like getattr, but returns the default if the result is None"
    return getattr(o,s,d) or d

@patch(as_prop=True)
def total(self:Usage):
    "Sum of input, output, cache-creation and cache-read tokens (missing/`None` cache counts are treated as 0)."
    cache_w = _dgetattr(self, "cache_creation_input_tokens",0)
    cache_r = _dgetattr(self, "cache_read_input_tokens",0)
    return self.input_tokens+self.output_tokens+cache_w+cache_r

Adding a `total` property to `Usage` makes it easier to see how many tokens we've used up altogether.

In [None]:
usage(5,1).total

6

In [None]:
#| exports
@patch
def __repr__(self:Usage):
    "One-line summary of token counts, total tokens, and web search requests."
    stu = _dgetattr(self, "server_tool_use",server_tool_usage())
    parts = [
        f'In: {self.input_tokens}',
        f'Out: {self.output_tokens}',
        f'Cache create: {_dgetattr(self, "cache_creation_input_tokens",0)}',
        f'Cache read: {_dgetattr(self, "cache_read_input_tokens",0)}',
        f'Total Tokens: {self.total}',
        f'Server tool use (web search requests): {stu.web_search_requests}',
    ]
    return '; '.join(parts)

In python, patching `__repr__` lets us change how an object is displayed. (More generally, methods starting and ending in `__` in Python are called `dunder` methods, and have some `magic` behavior -- such as, in this case, changing how an object is displayed.) We won't be directly displaying ServerToolUsage's, so we can handle its display behavior in the same Usage `__repr__`

In [None]:
usage(5)

In: 5; Out: 0; Cache create: 0; Cache read: 0; Total Tokens: 5; Server tool use (web search requests): 0

In [None]:
#| exports
@patch
def __add__(self:ServerToolUsage, b):
    "Return a new `ServerToolUsage` whose web search count is the sum of both operands'."
    n_searches = self.web_search_requests+b.web_search_requests
    return ServerToolUsage(web_search_requests=n_searches)

And, patching `__add__` lets `+` work on a `ServerToolUsage` as well as a `Usage` object.

In [None]:
server_tool_usage(1) + server_tool_usage(2)

ServerToolUsage(web_search_requests=3)

In [None]:
#| exports
@patch
def __add__(self:Usage, b):
    "Return a new `Usage` summing token counts, cache counts and server tool use of `self` and `b`."
    inp = self.input_tokens+b.input_tokens
    out = self.output_tokens+b.output_tokens
    # Cache and server-tool fields may be missing or `None`, so read them with defaults
    cache_w = _dgetattr(self,'cache_creation_input_tokens',0)+_dgetattr(b,'cache_creation_input_tokens',0)
    cache_r = _dgetattr(self,'cache_read_input_tokens',0)+_dgetattr(b,'cache_read_input_tokens',0)
    tools = _dgetattr(self,'server_tool_use',server_tool_usage())+_dgetattr(b,'server_tool_use',server_tool_usage())
    return usage(inp, out, cache_w, cache_r, tools)

In [None]:
r.usage+r.usage + usage(server_tool_use=server_tool_usage(1))

In: 20; Out: 34; Cache create: 0; Cache read: 0; Total Tokens: 54; Server tool use (web search requests): 1

### Creating messages

Creating correctly formatted `dict`s from scratch every time isn't very handy, so we'll import a couple of helper functions from the `msglm` library.

Let's use `mk_msg` to recreate our msg `{'role': 'user', 'content': "I'm Jeremy"}` from earlier.

In [None]:
prompt = "I'm Jeremy"
m = mk_msg(prompt)
r = cli.messages.create(messages=[m], model=model, max_tokens=100)
r

Nice to meet you, Jeremy! How are you doing today? Is there anything I can help you with?

<details>

- id: `msg_019KTch2ouq92y6sowmgSnYx`
- content: `[{'citations': None, 'text': 'Nice to meet you, Jeremy! How are you doing today? Is there anything I can help you with?', 'type': 'text'}]`
- model: `claude-sonnet-4-20250514`
- role: `assistant`
- stop_reason: `end_turn`
- stop_sequence: `None`
- type: `message`
- usage: `{'cache_creation_input_tokens': 0, 'cache_read_input_tokens': 0, 'input_tokens': 10, 'output_tokens': 25, 'server_tool_use': None, 'service_tier': 'standard'}`

</details>

We can pass more than just text messages to Claude. As we'll see later we can also pass images, SDK objects, etc. To handle these different data types we need to pass the type along with our content to Claude. 

Here's an example of a multimodal message containing text and images. 

```json
{
    'role': 'user', 
    'content': [
        {'type':'text', 'text':'What is in the image?'},
        {
            'type':'image', 
            'source': {
                'type':'base64', 'media_type':'media_type', 'data': 'data'
            }
        }
    ]
}
```

`mk_msg` infers the type automatically and creates the appropriate data structure. 

LLMs don't actually have state; instead, dialogs are created by passing back all previous prompts and responses every time. With Claude, they always alternate *user* and *assistant*. We'll use `mk_msgs` from `msglm` to make it easier to build up these dialog lists.

In [None]:
msgs = mk_msgs([prompt, r, "I forgot my name. Can you remind me please?"]) 
msgs

[{'role': 'user', 'content': "I'm Jeremy"},
 {'role': 'assistant',
  'content': [TextBlock(citations=None, text='Nice to meet you, Jeremy! How are you doing today? Is there anything I can help you with?', type='text')]},
 {'role': 'user', 'content': 'I forgot my name. Can you remind me please?'}]

In [None]:
cli.messages.create(messages=msgs, model=model, max_tokens=200)

Your name is Jeremy - you introduced yourself to me just a moment ago at the start of our conversation.

<details>

- id: `msg_01WiFxGU88RFidepLUSNPkU8`
- content: `[{'citations': None, 'text': 'Your name is Jeremy - you introduced yourself to me just a moment ago at the start of our conversation.', 'type': 'text'}]`
- model: `claude-sonnet-4-20250514`
- role: `assistant`
- stop_reason: `end_turn`
- stop_sequence: `None`
- type: `message`
- usage: `{'cache_creation_input_tokens': 0, 'cache_read_input_tokens': 0, 'input_tokens': 49, 'output_tokens': 24, 'server_tool_use': None, 'service_tier': 'standard'}`

</details>

## Client

In [None]:
#| exports
class Client:
    def __init__(self, model, cli=None, log=False, cache=False):
        "Basic Anthropic messages client."
        self.model = model
        self.use = usage()  # running usage total, starts at zero
        self.text_only = model in text_only_models
        # `log` holds a list of call records when enabled, otherwise `None`
        if log: self.log = []
        else: self.log = None
        # Use the supplied SDK client, or create one with the prompt-caching beta header
        if not cli: cli = Anthropic(default_headers={'anthropic-beta': 'prompt-caching-2024-07-31'})
        self.c = cli
        self.cache = cache

We'll create a simple `Client` for `Anthropic` which tracks usage and stores the model to use. We don't add any methods right away -- instead we'll use `patch` for that so we can add and document them incrementally.

In [None]:
c = Client(model)
c.use

In: 0; Out: 0; Cache create: 0; Cache read: 0; Total Tokens: 0; Server tool use (web search requests): 0

In [None]:
#| exports
@patch
def _r(self:Client, r:Message, prefill=''):
    "Store the result of the message and accrue total usage."
    if prefill:
        # Claude does not echo the prefill, so prepend it to the first text block
        blk = find_block(r)
        # A response may have no text block at all (e.g. empty content); nothing to prepend to then
        if blk is not None: blk.text = prefill + (blk.text or '')
    self.result = r
    self.use += r.usage
    self.stop_reason = r.stop_reason
    self.stop_sequence = r.stop_sequence
    return r

We use a `_` prefix on private methods, but we document them here in the interests of literate source code.

`_r` will be used each time we get a new result, to track usage and also to keep the result available for later.

In [None]:
c._r(r)
c.use

In: 10; Out: 25; Cache create: 0; Cache read: 0; Total Tokens: 35; Server tool use (web search requests): 0

Whereas OpenAI's models use a `stream` parameter for streaming, Anthropic's use a separate method. We implement Anthropic's approach in a private method, and then use a `stream` parameter in `__call__` for consistency:

In [None]:
#| exports
@patch
def _log(self:Client, final, prefill, msgs, maxtok=None, sp=None, temp=None, stream=None, stop=None, **kwargs):
    "Record `final` via `_r` and, if logging is enabled, append the call details to `self.log`."
    self._r(final, prefill)
    # Each key is listed once; `kwargs` carries any extra parameters that were sent to the API
    if self.log is not None: self.log.append({
        "msgs": msgs, "prefill": prefill, "maxtok": maxtok, "sp": sp, "temp": temp, "stream": stream, "stop": stop, **kwargs,
        "result": self.result, "use": self.use, "stop_reason": self.stop_reason, "stop_sequence": self.stop_sequence
    })
    return self.result

In [None]:
#| exports
@patch
def _stream(self:Client, msgs:list, prefill='', **kwargs):
    with self.c.messages.stream(model=self.model, messages=mk_msgs(msgs, cache=self.cache, cache_last_ckpt_only=self.cache), **kwargs) as s:
        if prefill: yield(prefill)
        yield from s.text_stream
        self._log(s.get_final_message(), prefill, msgs, **kwargs)

Claude supports adding an extra `assistant` message at the end, which contains the *prefill* -- i.e. the text we want Claude to assume the response starts with. However Claude doesn't actually repeat that in the response, so for convenience we add it.

In [None]:
#| exports
@patch
def _precall(self:Client, msgs, prefill, stop, kwargs):
    pref = [prefill.strip()] if prefill else []
    if not isinstance(msgs,list): msgs = [msgs]
    if stop is not None:
        if not isinstance(stop, (list)): stop = [stop]
        kwargs["stop_sequences"] = stop
    msgs = mk_msgs(msgs+pref, cache=self.cache, cache_last_ckpt_only=self.cache)
    return msgs

In [None]:
@patch
@delegates(messages.Messages.create)
def __call__(self:Client,
             msgs:list, # List of messages in the dialog
             sp='', # The system prompt
             temp=0, # Temperature
             maxtok=4096, # Maximum tokens
             prefill='', # Optional prefill to pass to Claude as start of its response
             stream:bool=False, # Stream response?
             stop=None, # Stop sequence
             **kwargs):
    "Make a call to Claude."
    # `_precall` builds the message list and places `stop` into `kwargs['stop_sequences']`
    msgs = self._precall(msgs, prefill, stop, kwargs)
    # Streaming returns a generator; logging happens inside `_stream` once it is exhausted
    if stream: return self._stream(msgs, prefill=prefill, max_tokens=maxtok, system=sp, temperature=temp, **kwargs)
    res = self.c.messages.create(
        model=self.model, messages=msgs, max_tokens=maxtok, system=sp, temperature=temp, **kwargs)
    # Forward `stop` too, so the log entry records the caller's value rather than always `None`
    return self._log(res, prefill, msgs, maxtok, sp, temp, stream=stream, stop=stop, **kwargs)

Defining `__call__` lets us use an object like a function (i.e. it's *callable*). We use it as a small wrapper over `messages.create`. However we're not exporting this version just yet -- we have some additions we'll make in a moment...

In [None]:
c = Client(model, log=True)
c.use

In: 0; Out: 0; Cache create: 0; Cache read: 0; Total Tokens: 0; Server tool use (web search requests): 0

In [None]:
c('Hi')

Hello! How are you doing today? Is there anything I can help you with?

<details>

- id: `msg_0198RkhbnJJ6ieaawFWnD4Ka`
- content: `[{'citations': None, 'text': 'Hello! How are you doing today? Is there anything I can help you with?', 'type': 'text'}]`
- model: `claude-sonnet-4-20250514`
- role: `assistant`
- stop_reason: `end_turn`
- stop_sequence: `None`
- type: `message`
- usage: `{'cache_creation_input_tokens': 0, 'cache_read_input_tokens': 0, 'input_tokens': 8, 'output_tokens': 20, 'server_tool_use': None, 'service_tier': 'standard'}`

</details>

In [None]:
c.use

In: 8; Out: 20; Cache create: 0; Cache read: 0; Total Tokens: 28; Server tool use (web search requests): 0

Let's try out *prefill*:

In [None]:
q = "Concisely, what is the meaning of life?"
pref = 'According to Douglas Adams,'

In [None]:
c(q, prefill=pref)

According to Douglas Adams,it's 42.

More seriously, there's no universal answer. Common perspectives include:

- **Religious**: To serve/connect with the divine
- **Existentialist**: To create your own meaning through choices and actions
- **Humanistic**: To reduce suffering and increase flourishing
- **Biological**: To survive, reproduce, and evolve
- **Personal**: To love, learn, create, or leave a positive impact

The question itself might be more valuable than any single answer.

<details>

- id: `msg_01AHpQejBesD7bG34Nfqe7n3`
- content: `[{'citations': None, 'text': "According to Douglas Adams,it's 42.\n\nMore seriously, there's no universal answer. Common perspectives include:\n\n- **Religious**: To serve/connect with the divine\n- **Existentialist**: To create your own meaning through choices and actions\n- **Humanistic**: To reduce suffering and increase flourishing\n- **Biological**: To survive, reproduce, and evolve\n- **Personal**: To love, learn, create, or leave a positive impact\n\nThe question itself might be more valuable than any single answer.", 'type': 'text'}]`
- model: `claude-sonnet-4-20250514`
- role: `assistant`
- stop_reason: `end_turn`
- stop_sequence: `None`
- type: `message`
- usage: `{'cache_creation_input_tokens': 0, 'cache_read_input_tokens': 0, 'input_tokens': 24, 'output_tokens': 109, 'server_tool_use': None, 'service_tier': 'standard'}`

</details>

We can pass `stream=True` to stream the response back incrementally:

In [None]:
for o in c('Hi', stream=True): print(o, end='')

Hello! How are you doing today? Is there anything I can help you with?

In [None]:
c.use

In: 40; Out: 149; Cache create: 0; Cache read: 0; Total Tokens: 189; Server tool use (web search requests): 0

In [None]:
for o in c(q, prefill=pref, stream=True): print(o, end='')

According to Douglas Adams,it's 42.

More seriously, there's no universal answer. Common perspectives include:

- **Religious**: To serve/connect with the divine
- **Existentialist**: To create your own meaning through choices and actions
- **Humanistic**: To reduce suffering and increase flourishing
- **Biological**: To survive, reproduce, and evolve
- **Personal**: To love, learn, create, or leave a positive impact

The question itself might be more valuable than any single answer.

In [None]:
c.use

In: 64; Out: 258; Cache create: 0; Cache read: 0; Total Tokens: 322; Server tool use (web search requests): 0

Pass a stop sequence if you want Claude to stop generating text when it encounters it.

In [None]:
c("Count from 1 to 10", stop="5")

1, 2, 3, 4,

<details>

- id: `msg_01GbcBDLMTGECncRuqK2RM7n`
- content: `[{'citations': None, 'text': '1, 2, 3, 4, ', 'type': 'text'}]`
- model: `claude-sonnet-4-20250514`
- role: `assistant`
- stop_reason: `stop_sequence`
- stop_sequence: `5`
- type: `message`
- usage: `{'cache_creation_input_tokens': 0, 'cache_read_input_tokens': 0, 'input_tokens': 15, 'output_tokens': 14, 'server_tool_use': None, 'service_tier': 'standard'}`

</details>

This also works with streaming, and you can pass more than one stop sequence:

In [None]:
for o in c("Count from 1 to 10", stop=["2", "yellow"], stream=True): print(o, end='')
print(c.stop_reason, c.stop_sequence)

1, stop_sequence 2


You can check the logs:

In [None]:
c.log[-1]

{'msgs': [{'role': 'user', 'content': 'Count from 1 to 10'}],
 'prefill': '',
 'max_tokens': 4096,
 'system': '',
 'temperature': 0,
 'stop_sequences': ['2', 'yellow'],
 'maxtok': None,
 'sp': None,
 'temp': None,
 'stream': None,
 'stop': None,
 'result': Message(id='msg_017K1BLzA92LUHQ1NesrNQtN', content=[TextBlock(citations=None, text='1, ', type='text')], model='claude-sonnet-4-20250514', role='assistant', stop_reason='stop_sequence', stop_sequence='2', type='message', usage=In: 15; Out: 5; Cache create: 0; Cache read: 0; Total Tokens: 20; Server tool use (web search requests): 0),
 'use': In: 94; Out: 277; Cache create: 0; Cache read: 0; Total Tokens: 371; Server tool use (web search requests): 0,
 'stop_reason': 'stop_sequence',
 'stop_sequence': '2'}

We've shown the token usage, but what we really care about is pricing. Let's extract the latest [pricing](https://www.anthropic.com/pricing#anthropic-api) from Anthropic into a `pricing` dict.

In [None]:
#| export
# Every model type that appears as a value in `model_types` needs an entry here,
# otherwise `Client.cost` raises `KeyError` for that model.
pricing = {  # model type: $ / million tokens (input, output, cache write, cache read)
    'opus': (15, 75, 18.75, 1.5),
    'opus-3': (15, 75, 18.75, 1.5),
    'sonnet': (3, 15, 3.75, 0.3),
    'sonnet-3-7': (3, 15, 3.75, 0.3),
    'sonnet-3-5': (3, 15, 3.75, 0.3),
    'haiku': (0.25, 1.25, 0.3, 0.03),  # Claude 3 Haiku via AWS / Google ids
    'haiku-3': (0.25, 1.25, 0.3, 0.03),
    'haiku-3-5': (0.8, 4, 1, 0.08),
}

In [None]:
#| exports
def get_pricing(m, u=None):
    "Return the `(input, output, cache write, cache read)` $/million-token rates for model id or model type `m`."
    # `u` is accepted for backward compatibility but unused: the rates in `pricing` are flat,
    # and Anthropic's `Usage` has no `prompt_token_count` to tier on.
    return pricing[model_types.get(m, m)]

Similarly, let's record the pricing for the latest server tools:

In [None]:
#| export
# Server tool name -> price in dollars per 1,000 uses
server_tool_pricing = dict(
    web_search_requests=10, # $10 per 1,000
)

We'll patch `Usage` to enable it to compute the cost given pricing.

In [None]:
#| exports
@patch
def cost(self:Usage, costs:tuple) -> float:
    cache_w, cache_r = _dgetattr(self, "cache_creation_input_tokens",0), _dgetattr(self, "cache_read_input_tokens",0)
    tok_cost = sum([self.input_tokens * costs[0] +  self.output_tokens * costs[1] +  cache_w * costs[2] + cache_r * costs[3]]) / 1e6
    server_tool_use = _dgetattr(self, "server_tool_use",server_tool_usage())
    server_tool_cost = server_tool_use.web_search_requests * server_tool_pricing['web_search_requests'] / 1e3
    return tok_cost + server_tool_cost

In [None]:
#| exports
@patch(as_prop=True)
def cost(self: Client) -> float:
    "Dollar cost of all usage accrued by this client, using the rates for its model's type."
    rates = pricing[model_types[self.model]]
    return self.use.cost(rates)

In [None]:
#| exports
def get_costs(c):
    "Return `(input cost, output cost, cache cost, cached token count, server tool cost)` for client `c`."
    costs = pricing[model_types[c.model]]
    use = c.use

    inp_cost = use.input_tokens * costs[0] / 1e6
    out_cost = use.output_tokens * costs[1] / 1e6

    # Cache and server-tool fields may be `None`; read them with defaults like the other helpers do
    cache_w = _dgetattr(use, 'cache_creation_input_tokens', 0)
    cache_r = _dgetattr(use, 'cache_read_input_tokens', 0)
    cache_cost = (cache_w * costs[2] + cache_r * costs[3]) / 1e6

    # Server tools are priced per 1,000 requests
    server_tool_use = _dgetattr(use, 'server_tool_use', server_tool_usage())
    server_tool_cost = server_tool_use.web_search_requests * server_tool_pricing['web_search_requests'] / 1e3
    return inp_cost, out_cost, cache_cost, cache_w + cache_r, server_tool_cost

In [None]:
#| exports
@patch
def _repr_markdown_(self:Client):
    if not hasattr(self,'result'): return 'No results yet'
    msg = contents(self.result)
    inp_cost, out_cost, cache_cost, cached_toks, server_tool_cost = get_costs(self)
    return f"""{msg}

| Metric | Count | Cost (USD) |
|--------|------:|-----:|
| Input tokens | {self.use.input_tokens:,} | {inp_cost:.6f} |
| Output tokens | {self.use.output_tokens:,} | {out_cost:.6f} |
| Cache tokens | {cached_toks:,} | {cache_cost:.6f} |
| Server tool use | {self.use.server_tool_use.web_search_requests:,} | {server_tool_cost:.6f} |
| **Total** | **{self.use.total:,}** | **${self.cost:.6f}** |"""

In [None]:
c

1,

| Metric | Count | Cost (USD) |
|--------|------:|-----:|
| Input tokens | 94 | 0.000282 |
| Output tokens | 277 | 0.004155 |
| Cache tokens | 0 | 0.000000 |
| Server tool use | 0 | 0.000000 |
| **Total** | **371** | **$0.004437** |

## Tool use

Let's now add tool use (aka *function calling*).

In [None]:
#| export
def mk_tool_choice(choose:Union[str,bool,None])->dict:
    "Build a `tool_choice` dict: a named 'tool' for a string, 'any' for a truthy value, otherwise 'auto'"
    if isinstance(choose,str): return {"type": "tool", "name": choose}
    if choose: return {'type':'any'}
    return {'type':'auto'}

In [None]:
print(mk_tool_choice('sums'))
print(mk_tool_choice(True))
print(mk_tool_choice(None))

{'type': 'tool', 'name': 'sums'}
{'type': 'any'}
{'type': 'auto'}


Claude can be forced to use a particular tool, or select from a specific list of tools, or decide for itself when to use a tool. If you want to force a tool (or force choosing from a list), include a `tool_choice` param with a dict from `mk_tool_choice`.

For testing, we need a function that Claude can call; we'll write a simple function that adds numbers together, and will tell us when it's being called:

In [None]:
from dataclasses import dataclass

In [None]:
@dataclass
class MySum:
    # Wrapper type holding the result of `sums`
    val:int

def sums(
    a:int,  # First thing to sum
    b:int=1 # Second thing to sum
) -> int: # The sum of the inputs
    "Adds a + b."
    # Announce the call so the demo shows when the tool is actually invoked
    print(f"Finding the sum of {a} and {b}")
    total = a + b
    return MySum(total)

In [None]:
a,b = 604542,6458932
pr = f"What is {a}+{b}?"
sp = "You are a summing expert."

Claudette can autogenerate a schema thanks to the `toolslm` library. We'll force the use of the tool using the function we created earlier.

In [None]:
tools=[get_schema(sums)]
choice = mk_tool_choice('sums')

We'll start a dialog with Claude now. We'll store the messages of our dialog in `msgs`. The first message will be our prompt `pr`, and we'll pass our `tools` schema.

In [None]:
msgs = mk_msgs(pr)
r = c(msgs, sp=sp, tools=tools, tool_choice=choice)
r

ToolUseBlock(id='toolu_015SaTbNCNvNy6jDpDc2wuBF', input={'a': 604542, 'b': 6458932}, name='sums', type='tool_use')

<details>

- id: `msg_011SsN38382XnFgRwCidSS56`
- content: `[{'id': 'toolu_015SaTbNCNvNy6jDpDc2wuBF', 'input': {'a': 604542, 'b': 6458932}, 'name': 'sums', 'type': 'tool_use'}]`
- model: `claude-sonnet-4-20250514`
- role: `assistant`
- stop_reason: `tool_use`
- stop_sequence: `None`
- type: `message`
- usage: `{'cache_creation_input_tokens': 0, 'cache_read_input_tokens': 0, 'input_tokens': 443, 'output_tokens': 53, 'server_tool_use': None, 'service_tier': 'standard'}`

</details>

When Claude decides that it should use a tool, it passes back a `ToolUseBlock` with the name of the tool to call, and the params to use.

We don't want to allow it to call just any possible function (that would be a security disaster!) so we create a *namespace* -- that is, a dictionary of allowable function names to call.

In [None]:
ns = mk_ns(sums)
ns

{'sums': <function __main__.sums(a: int, b: int = 1) -> int>}

In [None]:
#| exports
def mk_funcres(fc, ns):
    "Run the tool requested by tool use block `fc` using namespace `ns`, and wrap its stringified result as a `tool_result` block."
    # `raise_on_err=False` is forwarded to `call_func` so a failing tool does not raise here
    outcome = call_func(fc.name, fc.input, ns=ns, raise_on_err=False)
    return {'type': 'tool_result', 'tool_use_id': fc.id, 'content': str(outcome)}

We can now use the function requested by Claude. We look it up in `ns`, and pass in the provided parameters.

In [None]:
fcs = [o for o in r.content if isinstance(o,ToolUseBlock)]
fcs

[ToolUseBlock(id='toolu_015SaTbNCNvNy6jDpDc2wuBF', input={'a': 604542, 'b': 6458932}, name='sums', type='tool_use')]

In [None]:
res = [mk_funcres(fc, ns=ns) for fc in fcs]
res

Finding the sum of 604542 and 6458932


[{'type': 'tool_result',
  'tool_use_id': 'toolu_015SaTbNCNvNy6jDpDc2wuBF',
  'content': 'MySum(val=7063474)'}]

In [None]:
def contents(r):
    "Return the stripped text of the main block in response `r`, or `str` of that block if it has neither `text` nor `content`."
    found = find_block(r)
    # Fall back to the first content block when `find_block` finds nothing
    blk = r.content[0] if (not found and r.content) else found
    for attr in ('text', 'content'):
        if hasattr(blk, attr): return getattr(blk, attr).strip()
    return str(blk)

In [None]:
#| exports
def mk_toolres(
    r:abc.Mapping, # Tool use request response from Claude
    ns:Optional[abc.Mapping]=None, # Namespace to search for tools
    obj:Optional=None # Class to search for tools
    ):
    "Build the follow-up messages for response `r`: the assistant turn, plus a `tool_result` user turn if any tools were requested."
    blocks = getattr(r, 'content', [])
    out = [mk_msg(r.model_dump(), role='assistant')]
    # An explicit `obj` takes precedence over `ns`; with neither, tools are looked up in this module's globals
    if obj is not None: ns = mk_ns(obj)
    elif ns is None: ns = globals()
    tool_results = []
    for blk in blocks:
        if isinstance(blk, ToolUseBlock): tool_results.append(mk_funcres(blk, ns))
    if tool_results: out.append(mk_msg(tool_results))
    return out

In order to tell Claude the result of the tool call, we pass back the tool use assistant request and the `tool_result` response.

In [None]:
tr = mk_toolres(r, ns=ns)
tr

Finding the sum of 604542 and 6458932


[{'role': 'assistant',
  'content': [ToolUseBlock(id='toolu_015SaTbNCNvNy6jDpDc2wuBF', input={'a': 604542, 'b': 6458932}, name='sums', type='tool_use')]},
 {'role': 'user',
  'content': [{'type': 'tool_result',
    'tool_use_id': 'toolu_015SaTbNCNvNy6jDpDc2wuBF',
    'content': 'MySum(val=7063474)'}]}]

In [None]:
msgs

[{'role': 'user', 'content': 'What is 604542+6458932?'}]

We add this to our dialog, and now Claude has all the information it needs to answer our question.

In [None]:
msgs += tr
contents(c(msgs, sp=sp, tools=tools))

'604542 + 6458932 = 7,063,474'

In [None]:
contents(msgs[-1])

'MySum(val=7063474)'

In [None]:
msgs

[{'role': 'user', 'content': 'What is 604542+6458932?'},
 {'role': 'assistant',
  'content': [ToolUseBlock(id='toolu_015SaTbNCNvNy6jDpDc2wuBF', input={'a': 604542, 'b': 6458932}, name='sums', type='tool_use')]},
 {'role': 'user',
  'content': [{'type': 'tool_result',
    'tool_use_id': 'toolu_015SaTbNCNvNy6jDpDc2wuBF',
    'content': 'MySum(val=7063474)'}]}]

This works with methods as well -- in this case, pass the object itself as `obj` instead of providing `ns`:

In [None]:
class Dummy:
    def sums(
        self,
        a:int,  # First thing to sum
        b:int=1 # Second thing to sum
    ) -> int: # The sum of the inputs
        "Adds a + b."
        print(f"Finding the sum of {a} and {b}")
        return a + b

In [None]:
tools = [get_schema(Dummy.sums)]
o = Dummy()
r = c(pr, sp=sp, tools=tools, tool_choice=choice)
tr = mk_toolres(r, obj=o)
msgs += tr
contents(c(msgs, sp=sp, tools=tools))

Finding the sum of 604542 and 6458932


'604542 + 6458932 = 7,063,474'

### Text editing

Anthropic also has a special tool type specific to text editing.

In [None]:
tools = [text_editor_conf['sonnet']]
tools

[{'type': 'text_editor_20250429', 'name': 'str_replace_based_edit_tool'}]

In [None]:
pr = 'Could you please explain my _quarto.yml file?'
msgs = [mk_msg(pr)]
r = c(msgs, sp=sp, tools=tools)
find_block(r, ToolUseBlock)

ToolUseBlock(id='toolu_018vACkL2Ua6vTZSd5i4C6Ci', input={'command': 'view', 'path': '_quarto.yml'}, name='str_replace_based_edit_tool', type='tool_use')

We've gone ahead and created a reference implementation that you can use directly from our `text_editor` module, or use as a reference for creating your own.

In [None]:
ns = mk_ns(str_replace_based_edit_tool)
tr = mk_toolres(r, ns=ns)
msgs += tr
print(contents(c(msgs, sp=sp, tools=tools))[:128])

Great! Let me explain your `_quarto.yml` configuration file section by section:

## Project Configuration
```yaml
project:
  typ


## Callable Client

In [None]:
#| export
def get_types(msgs):
    "List the content block types found in `msgs`, counting any non-list content as a single 'text' block."
    def _blk_type(blk):
        # Objects expose `.type`; dict-like blocks are indexed instead
        return getattr(blk, 'type', None) or blk['type']
    found = []
    for msg in msgs:
        body = msg.get('content', [])
        if not isinstance(body, list):
            found.append('text')
            continue
        found += [_blk_type(blk) for blk in body]
    return found

In [None]:
get_types(msgs)

['text', 'text', 'tool_use', 'tool_result']

In [None]:
#| exports
@patch
@delegates(messages.Messages.create)
def __call__(self:Client,
             msgs:list, # List of messages in the dialog
             sp='', # The system prompt
             temp=0, # Temperature
             maxtok=4096, # Maximum tokens
             maxthinktok=0, # Maximum thinking tokens
             prefill='', # Optional prefill to pass to Claude as start of its response
             stream:bool=False, # Stream response?
             stop=None, # Stop sequence
             tools:Optional[list]=None, # List of tools to make available to Claude
             tool_choice:Optional[dict]=None, # Optionally force use of some tool
             **kwargs):
    "Make a call to Claude."
    # Callables are converted to schemas with `get_schema`; anything else is assumed to already be a schema
    if tools: kwargs['tools'] = [get_schema(o) if callable(o) else o for o in listify(tools)]
    # Any truthy `tool_choice` is normalised through `mk_tool_choice` before being sent
    if tool_choice: kwargs['tool_choice'] = mk_tool_choice(tool_choice)
    if maxthinktok:
        kwargs['thinking']={'type':'enabled', 'budget_tokens':maxthinktok}
        # Enabling thinking overrides the caller's temperature and drops any prefill
        # NOTE(review): presumably required by the API when thinking is enabled -- confirm against Anthropic's docs
        temp=1; prefill=''
    # `_precall` receives `kwargs` itself (not a copy) and returns the message list actually sent
    msgs = self._precall(msgs, prefill, stop, kwargs)
    # Reject image content up front when this client is flagged `text_only`
    if any(t == 'image' for t in get_types(msgs)): assert not self.text_only, f"Images are not supported by the current model type: {self.model}"
    # Streaming is delegated to `_stream`; its result is returned directly without going through `_log` here
    if stream: return self._stream(msgs, prefill=prefill, max_tokens=maxtok, system=sp, temperature=temp, **kwargs)
    res = self.c.messages.create(model=self.model, messages=msgs, max_tokens=maxtok, system=sp, temperature=temp, **kwargs)
    return self._log(res, prefill, msgs, maxtok, sp, temp, stream=stream, stop=stop, **kwargs)

In [None]:
a,b = 604542,6458932
pr = f"What is {a}+{b}?"
sp = "You are a summing expert."

In [None]:
for tools in [sums, [get_schema(sums)]]:
    r = c(pr, sp=sp, tools=tools, tool_choice='sums')
    print(r)

Message(id='msg_01Rn6UCZEtKrhnhB58JTCR9P', content=[ToolUseBlock(id='toolu_01BefC1u7bbPGcu9cXXuVvaK', input={'a': 604542, 'b': 6458932}, name='sums', type='tool_use')], model='claude-sonnet-4-20250514', role='assistant', stop_reason='tool_use', stop_sequence=None, type='message', usage=In: 443; Out: 53; Cache create: 0; Cache read: 0; Total Tokens: 496; Server tool use (web search requests): 0)
Message(id='msg_01JmDectZUD3txGJ8sfc5NrE', content=[ToolUseBlock(id='toolu_014qMZWji6Gpa3wfBw2sbYHe', input={'a': 604542, 'b': 6458932}, name='sums', type='tool_use')], model='claude-sonnet-4-20250514', role='assistant', stop_reason='tool_use', stop_sequence=None, type='message', usage=In: 443; Out: 53; Cache create: 0; Cache read: 0; Total Tokens: 496; Server tool use (web search requests): 0)


In [None]:
ns = mk_ns(sums)
tr = mk_toolres(r, ns=ns)

Finding the sum of 604542 and 6458932


In [None]:
#| exports
@patch
@delegates(Client.__call__)
def structured(self:Client,
               msgs:list, # List of messages in the dialog
               tools:Optional[list]=None, # List of tools to make available to Claude
               obj:Optional=None, # Class to search for tools
               ns:Optional[abc.Mapping]=None, # Namespace to search for tools
               **kwargs):
    "Call Claude with `tools`, run every tool call in the reply, and return the list of tool results (generally used for structured outputs)"
    tool_list = listify(tools)
    # The tool list doubles as `tool_choice`, so a non-empty list is a truthy choice
    resp = self(msgs, tools=tool_list, tool_choice=tool_list, **kwargs)
    if ns is None: ns = mk_ns(*tool_list)
    if obj is not None: ns = mk_ns(obj)  # an explicit `obj` overrides any namespace
    results = []
    for blk in getattr(resp, 'content', []):
        if isinstance(blk, ToolUseBlock): results.append(call_func(blk.name, blk.input, ns=ns))
    return results

Anthropic's API does not support response formats directly, so instead we provide a `structured` method to use tool calling to achieve the same result. The result of the tool is not passed back to Claude in this case, but instead is returned directly to the user. 

In [None]:
c.structured(pr, tools=[sums])

Finding the sum of 604542 and 6458932


[MySum(val=7063474)]

In [None]:
c

ToolUseBlock(id='toolu_01HGwroRth83r5uTpcpMQzMs', input={'a': 604542, 'b': 6458932}, name='sums', type='tool_use')

| Metric | Count | Cost (USD) |
|--------|------:|-----:|
| Input tokens | 6,002 | 0.018006 |
| Output tokens | 1,404 | 0.021060 |
| Cache tokens | 0 | 0.000000 |
| Server tool use | 0 | 0.000000 |
| **Total** | **7,406** | **$0.039066** |

## Custom Types with Tools Use

We need to add tool support for custom types too. Let's test out custom types using a minimal example.

In [None]:
class Book(BasicRepr):
    def __init__(self, title: str, pages: int): store_attr()
    def __repr__(self):
        return f"Book Title : {self.title}\nNumber of Pages : {self.pages}"

In [None]:
Book("War and Peace", 950)

Book Title : War and Peace
Number of Pages : 950

In [None]:
def find_page(book: Book, # The book to find the halfway point of
              percent: int, # Percent of a book to read to, e.g. halfway == 50, 
) -> int:
    "The page number corresponding to `percent` completion of a book"
    return round(book.pages * (percent / 100.0))

In [None]:
get_schema(find_page)

{'name': 'find_page',
 'description': 'The page number corresponding to `percent` completion of a book\n\nReturns:\n- type: integer',
 'input_schema': {'type': 'object',
  'properties': {'book': {'type': 'object',
    'description': 'The book to find the halfway point of',
    '$ref': '#/$defs/Book'},
   'percent': {'type': 'integer',
    'description': 'Percent of a book to read to, e.g. halfway == 50,'}},
  'title': None,
  'required': ['book', 'percent'],
  '$defs': {'Book': {'type': 'object',
    'properties': {'title': {'type': 'string', 'description': ''},
     'pages': {'type': 'integer', 'description': ''}},
    'title': 'Book',
    'required': ['title', 'pages']}}}}

In [None]:
choice = mk_tool_choice('find_page')
choice

{'type': 'tool', 'name': 'find_page'}

Claudette will pack objects as dict, so we'll transform tool functions with user-defined types into tool functions that accept a dict in lieu of the user-defined type.

First let's convert a single argument:

In [None]:
#| export
def _is_builtin(tp: type):
    "Returns True for built in primitive types or containers"
    return (tp in (str, int, float, bool, complex) or tp is None
        or getattr(tp, '__origin__', None) is not None)  # Pass through all container types

def _convert(val: Dict, # dictionary argument being passed in
            tp: type): # type of the tool function input
    "Convert converts a single argument"
    if val is None or _is_builtin(tp) or not isinstance(val, dict): return val
    return tp(**val)

`_is_builtin` decides whether to pass an argument through as-is. Let's check the argument conversion:

In [None]:
(_is_builtin(int), _is_builtin(Book), _is_builtin(List))

(True, False, True)

In [None]:
(_convert(555, int),
 _convert({"title": "War and Peace", "pages": 923}, Book),
 _convert([1, 2, 3, 4], List))

(555,
 Book Title : War and Peace
 Number of Pages : 923,
 [1, 2, 3, 4])

Applying `tool()` to a function returns a new function in which arguments of user-defined types are accepted as dictionaries.

In [None]:
#| export
def tool(func):
    "Wrap `func` so that dict arguments for parameters annotated with user-defined types are converted to instances of those types"
    if isinstance(func, dict): return func # it's a schema, so don't change
    hints = get_type_hints(func)
    @wraps(func)
    def wrapper(*args, **kwargs):
        # Positional args are paired with parameter names in declaration order.
        # Unannotated parameters have no entry in `hints`, so they are passed through untouched
        # (the same rule the keyword branch applies) instead of raising `KeyError`.
        new_args = [_convert(arg, hints[p]) if p in hints else arg
                    for p,arg in zip(inspect.signature(func).parameters, args)]
        new_kwargs = {k: _convert(v, hints[k]) if k in hints else v for k,v in kwargs.items()}
        return func(*new_args, **new_kwargs)
    return wrapper

A function is transformed into a function with dict arguments substituted for user-defined types. Built-in types such as `percent` here are left untouched.

In [None]:
find_page(book=Book("War and Peace", 950), percent=50)

475

In [None]:
tool(find_page)({"title": "War and Peace", "pages": 950}, percent=50)

475

By passing tools wrapped by `tool()`, user-defined types now work in tool calls without failing.

In [None]:
pr = "How many pages do I have to read to get halfway through my 950 page copy of War and Peace"
tools = tool(find_page)
tools

<function __main__.find_page(book: __main__.Book, percent: int) -> int>

In [None]:
r = c(pr, tools=[tools])
find_block(r, ToolUseBlock)

ToolUseBlock(id='toolu_01RkktpMG4uyneFs6TYHMKmM', input={'book': {'title': 'War and Peace', 'pages': 950}, 'percent': 50}, name='find_page', type='tool_use')

In [None]:
tr = mk_toolres(r, ns=[tools])
tr

[{'role': 'assistant',
  'content': [TextBlock(citations=None, text="I'll help you find the halfway point of your copy of War and Peace.", type='text'),
   ToolUseBlock(id='toolu_01RkktpMG4uyneFs6TYHMKmM', input={'book': {'title': 'War and Peace', 'pages': 950}, 'percent': 50}, name='find_page', type='tool_use')]},
 {'role': 'user',
  'content': [{'type': 'tool_result',
    'tool_use_id': 'toolu_01RkktpMG4uyneFs6TYHMKmM',
    'content': '475'}]}]

In [None]:
msgs = [pr]+tr
contents(c(msgs, sp=sp, tools=[tools]))

"To get halfway through your 950-page copy of War and Peace, you need to read to page 475. That means you'll have read 475 pages when you reach the halfway point of the book."

## Chat

Rather than manually adding the responses to a dialog, we'll create a simple `Chat` class to do that for us, each time we make a request. We'll also store the system prompt and tools here, to avoid passing them every time.

In [None]:
#| export
class Chat:
    def __init__(self,
                 model:Optional[str]=None, # Model to use (leave empty if passing `cli`)
                 cli:Optional[Client]=None, # Client to use (leave empty if passing `model`)
                 sp='', # Optional system prompt
                 tools:Optional[list]=None, # List of tools to make available to Claude
                 temp=0, # Temperature
                 cont_pr:Optional[str]=None, # User prompt to continue an assistant response
                 cache: bool = False,  # Use Claude cache?
                 hist: list = None,  # Initialize history
                 ns:Optional[abc.Mapping]=None # Namespace to search for tools
                ):
        "Anthropic chat client that keeps the dialog history, system prompt and tools between calls."
        assert model or cli
        assert cont_pr != "", "cont_pr may not be an empty string"
        self.c = cli if cli else Client(model, cache=cache)
        self.h = [] if hist is None else hist
        # Every tool goes through `tool()`, which returns schema dicts unchanged and wraps anything else
        self.tools = [tool(t) for t in listify(tools)] if tools else tools
        # With no explicit namespace, the (wrapped) tools themselves are used for lookup
        self.ns = self.tools if ns is None else ns
        self.sp, self.temp = sp, temp
        self.cont_pr, self.cache = cont_pr, cache

    @property
    def use(self):
        "Usage recorded by the underlying client."
        return self.c.use

The class stores the `Client` that will provide the responses in `c`, and a history of messages in `h`.

In [None]:
sp = "Never mention what tools you use."
chat = Chat(model, sp=sp)
chat.c.use, chat.h

(In: 0; Out: 0; Cache create: 0; Cache read: 0; Total Tokens: 0; Server tool use (web search requests): 0,
 [])

In [None]:
chat.c.use.cost(pricing[model_types[chat.c.model]])

0.0

This is clunky. Let's add `cost` as a property for the `Chat` class. It will pass in the appropriate prices for the current model to the usage cost calculator.

In [None]:
#| exports
@patch(as_prop=True)
def cost(self: Chat) -> float:
    "Cost reported by the underlying client (`self.c.cost`)."
    return self.c.cost

In [None]:
chat.cost

0.0

In [None]:
#| exports
@patch
def _stream(self:Chat, res):
    "Relay the streamed chunks in `res`, then record the completed reply (and any tool results) in the history."
    yield from res
    # Runs only once the stream is exhausted; the recorded reply is read from `self.c.result`
    recorded = mk_toolres(self.c.result, ns=self.ns)
    self.last = recorded
    self.h += recorded

In [None]:
#| exports
@patch
def _post_pr(self:Chat, pr, prev_role):
    "Append `pr` to the history as a message, substituting `self.cont_pr` when no prompt follows an assistant turn."
    needs_cont = pr is None and prev_role == 'assistant'
    if needs_cont and self.cont_pr is None:
        raise ValueError("Prompt must be given after assistant completion, or use `self.cont_pr`.")
    if needs_cont: pr = self.cont_pr # No user prompt, keep the chain
    if not pr: return
    self.h.append(mk_msg(pr, cache=self.cache))

In [None]:
#| exports
@patch
def _append_pr(self:Chat,
               pr=None,  # Prompt / message
              ):
    "Add `pr` to the history, first calling the chat with no prompt if the last message is already a user message."
    if self.h: prev_role = nested_idx(self.h, -1, 'role')
    else: prev_role = 'assistant' # First message should be 'user'
    # A user request is already pending, so call the chat before adding another prompt
    if pr and prev_role == 'user': self()
    self._post_pr(pr, prev_role)

In [None]:
#| exports
@patch
def __call__(self:Chat,
             pr=None,  # Prompt / message
             temp=None, # Temperature
             maxtok=4096, # Maximum tokens
             maxthinktok=0, # Maximum thinking tokens
             stream=False, # Stream response?
             prefill='', # Optional prefill to pass to Claude as start of its response
             tool_choice:Optional[dict]=None, # Optionally force use of some tool
             **kw):
    "Add `pr` to the history, send the whole dialog to the client, and record the reply (and any tool results) in the history."
    temp = self.temp if temp is None else temp
    self._append_pr(pr)
    res = self.c(
        self.h, stream=stream, prefill=prefill, sp=self.sp, temp=temp, maxtok=maxtok,
        maxthinktok=maxthinktok, tools=self.tools, tool_choice=tool_choice, **kw)
    # When streaming, the history is updated by `_stream` once the stream has been consumed
    if stream: return self._stream(res)
    self.last = mk_toolres(self.c.result, ns=self.ns)
    self.h += self.last
    return res

The `__call__` method just passes the request along to the `Client`, but rather than just passing in this one prompt, it appends it to the history and passes it all along. As a result, we now have state!

In [None]:
chat = Chat(model, sp=sp)

In [None]:
chat("I'm Jeremy")
chat("What's my name?")

Your name is Jeremy! You introduced yourself at the beginning of our conversation.

<details>

- id: `msg_01Q8gi3zX6Fo7mVX39ovEQFD`
- content: `[{'citations': None, 'text': 'Your name is Jeremy! You introduced yourself at the beginning of our conversation.', 'type': 'text'}]`
- model: `claude-sonnet-4-20250514`
- role: `assistant`
- stop_reason: `end_turn`
- stop_sequence: `None`
- type: `message`
- usage: `{'cache_creation_input_tokens': 0, 'cache_read_input_tokens': 0, 'input_tokens': 42, 'output_tokens': 18, 'server_tool_use': None, 'service_tier': 'standard'}`

</details>

In [None]:
chat.use, chat.cost

(In: 59; Out: 35; Cache create: 0; Cache read: 0; Total Tokens: 94; Server tool use (web search requests): 0,
 0.000702)

Let's try out prefill too:

In [None]:
q = "Concisely, what is the meaning of life?"
pref = 'According to Douglas Adams,'

In [None]:
chat.c.result

Your name is Jeremy! You introduced yourself at the beginning of our conversation.

<details>

- id: `msg_01Q8gi3zX6Fo7mVX39ovEQFD`
- content: `[{'citations': None, 'text': 'Your name is Jeremy! You introduced yourself at the beginning of our conversation.', 'type': 'text'}]`
- model: `claude-sonnet-4-20250514`
- role: `assistant`
- stop_reason: `end_turn`
- stop_sequence: `None`
- type: `message`
- usage: `{'cache_creation_input_tokens': 0, 'cache_read_input_tokens': 0, 'input_tokens': 42, 'output_tokens': 18, 'server_tool_use': None, 'service_tier': 'standard'}`

</details>

In [None]:
chat(q, prefill=pref)

According to Douglas Adams,it's 42. But seriously, the meaning of life is likely what you make it - finding purpose through relationships, growth, contribution, and experiences that matter to you.

<details>

- id: `msg_01Uu21keyVeLD4e3fH5rjpM8`
- content: `[{'citations': None, 'text': "According to Douglas Adams,it's 42. But seriously, the meaning of life is likely what you make it - finding purpose through relationships, growth, contribution, and experiences that matter to you.", 'type': 'text'}]`
- model: `claude-sonnet-4-20250514`
- role: `assistant`
- stop_reason: `end_turn`
- stop_sequence: `None`
- type: `message`
- usage: `{'cache_creation_input_tokens': 0, 'cache_read_input_tokens': 0, 'input_tokens': 80, 'output_tokens': 38, 'server_tool_use': None, 'service_tier': 'standard'}`

</details>

By default, messages must alternate in user, assistant, user order. If this isn't followed (e.g. by calling `chat()` with no prompt straight after an assistant reply), an error is raised:

In [None]:
try: chat()
except ValueError as e: print("Error:", e)

Error: Prompt must be given after assistant completion, or use `self.cont_pr`.


Setting `cont_pr` allows a "default prompt" to be specified when a prompt isn't specified. Usually used to prompt the model to continue.

In [None]:
chat.cont_pr = "keep going..."
chat()

The search for meaning itself might be more important than finding a single answer. Some find it through:

- Creating something lasting
- Alleviating suffering 
- Pursuing truth and understanding
- Experiencing beauty and wonder
- Building deep connections
- Living authentically according to your values

Maybe life's meaning isn't a destination but the conscious act of living with intention, curiosity, and compassion. The question keeps us human.

<details>

- id: `msg_015NjqhMnsGEmdVYXPMZWnUm`
- content: `[{'citations': None, 'text': "The search for meaning itself might be more important than finding a single answer. Some find it through:\n\n- Creating something lasting\n- Alleviating suffering \n- Pursuing truth and understanding\n- Experiencing beauty and wonder\n- Building deep connections\n- Living authentically according to your values\n\nMaybe life's meaning isn't a destination but the conscious act of living with intention, curiosity, and compassion. The question keeps us human.", 'type': 'text'}]`
- model: `claude-sonnet-4-20250514`
- role: `assistant`
- stop_reason: `end_turn`
- stop_sequence: `None`
- type: `message`
- usage: `{'cache_creation_input_tokens': 0, 'cache_read_input_tokens': 0, 'input_tokens': 124, 'output_tokens': 95, 'server_tool_use': None, 'service_tier': 'standard'}`

</details>

We can also use streaming:

In [None]:
chat = Chat(model, sp=sp)
for o in chat("I'm Jeremy", stream=True): print(o, end='')

Hi Jeremy! Nice to meet you. How are you doing today?

In [None]:
for o in chat(q, prefill=pref, stream=True): print(o, end='')

According to Douglas Adams,it's 42. But more seriously, life's meaning is likely something you create through your relationships, contributions, growth, and what brings you fulfillment and purpose.

You can provide a history of messages to initialise `Chat` with:

In [None]:
chat = Chat(model, sp=sp, hist=["Can you guess my name?", "Hmmm I really don't know. Is it 'Merlin G. Penfolds'?"])
chat('Wow how did you know?')

I have to be honest - I was just making a playful, completely random guess! I don't actually have any way to know your real name. I was being silly with that very specific and unusual name combination. 

Is that actually your name, or were you playing along with my random guess? Either way, I'm curious now!

<details>

- id: `msg_01VcUWNoZsvUJSragJnRWwKp`
- content: `[{'citations': None, 'text': "I have to be honest - I was just making a playful, completely random guess! I don't actually have any way to know your real name. I was being silly with that very specific and unusual name combination. \n\nIs that actually your name, or were you playing along with my random guess? Either way, I'm curious now!", 'type': 'text'}]`
- model: `claude-sonnet-4-20250514`
- role: `assistant`
- stop_reason: `end_turn`
- stop_sequence: `None`
- type: `message`
- usage: `{'cache_creation_input_tokens': 0, 'cache_read_input_tokens': 0, 'input_tokens': 58, 'output_tokens': 73, 'server_tool_use': None, 'service_tier': 'standard'}`

</details>

### Chat tool use

We automagically get streamlined tool use as well:

In [None]:
pr = f"What is {a}+{b}?"
pr

'What is 604542+6458932?'

In [None]:
chat = Chat(model, sp=sp, tools=[sums])
r = chat(pr)
r

Finding the sum of 604542 and 6458932


ToolUseBlock(id='toolu_01JzXrbX5z3UQVZPV6MYaf7f', input={'a': 604542, 'b': 6458932}, name='sums', type='tool_use')

<details>

- id: `msg_01PcBwNBeU9LWEa6BbQYaDkS`
- content: `[{'id': 'toolu_01JzXrbX5z3UQVZPV6MYaf7f', 'input': {'a': 604542, 'b': 6458932}, 'name': 'sums', 'type': 'tool_use'}]`
- model: `claude-sonnet-4-20250514`
- role: `assistant`
- stop_reason: `tool_use`
- stop_sequence: `None`
- type: `message`
- usage: `{'cache_creation_input_tokens': 0, 'cache_read_input_tokens': 0, 'input_tokens': 437, 'output_tokens': 72, 'server_tool_use': None, 'service_tier': 'standard'}`

</details>

Now we need to send this result to Claude—calling the object with no parameters tells it to return the tool result to Claude:

In [None]:
chat()

604542 + 6458932 = 7,063,474

<details>

- id: `msg_01QctoXHrtJES7zXzVE8FY62`
- content: `[{'citations': None, 'text': '604542 + 6458932 = 7,063,474', 'type': 'text'}]`
- model: `claude-sonnet-4-20250514`
- role: `assistant`
- stop_reason: `end_turn`
- stop_sequence: `None`
- type: `message`
- usage: `{'cache_creation_input_tokens': 0, 'cache_read_input_tokens': 0, 'input_tokens': 530, 'output_tokens': 19, 'server_tool_use': None, 'service_tier': 'standard'}`

</details>

It should be correct, because it actually used our Python function to do the addition. Let's check:

In [None]:
a+b

7063474

Let's test a function with user defined types.

In [None]:
chat = Chat(model, sp=sp, tools=[find_page])
r = chat("How many pages is three quarters of the way through my 80 page edition of Tao Te Ching?")
r

ToolUseBlock(id='toolu_01RvQPLD9k756RzWbNRCpLoM', input={'book': {'title': 'Tao Te Ching', 'pages': 80}, 'percent': 75}, name='find_page', type='tool_use')

<details>

- id: `msg_01ShUen66HBcVHHNhXTPQtDX`
- content: `[{'id': 'toolu_01RvQPLD9k756RzWbNRCpLoM', 'input': {'book': {'title': 'Tao Te Ching', 'pages': 80}, 'percent': 75}, 'name': 'find_page', 'type': 'tool_use'}]`
- model: `claude-sonnet-4-20250514`
- role: `assistant`
- stop_reason: `tool_use`
- stop_sequence: `None`
- type: `message`
- usage: `{'cache_creation_input_tokens': 0, 'cache_read_input_tokens': 0, 'input_tokens': 547, 'output_tokens': 86, 'server_tool_use': None, 'service_tier': 'standard'}`

</details>

Now we need to send this result to Claude—calling the object with no parameters tells it to return the tool result to Claude:

In [None]:
chat()

Three quarters of the way through your 80-page edition of Tao Te Ching would be page 60.

<details>

- id: `msg_01X3DzdxaUkkoW2JpxvU3CLz`
- content: `[{'citations': None, 'text': 'Three quarters of the way through your 80-page edition of Tao Te Ching would be page 60.', 'type': 'text'}]`
- model: `claude-sonnet-4-20250514`
- role: `assistant`
- stop_reason: `end_turn`
- stop_sequence: `None`
- type: `message`
- usage: `{'cache_creation_input_tokens': 0, 'cache_read_input_tokens': 0, 'input_tokens': 647, 'output_tokens': 29, 'server_tool_use': None, 'service_tier': 'standard'}`

</details>

It should be correct, because it actually used our Python function to do the calculation. Let's check:

In [None]:
80 * .75

60.0

In [None]:
#| exports
@patch
def _repr_markdown_(self:Chat):
    "Markdown shown by Jupyter for a `Chat`: the last reply, a collapsible history, and the client's usage table."
    if not hasattr(self.c, 'result'): return 'No results yet'
    last_msg = contents(self.c.result)

    def fmt_msg(m):
        "Text to show for one history message `m`."
        # Plain-string content is shown whole; `contents` would index into the
        # string and return only its first character.
        body = m.get('content') if hasattr(m, 'get') else None
        if isinstance(body, str): return body.strip()
        t = contents(m)
        if isinstance(t, dict): return t['content']
        return t

    history = '\n\n'.join(f"**{m['role']}**: {fmt_msg(m)}"
                         for m in self.h)
    # Keep only the text after the last blank line of the client's markdown, i.e. its metrics table
    det = self.c._repr_markdown_().split('\n\n')[-1]
    if history: history = f"""
<details>
<summary>► History</summary>

{history}

</details>
"""

    return f"""{last_msg}
{history}
{det}"""

In [None]:
chat

Three quarters of the way through your 80-page edition of Tao Te Ching would be page 60.

<details>
<summary>► History</summary>

**user**: H

**assistant**: ToolUseBlock(id='toolu_01RvQPLD9k756RzWbNRCpLoM', input={'book': {'title': 'Tao Te Ching', 'pages': 80}, 'percent': 75}, name='find_page', type='tool_use')

**user**: 60

**assistant**: Three quarters of the way through your 80-page edition of Tao Te Ching would be page 60.

</details>

| Metric | Count | Cost (USD) |
|--------|------:|-----:|
| Input tokens | 1,194 | 0.003582 |
| Output tokens | 115 | 0.001725 |
| Cache tokens | 0 | 0.000000 |
| Server tool use | 0 | 0.000000 |
| **Total** | **1,309** | **$0.005307** |

In [None]:
chat = Chat(model, tools=[text_editor_conf['sonnet']], ns=mk_ns(str_replace_based_edit_tool))

When tools are not provided directly as Python functions (like `sums`) -- for example, when passing a raw schema dict such as `text_editor_conf['sonnet']` -- you **must** create and pass a namespace dictionary (mapping the tool name string to the function object) using the `ns` parameter of `Chat`, or of functions like `mk_toolres` or `toolloop`. `toolslm` cannot automatically generate the namespace in this case. For tools passed as Python functions, `claudette` handles namespace creation automatically.

In [None]:
r = chat('Please explain what my _quarto.yml does. Use your tools')
find_block(r, ToolUseBlock)

ToolUseBlock(id='toolu_01VtVGN7StnhXzJD6kAZD75w', input={'command': 'view', 'path': '.'}, name='str_replace_based_edit_tool', type='tool_use')

In [None]:
chat()

Now let me examine the `_quarto.yml` file:

<details>

- id: `msg_01Xi9MhA3PProt4baSao3MEB`
- content: `[{'citations': None, 'text': 'Now let me examine the `_quarto.yml` file:', 'type': 'text'}, {'id': 'toolu_01JKwmHe5gJHaTxiAPwLPqTb', 'input': {'command': 'view', 'path': '/_Users/jhoward/aai-ws/claudette/_quarto.yml'}, 'name': 'str_replace_based_edit_tool', 'type': 'tool_use'}]`
- model: `claude-sonnet-4-20250514`
- role: `assistant`
- stop_reason: `tool_use`
- stop_sequence: `None`
- type: `message`
- usage: `{'cache_creation_input_tokens': 0, 'cache_read_input_tokens': 0, 'input_tokens': 2693, 'output_tokens': 109, 'server_tool_use': None, 'service_tier': 'standard'}`

</details>

## Images

Claude can handle image data as well. As everyone knows, when testing image APIs you have to use a cute puppy.

In [None]:
# Image is Cute_dog.jpg from Wikimedia
fn = Path('samples/puppy.jpg')
display.Image(filename=fn, width=200)

<IPython.core.display.Image object>

In [None]:
img = fn.read_bytes()

Claude expects an image message to have the following structure

```js
{
    'role': 'user', 
    'content': [
        {'type':'text', 'text':'What is in the image?'},
        {
            'type':'image', 
            'source': {
                'type':'base64', 'media_type':'media_type', 'data': 'data'
            }
        }
    ]
}
```
`msglm` automatically detects if a message is an image, encodes it, and generates the data structure above.
All we need to do is create a list containing our image and a query and then pass it to `mk_msg`.

Let's try it out...

In [None]:
q = "In brief, what color flowers are in this image?"
msg = mk_msg([img, q])

In [None]:
c([msg])

The flowers in this image are purple.

<details>

- id: `msg_01ToLdeUX71Uwk7QhRRhMHKW`
- content: `[{'citations': None, 'text': 'The flowers in this image are purple.', 'type': 'text'}]`
- model: `claude-sonnet-4-20250514`
- role: `assistant`
- stop_reason: `end_turn`
- stop_sequence: `None`
- type: `message`
- usage: `{'cache_creation_input_tokens': 0, 'cache_read_input_tokens': 0, 'input_tokens': 110, 'output_tokens': 11, 'server_tool_use': None, 'service_tier': 'standard'}`

</details>

You don't need to call `mk_msg` on each individual message before passing them to the `Chat` class. Instead you can pass your messages in a list and the `Chat` class will automatically call `mk_msgs` in the background. 

```python
c(["How are you?", r])
```

For messages that contain multiple content types (like an image with a question), you'll need to enclose the message contents in a list as shown below:

```python
c(["How are you?", r, [img, q]])
```

In [None]:
c = Chat(model)
c([img, q])

The flowers in this image are purple.

<details>

- id: `msg_01CfXqwv33obnY7qfsvH3MFU`
- content: `[{'citations': None, 'text': 'The flowers in this image are purple.', 'type': 'text'}]`
- model: `claude-sonnet-4-20250514`
- role: `assistant`
- stop_reason: `end_turn`
- stop_sequence: `None`
- type: `message`
- usage: `{'cache_creation_input_tokens': 0, 'cache_read_input_tokens': 0, 'input_tokens': 110, 'output_tokens': 11, 'server_tool_use': None, 'service_tier': 'standard'}`

</details>

In [None]:
def contents(r):
    "Get displayable text for Claude response `r`, using its first content block if `find_block` finds nothing."
    blk = find_block(r)
    if not blk:
        # Nothing matched: fall back to whatever block comes first, if there is one
        blocks = r.content
        if blocks: blk = blocks[0]
    # Text-like payloads are returned stripped; `text` takes priority over `content`
    for attr in ('text', 'content'):
        if hasattr(blk, attr): return getattr(blk, attr).strip()
    # Blocks carrying a `source` (e.g. the image block shown above) get a short placeholder
    if hasattr(blk, 'source'): return f'*Media Type - {blk.type}*'
    return str(blk)

In [None]:
contents(c.h[0])

'*Media Type - image*'

In [None]:
c

The flowers in this image are purple.

<details>
<summary>► History</summary>

**user**: *Media Type - image*

**assistant**: The flowers in this image are purple.

</details>

| Metric | Count | Cost (USD) |
|--------|------:|-----:|
| Input tokens | 110 | 0.000330 |
| Output tokens | 11 | 0.000165 |
| Cache tokens | 0 | 0.000000 |
| Server tool use | 0 | 0.000000 |
| **Total** | **121** | **$0.000495** |

:::{.callout-note}

Unfortunately, not all Claude models support images 😞. This [table](https://docs.anthropic.com/en/docs/about-claude/models#model-comparison-table) summarizes the capabilities of each Claude model and the different modalities they support.

:::

## Caching

Claude supports context caching by adding a `cache_control` field to a block in the message content.

```js
{
    "role": "user",
    "content": [
        {
            "type": "text", 
            "text": "Please cache my message", 
            "cache_control": {"type": "ephemeral"}
        }
    ]
}
```

To cache a message, we simply set `cache=True` when calling `mk_msg`.

In [None]:
mk_msg(['hi', 'there'], cache=True)

```json
{ 'content': [ {'text': 'hi', 'type': 'text'},
               { 'cache_control': {'type': 'ephemeral'},
                 'text': 'there',
                 'type': 'text'}],
  'role': 'user'}
```

Claude also now supports smart cache look-ups, so it's very simple to keep an entire conversation in cache by constantly telling it to update the cache with the latest message. To do this, we just need to set `cache=True` when creating a `Chat`.

In [None]:
chat = Chat(model, sp=sp, cache=True)

Caching has a minimum token limit of 1024 tokens for Sonnet and Opus, and 2048 for Haiku. If your conversation is below this limit, it will not be cached.

In [None]:
chat("Hi, I'm Jeremy.")

Hi Jeremy! Nice to meet you. How are you doing today?

<details>

- id: `msg_01UkAzUS4wBxBkfG4AEczUE1`
- content: `[{'citations': None, 'text': 'Hi Jeremy! Nice to meet you. How are you doing today?', 'type': 'text'}]`
- model: `claude-sonnet-4-20250514`
- role: `assistant`
- stop_reason: `end_turn`
- stop_sequence: `None`
- type: `message`
- usage: `{'cache_creation_input_tokens': 0, 'cache_read_input_tokens': 0, 'input_tokens': 20, 'output_tokens': 17, 'server_tool_use': None, 'service_tier': 'standard'}`

</details>

Note the usage: no cache is created, nor used. Now, let's send a long enough message to trigger caching.

In [None]:
chat("""Lorem ipsum dolor sit amet""" * 150)

I see you've sent a very long block of "Lorem ipsum dolor sit amet" repeated many times! Lorem ipsum is that classic placeholder text used in design and publishing. 

Was this intentional, or did something go wrong with copy-pasting? Either way, no worries - happens to the best of us! Is there something specific you'd like to chat about, Jeremy?

<details>

- id: `msg_01Cf5S1iAx1bxeFxw4EoCQoH`
- content: `[{'citations': None, 'text': 'I see you\'ve sent a very long block of "Lorem ipsum dolor sit amet" repeated many times! Lorem ipsum is that classic placeholder text used in design and publishing. \n\nWas this intentional, or did something go wrong with copy-pasting? Either way, no worries - happens to the best of us! Is there something specific you\'d like to chat about, Jeremy?', 'type': 'text'}]`
- model: `claude-sonnet-4-20250514`
- role: `assistant`
- stop_reason: `end_turn`
- stop_sequence: `None`
- type: `message`
- usage: `{'cache_creation_input_tokens': 1084, 'cache_read_input_tokens': 0, 'input_tokens': 4, 'output_tokens': 82, 'server_tool_use': None, 'service_tier': 'standard'}`

</details>

The context is now long enough for cache to be used. All the conversation history has now been written to the temporary cache. Any subsequent message will read from it rather than re-processing the entire conversation history.

In [None]:
chat("Oh thank you! Sorry, my lorem ipsum generator got out of control!")

Haha, no problem at all! Those lorem ipsum generators can definitely get a bit enthusiastic sometimes. It's like they're trying to fill every possible space with placeholder text! 

I've seen that happen before - you ask for a paragraph and suddenly you've got enough fake Latin to write a novel. Did you get it sorted out, or is it still churning out endless "dolor sit amets" somewhere?

<details>

- id: `msg_0178XFDJbdG7F642694cNyJU`
- content: `[{'citations': None, 'text': 'Haha, no problem at all! Those lorem ipsum generators can definitely get a bit enthusiastic sometimes. It\'s like they\'re trying to fill every possible space with placeholder text! \n\nI\'ve seen that happen before - you ask for a paragraph and suddenly you\'ve got enough fake Latin to write a novel. Did you get it sorted out, or is it still churning out endless "dolor sit amets" somewhere?', 'type': 'text'}]`
- model: `claude-sonnet-4-20250514`
- role: `assistant`
- stop_reason: `end_turn`
- stop_sequence: `None`
- type: `message`
- usage: `{'cache_creation_input_tokens': 100, 'cache_read_input_tokens': 1084, 'input_tokens': 4, 'output_tokens': 90, 'server_tool_use': None, 'service_tier': 'standard'}`

</details>

## Extended Thinking

Claude >=3.7 Sonnet & Opus have enhanced reasoning capabilities for complex tasks. See [docs](https://docs.anthropic.com/en/docs/build-with-claude/extended-thinking) for more info.

We can enable extended thinking by passing a `thinking` param with the following structure.

```js
thinking={
    "type": "enabled",
    "budget_tokens": 16000
}
```

When extended thinking is enabled a thinking block is included in the response as shown below.

```js
{
  "content": [
    {
      "type": "thinking",
      "thinking": "To approach this, let's think about...",
      "signature": "Imtakcjsu38219c0.eyJoYXNoIjoiYWJjM0NTY3fQ...."
    },
    {
      "type": "text",
      "text": "Yes, there are infinitely many prime numbers such that..."
    }
  ]
}
```

Let's add a `maxthinktok` param to the `Client` and `Chat` call methods. When this value is not 0, we'll pass a thinking param to Claude `{"type":"enabled", "budget_tokens":maxthinktok}`.

*Note: When thinking is [enabled](https://docs.anthropic.com/en/docs/build-with-claude/extended-thinking#important-considerations-when-using-extended-thinking) `prefill` must be empty and the `temp` must be 1.*

In [None]:
#| export
def think_md(txt, thk):
    "Markdown for answer `txt` followed by a collapsible `<details>` section containing thinking text `thk`."
    # Leading/trailing empty strings reproduce the newlines that surround the rendered block
    lines = ['', f'{txt}', '', '<details>', '<summary>Thinking</summary>', f'{thk}', '</details>', '']
    return '\n'.join(lines)

In [None]:
def contents(r, show_thk=True):
    """Helper to get the contents from Claude response `r`.

    If `show_thk` is true and `r` contains a `ThinkingBlock`, the result is the
    `think_md` rendering of the answer text plus the thinking text. Otherwise the
    block returned by `find_block(r)` (or, failing that, the first content block)
    is converted to a string."""
    blk = find_block(r)
    if show_thk:
        tk_blk = find_block(r, blk_type=ThinkingBlock)
        if tk_blk:
            # `blk` may be missing or have no `text` when the response holds thinking but
            # no text block; render empty answer text instead of raising `AttributeError`.
            txt = (getattr(blk, 'text', None) or '').strip()
            return think_md(txt, tk_blk.thinking.strip())
    if not blk and r.content: blk = r.content[0]
    if hasattr(blk,'text'): return blk.text.strip()
    elif hasattr(blk,'content'): return blk.content.strip()
    elif hasattr(blk,'source'): return f'*Media Type - {blk.type}*'
    return str(blk)

Let's call the model without extended thinking enabled. 

In [None]:
tk_model = first(has_extended_thinking_models)
tk_model

'claude-3-7-sonnet-20250219'

In [None]:
chat = Chat(tk_model)

In [None]:
chat("Write a sentence about Python!")

Python is a versatile programming language known for its readable syntax and wide application in fields ranging from web development to data science and artificial intelligence.

<details>

- id: `msg_01LxGU66RgaTvb5HZd2mbqbF`
- content: `[{'citations': None, 'text': 'Python is a versatile programming language known for its readable syntax and wide application in fields ranging from web development to data science and artificial intelligence.', 'type': 'text'}]`
- model: `claude-3-7-sonnet-20250219`
- role: `assistant`
- stop_reason: `end_turn`
- stop_sequence: `None`
- type: `message`
- usage: `{'cache_creation_input_tokens': 0, 'cache_read_input_tokens': 0, 'input_tokens': 13, 'output_tokens': 31, 'server_tool_use': None, 'service_tier': 'standard'}`

</details>

Now, let's call the model with extended thinking enabled.

In [None]:
chat("Write a sentence about Python!", maxthinktok=1024)


Python, named after the comedy group Monty Python, has grown from a hobby project started by Guido van Rossum in the late 1980s to become one of the world's most popular programming languages.

<details>
<summary>Thinking</summary>
I'm being asked to write another sentence about Python. Since I already wrote one response about Python as a programming language, I should write something different this time to provide variety. I could focus on different aspects of Python such as:

- Its creator or history
- Its popularity
- Specific features
- Community aspects
- Another meaning of "python" (like the snake)

I'll write a different sentence that highlights another aspect of Python that wasn't covered in my previous response.
</details>


<details>

- id: `msg_016TJyrSqSWbAuswncFJW35F`
- content: `[{'signature': 'ErUBCkYIBBgCIkADIHw1kNZ+ywY7wv6qQfP8STLvwf4iz7lzg1idFGuewF2OOsWxiEFqDuhfYg3Qt41u+1SLe50oQySERi37JpnUEgxcd4xRd79sPih9WlEaDH93qslG2RDFBK0PoSIwr5iITLyR7qjXzlWIie0cI8EfVZ/lIBBj6tzw4YK+0Ozb9rdRtm6OOtwUBMeXA/qYKh0pdLh4C1RxZbg+djwpt0uo9o82jrj3jGnhYwvAKhgC', 'thinking': 'I\'m being asked to write another sentence about Python. Since I already wrote one response about Python as a programming language, I should write something different this time to provide variety. I could focus on different aspects of Python such as:\n\n- Its creator or history\n- Its popularity\n- Specific features\n- Community aspects\n- Another meaning of "python" (like the snake)\n\nI\'ll write a different sentence that highlights another aspect of Python that wasn\'t covered in my previous response.', 'type': 'thinking'}, {'citations': None, 'text': "Python, named after the comedy group Monty Python, has grown from a hobby project started by Guido van Rossum in the late 1980s to become one of the world's most popular programming languages.", 'type': 'text'}]`
- model: `claude-3-7-sonnet-20250219`
- role: `assistant`
- stop_reason: `end_turn`
- stop_sequence: `None`
- type: `message`
- usage: `{'cache_creation_input_tokens': 0, 'cache_read_input_tokens': 0, 'input_tokens': 81, 'output_tokens': 158, 'server_tool_use': None, 'service_tier': 'standard'}`

</details>

## Server Tools and Web Search

The `str_replace` special tool type is a client-side tool, i.e., one where we provide the implementation. However, Anthropic also supports server-side tools. The one currently available is their web search tool, which is documented [here](https://docs.anthropic.com/en/docs/build-with-claude/tool-use/web-search-tool). When it is provided as a tool, Claude can decide to search the web in order to answer the question or solve the task at hand.

In [None]:
#| export
def search_conf(max_uses:int=None, allowed_domains:list=None, blocked_domains:list=None, user_location:dict=None):
    "Build the web search tool config dict, including only the options that were given a truthy value"
    opts = dict(max_uses=max_uses, allowed_domains=allowed_domains,
                blocked_domains=blocked_domains, user_location=user_location)
    # Falsy options (None, 0, empty list/dict) are left out of the config entirely
    return {'type': 'web_search_20250305', 'name': 'web_search', **{k:v for k,v in opts.items() if v}}

As with client-side tools, you pass the `tools` argument of the Anthropic API a non-schema dictionary containing the tool's name, type, and any additional metadata specific to that tool. Here's a function to make that process easier for the web search tool.

In [None]:
search_conf()

{'type': 'web_search_20250305', 'name': 'web_search'}

When the web search tool is used, the response content is a list of blocks: `TextBlock`s containing response text from the model, `ServerToolUseBlock`s, and server tool result blocks such as `WebSearchToolResultBlock`. Some of these `TextBlock`s will contain citations with references to the results of the web search tool. Here is what all this looks like:

```js
{
  "content": [
    {
      "type": "text",
      "text": "I'll check the current weather in...",
    },
    {
      "type": "server_tool_use",
      "name": "web_search",
      "input": {"query": "San Diego weather forecast today May 12 2025"},
      "id":"srvtoolu_014t7fS449voTHRCVzi5jQGC"
    },
    {
      "type": "web_search_tool_result",
      "tool_use_id": "srvtoolu_014t7fS449voTHRCVzi5jQGC",
      "content": [
        {
          "type": "web_search_result",
          "title": "Heat Advisory issued May 9...",
          "url": "https://kesq.com/weather/...",
          "page_age": "3 days ago",
          "encrypted_content": "ErgECioIAxgCIiQ4ODk4YTFkY...",
          ...
        }
      ]
    },
    {
      "type": "text",
      "citations": [
        {
            "cited_text": 'The average temperature during this month...',
            "title": "Weather San Diego in May 2025:...",
            "url": "https://en.climate-data.org/...",
            "encrypted_index": "EpMBCioIAxgCIiQ4ODk4YTF..."
        }
      ],
      "text": "The average temperature in San Diego during May is..."
    },
    ...
  ]
}
```

 Let's update our `contents` function to handle these cases. For handling citations, we will use the excellent reference syntax in markdown to make clickable citation links.

In [None]:
#| export
def find_blocks(r, blk_type=TextBlock, type='text'):
    """Helper to find all blocks of type `blk_type` in response `r`.

    `r` may be a message object with a `content` attribute or a dict-style message
    with a `content` key. Object blocks are matched with `isinstance(b, blk_type)`;
    dict blocks are matched on `b['type'] == type`. Returns a (possibly empty) list."""
    # A plain `dict` has no `content` attribute, so mappings need key access
    blks = r.get('content') if isinstance(r, dict) else getattr(r, 'content', None)
    # Missing or plain-string content holds no blocks to filter
    if not blks or isinstance(blks, str): return []
    def _match(b):
        # Decide per block, since dict-style and object-style blocks can both occur
        if isinstance(b, dict): return b.get('type') == type
        return isinstance(b, blk_type)
    return [b for b in blks if _match(b)]

In [None]:
#| export
def blks2cited_txt(txt_blks):
    """Helper to get the contents from a list of `TextBlock`s, with citations.

    Block texts are concatenated in order. Each citation gets a markdown footnote
    marker (`[^n]`) appended to its block's text, numbered globally across all
    blocks, and a matching footnote definition (URL plus quoted cited text) is
    appended after the body. Blocks and citations may be objects or plain dicts."""
    def _get(o, k):
        # Works for SDK objects and for (nested) plain dicts alike
        return o.get(k) if isinstance(o, dict) else getattr(o, k, None)
    text_sections, citations = [], []
    for blk in txt_blks:
        section = _get(blk, 'text') or ''
        cits = _get(blk, 'citations')
        if cits:
            markers = []
            for cit in cits:
                citations.append(cit)
                markers.append(f"[^{len(citations)}]") # maintain global citation order
            section = f"{section} " + " ".join(markers)
        text_sections.append(section)
    body = "".join(text_sections)
    if citations:
        refs = "\n\n".join(f"[^{i+1}]: {_get(c, 'url')}\n\t\"{_get(c, 'cited_text')}\"" for i, c in enumerate(citations))
        body = f"{body}\n\n{refs}" if body else refs
    return body

In [None]:
#| export
def contents(r, show_thk=True):
    """Helper to get the contents from Claude response `r`.

    Text blocks are combined with `blks2cited_txt`. If `show_thk` is true and `r`
    contains a `ThinkingBlock`, the result is the `think_md` rendering of that text
    plus the thinking text. If there is no text, the block returned by
    `find_block(r)` (or, failing that, the first content block) is converted to a
    string."""
    blks = find_blocks(r, blk_type=TextBlock)
    content = blks2cited_txt(blks) if blks else None
    if show_thk:
        tk_blk = find_block(r, blk_type=ThinkingBlock)
        # With a thinking block but no text blocks `content` is still `None`; pass ''
        # so the literal string "None" is not rendered as the answer.
        if tk_blk: return think_md(content or '', tk_blk.thinking.strip())
    if not content:
        blk = find_block(r)
        if not blk and getattr(r, "content", None): blk = r.content[0]
        if hasattr(blk, "text"): content = blk.text.strip()
        elif hasattr(blk, "content"):
            # A block's `content` is not guaranteed to be a string; only strip when it is
            inner = blk.content
            content = inner.strip() if isinstance(inner, str) else str(inner)
        elif hasattr(blk, "source"): content = f"*Media Type - {blk.type}*"
        else: content = str(blk)
    return content

In [None]:
chat = Chat(model, sp='Be concise in your responses.', tools=[search_conf()], cache=True)
pr = 'What is the weather in San Diego?'
r = chat(pr)
r

Based on the current weather information for San Diego, here's what I found:

The current temperature in San Diego is 72°F with partly cloudy conditions [^1]. Winds are coming from the north at 2 mph with gusts up to 10 mph [^2].

For tonight, expect cloudy skies with a low of 61°F and winds from the west-northwest at 5 to 10 mph [^3].

Tomorrow's forecast shows sunshine along with some cloudy intervals, with a high of 74°F and west winds at 5 to 10 mph [^4].

According to the National Weather Service, today will be the hottest day of the week with temperatures 5-10 degrees above normal [^5].

The air quality shows some concerns, as the air has reached a high level of pollution and is unhealthy for sensitive groups [^6].

[^1]: https://www.wunderground.com/weather/us/ca/san-diego
	"zoom out · Showing Stations · access_time 6:33 PM PDT on June 14, 2025 (GMT -7) | Updated 5 seconds ago · --° | 61° · 72 °F · like 73° · Partly Cloudy..."

[^2]: https://www.wunderground.com/weather/us/ca/san-diego
	"zoom out · Showing Stations · access_time 6:33 PM PDT on June 14, 2025 (GMT -7) | Updated 5 seconds ago · --° | 61° · 72 °F · like 73° · Partly Cloudy..."

[^3]: https://www.wunderground.com/weather/us/ca/san-diego
	"/ 0.00 °in Cloudy. Low 61F. Winds WNW at 5 to 10 mph. "

[^4]: https://www.wunderground.com/weather/us/ca/san-diego
	"/ 0.00 °in Sunshine along with some cloudy intervals. High 74F. Winds W at 5 to 10 mph. "

[^5]: https://www.weather.gov/sgx/
	"Today will be the hottest day of the week with highs 5-10 degrees above normal. "

[^6]: https://www.accuweather.com/en/us/san-diego/92101/weather-forecast/347628
	"The air has reached a high level of pollution and is unhealthy for sensitive groups. "

<details>

- id: `msg_01TqqiUjP4ua8Lqgdb9qx6du`
- content: `[{'id': 'srvtoolu_018EJgmzXbsoYSRWUMYq2DBq', 'input': {'query': 'San Diego weather today'}, 'name': 'web_search', 'type': 'server_tool_use'}, {'content': [{'encrypted_content': 'EqcCCioIBBgCIiQ4ODk4YTFkYy0yMTNkLTRhNmYtOTljYi03ZTBlNTUzZDc0NWISDCaMaO6VgxiaKqZXrxoMNAD0b/ETmfNw7RkxIjDc1peQ1+ADsdjQIltXag4RocW9N9eVMb4pmUgsO+XV9hKsDYJtFKuYDMuZ5SzCdUwqqgEN6WHTbX+1ePj08vlE5eW8NmJOpH+qKF2zx5E3F/Z5Z8lh2uMitZu2rKqwqhlNAcUFrEufQfoEkpuEWn2oSAffuJCGI7QCC5V+Bjee/f6ryDX6YcWFoLyWHwGP+XRQ2CW5rbVEtCO44UEXErYkJllmpjAyK63Bi/9JTRvxJlNJGYLGE4wD1S8wFF99nhdISqmHurPneNtWLzUrVSofLUd0iUNtDBdD4OlJbxgD', 'page_age': '2 weeks ago', 'title': '10-Day Weather Forecast for San Diego, CA - The Weather Channel | weather.com', 'type': 'web_search_result', 'url': 'https://weather.com/weather/tenday/l/San+Diego+CA?canonicalCityId=3b2b39ed755b459b725bf2a29c71d678'}, {'encrypted_content': 'Eu0MCioIBBgCIiQ4ODk4YTFkYy0yMTNkLTRhNmYtOTljYi03ZTBlNTUzZDc0NWISDFshmUI7nR3olbes9RoM/aA1chqe9CKZoDqgIjBv2Rl4YrhD9ecV7x1nGMkPv8VXk40g1CVo2Q312leODqov21X0Z/KUELfHOMBPDK8q8AuRAdIky5BupOL4SvUA30F0Rdw6xzBKifWNAYrqTmrSpaBOtljmPzkSLTQ93Z3QqAQbghT6NTRKMPKDRVfZ2caPtkxtd0HpOKdHK5T1ITmBl7A8H96DEN7cAlf8ItNovysmTwvqN4T6swVcw00iaiGyBCCKn+DoGpDxrdDVyNbhRmaavPzzO6/uLILRo89t27ouJT3hHw8JFsIBgE9ggdBf9jA3E3rZS/t1yP5FI7Ls5SryV9tAMvjLJgPteltaXE20GPd22vFBUQx2GCnNe1AViKCPQNJE4LfGX1WCMRdCg73pyDyT9yDBTRLQd5AEx02Yj2roSIk/Z2snxH26RqYWirBi1xyNPDdDjooUjfJqPyXcvIPGS+ssUVzTL7j0rE5J0rypCvWlb7s1ldpHHdSg5W7lG5EIgXaioWradvM2KU0xUadNqtKNDAVyYf/eF86dTGawigupA7Va1zPK9e7G5ByqWNIozsP9G4N58E9PQsthe+MGWEskJ9Iaq1neXKXzFrsRY2VP38aJ0tgIqO5tz7ZL4h6A86VcdmGPMNdEQygHaZ2GKEDBjWXcbs3A2iS04DGp/JEhzq1Yn2miuIJozhhYmAGdcMH6QM4JS1NhpRngH2nzEToUCVC56ms1SAKgKHPkg5zcNZNDQZUh2UXIuNs8P8ZArxn1rP+bmJIO8cIM+ZJM7BRHLfh7ijpGeiSqpV0/+QTLxjYC57kUKbnAj06Le449koGPsTnyQsuJcLg0iY0zXroFnzopHFhlrNDg1/0gNTBp3xJeT2CUDxnDkF5pmx1ZjvzeZvWlaDJ7pE0AtsN6odenFBUFK6Qs9mZnJWBfIzr/Qmvq5yisWAqoX+MVIBd+LzCdOe40XhLkh4mR3c/WwPzk74hPqleKcqSkaK7Il1fXVBSOO14AeKTSnUwh3fL39Y2aWY3no30HxCD5e2728TDhXcLsSBTL
+OYiVTdajYWWPxmvAVXuVsMAn7Oc91Z9uJrD7LHil95sKC4yYtFBpEAMwBTMN/BTEd3hi1RLWdpnTqBGSrdFWFMidRKWCsO/KTTxIWITzA5OaZxjXhlFEueEWcr/97oR82qZtNWdWoBjuMHanPbpmXk0h+gzRcKD8kEGdWzqQV3zhlLSu8QFjbPoYahlbGzhY2JQTN1YiRE/WdCwC85KgwLtizDH1MLT1ax83WY+kPQbpqQiV02kOri0CDw1dT9I5Sg3zeuiNXG7VKGv4HAXHWJZKKNb0Xa8bAS3w8plLzjziNb0x2aXoQHwA+QsA47VzBNY5j76pE+GGaZsWMDLqm9Qigi1hNnylX4TGwiTzI1Qv6GXQB21PDFHOPKSPat3uXsfvGiNl8ITIgctrnXR/bNAYvM6Gnk20Q8WbSS3aVOD+e453peUHpq9Pfnaz1uedMlOSgmDZ7mBnhtK8Wubt4JfKRCnRUy3d8Bj7R142vHIH7TGxpbCsnT0WPsSYWYNl4It+oyJ79U/oLhdnHX7F4d+m7HJW0WY4IHOhWSxvSqqDcCnxL4UtbAyiqfaMU0U+PgQa17UvQDdJRu3wl4M4AfC7Zn+ALH3MHL5RJFHA7gmRAM+f5v8Jp7J+jd4rEC0UHllYLbVkf5s60SGMIZ7rWzzmnPNhYwWmEWXFa+0km6UyzvmbhupxoLTEGlbF3Msv0LXSa5YN+e5zdqrL9KGNBjoijoSRcODfxrQ0omr6cT+4TO6pGj+cZspQhuoayjLQ3UMXCk/OX+rnM90muUEyqA0racQ9S+BnVahvChhfHxmXTkNHW6JcIUfOif/bzn24NyQB25gQyFne/02SsSSN2PLH+FUmDLuPPcjm/q4Por2gTZTseI97gsxfdHgctmeEU0HGOZJYsq+9nLrMg4AjjlzJdcDg/PmEOtUgpl0mqC8/1i6GMCBkpX8XZPF4uDvlzrkzRi6sJMv2+baqGV/hDtJk2796DvQOmSFoBT4an7tD3/lfyBM190ASvn1/tYxYnfgVUY6O+0xSjSSOQ7MY2DVhQYfeSfCo9d9EqiLB7VUGRgD', 'page_age': 'April 15, 2025', 'title': 'San Diego, CA Weather Forecast | AccuWeather', 'type': 'web_search_result', 'url': 'https://www.accuweather.com/en/us/san-diego/92101/weather-forecast/347628'}, {'encrypted_content': 
'Er0ECioIBBgCIiQ4ODk4YTFkYy0yMTNkLTRhNmYtOTljYi03ZTBlNTUzZDc0NWISDNY90xpfN6cqZ3++9RoMEQkk3+UnooY2hvGvIjDRbFmzhyteUhit4wvP43DaEaq6On0KmhshYS05b6F6qfHvY5C+/3HE7ImVBQ9IBx8qwAOOY0n8A6pSd0GIWiEDOP/lodpa7lu4v+W9YB1rKIbJhTsB/ebqChX8YOKcp9Fzb0Y/O86CIv/Kzpdz+vCUY+UBZlck+ycNpsGNt/MbI+zvk6025RnAwx6jOqyUTou9Xz2JS1FRSHIGB4CkZ9MGkZQw7tdOle4DflfvqoM01O6vwIe+abxsfTtVULrPenYKBPJ6RdiFqf2Hmr/3HaszD02aBibLGWimgKlYDwNHWgAJtiBe+D7YQMFzWeqC8Ybhg5AMnAX6Wmrt3/GYqSryRf9p2wFyPrHBLz/qLd2/94ACJuTVeIQGn8+gaMVZcSZBGmqVzV/Vom6x3T2Ooev2RiCD4lUY1OkNvlFxnCPvdGQh8WuvR108S0tLbwhrdaeoABXzTiMy+XCHUfcFhT6tZUdaaQ0bh/uUPcayghAPnuJVUIkecqZnn/AumAURBlB3ilWhRWS9RvtDXqb4fSYkgT5RBEZPt7j+faIecWhguusCHAyEToebHKdjn/vW7PSOZ3H9jzDSAdOOfS71P26OtTjfgR0ZxijCsfCjO6GWyv9l5lWddc7a4m7Uyph6GeLgpX66OOu/e2E/tg1O04Hx+WC2GAM=', 'page_age': '4 days ago', 'title': 'San Diego weather forecast – NBC 7 San Diego', 'type': 'web_search_result', 'url': 'https://www.nbcsandiego.com/weather/'}, {'encrypted_content': 'EpcECioIBBgCIiQ4ODk4YTFkYy0yMTNkLTRhNmYtOTljYi03ZTBlNTUzZDc0NWISDCxrTkwD4JR/u+KimBoMIJCy8vf/Ko5P18U8IjAv37v/Hi7vudgCv3tQzfHyFby4i1y0en4Ct9ASZ5tlXxoNBukiCzBybTmz/iS21QsqmgNyxn5FM89mqxMc8+oV578FqknFaMBe32Qh7U0kmqXO/KHZAgdUj2jPmzbI62t+fJQ9n2gKBVWbtS2hffql2RVrrT/+X+kuFrDLev48KbhpuCpjXDqtaR9Pu4N0JjjA+YJxNLxoDJRpHn0mrFjctMNexU9EbfMBM52FBv31FfXUpVbJoCgi2qiPhBOIYqIlo8I4NJdxxZQNGuOy0fgR7Wfp93wfy6fpEv0vccUyi0SFgY1Yo5cGWHi10tWjc5kMw1ZMxMRkvVf/8PRANNumWdjMVFiAU09kylTzTBKxa3tDdMdwLn6vBKaWJRInsJvGMBRHQh6d35ZiuI048PTPa3nY9rK45PFTSyu8Xgm7ibtRMFWStFHhX7T3rUUE/CAF0g0ch1sA+zCkSEsuSWF8YoQ8TFfUbBnh60eZ2dQfrGPNBdnhawsPgSoaBw02gxh4WiAvl8d4NaK2KiuyxRW0TmKF44EpITNT9c0rzN8fJ+9qF1qODWgArVVjHi7YRBA1FmZhITO3p7xDwkfblvVlaVwEEmTTvo+1JGhS9xgD', 'page_age': '5 days ago', 'title': 'Weather Forecast and Conditions for San Diego, CA - The Weather Channel | Weather.com', 'type': 'web_search_result', 'url': 'https://weather.com/weather/today/l/San+Diego+CA?canonicalCityId=3b2b39ed755b459b725bf2a29c71d678'}, {'encrypted_content': 
'EroDCioIBBgCIiQ4ODk4YTFkYy0yMTNkLTRhNmYtOTljYi03ZTBlNTUzZDc0NWISDM2M1q21W4CwikdFEhoMKLh1bM0WqSMDv5VUIjD7DfvNBcQg7xe75rPnWBitQLyX43rik90OFX3fbOU2e2PRBSSkwTLXPW1fgf5rkkwqvQI/zg1bUksm+kTH7Cfkp/n7HIg59PA4chz93RzHeOG4ot8TaXqx+ozA//xDXOTMHDjex63EP57iznGaxdBJe5O6WBbgT0fZlxskjixOPCJonI+KJCYzakf8Tru4GSUlgQBc/NxG+tcYoR8x1J8Q0V+6Wd9Y7+uViYcohaRXem/R83bS+BvENU4lhtuTAcUrT9IpWWqU1Po3rDtlGiOQo8Gf0qgByCMNYxCuOs7149jThdN5CYg9Avm6Cbw14VpG7M6wxhil4GLlRVjfWu+ulRSTECE93Swt20WcghCr/II/ZUGcuA8g97leQPphDFEmbQIB13STx45/mTcXR7cIplv9Moho+PGh7EK7q1rKsLtH4RPgcSdiD934eD2qOhntsI93lu4P4a+zWUneEicbRK7D9oKAPRkbChKRKmcRmxgD', 'page_age': '1 day ago', 'title': 'San Diego, CA', 'type': 'web_search_result', 'url': 'https://www.weather.gov/sgx/'}, {'encrypted_content': 'EoUMCioIBBgCIiQ4ODk4YTFkYy0yMTNkLTRhNmYtOTljYi03ZTBlNTUzZDc0NWISDKSHiE0ERHQskYMGtxoMALIkXeohSYJrbjWcIjDEJo1/wqCA4y9NlQQK8ckAD9hqUcXgFPyScce9ZxdQwZDcBKKiq2w76Jv/0PUYbcAqiAudVK8jRop1PsSV1Vq90qybbuZRnztS8ozbhN2PtxrLQDzQ3qTUzgaUaZ8R0yPP4V/WEI04OcLuldYLb6GV9yKcUYwlbCWmB9ICEdUIizvmMqXu6YWjt0EIwsI4KQRCIyUEpH54yBgOSgacpL9sINYI2cPOvlCKw3EJHV3vUcL1fLV4wY7J9i5a0eTGobCBb1oyoViL1mSSi9rlJ/nOTKzcYWwkplyj5hV+VxlndoEMkr2tCCiC7TccoEXS3zgZ+Y9JepTlUqY6F5c9B3t+gMKoybXQ7uTsg6EkhW/k/M38YfogYnUQ7V0lh5ySbWpFU6FbwORItk4mRyR2y8yUxbgH6zgM3YSXKzHqv6a6MIAlXzaSEd3c2aK75gysMWUdJ+HlZMA/6PQXFoREhO42qJpq1tNSUUPVou46GNflnuRqmyw0Zb5wpn3xfhg75AqBWhvb4rrB+ZPEdHwJsbqrnRfWwsfILEywxViYSVTlsvre6Pne1FwNdJaKV7j/AqJYivHCzwgGqV3hpzds7QbTf4SW3g92s1LR+gNvS3FXjZRGJn6R22NUyhg5vf52Tzp/c+flBLCeb/eUFiLRNPLA/GvSC0uPphP9LDPQmPgfAq/iPt7R/KdbjDBED+vz5U9aajN9X30STB0MNFjXpxzb9d0XmULk/XT4RQsq3AM+nQlQvXZ40uf6djc9Vpme0QLUHNh/XBu+07p7FZ16t9kuSeXJK+Orb2Bum4H3tMQvhhXSebO2h9FzbLGxrvxj0GQtp1GyfwMRy8IckwlzuIF/VWBUhL6NvCUrQ7HkhuytJXDW34WzRF6G4mGY4yTQPfAHk4hpQ/slIXQ6FlFU1zJn5y0XLv1bNOttKF0MeVYXvNCfNuHbSvMPL2lGevQyAhl6SCuP5s6M+0N7BN1+JNGU1H+sZCngEj4wRjegXl2Z75Wzj50s3pZJPeKxRm6ti63XHc/QmQUFuhMiEmpsoOft5GR4O05dTS90tNBdllho9usXnTnHcfBjxPi1wB7uw9LuVu0/OMdgIOZOIWg+usSlTloxFlh8czRnJ0dxNrezOWqVpThKVvEnaae9Id+SnzcaS
n4bTklLtaMf3ZgHm9Z2TcSrI7C+wEdXqSCLQOXkg038gvMuE+jgdcK4RzBvIuENhNPvMWd5oAWT5VI3SgYlozsTe6GKOmQqFkFrEL1OfH0wcTV4UYav2f7DOhg1NFvbHPsuFNaXBIsLR6nTTSZZWEDA9u5dLBjoyclrdHpKB+AyQkPAMDrSak2STdVWx98CMvckFYPjw7cVEmUar2ZM2k4H13hZMFsLzttyfNmE7FYurp2PkOeeWS9exPexIumFvCzfZtf0B25JurJANfzAoNZXvFPH9KVz19DN1iGtm8abUJ3Zfgcbsy2S3hNj+P0m8rKXEMoUQyS0N+zs8AaneFlufh6j4tUE4qnJ76QFS1I8l9ECc8NmNNSioindW++ciT0NHW0o9XyDECFHOMUbpG+fccQXQ24nbAd8IDf2SoioD/1/gBKaLohqzklBLdqToaF/cNhOuoOpJE7Ryjp+FF1CbjGFHEqgko6olUmnmO+iIGkSSDlrjX+An4ptdaxOfEoAph9Rsw7qJGjnVaOkWJh3I+H5Uim7a9dkvJpVmaBf9dJsihwiYeCIl0iJCbo1bUxWO63kIvWF7FqG334bI/DOIibaBHtxenlgDuOV+pdWm5iLSzQmP62NAH0ShqW1tjKPJ+Xd8lsLBkDXBXIEa8IS7HfOhES/R4zwJmmZwvB1Q50BgnsugrMAWBPGtdW4dNVnxazVskbOSI+QCZDwKHScDcAinimo8ZOgvt1GzKUvbvk6W6GeH0TuHSA4suppJLvUUCRLT6yakWF1tNIQRTdeYizpHfBsgP0YAw==', 'page_age': None, 'title': 'San Diego, CA 10-Day Weather Forecast | Weather Underground', 'type': 'web_search_result', 'url': 'https://www.wunderground.com/forecast/us/ca/san-diego'}, {'encrypted_content': 'EpkCCioIBBgCIiQ4ODk4YTFkYy0yMTNkLTRhNmYtOTljYi03ZTBlNTUzZDc0NWISDISA7lvI35O+vFVLtRoM42xUKvGTd+2vHcpaIjDcPSz8+HKJEBoL6dOeQV2ZrHaYZYbgqL0RZotRA5U+ak0Slj4GbEASiq5qceG2o3wqnAFZcXWUbWditOgxdiKZMwU9gLoVTt+rZg6tERIiNQaPchal6ZhnTJ4zwketdwkNua+71SxldweH4ZyrNNdh1PePF10TrbGXt7oYwSfZ9t1eyBvnnqqYJ3vb3MIpGC10O24bNVwis6Ao2ghRD+rYENJ3+F/g+o5ehIEnDeHKrFDt0bW7W800oEBLl4Sv76tpSK3yHTNbiEOTKmYW0DgYAw==', 'page_age': None, 'title': 'San Diego, CA Weather Forecast | KGTV | kgtv.com', 'type': 'web_search_result', 'url': 'https://www.10news.com/weather'}, {'encrypted_content': 
'Eo4NCioIBBgCIiQ4ODk4YTFkYy0yMTNkLTRhNmYtOTljYi03ZTBlNTUzZDc0NWISDCvQiw3hiXo/wWdmeRoMAFSFMoFWqyD2CohJIjDItSLBfm2inh6cRnXUWi+Mm0CxxvNQcUVvrRvA9Mp5b2cHMADF0KiwgHLIGiBcYg4qkQwVAS/B/QJt0ZKZHgN2l2ocNS/fohkQffm62MoJrrVfoRz2iKYz4Tr0OYSeoC8P4sM8g+KqlltKdWCWA4JGh0qRb4ZVUS1Q2+jGbLvvE9GTTeeylQh9ljTKTHiKagEwIApr9T+CRzaPNTebE4BahEf7wfbKGapziCsA+2I59TgwJ2cfFXAO+YnWvMOtKzutiU6xMuShRFAq8vlbXA/Xmr/UaENeU4vXXjLWSoCHZkX8PHv9hOdWB3LSAm8XTK1lsBdzNS90l8SjHSc7VhYYg5Iexpjnk/KajnOg8ZEgaJMZSCyPoOVCmbmd1gsJEBMgDb/V5FXxFCC/p5yYB/JGt4059J0l/7mG7XfAJlsIQV5jrEjxY3ByMLZ0ehSXaig6wgNdu6C7+ZxV2KtHSb8Wshbl7STLhfTmJZk5+XVffONsTUKs9IFVnnBkWhUac9ukb/QNERSS00hnc0uCVog8azRbt1QevRiwl7MorHYZsNmYsZ2sZ8CCze3k6b14ETXNkLF6HL8FhZiV5pIL3DPCQ7MIZh8wxh8aZ+g4A3zzSKFecC+mL0EswHVNmP6b125GShjs4BjB1U2jYHPEDcQGX4K4ZrA4DTcNeVNkxcWGYUADvkVW8BKA5/kt17V2T4LIj/VS77ZApkAbuapwFs61NUi5XNfWsAQvdyxzxUzR8FBGYZBcHoEYV6an3ItwjDVF+8gDRb25+9pHFNa55uA8Q7BWOvB6VN9axchbzBmXiAbnOujbWb4B9oR/f2NGblFvmLr3Ufia5Cy5B5J4zZ740m8N8cASzKFFNdVghwmADq1WMm1ofE0tTXNN+iRPfexGyR7v05GkiKT6SgxDCcuiqdC/pWQbirQ5g5gua21aR3W23jbdPwBgPSQRthglch6zQf27L2Siexao7kAVEAsV3xQrAPco+UQnuwdIMwqumChbRPwQCAgj0luSlPzZKxmZwULQ2eojp3kRslid0OowDT8vNuBZJRHx8rLnpMgvdK8sg9UDmZP/h+FMAA7ZoWvALqSaaC8DmI6eVMNZAKIxh+041zakbJKyUb194q/VNWZwCcvcOaLui+m3+kRIIre2SOqvhBcIVuyyleWs3G3EPlEzSPipBNWF9P2cW7Zgb0Vpkl1bN7RCOhxSUmKDgzY76CYBriSYs4bqmTq0K5ECkHKDphC9jNLkw+js/0Srq1nmlVndDAoNpjwWXWI7o1D7VQ45l7VAyaMCqXmbq6Ec7s8wfLIaDLje2j3UK5K+MpsyzUqzJHljj/D0nzqb0PgRHEKZNo3MkeXNH3GESW8A8cvBMCWufk0r//QGt1YAgbxYIae+tAxRVj1ZayVHAXim5UDcw8BZ8V5JCt35elyY7A5xG7YSa7sbhtrfBbs0LMxb2AEp34QQpeFhJNEAcO9D3RycrVYBnLVHJyR1xMPan91ec94UIQzImwC/Esew4m7REV8zQT0SF4RI3wNgm5Wl8evDPccHjG4zrzYHmqkKrIHhiPlJGnE14Qj3gapDMECQ5TFFPZse0IhFoe2rsnzcUryxiCPb2EZvVzoOFnSPKKcJjBLvP2vnfVZKvsB+utQ0KRAZL6mLGJHTzl7QzbndEJM0X+kEsy72O0UbG3aHdo5K5Vs95ecIWDc/Jr3RbQNj27fTp44LY0IqlKAzkN+gTSnalaaF8ILQO+KCehsRfGGJPOyjhkRlW9xSI7HQsDt+lF8UzAFydjsN1aIAE86QzzSRdl60EBMfkFwykHsy8U+fQ59mGsQoc3y/RZbRzAyCqhhdnfcde9chB4ZGSbYlfzMjzyA4sMfrJfIC61DOcvVbk+V5aQKI8jZRNjv
/gMMeKliDI2NlHzEtlbScYlGi/Wuri1slR17j1zaVfcBEhTBs0OixtPDzA837AJCs3WJ44jmgg9KeWyvtrs7F4lf58QN7zp2IcC/48Uq33Qr+CntmMN6IAG/iElTimsReyLQTIcV+u18UKa4ecwqPh9fLrfHVuYHiVEnDir8atKJL9P4HlZhKFPAHWDzGiCGrZUXG45FNJPjr/k9AXSzNUzkbSSiLv4QhmX1vOgo59ZOJEmP6zRgD', 'page_age': 'April 12, 2025', 'title': 'San Diego, CA Weather Conditions | Weather Underground', 'type': 'web_search_result', 'url': 'https://www.wunderground.com/weather/us/ca/san-diego'}, {'encrypted_content': 'EpQCCioIBBgCIiQ4ODk4YTFkYy0yMTNkLTRhNmYtOTljYi03ZTBlNTUzZDc0NWISDFuTkKRdyjRoe42sShoM9INXl1iPL+1H6qL3IjCiDxuIJSjJ1HzVWgPj4SyXbQ+cTM43/iWCfjtkzCnaos6zOMQs9v2r6lv5NyzjELkqlwGKZK4hPA791b7rZr38bK1pJn/0EWh8rZ5lHGYDD1OWpIr8i8Puc1mtfrc2jSfzR6Bgvbnp9m/0L3LJDWKzyBgXJKCHLiA38l+Myc/4vXDkHOd2dq+lj3vE6GKvUHPz92p0kogKPkK/+GsnzceK1WqwMb8Bhlsom6fkVI8GAdCazJp1t5dTt31TzmhInIDolIXoJerldCriGAM=', 'page_age': '1 day ago', 'title': 'Hourly Weather Forecast for San Diego, CA - The Weather Channel | Weather.com', 'type': 'web_search_result', 'url': 'https://weather.com/weather/hourbyhour/l/San+Diego+CA?canonicalCityId=3b2b39ed755b459b725bf2a29c71d678'}, {'encrypted_content': 
'EuANCioIBBgCIiQ4ODk4YTFkYy0yMTNkLTRhNmYtOTljYi03ZTBlNTUzZDc0NWISDPPaPpMtSRob70NnLxoMWJpuqxpoxZmbY0rCIjAkvstJ8UOwYoDrWcbisjekzykmuGlItq3XBmDhcLH/C/RFSw6ItqMik9VW2jnKTU0q4ww9rLWd/CfntwRSWY6imyTeiIpLBiPkm7vMKI4+cFpFQUv05DNNJW7IUyDDmwFsO2VkPnOjpjjzLS9SGfJ1LVHhmBGEenACZLBNRvuByf2U+Dp5mZMf0m5rTLY7Vh0+Z7Qjj71M09pg3sSumTGjD8saf925dwjAJHuoBW5aA0YEN4EmAl8Xzw/jG6Yvx4dv0+zIRXRpxXrbIk3ztlzqbflMnp7d/yHbzytW/h4bP+z738IQGrDfyuESJqu6WTUorMtTOi7dQ3jiliH9W/5EiMjAQzxu4eKCCES02sAsKeb5LVI5Yg4DeSW6VGA2FagGSKhXeQ9vx4M5ka+NNT0i2hm1ZGlvScGvJVzGlZ7AFhFBLSriIq6kZJ83GEyvRiLspZ+KoOIYmHpJK8O7UcCPI5RiS+wMN2IqTxdvzSz0uzoUy8eWrNeqtgyMVmkwqFl9nKuq7qKEK28O61hcPsTNt8SIzK2sLBaW1aVrTB0TZdnxgll757riA00T40/Ybc4YsjdK0EJKwgVQy/YvaEFVkj1LV2DoMJ4qVnLx1ClQdZ6QnrfhdWUp7Tk9EhgOnUcp9wn6lksB14gz6n9RoLF9gwZsAoFsZGo+/rUIiprdcHj4QT+ZXpOFUfsBvmaFaMCHlMVfUcMuWJtPHKlYgLIZufe+p04boJxhAGs0atAKY5xCHV01n0Ge9ftQWrYKHBMD/Nxl+Dt0ZGi27zk0OEms6lm3WRx1n+AyAicUn2nvv+zyO8romVYJFZ26ReHHhXGfbNnGMQVFHfzv0MoKoA/va8N4hNXDEnjelUNH4M1dAsxO4Jr4+xrHUvoBGg0P34osnuCh6r5jdauZT5A8fHLd2gGSTIP6BbEv2IuKhppLMkj0t0jq80L7K4H0Fzd80mQ/fKeCVGwJAZCWi/Y8rSUDqiEaQNeW0gWcDybgMTwqDgSc/6jBrpzZFZN94OFsLJ29situKj/YY552OUf3oF6ntY82ZAXaIqexbuZPTPsL3cCtp/am82lIg7dMfZYnUn8aKXzs1dU+KquSnDYUD7pzDLD4tgk9ATpY32KqEso0A31/fOdRriyxtcYQBPPjmZlpb7M7G9Q6kirEqAAbza7JFmxqjmv3laKBjjHfRXrPR+JZ5i27dxOiZS5BOXq0+vtM+KUYZHYfLvANTNX/K8z5AJ1WchyoroSIKxvcXkILQ9ZsjmOvFoCMDRFf3HE8oghU1OkwV7H0+JDOrTCUux5TCdA5q0/n85T7Zk/Qz73ECGP5SqtqLU7Ehu61dvC0yUiWbYxGjzW8BChXHCff6KyPIbqC3c0TCd47QeKLwfgI59Z9jhHbPPXyUnMSeVPvHR3PmxOix/DvfaH4f6Fnnh2GFogW1cIY3J0qKLMgn7dzQKMBt52gHfjZiTgL3Y6HhXahOqD8UEIFCsF9AATXmkDM3bY+i79r35qLDmxrCMdaLswGLrIvLup3WYRcW5K6xEpKTOIJ2gMK29XRu5hM5x1h9FnEoef5JM23k9METMmZAvl4mOYls81rre3JacQx3G5e9eUAV57gh9J8EiBvSIdt3kaRaaDpTWTutvGZT4ltL8guPooxi+v3y5wQAfypBw7zPvkudComy0XXWllWSunbygpQARCyRXxAhmrRJ8iMFxvZrgZqkP/H6z7YU8LptTQXw8wXoKMzvtZxsRLo6OUF9TB8WC6inY2tzAlRuUoIz2DHphLVYbL+3+ZSBeOelQrnokfNVKhYdW2R105LurFYU+hdoYH4DVklq0u4K0Gjf9ksciUNyWSj4gkVQpmVi6S5swdWxovi0xDa3EVioQU4UiwegWtGMPuSebGop52
y5HK6hj9MTOMrZIfAxIIg1arJhil8hdUXPMbLFeW5Yk7KPt2PL5QpoBFNjDi3V6kpr+A6qFVg5OOuJj0+wYAZQs4WhoWY0YUmeQ36MD+M0fyK5ipYvZtrPHzovREss3Zqga1LCmUH+5EsSdIEiT7f75GyVcj4fi9k8fo89fS4SydpOTh30XQGsfMfLkBN/ATnfnrXprXP4tjSb5cjvH2Olmqa0FBp7SCf1WGxc3IFaXYXw/DcPs9hndVpsm5D642duity/95QD+P1pOZR6KBkTMPWo+EJdnhlYlB3HMyP1zqbRH437FZU0MwJTeKG/YR4R5v4AXSk/T/iw0FPa5YJizg3ya7DpSYYAw==', 'page_age': None, 'title': 'San Diego, CA Hourly Weather | AccuWeather', 'type': 'web_search_result', 'url': 'https://www.accuweather.com/en/us/san-diego/92101/hourly-weather-forecast/347628'}], 'tool_use_id': 'srvtoolu_018EJgmzXbsoYSRWUMYq2DBq', 'type': 'web_search_tool_result'}, {'citations': None, 'text': "Based on the current weather information for San Diego, here's what I found:\n\n", 'type': 'text'}, {'citations': [{'cited_text': 'zoom out · Showing Stations · access_time 6:33 PM PDT on June 14, 2025 (GMT -7) | Updated 5 seconds ago · --° | 61° · 72 °F · like 73° · Partly Cloudy...', 'encrypted_index': 'Eo8BCioIBBgCIiQ4ODk4YTFkYy0yMTNkLTRhNmYtOTljYi03ZTBlNTUzZDc0NWISDMiDDwXL9x9T1822kxoMnoM61hIgtDvqZK7PIjD3H/JD/Ok2AX/f086uI3EYr1ABE87DbyVa7vSKDjnLnk6GISaJmCGPgs0exLHQPgEqE75O74HM8P+d7Kwr5HyKm+IicxQYBA==', 'title': 'San Diego, CA Weather Conditions | Weather Underground', 'type': 'web_search_result_location', 'url': 'https://www.wunderground.com/weather/us/ca/san-diego'}], 'text': 'The current temperature in San Diego is 72°F with partly cloudy conditions', 'type': 'text'}, {'citations': None, 'text': '. 
', 'type': 'text'}, {'citations': [{'cited_text': 'zoom out · Showing Stations · access_time 6:33 PM PDT on June 14, 2025 (GMT -7) | Updated 5 seconds ago · --° | 61° · 72 °F · like 73° · Partly Cloudy...', 'encrypted_index': 'Eo8BCioIBBgCIiQ4ODk4YTFkYy0yMTNkLTRhNmYtOTljYi03ZTBlNTUzZDc0NWISDCfSx4X7AoCpadfCWhoMKValR7qmllSkvMczIjBx9xJWR2xNyIWZJ7okQTGNzC2dqTqoLIr5cu7skk/T2Nmln+owCx0ueCt5nMtszVkqE2ubFs32WGr9g4tgVzVfZTkbRREYBA==', 'title': 'San Diego, CA Weather Conditions | Weather Underground', 'type': 'web_search_result_location', 'url': 'https://www.wunderground.com/weather/us/ca/san-diego'}], 'text': 'Winds are coming from the north at 2 mph with gusts up to 10 mph', 'type': 'text'}, {'citations': None, 'text': '.\n\nFor tonight, ', 'type': 'text'}, {'citations': [{'cited_text': '/ 0.00 °in Cloudy. Low 61F. Winds WNW at 5 to 10 mph. ', 'encrypted_index': 'EpIBCioIBBgCIiQ4ODk4YTFkYy0yMTNkLTRhNmYtOTljYi03ZTBlNTUzZDc0NWISDNb3fDJ3zru9wKRjwRoMmJlwNM5IJCeYbtq0IjAROe1gt4pZSWbLgKQEh0l3BAxuud9Tzl6SIh165ZyUQyCncoVcN+LxVXltIERrX5QqFjWM9wXYtljky/+Hn4z50Gcc6YEzY0oYBA==', 'title': 'San Diego, CA Weather Conditions | Weather Underground', 'type': 'web_search_result_location', 'url': 'https://www.wunderground.com/weather/us/ca/san-diego'}], 'text': 'expect cloudy skies with a low of 61°F and winds from the west-northwest at 5 to 10 mph', 'type': 'text'}, {'citations': None, 'text': ".\n\nTomorrow's forecast shows ", 'type': 'text'}, {'citations': [{'cited_text': '/ 0.00 °in Sunshine along with some cloudy intervals. High 74F. Winds W at 5 to 10 mph. 
', 'encrypted_index': 'EpMBCioIBBgCIiQ4ODk4YTFkYy0yMTNkLTRhNmYtOTljYi03ZTBlNTUzZDc0NWISDLt0AZ9iZgqqm6fv3BoMYXmPusg/Ldb9azRuIjBhfRLZ9n9cYr7TY1M3ChXb43a4CzKqLS4Bk9kkHONA4QQA1R8VAADriuOmENWhuVwqF4fRzlt+5/DP66qx+2Dant1kd/snkBSuGAQ=', 'title': 'San Diego, CA Weather Conditions | Weather Underground', 'type': 'web_search_result_location', 'url': 'https://www.wunderground.com/weather/us/ca/san-diego'}], 'text': 'sunshine along with some cloudy intervals, with a high of 74°F and west winds at 5 to 10 mph', 'type': 'text'}, {'citations': None, 'text': '.\n\nAccording to the National Weather Service, ', 'type': 'text'}, {'citations': [{'cited_text': 'Today will be the hottest day of the week with highs 5-10 degrees above normal. ', 'encrypted_index': 'Eo8BCioIBBgCIiQ4ODk4YTFkYy0yMTNkLTRhNmYtOTljYi03ZTBlNTUzZDc0NWISDAhaZBx5zCgMJ1XQ8BoM4/ogPo0LF26e4Js2IjD0MgRXkvcVaA46bV+dFuvI7XJo0fKaw6kFRBTM2215OrjklMKwMGvyYkouKFl5y9MqE6QMBmjL1llB17xH53OZOZbSGXsYBA==', 'title': 'San Diego, CA', 'type': 'web_search_result_location', 'url': 'https://www.weather.gov/sgx/'}], 'text': 'today will be the hottest day of the week with temperatures 5-10 degrees above normal', 'type': 'text'}, {'citations': None, 'text': '.\n\nThe air quality shows some concerns, as ', 'type': 'text'}, {'citations': [{'cited_text': 'The air has reached a high level of pollution and is unhealthy for sensitive groups. ', 'encrypted_index': 'Eo8BCioIBBgCIiQ4ODk4YTFkYy0yMTNkLTRhNmYtOTljYi03ZTBlNTUzZDc0NWISDBPq8PK+EsRijupskhoMDtf3fPlv50khzs2SIjBGFyFnxyF1kdYTac6ePIGC7hHtLMaqndnKVWiHtteBay7F224W7mpwKTDsHOZGhRkqE0hmLGQ99ZcRYHgC5c6V1rsomHgYBA==', 'title': 'San Diego, CA Weather Forecast | AccuWeather', 'type': 'web_search_result_location', 'url': 'https://www.accuweather.com/en/us/san-diego/92101/weather-forecast/347628'}], 'text': 'the air has reached a high level of pollution and is unhealthy for sensitive groups', 'type': 'text'}, {'citations': None, 'text': '.', 'type': 'text'}]`
- model: `claude-sonnet-4-20250514`
- role: `assistant`
- stop_reason: `end_turn`
- stop_sequence: `None`
- type: `message`
- usage: `{'cache_creation_input_tokens': 0, 'cache_read_input_tokens': 8604, 'input_tokens': 12, 'output_tokens': 352, 'server_tool_use': {'web_search_requests': 1}, 'service_tier': 'standard'}`

</details>

## Third party providers

### Amazon Bedrock

These are Amazon's current Claude models:

In [None]:
# NOTE(review): in the saved output below, the first two ids lack the
# `anthropic.` prefix and `-vN:0` suffix that the last two carry -- confirm
# they are valid Bedrock model ids.
models_aws

['claude-3-5-haiku-20241022',
 'claude-3-7-sonnet-20250219',
 'anthropic.claude-3-opus-20240229-v1:0',
 'anthropic.claude-3-5-sonnet-20241022-v2:0']

:::{.callout-note}

`anthropic` at version 0.34.2 does not seem to install `boto3` as a dependency. You may need to run `pip install boto3`, otherwise the creation of the `Client` below will fail.

:::

Provided `boto3` is installed, we otherwise don't need any extra code to support Amazon Bedrock -- we just have to set up the appropriate client:

In [None]:
# Bedrock flavour of the SDK client. Both credentials are read straight from
# the environment, so this cell raises `KeyError` if either variable is unset.
ab = AnthropicBedrock(aws_access_key=os.environ['AWS_ACCESS_KEY'],
                      aws_secret_key=os.environ['AWS_SECRET_KEY'])
# Wrap it in a `Client`, using the last entry of `models_aws` as the model.
client = Client(models_aws[-1], ab)

In [None]:
# Create a `Chat` on top of the Bedrock-backed `client` built above.
chat = Chat(cli=client)

In [None]:
# Send a single message as a smoke test. Presumably this makes a live Bedrock
# request (needs valid AWS credentials); no output is saved for this cell.
chat("I'm Jeremy")

### Google Vertex

In [None]:
# NOTE(review): the saved output below starts with two ids in Bedrock's
# `anthropic.…-v1:0` format, while the rest use the `name@date` form --
# confirm `models_goog` is defined as intended.
models_goog

['anthropic.claude-3-sonnet-20240229-v1:0',
 'anthropic.claude-3-haiku-20240307-v1:0',
 'claude-3-opus@20240229',
 'claude-3-5-sonnet-v2@20241022',
 'claude-3-sonnet@20240229',
 'claude-3-haiku@20240307']

In [None]:
from anthropic import AnthropicVertex
import google.auth

In [None]:
# `google.auth.default()` is indexed at [1] for the project id; presumably it
# returns a `(credentials, project_id)` pair -- confirm against google-auth docs.
project_id = google.auth.default()[1]
region = "us-east5"
# Vertex flavour of the SDK client, then a `Client` on top of it using the
# last entry of `models_goog`. Note that this rebinds `client`, which held the
# Bedrock-backed client from the previous section.
gv = AnthropicVertex(region=region, project_id=project_id)
client = Client(models_goog[-1], gv)

In [None]:
# Create a `Chat` on top of the Vertex-backed `client`; this rebinds `chat`
# from the Bedrock section.
chat = Chat(cli=client)

In [None]:
# Send a single message as a smoke test. Presumably this makes a live Vertex
# request (needs Google Cloud credentials); no output is saved for this cell.
chat("I'm Jeremy")

## Export -

In [None]:
#|hide
#|eval: false
# Export step: run nbdev's exporter, which this project uses to turn the
# notebook into its Python module.
# NOTE(review): the `eval: false` directive above presumably keeps this cell
# from running when the notebook is executed automatically -- confirm against
# the nbdev directive docs.
from nbdev.doclinks import nbdev_export
nbdev_export()