In [14]:
import os
from PIL import Image
from smolagents import CodeAgent, DuckDuckGoSearchTool, VisitWebpageTool, ToolCallingAgent
from smolagents import LiteLLMModel

In [1]:
import math
from typing import Optional, Tuple

from smolagents import tool


@tool
def calculate_cargo_travel_time(
    origin_coords: Tuple[float, float],
    destination_coords: Tuple[float, float],
    cruising_speed_kmh: Optional[float] = 750.0,  # Average speed for cargo planes
) -> float:
    """
    Calculate the travel time for a cargo plane between two points on Earth using great-circle distance.

    Args:
        origin_coords: Tuple of (latitude, longitude) in decimal degrees for the starting point
        destination_coords: Tuple of (latitude, longitude) in decimal degrees for the destination
        cruising_speed_kmh: Optional cruising speed in km/h (defaults to 750 km/h for typical cargo planes, None also selects this default)

    Returns:
        float: The estimated travel time in hours, rounded to 2 decimal places

    Raises:
        ValueError: If cruising_speed_kmh is zero or negative

    Example:
        >>> # Chicago (41.8781° N, 87.6298° W) to Sydney (33.8688° S, 151.2093° E)
        >>> result = calculate_cargo_travel_time((41.8781, -87.6298), (-33.8688, 151.2093))
    """
    # The annotation allows None, so treat it as "use the default" instead of
    # failing with a TypeError in the division further down.
    if cruising_speed_kmh is None:
        cruising_speed_kmh = 750.0
    if cruising_speed_kmh <= 0:
        raise ValueError(
            f"cruising_speed_kmh must be positive, got {cruising_speed_kmh}"
        )

    # Earth's radius in kilometers
    EARTH_RADIUS_KM = 6371.0

    # Convert both coordinate pairs from degrees to radians
    lat1, lon1 = map(math.radians, origin_coords)
    lat2, lon2 = map(math.radians, destination_coords)

    # Calculate great-circle distance using the haversine formula
    dlon = lon2 - lon1
    dlat = lat2 - lat1

    a = (
        math.sin(dlat / 2) ** 2
        + math.cos(lat1) * math.cos(lat2) * math.sin(dlon / 2) ** 2
    )
    # Floating-point rounding can push `a` marginally outside [0, 1] for
    # (near-)antipodal points, which would make sqrt/asin raise a domain error.
    a = min(1.0, max(0.0, a))
    c = 2 * math.asin(math.sqrt(a))
    distance = EARTH_RADIUS_KM * c

    # Add 10% to account for non-direct routes and air traffic controls
    actual_distance = distance * 1.1

    # Calculate flight time
    # Add 1 hour for takeoff and landing procedures
    flight_time = (actual_distance / cruising_speed_kmh) + 1.0

    return round(flight_time, 2)


# Sanity check: Chicago -> Sydney (the docstring example) at the default cruising speed.
print(calculate_cargo_travel_time((41.8781, -87.6298), (-33.8688, 151.2093)))

22.82


In [None]:
import os
from PIL import Image
from smolagents import CodeAgent, DuckDuckGoSearchTool, VisitWebpageTool

# model = InferenceClientModel(model_id="Qwen/Qwen2.5-Coder-32B-Instruct", provider="together")
from smolagents import LiteLLMModel

# model = LiteLLMModel(
#         # model_id="ollama_chat/qwen2.5-coder:3b",  # Or try other Ollama-supported 
#         model_id="ollama_chat/gemma3:4b",
#         api_base="http://127.0.0.1:11434",  # Default Ollama local server
#         num_ctx=8192,
# )

# NOTE(review): no api_key is passed here; presumably LiteLLM picks up
# GEMINI_API_KEY from the environment — confirm before running.
model = LiteLLMModel(
    model_id="gemini/gemini-2.0-flash",  # LiteLLM "<provider>/<model>" identifier
    temperature=0.7,
    max_tokens=1024,
)

task = """Find all Batman filming locations in the world, calculate the time to transfer via cargo plane to here (we're in Gotham, 40.7128° N, 74.0060° W), and return them to me as a pandas dataframe."""
# Also give me some supercar factories with the same cargo plane transfer time."""

# Single agent that searches, visits pages and calls the travel-time tool itself.
# planning_interval is passed to the constructor (as the manager agents in this
# notebook do) rather than being patched onto the instance afterwards.
agent = CodeAgent(
    model=model,
    tools=[DuckDuckGoSearchTool(), VisitWebpageTool(), calculate_cargo_travel_time],
    additional_authorized_imports=["pandas"],
    max_steps=20,
    planning_interval=4,
)

result = agent.run(f"""
You're an expert analyst. You make comprehensive reports after visiting many websites.
Don't hesitate to search for many queries at once in a for loop.
For each data point that you find, visit the source url to confirm numbers.

{task}
""")

In [None]:
# Deterministic (temperature=0) Gemini model. This rebinds the notebook-level
# `model` name that the earlier single-agent cell also assigns.
model = LiteLLMModel(model_id="gemini/gemini-2.0-flash", temperature=0, max_tokens=1024)

# Web-browsing agent. It carries a name and description because it is handed
# to a manager agent through `managed_agents` further down.
web_agent = CodeAgent(
    name="web_agent",
    description="Browses the web to find information",
    model=model,
    tools=[DuckDuckGoSearchTool(), VisitWebpageTool(), calculate_cargo_travel_time],
    max_steps=10,
    verbosity_level=0,
)


In [45]:
# Sub-agent whose only job is to look up a city's coordinates via web search.
find_city_coordinate_agent = CodeAgent(
    model=LiteLLMModel(
        model_id="gemini/gemini-2.0-flash",
        temperature=0,
        max_tokens=1024,
    ),
    tools=[
        DuckDuckGoSearchTool(),
    ],
    name="find_city_coordinate_agent",
    description="Browses the web to find information about a city latitude and longitude coordinates",
    verbosity_level=1,
    max_steps=10,
    additional_authorized_imports=["json"],
)

# Example usage ("longitude" was misspelled in the prompt sent to the model)
find_city_coordinate_agent.run("Find the latitude and longitude of New York. Return only the coordinates.")

'40.71427000, -74.00597000'

In [46]:
# Sub-agent that searches the web for the cities where a movie was filmed.
find_filming_location_agent = CodeAgent(
    name="find_filming_location_agent",
    description="Browses the web to find information about filming locations",
    model=LiteLLMModel(model_id="gemini/gemini-2.0-flash", temperature=0, max_tokens=1024),
    tools=[DuckDuckGoSearchTool()],
    additional_authorized_imports=["json"],
    max_steps=5,
    verbosity_level=1,
)

# Example usage: the prompt itself asks for a JSON list of cities only.
find_filming_location_agent.run(
    "Find the filming locations of the movie 'Batman'. Return only the list of filming locations (city only) in json format."
)

'["London", "Hatfield", "Stevenage", "Iver", "Saint Neots"]'

In [47]:
# Manager agent: calls the travel-time tool itself and delegates lookups to the
# two search sub-agents defined in the preceding cells.
manager_agent = CodeAgent(
    model=LiteLLMModel("gemini/gemini-2.0-flash", temperature=0, max_tokens=8096),
    tools=[calculate_cargo_travel_time],
    managed_agents=[find_city_coordinate_agent, find_filming_location_agent],
    # "json" used to be listed twice; each module only needs to appear once.
    additional_authorized_imports=[
        "geopandas",
        "plotly",
        "plotly.express",
        "shapely",
        "json",
        "pandas",
        "numpy",
    ],
    planning_interval=5,
    verbosity_level=2,
    # final_answer_checks=[check_reasoning_and_plot],  # check function is only defined in a later cell
    max_steps=10,
)

# NOTE(review): presumably displays an overview of the agent hierarchy — see the smolagents docs.
manager_agent.visualize()

In [48]:
# Run the manager on the reduced task (at most 5 locations, result as a DataFrame).
# As the last expression of the cell, the return value of run() is what the notebook displays.
manager_agent.run("""
Find at most 5 Batman filming locations in the world, calculate the time to transfer via cargo plane to here (we're in Gotham, 40.7128° N, 74.0060° W). Save the results as a pandas dataframe.
""")
# Unused prompt additions, kept for reference (they are NOT part of the task string above):
# When calling the find_city_coordinate_agent, specifically ask to return only the longitude and latitude of a city.
# When calling the find_filming_location_agent, specifically ask to return only the list of filming locations (city only) at most 5. Example prompt: "Find the filming locations of the movie 'Batman'. Return only the list of filming locations (city only).".

Unnamed: 0,location,travel_time
0,Chicago,2.68
1,London,9.17
2,Hong Kong,20.0
3,Pinewood Studios,9.13


In [None]:
from smolagents.utils import encode_image_base64, make_image_url
# from smolagents import OpenAIServerModel


def check_reasoning_and_plot(final_answer, agent_memory):
    """Final-answer check: ask a multimodal model whether the saved map solves the task.

    Args:
        final_answer: The agent's final answer. It is not inspected here; the
            check reads the plot from disk instead.
        agent_memory: The agent's memory; the output of its
            ``get_succinct_steps()`` is embedded in the review prompt.

    Returns:
        bool: True when the reviewer's feedback does not contain "FAIL".

    Raises:
        AssertionError: If ``saved_map.png`` does not exist.
        Exception: Carrying the reviewer's feedback when it contains "FAIL".
    """
    multimodal_model = LiteLLMModel("gemini/gemini-2.0-flash", temperature=0, max_tokens=8096)
    filepath = "saved_map.png"
    assert os.path.exists(filepath), "Make sure to save the plot under saved_map.png!"

    # Encode the image inside a context manager so the underlying file handle
    # is released as soon as the base64 payload has been built.
    with Image.open(filepath) as image:
        image_url = make_image_url(encode_image_base64(image))

    # Adjacent string literals are concatenated verbatim, so every sentence
    # carries its own trailing space; otherwise the prompt reads "made.Please ...".
    prompt = (
        f"Here is a user-given task and the agent steps: {agent_memory.get_succinct_steps()}. Now here is the plot that was made. "
        "Please check that the reasoning process and plot are correct: do they correctly answer the given task? "
        "First list reasons why yes/no, then write your final decision: PASS in caps lock if it is satisfactory, FAIL if it is not. "
        "Don't be harsh: if the plot mostly solves the task, it should pass. "
        "To pass, a plot should be made using px.scatter_map and not any other method (scatter_map looks nicer)."
    )
    messages = [
        {
            "role": "user",
            "content": [
                {
                    "type": "text",
                    "text": prompt,
                },
                {
                    "type": "image_url",
                    "image_url": {"url": image_url},
                },
            ],
        }
    ]
    output = multimodal_model(messages).content
    print("Feedback: ", output)
    # Any occurrence of "FAIL" in the feedback rejects the answer.
    if "FAIL" in output:
        raise Exception(output)
    return True


# Second manager (rebinds `manager_agent`): browsing is delegated to `web_agent`
# and the final answer has to pass `check_reasoning_and_plot`.
manager_agent = CodeAgent(
    model=LiteLLMModel("gemini/gemini-2.0-flash", temperature=0, max_tokens=8096),
    managed_agents=[web_agent],
    tools=[calculate_cargo_travel_time],
    final_answer_checks=[check_reasoning_and_plot],
    additional_authorized_imports=[
        "geopandas", "plotly", "plotly.express", "shapely",
        "json", "pandas", "numpy",
    ],
    max_steps=15,
    planning_interval=5,
    verbosity_level=2,
)

In [12]:
# NOTE(review): presumably displays an overview of the manager and its managed agents — see the smolagents docs.
manager_agent.visualize()

In [None]:
# The example inside the prompt writes to saved_map.png, the same file the task
# text asks for and that check_reasoning_and_plot looks for on disk.
manager_agent.run("""
Find all Batman filming locations in the world, calculate the time to transfer via cargo plane to here (we're in Gotham, 40.7128° N, 74.0060° W).
Also give me some supercar factories with the same cargo plane transfer time. You need at most 6 points in total.
Represent this as spatial map of the world, with the locations represented as scatter points with a color that depends on the travel time, and save it to saved_map.png!

Here's an example of how to plot and return a map:
import plotly.express as px
df = px.data.carshare()
fig = px.scatter_map(df, lat="centroid_lat", lon="centroid_lon", text="name", color="peak_hour", size=100,
     color_continuous_scale=px.colors.sequential.Magma, size_max=15, zoom=1)
fig.show()
fig.write_image("saved_map.png")
final_answer(fig)

Never try to process strings using code: when you have a string to read, just print it and you'll see it.
""")