In [1]:
from sqlalchemy import create_engine,MetaData,Table,Column,String,Integer,Float,insert,inspect,text

In [2]:
engine = create_engine("sqlite:///:memory:")
metadata_obj = MetaData()

In [3]:
import os
from getpass import getpass

# Never hardcode access tokens in a notebook: they end up in version control
# and in shared copies. Use HF_TOKEN from the environment when it is already
# set; otherwise prompt for it without echoing the value.
if not os.environ.get("HF_TOKEN"):
    os.environ["HF_TOKEN"] = getpass("Hugging Face token: ")


## 1. Adding Mock SQL DB for Testing

In [4]:
def insert_rows_into_table(rows, table, engine=engine):
    """Insert ``rows`` into ``table`` inside a single transaction.

    Args:
        rows: Iterable of dicts mapping column names to values, one per row.
        table: SQLAlchemy ``Table`` to insert into.
        engine: Engine used to open the connection. Defaults to the
            notebook-level ``engine`` as bound when this function is defined.

    All rows are written within one ``engine.begin()`` block, so the batch is
    committed together, or rolled back as a whole if any insert raises.
    """
    with engine.begin() as connection:
        for row in rows:
            # One statement per row, so rows may carry different column sets.
            connection.execute(insert(table).values(**row))

table_name = "receipts"
receipts = Table(
    table_name,
    metadata_obj,
    # receipt_id alone identifies a receipt, so it is the only key column.
    Column("receipt_id", Integer, primary_key=True),
    # Not part of the key: flagging this column as primary_key too would create
    # a composite key that accepts duplicate receipt_ids. nullable=False keeps
    # the NOT NULL constraint the column had as a key member.
    Column("customer_name", String(16), nullable=False),
    Column("price", Float),
    Column("tip", Float),
)
# Emit CREATE TABLE for every table registered on metadata_obj.
metadata_obj.create_all(engine)

# Mock data used by the agent queries further down.
rows = [
    {"receipt_id": 1, "customer_name": "Alan Payne", "price": 12.06, "tip": 1.20},
    {"receipt_id": 2, "customer_name": "Alex Mason", "price": 23.86, "tip": 0.24},
    {"receipt_id": 3, "customer_name": "Woodrow Wilson", "price": 53.43, "tip": 5.43},
    {"receipt_id": 4, "customer_name": "Margaret James", "price": 21.11, "tip": 1.00},
]
insert_rows_into_table(rows, receipts)

## 2. Agent Building

### 2.1. Tool 

A tool is a function that an LLM can call in an agentic system. To use it, the LLM needs:

* a name
* the tool function itself
* a description
* an output type

`Tool` is a class that wraps a function together with the metadata an LLM needs to understand how to use it.

In [5]:
# Read the schema back from the live database rather than from the Table object.
inspector = inspect(engine)

# Collect (column name, column type) pairs for the "receipts" table.
columns_info = []
for col in inspector.get_columns("receipts"):
    columns_info.append((col["name"], col["type"]))

# Render one indented bullet per column under a "Columns:" header.
column_lines = [f"  - {name}: {col_type}" for name, col_type in columns_info]
table_description = "Columns:\n" + "\n".join(column_lines)
print(table_description)

Columns:
  - receipt_id: INTEGER
  - customer_name: VARCHAR(16)
  - price: FLOAT
  - tip: FLOAT


### 2.2. Tool Creation

In [7]:
from smolagents import  tool

  from .autonotebook import tqdm as notebook_tqdm


In [8]:

@tool
def sql_engine(query: str) -> str:
    """
    Allows you to perform SQL queries on the table. Returns a string representation of the result.
    The table is named 'receipts'. Its description is as follows:
        Columns:
        - receipt_id: INTEGER
        - customer_name: VARCHAR(16)
        - price: FLOAT
        - tip: FLOAT

    Args:
        query: The query to perform. This should be correct SQL.
    """
    # NOTE(review): the docstring above is presumably what `@tool` exposes to
    # the model as the tool description, so its wording is left untouched.
    with engine.connect() as con:
        result = con.execute(text(query))
        # Each row is rendered with str() and prefixed by a newline; a query
        # that yields no rows produces the empty string.
        return "".join("\n" + str(row) for row in result)

In [9]:
from smolagents import CodeAgent, MLXModel

In [10]:
# Model identifier passed to MLXModel; kept in one place so it is easy to swap.
MODEL_ID = "mlx-community/Llama-3.1-8B-Instruct-4bit"
mlx_model = MLXModel(MODEL_ID)

Fetching 6 files: 100%|██████████| 6/6 [00:00<00:00, 72523.99it/s]


### 2.3. Running Agent

In [11]:
from phoenix.otel import register
from openinference.instrumentation.smolagents import SmolagentsInstrumentor

# Configure OpenTelemetry tracing for Phoenix. Per the output printed below,
# this targets the collector at localhost:4317 over gRPC and installs the
# tracer provider as the global OpenTelemetry default.
register()
# Instrument smolagents -- presumably so that agent runs emit spans to the
# tracer registered above (confirm in the Phoenix UI).
SmolagentsInstrumentor().instrument()

🔭 OpenTelemetry Tracing Details 🔭
|  Phoenix Project: default
|  Span Processor: SimpleSpanProcessor
|  Collector Endpoint: localhost:4317
|  Transport: gRPC
|  Transport Headers: {'user-agent': '****'}
|  
|  Using a default SpanProcessor. `add_span_processor` will overwrite this default.
|  
|  `register` has set this TracerProvider as the global OpenTelemetry default.
|  To disable this behavior, call `register` with `set_global_tracer_provider=False`.



In [None]:
from smolagents import CodeAgent

# Build an agent backed by the local MLX model, with the SQL query function as
# its only tool.
agent = CodeAgent(tools=[sql_engine], model=mlx_model)

# Natural-language task handed to the agent.
task = "Provide me with names of customer in ascending order of tip given and with joke about tip"
agent.run(task)