# Retrieval-Augmented Generation (RAG)

In [13]:
import chromadb
import dotenv
from pathlib import Path
from agents import Agent, Runner, function_tool, trace

dotenv.load_dotenv()

True

Connect to the persisted Chroma collection of calorie data that the lookup tool will query:

In [14]:
# The vector store was populated from the data/calories.csv file in
# the rag_setup.ipynb notebook.
# Open a persistent Chroma client pointing at the directory where the embeddings are stored.
chroma_client = chromadb.PersistentClient(path="../chroma")

# Fetch the existing collection. 'nutrition_db' is the name of the collection
# that was created in the 'rag_setup.ipynb' notebook, so that notebook has to
# be run before this one.
nutrition_db = chroma_client.get_collection(name="nutrition_db")


In [15]:
# Sanity check: query the database to see whether it holds information about "banana".
results = nutrition_db.query(
    query_texts=["banana"],
    n_results=2,  # number of matches we want back
)

# Only one query text was sent, so its matches sit at index 0 of each result list.
banana_documents = results["documents"][0]
banana_metadatas = results["metadatas"][0]

# Print each match as its sorted metadata pairs followed by the stored document text.
for document_text, metadata in zip(banana_documents, banana_metadatas):
    print(sorted(metadata.items()))
    print(document_text)
    print("\n")

[('calories_per_100g', 89.0), ('food_category', 'fruits'), ('food_item', 'banana'), ('keywords', 'banana_fruits'), ('kj_per_100g', 374.0), ('serving_info', '100g')]
Food: Banana
        Category: Fruits
        Nutritional Information:
        - Calories: 89 per 100g
        - Energy: 374 kJ per 100g
        - Serving size reference: 100g

        This is a fruits food item that provides 89 calories per 100 grams.


[('calories_per_100g', 50.0), ('food_category', '(fruit)juices'), ('food_item', 'banana juice'), ('keywords', 'banana_juice_(fruit)juices'), ('kj_per_100g', 210.0), ('serving_info', '100ml')]
Food: Banana Juice
        Category: (Fruit)Juices
        Nutritional Information:
        - Calories: 50 per 100g
        - Energy: 210 kJ per 100g
        - Serving size reference: 100ml

        This is a (fruit)juices food item that provides 50 calories per 100 grams.




In [20]:
# Function that searches the embeddings database for calorie information.
# The docstring is important: it describes the function's behaviour, inputs and output.
@function_tool
def calorie_lookup_tool(query: str, max_results: int = 3) -> str:
    """
    Tool function for a RAG database to look up calorie information for specific food items, but not for meals.

    Args:
        query: The food item to look up.
        max_results: The maximum number of results to return. Values below 1 are treated as 1.

    Returns:
        A string containing the nutrition information, one matching food item
        per line, or a "No nutrition information found" message when nothing matches.
    """
    # max_results is chosen by the caller (typically the model); the vector
    # store rejects zero or negative result counts, so always ask for at least one.
    n_results = max(1, max_results)

    results = nutrition_db.query(query_texts=[query], n_results=n_results)

    # Only one query text was sent, so its matches sit at index 0.
    metadatas = results["metadatas"][0]
    if not metadatas:
        return f"No nutrition information found for: {query}"

    # Format results for the agent: one "<Food> (<Category>): <kcal> calories per 100g" line per match.
    formatted_results = [
        f"{metadata['food_item'].title()} ({metadata['food_category'].title()}): "
        f"{metadata['calories_per_100g']} calories per 100g"
        for metadata in metadatas
    ]

    return "Nutrition Information:\n" + "\n".join(formatted_results)

Hagamos una prueba de esta función:

> Todavía no es una tool... es solo una función.

__La siguiente celda solo funcionará con la definición de la función sin decorar. No lo hará si la convertimos en una tool con `@function_tool`.__

In [None]:
#calorie_lookup_tool('bananas')

'Nutrition Information:\nBanana (Fruits): 89.0 calories per 100g\nBanana Juice ((Fruit)Juices): 50.0 calories per 100g\nBanana Nut Bread (Pastries,Breads&Rolls): 326.0 calories per 100g'

In [22]:
# To try out the tool, the function is turned into a tool with @function_tool
# and we create an agent that uses it.
# The tool is registered by adding it to the agent's `tools` list.
calorie_agent = Agent(
    name="Nutrition Assistant",
    instructions="""
    You are a helpful nutrition assistant giving out calorie information.
    You give concise answers.
    If you need to look up calorie information, use the calorie_lookup_tool.
    """,
    tools=[calorie_lookup_tool],
)

In [23]:
# Run the agent inside a single named trace so the whole interaction is grouped together.
with trace("Nutrition Assistant with RAG"):
    # Runner.run is awaited directly at the top level of the notebook cell.
    result = await Runner.run(
        calorie_agent,
        "How many calories are in total in a banana and an apple? Also give calories per 100g",
    )
    # Show only the agent's final answer.
    print(result.final_output)

- Calories per 100 g: banana 89 kcal, apple 52 kcal.
- Estimated total for typical portions: banana (~118 g) ≈ 105 kcal; apple (~182 g) ≈ 95 kcal; total ≈ 200 kcal. 
Note: values vary by size.
