In [1]:
# Install necessary packages into the environment used by this notebook's kernel.
# `kitchenai-whisk` supplies the `whisk` package imported in the next cell;
# `llama-index` and `openai` supply the RAG / LLM pieces.
# NOTE(review): versions are not pinned. The recorded run resolved
# kitchenai-whisk 0.2.1, llama-index 0.12.19 and openai 1.63.2 — consider
# pinning these for reproducible re-runs.
%pip install kitchenai-whisk llama-index openai




Collecting kitchenai-whisk
  Downloading kitchenai_whisk-0.2.1-py3-none-any.whl.metadata (11 kB)
Collecting llama-index
  Downloading llama_index-0.12.19-py3-none-any.whl.metadata (12 kB)
Collecting openai
  Downloading openai-1.63.2-py3-none-any.whl.metadata (27 kB)
Collecting anyio>=3.7.1 (from kitchenai-whisk)
  Using cached anyio-4.8.0-py3-none-any.whl.metadata (4.6 kB)
Collecting cookiecutter>=2.5.0 (from kitchenai-whisk)
  Using cached cookiecutter-2.6.0-py3-none-any.whl.metadata (7.3 kB)
Collecting fastapi>=0.100.0 (from kitchenai-whisk)
  Using cached fastapi-0.115.8-py3-none-any.whl.metadata (27 kB)
Collecting faststream>=0.4.0 (from faststream[nats]>=0.4.0->kitchenai-whisk)
  Using cached faststream-0.5.34-py3-none-any.whl.metadata (25 kB)
Collecting httpx>=0.26.0 (from kitchenai-whisk)
  Using cached httpx-0.28.1-py3-none-any.whl.metadata (7.1 kB)
Collecting pydantic>=2.0.0 (from kitchenai-whisk)
  Using cached pydantic-2.10.6-py3-none-any.whl.metadata (30 kB)
Collecting pyt

In [21]:
# Import required libraries
from whisk.kitchenai_sdk.kitchenai import KitchenAIApp
from whisk.kitchenai_sdk.schema import ChatInput, ChatResponse

from llama_index.core import (
    SimpleDirectoryReader,
    StorageContext,
    VectorStoreIndex,
    load_index_from_storage,
)
from llama_index.core.tools import QueryEngineTool, ToolMetadata
import openai

# KitchenAI application object; the chat handlers defined near the end of the
# notebook register themselves on it through `@kitchen.chat.handler(...)`.
kitchen = KitchenAIApp(namespace="react-agent-with-query-engine")


In [7]:
import os
from getpass import getpass

# Make the OpenAI API key available through the OPENAI_API_KEY environment
# variable.
# - A key that is already present in the environment is reused, so a
#   "Restart & Run All" does not have to prompt again.
# - Otherwise the key is requested with getpass(), which does not echo the
#   typed value (input() would leave the secret visible in the saved notebook).
# - Surrounding whitespace from copy/paste is stripped, and an empty key is
#   rejected here rather than surfacing later as an authentication error.
api_key = os.environ.get("OPENAI_API_KEY", "").strip()
if not api_key:
    api_key = getpass("Please enter your OpenAI API key: ").strip()
if not api_key:
    raise ValueError("An OpenAI API key is required to run this notebook.")
os.environ["OPENAI_API_KEY"] = api_key



# ReAct Agent with Query Engine (RAG) Tools

In this section, we show how to set up an agent powered by the ReAct loop for financial analysis.

The agent has access to two "tools": one to query the 2021 Lyft 10-K and the other to query the 2021 Uber 10-K.

We try two different LLMs:

- gpt-3.5-turbo
- gpt-3.5-turbo-instruct

Note that you can plug in any LLM that exposes a text completion endpoint.

## Build Query Engine Tools

In [8]:
# Install the OpenAI LLM integration for LlamaIndex; the notebook later imports
# `OpenAI` from `llama_index.llms.openai`.
# NOTE(review): unpinned, and possibly already pulled in by `llama-index` — confirm.
%pip install llama-index-llms-openai


[1m[[0m[34;49mnotice[0m[1;39;49m][0m[39;49m A new release of pip is available: [0m[31;49m24.0[0m[39;49m -> [0m[32;49m25.0.1[0m
[1m[[0m[34;49mnotice[0m[1;39;49m][0m[39;49m To update, run: [0m[32;49mpip install --upgrade pip[0m
Note: you may need to restart the kernel to use updated packages.


In [9]:
from llama_index.core import (
    SimpleDirectoryReader,
    VectorStoreIndex,
    StorageContext,
    load_index_from_storage,
)

from llama_index.core.tools import QueryEngineTool, ToolMetadata

In [10]:
# Try to reuse the Lyft and Uber indexes persisted under ./storage by an
# earlier run. `index_loaded` records whether both loads succeeded; the
# build cell further down only runs when it is False.
try:
    storage_context = StorageContext.from_defaults(
        persist_dir="./storage/lyft"
    )
    lyft_index = load_index_from_storage(storage_context)

    storage_context = StorageContext.from_defaults(
        persist_dir="./storage/uber"
    )
    uber_index = load_index_from_storage(storage_context)

    index_loaded = True
except Exception as load_error:
    # Deliberately best-effort: any loading problem (typically a first run with
    # nothing persisted yet) just means the indexes get rebuilt. Catching
    # `Exception` instead of using a bare `except:` keeps KeyboardInterrupt and
    # SystemExit working, and the reason is reported rather than hidden.
    print(
        "Could not load persisted indexes"
        f" ({type(load_error).__name__}: {load_error}); they will be rebuilt."
    )
    index_loaded = False

Download Data

In [11]:
# Create the local data directory; `-p` makes this a no-op when it already exists.
!mkdir -p 'data/10k/'
# Download the 2021 Uber and Lyft 10-K PDFs from the llama_index repository.
# `-O` writes to the given path, so re-running overwrites any earlier download.
# NOTE(review): relies on `mkdir` and `wget` being available in the shell.
!wget 'https://raw.githubusercontent.com/run-llama/llama_index/main/docs/docs/examples/data/10k/uber_2021.pdf' -O 'data/10k/uber_2021.pdf'
!wget 'https://raw.githubusercontent.com/run-llama/llama_index/main/docs/docs/examples/data/10k/lyft_2021.pdf' -O 'data/10k/lyft_2021.pdf'

--2025-02-18 11:04:39--  https://raw.githubusercontent.com/run-llama/llama_index/main/docs/docs/examples/data/10k/uber_2021.pdf
Resolving raw.githubusercontent.com (raw.githubusercontent.com)... 2606:50c0:8002::154, 2606:50c0:8001::154, 2606:50c0:8000::154, ...
Connecting to raw.githubusercontent.com (raw.githubusercontent.com)|2606:50c0:8002::154|:443... connected.
HTTP request sent, awaiting response... 200 OK
Length: 1880483 (1.8M) [application/octet-stream]
Saving to: ‘data/10k/uber_2021.pdf’


2025-02-18 11:04:39 (29.9 MB/s) - ‘data/10k/uber_2021.pdf’ saved [1880483/1880483]

--2025-02-18 11:04:39--  https://raw.githubusercontent.com/run-llama/llama_index/main/docs/docs/examples/data/10k/lyft_2021.pdf
Resolving raw.githubusercontent.com (raw.githubusercontent.com)... 2606:50c0:8003::154, 2606:50c0:8000::154, 2606:50c0:8002::154, ...
Connecting to raw.githubusercontent.com (raw.githubusercontent.com)|2606:50c0:8003::154|:443... connected.
HTTP request sent, awaiting response... 200

In [12]:
if not index_loaded:
    # Loading the persisted indexes did not succeed, so build them from the
    # downloaded PDFs instead.

    # Read each 10-K filing into documents.
    lyft_reader = SimpleDirectoryReader(input_files=["./data/10k/lyft_2021.pdf"])
    lyft_docs = lyft_reader.load_data()
    uber_reader = SimpleDirectoryReader(input_files=["./data/10k/uber_2021.pdf"])
    uber_docs = uber_reader.load_data()

    # One vector index per company.
    lyft_index = VectorStoreIndex.from_documents(lyft_docs)
    uber_index = VectorStoreIndex.from_documents(uber_docs)

    # Write both indexes to the directories the load cell reads from, so the
    # next run can load them instead of rebuilding.
    lyft_index.storage_context.persist(persist_dir="./storage/lyft")
    uber_index.storage_context.persist(persist_dir="./storage/uber")

In [13]:
# Turn each index into a query engine; both use the same retrieval setting.
engine_options = {"similarity_top_k": 3}
lyft_engine = lyft_index.as_query_engine(**engine_options)
uber_engine = uber_index.as_query_engine(**engine_options)

In [14]:
# Tool metadata: the name is what appears after "Action:" in the agent's
# verbose trace, and the description is the text handed to the agent for
# that tool.
lyft_tool_metadata = ToolMetadata(
    name="lyft_10k",
    description=(
        "Provides information about Lyft financials for year 2021. "
        "Use a detailed plain text question as input to the tool."
    ),
)
uber_tool_metadata = ToolMetadata(
    name="uber_10k",
    description=(
        "Provides information about Uber financials for year 2021. "
        "Use a detailed plain text question as input to the tool."
    ),
)

# Wrap each query engine as a tool; this list is what the ReAct agents receive.
query_engine_tools = [
    QueryEngineTool(query_engine=lyft_engine, metadata=lyft_tool_metadata),
    QueryEngineTool(query_engine=uber_engine, metadata=uber_tool_metadata),
]

## Setup ReAct Agent

We set up two kinds of ReAct agents: one powered by standard gpt-3.5-turbo (created here), and the other powered by gpt-3.5-turbo-instruct (created in the comparison section below).

You can **optionally** specify context which will be added to the core ReAct system prompt.

In [15]:
from llama_index.core.agent import ReActAgent
from llama_index.llms.openai import OpenAI

In [16]:
# [Optional] Add Context
# To try it, uncomment the block below and add `context=context` to
# `react_agent_options`.
# context = """\
# You are a stock market sorcerer who is an expert on the companies Lyft and Uber.\
#     You will answer questions about Uber and Lyft as in the persona of a sorcerer \
#     and veteran stock market investor.
# """
llm = OpenAI(model="gpt-3.5-turbo")

# Options shared by both agents; verbose=True prints the Thought / Action /
# Observation trace for every step.
react_agent_options = dict(llm=llm, verbose=True)

# `agent` is used by the example cells in this notebook.
agent = ReActAgent.from_tools(query_engine_tools, **react_agent_options)

# `agent_whisk` is a second, identically configured instance used by the
# "regular-agent" Whisk chat handler (presumably kept separate so the served
# conversations do not mix with the interactive examples — confirm).
agent_whisk = ReActAgent.from_tools(query_engine_tools, **react_agent_options)

In [None]:
# Single-tool sanity check with the gpt-3.5-turbo agent.
lyft_growth_question = "What was Lyft's revenue growth in 2021?"
response = agent.chat(lyft_growth_question)
print(response)

[38;5;200m[1;3mThought: I need to use a tool to help me answer the question.
Action: lyft_10k
Action Input: {'input': "What was Lyft's revenue growth in 2021?"}
[0m[36;1m[1;3mObservation: Lyft's revenue growth in 2021 was 36%.
[0m[38;5;200m[1;3mResponse: Lyft's revenue growth in 2021 was 36%.
[0mLyft's revenue growth in 2021 was 36%.


## Run Some Example Queries

We run some example queries using the agent, showcasing some of the agent's abilities to do chain-of-thought reasoning and tool use to synthesize the right answer.

We also show a query run with async execution.

In [None]:
# A question that needs both the Lyft and the Uber tool to answer.
growth_comparison_question = (
    "Compare and contrast the revenue growth of Uber and Lyft in 2021, then"
    " give an analysis"
)
response = agent.chat(growth_comparison_question)
print(response)

[38;5;200m[1;3mThought: I need to use a tool to help me compare the revenue growth of Uber and Lyft in 2021.
Action: lyft_10k
Action Input: {'input': "What was Lyft's revenue growth in 2021?"}
[0m[36;1m[1;3mObservation: Lyft's revenue growth in 2021 was 36%.
[0m[38;5;200m[1;3mThought: I need to use a tool to help me compare the revenue growth of Uber and Lyft in 2021.
Action: uber_10k
Action Input: {'input': "What was Uber's revenue growth in 2021?"}
[0m[36;1m[1;3mObservation: Uber's revenue growth in 2021 was 57%.
[0m[38;5;200m[1;3mResponse: In 2021, Lyft's revenue growth was 36% while Uber's revenue growth was 57%. This indicates that Uber experienced a higher revenue growth compared to Lyft in 2021.
[0mIn 2021, Lyft's revenue growth was 36% while Uber's revenue growth was 57%. This indicates that Uber experienced a higher revenue growth compared to Lyft in 2021.


**Async execution**: Here we try another query with async execution

In [None]:
# Try another query with async execution

import nest_asyncio

nest_asyncio.apply()

response = await agent.achat(
    "Compare and contrast the risks of Uber and Lyft in 2021, then give an"
    " analysis"
)
print(str(response))

### Compare gpt-3.5-turbo vs. gpt-3.5-turbo-instruct 

We compare the performance of the two agents in being able to answer some complex queries.

#### Taking a look at a turbo-instruct agent

In [17]:
# Same tools as before, but driven by the gpt-3.5-turbo-instruct model.
llm_instruct = OpenAI(model="gpt-3.5-turbo-instruct")
instruct_agent_options = dict(llm=llm_instruct, verbose=True)

# `agent_instruct` is used by the comparison cells in this notebook.
agent_instruct = ReActAgent.from_tools(
    query_engine_tools, **instruct_agent_options
)

# `agent_instruct_whisk` is a second, identically configured instance used by
# the "instruct-agent" Whisk chat handler.
agent_instruct_whisk = ReActAgent.from_tools(
    query_engine_tools, **instruct_agent_options
)

In [13]:
# Same single-tool question as before, now answered by the instruct agent.
lyft_growth_question = "What was Lyft's revenue growth in 2021?"
response = agent_instruct.chat(lyft_growth_question)
print(response)

> Running step 6819b25e-6e24-41db-9739-1ced207dc05e. Step input: What was Lyft's revenue growth in 2021?
[1;3;38;5;200mThought: The current language of the user is: English. I need to use a tool to help me answer the question.
Action: lyft_10k
Action Input: {'input': "What was Lyft's revenue growth in 2021?"}
[0m[1;3;34mObservation: Lyft's revenue growth in 2021 was 36%.
[0m> Running step 2e29480f-cb88-4a98-ab00-b214624eb82f. Step input: None
[1;3;38;5;200mThought: I can answer without using any more tools. I'll use the user's language to answer
Answer: Lyft's revenue growth in 2021 was 36%.
[0mLyft's revenue growth in 2021 was 36%.


#### Try more complex queries

We compare gpt-3.5-turbo with gpt-3.5-turbo-instruct agents on more complex queries.

In [None]:
# Two-tool comparison question, answered by the gpt-3.5-turbo agent.
growth_comparison_question = (
    "Compare and contrast the revenue growth of Uber and Lyft in 2021, then"
    " give an analysis"
)
response = agent.chat(growth_comparison_question)
print(response)

[38;5;200m[1;3mThought: I need to use a tool to help me compare the revenue growth of Uber and Lyft in 2021.
Action: uber_10k
Action Input: {'input': "Please provide information about Uber's revenue growth in 2021."}
[0m[36;1m[1;3mObservation: Uber's revenue grew by 57% in 2021 compared to the previous year. This growth was primarily driven by an increase in Gross Bookings, with Delivery Gross Bookings increasing by 71% and Mobility Gross Bookings growing by 38%. The increase in Delivery Gross Bookings was due to higher demand for food delivery orders and expansion across U.S. and international markets. The growth in Mobility Gross Bookings was a result of increased Trip volumes as the business recovered from the impacts of COVID-19.
[0m[38;5;200m[1;3mThought: I have information about Uber's revenue growth in 2021. Now I need to use a tool to get information about Lyft's revenue growth in 2021.
Action: lyft_10k
Action Input: {'input': "Please provide information about Lyft's re

In [None]:
# The same two-tool comparison question, answered by the instruct agent.
growth_comparison_question = (
    "Compare and contrast the revenue growth of Uber and Lyft in 2021, then"
    " give an analysis"
)
response = agent_instruct.chat(growth_comparison_question)
print(response)

[38;5;200m[1;3mResponse: The revenue growth of Uber was higher than Lyft in 2021, with Uber experiencing a 74% growth compared to Lyft's 48%. This indicates that Uber may have had a stronger financial performance in 2021. However, further analysis is needed to fully understand the factors contributing to this difference.
[0mThe revenue growth of Uber was higher than Lyft in 2021, with Uber experiencing a 74% growth compared to Lyft's 48%. This indicates that Uber may have had a stronger financial performance in 2021. However, further analysis is needed to fully understand the factors contributing to this difference.


In [None]:
# Follow-up question for the gpt-3.5-turbo agent. "The company with the higher
# revenue" is not named, so the agent has to work out which company is meant.
followup_risk_question = (
    "Can you tell me about the risk factors of the company with the higher"
    " revenue?"
)
response = agent.chat(followup_risk_question)
print(response)

[38;5;200m[1;3mThought: I need to find out which company has higher revenue before I can provide information about its risk factors.
Action: lyft_10k
Action Input: {'input': 'What is the revenue of Lyft in 2021?'}
[0m[36;1m[1;3mObservation: The revenue of Lyft in 2021 is $3,208,323,000.
[0m[38;5;200m[1;3mThought: Now that I know Lyft has higher revenue, I can find information about its risk factors.
Action: lyft_10k
Action Input: {'input': 'What are the risk factors of Lyft?'}
[0m[36;1m[1;3mObservation: Lyft faces numerous risk factors that could potentially harm its business, financial condition, and results of operations. These risk factors include general economic factors such as the impact of the COVID-19 pandemic, natural disasters, economic downturns, and political crises. Operational factors such as limited operating history, financial performance, competition, unpredictability of results, uncertainty regarding market growth, ability to attract and retain drivers and 

In [None]:
# Ask the instruct agent the same follow-up question that was given to the
# gpt-3.5-turbo agent (`agent.chat(...)`).
# This uses `chat` rather than `query` so both agents are exercised through the
# same entry point: the question ("the company with the higher revenue") only
# makes sense with the earlier comparison in the conversation, and an agent's
# `query` call does not carry that chat history over.
response = agent_instruct.chat(
    "Can you tell me about the risk factors of the company with the higher"
    " revenue?"
)
print(str(response))

[38;5;200m[1;3mResponse: The risk factors for the company with the higher revenue include competition, regulatory changes, and dependence on drivers.
[0mThe risk factors for the company with the higher revenue include competition, regulatory changes, and dependence on drivers.


**Observation**: The turbo-instruct agent seems to do worse on agent reasoning compared to the regular turbo model. Of course, this is subject to further observation!

In [24]:
# Chat handler that exposes the gpt-3.5-turbo ReAct agent under "regular-agent"
@kitchen.chat.handler("regular-agent")
async def query_financial_documents(chat: ChatInput) -> ChatResponse:
    """Answer the newest chat message with the gpt-3.5-turbo ReAct agent.

    Args:
        chat: Incoming chat request. Only the content of the last entry in
            ``chat.messages`` is passed to the agent.

    Returns:
        A ``ChatResponse`` whose content is the agent's reply as a string.
    """
    # NOTE(review): an empty `chat.messages` would fail on the [-1] lookup, and
    # earlier messages in the request are not forwarded to the agent.
    latest_message = chat.messages[-1]

    # `agent_whisk` must already exist (created in the agent setup cell).
    agent_reply = await agent_whisk.achat(latest_message.content)

    return ChatResponse(content=str(agent_reply))


In [25]:
# Chat handler that exposes the gpt-3.5-turbo-instruct ReAct agent under
# "instruct-agent"
# NOTE(review): this reuses the function name of the "regular-agent" handler,
# so the module-level name is rebound here; presumably harmless because the
# decorator registers each handler under its own label — confirm.
@kitchen.chat.handler("instruct-agent")
async def query_financial_documents(chat: ChatInput) -> ChatResponse:
    """Answer the newest chat message with the gpt-3.5-turbo-instruct agent.

    Args:
        chat: Incoming chat request. Only the content of the last entry in
            ``chat.messages`` is passed to the agent.

    Returns:
        A ``ChatResponse`` whose content is the agent's reply as a string.
    """
    # NOTE(review): an empty `chat.messages` would fail on the [-1] lookup, and
    # earlier messages in the request are not forwarded to the agent.
    latest_message = chat.messages[-1]

    # `agent_instruct_whisk` must already exist (created in the instruct setup cell).
    agent_reply = await agent_instruct_whisk.achat(latest_message.content)

    return ChatResponse(content=str(agent_reply))


In [26]:
# Launch Whisk server
from whisk.config import WhiskConfig, ServerConfig
from whisk.router import WhiskRouter

# Address the server listens on.
# NOTE(review): "0.0.0.0" accepts connections on every network interface, not
# just localhost — confirm that this exposure is intended.
WHISK_HOST = "0.0.0.0"
WHISK_PORT = 8000

# Serve the handlers registered on `kitchen` through a FastAPI-type server.
server_settings = ServerConfig(type="fastapi")
config = WhiskConfig(server=server_settings)
router = WhiskRouter(kitchen_app=kitchen, config=config)

# Run the Whisk server in the notebook (it starts in the background, so later
# cells can still be executed).
router.run_in_notebook(host=WHISK_HOST, port=WHISK_PORT)


Shutting down existing Whisk server...
Whisk server stopped.
Whisk server started on http://0.0.0.0:8000 (in background)


INFO:     Started server process [3333614]
INFO:     Waiting for application startup.
INFO:     Application startup complete.
INFO:     Uvicorn running on http://0.0.0.0:8000 (Press CTRL+C to quit)


INFO:     127.0.0.1:57412 - "GET /v1/models HTTP/1.1" 200 OK
INFO:     127.0.0.1:54468 - "OPTIONS /v1/chat/completions HTTP/1.1" 200 OK
INFO:     127.0.0.1:54470 - "POST /v1/chat/completions HTTP/1.1" 200 OK
> Running step cff1d456-9afb-4b0d-af29-56f009d94ce7. Step input: compare the risks between uber and lyft in 2021
[1;3;38;5;200mThought: The user is asking for a comparison of risks between Uber and Lyft in 2021. I can use the financial information tools for both companies to gather data on their risks.
Action: lyft_10k
Action Input: {'input': 'Please provide information on the risks faced by Lyft in 2021'}
[0m[1;3;34mObservation: Lyft faced various risks in 2021, including challenges related to forecasting revenue and managing expenses, attracting and retaining drivers and riders cost-effectively, complying with laws and regulations, managing operations during the COVID-19 pandemic, planning and managing capital expenditures, developing and maintaining assets, responding to macr

In [27]:
# Shut down the Whisk server that `router.run_in_notebook(...)` started.
router.stop_in_notebook()

INFO:     Shutting down
INFO:     Waiting for application shutdown.
INFO:     Application shutdown complete.
INFO:     Finished server process [3333614]


Shutting down existing Whisk server...
Whisk server stopped.
