In [15]:
from llama_index.core import SimpleDirectoryReader
# Read the source PDF into `documents` for indexing.
# Alternative input used during experimentation: '../data2/source.txt'.
documents = SimpleDirectoryReader(
    input_files=['../data_uber/uber_2021.pdf'],
).load_data()

In [16]:
!pip install llama-index-embeddings-ollama



In [17]:
from llama_index.embeddings.ollama import OllamaEmbedding

In [18]:
# Embedding client that talks to an Ollama server over HTTP.
ollama_embedding = OllamaEmbedding(
    # Embedding model served by Ollama; replace with your desired model.
    model_name="nomic-embed-text:latest",
    # Ollama must be running and reachable at this endpoint.
    base_url="http://localhost:11434",
    # Mirostat is a sampling technique for controlling perplexity during text
    # generation in LLMs. Ollama documents 0 as "disabled" - confirm for the
    # installed Ollama version.
    ollama_additional_kwargs={"mirostat": 0},
)

In [19]:
from llama_index.core import VectorStoreIndex

# Build the vector index from the loaded documents, embedding them with the
# Ollama embedding model configured above instead of the library default.
vector_store_index = VectorStoreIndex.from_documents(
    documents,
    embed_model=ollama_embedding,
)

In [20]:
from llama_index.core import Settings
from llama_index.llms.ollama import  Ollama

# Register a locally served Ollama model as the global LLM on `Settings`.
# A low temperature is used here (0.1).
Settings.llm = Ollama(
    model='llama3.2:latest',
    base_url='http://localhost:11434',
    temperature=0.1,
)

In [21]:
# Create a query engine on top of the vector index using default options.
# NOTE(review): presumably answers are generated with the LLM assigned to
# Settings.llm in the previous cell - confirm against the LlamaIndex docs.
query_engine = vector_store_index.as_query_engine()


In [23]:
# Ask the query engine a natural-language question about the indexed PDF and
# keep the returned response object for display in the next cell.
response = query_engine.query(
    "Provide summary of the company performance in this quarter compared to earlier quarter"
)


In [24]:
# NOTE(review): `pprint` is imported here but not used in any visible cell;
# the built-in print() is what is called below. Confirm whether pprint was
# intended or the import can be dropped.
from pprint import pprint 
# Show the query engine's answer as plain text (str() of the response object).
print(response)


The company's revenue decreased by $127 million, or 94%, from the same period in 2020. This decline was primarily due to the sale of its ATG Business and the JUMP Divestiture. In terms of adjusted EBITDA loss, the company saw an improvement of $450 million, or 98%.


In [25]:
# Create a retriever over the same index, asking for the 3 most similar
# results per query (similarity_top_k=3), to inspect retrieval on its own.
vector_retriever = vector_store_index.as_retriever(similarity_top_k=3)


In [26]:
# Run retrieval only (no answer synthesis) for the question text and keep the
# matching nodes for inspection in the following cells.
nodes = vector_retriever.retrieve(
    "Provide summary of the company performance in this quarter compared to earlier quarter"
)


In [27]:
# Number of retrieved results; expected to match similarity_top_k=3 set on the retriever.
len(nodes)

3

In [28]:
# Inspect the container type returned by retrieve() (a plain list in the recorded output).
type(nodes)


list

In [29]:
# List the top-level fields of the first retrieved result by converting it to a dict.
# NOTE(review): `.dict()` is the pydantic-v1-style name; confirm whether
# `model_dump()` / `to_dict()` is preferred in the installed llama_index version.
nodes[0].dict().keys()

dict_keys(['node', 'score', 'class_name'])

In [30]:
# Print the text content of the first retrieved result so it can be compared
# with the answer produced by the query engine.
print(nodes[0].get_content())

All Other
For  the  year  ended  December  31,  2021  compared  to  the  same  period  in  2020,  All  Other  revenue  decreased  $127  million,  or  94%  and  All  Otheradjusted EBITDA loss improved $450 million, or 98%.All Other revenue and All Other adjusted EBITDA loss improved primarily due to the  favorable impact of the sale of our ATG Business in the first quarter of2021 and the JUMP Divestiture in the second quarter of 2020.Certain Key Metrics and Non-GAAP Financial MeasuresAdjusted EBITDA and revenue  growth rates in constant currency  are non-GAAP financial  measures. For more information about how we use these non-GAAP financial measures in our business, the limitations of these measures, and reconciliations of these measures to the most directly comparable GAAP financialmeasures, see the section titled “Reconciliations of Non-GAAP Financial Measures.”Monthly Active Platform Consumers. MAPCs  is the number of unique consumers who completed a Mobility or New Mobility ride or

In [31]:
# For every retrieved result, print its id, source metadata and similarity
# score, followed by a separator line.
for node in nodes:
    print("Node Id:", node.id_)
    print("Metadata:", node.metadata)
    print("Score:", node.get_score())
    print("------------------------------------")

Node Id: f13b6e51-d5da-437e-869c-cc5cbba3f9f4
Metadata: {'page_label': '62', 'file_name': 'uber_2021.pdf', 'file_path': '..\\data_uber\\uber_2021.pdf', 'file_type': 'application/pdf', 'file_size': 1880483, 'creation_date': '2024-11-19', 'last_modified_date': '2024-11-19'}
Score: 0.6280461576380775
------------------------------------
Node Id: 5e204c28-9b87-46dd-a0b1-c940f468725d
Metadata: {'page_label': '2', 'file_name': 'uber_2021.pdf', 'file_path': '..\\data_uber\\uber_2021.pdf', 'file_type': 'application/pdf', 'file_size': 1880483, 'creation_date': '2024-11-19', 'last_modified_date': '2024-11-19'}
Score: 0.5931906201550231
------------------------------------
Node Id: 6f926d5b-23fc-46cf-b525-8b0e6905aa9f
Metadata: {'page_label': '93', 'file_name': 'uber_2021.pdf', 'file_path': '..\\data_uber\\uber_2021.pdf', 'file_type': 'application/pdf', 'file_size': 1880483, 'creation_date': '2024-11-19', 'last_modified_date': '2024-11-19'}
Score: 0.5923450937182048
------------------------------