In [1]:
import os
from dotenv import load_dotenv
from langchain_openai import OpenAIEmbeddings
from langchain_pinecone import PineconeVectorStore
from pprint import pprint

  from tqdm.autonotebook import tqdm


In [2]:
# Pull API credentials from a local .env file into the process environment
# before any client is constructed. By default load_dotenv() does not override
# variables that are already set, so an externally configured environment
# keeps working unchanged.
load_dotenv()

# Name of the Pinecone index queried by the cells below.
index_name = "langchain-index"
# Embedding model used to vectorise queries sent to the index.
embeddings = OpenAIEmbeddings(model="text-embedding-3-small")

In [3]:
# Wrap the Pinecone index `index_name` in a LangChain vector store that
# embeds text with `embeddings`.
vector_store = PineconeVectorStore(
    embedding=embeddings,
    index_name=index_name,
)

In [4]:
# Ad-hoc similarity search issued directly against the vector store.
query = "Tax policies for young adults"
docs = vector_store.similarity_search(query, k=3)

# Iterate over whatever came back rather than indexing docs[0], docs[1],
# docs[2]: fixed indices raise IndexError when the index returns fewer than
# three matches. With three results the printed output is unchanged.
for doc in docs:
    pprint(doc.page_content)

('Provides Life-Saving Humanitarian Assistance and Combats Global Food '
 'Insecurity. The Budget provides $10.3 billion in life-saving humanitarian '
 'and refugee assistance to support more than 330 million people in need in '
 'more than 70 countries in addition to the emergency supplemental request of '
 '$10 billion to address unprecedented global humanitarian needs, including '
 'the dire humanitarian situation facing Palestinians in Gaza. The Department '
 'of State and the United States Agency for International Development will '
 'have to reduce life-saving assistance around the globe without the '
 'additional $10 billion in humanitarian assistance requested in the '
 'Administration’s October 2023 National Security Supplemental Request.\n'
 '\n'
 '### Title: FACT SHEET: The President’s Budget for Fiscal Year 2025 Date '
 'Posted: March 11, 2024 Category: Statements and Releases')
('In addition, the President’s Budget explains his principles for addressing '
 'tax cuts expiri

In [7]:
# Build a retriever on top of the Pinecone-backed vector store, configured
# for plain similarity search with k=3 results per query.
vector_store = PineconeVectorStore(
    embedding=embeddings,
    index_name=index_name,
)
retriever = vector_store.as_retriever(
    search_kwargs={"k": 3},
    search_type="similarity",
)

In [10]:
# Send the query through the retriever, then dump every hit: a numbered
# heading followed by the document text and its metadata.
matched_docs = retriever.invoke(query)
for i, doc in enumerate(matched_docs):
    print(f"\n## Document {i}\n")
    for part in (doc.page_content, doc.metadata):
        pprint(part)


## Document 0

('Provides Life-Saving Humanitarian Assistance and Combats Global Food '
 'Insecurity. The Budget provides $10.3 billion in life-saving humanitarian '
 'and refugee assistance to support more than 330 million people in need in '
 'more than 70 countries in addition to the emergency supplemental request of '
 '$10 billion to address unprecedented global humanitarian needs, including '
 'the dire humanitarian situation facing Palestinians in Gaza. The Department '
 'of State and the United States Agency for International Development will '
 'have to reduce life-saving assistance around the globe without the '
 'additional $10 billion in humanitarian assistance requested in the '
 'Administration’s October 2023 National Security Supplemental Request.\n'
 '\n'
 '### Title: FACT SHEET: The President’s Budget for Fiscal Year 2025 Date '
 'Posted: March 11, 2024 Category: Statements and Releases')
{'collection': 'whbriefingroom',
 'database': 'WTP',
 'id': '66a9003defac37d905d