In [77]:
from dotenv import load_dotenv
load_dotenv()

import os
os.environ["HF_TOKEN"] = os.getenv("HF_TOKEN")

In [78]:
from langchain_huggingface import HuggingFaceEmbeddings
embedding = HuggingFaceEmbeddings(model_name="all-MiniLM-L6-v2")

In [79]:
check_embedding_model = embedding.embed_query("Hello AI")
len(check_embedding_model)

384

In [80]:
from langchain_google_genai import GoogleGenerativeAIEmbeddings
embeddings = GoogleGenerativeAIEmbeddings(model="models/gemini-embedding-001")

In [81]:
check_embedding_model = embeddings.embed_query("Hello AI")
len(check_embedding_model)

3072

In [82]:
from pinecone import Pinecone

In [83]:
pinecone_api_key = os.getenv("PINECONE_API_KEY")

In [84]:
pinecone_api_key

'pcsk_2hyePj_KP7jEWrtkJcAAhsyKCAU8UnBZXZ1jbBFAgGFy6PbTThVgpW9ddU8RvDy5RE9VSn'

In [85]:
pc = Pinecone(api_key=pinecone_api_key)

In [86]:
from pinecone import ServerlessSpec
#Serverless: Server will be Managed by the cloud provider

In [87]:
index_name="agentic-docs"

In [88]:
pc.has_index(index_name)

False

In [89]:
#creating a index
if not pc.has_index(index_name):
    pc.create_index(
    name=index_name,
    dimension=3072,
    metric="cosine",
    spec=ServerlessSpec(cloud="aws",region="us-east-1")    
)

In [90]:
#loading the index
index=pc.Index(index_name)

In [91]:
from langchain_pinecone import PineconeVectorStore

In [92]:
vector_store = PineconeVectorStore(index=index,embedding=embeddings)

In [93]:
results = vector_store.similarity_search("what is a langchain?")

In [94]:
results

[]

In [95]:
from uuid import uuid4
from langchain_core.documents import Document

document_1 = Document(
    page_content="I had chocolate chip pancakes and scrambled eggs for breakfast this morning.",
    metadata={"source": "tweet"}, #additional info
)

document_2 = Document(
    page_content="The weather forecast for tomorrow is cloudy and overcast, with a high of 62 degrees.",
    metadata={"source": "news"},
)

document_3 = Document(
    page_content="Building an exciting new project with LangChain - come check it out!",
    metadata={"source": "tweet"},
)

document_4 = Document(
    page_content="Robbers broke into the city bank and stole $1 million in cash.",
    metadata={"source": "news"},
)

document_5 = Document(
    page_content="Wow! That was an amazing movie. I can't wait to see it again.",
    metadata={"source": "tweet"},
)

document_6 = Document(
    page_content="Is the new iPhone worth the price? Read this review to find out.",
    metadata={"source": "website"},
)

document_7 = Document(
    page_content="The top 10 soccer players in the world right now.",
    metadata={"source": "website"},
)

document_8 = Document(
    page_content="LangGraph is the best framework for building stateful, agentic applications!",
    metadata={"source": "tweet"},
)

document_9 = Document(
    page_content="The stock market is down 500 points today due to fears of a recession.",
    metadata={"source": "news"},
)

document_10 = Document(
    page_content="I have a bad feeling I am going to get deleted :(",
    metadata={"source": "tweet"},
)


In [96]:
documents = [
    document_1,
    document_2,
    document_3,
    document_4,
    document_5,
    document_6,
    document_7,
    document_8,
    document_9,
    document_10,
]

In [97]:
documents

[Document(metadata={'source': 'tweet'}, page_content='I had chocolate chip pancakes and scrambled eggs for breakfast this morning.'),
 Document(metadata={'source': 'news'}, page_content='The weather forecast for tomorrow is cloudy and overcast, with a high of 62 degrees.'),
 Document(metadata={'source': 'tweet'}, page_content='Building an exciting new project with LangChain - come check it out!'),
 Document(metadata={'source': 'news'}, page_content='Robbers broke into the city bank and stole $1 million in cash.'),
 Document(metadata={'source': 'tweet'}, page_content="Wow! That was an amazing movie. I can't wait to see it again."),
 Document(metadata={'source': 'website'}, page_content='Is the new iPhone worth the price? Read this review to find out.'),
 Document(metadata={'source': 'website'}, page_content='The top 10 soccer players in the world right now.'),
 Document(metadata={'source': 'tweet'}, page_content='LangGraph is the best framework for building stateful, agentic application

In [98]:
len(documents)

10

In [99]:
range(len(documents))

range(0, 10)

In [100]:
for i in range(len(documents)):
    print(i)
    print(str(uuid4()))
    

0
b7591b03-53bd-41bd-b9c2-a0f8d866bf42
1
0cd9382c-f7c3-4b75-a61f-614e8cb01e54
2
cdedb52c-d994-4087-9d81-74316c284d53
3
510fa2f2-37a2-4f7b-abf3-d08d3eee6f36
4
7303ff26-20c7-40d1-aa70-65da7a770642
5
cc302efb-f0a0-45ae-943d-f6d497751463
6
c2ebf964-dc97-4875-9288-bea1585b55cc
7
341ee6d4-1818-4e64-9011-114bb011bea9
8
4e8e0b25-6f24-48fa-a721-e1677b81535a
9
6a94d5e7-eb86-45ac-bbc6-415eaa6ad396


In [101]:
#universal indentification number
uuids = [str(uuid4()) for _ in range(len(documents))]

In [102]:
uuids

['36511a0f-05dc-4bfd-ada1-785feb31b88a',
 'f840fb7a-1efd-4280-ae46-c1cceb29cb26',
 'bc2c60de-8a57-4631-8b08-191bb99dcba2',
 '8f730a22-9265-4e92-94a9-f1e0afbec90a',
 'd6ea59f6-4573-4c62-bc68-5d4b135c5e89',
 '596982a6-98f7-4982-a4c5-f2f36ae60149',
 'dc28dc9a-2e1a-4ddb-a5cb-0d3bef00ea34',
 'ff8aa14f-0f34-4a2c-86e3-21852d9ecaaa',
 'd3f3ccf8-b17c-4a0b-b522-3507f6465380',
 'fd05ebf0-89e4-4b43-a7da-0922ec0df632']

In [103]:
vector_store.add_documents(documents=documents, ids=uuids)

['36511a0f-05dc-4bfd-ada1-785feb31b88a',
 'f840fb7a-1efd-4280-ae46-c1cceb29cb26',
 'bc2c60de-8a57-4631-8b08-191bb99dcba2',
 '8f730a22-9265-4e92-94a9-f1e0afbec90a',
 'd6ea59f6-4573-4c62-bc68-5d4b135c5e89',
 '596982a6-98f7-4982-a4c5-f2f36ae60149',
 'dc28dc9a-2e1a-4ddb-a5cb-0d3bef00ea34',
 'ff8aa14f-0f34-4a2c-86e3-21852d9ecaaa',
 'd3f3ccf8-b17c-4a0b-b522-3507f6465380',
 'fd05ebf0-89e4-4b43-a7da-0922ec0df632']

In [111]:
results = vector_store.similarity_search("What langchain provides to us?", k=8)
results

[Document(id='bc2c60de-8a57-4631-8b08-191bb99dcba2', metadata={'source': 'tweet'}, page_content='Building an exciting new project with LangChain - come check it out!'),
 Document(id='ff8aa14f-0f34-4a2c-86e3-21852d9ecaaa', metadata={'source': 'tweet'}, page_content='LangGraph is the best framework for building stateful, agentic applications!'),
 Document(id='fd05ebf0-89e4-4b43-a7da-0922ec0df632', metadata={'source': 'tweet'}, page_content='I have a bad feeling I am going to get deleted :('),
 Document(id='f840fb7a-1efd-4280-ae46-c1cceb29cb26', metadata={'source': 'news'}, page_content='The weather forecast for tomorrow is cloudy and overcast, with a high of 62 degrees.'),
 Document(id='d3f3ccf8-b17c-4a0b-b522-3507f6465380', metadata={'source': 'news'}, page_content='The stock market is down 500 points today due to fears of a recession.'),
 Document(id='36511a0f-05dc-4bfd-ada1-785feb31b88a', metadata={'source': 'tweet'}, page_content='I had chocolate chip pancakes and scrambled eggs for 

In [110]:
results = vector_store.similarity_search("What langchain provides to us?", k=5, filter={"source": "tweet"})
results

[Document(id='bc2c60de-8a57-4631-8b08-191bb99dcba2', metadata={'source': 'tweet'}, page_content='Building an exciting new project with LangChain - come check it out!'),
 Document(id='ff8aa14f-0f34-4a2c-86e3-21852d9ecaaa', metadata={'source': 'tweet'}, page_content='LangGraph is the best framework for building stateful, agentic applications!'),
 Document(id='fd05ebf0-89e4-4b43-a7da-0922ec0df632', metadata={'source': 'tweet'}, page_content='I have a bad feeling I am going to get deleted :('),
 Document(id='36511a0f-05dc-4bfd-ada1-785feb31b88a', metadata={'source': 'tweet'}, page_content='I had chocolate chip pancakes and scrambled eggs for breakfast this morning.'),
 Document(id='d6ea59f6-4573-4c62-bc68-5d4b135c5e89', metadata={'source': 'tweet'}, page_content="Wow! That was an amazing movie. I can't wait to see it again.")]

### Let's implement RAG on top of this

In [115]:
retriever=vector_store.as_retriever(
    search_type="similarity_score_threshold",
    search_kwargs={"k":3, "score_threshold": 0.7} #hyperparameter
)

In [116]:
retriever.invoke("langchain")

[Document(id='bc2c60de-8a57-4631-8b08-191bb99dcba2', metadata={'source': 'tweet'}, page_content='Building an exciting new project with LangChain - come check it out!'),
 Document(id='ff8aa14f-0f34-4a2c-86e3-21852d9ecaaa', metadata={'source': 'tweet'}, page_content='LangGraph is the best framework for building stateful, agentic applications!'),
 Document(id='d3f3ccf8-b17c-4a0b-b522-3507f6465380', metadata={'source': 'news'}, page_content='The stock market is down 500 points today due to fears of a recession.')]

In [117]:
retriever.invoke("google")

[Document(id='596982a6-98f7-4982-a4c5-f2f36ae60149', metadata={'source': 'website'}, page_content='Is the new iPhone worth the price? Read this review to find out.'),
 Document(id='fd05ebf0-89e4-4b43-a7da-0922ec0df632', metadata={'source': 'tweet'}, page_content='I have a bad feeling I am going to get deleted :('),
 Document(id='bc2c60de-8a57-4631-8b08-191bb99dcba2', metadata={'source': 'tweet'}, page_content='Building an exciting new project with LangChain - come check it out!')]

In [None]:
from langchain_google_genai import ChatGoogleGenerativeAI
model=ChatGoogleGenerativeAI(model='gemini-3-flash-preview')

In [120]:
from langchain_classic import hub
prompt = hub.pull("rlm/rag-prompt")

In [121]:
import pprint
pprint.pprint(prompt.messages)

[HumanMessagePromptTemplate(prompt=PromptTemplate(input_variables=['context', 'question'], input_types={}, partial_variables={}, template="You are an assistant for question-answering tasks. Use the following pieces of retrieved context to answer the question. If you don't know the answer, just say that you don't know. Use three sentences maximum and keep the answer concise.\nQuestion: {question} \nContext: {context} \nAnswer:"), additional_kwargs={})]


In [122]:
from langchain_core.prompts import PromptTemplate

In [123]:
prompt=PromptTemplate(
    template="""You are an assistant for question-answering tasks. Use the following pieces of retrieved context to answer the question. If you don't know the answer, just say that you don't know. Use three sentences maximum and keep the answer concise.\nQuestion: {question} \nContext: {context} \nAnswer:""",
    input_variables=['context', 'question']
)

In [124]:
prompt

PromptTemplate(input_variables=['context', 'question'], input_types={}, partial_variables={}, template="You are an assistant for question-answering tasks. Use the following pieces of retrieved context to answer the question. If you don't know the answer, just say that you don't know. Use three sentences maximum and keep the answer concise.\nQuestion: {question} \nContext: {context} \nAnswer:")

In [125]:
prompt.invoke({"question":"what is a langchain?","context":"langchain is very super framework for LLM."})

StringPromptValue(text="You are an assistant for question-answering tasks. Use the following pieces of retrieved context to answer the question. If you don't know the answer, just say that you don't know. Use three sentences maximum and keep the answer concise.\nQuestion: what is a langchain? \nContext: langchain is very super framework for LLM. \nAnswer:")

In [126]:
from langchain_core.output_parsers import StrOutputParser
from langchain_core.runnables import RunnablePassthrough

In [127]:
def format_docs(docs):
    return "\n\n".join(doc.page_content for doc in docs)

In [128]:
rag_chain = (
    {"context": retriever | format_docs, "question": RunnablePassthrough()}
    | prompt
    | model
    | StrOutputParser()
)

In [129]:
rag_chain.invoke("what is llama model?")

ChatGoogleGenerativeAIError: Error calling model 'gemini-1.5-flash' (NOT_FOUND): 404 NOT_FOUND. {'error': {'code': 404, 'message': 'models/gemini-1.5-flash is not found for API version v1beta, or is not supported for generateContent. Call ListModels to see the list of available models and their supported methods.', 'status': 'NOT_FOUND'}}