In [1]:
from langchain_ollama import ChatOllama,OllamaEmbeddings
from langchain_core.prompts import PromptTemplate
from langchain_core.output_parsers import StrOutputParser
from langchain_core.runnables import RunnableSequence
from langchain_chroma import Chroma
from langchain_core.documents import Document

  from .autonotebook import tqdm as notebook_tqdm


In [2]:
llm = ChatOllama(
    model='qwen2:7b',
    temperature=0.25
)

embeddings = OllamaEmbeddings(
    model="nomic-embed-text"
)

In [3]:
doc1 = Document(
        page_content="Artificial Intelligence is transforming healthcare by enabling early disease detection, personalized treatments, and intelligent patient monitoring systems.",
        metadata={"source": "healthcare_ai.pdf", "topic": "AI in Healthcare", "page": 1}
    )

doc2 = Document(
        page_content="Climate change is intensifying heat waves, floods, and air pollution in urban areas, forcing cities to adopt sustainable infrastructure and green planning strategies.",
        metadata={"source": "climate_report.pdf", "topic": "Climate Change", "page": 3}
    )

doc3 = Document(
        page_content="Digital education platforms provide flexible learning opportunities through virtual classrooms, recorded lectures, and AI-powered personalized learning paths.",
        metadata={"source": "edtech_study.pdf", "topic": "Digital Education", "page": 5}
    )

doc4 = Document(
        page_content="Blockchain technology ensures transparency and security by using decentralized ledgers, making it valuable for finance, supply chain management, and identity verification.",
        metadata={"source": "blockchain_intro.pdf", "topic": "Blockchain", "page": 2}
    )

doc5 = Document(
        page_content="Renewable energy sources such as solar and wind power reduce carbon emissions and play a crucial role in achieving global sustainability goals.",
        metadata={"source": "renewable_energy.pdf", "topic": "Renewable Energy", "page": 4}
    )


documents = [doc1,doc2,doc3,doc4,doc5]

In [4]:
vector_store= Chroma(
    embedding_function=embeddings,
    persist_directory='chroma_db',
    collection_name='sample'
)

In [5]:
vector_store.add_documents(documents=documents)

['6b07c222-be66-493b-b777-47c811f8af0c',
 '051dd0c9-bcb0-4ae6-bf0e-551f0654bea6',
 'a714aa6d-1542-4dfb-969b-0f9763276c48',
 'd25116ea-c50f-4cb7-8720-11f902e92214',
 '33ad3e70-a30d-4b91-8e27-673ef2dc6689']

In [6]:
vector_store.get(include=['embeddings','documents','metadatas'])

{'ids': ['6b07c222-be66-493b-b777-47c811f8af0c',
  '051dd0c9-bcb0-4ae6-bf0e-551f0654bea6',
  'a714aa6d-1542-4dfb-969b-0f9763276c48',
  'd25116ea-c50f-4cb7-8720-11f902e92214',
  '33ad3e70-a30d-4b91-8e27-673ef2dc6689'],
 'embeddings': array([[-0.01201622,  0.04824475, -0.20268233, ..., -0.03268716,
         -0.03367926,  0.0375347 ],
        [ 0.03164107,  0.01733262, -0.18116248, ..., -0.05233952,
         -0.03189682, -0.03273316],
        [-0.03317867,  0.05688502, -0.16555917, ..., -0.05312532,
         -0.00448262, -0.00966839],
        [ 0.02738579,  0.07661138, -0.17295662, ..., -0.08102485,
         -0.03788646, -0.00431817],
        [ 0.03025259,  0.06974135, -0.16867268, ..., -0.04695843,
         -0.03084164, -0.03841866]], shape=(5, 768)),
 'documents': ['Artificial Intelligence is transforming healthcare by enabling early disease detection, personalized treatments, and intelligent patient monitoring systems.',
  'Climate change is intensifying heat waves, floods, and air pol

In [8]:
vector_store.similarity_search_with_score(
    query='what flexible learning opoortunities are provided by digital education',
    k=2
)

[(Document(id='a714aa6d-1542-4dfb-969b-0f9763276c48', metadata={'source': 'edtech_study.pdf', 'topic': 'Digital Education', 'page': 5}, page_content='Digital education platforms provide flexible learning opportunities through virtual classrooms, recorded lectures, and AI-powered personalized learning paths.'),
  0.4852980971336365),
 (Document(id='6b07c222-be66-493b-b777-47c811f8af0c', metadata={'page': 1, 'topic': 'AI in Healthcare', 'source': 'healthcare_ai.pdf'}, page_content='Artificial Intelligence is transforming healthcare by enabling early disease detection, personalized treatments, and intelligent patient monitoring systems.'),
  1.0176291465759277)]

In [9]:
updated_doc1 =Document(
    page_content='Delhi is capital of India',
    metadata={"source":"TOI","topic": "General Knowledge", "page": 1}
)

vector_store.update_document(document_id='6b07c222-be66-493b-b777-47c811f8af0c',document=updated_doc1)