## Chroma DB

Chroma is an AI-native, open-source vector database focused on developer productivity and happiness. Chroma is licensed under Apache 2.0.

In [3]:
from langchain_chroma import Chroma

In [4]:
from langchain_community.document_loaders import TextLoader
from langchain_community.vectorstores import FAISS
from langchain_community.embeddings import OllamaEmbeddings
from langchain_text_splitters import CharacterTextSplitter

# Read the speech transcript from disk as LangChain documents.
# NOTE(review): this is an absolute, machine-specific path; adjust it before
# running the notebook on another machine.
loader = TextLoader(
    file_path="/home/raja/learnings/GEN_AI_KRISH/Langchain/1-Langchain/1_DataInjection/speech.txt"
)
documents = loader.load()

In [5]:
# Break the loaded documents into chunks before embedding them.
text_spliter = CharacterTextSplitter(
    chunk_size=1000,
    chunk_overlap=30,
)
docs = text_spliter.split_documents(documents=documents)

In [7]:
# Embedding function backed by the "gemma:2b" model through Ollama.
# NOTE(review): presumably needs a reachable Ollama instance with this model
# already pulled - confirm before running.
embeddings = OllamaEmbeddings(
    model="gemma:2b",
)

In [8]:
# Embed every chunk and index it in a Chroma vector store.
# No persist_directory is passed here, so nothing is explicitly saved to disk.
db = Chroma.from_documents(
    documents=docs,
    embedding=embeddings,
)

In [9]:
# Natural-language question reused by every search cell below.
query = "How does the speaker describe the desired outcome of the war?"

In [11]:
# Retrieve the chunks most similar to the question; the bare name on the
# last line makes the notebook display the resulting list.
doc = db.similarity_search(query=query)
doc

[Document(metadata={'source': '/home/raja/learnings/GEN_AI_KRISH/Langchain/1-Langchain/1_DataInjection/speech.txt'}, page_content='…\n\nIt will be all the easier for us to conduct ourselves as belligerents in a high spirit of right and fairness because we act without animus, not in enmity toward a people or with the desire to bring any injury or disadvantage upon them, but only in armed opposition to an irresponsible government which has thrown aside all considerations of humanity and of right and is running amuck. We are, let me say again, the sincere friends of the German people, and shall desire nothing so much as the early reestablishment of intimate relations of mutual advantage between us—however hard it may be for them, for the time being, to believe that this is spoken from our hearts.'),
 Document(metadata={'source': '/home/raja/learnings/GEN_AI_KRISH/Langchain/1-Langchain/1_DataInjection/speech.txt'}, page_content='To such a task we can dedicate our lives and our fortunes, ev

In [12]:
# Show only the text of the first (top-ranked) search hit, without metadata.
doc[0].page_content

'…\n\nIt will be all the easier for us to conduct ourselves as belligerents in a high spirit of right and fairness because we act without animus, not in enmity toward a people or with the desire to bring any injury or disadvantage upon them, but only in armed opposition to an irresponsible government which has thrown aside all considerations of humanity and of right and is running amuck. We are, let me say again, the sincere friends of the German people, and shall desire nothing so much as the early reestablishment of intimate relations of mutual advantage between us—however hard it may be for them, for the time being, to believe that this is spoken from our hearts.'

In [13]:
# Build the store again, this time with a persist_directory so the index is
# written under ./chromadb and can be reopened later.
# NOTE(review): this embeds `docs` a second time and rebinds `db`; re-running
# the cell against an existing ./chromadb presumably adds the same chunks
# again as duplicates - confirm.
db = Chroma.from_documents(
    documents=docs,
    embedding=embeddings,
    persist_directory="./chromadb",
)


In [14]:
# Reopen the store saved under ./chromadb instead of re-embedding the
# documents; the same embedding function is supplied for embedding queries.
reusestoreddb = Chroma(
    embedding_function=embeddings,
    persist_directory="./chromadb",
)

In [15]:
# Run the same question against the reloaded store and display the hits.
reusestoreddb.similarity_search(query=query)

[Document(metadata={'source': '/home/raja/learnings/GEN_AI_KRISH/Langchain/1-Langchain/1_DataInjection/speech.txt'}, page_content='…\n\nIt will be all the easier for us to conduct ourselves as belligerents in a high spirit of right and fairness because we act without animus, not in enmity toward a people or with the desire to bring any injury or disadvantage upon them, but only in armed opposition to an irresponsible government which has thrown aside all considerations of humanity and of right and is running amuck. We are, let me say again, the sincere friends of the German people, and shall desire nothing so much as the early reestablishment of intimate relations of mutual advantage between us—however hard it may be for them, for the time being, to believe that this is spoken from our hearts.'),
 Document(metadata={'source': '/home/raja/learnings/GEN_AI_KRISH/Langchain/1-Langchain/1_DataInjection/speech.txt'}, page_content='To such a task we can dedicate our lives and our fortunes, ev

In [16]:
# Same search, but each hit is returned as a (Document, score) tuple.
# The score is a distance, so a lower value means a closer match. It is NOT a
# Manhattan distance: this notebook never configures a metric, and Chroma's
# documented default space is "l2" (squared Euclidean distance).
reusestoreddb.similarity_search_with_score(query)

[(Document(metadata={'source': '/home/raja/learnings/GEN_AI_KRISH/Langchain/1-Langchain/1_DataInjection/speech.txt'}, page_content='…\n\nIt will be all the easier for us to conduct ourselves as belligerents in a high spirit of right and fairness because we act without animus, not in enmity toward a people or with the desire to bring any injury or disadvantage upon them, but only in armed opposition to an irresponsible government which has thrown aside all considerations of humanity and of right and is running amuck. We are, let me say again, the sincere friends of the German people, and shall desire nothing so much as the early reestablishment of intimate relations of mutual advantage between us—however hard it may be for them, for the time being, to believe that this is spoken from our hearts.'),
  2946.6435194455653),
 (Document(metadata={'source': '/home/raja/learnings/GEN_AI_KRISH/Langchain/1-Langchain/1_DataInjection/speech.txt'}, page_content='To such a task we can dedicate our l

In [18]:
# Wrap the reloaded store in LangChain's retriever interface and run the
# question through it; the result of invoke() is displayed by the notebook.
retriever = reusestoreddb.as_retriever()
retriever.invoke(input=query)

[Document(metadata={'source': '/home/raja/learnings/GEN_AI_KRISH/Langchain/1-Langchain/1_DataInjection/speech.txt'}, page_content='…\n\nIt will be all the easier for us to conduct ourselves as belligerents in a high spirit of right and fairness because we act without animus, not in enmity toward a people or with the desire to bring any injury or disadvantage upon them, but only in armed opposition to an irresponsible government which has thrown aside all considerations of humanity and of right and is running amuck. We are, let me say again, the sincere friends of the German people, and shall desire nothing so much as the early reestablishment of intimate relations of mutual advantage between us—however hard it may be for them, for the time being, to believe that this is spoken from our hearts.'),
 Document(metadata={'source': '/home/raja/learnings/GEN_AI_KRISH/Langchain/1-Langchain/1_DataInjection/speech.txt'}, page_content='To such a task we can dedicate our lives and our fortunes, ev