### Chroma 
Chroma is an AI-native open-source vector database focused on developer productivity and happiness. Chroma is licensed under Apache 2.0.

In [1]:
from langchain_chroma import Chroma
from langchain_community.document_loaders import TextLoader
from langchain_text_splitters import RecursiveCharacterTextSplitter
from langchain_community.embeddings import OllamaEmbeddings


In [3]:
# Load the raw speech file as LangChain Document objects.
# The encoding is pinned to UTF-8 so the load does not depend on the
# platform's default encoding; the text contains non-ASCII punctuation
# (e.g. the curly apostrophe in "boys’"), which a non-UTF-8 default would
# fail on or garble.
loader = TextLoader('speech.txt', encoding='utf-8')
data = loader.load()
data

[Document(metadata={'source': 'speech.txt'}, page_content='Rajiv Gandhi University of Knowledge Technologies (RGUKT) Basar is unique university which actively uses Information and Communication Technology (ICT) in teaching. It is perhaps the first of its kind in the country with an educational model that is intensely ICT based. Established by the Government of erstwhile Andhra Pradesh vide a special act of legislation, this campus is loacated at the holy land of Basar (the abode of Gnyana Saraswathi, Goddess of knowledge) in Nirmal District (Telangana State). The campus is set in about 272 acres of salubrious and serene surrounding just a short distance from the banks of river Godavari.\n\nThe primary objective of establishing RGUKT is to provide high quality educational opportunities for the rural youth of the state. The selection process follows approved rules and has very high competition where only the top rural graduates (mostly within the top 5%) get the opportunity to study at R

In [5]:
# Break the loaded document(s) into chunks of up to 300 characters, allowing
# up to 30 characters of overlap between neighbouring chunks.
text_splitter = RecursiveCharacterTextSplitter(
    chunk_overlap=30,
    chunk_size=300,
)
text = text_splitter.split_documents(documents=data)
text

[Document(metadata={'source': 'speech.txt'}, page_content='Rajiv Gandhi University of Knowledge Technologies (RGUKT) Basar is unique university which actively uses Information and Communication Technology (ICT) in teaching. It is perhaps the first of its kind in the country with an educational model that is intensely ICT based. Established by the Government'),
 Document(metadata={'source': 'speech.txt'}, page_content='Established by the Government of erstwhile Andhra Pradesh vide a special act of legislation, this campus is loacated at the holy land of Basar (the abode of Gnyana Saraswathi, Goddess of knowledge) in Nirmal District (Telangana State). The campus is set in about 272 acres of salubrious and serene'),
 Document(metadata={'source': 'speech.txt'}, page_content='of salubrious and serene surrounding just a short distance from the banks of river Godavari.'),
 Document(metadata={'source': 'speech.txt'}, page_content='The primary objective of establishing RGUKT is to provide high 

In [6]:
# Embedding client; its repr shows it talks to an Ollama server on localhost.
# NOTE(review): "gemma2:2b" looks like a general-purpose generative model
# rather than a dedicated embedding model, and the similarity scores reported
# further down are in the thousands — confirm this is the intended model.
embeddings = OllamaEmbeddings(
    model="gemma2:2b",
)
embeddings

OllamaEmbeddings(base_url='http://localhost:11434', model='gemma2:2b', embed_instruction='passage: ', query_instruction='query: ', mirostat=None, mirostat_eta=None, mirostat_tau=None, num_ctx=None, num_gpu=None, num_thread=None, repeat_last_n=None, repeat_penalty=None, temperature=None, stop=None, tfs_z=None, top_k=None, top_p=None, show_progress=False, headers=None, model_kwargs=None)

In [7]:
# Embed every chunk and index it in a Chroma vector store.
# No persist_directory is passed in this cell.
db = Chroma.from_documents(
    documents=text,
    embedding=embeddings,
)
db

<langchain_chroma.vectorstores.Chroma at 0x76dda53145b0>

In [12]:
# Run a similarity search for the query and show the text of the first hit.
query = "Summarize the text"
result = db.similarity_search(query=query)
result[0].page_content

'RGUKT has slowly but surely risen in reputation as its graduating engineers have acted as perfect brand ambassadors for the university. Batches of engineers graduated from RGUKT are placed in various companies, Government services and public sector. Some of them have also set up their own business'

In [13]:
# Build the index again, this time persisted on disk under ./chroma_db.
#
# Stable, position-based ids make this cell safe to re-run: without explicit
# ids every run is assigned fresh random ids, so each re-execution appends
# another copy of every chunk to the on-disk collection. With fixed ids a
# re-run overwrites the existing entries instead.
# Caveat: if the chunking changes and produces fewer chunks, entries with
# higher positions from an earlier run remain until ./chroma_db is cleared.
chunk_ids = [
    f"{doc.metadata.get('source', 'doc')}:{position}"
    for position, doc in enumerate(text)
]
vector_db = Chroma.from_documents(
    text,
    embeddings,
    ids=chunk_ids,
    persist_directory="./chroma_db",
)
vector_db

<langchain_chroma.vectorstores.Chroma at 0x76ddc8f17310>

In [14]:
# Re-open the index stored under ./chroma_db and run the same query on it.
# Note: this rebinds `db`, which until now referred to the store that was
# built without a persist directory.
db = Chroma(
    embedding_function=embeddings,
    persist_directory="./chroma_db",
)
result = db.similarity_search(query=query)
result

[Document(metadata={'source': 'speech.txt'}, page_content='RGUKT has slowly but surely risen in reputation as its graduating engineers have acted as perfect brand ambassadors for the university. Batches of engineers graduated from RGUKT are placed in various companies, Government services and public sector. Some of them have also set up their own business'),
 Document(metadata={'source': 'speech.txt'}, page_content='recreational facilities, well equipped gymnasium, courts for basketball, badminton, table tennies, cricket, other sports and games.'),
 Document(metadata={'source': 'speech.txt'}, page_content='Established by the Government of erstwhile Andhra Pradesh vide a special act of legislation, this campus is loacated at the holy land of Basar (the abode of Gnyana Saraswathi, Goddess of knowledge) in Nirmal District (Telangana State). The campus is set in about 272 acres of salubrious and serene'),
 Document(metadata={'source': 'speech.txt'}, page_content='1,00,000 volumes, boys’ an

In [15]:
# Same search, but each hit comes back as a (Document, score) pair.
# NOTE(review): the scores appear to be distances (smallest listed first) —
# confirm against the langchain_chroma documentation.
result = db.similarity_search_with_score(query=query)
result

[(Document(metadata={'source': 'speech.txt'}, page_content='RGUKT has slowly but surely risen in reputation as its graduating engineers have acted as perfect brand ambassadors for the university. Batches of engineers graduated from RGUKT are placed in various companies, Government services and public sector. Some of them have also set up their own business'),
  7860.908691640049),
 (Document(metadata={'source': 'speech.txt'}, page_content='recreational facilities, well equipped gymnasium, courts for basketball, badminton, table tennies, cricket, other sports and games.'),
  9980.454538519843),
 (Document(metadata={'source': 'speech.txt'}, page_content='Established by the Government of erstwhile Andhra Pradesh vide a special act of legislation, this campus is loacated at the holy land of Basar (the abode of Gnyana Saraswathi, Goddess of knowledge) in Nirmal District (Telangana State). The campus is set in about 272 acres of salubrious and serene'),
  10636.10497604885),
 (Document(metad

In [17]:
# Wrap the vector store in the retriever interface, run the query through it,
# and show the text of the first document returned.
retriever = db.as_retriever()
result = retriever.invoke(input=query)
result[0].page_content

'RGUKT has slowly but surely risen in reputation as its graduating engineers have acted as perfect brand ambassadors for the university. Batches of engineers graduated from RGUKT are placed in various companies, Government services and public sector. Some of them have also set up their own business'