In [1]:
# Build a sample vector DB

from langchain_chroma import Chroma
from langchain_community.document_loaders import TextLoader
from langchain_community.embeddings import OllamaEmbeddings
from langchain_text_splitters import RecursiveCharacterTextSplitter



In [3]:
# Load the raw text file. The encoding is pinned to UTF-8 so the result does
# not depend on the platform's default locale encoding; the file contains
# non-ASCII punctuation (e.g. curly apostrophes) that can fail to decode or be
# mis-decoded under a non-UTF-8 default.
loader = TextLoader("test.txt", encoding="utf-8")
documents = loader.load()

# Split the loaded documents into chunks (chunk_size=500, no overlap between
# consecutive chunks).
text_splitter = RecursiveCharacterTextSplitter(chunk_size=500, chunk_overlap=0)
splits = text_splitter.split_documents(documents)

In [4]:
# Create the Ollama-backed embedding function and index the chunks in a Chroma
# vector store. No persist_directory is passed in this cell.
# NOTE(review): "gemma2:2b" looks like a general-purpose chat model rather than
# a dedicated embedding model -- confirm this is the intended choice.
embedding = OllamaEmbeddings(model="gemma2:2b")
vector_db = Chroma.from_documents(
    documents=splits,
    embedding=embedding,
)

# Bare expression so the notebook displays the store object.
vector_db

<langchain_chroma.vectorstores.Chroma at 0x72452d96d6f0>

In [5]:
# Run a sample question against the vector store and display the text of the
# first document it returns.
query = "How is our dependency growing in AI tools"
docs = vector_db.similarity_search(query=query)

first_hit = docs[0]
first_hit.page_content

'Our growing dependency on AI tools also raises concerns about digital dependency. The ease of access to AI-generated content can create a false sense of productivity, masking the fact that we’re becoming increasingly passive consumers of information. This dependency can lead to a decline in our ability to learn independently and make informed decisions without external assistance.\nFinding a Balance\nfinding balance'

In [6]:
## Saving to the disk
# Give every chunk a stable id so that re-running this cell overwrites the
# records already stored in ./chroma_db instead of adding a second copy of
# each chunk. Without explicit ids each run stores the chunks again under
# fresh ids, and searches against the persisted store start returning
# duplicate hits.
# NOTE: the ids are positional. If test.txt shrinks, trailing chunks written by
# an older run remain in the store, and records written before ids were
# introduced are not deduplicated -- delete ./chroma_db to rebuild from scratch.
chunk_ids = [f"test.txt-chunk-{i}" for i in range(len(splits))]
vector_db = Chroma.from_documents(
    documents=splits,
    embedding=embedding,
    ids=chunk_ids,
    persist_directory="./chroma_db",
)


In [7]:
# Open the store saved under ./chroma_db, supplying the same embedding function
# for queries, then repeat the earlier search against it.
db2 = Chroma(
    embedding_function=embedding,
    persist_directory="./chroma_db",
)
docs = db2.similarity_search(query=query)
docs[0].page_content

'Our growing dependency on AI tools also raises concerns about digital dependency. The ease of access to AI-generated content can create a false sense of productivity, masking the fact that we’re becoming increasingly passive consumers of information. This dependency can lead to a decline in our ability to learn independently and make informed decisions without external assistance.\nFinding a Balance\nfinding balance'

In [8]:
## Retriever option
# Wrap the vector store in a retriever, run the same query through it, and
# display the text of the first document returned.
retriever = vector_db.as_retriever()
retrieved_docs = retriever.invoke(query)
retrieved_docs[0].page_content

'Our growing dependency on AI tools also raises concerns about digital dependency. The ease of access to AI-generated content can create a false sense of productivity, masking the fact that we’re becoming increasingly passive consumers of information. This dependency can lead to a decline in our ability to learn independently and make informed decisions without external assistance.\nFinding a Balance\nfinding balance'