### Chroma Vector Store DB and Retriever

In [9]:
from langchain_chroma import Chroma
from langchain_community.document_loaders import TextLoader
from langchain_text_splitters import CharacterTextSplitter
from langchain_community.embeddings import OllamaEmbeddings

# Read speech1.txt (path relative to the notebook's working directory) into
# LangChain Document objects.
loader = TextLoader("speech1.txt")
data = loader.load()
# Echo the loaded documents so the text and its metadata can be inspected.
data


[Document(metadata={'source': 'speech1.txt'}, page_content="Speech is the use of the human voice as a medium for language. Spoken language combines vowel and consonant sounds to form units of meaning like words, which belong to a language's lexicon. There are many different intentional speech acts, such as informing, declaring, asking, persuading, directing; acts may vary in various aspects like enunciation, intonation, loudness, and tempo to convey meaning. Individuals may also unintentionally communicate aspects of their social position through speech, such as sex, age, place of origin, physiological and mental condition, education, and experiences.\nWhile normally used to facilitate communication with others, people may also use speech without the intent to communicate. Speech may nevertheless express emotions or desires; people talk to themselves sometimes in acts that are a development of what some psychologists (e.g., Lev Vygotsky) have maintained is the use of silent speech in a

In [10]:
# Break the loaded documents into chunks targeting 1000 characters each, with
# a 30-character overlap between neighbouring chunks.
# The splitter can emit chunks longer than chunk_size (it logs a
# "Created a chunk of size ..." warning when it does), so treat 1000 as a
# target rather than a hard limit.
text_splitter = CharacterTextSplitter(chunk_size=1000, chunk_overlap=30)
docs = text_splitter.split_documents(data)
docs

Created a chunk of size 1217, which is longer than the specified 1000


[Document(metadata={'source': 'speech1.txt'}, page_content="Speech is the use of the human voice as a medium for language. Spoken language combines vowel and consonant sounds to form units of meaning like words, which belong to a language's lexicon. There are many different intentional speech acts, such as informing, declaring, asking, persuading, directing; acts may vary in various aspects like enunciation, intonation, loudness, and tempo to convey meaning. Individuals may also unintentionally communicate aspects of their social position through speech, such as sex, age, place of origin, physiological and mental condition, education, and experiences.\nWhile normally used to facilitate communication with others, people may also use speech without the intent to communicate. Speech may nevertheless express emotions or desires; people talk to themselves sometimes in acts that are a development of what some psychologists (e.g., Lev Vygotsky) have maintained is the use of silent speech in a

In [11]:
# Embedding function backed by the "gemma:2b" model served through Ollama.
# NOTE(review): gemma:2b looks like a general-purpose LLM rather than a
# dedicated embedding model; confirm it gives useful similarity rankings.
embeddings = OllamaEmbeddings(model="gemma:2b")

# Embed every chunk in `docs` and index it in a Chroma vector store
# (no persist_directory is passed for this store).
db = Chroma.from_documents(docs, embeddings)
db

<langchain_chroma.vectorstores.Chroma at 0x2b291ad5780>

In [14]:
## Query
query = "What is the main topic of the speech?"

# Keep the hits under their own name. `docs` is the list of split chunks, and
# a later cell passes it to Chroma.from_documents; rebinding `docs` to the
# search hits here would make that cell index only these few results.
search_results = db.similarity_search(query)

# Text of the best-matching chunk.
search_results[0].page_content

"Places of articulation (passive and active):\n1. Exo-labial, 2. Endo-labial, 3. Dental, 4. Alveolar, 5. Post-alveolar, 6. Pre-palatal, 7. Palatal, 8. Velar, 9. Uvular, 10. Pharyngeal, 11. Glottal, 12. Epiglottal, 13. Radical, 14. Postero-dorsal, 15. Antero-dorsal, 16. Laminal, 17. Apical, 18. Sub-apical\nMonkeys, non-human apes and humans, like many other animals, have evolved specialised mechanisms for producing sound for purposes of social communication.[7] On the other hand, no monkey or ape uses its tongue for such purposes.[8][9] The human species' unprecedented use of the tongue, lips and other moveable parts seems to place speech in a quite separate category, making its evolutionary emergence an intriguing theoretical challenge in the eyes of many scholars.[10]"

In [16]:
# Run the similarity search again, this time getting (Document, score) tuples.
# For Chroma the score is a distance, so a lower value means a closer match.
docs_scores = db.similarity_search_with_score(query)
docs_scores

[(Document(id='13d290cd-4031-4ec8-934e-b1dc14d959df', metadata={'source': 'speech1.txt'}, page_content="Places of articulation (passive and active):\n1. Exo-labial, 2. Endo-labial, 3. Dental, 4. Alveolar, 5. Post-alveolar, 6. Pre-palatal, 7. Palatal, 8. Velar, 9. Uvular, 10. Pharyngeal, 11. Glottal, 12. Epiglottal, 13. Radical, 14. Postero-dorsal, 15. Antero-dorsal, 16. Laminal, 17. Apical, 18. Sub-apical\nMonkeys, non-human apes and humans, like many other animals, have evolved specialised mechanisms for producing sound for purposes of social communication.[7] On the other hand, no monkey or ape uses its tongue for such purposes.[8][9] The human species' unprecedented use of the tongue, lips and other moveable parts seems to place speech in a quite separate category, making its evolutionary emergence an intriguing theoretical challenge in the eyes of many scholars.[10]"),
  2618.8427734375),
 (Document(id='1e58c25c-7cb6-446e-ab6f-e7f92f8966eb', metadata={'source': 'speech1.txt'}, page

In [18]:
# Embed the query text explicitly, then search the store with the raw vector
# instead of the query string.
embedding_vector = embeddings.embed_query(query)
db.similarity_search_by_vector(embedding_vector)

[Document(id='13d290cd-4031-4ec8-934e-b1dc14d959df', metadata={'source': 'speech1.txt'}, page_content="Places of articulation (passive and active):\n1. Exo-labial, 2. Endo-labial, 3. Dental, 4. Alveolar, 5. Post-alveolar, 6. Pre-palatal, 7. Palatal, 8. Velar, 9. Uvular, 10. Pharyngeal, 11. Glottal, 12. Epiglottal, 13. Radical, 14. Postero-dorsal, 15. Antero-dorsal, 16. Laminal, 17. Apical, 18. Sub-apical\nMonkeys, non-human apes and humans, like many other animals, have evolved specialised mechanisms for producing sound for purposes of social communication.[7] On the other hand, no monkey or ape uses its tongue for such purposes.[8][9] The human species' unprecedented use of the tongue, lips and other moveable parts seems to place speech in a quite separate category, making its evolutionary emergence an intriguing theoretical challenge in the eyes of many scholars.[10]"),
 Document(id='1e58c25c-7cb6-446e-ab6f-e7f92f8966eb', metadata={'source': 'speech1.txt'}, page_content='Determining 

In [20]:
# Build a second Chroma store that is saved on disk under ./chroma_db.
# `docs` must be the full list of split chunks at this point; if another cell
# has rebound `docs` (for example to search results), only those documents
# are indexed here.
# NOTE(review): re-running this cell against an existing ./chroma_db appears
# to add the same documents again; confirm, and clear the directory if so.
vectordb = Chroma.from_documents(
    documents=docs,
    embedding=embeddings,
    persist_directory="./chroma_db",
)

In [24]:
# Wrap the persisted store in a retriever.
retriever = vectordb.as_retriever()

# Use a dedicated name for the retrieved documents. Rebinding `docs` (the list
# of split chunks) here would mean that re-running the cell which builds
# `vectordb` from `docs` indexes only these retrieved results.
retrieved_docs = retriever.invoke(query)

# Text of the top-ranked retrieved chunk.
retrieved_docs[0].page_content

"Places of articulation (passive and active):\n1. Exo-labial, 2. Endo-labial, 3. Dental, 4. Alveolar, 5. Post-alveolar, 6. Pre-palatal, 7. Palatal, 8. Velar, 9. Uvular, 10. Pharyngeal, 11. Glottal, 12. Epiglottal, 13. Radical, 14. Postero-dorsal, 15. Antero-dorsal, 16. Laminal, 17. Apical, 18. Sub-apical\nMonkeys, non-human apes and humans, like many other animals, have evolved specialised mechanisms for producing sound for purposes of social communication.[7] On the other hand, no monkey or ape uses its tongue for such purposes.[8][9] The human species' unprecedented use of the tongue, lips and other moveable parts seems to place speech in a quite separate category, making its evolutionary emergence an intriguing theoretical challenge in the eyes of many scholars.[10]"