In [None]:
import os
from dotenv import load_dotenv
# Load variables from a local .env file into the process environment;
# a later cell reads HUGGINGFACE_TOKEN from it via os.getenv.
load_dotenv()

# LangChain building blocks used below: file loader, text splitter,
# Hugging Face embedding wrapper and the Chroma vector store.
from langchain_community.document_loaders import TextLoader
from langchain_text_splitters import RecursiveCharacterTextSplitter
from langchain_huggingface import HuggingFaceEmbeddings
from langchain_chroma import Chroma

In [4]:
# Re-export the Hugging Face token into the process environment.
# os.getenv returns None when the variable is missing, and os.environ only
# accepts str values (assigning None raises TypeError), so only write it back
# when a token was actually found.
hf_token = os.getenv('HUGGINGFACE_TOKEN')
if hf_token is not None:
    os.environ['HUGGINGFACE_TOKEN'] = hf_token

In [5]:
# Read the speech text file from the sibling lesson folder into LangChain
# Document objects.
speech_path = '../1.3-textsplitter/speech.txt'
loader = TextLoader(speech_path)
docs = loader.load()

In [6]:
# Echo the loaded documents (metadata + full page_content) as the cell output.
docs

[Document(metadata={'source': '../1.3-textsplitter/speech.txt'}, page_content='Machine Learning and Generative AI: Shaping the Future of Intelligence\nThe last decade has witnessed an unprecedented surge in the advancement of artificial intelligence (AI), driven largely by the breakthroughs in machine learning (ML) and the explosive growth of generative AI. Together, these technologies are not just changing how machines process information—they\'re transforming entire industries, reshaping creative processes, and redefining the boundaries between human and machine capabilities.\n\nIn this blog, we’ll explore what machine learning is, how generative AI fits into the larger AI ecosystem, their real-world applications, and what the future holds.\n\nWhat is Machine Learning?\nMachine learning is a subset of artificial intelligence that enables machines to learn from data and improve their performance without being explicitly programmed. Instead of following hard-coded instructions, ML algo

In [7]:
# Cut the loaded documents into chunks of at most 500 characters, with a
# 50-character overlap between neighbouring chunks.
text_splitters = RecursiveCharacterTextSplitter(
    chunk_size=500,
    chunk_overlap=50,
)
splits = text_splitters.split_documents(docs)

In [9]:
# Preview the first five chunks produced by the splitter.
splits[:5]

[Document(metadata={'source': '../1.3-textsplitter/speech.txt'}, page_content='Machine Learning and Generative AI: Shaping the Future of Intelligence'),
 Document(metadata={'source': '../1.3-textsplitter/speech.txt'}, page_content="The last decade has witnessed an unprecedented surge in the advancement of artificial intelligence (AI), driven largely by the breakthroughs in machine learning (ML) and the explosive growth of generative AI. Together, these technologies are not just changing how machines process information—they're transforming entire industries, reshaping creative processes, and redefining the boundaries between human and machine capabilities."),
 Document(metadata={'source': '../1.3-textsplitter/speech.txt'}, page_content='In this blog, we’ll explore what machine learning is, how generative AI fits into the larger AI ecosystem, their real-world applications, and what the future holds.\n\nWhat is Machine Learning?\nMachine learning is a subset of artificial intelligence th

In [None]:
# Embeddings using Hugging Face
embedding_model = 'all-MiniLM-L6-v2'
embeddings = HuggingFaceEmbeddings(model=embedding_model)

  from .autonotebook import tqdm as notebook_tqdm


In [11]:
# Embed a single sample sentence to sanity-check the embedding model.
text = (
    "Machine Learning and Generative AI: Shaping the Future of Intelligence"
)
query_result = embeddings.embed_query(text=text)

In [12]:
# Echo the embedding returned by embed_query (a list of floats).
query_result

[-0.05351195111870766,
 -0.013099039904773235,
 0.116485595703125,
 -0.027270670980215073,
 -0.041483357548713684,
 0.01757950335741043,
 -0.029203588142991066,
 -0.03915770724415779,
 -0.04861374944448471,
 0.02509899064898491,
 -0.027181310579180717,
 -0.03709578886628151,
 0.00399068184196949,
 -0.024972550570964813,
 -0.06034812331199646,
 0.01933102495968342,
 0.008461285382509232,
 -0.013423248194158077,
 -0.079146608710289,
 -0.08355256170034409,
 0.057936638593673706,
 0.033668261021375656,
 0.006824105978012085,
 -0.0698118656873703,
 -0.026086129248142242,
 0.035656824707984924,
 0.08228103071451187,
 -0.01616726629436016,
 0.01815248653292656,
 -0.07392267137765884,
 0.10216724127531052,
 0.039067480713129044,
 -0.04406827688217163,
 0.011656763963401318,
 -0.0374576598405838,
 0.07291632890701294,
 -0.021226124837994576,
 0.020076029002666473,
 0.08062448352575302,
 -0.033993910998106,
 0.03662258759140968,
 -0.06365561485290527,
 -0.003700646571815014,
 0.00275558978319168

In [None]:
# Embed every chunk with the Hugging Face model and index it in Chroma.
vector_store = Chroma.from_documents(documents=splits, embedding=embeddings)

In [18]:
# Inspect the underlying Chroma collection: its record count, then a sample
# of what is stored (this reaches into the private `_collection` attribute).
# NOTE(review): the saved output reports a single record containing the whole
# speech, which looks like it came from an earlier run that indexed `docs`
# rather than `splits` - re-run the notebook to refresh it.
chroma_collection = vector_store._collection
print(chroma_collection.count())
print(chroma_collection.peek())

1
{'ids': ['7dbceef2-a5f8-46a3-8e0d-0f5163e5985a'], 'embeddings': array([[-4.88554612e-02, -2.19461918e-02,  8.61539766e-02,
         1.93584450e-02,  4.46362831e-02, -8.14938080e-03,
        -7.33738244e-02, -3.86601388e-02, -3.99435200e-02,
         2.07947902e-02, -9.45010632e-02,  2.21419265e-03,
         1.15430504e-02, -2.43193172e-02, -4.52109240e-02,
        -1.30570531e-02,  3.48499715e-02,  6.60635903e-03,
        -7.59726167e-02, -1.00676477e-01,  6.97132871e-02,
         4.99609634e-02, -5.00909388e-02, -1.73939466e-02,
        -6.82357652e-03,  5.71046844e-02,  3.05477921e-02,
        -4.76579368e-02, -3.91794741e-02, -5.44107072e-02,
         4.47156653e-02, -1.91858541e-02, -1.83587316e-02,
         5.82472272e-02, -7.43660852e-02,  5.74566312e-02,
        -1.33156972e-02,  4.37478200e-02,  7.82778561e-02,
        -5.98911569e-02,  1.01269856e-02, -1.00630410e-01,
        -4.22973223e-02, -2.54733507e-02,  1.17233098e-01,
         4.29650843e-02, -3.11627928e-02, -7.7979

In [19]:
# Ask the vector store for the stored documents closest to a sample question.
query = "In supervised learning, the algorithm is trained on labeled data"
result = vector_store.similarity_search(query=query)

In [21]:
# Text of the first document returned by the similarity search.
result[0].page_content

'Machine Learning and Generative AI: Shaping the Future of Intelligence\nThe last decade has witnessed an unprecedented surge in the advancement of artificial intelligence (AI), driven largely by the breakthroughs in machine learning (ML) and the explosive growth of generative AI. Together, these technologies are not just changing how machines process information—they\'re transforming entire industries, reshaping creative processes, and redefining the boundaries between human and machine capabilities.\n\nIn this blog, we’ll explore what machine learning is, how generative AI fits into the larger AI ecosystem, their real-world applications, and what the future holds.\n\nWhat is Machine Learning?\nMachine learning is a subset of artificial intelligence that enables machines to learn from data and improve their performance without being explicitly programmed. Instead of following hard-coded instructions, ML algorithms find patterns in data and make predictions or decisions based on it.\n\

In [22]:
# Same search, but each hit comes back as a (Document, score) pair.
# NOTE(review): for Chroma the score is presumably a distance (lower = closer) - confirm.
vector_store.similarity_search_with_score(query)

[(Document(id='7dbceef2-a5f8-46a3-8e0d-0f5163e5985a', metadata={'source': '../1.3-textsplitter/speech.txt'}, page_content='Machine Learning and Generative AI: Shaping the Future of Intelligence\nThe last decade has witnessed an unprecedented surge in the advancement of artificial intelligence (AI), driven largely by the breakthroughs in machine learning (ML) and the explosive growth of generative AI. Together, these technologies are not just changing how machines process information—they\'re transforming entire industries, reshaping creative processes, and redefining the boundaries between human and machine capabilities.\n\nIn this blog, we’ll explore what machine learning is, how generative AI fits into the larger AI ecosystem, their real-world applications, and what the future holds.\n\nWhat is Machine Learning?\nMachine learning is a subset of artificial intelligence that enables machines to learn from data and improve their performance without being explicitly programmed. Instead o

In [23]:
# Expose the vector store through the retriever interface and run the same
# query through it. The variable keeps its original spelling because a later
# cell refers to it by this name.
retriver = vector_store.as_retriever()
retriver.invoke(input=query)

[Document(id='7dbceef2-a5f8-46a3-8e0d-0f5163e5985a', metadata={'source': '../1.3-textsplitter/speech.txt'}, page_content='Machine Learning and Generative AI: Shaping the Future of Intelligence\nThe last decade has witnessed an unprecedented surge in the advancement of artificial intelligence (AI), driven largely by the breakthroughs in machine learning (ML) and the explosive growth of generative AI. Together, these technologies are not just changing how machines process information—they\'re transforming entire industries, reshaping creative processes, and redefining the boundaries between human and machine capabilities.\n\nIn this blog, we’ll explore what machine learning is, how generative AI fits into the larger AI ecosystem, their real-world applications, and what the future holds.\n\nWhat is Machine Learning?\nMachine learning is a subset of artificial intelligence that enables machines to learn from data and improve their performance without being explicitly programmed. Instead of

In [24]:
# Text of the first document the retriever returns for the query.
top_match = retriver.invoke(query)[0]
top_match.page_content

'Machine Learning and Generative AI: Shaping the Future of Intelligence\nThe last decade has witnessed an unprecedented surge in the advancement of artificial intelligence (AI), driven largely by the breakthroughs in machine learning (ML) and the explosive growth of generative AI. Together, these technologies are not just changing how machines process information—they\'re transforming entire industries, reshaping creative processes, and redefining the boundaries between human and machine capabilities.\n\nIn this blog, we’ll explore what machine learning is, how generative AI fits into the larger AI ecosystem, their real-world applications, and what the future holds.\n\nWhat is Machine Learning?\nMachine learning is a subset of artificial intelligence that enables machines to learn from data and improve their performance without being explicitly programmed. Instead of following hard-coded instructions, ML algorithms find patterns in data and make predictions or decisions based on it.\n\