In [2]:
from langchain_community.document_loaders import TextLoader
from langchain.vectorstores import FAISS
from langchain.embeddings import OllamaEmbeddings
from langchain_text_splitters import CharacterTextSplitter


# Load the speech transcript from disk. The encoding is given explicitly
# because the text contains non-ASCII punctuation (an em dash); without it,
# decoding depends on the platform's default encoding and can fail or produce
# mojibake on systems whose default is not UTF-8.
loader = TextLoader("Speech.txt", encoding="utf-8")
doc = loader.load()

# Break the loaded document into smaller chunks for embedding.
# NOTE(review): the recorded output shows paragraph-sized chunks, some of which
# appear longer than 200 characters, so chunk_size looks like a target rather
# than a hard cap with this splitter -- confirm against the splitter docs.
text_splitter = CharacterTextSplitter(chunk_size=200, chunk_overlap=30)
docs = text_splitter.split_documents(doc)

# Display the resulting chunks.
docs




[Document(metadata={'source': 'Speech.txt'}, page_content='Speech on AI: The Future is Here\n\nGood [morning/afternoon/evening] everyone,'),
 Document(metadata={'source': 'Speech.txt'}, page_content='Artificial Intelligence is no longer just science fiction—it is shaping our world today. From personal assistants like Siri to self-driving cars, AI is transforming how we live, work, and connect.'),
 Document(metadata={'source': 'Speech.txt'}, page_content='Businesses use AI for automation, boosting efficiency and innovation. Healthcare benefits from AI-driven diagnoses, improving patient care. Even creative fields, like music and art, are evolving with AI-powered tools.'),
 Document(metadata={'source': 'Speech.txt'}, page_content='However, AI also raises ethical questions. Bias, privacy concerns, and job displacement must be addressed responsibly. AI should serve humanity, not replace it.'),
 Document(metadata={'source': 'Speech.txt'}, page_content='The future of AI depends on how we dev

In [4]:
# Embedding backend served by Ollama. The model is named explicitly rather
# than relying on the library's default (the original note says the default
# is a llama model).
# NOTE(review): "deepseek-r1:8b" looks like a chat/reasoning model rather than
# a dedicated embedding model -- confirm this is the intended choice.
embeddings = OllamaEmbeddings(model="deepseek-r1:8b")

# Embed every chunk in `docs` and build a FAISS store over the vectors.
vectorstore = FAISS.from_documents(documents=docs, embedding=embeddings)
vectorstore

<langchain_community.vectorstores.faiss.FAISS at 0x10c962550>

In [6]:
# Query
# Ask the store for the two chunks most similar to the search text.
# Note that `query` holds the returned documents, not the search string.
search_text = "AI"
query = vectorstore.similarity_search(search_text, k=2)

# Print the text of the best match.
best_match = query[0]
print(best_match.page_content)

Businesses use AI for automation, boosting efficiency and innovation. Healthcare benefits from AI-driven diagnoses, improving patient care. Even creative fields, like music and art, are evolving with AI-powered tools.


In [10]:
# Retriever
# Expose the vector store through the retriever interface and run the same
# lookup through it.
retriever = vectorstore.as_retriever()
d = retriever.invoke("AI")

# Show the text of the first document returned.
first_doc = d[0]
first_doc.page_content

'Businesses use AI for automation, boosting efficiency and innovation. Healthcare benefits from AI-driven diagnoses, improving patient care. Even creative fields, like music and art, are evolving with AI-powered tools.'

In [11]:
# Same search, but each hit comes back as a (Document, score) pair.
# NOTE(review): in the recorded output the scores increase down the list, which
# suggests the score is a distance (lower = closer) -- confirm the metric.
doc_score = vectorstore.similarity_search_with_score(query="AI")
doc_score

[(Document(id='eb8a9f63-e0dd-4099-90e7-eb82f9a086c1', metadata={'source': 'Speech.txt'}, page_content='Businesses use AI for automation, boosting efficiency and innovation. Healthcare benefits from AI-driven diagnoses, improving patient care. Even creative fields, like music and art, are evolving with AI-powered tools.'),
  30644.402),
 (Document(id='0358fe1a-385f-4403-b1a5-e38166d25cda', metadata={'source': 'Speech.txt'}, page_content='However, AI also raises ethical questions. Bias, privacy concerns, and job displacement must be addressed responsibly. AI should serve humanity, not replace it.'),
  31359.42),
 (Document(id='e4decfc9-8a06-41f0-b5cc-33981655c190', metadata={'source': 'Speech.txt'}, page_content='The future of AI depends on how we develop and regulate it. We must ensure it remains a tool for progress, equality, and empowerment.'),
  32638.684),
 (Document(id='ac8714a6-4283-4b80-a417-4f9608f321ee', metadata={'source': 'Speech.txt'}, page_content='Artificial Intelligence i

In [13]:
# Embed the bare query string to inspect the raw vector the model produces
# (a list of floats, per the recorded output).
embed_vector = embeddings.embed_query(text="AI")
embed_vector

[-3.3423171043395996,
 -1.93832266330719,
 3.1171646118164062,
 -3.7407798767089844,
 2.1142737865448,
 -2.757006883621216,
 0.12485199421644211,
 0.06450057029724121,
 0.28402212262153625,
 2.170238494873047,
 -1.1399246454238892,
 -0.4621748626232147,
 1.2554938793182373,
 -1.1430515050888062,
 2.6709184646606445,
 0.15376894176006317,
 -0.6436708569526672,
 1.6188633441925049,
 1.1797330379486084,
 -0.3985511362552643,
 -1.9567934274673462,
 1.8848602771759033,
 0.5666308999061584,
 0.5359656810760498,
 1.8237156867980957,
 0.7405449748039246,
 1.228162407875061,
 1.8849552869796753,
 1.019057273864746,
 -3.7137057781219482,
 -2.7918479442596436,
 3.344459295272827,
 -1.0481278896331787,
 2.136749505996704,
 -3.0121567249298096,
 0.11036760360002518,
 1.9039490222930908,
 1.0650299787521362,
 -1.6134910583496094,
 -1.6278598308563232,
 -0.25733697414398193,
 -4.796111106872559,
 -4.149754524230957,
 -1.1664303541183472,
 -0.20868244767189026,
 -0.6563511490821838,
 1.380079507827758

In [14]:
# Persist the vector store to the local "faiss_index" path so it can be
# reloaded later without re-embedding the documents.
vectorstore.save_local(folder_path="faiss_index")

In [18]:
# Reload the store saved under "faiss_index", using the same embeddings object
# so that queries are embedded the same way as the stored chunks.
# SECURITY: allow_dangerous_deserialization=True opts in to unpickling the
# saved data. That is acceptable here because this notebook wrote the files
# itself; never enable it for an index obtained from an untrusted source.
new_df = FAISS.load_local(
    folder_path="faiss_index",
    embeddings=embeddings,
    allow_dangerous_deserialization=True,
)

# Run the search against the reloaded store to confirm the round trip.
docx = new_df.similarity_search(query="AI")
docx

[Document(id='eb8a9f63-e0dd-4099-90e7-eb82f9a086c1', metadata={'source': 'Speech.txt'}, page_content='Businesses use AI for automation, boosting efficiency and innovation. Healthcare benefits from AI-driven diagnoses, improving patient care. Even creative fields, like music and art, are evolving with AI-powered tools.'),
 Document(id='0358fe1a-385f-4403-b1a5-e38166d25cda', metadata={'source': 'Speech.txt'}, page_content='However, AI also raises ethical questions. Bias, privacy concerns, and job displacement must be addressed responsibly. AI should serve humanity, not replace it.'),
 Document(id='e4decfc9-8a06-41f0-b5cc-33981655c190', metadata={'source': 'Speech.txt'}, page_content='The future of AI depends on how we develop and regulate it. We must ensure it remains a tool for progress, equality, and empowerment.'),
 Document(id='ac8714a6-4283-4b80-a417-4f9608f321ee', metadata={'source': 'Speech.txt'}, page_content='Artificial Intelligence is no longer just science fiction—it is shapin