In [1]:
from langchain_community.document_loaders import TextLoader
from langchain_community.vectorstores import FAISS
from langchain_community.embeddings import OllamaEmbeddings
from langchain_text_splitters import CharacterTextSplitter

# Read the speech transcript from disk as LangChain Document objects.
loader = TextLoader(file_path="speech.txt")
documents = loader.load()

# Break the transcript into chunks (target size 1000, overlap 30) so each
# chunk can be embedded and indexed on its own.
text_splitter = CharacterTextSplitter(
    chunk_size=1000,
    chunk_overlap=30,
)
docs = text_splitter.split_documents(documents=documents)

In [2]:
# Embedding model served by a local Ollama instance.
# NOTE(review): the saved output echoes this line, which looks like a warning
# (possibly a deprecation notice for this class) — confirm before relying on it.
embeddings = OllamaEmbeddings(model="gemma:2b")

# Embed every chunk in `docs` and build a FAISS vector store from them.
db = FAISS.from_documents(documents=docs, embedding=embeddings)

# Display the vector store object.
db

  embeddings=OllamaEmbeddings(model="gemma:2b")


<langchain_community.vectorstores.faiss.FAISS at 0x151da6fac20>

In [3]:
# Natural-language question to run against the FAISS index.
query = "How does the speaker describe the desired outcome of the war?"

# Keep the hits under their own name instead of reassigning `docs`: `docs`
# holds the chunks the index is built from, so overwriting it would make the
# index-building cell silently build from search hits if it were re-run.
similar_docs = db.similarity_search(query)

# Show the text of the best-matching chunk.
similar_docs[0].page_content

'…\n\nIt will be all the easier for us to conduct ourselves as belligerents in a high spirit of right and fairness because we act without animus, not in enmity toward a people or with the desire to bring any injury or disadvantage upon them, but only in armed opposition to an irresponsible government which has thrown aside all considerations of humanity and of right and is running amuck. We are, let me say again, the sincere friends of the German people, and shall desire nothing so much as the early reestablishment of intimate relations of mutual advantage between us—however hard it may be for them, for the time being, to believe that this is spoken from our hearts.'

In [4]:
# Wrap the vector store in the retriever interface so it can be queried
# with `.invoke(...)`.
retriever = db.as_retriever()

# Keep the retrieved documents under their own name instead of reassigning
# `docs`: `docs` holds the chunks the index is built from, so overwriting it
# would break a re-run of the index-building cell.
retrieved_docs = retriever.invoke(query)

# Show the text of the top retrieved chunk.
retrieved_docs[0].page_content

'…\n\nIt will be all the easier for us to conduct ourselves as belligerents in a high spirit of right and fairness because we act without animus, not in enmity toward a people or with the desire to bring any injury or disadvantage upon them, but only in armed opposition to an irresponsible government which has thrown aside all considerations of humanity and of right and is running amuck. We are, let me say again, the sincere friends of the German people, and shall desire nothing so much as the early reestablishment of intimate relations of mutual advantage between us—however hard it may be for them, for the time being, to believe that this is spoken from our hearts.'

In [5]:
# Same search as before, but each hit comes back as a (Document, score) pair.
# Per the LangChain FAISS docs the score is an L2 distance, so a lower value
# means a closer match.
docs_and_score = db.similarity_search_with_score(query=query)

# Display all (Document, score) pairs.
docs_and_score

[(Document(id='7cbe9e6f-6670-4e09-85d9-284eae3c6115', metadata={'source': 'speech.txt'}, page_content='…\n\nIt will be all the easier for us to conduct ourselves as belligerents in a high spirit of right and fairness because we act without animus, not in enmity toward a people or with the desire to bring any injury or disadvantage upon them, but only in armed opposition to an irresponsible government which has thrown aside all considerations of humanity and of right and is running amuck. We are, let me say again, the sincere friends of the German people, and shall desire nothing so much as the early reestablishment of intimate relations of mutual advantage between us—however hard it may be for them, for the time being, to believe that this is spoken from our hearts.'),
  2940.6172),
 (Document(id='01272a8e-c747-413e-b8ed-52b3293dee8a', metadata={'source': 'speech.txt'}, page_content='It is a distressing and oppressive duty, gentlemen of the Congress, which I have performed in thus addr

In [6]:
# Embed the query text directly to inspect the raw vector (a list of floats).
embedding_vector = embeddings.embed_query(text=query)

# Display the full embedding vector.
embedding_vector

[0.31795307993888855,
 -2.140655517578125,
 0.27908188104629517,
 1.0014718770980835,
 0.6126188635826111,
 0.5618122816085815,
 -0.9133124351501465,
 0.11938159912824631,
 -0.07714525610208511,
 -0.7931925654411316,
 1.118130087852478,
 -0.04589167237281799,
 -1.0918283462524414,
 1.0698192119598389,
 0.04507961496710777,
 -1.024010419845581,
 3.0880439281463623,
 1.722328782081604,
 1.165444016456604,
 0.7492797374725342,
 0.312674880027771,
 -0.28908148407936096,
 0.31421661376953125,
 1.4012460708618164,
 0.19737887382507324,
 -0.3814530372619629,
 -1.3764407634735107,
 -1.2622896432876587,
 -0.5816783905029297,
 -2.1050291061401367,
 -0.2831632196903229,
 -1.4254580736160278,
 1.2106008529663086,
 -0.9503772854804993,
 -0.4175291657447815,
 -0.24053360521793365,
 1.8830140829086304,
 0.5564766526222229,
 0.18502338230609894,
 -0.5303439497947693,
 0.34733396768569946,
 0.5402993559837341,
 0.9508274793624878,
 -1.3186930418014526,
 -1.3478591442108154,
 0.6065159440040588,
 0.0390

In [7]:
# Persist the FAISS index to the local "faiss_index" folder so it can be
# reloaded later without re-embedding the documents.
db.save_local(folder_path="faiss_index")

In [8]:
# Reload the index written by `db.save_local("faiss_index")`.
# SECURITY: `allow_dangerous_deserialization=True` opts in to loading
# pickle-backed data, which can execute arbitrary code. Acceptable here only
# because this notebook wrote the folder itself; never enable it for an index
# obtained from an untrusted source.
new_db = FAISS.load_local(
    folder_path="faiss_index",
    embeddings=embeddings,
    allow_dangerous_deserialization=True,
)

# Run the same query against the reloaded index; the next cell displays `docs`.
docs = new_db.similarity_search(query=query)

In [9]:
# Display the documents returned by the search against the reloaded index.
docs

[Document(id='7cbe9e6f-6670-4e09-85d9-284eae3c6115', metadata={'source': 'speech.txt'}, page_content='…\n\nIt will be all the easier for us to conduct ourselves as belligerents in a high spirit of right and fairness because we act without animus, not in enmity toward a people or with the desire to bring any injury or disadvantage upon them, but only in armed opposition to an irresponsible government which has thrown aside all considerations of humanity and of right and is running amuck. We are, let me say again, the sincere friends of the German people, and shall desire nothing so much as the early reestablishment of intimate relations of mutual advantage between us—however hard it may be for them, for the time being, to believe that this is spoken from our hearts.'),
 Document(id='01272a8e-c747-413e-b8ed-52b3293dee8a', metadata={'source': 'speech.txt'}, page_content='It is a distressing and oppressive duty, gentlemen of the Congress, which I have performed in thus addressing you. Ther