In [3]:
import os
import sys
from dotenv import load_dotenv

from langchain_experimental.text_splitter import SemanticChunker
from langchain_google_genai import GoogleGenerativeAIEmbeddings
from langchain_community.vectorstores import FAISS
from langchain.document_loaders import PyPDFLoader
from langchain_cohere import CohereEmbeddings

# Read environment variables from a local .env file before any API client is built.
# NOTE(review): presumably this is where the Cohere API key comes from — confirm.
load_dotenv()

# Single embedding model reused by the semantic splitter and the FAISS index below.
base_embeddings = CohereEmbeddings(model="embed-english-light-v3.0")

In [4]:
# Load the source PDF (path is relative to the notebook's working directory).
# loader.load() yields the Document objects consumed by the splitter below
# (presumably one Document per PDF page — confirm against the PyPDFLoader docs).
loader = PyPDFLoader("data/Understanding_Climate_Change.pdf")
docs = loader.load()

In [5]:
# Semantic splitter driven by the shared embedding model. With the "percentile"
# strategy and an amount of 90, a chunk boundary is placed where the embedding
# distance between neighbouring sentences exceeds the 90th percentile
# (per the SemanticChunker documentation — verify if the library version changes).
text_splitter = SemanticChunker(
    base_embeddings,
    breakpoint_threshold_type="percentile",
    breakpoint_threshold_amount=90,
)

In [6]:
# Re-split the loaded documents into chunks using the semantic splitter configured above.
splitted_docs = text_splitter.split_documents(docs)

In [7]:
# Build the FAISS index from the semantic chunks (`splitted_docs`), not from the
# raw page-level `docs`; otherwise the SemanticChunker output is never used and
# retrieval returns whole pages instead of semantically coherent chunks.
vectorstore = FAISS.from_documents(splitted_docs, base_embeddings)

# Retriever that returns the 2 most similar chunks for each query.
chunks_query_retriever = vectorstore.as_retriever(search_kwargs={"k": 2})

In [9]:
# Smoke-test the retriever with a sample question.
test_query = "What is the main cause of climate change?"

# Fetch the top matches for the question.
retrieved = chunks_query_retriever.invoke(test_query)

# Keep only the text of each hit for display.
context = [hit.page_content for hit in retrieved]

In [10]:
# Print every retrieved passage under a 1-based "Context N:" heading,
# followed by blank lines as a visual separator.
for position, passage in enumerate(context, start=1):
    print(f"Context {position}:")
    print(passage)
    print("\n")

Context 1:
Understanding Climate Change 
Chapter 1: Introduction to Climate Change 
Climate change refers to significant, long-term changes in the global climate. The term 
"global climate" encompasses the planet's overall weather patterns, including temperature, 
precipitation, and wind patterns, over an extended period. Over the past century, human 
activities, particularly the burning of fossil fuels and deforestation, have significantly 
contributed to climate change. 
Historical Context 
The Earth's climate has changed throughout history. Over the past 650,000 years, there have 
been seven cycles of glacial advance and retreat, with the abrupt end of the last ice age about 
11,700 years ago marking the beginning of the modern climate era and human civilization. 
Most of these climate changes are attributed to very small variations in Earth's orbit that 
change the amount of solar energy our planet receives. During the Holocene epoch, which 
began at the end of the last ice age, hu