In [2]:
# Import necessary libraries
import os
from dotenv import load_dotenv
from llama_index.core import VectorStoreIndex, SimpleDirectoryReader

from llama_index.core import Settings
from llama_index.core.callbacks import CallbackManager
from langfuse.llama_index import LlamaIndexCallbackHandler

langfuse_callback_handler = LlamaIndexCallbackHandler(
  public_key= os.getenv("LANGFUSE_PUBLIC_KEY"),
  secret_key= os.getenv("LANGFUSE_SECRET_KEY"),
  host="https://us.cloud.langfuse.com"
)
Settings.callback_manager = CallbackManager([langfuse_callback_handler])

# Load environment variables
load_dotenv()

# Load documents from a directory (you can change this path as needed)
documents = SimpleDirectoryReader("data").load_data()

# Create an index from the documents
index = VectorStoreIndex.from_documents(documents)

# Create a query engine
query_engine = index.as_query_engine()

# Example query
response = query_engine.query("What years does the strategic plan cover?")

print(response)

The strategic plan covers the years 2024 to 2028.


In [3]:
print(documents)
print(index)

[Document(id_='035a3b72-495a-4e05-b245-6a47d4968147', embedding=None, metadata={'page_label': '1', 'file_name': 'CodePath strategic plan.pdf', 'file_path': '/Users/sahila/workbench/codepath-ai/lab2/data/CodePath strategic plan.pdf', 'file_type': 'application/pdf', 'file_size': 1452743, 'creation_date': '2024-09-16', 'last_modified_date': '2024-09-16'}, excluded_embed_metadata_keys=['file_name', 'file_type', 'file_size', 'creation_date', 'last_modified_date', 'last_accessed_date'], excluded_llm_metadata_keys=['file_name', 'file_type', 'file_size', 'creation_date', 'last_modified_date', 'last_accessed_date'], relationships={}, text='CodePath\n2024-28\nStrategic\nPlan\n+\nAppendices\n(V1\n|\n04.23.24)\nExecutive\nSummary\nProblem\nSolution\nImpact\nand\nEvidence\nTo\nDate\nIntroduction\nto\nthe\n2024-28\nPlan\nPillar\n1:\nScale\nNationally\nin\nBreadth,\nand\nRegionally\nin\nDepth\nPillar\n2:\nImprove\nEffectiveness\nWhile\nReducing\nCosts\nPillar\n3:\nDevelop\nSustainable\nSources\nof\nR