In [None]:
import pandas as pd
from src.rag import RAGPipeline
from pathlib import Path

# Build the retrieval-augmented generation pipeline from the persisted
# vector-store artifacts (paths are relative to the notebook's working directory).
index_file = Path("../vectorstore/faiss_index.bin")
metadata_file = Path("../vectorstore/metadata.parquet")
rag = RAGPipeline(index_path=index_file, metadata_path=metadata_file)

# Fixed set of questions sent to the pipeline for the qualitative evaluation.
# Order matters: it determines the row order of the generated report.
questions = [
    "What are the most common issues with credit cards?",
    "How are customers complaining about late fees?",
    "What problems do users report with the mobile app?",
    "Which product has the most complaints about billing errors?",
    "Are there any security concerns mentioned in complaints?",
]

# Run evaluation
EXCERPT_CHARS = 200  # maximum number of excerpt characters kept in the report


def _build_eval_row(question, result):
    """Flatten one pipeline response into a row of the evaluation table.

    Args:
        question: The question text that was sent to the pipeline.
        result: The mapping returned by ``rag.query``; it is read through its
            ``"answer"`` and ``"sources"`` keys, and the first source through
            its ``"product"`` and ``"excerpt"`` keys.

    Returns:
        A dict with the report columns ``Question``, ``Answer``, ``Product``,
        ``Key Excerpt`` and ``Score``.
    """
    sources = result["sources"]
    if sources:
        top_source = sources[0]
        product = top_source["product"]
        excerpt = top_source["excerpt"]
        # Only mark the excerpt with an ellipsis when text was actually cut off.
        if len(excerpt) > EXCERPT_CHARS:
            excerpt = excerpt[:EXCERPT_CHARS] + "..."
    else:
        # In case a query comes back without any sources, keep the row with
        # empty source columns instead of aborting the run on sources[0].
        product = None
        excerpt = ""
    return {
        "Question": question,
        "Answer": result["answer"],
        "Product": product,
        "Key Excerpt": excerpt,
        "Score": None,  # Filled in by hand during manual review
    }


results = [_build_eval_row(question, rag.query(question)) for question in questions]

# Create evaluation dataframe
eval_df = pd.DataFrame(results)
report_path = Path("../docs/rag_evaluation.md")
# Make sure the target directory exists so the write does not fail on a fresh checkout.
report_path.parent.mkdir(parents=True, exist_ok=True)
eval_df.to_markdown(report_path, index=False)