## Setup and Installation

In [None]:
!pip install -r ../requirements.txt

## Download Hansard Reports

In [None]:
from src.data_downloader import download_hansard_reports
from datetime import datetime

# Date range handed to the downloader as its (start, end) arguments
start_date, end_date = (
    datetime(year=2024, month=6, day=17),
    datetime(year=2024, month=6, day=19),
)

# Announce the range, then fetch the reports; the result is kept for the
# extraction step, which iterates over it
print(f"Downloading Hansard reports from {start_date} to {end_date}...")
downloaded_report_paths = download_hansard_reports(start_date, end_date)

## Extract Relevant Text

In [None]:
from src.text_extractor import extract_relevant_text

# Topic passed to the extractor for every report
topic = "Climate change"

# Run the extractor lazily over the downloaded reports and keep the first
# truthy result; reports after the first hit are never processed.
# Falls back to None when no report yields anything.
extraction_attempts = (
    extract_relevant_text(path, topic, use_embeddings=True, top_k=5)
    for path in downloaded_report_paths
)
relevant_text = next(filter(None, extraction_attempts), None)

if not relevant_text:
    print(f"No relevant text found for the topic '{topic}'.")
else:
    # Preview only: the slice caps the output at the first 1000 characters
    print(f"Extracted text: {relevant_text[:1000]}...")


## Generate and Compare Summaries

In [None]:
from src.model_comparison import compare_llm_summaries

# Reference text forwarded to the comparison as `reference_summary`
# (optional; intended for ROUGE-L evaluation).
# NOTE(review): the value below reads like placeholder text; swap in a real
# reference summary before relying on the scores.
reference_summary = "This is a well-crafted reference summary for the topic."

# Keyword settings for the comparison call, gathered in one place
comparison_options = {
    "length": "medium",
    "reference_summary": reference_summary,
}

# Only run the comparison when the extraction step produced some text
if relevant_text:
    print("Generating and comparing summaries from different models...")
    compare_llm_summaries(relevant_text, topic, **comparison_options)


## CLI Example

In [None]:
# Demonstrate the equivalent run through the command-line script ../main.py.
# The flag values repeat the ones used in the cells above: the same date range,
# topic, "medium" summary length, and reference summary text.
# NOTE(review): `python` is resolved by the shell and may not be the interpreter
# backing this kernel; confirm both point at the same environment.
!python ../main.py --start_date 2024-06-17 --end_date 2024-06-19 --topic "Climate change" --summary_length "medium" --reference_summary "This is a well-crafted reference summary for the topic."
