In [1]:
import pandas as pd
import os
# Move the working directory two levels up (presumably to the project root, so
# that relative paths like "data/evaluation_set.csv" resolve -- TODO confirm).
# A bare relative chdir is not idempotent: re-running this cell would climb two
# more levels every time. Record the directory in effect on the first run and
# always resolve the move against that anchor instead.
if "_NOTEBOOK_START_DIR" not in globals():
    _NOTEBOOK_START_DIR = os.getcwd()
os.chdir(os.path.join(_NOTEBOOK_START_DIR, "..", ".."))

def load_evaluation_data(csv_file_path: str = "data/evaluation_set.csv") -> dict:
    """Read an evaluation CSV and return its questions and reference answers.

    The file is parsed with ``pandas.read_csv``. It must expose both a
    "question" column and a "ground_truth" column; every other column is
    ignored.

    Args:
        csv_file_path (str): Location of the evaluation CSV. A relative path
            is resolved against the current working directory.

    Returns:
        dict: Two parallel lists in file row order:
            - "questions": values of the "question" column.
            - "ground_truths": values of the "ground_truth" column.

    Raises:
        ValueError: If either required column is absent from the CSV.
    """
    frame = pd.read_csv(csv_file_path)

    # Validate the schema up front so a bad file fails with a clear message
    # rather than a KeyError on column access.
    required_columns = ("question", "ground_truth")
    if not all(column in frame.columns for column in required_columns):
        raise ValueError("The CSV file must contain 'question' and 'ground_truth' columns.")

    return {
        "questions": frame["question"].tolist(),
        "ground_truths": frame["ground_truth"].tolist(),
    }


In [2]:
# Smoke-check the loader using its default path ("data/evaluation_set.csv",
# resolved against the current working directory); the returned dict is shown
# as the cell output.
load_evaluation_data()

{'questions': ['What upcoming animated project will feature Adam West and Burt Ward reprising their roles as Batman and Robin?',
  'What animated project did Adam West and Burt Ward announce at the Mad Monster Party in Charlotte, NC?',
  'What event is Rory McIlroy preparing for after the WGC-Cadillac Championship?',
  'How did Donald Trump help Rory McIlroy retrieve his golf club?',
  'What caused the collapse of the Iraqi army during the ISIS offensive in 2014?'],
 'ground_truths': ["Adam West and Burt Ward will be reprising their roles as Batman and Robin in an upcoming animated 'Batman' full length, 90-minute feature, which will be released on the 50th anniversary of the 1960s Batman TV series.",
  "Adam West and Burt Ward announced a new animated 'Batman' full length, 90-minute feature at the Mad Monster Party in Charlotte, NC.",
  'Rory McIlroy is preparing for the U.S. Masters at Augusta next month.',
  'Donald Trump helped Rory McIlroy retrieve his golf club by getting a scuba 