In [1]:
import os
from datasets import Dataset 
import pandas as pd
from ragas import evaluate
from ragas.metrics import faithfulness
from langchain_openai import OpenAIEmbeddings, ChatOpenAI

  from .autonotebook import tqdm as notebook_tqdm


In [2]:
# Chat model used as the LLM judge; its name is also used to label the score
# column written by the scoring cell.
MODEL = 'gpt-4o'
# Embeddings require a dedicated embedding model. 'gpt-4o' is a chat-completion
# model, so passing it to OpenAIEmbeddings would fail as soon as an embedding
# is actually requested.
EMBEDDING_MODEL = 'text-embedding-3-small'

# temperature=0 keeps the judge's answers as repeatable as the API allows.
llm = ChatOpenAI(model_name=MODEL, temperature=0)
embeddings = OpenAIEmbeddings(model=EMBEDDING_MODEL)

In [3]:
# Score every (source, summary) pair with the Ragas faithfulness metric and
# store the scores as an extra column of the annotation CSV.
CSV_PATH = '../assign/examples_to_annotate.csv'
SCORE_COLUMN = f'Ragas_{MODEL}'
# The same instruction is used as the "question" for every row, so build it once.
QUESTION = 'Provide a concise summary of the following passage, covering the core pieces of information described.'

df = pd.read_csv(CSV_PATH, encoding='utf-8')
scores = []
for index, row in df.iterrows():
    # A single-row dataset per example, so each summary gets its own score.
    data_sample = {
        'question': [QUESTION],
        'contexts': [[row['source']]],
        'answer': [row['summary']],
    }
    input_data = Dataset.from_dict(data_sample)
    score = evaluate(input_data, metrics=[faithfulness], llm=llm, embeddings=embeddings)
    print(score['faithfulness'])
    scores.append(score['faithfulness'])

# Plain assignment appends the column when it is new and overwrites it when the
# CSV already contains scores from an earlier run. df.insert() raised ValueError
# in that case, i.e. only after every evaluation had already been paid for.
df[SCORE_COLUMN] = scores
# NOTE(review): this overwrites the input file in place; confirm that is intended.
df.to_csv(CSV_PATH, mode='w', index=False, header=True)
            

Evaluating: 100%|██████████| 1/1 [00:18<00:00, 18.35s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:17<00:00, 17.82s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:09<00:00,  9.35s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:20<00:00, 20.88s/it]


{'faithfulness': 0.9000}


Evaluating: 100%|██████████| 1/1 [00:06<00:00,  6.05s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:19<00:00, 19.85s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:06<00:00,  6.50s/it]


{'faithfulness': 0.3333}


Evaluating: 100%|██████████| 1/1 [00:09<00:00,  9.12s/it]


{'faithfulness': 0.8889}


Evaluating: 100%|██████████| 1/1 [00:20<00:00, 20.90s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:06<00:00,  6.46s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:08<00:00,  8.23s/it]


{'faithfulness': 0.5556}


Evaluating: 100%|██████████| 1/1 [00:12<00:00, 12.87s/it]


{'faithfulness': 0.8333}


Evaluating: 100%|██████████| 1/1 [00:20<00:00, 20.27s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:15<00:00, 15.87s/it]


{'faithfulness': 0.9167}


Evaluating: 100%|██████████| 1/1 [00:15<00:00, 15.88s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:02<00:00,  2.94s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:20<00:00, 20.52s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:15<00:00, 15.16s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:11<00:00, 11.89s/it]


{'faithfulness': 0.7500}


Evaluating: 100%|██████████| 1/1 [00:07<00:00,  7.34s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:12<00:00, 12.31s/it]


{'faithfulness': 0.9000}


Evaluating: 100%|██████████| 1/1 [00:16<00:00, 16.94s/it]


{'faithfulness': 0.8333}


Evaluating: 100%|██████████| 1/1 [00:16<00:00, 16.91s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:23<00:00, 23.19s/it]


{'faithfulness': 0.9500}


Evaluating: 100%|██████████| 1/1 [00:17<00:00, 17.04s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:14<00:00, 14.79s/it]


{'faithfulness': 0.8667}


Evaluating: 100%|██████████| 1/1 [00:14<00:00, 14.61s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:23<00:00, 23.37s/it]


{'faithfulness': 0.8421}


Evaluating: 100%|██████████| 1/1 [00:13<00:00, 13.79s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:17<00:00, 17.34s/it]


{'faithfulness': 0.9412}


Evaluating: 100%|██████████| 1/1 [00:10<00:00, 10.82s/it]


{'faithfulness': 0.9167}


Evaluating: 100%|██████████| 1/1 [00:21<00:00, 21.40s/it]


{'faithfulness': 0.7222}


Evaluating: 100%|██████████| 1/1 [00:17<00:00, 17.80s/it]


{'faithfulness': 0.8889}


Evaluating: 100%|██████████| 1/1 [00:15<00:00, 15.06s/it]


{'faithfulness': 0.9333}


Evaluating: 100%|██████████| 1/1 [00:10<00:00, 10.27s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:21<00:00, 21.92s/it]


{'faithfulness': 0.9565}


Evaluating: 100%|██████████| 1/1 [00:17<00:00, 17.26s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:19<00:00, 19.54s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:21<00:00, 21.11s/it]


{'faithfulness': 0.7895}


Evaluating: 100%|██████████| 1/1 [00:14<00:00, 14.08s/it]


{'faithfulness': 0.8462}


Evaluating: 100%|██████████| 1/1 [00:11<00:00, 11.37s/it]


{'faithfulness': 0.6667}


Evaluating: 100%|██████████| 1/1 [00:09<00:00,  9.36s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:24<00:00, 24.70s/it]


{'faithfulness': 0.9655}


Evaluating: 100%|██████████| 1/1 [00:13<00:00, 13.91s/it]


{'faithfulness': 0.9231}


Evaluating: 100%|██████████| 1/1 [00:23<00:00, 23.35s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:12<00:00, 12.21s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:24<00:00, 24.28s/it]


{'faithfulness': 0.9474}


Evaluating: 100%|██████████| 1/1 [00:18<00:00, 18.47s/it]


{'faithfulness': 0.8421}


Evaluating: 100%|██████████| 1/1 [00:19<00:00, 19.33s/it]


{'faithfulness': 0.8824}


Evaluating: 100%|██████████| 1/1 [00:18<00:00, 18.49s/it]


{'faithfulness': 0.7778}


Evaluating: 100%|██████████| 1/1 [00:18<00:00, 18.44s/it]


{'faithfulness': 0.9286}


Evaluating: 100%|██████████| 1/1 [00:30<00:00, 30.43s/it]


{'faithfulness': 0.8857}


Evaluating: 100%|██████████| 1/1 [00:18<00:00, 18.36s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:12<00:00, 12.59s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:16<00:00, 16.66s/it]


{'faithfulness': 0.8333}


Evaluating: 100%|██████████| 1/1 [00:22<00:00, 22.38s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:19<00:00, 19.50s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:15<00:00, 15.19s/it]


{'faithfulness': 0.6667}


Evaluating: 100%|██████████| 1/1 [00:22<00:00, 22.15s/it]


{'faithfulness': 0.8667}


Evaluating: 100%|██████████| 1/1 [00:12<00:00, 12.43s/it]


{'faithfulness': 0.9091}


Evaluating: 100%|██████████| 1/1 [00:28<00:00, 28.46s/it]


{'faithfulness': 0.8500}


Evaluating: 100%|██████████| 1/1 [00:13<00:00, 13.53s/it]


{'faithfulness': 0.6667}


Evaluating: 100%|██████████| 1/1 [00:16<00:00, 16.30s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:19<00:00, 19.45s/it]


{'faithfulness': 0.9412}


Evaluating: 100%|██████████| 1/1 [00:11<00:00, 11.46s/it]


{'faithfulness': 0.8182}


Evaluating: 100%|██████████| 1/1 [00:24<00:00, 24.99s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:17<00:00, 17.98s/it]


{'faithfulness': 0.9412}


Evaluating: 100%|██████████| 1/1 [00:15<00:00, 15.47s/it]


{'faithfulness': 0.7857}


Evaluating: 100%|██████████| 1/1 [00:14<00:00, 14.76s/it]


{'faithfulness': 0.9167}


Evaluating: 100%|██████████| 1/1 [00:13<00:00, 13.92s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:20<00:00, 20.33s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:18<00:00, 18.52s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:21<00:00, 21.40s/it]


{'faithfulness': 0.9524}


Evaluating: 100%|██████████| 1/1 [00:39<00:00, 39.05s/it]


{'faithfulness': 0.7857}


Evaluating: 100%|██████████| 1/1 [00:13<00:00, 13.90s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:23<00:00, 23.12s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:20<00:00, 20.81s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:10<00:00, 10.20s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:09<00:00,  9.47s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:19<00:00, 19.24s/it]


{'faithfulness': 0.8824}


Evaluating: 100%|██████████| 1/1 [00:17<00:00, 17.72s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:15<00:00, 15.16s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:16<00:00, 16.10s/it]


{'faithfulness': 0.9333}


Evaluating: 100%|██████████| 1/1 [00:27<00:00, 27.69s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:08<00:00,  8.13s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:07<00:00,  7.36s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:20<00:00, 20.42s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:15<00:00, 15.35s/it]


{'faithfulness': 0.9167}


Evaluating: 100%|██████████| 1/1 [00:35<00:00, 35.57s/it]


{'faithfulness': 0.9333}


Evaluating: 100%|██████████| 1/1 [00:19<00:00, 19.22s/it]


{'faithfulness': 0.9231}


Evaluating: 100%|██████████| 1/1 [00:20<00:00, 20.78s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:18<00:00, 18.76s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:25<00:00, 25.71s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:15<00:00, 15.80s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:08<00:00,  8.73s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:15<00:00, 15.84s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:11<00:00, 11.60s/it]


{'faithfulness': 0.8750}


Evaluating: 100%|██████████| 1/1 [00:14<00:00, 14.44s/it]


{'faithfulness': 0.9167}


Evaluating: 100%|██████████| 1/1 [00:15<00:00, 15.82s/it]


{'faithfulness': 0.8000}


Evaluating: 100%|██████████| 1/1 [00:17<00:00, 17.84s/it]


{'faithfulness': 0.9000}


Evaluating: 100%|██████████| 1/1 [00:20<00:00, 20.75s/it]


{'faithfulness': 0.9412}


Evaluating: 100%|██████████| 1/1 [00:21<00:00, 21.15s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:30<00:00, 30.77s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:15<00:00, 15.02s/it]


{'faithfulness': 0.9231}


Evaluating: 100%|██████████| 1/1 [00:20<00:00, 20.79s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:19<00:00, 19.86s/it]


{'faithfulness': 0.9412}


Evaluating: 100%|██████████| 1/1 [00:15<00:00, 15.31s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:17<00:00, 17.84s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:15<00:00, 15.23s/it]


{'faithfulness': 0.6364}


Evaluating: 100%|██████████| 1/1 [00:22<00:00, 22.37s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:19<00:00, 19.37s/it]


{'faithfulness': 0.9375}


Evaluating: 100%|██████████| 1/1 [00:25<00:00, 25.50s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:05<00:00,  5.21s/it]


{'faithfulness': 0.3333}


Evaluating: 100%|██████████| 1/1 [00:04<00:00,  4.14s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:04<00:00,  4.01s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:24<00:00, 24.50s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:15<00:00, 15.46s/it]


{'faithfulness': 0.9000}


Evaluating: 100%|██████████| 1/1 [00:08<00:00,  8.49s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:15<00:00, 15.28s/it]


{'faithfulness': 0.7778}


Evaluating: 100%|██████████| 1/1 [00:13<00:00, 13.86s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:24<00:00, 24.45s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:12<00:00, 12.23s/it]


{'faithfulness': 0.6667}


Evaluating: 100%|██████████| 1/1 [00:08<00:00,  8.84s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:27<00:00, 27.32s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:08<00:00,  8.23s/it]


{'faithfulness': 0.8571}


Evaluating: 100%|██████████| 1/1 [00:10<00:00, 10.99s/it]


{'faithfulness': 0.9000}


Evaluating: 100%|██████████| 1/1 [00:10<00:00, 10.44s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:17<00:00, 17.14s/it]


{'faithfulness': 0.8571}


Evaluating: 100%|██████████| 1/1 [00:17<00:00, 17.78s/it]


{'faithfulness': 0.9167}


Evaluating: 100%|██████████| 1/1 [00:20<00:00, 20.33s/it]


{'faithfulness': 0.5500}


Evaluating: 100%|██████████| 1/1 [00:03<00:00,  3.71s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:21<00:00, 21.84s/it]


{'faithfulness': 0.6000}


Evaluating: 100%|██████████| 1/1 [00:20<00:00, 20.34s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:14<00:00, 14.27s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:10<00:00, 10.85s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:14<00:00, 14.66s/it]


{'faithfulness': 0.8571}


Evaluating: 100%|██████████| 1/1 [00:30<00:00, 30.58s/it]


{'faithfulness': 0.8947}


Evaluating: 100%|██████████| 1/1 [00:42<00:00, 42.06s/it]


{'faithfulness': 0.6923}


Evaluating: 100%|██████████| 1/1 [00:29<00:00, 29.03s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:35<00:00, 35.63s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:15<00:00, 15.35s/it]


{'faithfulness': 0.6000}


Evaluating: 100%|██████████| 1/1 [00:23<00:00, 23.51s/it]


{'faithfulness': 0.9091}


Evaluating: 100%|██████████| 1/1 [00:25<00:00, 25.82s/it]


{'faithfulness': 0.9375}


Evaluating: 100%|██████████| 1/1 [00:16<00:00, 16.85s/it]


{'faithfulness': 0.7647}


Evaluating: 100%|██████████| 1/1 [00:21<00:00, 21.51s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:12<00:00, 12.48s/it]


{'faithfulness': 0.9167}


Evaluating: 100%|██████████| 1/1 [00:20<00:00, 20.37s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:13<00:00, 13.44s/it]


{'faithfulness': 0.8462}


Evaluating: 100%|██████████| 1/1 [00:19<00:00, 19.82s/it]


{'faithfulness': 0.8000}


Evaluating: 100%|██████████| 1/1 [00:11<00:00, 11.77s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:15<00:00, 15.51s/it]


{'faithfulness': 0.8750}


Evaluating: 100%|██████████| 1/1 [00:16<00:00, 16.90s/it]


{'faithfulness': 0.8750}


Evaluating: 100%|██████████| 1/1 [00:16<00:00, 16.03s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:18<00:00, 18.91s/it]


{'faithfulness': 0.5882}


Evaluating: 100%|██████████| 1/1 [00:13<00:00, 13.91s/it]


{'faithfulness': 0.6000}


Evaluating: 100%|██████████| 1/1 [00:05<00:00,  5.46s/it]


{'faithfulness': 0.8000}


Evaluating: 100%|██████████| 1/1 [00:10<00:00, 10.75s/it]


{'faithfulness': 0.8000}


Evaluating: 100%|██████████| 1/1 [00:21<00:00, 21.67s/it]


{'faithfulness': 0.9048}


Evaluating: 100%|██████████| 1/1 [00:20<00:00, 20.04s/it]


{'faithfulness': 0.8000}


Evaluating: 100%|██████████| 1/1 [00:16<00:00, 16.01s/it]


{'faithfulness': 0.8462}


Evaluating: 100%|██████████| 1/1 [00:19<00:00, 19.95s/it]


{'faithfulness': 0.9286}


Evaluating: 100%|██████████| 1/1 [00:19<00:00, 19.84s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:17<00:00, 17.62s/it]


{'faithfulness': 0.9474}


Evaluating: 100%|██████████| 1/1 [00:15<00:00, 15.94s/it]


{'faithfulness': 0.8571}


Evaluating: 100%|██████████| 1/1 [00:12<00:00, 12.10s/it]


{'faithfulness': 0.8462}


Evaluating: 100%|██████████| 1/1 [00:15<00:00, 15.49s/it]


{'faithfulness': 0.8462}


Evaluating: 100%|██████████| 1/1 [00:10<00:00, 10.88s/it]


{'faithfulness': 0.6154}


Evaluating: 100%|██████████| 1/1 [00:17<00:00, 17.62s/it]


{'faithfulness': 0.6923}


Evaluating: 100%|██████████| 1/1 [00:16<00:00, 16.61s/it]


{'faithfulness': 0.7368}


Evaluating: 100%|██████████| 1/1 [00:13<00:00, 13.51s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:13<00:00, 13.74s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:13<00:00, 13.58s/it]


{'faithfulness': 0.9231}


Evaluating: 100%|██████████| 1/1 [00:17<00:00, 17.04s/it]


{'faithfulness': 0.6471}


Evaluating: 100%|██████████| 1/1 [00:18<00:00, 18.37s/it]


{'faithfulness': 0.7333}


Evaluating: 100%|██████████| 1/1 [00:18<00:00, 18.94s/it]


{'faithfulness': 0.7000}


Evaluating: 100%|██████████| 1/1 [00:13<00:00, 13.54s/it]


{'faithfulness': 0.8333}


Evaluating: 100%|██████████| 1/1 [00:19<00:00, 19.63s/it]


{'faithfulness': 0.8571}


Evaluating: 100%|██████████| 1/1 [00:15<00:00, 15.20s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:11<00:00, 11.16s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:10<00:00, 10.85s/it]


{'faithfulness': 0.9091}


Evaluating: 100%|██████████| 1/1 [00:14<00:00, 14.92s/it]


{'faithfulness': 0.9333}


Evaluating: 100%|██████████| 1/1 [00:09<00:00,  9.32s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:20<00:00, 20.42s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:18<00:00, 18.70s/it]


{'faithfulness': 0.9375}


Evaluating: 100%|██████████| 1/1 [00:11<00:00, 11.09s/it]


{'faithfulness': 0.8333}


Evaluating: 100%|██████████| 1/1 [00:11<00:00, 11.13s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:12<00:00, 12.01s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:16<00:00, 16.05s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:20<00:00, 20.51s/it]


{'faithfulness': 0.9000}


Evaluating: 100%|██████████| 1/1 [00:21<00:00, 21.61s/it]


{'faithfulness': 0.7826}


Evaluating: 100%|██████████| 1/1 [00:12<00:00, 12.16s/it]


{'faithfulness': 0.9286}


Evaluating: 100%|██████████| 1/1 [00:13<00:00, 13.52s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:21<00:00, 21.13s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:10<00:00, 10.91s/it]


{'faithfulness': 0.7000}


Evaluating: 100%|██████████| 1/1 [00:11<00:00, 11.61s/it]


{'faithfulness': 0.9333}


Evaluating: 100%|██████████| 1/1 [00:23<00:00, 23.23s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:13<00:00, 13.96s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:20<00:00, 20.35s/it]


{'faithfulness': 0.8571}


Evaluating: 100%|██████████| 1/1 [00:12<00:00, 12.23s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:13<00:00, 13.23s/it]


{'faithfulness': 0.8571}


Evaluating: 100%|██████████| 1/1 [00:10<00:00, 10.99s/it]


{'faithfulness': 0.7000}


Evaluating: 100%|██████████| 1/1 [00:22<00:00, 22.67s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:16<00:00, 16.82s/it]


{'faithfulness': 0.8182}


Evaluating: 100%|██████████| 1/1 [00:21<00:00, 21.60s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:17<00:00, 17.44s/it]


{'faithfulness': 0.9231}


Evaluating: 100%|██████████| 1/1 [00:09<00:00,  9.43s/it]


{'faithfulness': 0.7143}


Evaluating: 100%|██████████| 1/1 [00:33<00:00, 33.59s/it]


{'faithfulness': 0.7826}


Evaluating: 100%|██████████| 1/1 [00:18<00:00, 18.68s/it]


{'faithfulness': 0.9375}


Evaluating: 100%|██████████| 1/1 [00:12<00:00, 12.41s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:16<00:00, 16.70s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:20<00:00, 20.40s/it]


{'faithfulness': 0.8333}


Evaluating: 100%|██████████| 1/1 [00:13<00:00, 13.92s/it]


{'faithfulness': 0.8462}


Evaluating: 100%|██████████| 1/1 [00:17<00:00, 17.21s/it]


{'faithfulness': 0.9375}


Evaluating: 100%|██████████| 1/1 [00:17<00:00, 17.36s/it]


{'faithfulness': 0.7778}


Evaluating: 100%|██████████| 1/1 [00:14<00:00, 14.12s/it]


{'faithfulness': 0.9231}


Evaluating: 100%|██████████| 1/1 [00:12<00:00, 12.64s/it]


{'faithfulness': 0.9167}


Evaluating: 100%|██████████| 1/1 [00:15<00:00, 15.59s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:17<00:00, 17.86s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:13<00:00, 13.05s/it]


{'faithfulness': 0.8000}


Evaluating: 100%|██████████| 1/1 [00:27<00:00, 27.20s/it]


{'faithfulness': 0.9333}


Evaluating: 100%|██████████| 1/1 [00:21<00:00, 21.38s/it]


{'faithfulness': 0.9091}


Evaluating: 100%|██████████| 1/1 [00:16<00:00, 16.06s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:33<00:00, 33.73s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:29<00:00, 29.41s/it]


{'faithfulness': 0.8261}


Evaluating: 100%|██████████| 1/1 [00:26<00:00, 26.28s/it]


{'faithfulness': 0.9375}


Evaluating: 100%|██████████| 1/1 [00:18<00:00, 18.49s/it]


{'faithfulness': 0.8889}


Evaluating: 100%|██████████| 1/1 [00:25<00:00, 25.38s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:05<00:00,  5.25s/it]


{'faithfulness': 0.7500}


Evaluating: 100%|██████████| 1/1 [00:06<00:00,  6.92s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:03<00:00,  3.70s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:21<00:00, 21.94s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:15<00:00, 15.29s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:14<00:00, 14.60s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:11<00:00, 11.65s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:09<00:00,  9.63s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:14<00:00, 14.37s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:08<00:00,  8.36s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:14<00:00, 14.78s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:04<00:00,  4.15s/it]


{'faithfulness': 0.6667}


Evaluating: 100%|██████████| 1/1 [00:06<00:00,  6.70s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:11<00:00, 11.92s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:08<00:00,  8.55s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:11<00:00, 11.49s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:03<00:00,  3.99s/it]


{'faithfulness': 0.3333}


Evaluating: 100%|██████████| 1/1 [00:15<00:00, 15.63s/it]


{'faithfulness': 0.9375}


Evaluating: 100%|██████████| 1/1 [00:03<00:00,  3.89s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:13<00:00, 13.48s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:16<00:00, 16.16s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:14<00:00, 14.53s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:12<00:00, 12.09s/it]


{'faithfulness': 0.7273}


Evaluating: 100%|██████████| 1/1 [00:12<00:00, 12.48s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:09<00:00,  9.11s/it]


{'faithfulness': 0.8889}


Evaluating: 100%|██████████| 1/1 [00:15<00:00, 15.68s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:17<00:00, 17.68s/it]


{'faithfulness': 0.9286}


Evaluating: 100%|██████████| 1/1 [00:20<00:00, 20.14s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:19<00:00, 19.18s/it]


{'faithfulness': 0.9474}


Evaluating: 100%|██████████| 1/1 [00:13<00:00, 13.28s/it]


{'faithfulness': 0.8462}


Evaluating: 100%|██████████| 1/1 [00:20<00:00, 20.44s/it]


{'faithfulness': 0.8333}


Evaluating: 100%|██████████| 1/1 [00:18<00:00, 18.73s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:12<00:00, 12.91s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:11<00:00, 11.66s/it]


{'faithfulness': 0.7500}


Evaluating: 100%|██████████| 1/1 [00:20<00:00, 20.78s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:22<00:00, 22.56s/it]


{'faithfulness': 0.8333}


Evaluating: 100%|██████████| 1/1 [00:16<00:00, 16.19s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:08<00:00,  8.11s/it]


{'faithfulness': 0.8571}


Evaluating: 100%|██████████| 1/1 [00:21<00:00, 21.21s/it]


{'faithfulness': 0.8571}


Evaluating: 100%|██████████| 1/1 [00:16<00:00, 16.55s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:23<00:00, 23.85s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:18<00:00, 18.11s/it]


{'faithfulness': 0.9565}


Evaluating: 100%|██████████| 1/1 [00:16<00:00, 16.77s/it]


{'faithfulness': 0.9444}


Evaluating: 100%|██████████| 1/1 [00:10<00:00, 10.20s/it]


{'faithfulness': 0.8182}


Evaluating: 100%|██████████| 1/1 [00:08<00:00,  8.62s/it]


{'faithfulness': 0.8889}


Evaluating: 100%|██████████| 1/1 [00:27<00:00, 27.90s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:17<00:00, 17.40s/it]


{'faithfulness': 0.9444}


Evaluating: 100%|██████████| 1/1 [00:17<00:00, 17.15s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:21<00:00, 21.13s/it]


{'faithfulness': 0.9500}


Evaluating: 100%|██████████| 1/1 [00:17<00:00, 17.27s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:23<00:00, 23.51s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:16<00:00, 16.80s/it]


{'faithfulness': 0.9500}


Evaluating: 100%|██████████| 1/1 [00:16<00:00, 16.57s/it]


{'faithfulness': 0.8889}


Evaluating: 100%|██████████| 1/1 [00:19<00:00, 19.97s/it]


{'faithfulness': 0.9375}


Evaluating: 100%|██████████| 1/1 [00:21<00:00, 21.94s/it]


{'faithfulness': 0.9643}


Evaluating: 100%|██████████| 1/1 [00:12<00:00, 12.42s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:13<00:00, 13.66s/it]


{'faithfulness': 0.9412}


Evaluating: 100%|██████████| 1/1 [00:11<00:00, 11.65s/it]


{'faithfulness': 0.8182}


Evaluating: 100%|██████████| 1/1 [00:15<00:00, 15.95s/it]


{'faithfulness': 0.9231}


Evaluating: 100%|██████████| 1/1 [00:13<00:00, 13.71s/it]


{'faithfulness': 0.7692}


Evaluating: 100%|██████████| 1/1 [00:15<00:00, 15.33s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:18<00:00, 18.62s/it]


{'faithfulness': 0.9500}


Evaluating: 100%|██████████| 1/1 [00:19<00:00, 19.15s/it]


{'faithfulness': 0.9474}


Evaluating: 100%|██████████| 1/1 [00:14<00:00, 14.12s/it]


{'faithfulness': 0.9375}


Evaluating: 100%|██████████| 1/1 [00:15<00:00, 15.43s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:17<00:00, 17.50s/it]


{'faithfulness': 0.9474}


Evaluating: 100%|██████████| 1/1 [00:11<00:00, 11.64s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:12<00:00, 12.30s/it]


{'faithfulness': 0.9167}


Evaluating: 100%|██████████| 1/1 [00:13<00:00, 13.90s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:17<00:00, 17.28s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:18<00:00, 18.21s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:18<00:00, 18.12s/it]


{'faithfulness': 0.8125}


Evaluating: 100%|██████████| 1/1 [00:11<00:00, 11.77s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:14<00:00, 14.39s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:28<00:00, 28.62s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:20<00:00, 20.64s/it]


{'faithfulness': 0.9565}


Evaluating: 100%|██████████| 1/1 [00:17<00:00, 17.08s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:20<00:00, 20.73s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:14<00:00, 14.36s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:13<00:00, 13.66s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:13<00:00, 13.01s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:14<00:00, 14.51s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:11<00:00, 11.81s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:18<00:00, 18.62s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:17<00:00, 17.27s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:19<00:00, 19.23s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:13<00:00, 13.08s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:12<00:00, 12.08s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:14<00:00, 14.68s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:21<00:00, 21.94s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:11<00:00, 11.07s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:13<00:00, 13.79s/it]


{'faithfulness': 0.9286}


Evaluating: 100%|██████████| 1/1 [00:18<00:00, 18.82s/it]


{'faithfulness': 0.9412}


Evaluating: 100%|██████████| 1/1 [00:15<00:00, 15.01s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:20<00:00, 20.58s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:18<00:00, 18.06s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:15<00:00, 15.13s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:13<00:00, 13.71s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:38<00:00, 38.15s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:21<00:00, 21.15s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:16<00:00, 16.46s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:11<00:00, 11.04s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:12<00:00, 12.43s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:21<00:00, 21.70s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:14<00:00, 14.53s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:22<00:00, 22.69s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:37<00:00, 37.21s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:34<00:00, 34.36s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:37<00:00, 37.10s/it]


{'faithfulness': 0.9565}


Evaluating: 100%|██████████| 1/1 [00:31<00:00, 31.72s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:31<00:00, 31.99s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:39<00:00, 39.70s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:37<00:00, 37.93s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:31<00:00, 31.85s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:27<00:00, 27.99s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:12<00:00, 12.47s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:05<00:00,  5.22s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:13<00:00, 13.83s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:19<00:00, 19.17s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:10<00:00, 10.08s/it]


{'faithfulness': 0.8889}


Evaluating: 100%|██████████| 1/1 [00:08<00:00,  8.80s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:11<00:00, 11.62s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:08<00:00,  8.96s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:17<00:00, 17.13s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:05<00:00,  5.13s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:06<00:00,  6.24s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:10<00:00, 10.73s/it]


{'faithfulness': 0.8750}


Evaluating: 100%|██████████| 1/1 [00:07<00:00,  7.47s/it]


{'faithfulness': 0.7500}


Evaluating: 100%|██████████| 1/1 [00:06<00:00,  6.96s/it]


{'faithfulness': 0.8333}


Evaluating: 100%|██████████| 1/1 [00:06<00:00,  6.97s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:11<00:00, 11.49s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:12<00:00, 12.47s/it]


{'faithfulness': 0.6250}


Evaluating: 100%|██████████| 1/1 [00:11<00:00, 11.26s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:04<00:00,  4.64s/it]


{'faithfulness': 0.6667}


Evaluating: 100%|██████████| 1/1 [00:13<00:00, 13.20s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:13<00:00, 13.63s/it]


{'faithfulness': 0.8182}


Evaluating: 100%|██████████| 1/1 [00:10<00:00, 10.94s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:05<00:00,  5.70s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:10<00:00, 10.70s/it]


{'faithfulness': 0.8750}


Evaluating: 100%|██████████| 1/1 [00:10<00:00, 10.06s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:17<00:00, 17.60s/it]


{'faithfulness': 0.8000}


Evaluating: 100%|██████████| 1/1 [00:14<00:00, 14.14s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:25<00:00, 25.71s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:16<00:00, 16.63s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:17<00:00, 17.52s/it]


{'faithfulness': 0.7000}


Evaluating: 100%|██████████| 1/1 [00:33<00:00, 33.70s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:16<00:00, 16.88s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:17<00:00, 17.79s/it]


{'faithfulness': 0.9000}


Evaluating: 100%|██████████| 1/1 [00:38<00:00, 38.52s/it]


{'faithfulness': 0.7273}


Evaluating: 100%|██████████| 1/1 [00:31<00:00, 31.56s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:21<00:00, 21.70s/it]


{'faithfulness': 0.9286}


Evaluating: 100%|██████████| 1/1 [00:20<00:00, 20.97s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:09<00:00,  9.84s/it]


{'faithfulness': 0.8333}


Evaluating: 100%|██████████| 1/1 [00:17<00:00, 17.10s/it]


{'faithfulness': 0.9231}


Evaluating: 100%|██████████| 1/1 [00:23<00:00, 23.77s/it]


{'faithfulness': 0.9375}


Evaluating: 100%|██████████| 1/1 [00:24<00:00, 24.53s/it]


{'faithfulness': 0.8667}


Evaluating: 100%|██████████| 1/1 [00:13<00:00, 13.79s/it]


{'faithfulness': 0.9231}


Evaluating: 100%|██████████| 1/1 [00:25<00:00, 25.70s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:06<00:00,  6.29s/it]


{'faithfulness': 0.6000}


Evaluating: 100%|██████████| 1/1 [00:19<00:00, 19.04s/it]


{'faithfulness': 0.8750}


Evaluating: 100%|██████████| 1/1 [00:34<00:00, 34.27s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:22<00:00, 22.77s/it]


{'faithfulness': 0.9412}


Evaluating: 100%|██████████| 1/1 [00:21<00:00, 21.55s/it]


{'faithfulness': 0.9091}


Evaluating: 100%|██████████| 1/1 [00:22<00:00, 22.52s/it]


{'faithfulness': 0.7778}


Evaluating: 100%|██████████| 1/1 [00:32<00:00, 32.87s/it]


{'faithfulness': 0.9412}


Evaluating: 100%|██████████| 1/1 [00:26<00:00, 26.48s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:16<00:00, 16.23s/it]


{'faithfulness': 0.9091}


Evaluating: 100%|██████████| 1/1 [00:14<00:00, 14.71s/it]


{'faithfulness': 0.9000}


Evaluating: 100%|██████████| 1/1 [00:22<00:00, 22.94s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:21<00:00, 21.61s/it]


{'faithfulness': 0.7000}


Evaluating: 100%|██████████| 1/1 [00:17<00:00, 17.56s/it]


{'faithfulness': 0.8750}


Evaluating: 100%|██████████| 1/1 [00:44<00:00, 44.65s/it]


{'faithfulness': 0.6429}


Evaluating: 100%|██████████| 1/1 [00:16<00:00, 16.54s/it]


{'faithfulness': 0.5000}


Evaluating: 100%|██████████| 1/1 [00:27<00:00, 27.28s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:22<00:00, 22.45s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:24<00:00, 24.31s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:48<00:00, 48.66s/it]


{'faithfulness': 0.8571}


Evaluating: 100%|██████████| 1/1 [00:16<00:00, 16.19s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:49<00:00, 49.35s/it]


{'faithfulness': 0.9286}


Evaluating: 100%|██████████| 1/1 [00:34<00:00, 34.47s/it]


{'faithfulness': 0.8462}


Evaluating: 100%|██████████| 1/1 [00:28<00:00, 28.07s/it]


{'faithfulness': 0.7143}


Evaluating: 100%|██████████| 1/1 [00:16<00:00, 16.54s/it]


{'faithfulness': 0.8333}


Evaluating: 100%|██████████| 1/1 [00:16<00:00, 16.67s/it]


{'faithfulness': 0.8750}


Evaluating: 100%|██████████| 1/1 [00:26<00:00, 26.34s/it]


{'faithfulness': 0.9375}


Evaluating: 100%|██████████| 1/1 [00:32<00:00, 32.67s/it]


{'faithfulness': 0.8462}


Evaluating: 100%|██████████| 1/1 [00:23<00:00, 23.12s/it]


{'faithfulness': 0.9167}


Evaluating: 100%|██████████| 1/1 [00:40<00:00, 40.75s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:26<00:00, 26.01s/it]


{'faithfulness': 0.8750}


Evaluating: 100%|██████████| 1/1 [00:19<00:00, 19.70s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [01:08<00:00, 68.36s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:19<00:00, 19.05s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:30<00:00, 30.99s/it]


{'faithfulness': 0.9231}


Evaluating: 100%|██████████| 1/1 [00:36<00:00, 36.48s/it]


{'faithfulness': 0.9412}


Evaluating: 100%|██████████| 1/1 [00:19<00:00, 19.84s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:15<00:00, 15.26s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:31<00:00, 31.43s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:12<00:00, 12.25s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:13<00:00, 13.84s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:25<00:00, 25.24s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:26<00:00, 26.56s/it]


{'faithfulness': 0.8125}


Evaluating: 100%|██████████| 1/1 [00:13<00:00, 13.44s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:20<00:00, 20.27s/it]


{'faithfulness': 0.9286}


Evaluating: 100%|██████████| 1/1 [00:08<00:00,  8.57s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:09<00:00,  9.97s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:20<00:00, 20.58s/it]


{'faithfulness': 0.8667}


Evaluating: 100%|██████████| 1/1 [00:10<00:00, 10.01s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:14<00:00, 14.48s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:16<00:00, 16.26s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:12<00:00, 12.41s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:27<00:00, 27.04s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:17<00:00, 17.99s/it]


{'faithfulness': 0.9545}


Evaluating: 100%|██████████| 1/1 [00:13<00:00, 13.07s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:08<00:00,  8.69s/it]


{'faithfulness': 0.8750}


Evaluating: 100%|██████████| 1/1 [00:24<00:00, 24.37s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:14<00:00, 14.20s/it]


{'faithfulness': 0.9167}


Evaluating: 100%|██████████| 1/1 [00:12<00:00, 12.89s/it]


{'faithfulness': 0.8333}


Evaluating: 100%|██████████| 1/1 [00:09<00:00,  9.40s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:11<00:00, 11.91s/it]


{'faithfulness': 0.6667}


Evaluating: 100%|██████████| 1/1 [00:10<00:00, 10.87s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:14<00:00, 14.49s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:17<00:00, 17.41s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:12<00:00, 12.30s/it]


{'faithfulness': 0.8182}


Evaluating: 100%|██████████| 1/1 [00:20<00:00, 20.93s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:08<00:00,  8.21s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:08<00:00,  8.48s/it]


{'faithfulness': 0.6250}


Evaluating: 100%|██████████| 1/1 [00:15<00:00, 15.30s/it]


{'faithfulness': 0.9231}


Evaluating: 100%|██████████| 1/1 [00:15<00:00, 15.21s/it]


{'faithfulness': 0.9091}


Evaluating: 100%|██████████| 1/1 [00:55<00:00, 55.59s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:09<00:00,  9.05s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:17<00:00, 17.38s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:06<00:00,  6.10s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:04<00:00,  4.61s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:03<00:00,  3.51s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:09<00:00,  9.19s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:15<00:00, 15.86s/it]


{'faithfulness': 0.8889}


Evaluating: 100%|██████████| 1/1 [00:07<00:00,  7.83s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:11<00:00, 11.20s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:06<00:00,  6.33s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:21<00:00, 21.37s/it]


{'faithfulness': 0.9286}


Evaluating: 100%|██████████| 1/1 [00:02<00:00,  2.91s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:08<00:00,  8.23s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:10<00:00, 11.00s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:03<00:00,  3.25s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:08<00:00,  8.66s/it]


{'faithfulness': 0.8750}


Evaluating: 100%|██████████| 1/1 [00:10<00:00, 10.03s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:09<00:00,  9.19s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:17<00:00, 17.18s/it]


{'faithfulness': 0.8889}


Evaluating: 100%|██████████| 1/1 [00:14<00:00, 14.22s/it]


{'faithfulness': 0.6667}


Evaluating: 100%|██████████| 1/1 [00:03<00:00,  3.61s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:07<00:00,  7.78s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:26<00:00, 26.72s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:12<00:00, 12.21s/it]


{'faithfulness': 0.9000}


Evaluating: 100%|██████████| 1/1 [00:06<00:00,  6.25s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:06<00:00,  6.97s/it]


{'faithfulness': 0.3333}


Evaluating: 100%|██████████| 1/1 [00:10<00:00, 10.50s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:13<00:00, 13.20s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:11<00:00, 11.86s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:12<00:00, 12.71s/it]


{'faithfulness': 0.7692}


Evaluating: 100%|██████████| 1/1 [00:19<00:00, 19.70s/it]


{'faithfulness': 0.8235}


Evaluating: 100%|██████████| 1/1 [00:14<00:00, 14.05s/it]


{'faithfulness': 0.7692}


Evaluating: 100%|██████████| 1/1 [00:22<00:00, 22.13s/it]


{'faithfulness': 0.8667}


Evaluating: 100%|██████████| 1/1 [00:15<00:00, 15.03s/it]


{'faithfulness': 0.9091}


Evaluating: 100%|██████████| 1/1 [00:14<00:00, 14.31s/it]


{'faithfulness': 0.1111}


Evaluating: 100%|██████████| 1/1 [00:12<00:00, 12.47s/it]


{'faithfulness': 0.9231}


Evaluating: 100%|██████████| 1/1 [00:16<00:00, 16.16s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:14<00:00, 14.94s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:13<00:00, 13.99s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:06<00:00,  6.83s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:16<00:00, 16.97s/it]


{'faithfulness': 0.7273}


Evaluating: 100%|██████████| 1/1 [00:17<00:00, 17.50s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:22<00:00, 22.45s/it]


{'faithfulness': 0.7895}


Evaluating: 100%|██████████| 1/1 [00:19<00:00, 19.11s/it]


{'faithfulness': 0.8824}


Evaluating: 100%|██████████| 1/1 [00:22<00:00, 22.96s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:08<00:00,  8.87s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:15<00:00, 15.88s/it]


{'faithfulness': 0.8889}


Evaluating: 100%|██████████| 1/1 [00:25<00:00, 25.62s/it]


{'faithfulness': 0.9474}


Evaluating: 100%|██████████| 1/1 [00:17<00:00, 17.73s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:20<00:00, 20.08s/it]


{'faithfulness': 0.9474}


Evaluating: 100%|██████████| 1/1 [00:18<00:00, 18.09s/it]


{'faithfulness': 0.8182}


Evaluating: 100%|██████████| 1/1 [00:10<00:00, 10.55s/it]


{'faithfulness': 0.7778}


Evaluating: 100%|██████████| 1/1 [00:30<00:00, 30.39s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:22<00:00, 22.26s/it]


{'faithfulness': 0.9091}


Evaluating: 100%|██████████| 1/1 [00:22<00:00, 22.62s/it]


{'faithfulness': 0.7059}


Evaluating: 100%|██████████| 1/1 [00:47<00:00, 47.35s/it]


{'faithfulness': 0.9412}


Evaluating: 100%|██████████| 1/1 [00:13<00:00, 13.17s/it]


{'faithfulness': 0.9167}


Evaluating: 100%|██████████| 1/1 [00:28<00:00, 29.00s/it]


{'faithfulness': 0.8571}


Evaluating: 100%|██████████| 1/1 [00:21<00:00, 22.00s/it]


{'faithfulness': 0.1333}


Evaluating: 100%|██████████| 1/1 [00:19<00:00, 19.74s/it]


{'faithfulness': 0.8571}


Evaluating: 100%|██████████| 1/1 [00:24<00:00, 24.67s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:16<00:00, 16.55s/it]


{'faithfulness': 0.8333}


Evaluating: 100%|██████████| 1/1 [00:10<00:00, 10.82s/it]


{'faithfulness': 0.8889}


Evaluating: 100%|██████████| 1/1 [00:20<00:00, 20.99s/it]


{'faithfulness': 0.9167}


Evaluating: 100%|██████████| 1/1 [00:22<00:00, 22.03s/it]


{'faithfulness': 0.8667}


Evaluating: 100%|██████████| 1/1 [00:19<00:00, 19.97s/it]


{'faithfulness': 0.7857}


Evaluating: 100%|██████████| 1/1 [00:19<00:00, 19.34s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:23<00:00, 23.58s/it]


{'faithfulness': 0.9412}


Evaluating: 100%|██████████| 1/1 [00:12<00:00, 12.31s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:19<00:00, 19.32s/it]


{'faithfulness': 0.8889}


Evaluating: 100%|██████████| 1/1 [00:15<00:00, 15.17s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:15<00:00, 15.63s/it]


{'faithfulness': 0.9286}


Evaluating: 100%|██████████| 1/1 [00:13<00:00, 13.55s/it]


{'faithfulness': 0.9167}


Evaluating: 100%|██████████| 1/1 [00:18<00:00, 18.16s/it]


{'faithfulness': 0.9091}


Evaluating: 100%|██████████| 1/1 [00:12<00:00, 12.88s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:16<00:00, 16.43s/it]


{'faithfulness': 0.9091}


Evaluating: 100%|██████████| 1/1 [00:17<00:00, 17.98s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:20<00:00, 20.85s/it]


{'faithfulness': 0.8889}


Evaluating: 100%|██████████| 1/1 [00:13<00:00, 13.30s/it]


{'faithfulness': 0.6667}


Evaluating: 100%|██████████| 1/1 [00:16<00:00, 16.58s/it]


{'faithfulness': 0.9333}


Evaluating: 100%|██████████| 1/1 [00:16<00:00, 16.54s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:15<00:00, 15.24s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:09<00:00,  9.47s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:09<00:00,  9.91s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:10<00:00, 10.19s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:17<00:00, 17.60s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:18<00:00, 18.97s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:14<00:00, 14.57s/it]


{'faithfulness': 0.6364}


Evaluating: 100%|██████████| 1/1 [00:11<00:00, 11.70s/it]


{'faithfulness': 0.9231}


Evaluating: 100%|██████████| 1/1 [00:10<00:00, 10.16s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:08<00:00,  8.27s/it]


{'faithfulness': 0.8571}


Evaluating: 100%|██████████| 1/1 [00:16<00:00, 16.08s/it]


{'faithfulness': 0.8824}


Evaluating: 100%|██████████| 1/1 [00:13<00:00, 13.60s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:20<00:00, 20.22s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:13<00:00, 13.43s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:13<00:00, 13.84s/it]


{'faithfulness': 0.9000}


Evaluating: 100%|██████████| 1/1 [00:24<00:00, 24.09s/it]


{'faithfulness': 0.9500}


Evaluating: 100%|██████████| 1/1 [00:11<00:00, 11.22s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:14<00:00, 14.05s/it]


{'faithfulness': 0.9167}


Evaluating: 100%|██████████| 1/1 [00:09<00:00,  9.72s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:22<00:00, 22.80s/it]


{'faithfulness': 0.9333}


Evaluating: 100%|██████████| 1/1 [00:10<00:00, 10.26s/it]


{'faithfulness': 0.8889}


Evaluating: 100%|██████████| 1/1 [00:13<00:00, 13.36s/it]


{'faithfulness': 0.9167}


Evaluating: 100%|██████████| 1/1 [00:10<00:00, 10.39s/it]


{'faithfulness': 0.8750}


Evaluating: 100%|██████████| 1/1 [00:11<00:00, 11.46s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:14<00:00, 14.72s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:15<00:00, 15.17s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:20<00:00, 20.75s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:11<00:00, 11.40s/it]


{'faithfulness': 0.8182}


Evaluating: 100%|██████████| 1/1 [00:15<00:00, 15.29s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:17<00:00, 17.02s/it]


{'faithfulness': 0.9167}


Evaluating: 100%|██████████| 1/1 [00:11<00:00, 11.48s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:25<00:00, 25.94s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:15<00:00, 15.95s/it]


{'faithfulness': 0.8571}


Evaluating: 100%|██████████| 1/1 [00:16<00:00, 16.17s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:17<00:00, 17.12s/it]


{'faithfulness': 0.8000}


Evaluating: 100%|██████████| 1/1 [01:07<00:00, 67.17s/it]


{'faithfulness': 0.8824}


Evaluating: 100%|██████████| 1/1 [00:08<00:00,  8.19s/it]


{'faithfulness': 0.6667}


Evaluating: 100%|██████████| 1/1 [00:05<00:00,  5.22s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:05<00:00,  5.60s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:11<00:00, 11.94s/it]


{'faithfulness': 0.9000}


Evaluating: 100%|██████████| 1/1 [00:09<00:00,  9.43s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:08<00:00,  8.61s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:21<00:00, 21.31s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:08<00:00,  8.53s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:08<00:00,  8.85s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:06<00:00,  6.29s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:09<00:00,  9.14s/it]


{'faithfulness': 0.8333}


Evaluating: 100%|██████████| 1/1 [00:12<00:00, 12.98s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:08<00:00,  8.24s/it]


{'faithfulness': 0.8000}


Evaluating: 100%|██████████| 1/1 [00:10<00:00, 10.22s/it]


{'faithfulness': 0.7143}


Evaluating: 100%|██████████| 1/1 [00:08<00:00,  8.37s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:09<00:00,  9.44s/it]


{'faithfulness': 0.8571}


Evaluating: 100%|██████████| 1/1 [00:12<00:00, 12.70s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:09<00:00,  9.53s/it]


{'faithfulness': 0.8333}


Evaluating: 100%|██████████| 1/1 [00:04<00:00,  4.74s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:12<00:00, 12.41s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:12<00:00, 12.73s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:08<00:00,  8.06s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:07<00:00,  7.64s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:03<00:00,  3.90s/it]


{'faithfulness': 0.0000}


Evaluating: 100%|██████████| 1/1 [00:07<00:00,  7.76s/it]


{'faithfulness': 0.8000}


Evaluating: 100%|██████████| 1/1 [00:19<00:00, 19.35s/it]


{'faithfulness': 0.7000}


Evaluating: 100%|██████████| 1/1 [00:13<00:00, 13.01s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:30<00:00, 30.23s/it]


{'faithfulness': 0.9091}


Evaluating: 100%|██████████| 1/1 [00:12<00:00, 12.11s/it]


{'faithfulness': 0.7778}


Evaluating: 100%|██████████| 1/1 [00:08<00:00,  8.25s/it]


{'faithfulness': 0.8571}


Evaluating: 100%|██████████| 1/1 [00:19<00:00, 19.67s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:15<00:00, 15.84s/it]


{'faithfulness': 0.9167}


Evaluating: 100%|██████████| 1/1 [00:10<00:00, 10.26s/it]


{'faithfulness': 0.6000}


Evaluating: 100%|██████████| 1/1 [00:13<00:00, 13.50s/it]


{'faithfulness': 0.8571}


Evaluating: 100%|██████████| 1/1 [00:18<00:00, 18.78s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:12<00:00, 12.75s/it]


{'faithfulness': 0.8182}


Evaluating: 100%|██████████| 1/1 [00:16<00:00, 16.91s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:06<00:00,  6.14s/it]


{'faithfulness': 0.8333}


Evaluating: 100%|██████████| 1/1 [00:14<00:00, 14.49s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:16<00:00, 16.59s/it]


{'faithfulness': 0.8571}


Evaluating: 100%|██████████| 1/1 [00:24<00:00, 24.14s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:14<00:00, 14.02s/it]


{'faithfulness': 0.9091}


Evaluating: 100%|██████████| 1/1 [00:14<00:00, 14.92s/it]


{'faithfulness': 0.7857}


Evaluating: 100%|██████████| 1/1 [00:06<00:00,  6.84s/it]


{'faithfulness': 0.8333}


Evaluating: 100%|██████████| 1/1 [00:12<00:00, 12.76s/it]


{'faithfulness': 0.8889}


Evaluating: 100%|██████████| 1/1 [00:16<00:00, 16.56s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:19<00:00, 19.53s/it]


{'faithfulness': 0.9167}


Evaluating: 100%|██████████| 1/1 [00:17<00:00, 17.34s/it]


{'faithfulness': 0.9231}


Evaluating: 100%|██████████| 1/1 [00:07<00:00,  7.38s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:12<00:00, 12.16s/it]


{'faithfulness': 0.8182}


Evaluating: 100%|██████████| 1/1 [00:14<00:00, 14.04s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:22<00:00, 22.52s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:13<00:00, 13.28s/it]


{'faithfulness': 0.8182}


Evaluating: 100%|██████████| 1/1 [00:15<00:00, 15.35s/it]


{'faithfulness': 0.7778}


Evaluating: 100%|██████████| 1/1 [00:12<00:00, 12.39s/it]


{'faithfulness': 0.7143}


Evaluating: 100%|██████████| 1/1 [00:12<00:00, 12.60s/it]


{'faithfulness': 0.8571}


Evaluating: 100%|██████████| 1/1 [00:12<00:00, 12.40s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:09<00:00,  9.84s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:12<00:00, 12.09s/it]


{'faithfulness': 0.9000}


Evaluating: 100%|██████████| 1/1 [00:12<00:00, 12.96s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:13<00:00, 13.60s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:10<00:00, 10.63s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:10<00:00, 10.49s/it]


{'faithfulness': 0.8182}


Evaluating: 100%|██████████| 1/1 [00:14<00:00, 14.60s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:10<00:00, 10.81s/it]


{'faithfulness': 0.8000}


Evaluating: 100%|██████████| 1/1 [00:09<00:00,  9.38s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:11<00:00, 11.61s/it]


{'faithfulness': 0.8571}


Evaluating: 100%|██████████| 1/1 [00:13<00:00, 13.16s/it]


{'faithfulness': 0.8889}


Evaluating: 100%|██████████| 1/1 [00:09<00:00,  9.55s/it]


{'faithfulness': 0.8333}


Evaluating: 100%|██████████| 1/1 [00:10<00:00, 10.94s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:14<00:00, 14.32s/it]


{'faithfulness': 0.9286}


Evaluating: 100%|██████████| 1/1 [00:13<00:00, 13.92s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:14<00:00, 14.51s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:23<00:00, 23.83s/it]


{'faithfulness': 0.9333}


Evaluating: 100%|██████████| 1/1 [00:19<00:00, 19.77s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:17<00:00, 17.04s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:15<00:00, 15.33s/it]


{'faithfulness': 0.8750}


Evaluating: 100%|██████████| 1/1 [00:21<00:00, 21.29s/it]


{'faithfulness': 0.9286}


Evaluating: 100%|██████████| 1/1 [00:18<00:00, 18.66s/it]


{'faithfulness': 0.9412}


Evaluating: 100%|██████████| 1/1 [00:08<00:00,  8.76s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:08<00:00,  8.20s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:06<00:00,  6.88s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:11<00:00, 11.89s/it]


{'faithfulness': 0.8000}


Evaluating: 100%|██████████| 1/1 [00:20<00:00, 20.59s/it]


{'faithfulness': 0.9167}


Evaluating: 100%|██████████| 1/1 [00:19<00:00, 19.00s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:12<00:00, 12.08s/it]


{'faithfulness': 0.6250}


Evaluating: 100%|██████████| 1/1 [00:45<00:00, 45.59s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:16<00:00, 16.51s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:16<00:00, 16.11s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:41<00:00, 41.16s/it]


{'faithfulness': 0.9048}


Evaluating: 100%|██████████| 1/1 [00:15<00:00, 15.52s/it]


{'faithfulness': 0.8333}


Evaluating: 100%|██████████| 1/1 [00:26<00:00, 26.66s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:18<00:00, 18.17s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:19<00:00, 19.02s/it]


{'faithfulness': 0.8333}


Evaluating: 100%|██████████| 1/1 [00:29<00:00, 29.74s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:24<00:00, 24.82s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:25<00:00, 25.18s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:11<00:00, 11.55s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:21<00:00, 21.07s/it]


{'faithfulness': 0.9167}


Evaluating: 100%|██████████| 1/1 [00:11<00:00, 11.88s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:39<00:00, 39.59s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:14<00:00, 14.42s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:15<00:00, 15.40s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:32<00:00, 32.91s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:26<00:00, 26.22s/it]


{'faithfulness': 0.6667}


Evaluating: 100%|██████████| 1/1 [00:34<00:00, 34.89s/it]


{'faithfulness': 0.9091}


Evaluating: 100%|██████████| 1/1 [00:30<00:00, 30.92s/it]


{'faithfulness': 0.8462}


Evaluating: 100%|██████████| 1/1 [01:10<00:00, 70.85s/it]


{'faithfulness': 0.9474}


Evaluating: 100%|██████████| 1/1 [00:29<00:00, 29.70s/it]


{'faithfulness': 0.9231}


Evaluating: 100%|██████████| 1/1 [00:20<00:00, 20.20s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:22<00:00, 22.98s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:36<00:00, 36.48s/it]


{'faithfulness': 0.5455}


Evaluating: 100%|██████████| 1/1 [00:26<00:00, 26.87s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:26<00:00, 26.04s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:28<00:00, 28.26s/it]


{'faithfulness': 0.9375}


Evaluating: 100%|██████████| 1/1 [00:08<00:00,  8.61s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:08<00:00,  8.02s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:10<00:00, 10.51s/it]


{'faithfulness': 0.0000}


Evaluating: 100%|██████████| 1/1 [00:19<00:00, 19.75s/it]


{'faithfulness': 0.9000}


Evaluating: 100%|██████████| 1/1 [00:28<00:00, 28.33s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:22<00:00, 22.07s/it]


{'faithfulness': 0.8889}


Evaluating: 100%|██████████| 1/1 [00:28<00:00, 28.18s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:13<00:00, 13.48s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:18<00:00, 18.19s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:12<00:00, 12.60s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:15<00:00, 15.43s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:15<00:00, 15.75s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:18<00:00, 18.22s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:28<00:00, 28.59s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:12<00:00, 12.66s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:13<00:00, 13.28s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:21<00:00, 21.71s/it]


{'faithfulness': 0.9091}


Evaluating: 100%|██████████| 1/1 [00:17<00:00, 17.70s/it]


{'faithfulness': 0.8750}


Evaluating: 100%|██████████| 1/1 [00:05<00:00,  5.13s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:35<00:00, 35.77s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:15<00:00, 15.83s/it]


{'faithfulness': 0.8750}


Evaluating: 100%|██████████| 1/1 [00:18<00:00, 18.86s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:37<00:00, 37.07s/it]


{'faithfulness': 0.8571}


Evaluating: 100%|██████████| 1/1 [00:17<00:00, 17.73s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:17<00:00, 17.94s/it]


{'faithfulness': 0.8750}


Evaluating: 100%|██████████| 1/1 [00:14<00:00, 14.84s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:31<00:00, 31.86s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:56<00:00, 56.27s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:19<00:00, 19.02s/it]


{'faithfulness': 0.7500}


Evaluating: 100%|██████████| 1/1 [00:11<00:00, 11.86s/it]


{'faithfulness': 0.8333}


Evaluating: 100%|██████████| 1/1 [00:40<00:00, 40.31s/it]


{'faithfulness': 0.9444}


Evaluating: 100%|██████████| 1/1 [00:30<00:00, 30.62s/it]


{'faithfulness': 0.9333}


Evaluating: 100%|██████████| 1/1 [00:14<00:00, 14.91s/it]


{'faithfulness': 0.8333}


Evaluating: 100%|██████████| 1/1 [00:22<00:00, 22.87s/it]


{'faithfulness': 0.7500}


Evaluating: 100%|██████████| 1/1 [00:30<00:00, 30.34s/it]


{'faithfulness': 0.9333}


Evaluating: 100%|██████████| 1/1 [00:17<00:00, 17.40s/it]


{'faithfulness': 0.8667}


Evaluating: 100%|██████████| 1/1 [00:18<00:00, 18.54s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:13<00:00, 13.35s/it]


{'faithfulness': 0.8333}


Evaluating: 100%|██████████| 1/1 [00:22<00:00, 22.37s/it]


{'faithfulness': 0.8750}


Evaluating: 100%|██████████| 1/1 [00:31<00:00, 31.23s/it]


{'faithfulness': 0.9231}


Evaluating: 100%|██████████| 1/1 [00:24<00:00, 24.63s/it]


{'faithfulness': 0.8750}


Evaluating: 100%|██████████| 1/1 [00:33<00:00, 33.68s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:22<00:00, 22.17s/it]


{'faithfulness': 0.8750}


Evaluating: 100%|██████████| 1/1 [00:28<00:00, 28.42s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:24<00:00, 24.95s/it]


{'faithfulness': 0.8889}


Evaluating: 100%|██████████| 1/1 [00:30<00:00, 30.34s/it]


{'faithfulness': 0.9333}


Evaluating: 100%|██████████| 1/1 [00:15<00:00, 15.18s/it]


{'faithfulness': 0.8889}


Evaluating: 100%|██████████| 1/1 [00:36<00:00, 36.23s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:21<00:00, 21.38s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:21<00:00, 21.77s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:25<00:00, 25.34s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:20<00:00, 20.87s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:11<00:00, 11.59s/it]


{'faithfulness': 0.8750}


Evaluating: 100%|██████████| 1/1 [00:18<00:00, 18.01s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:20<00:00, 20.00s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:18<00:00, 18.16s/it]


{'faithfulness': 0.9091}


Evaluating: 100%|██████████| 1/1 [00:30<00:00, 30.66s/it]


{'faithfulness': 0.9091}


Evaluating: 100%|██████████| 1/1 [00:33<00:00, 33.61s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:15<00:00, 15.65s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:49<00:00, 49.20s/it]


{'faithfulness': 0.9231}


Evaluating: 100%|██████████| 1/1 [00:48<00:00, 48.05s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:35<00:00, 35.84s/it]


{'faithfulness': 0.7895}


Evaluating: 100%|██████████| 1/1 [00:18<00:00, 18.10s/it]


{'faithfulness': 0.8000}


Evaluating: 100%|██████████| 1/1 [00:21<00:00, 21.20s/it]


{'faithfulness': 0.9167}


Evaluating: 100%|██████████| 1/1 [00:24<00:00, 24.05s/it]


{'faithfulness': 0.9091}


Evaluating: 100%|██████████| 1/1 [00:21<00:00, 21.34s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:15<00:00, 15.28s/it]


{'faithfulness': 0.9000}


Evaluating: 100%|██████████| 1/1 [00:18<00:00, 18.23s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:20<00:00, 20.17s/it]


{'faithfulness': 0.7692}


Evaluating: 100%|██████████| 1/1 [00:20<00:00, 20.28s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:22<00:00, 22.43s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:20<00:00, 20.87s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:19<00:00, 19.35s/it]


{'faithfulness': 0.8750}


Evaluating: 100%|██████████| 1/1 [00:30<00:00, 30.80s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:42<00:00, 42.75s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:28<00:00, 28.44s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:30<00:00, 30.56s/it]


{'faithfulness': 0.8333}


Evaluating: 100%|██████████| 1/1 [00:20<00:00, 20.08s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:21<00:00, 21.85s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:23<00:00, 23.12s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:09<00:00,  9.11s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:07<00:00,  7.18s/it]


{'faithfulness': 0.8333}


Evaluating: 100%|██████████| 1/1 [00:12<00:00, 12.05s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:23<00:00, 23.06s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:15<00:00, 15.10s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:16<00:00, 16.20s/it]


{'faithfulness': 0.8000}


Evaluating: 100%|██████████| 1/1 [00:29<00:00, 29.81s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:18<00:00, 18.49s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:11<00:00, 11.58s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:33<00:00, 33.33s/it]


{'faithfulness': 0.9500}


Evaluating: 100%|██████████| 1/1 [00:10<00:00, 10.22s/it]


{'faithfulness': 0.8571}


Evaluating: 100%|██████████| 1/1 [00:14<00:00, 14.16s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:17<00:00, 17.15s/it]


{'faithfulness': 0.9231}


Evaluating: 100%|██████████| 1/1 [00:11<00:00, 11.77s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:35<00:00, 35.06s/it]


{'faithfulness': 0.9444}


Evaluating: 100%|██████████| 1/1 [00:26<00:00, 26.62s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:12<00:00, 12.16s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:10<00:00, 10.30s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:24<00:00, 24.06s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:20<00:00, 20.05s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:20<00:00, 20.01s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:12<00:00, 12.77s/it]


{'faithfulness': 0.9091}


Evaluating: 100%|██████████| 1/1 [00:15<00:00, 15.18s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:15<00:00, 15.09s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:11<00:00, 11.28s/it]


{'faithfulness': 0.8000}


Evaluating: 100%|██████████| 1/1 [00:15<00:00, 15.25s/it]


{'faithfulness': 0.9231}


Evaluating: 100%|██████████| 1/1 [00:13<00:00, 13.69s/it]


{'faithfulness': 0.7778}


Evaluating: 100%|██████████| 1/1 [00:25<00:00, 25.42s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:16<00:00, 16.73s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:11<00:00, 12.00s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:19<00:00, 19.66s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:16<00:00, 16.67s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:33<00:00, 33.52s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:22<00:00, 22.25s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:28<00:00, 28.48s/it]


{'faithfulness': 1.0000}


Evaluating:   0%|          | 0/1 [00:00<?, ?it/s]No statements were generated from the answer.
Evaluating: 100%|██████████| 1/1 [00:00<00:00,  1.10it/s]


{'faithfulness': nan}


Evaluating: 100%|██████████| 1/1 [00:04<00:00,  4.53s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:03<00:00,  3.88s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:12<00:00, 12.39s/it]


{'faithfulness': 0.9000}


Evaluating: 100%|██████████| 1/1 [00:11<00:00, 11.38s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:09<00:00,  9.36s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:11<00:00, 11.53s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:08<00:00,  8.37s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:13<00:00, 13.36s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:03<00:00,  3.96s/it]


{'faithfulness': 0.5000}


Evaluating: 100%|██████████| 1/1 [00:09<00:00,  9.51s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:09<00:00,  9.29s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:05<00:00,  5.08s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:11<00:00, 11.69s/it]


{'faithfulness': 0.9000}


Evaluating: 100%|██████████| 1/1 [00:08<00:00,  8.85s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:13<00:00, 13.36s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:17<00:00, 17.36s/it]


{'faithfulness': 0.9167}


Evaluating: 100%|██████████| 1/1 [00:08<00:00,  8.85s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:04<00:00,  4.50s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:12<00:00, 12.08s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:12<00:00, 12.58s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:10<00:00, 10.81s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:06<00:00,  6.92s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:10<00:00, 10.98s/it]


{'faithfulness': 0.8333}


Evaluating: 100%|██████████| 1/1 [00:21<00:00, 21.29s/it]


{'faithfulness': 0.8182}


Evaluating: 100%|██████████| 1/1 [00:12<00:00, 12.29s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:22<00:00, 22.24s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:16<00:00, 16.44s/it]


{'faithfulness': 0.8462}


Evaluating: 100%|██████████| 1/1 [00:09<00:00,  9.56s/it]


{'faithfulness': 0.8571}


Evaluating: 100%|██████████| 1/1 [00:20<00:00, 20.62s/it]


{'faithfulness': 0.6429}


Evaluating: 100%|██████████| 1/1 [00:16<00:00, 16.16s/it]


{'faithfulness': 0.9167}


Evaluating: 100%|██████████| 1/1 [00:42<00:00, 42.44s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:19<00:00, 19.72s/it]


{'faithfulness': 0.8000}


Evaluating: 100%|██████████| 1/1 [00:15<00:00, 15.07s/it]


{'faithfulness': 0.6250}


Evaluating: 100%|██████████| 1/1 [00:26<00:00, 26.47s/it]


{'faithfulness': 0.9412}


Evaluating: 100%|██████████| 1/1 [00:17<00:00, 17.94s/it]


{'faithfulness': 0.7500}


Evaluating: 100%|██████████| 1/1 [00:15<00:00, 15.75s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:08<00:00,  8.21s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:20<00:00, 20.16s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:30<00:00, 30.63s/it]


{'faithfulness': 0.9000}


Evaluating: 100%|██████████| 1/1 [00:17<00:00, 17.59s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:16<00:00, 16.76s/it]


{'faithfulness': 0.9091}


Evaluating: 100%|██████████| 1/1 [00:15<00:00, 15.87s/it]


{'faithfulness': 0.9091}


Evaluating: 100%|██████████| 1/1 [00:09<00:00,  9.91s/it]


{'faithfulness': 0.6000}


Evaluating: 100%|██████████| 1/1 [00:25<00:00, 25.02s/it]


{'faithfulness': 0.8889}


Evaluating: 100%|██████████| 1/1 [00:18<00:00, 18.05s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:21<00:00, 21.26s/it]


{'faithfulness': 0.9231}


Evaluating: 100%|██████████| 1/1 [00:23<00:00, 23.15s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:08<00:00,  8.82s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:13<00:00, 13.60s/it]


{'faithfulness': 0.9167}


Evaluating: 100%|██████████| 1/1 [00:16<00:00, 16.63s/it]


{'faithfulness': 0.9091}


Evaluating: 100%|██████████| 1/1 [00:13<00:00, 13.02s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:14<00:00, 14.53s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:12<00:00, 12.80s/it]


{'faithfulness': 0.8571}


Evaluating: 100%|██████████| 1/1 [00:15<00:00, 15.34s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:07<00:00,  7.74s/it]


{'faithfulness': 0.8333}


Evaluating: 100%|██████████| 1/1 [00:14<00:00, 14.27s/it]


{'faithfulness': 0.8889}


Evaluating: 100%|██████████| 1/1 [00:13<00:00, 13.40s/it]


{'faithfulness': 0.8750}


Evaluating: 100%|██████████| 1/1 [00:17<00:00, 17.77s/it]


{'faithfulness': 0.7500}


Evaluating: 100%|██████████| 1/1 [00:11<00:00, 11.12s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:14<00:00, 14.47s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:14<00:00, 14.24s/it]


{'faithfulness': 0.8000}


Evaluating: 100%|██████████| 1/1 [00:16<00:00, 16.22s/it]


{'faithfulness': 0.8571}


Evaluating: 100%|██████████| 1/1 [00:09<00:00,  9.43s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:15<00:00, 15.02s/it]


{'faithfulness': 0.8571}


Evaluating: 100%|██████████| 1/1 [00:20<00:00, 20.29s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:15<00:00, 15.63s/it]


{'faithfulness': 0.5000}


Evaluating: 100%|██████████| 1/1 [00:11<00:00, 11.39s/it]


{'faithfulness': 0.8750}


Evaluating: 100%|██████████| 1/1 [00:11<00:00, 11.85s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:18<00:00, 18.35s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:13<00:00, 13.12s/it]


{'faithfulness': 0.8182}


Evaluating: 100%|██████████| 1/1 [00:13<00:00, 13.11s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:11<00:00, 11.78s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:35<00:00, 35.84s/it]


{'faithfulness': 0.9231}


Evaluating: 100%|██████████| 1/1 [00:31<00:00, 31.56s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:21<00:00, 21.65s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:17<00:00, 17.91s/it]


{'faithfulness': 0.7778}


Evaluating: 100%|██████████| 1/1 [00:22<00:00, 22.26s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:28<00:00, 28.27s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:13<00:00, 13.75s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:12<00:00, 13.00s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:17<00:00, 17.04s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:16<00:00, 16.62s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:37<00:00, 37.89s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:32<00:00, 32.86s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:20<00:00, 20.81s/it]


{'faithfulness': 0.8000}


Evaluating: 100%|██████████| 1/1 [00:25<00:00, 25.63s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:10<00:00, 10.18s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:11<00:00, 11.38s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:19<00:00, 19.13s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:12<00:00, 12.81s/it]


{'faithfulness': 0.7778}


Evaluating: 100%|██████████| 1/1 [00:14<00:00, 14.87s/it]


{'faithfulness': 0.8182}


Evaluating: 100%|██████████| 1/1 [00:15<00:00, 15.40s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:13<00:00, 13.84s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:15<00:00, 15.44s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:23<00:00, 23.99s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:14<00:00, 14.56s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:16<00:00, 16.17s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:16<00:00, 16.92s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:10<00:00, 10.51s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:16<00:00, 16.44s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:15<00:00, 15.87s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:09<00:00,  9.54s/it]


{'faithfulness': 0.8000}


Evaluating: 100%|██████████| 1/1 [00:09<00:00,  9.86s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:12<00:00, 12.65s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:15<00:00, 15.41s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:10<00:00, 10.34s/it]


{'faithfulness': 0.8750}


Evaluating: 100%|██████████| 1/1 [00:36<00:00, 36.96s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:20<00:00, 20.54s/it]


{'faithfulness': 0.9000}


Evaluating: 100%|██████████| 1/1 [00:10<00:00, 10.98s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:15<00:00, 15.73s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:10<00:00, 10.96s/it]


{'faithfulness': 0.7778}


Evaluating: 100%|██████████| 1/1 [00:16<00:00, 16.37s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:25<00:00, 25.00s/it]


{'faithfulness': 0.8947}


Evaluating: 100%|██████████| 1/1 [00:24<00:00, 24.35s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:05<00:00,  5.12s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:04<00:00,  4.34s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:04<00:00,  4.83s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:16<00:00, 16.44s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:17<00:00, 17.98s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:12<00:00, 12.83s/it]


{'faithfulness': 0.8000}


Evaluating: 100%|██████████| 1/1 [00:18<00:00, 18.50s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:13<00:00, 13.79s/it]


{'faithfulness': 0.9231}


Evaluating: 100%|██████████| 1/1 [00:09<00:00,  9.09s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:10<00:00, 10.08s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:08<00:00,  8.45s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:21<00:00, 21.01s/it]


{'faithfulness': 0.6842}


Evaluating: 100%|██████████| 1/1 [00:06<00:00,  6.72s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:05<00:00,  5.91s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:05<00:00,  5.35s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:33<00:00, 33.10s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:15<00:00, 15.80s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:15<00:00, 15.37s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:26<00:00, 26.56s/it]


{'faithfulness': 0.9412}


Evaluating: 100%|██████████| 1/1 [00:13<00:00, 13.42s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:18<00:00, 18.75s/it]


{'faithfulness': 0.9000}


Evaluating: 100%|██████████| 1/1 [00:18<00:00, 18.27s/it]


{'faithfulness': 0.9375}


Evaluating: 100%|██████████| 1/1 [00:17<00:00, 17.29s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:05<00:00,  5.14s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:40<00:00, 40.64s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:17<00:00, 17.16s/it]


{'faithfulness': 0.9333}


Evaluating: 100%|██████████| 1/1 [00:13<00:00, 13.62s/it]


{'faithfulness': 0.6667}


Evaluating: 100%|██████████| 1/1 [00:21<00:00, 21.73s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:17<00:00, 17.34s/it]


{'faithfulness': 0.9333}


Evaluating: 100%|██████████| 1/1 [00:20<00:00, 20.22s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:28<00:00, 28.33s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:11<00:00, 11.11s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:15<00:00, 15.76s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:11<00:00, 11.20s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:12<00:00, 12.72s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:11<00:00, 11.70s/it]


{'faithfulness': 0.7778}


Evaluating: 100%|██████████| 1/1 [00:15<00:00, 15.96s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:09<00:00,  9.66s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:16<00:00, 16.12s/it]


{'faithfulness': 0.9167}


Evaluating: 100%|██████████| 1/1 [00:24<00:00, 24.34s/it]


{'faithfulness': 0.9333}


Evaluating: 100%|██████████| 1/1 [00:20<00:00, 20.91s/it]


{'faithfulness': 0.9412}


Evaluating: 100%|██████████| 1/1 [00:11<00:00, 11.38s/it]


{'faithfulness': 0.8000}


Evaluating: 100%|██████████| 1/1 [00:20<00:00, 20.05s/it]


{'faithfulness': 0.9333}


Evaluating: 100%|██████████| 1/1 [00:16<00:00, 16.48s/it]


{'faithfulness': 0.9167}


Evaluating: 100%|██████████| 1/1 [00:11<00:00, 11.27s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:18<00:00, 18.58s/it]


{'faithfulness': 0.9231}


Evaluating: 100%|██████████| 1/1 [00:13<00:00, 13.65s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:12<00:00, 12.84s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:03<00:00,  3.24s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:16<00:00, 16.68s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:16<00:00, 16.47s/it]


{'faithfulness': 0.8571}


Evaluating: 100%|██████████| 1/1 [00:07<00:00,  7.28s/it]


{'faithfulness': 0.8000}


Evaluating: 100%|██████████| 1/1 [00:12<00:00, 12.88s/it]


{'faithfulness': 0.8889}


Evaluating: 100%|██████████| 1/1 [00:15<00:00, 15.79s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:20<00:00, 20.21s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:09<00:00,  9.24s/it]


{'faithfulness': 0.9000}


Evaluating: 100%|██████████| 1/1 [00:25<00:00, 25.84s/it]


{'faithfulness': 0.9583}


Evaluating: 100%|██████████| 1/1 [00:06<00:00,  6.24s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:13<00:00, 13.69s/it]


{'faithfulness': 0.9231}


Evaluating: 100%|██████████| 1/1 [00:13<00:00, 13.44s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:10<00:00, 10.60s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:16<00:00, 16.16s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:11<00:00, 11.15s/it]


{'faithfulness': 0.9000}


Evaluating: 100%|██████████| 1/1 [00:15<00:00, 15.04s/it]


{'faithfulness': 0.8571}


Evaluating: 100%|██████████| 1/1 [00:14<00:00, 14.98s/it]


{'faithfulness': 0.9286}


Evaluating: 100%|██████████| 1/1 [00:08<00:00,  8.14s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:20<00:00, 20.71s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:13<00:00, 13.24s/it]


{'faithfulness': 0.9000}


Evaluating: 100%|██████████| 1/1 [00:10<00:00, 10.92s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:10<00:00, 10.78s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:15<00:00, 15.52s/it]


{'faithfulness': 0.9412}


Evaluating: 100%|██████████| 1/1 [00:16<00:00, 16.47s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:07<00:00,  7.57s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:03<00:00,  3.52s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:16<00:00, 16.00s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:16<00:00, 16.65s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:24<00:00, 24.31s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:14<00:00, 14.42s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:23<00:00, 23.98s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:33<00:00, 33.34s/it]


{'faithfulness': 0.9091}


Evaluating: 100%|██████████| 1/1 [01:02<00:00, 62.59s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:11<00:00, 11.43s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:16<00:00, 16.26s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:13<00:00, 13.72s/it]


{'faithfulness': 0.8000}


Evaluating: 100%|██████████| 1/1 [00:23<00:00, 23.11s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:10<00:00, 10.45s/it]


{'faithfulness': 0.7778}


Evaluating: 100%|██████████| 1/1 [00:10<00:00, 10.25s/it]


{'faithfulness': 0.8750}


Evaluating: 100%|██████████| 1/1 [00:22<00:00, 22.59s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:18<00:00, 18.53s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:16<00:00, 16.16s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:15<00:00, 15.45s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:15<00:00, 15.81s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:20<00:00, 20.68s/it]


{'faithfulness': 0.8750}


Evaluating: 100%|██████████| 1/1 [00:22<00:00, 22.31s/it]


{'faithfulness': 0.8667}


Evaluating: 100%|██████████| 1/1 [00:11<00:00, 11.24s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:18<00:00, 18.90s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:08<00:00,  8.03s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:12<00:00, 12.78s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:27<00:00, 27.91s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:22<00:00, 22.59s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:15<00:00, 15.82s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:16<00:00, 16.70s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:26<00:00, 26.37s/it]


{'faithfulness': 0.9231}


Evaluating: 100%|██████████| 1/1 [00:20<00:00, 20.35s/it]


{'faithfulness': 0.9091}


Evaluating: 100%|██████████| 1/1 [00:24<00:00, 24.69s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:24<00:00, 24.02s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:12<00:00, 12.63s/it]


{'faithfulness': 0.9000}


Evaluating: 100%|██████████| 1/1 [00:22<00:00, 22.81s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:34<00:00, 34.43s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:13<00:00, 13.38s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:12<00:00, 12.84s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:18<00:00, 18.03s/it]


{'faithfulness': 0.9375}


Evaluating: 100%|██████████| 1/1 [00:21<00:00, 21.02s/it]


{'faithfulness': 0.9565}


Evaluating: 100%|██████████| 1/1 [00:19<00:00, 19.60s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:23<00:00, 23.85s/it]


{'faithfulness': 0.9565}


Evaluating: 100%|██████████| 1/1 [00:12<00:00, 12.53s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:14<00:00, 14.45s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:12<00:00, 12.26s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:23<00:00, 23.23s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:19<00:00, 19.32s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:07<00:00,  7.60s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:14<00:00, 14.44s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:08<00:00,  8.49s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:24<00:00, 24.69s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:05<00:00,  5.33s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:09<00:00,  9.28s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:27<00:00, 27.49s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:04<00:00,  4.78s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:11<00:00, 11.44s/it]


{'faithfulness': 0.9000}


Evaluating: 100%|██████████| 1/1 [00:10<00:00, 10.45s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:18<00:00, 18.34s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:25<00:00, 25.33s/it]


{'faithfulness': 0.9231}


Evaluating: 100%|██████████| 1/1 [00:18<00:00, 18.13s/it]


{'faithfulness': 0.9286}


Evaluating: 100%|██████████| 1/1 [00:04<00:00,  4.14s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:20<00:00, 20.85s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:13<00:00, 13.84s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:12<00:00, 12.32s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:05<00:00,  5.14s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:10<00:00, 10.02s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:10<00:00, 10.84s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:14<00:00, 14.17s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:16<00:00, 16.28s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:23<00:00, 23.99s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:17<00:00, 17.60s/it]


{'faithfulness': 0.9286}


Evaluating: 100%|██████████| 1/1 [00:15<00:00, 15.46s/it]


{'faithfulness': 0.8182}


Evaluating: 100%|██████████| 1/1 [00:20<00:00, 20.09s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:20<00:00, 20.84s/it]


{'faithfulness': 0.9333}


Evaluating: 100%|██████████| 1/1 [00:16<00:00, 16.49s/it]


{'faithfulness': 0.9167}


Evaluating: 100%|██████████| 1/1 [00:21<00:00, 21.65s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:17<00:00, 17.86s/it]


{'faithfulness': 0.9286}


Evaluating: 100%|██████████| 1/1 [00:22<00:00, 22.72s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:16<00:00, 16.85s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:08<00:00,  8.23s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:25<00:00, 25.10s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:27<00:00, 27.18s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:21<00:00, 21.60s/it]


{'faithfulness': 0.9583}


Evaluating: 100%|██████████| 1/1 [00:18<00:00, 18.16s/it]


{'faithfulness': 0.8571}


Evaluating: 100%|██████████| 1/1 [00:27<00:00, 27.88s/it]


{'faithfulness': 0.9545}


Evaluating: 100%|██████████| 1/1 [00:08<00:00,  8.28s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:18<00:00, 18.08s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:21<00:00, 21.47s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:22<00:00, 22.28s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:22<00:00, 22.17s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:14<00:00, 14.50s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:24<00:00, 24.79s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:18<00:00, 18.26s/it]


{'faithfulness': 0.9333}


Evaluating: 100%|██████████| 1/1 [00:21<00:00, 21.16s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:11<00:00, 11.37s/it]


{'faithfulness': 0.9000}


Evaluating: 100%|██████████| 1/1 [00:18<00:00, 18.00s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:12<00:00, 12.32s/it]


{'faithfulness': 0.6667}


Evaluating: 100%|██████████| 1/1 [00:17<00:00, 17.61s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:13<00:00, 13.87s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:19<00:00, 19.89s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:18<00:00, 18.47s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:16<00:00, 16.94s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:19<00:00, 19.83s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:30<00:00, 30.01s/it]


{'faithfulness': 0.8125}


Evaluating: 100%|██████████| 1/1 [00:18<00:00, 18.77s/it]


{'faithfulness': 0.8750}


Evaluating: 100%|██████████| 1/1 [00:17<00:00, 17.33s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:27<00:00, 27.60s/it]


{'faithfulness': 0.8824}


Evaluating: 100%|██████████| 1/1 [00:19<00:00, 19.70s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:16<00:00, 16.01s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:15<00:00, 15.98s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:25<00:00, 25.21s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:18<00:00, 18.72s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:16<00:00, 16.21s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:17<00:00, 17.29s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:15<00:00, 15.77s/it]


{'faithfulness': 0.9091}


Evaluating: 100%|██████████| 1/1 [00:20<00:00, 20.90s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:24<00:00, 24.73s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:26<00:00, 26.32s/it]


{'faithfulness': 0.9333}


Evaluating: 100%|██████████| 1/1 [00:21<00:00, 21.49s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:21<00:00, 21.16s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:24<00:00, 24.20s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:20<00:00, 20.34s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:17<00:00, 17.93s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:14<00:00, 14.89s/it]


{'faithfulness': 0.8750}


Evaluating: 100%|██████████| 1/1 [00:12<00:00, 12.69s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:25<00:00, 25.89s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:21<00:00, 21.82s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:20<00:00, 20.42s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:29<00:00, 29.63s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:14<00:00, 14.48s/it]


{'faithfulness': 0.9000}


Evaluating: 100%|██████████| 1/1 [00:14<00:00, 14.97s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:27<00:00, 27.32s/it]


{'faithfulness': 0.9375}


Evaluating: 100%|██████████| 1/1 [00:17<00:00, 17.01s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:21<00:00, 21.84s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:23<00:00, 23.45s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:14<00:00, 14.90s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:21<00:00, 21.49s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:24<00:00, 24.04s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:14<00:00, 14.31s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:12<00:00, 12.30s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:19<00:00, 19.61s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:15<00:00, 15.94s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:33<00:00, 33.65s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:16<00:00, 16.08s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:15<00:00, 15.76s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:15<00:00, 15.33s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:12<00:00, 12.12s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:33<00:00, 33.64s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:16<00:00, 16.28s/it]


{'faithfulness': 0.8182}


Evaluating: 100%|██████████| 1/1 [00:17<00:00, 17.24s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:18<00:00, 18.40s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:10<00:00, 10.66s/it]


{'faithfulness': 0.8750}


Evaluating: 100%|██████████| 1/1 [00:26<00:00, 26.06s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:15<00:00, 15.35s/it]


{'faithfulness': 0.8182}


Evaluating: 100%|██████████| 1/1 [00:19<00:00, 19.54s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:20<00:00, 20.07s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:23<00:00, 23.02s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:04<00:00,  4.70s/it]


{'faithfulness': 0.3333}


Evaluating: 100%|██████████| 1/1 [00:04<00:00,  4.21s/it]


{'faithfulness': 1.0000}


Evaluating: 100%|██████████| 1/1 [00:04<00:00,  4.57s/it]

{'faithfulness': 1.0000}



