In [1]:
import pandas as pd
from rouge_score import rouge_scorer

In [4]:
# Workbook locations: the input sheet holds each interview next to its
# candidate summaries; the output sheet receives the per-row ROUGE scores.
input_excel = "entrevistas_com_sumarios.xlsx"
output_excel = "metricas_rouge.xlsx"

# Load the input workbook into a DataFrame (one row per interview).
df = pd.read_excel(input_excel)

# One scorer instance is shared by every comparison below. It reports the
# unigram (rouge1), bigram (rouge2) and longest-common-subsequence (rougeL)
# variants.
# NOTE(review): use_stemmer=True enables rouge_score's Porter stemmer, which
# is designed for English; the column names suggest Portuguese text, so
# confirm that stemming is actually wanted here.
# NOTE(review): the default rouge_score tokenizer is believed to keep only
# ASCII letters and digits, which would split accented words; verify
# against the installed version before trusting absolute score values.
scorer = rouge_scorer.RougeScorer(
    rouge_types=['rouge1', 'rouge2', 'rougeL'],
    use_stemmer=True,
)
def calcular_rouge(referencia, hipotese):
    """Score one candidate text against a reference text with ROUGE.

    Args:
        referencia: Reference text; forwarded to ``scorer.score`` as the
            first (target) argument.
        hipotese: Candidate text; forwarded to ``scorer.score`` as the
            second (prediction) argument.

    Returns:
        dict: Keys ``'ROUGE1'``, ``'ROUGE2'`` and ``'ROUGEL'`` (in that
        order), each holding the F-measure of the corresponding ROUGE
        variant. If either input is not a ``str`` (for example the float
        NaN that pandas yields for an empty spreadsheet cell), every value
        is NaN instead of raising, so a single blank cell does not abort a
        whole batch.
    """
    # Output key -> key used by the scorer's result mapping.
    metric_keys = {'ROUGE1': 'rouge1', 'ROUGE2': 'rouge2', 'ROUGEL': 'rougeL'}

    # Guard first: the scorer tokenizes its inputs as text, so anything that
    # is not a string (None, NaN, numbers) cannot be scored.
    if not (isinstance(referencia, str) and isinstance(hipotese, str)):
        return {name: float('nan') for name in metric_keys}

    scores = scorer.score(referencia, hipotese)
    return {name: scores[key].fmeasure for name, key in metric_keys.items()}
# Summary column in the input sheet -> label used as the suffix of the
# output column names. Insertion order fixes the output column order.
colunas_modelos = {
    'Sum ChatGPT': 'ChatGPT',
    'Sum Deepseek': 'DeepSeek',
    'Sum meu modelo': 'LAN_T5',
}
# Metric keys returned by calcular_rouge, in output-column order.
metricas = ('ROUGE1', 'ROUGE2', 'ROUGEL')

resultados = []
for _, row in df.iterrows():
    referencia = row['Entrevista']

    # Short preview of the interview so each output row can be identified.
    # An empty 'Entrevista' cell is read as NaN (a float) and cannot be
    # sliced, so the preview falls back to an empty string in that case.
    if isinstance(referencia, str):
        previa = referencia[:100] + "..."
    else:
        previa = ""

    linha = {'Texto_Original': previa}
    # Every model's summary is scored against the same interview text.
    for coluna, modelo in colunas_modelos.items():
        pontuacoes = calcular_rouge(referencia, row[coluna])
        for metrica in metricas:
            linha[f'{metrica}_{modelo}'] = pontuacoes[metrica]
    resultados.append(linha)

# Build the frame once from the collected records, then persist it.
df_resultados = pd.DataFrame(resultados)
df_resultados.to_excel(output_excel, index=False)

print(f"✅ Métricas ROUGE calculadas e salvas em {output_excel}")

✅ Métricas ROUGE calculadas e salvas em metricas_rouge.xlsx


In [5]:
# Reload the per-row scores from the metrics workbook so this cell can be
# run on its own.
df2 = pd.read_excel('metricas_rouge.xlsx')

# Score columns are named '<metric>_<model>' and listed grouped by model.
rouge_columns = [
    f'{metrica}_{modelo}'
    for modelo in ('ChatGPT', 'DeepSeek', 'LAN_T5')
    for metrica in ('ROUGE1', 'ROUGE2', 'ROUGEL')
]

# Column-wise average over all rows.
rouge_means = df2[rouge_columns].mean()

print("Médias das métricas ROUGE:")
print(rouge_means)

Médias das métricas ROUGE:
ROUGE1_ChatGPT     0.161937
ROUGE2_ChatGPT     0.074780
ROUGEL_ChatGPT     0.111989
ROUGE1_DeepSeek    0.111575
ROUGE2_DeepSeek    0.044420
ROUGEL_DeepSeek    0.080039
ROUGE1_LAN_T5      0.080683
ROUGE2_LAN_T5      0.066590
ROUGEL_LAN_T5      0.076841
dtype: float64
