In [None]:
import os

import pandas as pd
from evaluate import load

# Metric handles shared by every evaluation section below. They are loaded
# once, in this order: sacreBLEU, chrF, COMET.
bleu, chrf, cometm = (
    load("sacrebleu"),
    load("chrf"),
    load("comet"),
)

In [None]:
def compute_scores(preds, ref, sources=None):
    """
    Compute BLEU, chrF, chrF++ and COMET for one set of predictions.

    Args:
        preds: Iterable of hypothesis strings (list, pandas Series, ...).
        ref: Iterable of references aligned one-to-one with ``preds``. Each
            entry is handed unchanged to all three metrics, so it must be in
            a form every one of them accepts.
        sources: Iterable of source sentences aligned with ``preds``; only
            the COMET call uses it. When omitted, the notebook-level global
            ``src_sentences`` is used, which keeps existing two-argument
            calls working.

    Returns:
        Tuple ``(bleu_score, chrf_score, chrf2_score, comet_score)``:
          * ``bleu_score``  - ``"score"`` of the sacreBLEU metric.
          * ``chrf_score``  - ``"score"`` of the chrF metric with its
            default arguments.
          * ``chrf2_score`` - ``"score"`` of the chrF metric with
            ``char_order=6, word_order=2, beta=2`` (word bigrams enabled,
            i.e. the chrF++ configuration).
          * ``comet_score`` - ``"mean_score"`` of the COMET metric.

    Raises:
        ValueError: If predictions, references and sources differ in length.
    """
    if sources is None:
        # Backward-compatible fallback for callers that rely on the global
        # defined in the data-loading cells.
        sources = src_sentences

    # Materialise as plain lists so that a label-indexed pandas Series (for
    # example a filtered frame whose index no longer starts at 0) is never
    # indexed positionally by the metric implementations.
    preds = list(preds)
    ref = list(ref)
    sources = list(sources)

    if not (len(preds) == len(ref) == len(sources)):
        raise ValueError(
            "predictions, references and sources must have the same length; "
            f"got {len(preds)}, {len(ref)} and {len(sources)}"
        )

    bleu_score = bleu.compute(predictions=preds, references=ref)["score"]
    chrf_score = chrf.compute(predictions=preds, references=ref)["score"]
    chrf2_score = chrf.compute(
        predictions=preds, references=ref, char_order=6, word_order=2, beta=2
    )["score"]
    comet_score = cometm.compute(
        sources=sources, predictions=preds, references=ref
    )["mean_score"]
    return bleu_score, chrf_score, chrf2_score, comet_score

In [None]:
# Show the working directory: the CSV paths used below are relative to it.
# (`os` is imported with the other imports in the first cell.)
os.getcwd()

## T5 Punctuation Restoration

In [None]:
# Input CSV for this run and the label printed with its metrics.
file_name, mode = (
    "approach1_eng_to_eng_t5_outputs_punct_restor_data.csv",
    "t5_punct",
)

In [None]:
# Load this run's outputs and preview the first rows.
df = pd.read_csv(filepath_or_buffer=file_name)
df.head(n=5)

In [None]:
# Columns fed to the metrics: sources, references, predictions.
# `src_sentences` is also read as a global inside compute_scores.
src_sentences, ref_gem, translations = df['src'], df['gt'], df['prediction']

In [None]:
# Score this run's predictions against its references.
bleu_score, chrf_score, chrf2_score, comet_score = compute_scores(translations, ref_gem)

print(f"\n===== FINAL METRICS FOR '{mode}'=====")
# chrf_score comes from the chrf metric called with default arguments, so it
# is reported as chrF2; only chrf2_score (word_order=2) is the "++" variant.
print(f"BLEU: {bleu_score:.2f}, chrF2: {chrf_score:.2f}, chrF2++: {chrf2_score:.2f}, COMET: {comet_score:.4f}")

## T5 Seq-to-Seq

In [None]:
# Input CSV for this run and the label printed with its metrics.
file_name, mode = (
    "approach1_eng_to_eng_t5_outputs_mar_data.csv",
    "t5",
)

In [None]:
# Load this run's outputs and preview the first rows.
df = pd.read_csv(filepath_or_buffer=file_name)
df.head(n=5)

In [None]:
# Columns fed to the metrics: sources, references, predictions.
# `src_sentences` is also read as a global inside compute_scores.
src_sentences, ref_gem, translations = df['src'], df['gt'], df['prediction']

In [None]:
# Score this run's predictions against its references.
bleu_score, chrf_score, chrf2_score, comet_score = compute_scores(translations, ref_gem)

print(f"\n===== FINAL METRICS FOR '{mode}'=====")
# chrf_score comes from the chrf metric called with default arguments, so it
# is reported as chrF2; only chrf2_score (word_order=2) is the "++" variant.
print(f"BLEU: {bleu_score:.2f}, chrF2: {chrf_score:.2f}, chrF2++: {chrf2_score:.2f}, COMET: {comet_score:.4f}")

## IndicTrans2 Sentences Meant

In [None]:
# Input CSV for this run and the label printed with its metrics.
file_name, mode = (
    "sent_meant_outputs.csv",
    "original_meant",
)

In [None]:
# Load this run's outputs and preview the first rows.
df = pd.read_csv(filepath_or_buffer=file_name)
df.head(n=5)

In [None]:
# Columns fed to the metrics: sources, references, predictions.
# This file keeps its references in the 'gemini' column.
# `src_sentences` is also read as a global inside compute_scores.
src_sentences, ref_gem, translations = df['src'], df['gemini'], df['prediction']

In [None]:
# Score this run's predictions against its references.
bleu_score, chrf_score, chrf2_score, comet_score = compute_scores(translations, ref_gem)

print(f"\n===== FINAL METRICS FOR '{mode}'=====")
# chrf_score comes from the chrf metric called with default arguments, so it
# is reported as chrF2; only chrf2_score (word_order=2) is the "++" variant.
print(f"BLEU: {bleu_score:.2f}, chrF2: {chrf_score:.2f}, chrF2++: {chrf2_score:.2f}, COMET: {comet_score:.4f}")

## Cadence Approach1

In [None]:
# Input CSV for this run and the label printed with its metrics.
file_name, mode = (
    "cadence_outputs.csv",
    "cadence",
)

In [None]:
# Load this run's outputs and preview the first rows.
df = pd.read_csv(filepath_or_buffer=file_name)
df.head(n=5)

In [None]:
# Columns fed to the metrics: sources, references, predictions.
# This file uses the 'gt_mar' / 'prediction_mar' columns.
# `src_sentences` is also read as a global inside compute_scores.
src_sentences, ref_gem, translations = df['src'], df['gt_mar'], df['prediction_mar']

In [None]:
# Score this run's predictions against its references.
bleu_score, chrf_score, chrf2_score, comet_score = compute_scores(translations, ref_gem)

print(f"\n===== FINAL METRICS FOR '{mode}'=====")
# chrf_score comes from the chrf metric called with default arguments, so it
# is reported as chrF2; only chrf2_score (word_order=2) is the "++" variant.
print(f"BLEU: {bleu_score:.2f}, chrF2: {chrf_score:.2f}, chrF2++: {chrf2_score:.2f}, COMET: {comet_score:.4f}")

## Cadence Punctuation Restoration

In [None]:
# Input CSV for this run and the label printed with its metrics.
# NOTE(review): the T5 punctuation-restoration section labels its run
# "t5_punct", while this one uses "cadence_approach1" - confirm the label
# is the intended one.
file_name, mode = (
    "approach1_eng_to_eng_cadence_outputs_punct_restor_data.csv",
    "cadence_approach1",
)

In [None]:
# Load this run's outputs and preview the first rows.
df = pd.read_csv(filepath_or_buffer=file_name)
df.head(n=5)

In [None]:
# Columns fed to the metrics: sources, references, predictions.
# `src_sentences` is also read as a global inside compute_scores.
src_sentences, ref_gem, translations = df['src'], df['gt'], df['prediction']

In [None]:
# Score this run's predictions against its references.
bleu_score, chrf_score, chrf2_score, comet_score = compute_scores(translations, ref_gem)

print(f"\n===== FINAL METRICS FOR '{mode}'=====")
# chrf_score comes from the chrf metric called with default arguments, so it
# is reported as chrF2; only chrf2_score (word_order=2) is the "++" variant.
print(f"BLEU: {bleu_score:.2f}, chrF2: {chrf_score:.2f}, chrF2++: {chrf2_score:.2f}, COMET: {comet_score:.4f}")

## DeepSeek

In [None]:
# Input CSV for this run and the label printed with its metrics.
file_name, mode = (
    "shalaka_deepseek_outputs.csv",
    "deepseek",
)

In [None]:
# Load this run's outputs and preview the first rows.
df = pd.read_csv(filepath_or_buffer=file_name)
df.head(n=5)

In [None]:
# Columns fed to the metrics: sources, references, predictions.
# `src_sentences` is also read as a global inside compute_scores.
src_sentences, ref_gem, translations = df['src'], df['gt'], df['prediction']

In [None]:
# Score this run's predictions against its references.
bleu_score, chrf_score, chrf2_score, comet_score = compute_scores(translations, ref_gem)

print(f"\n===== FINAL METRICS FOR '{mode}'=====")
# chrf_score comes from the chrf metric called with default arguments, so it
# is reported as chrF2; only chrf2_score (word_order=2) is the "++" variant.
print(f"BLEU: {bleu_score:.2f}, chrF2: {chrf_score:.2f}, chrF2++: {chrf2_score:.2f}, COMET: {comet_score:.4f}")