In [None]:
import numpy as np
import pandas as pd
import scipy.stats as stats

def perform_ttest(standard, hybrid, score_col, alpha=0.05):
    """Compare two translators' scores with an independent two-sample t-test.

    The ``score_col`` column is pulled from each table, missing values are
    dropped, and the two resulting samples are passed to
    ``scipy.stats.ttest_ind``. The t-statistic, the p-value and a verdict
    are printed; nothing is returned.

    Parameters
    ----------
    standard : pandas.DataFrame
        Score table of the standard translator; must contain ``score_col``.
    hybrid : pandas.DataFrame
        Score table of the hybrid translator; must contain ``score_col``.
    score_col : str
        Name of the column holding the scores to compare.
    alpha : float, optional
        Significance level the p-value is compared against (default 0.05).

    Raises
    ------
    KeyError
        If ``score_col`` is missing from either table.
    """
    # Drop missing scores so NaN entries do not poison the statistic.
    standard_scores = standard[score_col].dropna().to_numpy()
    hybrid_scores = hybrid[score_col].dropna().to_numpy()

    # Perform t-test to determine if the difference in scores is significant.
    # NOTE(review): called with scipy's defaults (independent samples) - confirm
    # this is the intended test if both files score the same test sentences.
    t, p = stats.ttest_ind(standard_scores, hybrid_scores)

    print("t-statistic: ", t)
    print("p-value: ", p)

    # A NaN p-value (e.g. an empty sample after dropna, or zero variance)
    # compares False against any alpha; without this guard the function would
    # wrongly report "no significant difference" for an undefined test.
    if np.isnan(p):
        print("t-test result is undefined (NaN), the null hypothesis cannot be evaluated.")
        return

    # Evaluate if the null hypothesis can be rejected based on the p-value
    if p < alpha:
        print("Null hypothesis rejected, significant difference between the two models.")
    else:
        print("Null hypothesis not rejected, no significant difference between the two models.")

In [None]:
# BLEU: compare the standard and hybrid translators in both directions.
# Each entry is (heading to print, standard-translator CSV, hybrid-translator CSV).
bleu_runs = [
    (
        "ILOKANO TO TAGALOG (BLEU):",
        '../src/scores/Ilokano to Tagalog/Standard Translator/test/test_bleu_il-tl.csv',
        '../src/scores/Ilokano to Tagalog/Hybrid Translator/test/test_bleu_il-tl.csv',
    ),
    (
        "\nTAGALOG TO ILOKANO (BLEU):",
        '../src/scores/Tagalog to Ilokano/Standard Translator/test/test_bleu_tl-il.csv',
        '../src/scores/Tagalog to Ilokano/Hybrid Translator/test/test_bleu_tl-il.csv',
    ),
]

for heading, standard_csv, hybrid_csv in bleu_runs:
    # Load both score tables first, then print the heading and the test result.
    standard = pd.read_csv(standard_csv)
    hybrid = pd.read_csv(hybrid_csv)
    print(heading)
    perform_ttest(standard, hybrid, 'BLEU_SCORE')

In [None]:
# TER: compare the standard and hybrid translators in both directions.
# Each entry is (heading to print, standard-translator CSV, hybrid-translator CSV).
ter_runs = [
    (
        "ILOKANO TO TAGALOG (TER):",
        '../src/scores/Ilokano to Tagalog/Standard Translator/test/test_ter_il-tl.csv',
        '../src/scores/Ilokano to Tagalog/Hybrid Translator/test/test_ter_il-tl.csv',
    ),
    (
        "\nTAGALOG TO ILOKANO (TER):",
        '../src/scores/Tagalog to Ilokano/Standard Translator/test/test_ter_tl-il.csv',
        '../src/scores/Tagalog to Ilokano/Hybrid Translator/test/test_ter_tl-il.csv',
    ),
]

for heading, standard_csv, hybrid_csv in ter_runs:
    # Load both score tables first, then print the heading and the test result.
    standard = pd.read_csv(standard_csv)
    hybrid = pd.read_csv(hybrid_csv)
    print(heading)
    perform_ttest(standard, hybrid, 'TER_SCORE')

In [None]:
# Load Rouge scores and compare the two translators on the F1_SCORE column.

# Ilokano -> Tagalog
standard = pd.read_csv('../src/scores/Ilokano to Tagalog/Standard Translator/test/test_rouge_il-tl.csv')
hybrid = pd.read_csv('../src/scores/Ilokano to Tagalog/Hybrid Translator/test/test_rouge_il-tl.csv')
print("ILOKANO TO TAGALOG (Rouge):")
perform_ttest(standard, hybrid, 'F1_SCORE')

# Tagalog -> Ilokano
standard = pd.read_csv('../src/scores/Tagalog to Ilokano/Standard Translator/test/test_rouge_tl-il.csv')
hybrid = pd.read_csv('../src/scores/Tagalog to Ilokano/Hybrid Translator/test/test_rouge_tl-il.csv')
# Heading previously read "(TER)" - a copy-paste slip; this cell reports Rouge.
print("\nTAGALOG TO ILOKANO (Rouge):")
perform_ttest(standard, hybrid, 'F1_SCORE')