# Median testing (Mann-Whitney U test)

In [1]:
import numpy as np
from scipy import stats
import random

# Seed both generators: the synthetic samples in this notebook are drawn with
# np.random, which random.seed() alone does not affect.
random.seed(42)
np.random.seed(42)

def significant_improvement(before_mean_wer, after_mean_wer, sample_size, *,
                            std=0.1, alpha=0.05, alternative='two-sided',
                            rng=None):
    """Simulate two WER samples and compare them with a Mann-Whitney U test.

    The test is run on synthetic data: two normally distributed samples are
    drawn around the given means, so the p-value describes the simulated
    draws rather than any real per-utterance measurements.

    Args:
        before_mean_wer: Mean of the simulated "before" sample.
        after_mean_wer: Mean of the simulated "after" sample.
        sample_size: Number of values drawn for each sample.
        std: Standard deviation used for both simulated samples.
        alpha: Significance threshold; the result is significant when
            ``p_value < alpha``.
        alternative: Passed to ``scipy.stats.mannwhitneyu``. The default
            ``'two-sided'`` detects a difference in either direction, so a
            regression is also reported as significant; use ``'greater'``
            to test only whether the "before" values tend to exceed the
            "after" values.
        rng: Optional object with a ``normal(loc, scale, size)`` method
            (e.g. ``np.random.RandomState`` or ``np.random.Generator``).
            When omitted, NumPy's global ``np.random`` state is used.

    Returns:
        A ``(is_significant, p_value)`` tuple.
    """
    # Fall back to the module-level generator so existing callers keep
    # drawing from the global NumPy random state.
    sampler = np.random if rng is None else rng
    before_data = sampler.normal(before_mean_wer, std, sample_size)
    after_data = sampler.normal(after_mean_wer, std, sample_size)

    # Mann-Whitney U test; only the p-value is needed.
    _, p_value = stats.mannwhitneyu(before_data, after_data,
                                    alternative=alternative)

    return bool(p_value < alpha), p_value

# Inputs: mean WER before and after the change, and the number of values
# simulated for each of the two samples.
before_mean_wer, after_mean_wer = 0.7440860951, 0.7281820568
sample_size = 3033

# Run the significance check and report the verdict with its p-value.
is_significant, p_value = significant_improvement(
    before_mean_wer,
    after_mean_wer,
    sample_size,
)
print("Is the improvement statistically significant?", is_significant)
print("p-value:", p_value)

Is the improvement statistically significant? True
p-value: 7.297398609830172e-19


# Welch's t-test

In [5]:
import numpy as np
from scipy.stats import ttest_ind

def significant_improvement(before_mean_wer, after_mean_wer, sample_size, *,
                            std=0.1, alpha=0.05, alternative='two-sided',
                            rng=None):
    """Simulate two WER samples and compare them with Welch's t-test.

    The test is run on synthetic data: two normally distributed samples are
    drawn around the given means, so the p-value describes the simulated
    draws rather than any real per-utterance measurements.

    Args:
        before_mean_wer: Mean of the simulated "before" sample.
        after_mean_wer: Mean of the simulated "after" sample.
        sample_size: Number of values drawn for each sample.
        std: Standard deviation used for both simulated samples.
        alpha: Significance threshold; the result is significant when
            ``p_value < alpha``.
        alternative: Passed to ``scipy.stats.ttest_ind``. The default
            ``'two-sided'`` detects a difference in either direction, so a
            regression is also reported as significant; use ``'greater'``
            to test only whether the "before" mean exceeds the "after" mean.
        rng: Optional object with a ``normal(loc, scale, size)`` method
            (e.g. ``np.random.RandomState`` or ``np.random.Generator``).
            When omitted, NumPy's global ``np.random`` state is used.

    Returns:
        A ``(is_significant, p_value)`` tuple.
    """
    # Fall back to the module-level generator so existing callers keep
    # drawing from the global NumPy random state.
    sampler = np.random if rng is None else rng
    before_data = sampler.normal(before_mean_wer, std, sample_size)
    after_data = sampler.normal(after_mean_wer, std, sample_size)

    # equal_var=False selects Welch's variant, which does not assume the
    # two samples share a variance; only the p-value is needed.
    _, p_value = ttest_ind(before_data, after_data, equal_var=False,
                           alternative=alternative)

    return bool(p_value < alpha), p_value

# Inputs: mean WER before and after the change, and the number of values
# simulated for each of the two samples.
before_mean_wer, after_mean_wer = 0.7440860951, 0.7281820568
sample_size = 3033

# Run the significance check and report the verdict with its p-value.
is_significant, p_value = significant_improvement(
    before_mean_wer,
    after_mean_wer,
    sample_size,
)
print("Is the improvement statistically significant?", is_significant)
print("p-value:", p_value)

Is the improvement statistically significant? True
p-value: 6.383152395752732e-10
