## Student's t-test

In [1]:
from numpy.random import seed
from numpy.random import randn

# ttest_ind - Calculate the T-test for the means of two independent samples of scores.
from scipy.stats import ttest_ind

In [2]:
# Fix the state of NumPy's legacy global random generator so the draws
# below are the same on every fresh run.
seed(1)

# Two independent samples of 100 values each: standard-normal draws
# scaled by 5, then shifted to centres 50 and 51 respectively.
data1 = 50 + 5 * randn(100)
data2 = 51 + 5 * randn(100)

In [3]:
# Independent two-sample t-test on the means of data1 and data2.
# The result unpacks into the test statistic and its p-value.
stat, p = ttest_ind(a=data1, b=data2)
print('Statistics=%.3f, p=%.3f' % (stat, p))

Statistics=-2.262, p=0.025


In [4]:
# Significance level: H0 is kept (not rejected) only when p exceeds alpha.
# NOTE: the t-test's null hypothesis concerns the sample means, so the
# "distributions" wording in the messages is looser than what the test shows.
alpha = 0.05
print('Same distributions (fail to reject H0)' if p > alpha
      else 'Different distributions (reject H0)')

Different distributions (reject H0)


## Paired Student’s t-Test

In [5]:
# We may wish to compare the means of two data samples that are related in some way.
# For example, the samples may be two separate measurements or evaluations of the same
# objects (such as before and after a treatment), so the observations form natural pairs.

In [6]:
# ttest_rel - t-test on TWO RELATED (paired) samples of scores, a and b.
from scipy.stats import ttest_rel

# NOTE(review): data1 and data2 appear to be generated independently earlier
# in the notebook; the paired test is presumably applied here only to
# demonstrate the API - confirm that this is intended.
paired = ttest_rel(data1, data2)
stat, p = paired.statistic, paired.pvalue
print('Statistics=%.3f, p=%.3f' % (stat, p))

Statistics=-2.372, p=0.020


In [7]:
# Decision rule at the 5% significance level: fail to reject H0 only when
# the p-value is greater than alpha, otherwise reject it.
# NOTE: H0 for the t-test is about the means; the messages say "distributions".
alpha = 0.05
print(
    'Same distributions (fail to reject H0)'
    if p > alpha
    else 'Different distributions (reject H0)'
)

Different distributions (reject H0)


## ANOVA

In [8]:
# ANOVA is applied when we have multiple independent data samples.
# Three samples of 100 draws each, scaled by 5 and centred on 50, 50 and 52.
# No reseeding happens here, so the draws continue from the current state of
# the global random generator. data1 and data2 are overwritten.
data1, data2, data3 = (5 * randn(100) + centre for centre in (50, 50, 52))

In [9]:
# The one-way ANOVA tests the null hypothesis that two or more groups have the same population mean.
from scipy.stats import f_oneway
stat, p = f_oneway(data1, data2, data3)
print('Statistics=%.3f, p=%.3f' % (stat, p))

Statistics=6.812, p=0.001


In [10]:
# Interpret the p-value at the 5% significance level: H0 is kept only when
# p is greater than alpha.
# NOTE: the ANOVA null hypothesis is equality of population means; the
# messages below phrase the outcome in terms of "distributions".
alpha = 0.05
print('Same distributions (fail to reject H0)' if p > alpha
      else 'Different distributions (reject H0)')

Different distributions (reject H0)
