# Hypothesis testing

This is the notebook matching the article from Medium

In [4]:
# Importing necessary libraries
import numpy as np
from scipy.stats import ttest_1samp

# Let's assume that we have a sample data from an experiment
data_sample = np.random.normal(loc=15, scale=5, size=50)

# We hypothesize that the population mean is 20
pop_mean = 20

# Perform one-sample t-test
t_statistic, p_value = ttest_1samp(data_sample, pop_mean)

print("T-statistic: ", t_statistic)
print("p-value: ", p_value)



T-statistic:  -8.257145435755701
p-value:  7.747297408014286e-11


## T-test

In [5]:
# Import necessary libraries
from scipy.stats import ttest_ind

# Assume we have data_samples from two different experiments
data_sample1 = np.random.normal(loc=15, scale=5, size=50)
data_sample2 = np.random.normal(loc=20, scale=5, size=50)

# Perform two-sample t-test
t_statistic, p_value = ttest_ind(data_sample1, data_sample2)

print("T-statistic: ", t_statistic)
print("p-value: ", p_value)


T-statistic:  -5.453678517395461
p-value:  3.698411563937544e-07


## F-test

In [6]:
# Import necessary libraries
import scipy.stats as stats

# Assume we have data_samples from two different experiments
data_sample1 = np.random.normal(loc=15, scale=5, size=50)
data_sample2 = np.random.normal(loc=20, scale=5, size=50)

# Perform F-test
F, p_value = stats.f_oneway(data_sample1, data_sample2)

print("F-statistic: ", F)
print("p-value: ", p_value)

F-statistic:  47.0998288015188
p-value:  6.156380980315648e-10


## Chi-squared test

In [7]:
# Import necessary libraries
from scipy.stats import chi2_contingency

# Assume we have a contingency table from a categorical dataset
contingency_table = np.array([[10, 20, 30], [20, 40, 60]])

# Perform Chi-squared test
chi2, p_value, dof, expected = chi2_contingency(contingency_table)

print("Chi-square statistic: ", chi2)
print("p-value: ", p_value)
print("Degrees of freedom: ", dof)
print("Expected contingency table: \n", expected)

Chi-square statistic:  0.0
p-value:  1.0
Degrees of freedom:  2
Expected contingency table: 
 [[10. 20. 30.]
 [20. 40. 60.]]
