# t検定の所の検算

参考資料: 自然科学の統計学の6章

In [3]:
import numpy as np
import scipy.stats

In [4]:
# Sample a: a list of 0/1 observations (the first of the two samples
# compared in the tests below).
a = [
0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0,
0, 1, 1, 1, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0,
0, 0, 1, 0, 0, 0, 0, 1, 0, 0, 0, 1, 1, 0, 1, 0, 0, 0, 0, 0, 0, 1, 0,
1, 0, 0, 1, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 1, 0, 0, 0,
0, 0, 0, 0, 1, 0, 1, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 1, 0, 1, 0, 0, 0,
0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 1, 0, 0, 0, 0, 1,
0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 1, 0, 0, 1, 0, 0, 0, 0, 0, 1, 1,
0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 0, 1, 0, 0
]

In [5]:
# Sample b: a list of 0/1 observations (the second of the two samples
# compared in the tests below).
b = [
1, 1, 0, 0, 1, 0, 0, 1, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 1,
1, 0, 0, 1, 1, 0, 1, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 1, 1, 1, 0, 0,
0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0,
0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 1, 0, 1, 0, 0, 0, 1, 0,
0, 1, 1, 1, 0, 0, 0, 0, 1, 0, 0, 0, 0, 1, 1, 0, 1, 0, 0, 1, 0, 1, 0,
1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0,
0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 1, 0, 1, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0,
1, 0, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 1, 0, 0,
0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1,
0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 0, 1, 0, 0, 1,
0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 1, 0, 0, 0, 0, 0, 1, 0, 0, 1,
0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 1, 0, 0
]

## 2標本の検定統計量t

$\displaystyle
t = \sqrt{\frac{mn}{m + n}} \cdot \frac{\bar{X} - \bar{Y}}{s}
$

合成分散$s^2$を

$\displaystyle
s^2 = \frac{1}{m + n - 2}\left(\sum_{i=1}^{m}(X_i - \bar{X})^2 + \sum_{j=1}^{n}(Y_j - \bar{Y})^2\right)
$

とする

In [6]:
# Sample sizes and sample means of the two groups.
m, n = len(a), len(b)
a_bar, b_bar = np.mean(a), np.mean(b)
# Sum of squared deviations from the mean, per sample.
ss_a = np.sum((np.asarray(a) - a_bar)**2)
ss_b = np.sum((np.asarray(b) - b_bar)**2)
# Pooled standard deviation: square root of the pooled variance, which
# divides the combined sum of squares by m + n - 2.
s = np.sqrt((ss_a + ss_b)/(m + n - 2))

In [14]:
# Pooled standard deviation
s

0.40518933429649873

In [10]:
# Standard deviation of sample a on its own (np.std uses ddof=0 by default).
np.std(a)

0.39629455632370542

In [11]:
# Standard deviation of sample b on its own (np.std uses ddof=0 by default).
np.std(b)

0.40998245372970621

In [20]:
# Two-sample t statistic: the difference of the sample means divided by the
# pooled standard deviation, scaled by sqrt(mn / (m + n)).
scale = np.sqrt(m*n/(m + n))
t = scale*(a_bar - b_bar)/s
t

-0.50499426358366117

有意水準$\alpha$の時の両側検定の棄却域

$ |t| > t_{\alpha/2}(m + n - 2)$

t分布表から(自由度 $m + n - 2$ が十分大きいので、標準正規分布の値で近似)

$t_{0.025}(m + n - 2) \approx 1.96$


In [21]:
# Two-sided test at significance level alpha = 0.05: reject the null
# hypothesis when |t| exceeds the upper alpha/2 point of the t distribution
# with m + n - 2 degrees of freedom. The critical value is computed for the
# actual degrees of freedom instead of hard-coding 1.96, which is the
# standard normal (large-sample) value.
alpha = 0.05
t_crit = scipy.stats.t.ppf(1 - alpha/2, m + n - 2)
np.abs(t) > t_crit

False

により帰無仮説を棄却できない

## 二項分布の検定統計量

192ページの式

$\displaystyle
Z = \sqrt{\frac{mn}{m + n}} \cdot \frac{\hat{p}_1 - \hat{p}_2}{\sqrt{\hat{p}(1-\hat{p})}}
$

In [18]:
# Proportion of ones in each sample, and the pooled proportion over both
# samples combined.
p1, p2 = np.mean(a), np.mean(b)
p = (sum(a) + sum(b))/(m + n)
# Z statistic for the difference between the two sample proportions.
scale = np.sqrt(m*n/(m + n))
Z = scale*(p1 - p2)/np.sqrt(p*(1 - p))
Z

-0.50588673023427566

有意水準$\alpha$の時の両側検定の棄却域  
$
|Z| > z_{\alpha/2}
$

標準正規分布表から  
$
z_{0.025} = 1.96
$

In [19]:
# Two-sided test at significance level alpha = 0.05: reject the null
# hypothesis when |Z| exceeds the upper alpha/2 point of the standard normal
# distribution. The critical value (about 1.96) is derived from alpha
# instead of being hard-coded.
alpha = 0.05
z_crit = scipy.stats.norm.ppf(1 - alpha/2)
np.abs(Z) > z_crit

False

により、帰無仮説は棄却できない