https://zhuanlan.zhihu.com/p/147214759

In [59]:
import numpy as np
np.random.seed(43)

In [60]:
X = np.random.randn(10000)          # mean=0, std=1, 正态分布
Y = np.random.random(10000) * 10    # [0, 1) 均匀分布

In [61]:
a = 10.0
b = 5.0

# EX&DX性质总结
- 期望的性质
1. $E(a) = a, a \text { 是常数 }$
2. $E(X + b) = E(X) + b ， b \text { 是常数 }$
3. $E(a X) = a E(X)$
4. $E(a X + b) = a E(X) + b$
5. $E(a X + b Y) = a E(X) + b E(Y), a b \text{ 为常数 }$
    - $E \left(\sum_{i}^{n} a_{i} X \right) = \sum_{i}^{n} a_{i} E(X)$
6. $E(X + Y) = E(X) + E(Y)$
7. $E(X Y) = E(X) E(Y) + 2COV(X, Y)$
    - 协方差 $COV(X,Y) = E\{[X - E(X)][Y - E(Y)]\} = E(XY) - E(X) \times E(Y)$
    - $\text { 若X，Y相互独立，则 } E(X Y) = E(X) E(Y)$

- 方差的性质
1. $D(X) \geq 0 \text { 若 } a \text { 是常数,则 } D(a) = 0$
2. $D(X + b) = D(X)， b \text { 是常数 }$
3. $D(a X) = a^2 D(X), a \text{ 是常数 }$
4. $D(a X + b) = a^2 D(X), a b \text{ 为常数 }$
5. $D(a X + b Y) = a^2 D(X) + b^2 D(Y) + 2 a b COV(X, Y)$
    - 协方差 $COV(X,Y) = E\{[X - E(X)][Y - E(Y)]\} = E(XY) - E(X) \times E(Y)$
    - $ \text{ 若 } X,Y \text{ 相互独立，则 } D(a X + b Y) = a^2 D(X) + b^2 D(Y)$
6. $D(X + Y) = D(X) + D(Y) + 2E\{[X - E(X)][Y - E(Y)]\}$
    - $ \text{ 若 } X,Y \text{ 相互独立，则 } D(X + Y) = D(X) + D(Y)$
7. $D(X) = E(X^2) - E^2(X)$
8. $D(\sum_{j=1}^t u_j) = \sum_{j=1}^t D(u_j), u_t \text{ 纯随机,服从正态分布的随机变量 }$
9. 没有 $D(XY)$ 相关性质

# EX 期望(均值)

## 期望的性质

### $E(a) = a, a \text { 是常数 }$

In [62]:
np.mean(a)

10.0

### $E(X + b) = E(X) + b ， b \text { 是常数 }$

In [63]:
np.mean(X + b), np.mean(X) + b

(5.0140830945091786, 5.0140830945091786)

In [64]:
np.mean(X + b) == np.mean(X) + b

True

### $E(a X) = a E(X)$

In [65]:
np.mean(a * X), a * np.mean(X)

(0.14083094509178293, 0.1408309450917829)

In [66]:
np.mean(a * X) == a * np.mean(X)

False

In [67]:
# 大致相等
np.allclose(np.mean(a * X), a * np.mean(X))

True

### $E(a X + b) = a E(X) + b$

In [68]:
np.mean(a * X + b), a * np.mean(X) + b

(5.140830945091783, 5.140830945091783)

In [69]:
np.mean(a * X + b) == a * np.mean(X) + b

True

### $E(a X + b Y) = a E(X) + b E(Y), a b \text{ 为常数 }$

$E \left(\sum_{i}^{n} a_{i} X \right) = \sum_{i}^{n} a_{i} E(X)$

In [70]:
np.mean(a * X + b * Y), a * np.mean(X) + b * np.mean(Y)

(25.125891022750235, 25.125891022750235)

In [71]:
np.mean(a * X + b * Y) == a * np.mean(X) + b * np.mean(Y)

True

In [72]:
np.allclose(np.mean(a * X + b * Y), a * np.mean(X) + b * np.mean(Y))

True

### $E(X + Y) = E(X) + E(Y)$

In [73]:
np.mean(X + Y), np.mean(X) + np.mean(Y)

(5.011095110040868, 5.011095110040869)

In [74]:
np.mean(X + Y) == np.mean(X) + np.mean(Y)

False

In [75]:
np.allclose(np.mean(X + Y), np.mean(X) + np.mean(Y))

True

### $E(X Y) = E(X) E(Y) + 2 COV(X, Y)$

#### 协方差 $COV(X,Y) = E\{[X - E(X)][Y - E(Y)]\} = E(XY) - E(X) \times E(Y)$

In [76]:
cov = np.mean((X - X.mean()) * (Y - Y.mean()))
cov

0.004135824610083393

In [77]:
np.mean(X), np.mean(X) * np.mean(Y) + 2 * cov

(0.014083094509178289, 0.07864504169839906)

In [78]:
np.mean(X) == np.mean(X) * np.mean(Y) + 2 * cov

False

In [79]:
np.allclose(np.mean(X), np.mean(X) * np.mean(Y) + 2 * cov, rtol=0.1, atol=0.1)

True

#### $\text { 若X，Y相互独立，则 } E(X Y) = E(X) E(Y)$

In [80]:
np.mean(X * Y), np.mean(X) * np.mean(Y)

(0.07450921708831569, 0.07037339247823228)

In [81]:
np.mean(X * Y) == np.mean(X) * np.mean(Y)

False

In [82]:
# rtol: 相对宽容度
# atol: 绝对宽容度
np.allclose(np.mean(X * Y), np.mean(X) * np.mean(Y), rtol=0.1, atol=0.1)

True

# DX 方差

## 方差的性质

### $D(X) \geq 0 \text { 若 } a \text { 是常数,则 } D(a) = 0$

In [83]:
np.var(X), np.var(Y)

(0.9994648094252013, 8.327295546421892)

In [84]:
np.var(a)

0.0

### $D(X + b) = D(X)， b \text { 是常数 }$

In [85]:
np.var(X + b), np.var(X)

(0.9994648094252013, 0.9994648094252013)

In [86]:
np.var(X + b) == np.var(X)

True

### $D(a X) = a^2 D(X), a \text{ 是常数 }$

In [87]:
np.var(a * X), a ** 2 * np.var(X)

(99.94648094252013, 99.94648094252014)

In [88]:
np.var(a * X) == a ** 2 * np.var(X)

False

In [89]:
np.allclose(np.var(a * X), a ** 2 * np.var(X))

True

### $D(a X + b) = a^2 D(X), a b \text{ 为常数 }$

In [90]:
np.var(a * X + b), a ** 2 * np.var(X)

(99.94648094252013, 99.94648094252014)

In [91]:
np.var(a * X + b) == a ** 2 * np.var(X)

False

In [92]:
np.allclose(np.var(a * X + b), a ** 2 * np.var(X))

True

### $D(a X + b Y) = a^2 D(X) + b^2 D(Y) + 2 a b COV(X, Y)$

#### 协方差 $COV(X,Y) = E\{[X - E(X)][Y - E(Y)]\} = E(XY) - E(X) \times E(Y)$

In [93]:
cov = np.mean((X - X.mean()) * (Y - Y.mean()))
cov

0.004135824610083393

In [94]:
np.var(a * X + b * Y), a ** 2 * np.var(X) + b ** 2 * np.var(Y) + 2 * a * b * cov

(308.5424520640758, 308.54245206407575)

In [95]:
np.var(a * X + b * Y) == a ** 2 * np.var(X) + b ** 2 * np.var(Y) + 2 * a * b * cov

False

In [96]:
np.allclose(np.var(a * X + b * Y), a ** 2 * np.var(X) + b ** 2 * np.var(Y) + 2 * a * b * cov)

True

#### $ \text{ 若 } X,Y \text{ 相互独立，则 } D(a X + b Y) = a^2 D(X) + b^2 D(Y)$

In [97]:
np.var(a * X + b * Y), a ** 2 * np.var(X) + b ** 2 * np.var(Y)

(308.5424520640758, 308.1288696030674)

In [98]:
np.var(a * X + b * Y) == a ** 2 * np.var(X) + b ** 2 * np.var(Y)

False

In [99]:
np.allclose(np.var(a * X + b * Y), a ** 2 * np.var(X) + b ** 2 * np.var(Y), rtol=0.01, atol=0.01)

True

### $D(X + Y) = D(X) + D(Y) + 2E\{[X - E(X)][Y - E(Y)]\}$

In [100]:
np.var(X + Y), np.var(X) + np.var(Y) + 2 * np.mean((X - X.mean()) * (Y - Y.mean()))

(9.335032005067262, 9.33503200506726)

In [101]:
np.var(X + Y) == np.var(X) + np.var(Y) + 2 * np.mean((X - X.mean()) * (Y - Y.mean()))

False

#### $ \text{ 若 } X,Y \text{ 相互独立，则 } D(X + Y) = D(X) + D(Y)$

In [102]:
np.var(X + Y), np.var(X) + np.var(Y)

(9.335032005067262, 9.326760355847094)

In [103]:
np.var(X + Y) == np.var(X) + np.var(Y)

False

In [104]:
np.allclose(np.var(X + Y), np.var(X) + np.var(Y), rtol=0.01, atol=0.01)

True

### $D(X) = E(X^2) - E^2(X)$

In [105]:
np.var(X) == np.mean(X ** 2) - np.mean(X) ** 2

True

### $D(\sum_{j=1}^t u_j) = \sum_{j=1}^t D(u_j), u_t \text{ 纯随机,服从正态分布的随机变量 }$

### 没有 $D(XY)$ 相关性质