https://zhuanlan.zhihu.com/p/147214759

In [102]:
import numpy as np
np.random.seed(43)

In [197]:
X = np.random.randn(10000)          # mean=0, std=1, 正态分布
Y = np.random.random(10000) * 10    # [0, 1) 均匀分布

In [198]:
a = 10.0
b = 5.0

# EX&DX性质总结
- 期望的性质
1. $E(a) = a, a \text { 是常数 }$
2. $E(X + b) = E(X) + b ， b \text { 是常数 }$
3. $E(a X) = a E(X)$
4. $E(a X + b) = a E(X) + b$
5. $E(a X + b Y) = a E(X) + b E(Y), a b \text{ 为常数 }$
    - $E \left(\sum_{i}^{n} a_{i} X \right) = \sum_{i}^{n} a_{i} E(X)$
6. $E(X + Y) = E(X) + E(Y)$
7. $E(X Y) = E(X) E(Y) + 2COV(X, Y)$
    - 协方差 $COV(X,Y) = E[(X - E(X))(Y - E(Y))] = E(XY) - E(X) * E(Y)$
    - $\text { 若X，Y相互独立，则 } E(X Y) = E(X) E(Y)$

- 方差的性质
1. $D(X) \geq 0 \text { 若 } a \text { 是常数,则 } D(a) = 0$
2. $D(X + b) = D(X)， b \text { 是常数 }$
3. $D(a X) = a^2 D(X), a \text{ 是常数 }$
4. $D(a X + b) = a^2 D(X), a b \text{ 为常数 }$
5. $D(a X + b Y) = a^2 D(X) + b^2 D(Y) + 2 a b E[(X - E(X))(Y - E(Y))]$
    - $ \text{ 若 } X,Y \text{ 相互独立，则 } D(a X + b Y) = a^2 D(X) + b^2 D(Y)$
6. $D(X + Y) = D(X) + D(Y) + 2E[(X - E(X))(Y - E(Y))]$
    - $ \text{ 若 } X,Y \text{ 相互独立，则 } D(X + Y) = D(X) + D(Y)$
7. $D(X) = E(X^2) - E^2(X)$
8. $D(\sum_{j=1}^t u_j) = \sum_{j=1}^t D(u_j), u_t \text{ 纯随机,服从正态分布的随机变量 }$
9. 没有 $D(XY)$ 相关性质

# EX 期望(均值)

## 期望的性质

### $E(a) = a, a \text { 是常数 }$

In [199]:
np.mean(a)

10.0

### $E(X + b) = E(X) + b ， b \text { 是常数 }$

In [200]:
np.mean(X + b), np.mean(X) + b

(5.001221492193753, 5.001221492193753)

In [201]:
np.mean(X + b) == np.mean(X) + b

True

### $E(a X) = a E(X)$

In [202]:
np.mean(a * X), a * np.mean(X)

(0.012214921937526392, 0.012214921937526374)

In [203]:
np.mean(a * X) == a * np.mean(X)

False

In [204]:
# 大致相等
np.allclose(np.mean(a * X), a * np.mean(X))

True

### $E(a X + b) = a E(X) + b$

In [205]:
np.mean(a * X + b), a * np.mean(X) + b

(5.0122149219375265, 5.0122149219375265)

In [206]:
np.mean(a * X + b) == a * np.mean(X) + b

True

### $E(a X + b Y) = a E(X) + b E(Y), a b \text{ 为常数 }$

$E \left(\sum_{i}^{n} a_{i} X \right) = \sum_{i}^{n} a_{i} E(X)$

In [207]:
np.mean(a * X + b * Y), a * np.mean(X) + b * np.mean(Y)

(25.095776703176515, 25.09577670317651)

In [208]:
np.mean(a * X + b * Y) == a * np.mean(X) + b * np.mean(Y)

False

In [209]:
np.allclose(np.mean(a * X + b * Y), a * np.mean(X) + b * np.mean(Y))

True

### $E(X + Y) = E(X) + E(Y)$

In [210]:
np.mean(X + Y), np.mean(X) + np.mean(Y)

(5.01793384844155, 5.017933848441549)

In [211]:
np.mean(X + Y) == np.mean(X) + np.mean(Y)

False

In [212]:
np.allclose(np.mean(X + Y), np.mean(X) + np.mean(Y))

True

### $E(X Y) = E(X) E(Y) + 2 COV(X, Y)$

#### 协方差 $COV(X,Y) = E[(X - E(X))(Y - E(Y))] = E(XY) - E(X) * E(Y)$

In [213]:
cov = np.mean(X * Y) - np.mean(X) * np.mean(Y)
cov

-0.023289086852909514

In [259]:
np.mean(X), np.mean(X) * np.mean(Y) + 2 * cov

(0.0012214921937526374, -0.04045029872435994)

In [260]:
np.mean(X) == np.mean(X) * np.mean(Y) + 2 * cov

False

In [261]:
np.allclose(np.mean(X), np.mean(X) * np.mean(Y) + 2 * cov, rtol=0.1, atol=0.1)

True

#### $\text { 若X，Y相互独立，则 } E(X Y) = E(X) E(Y)$

In [218]:
np.mean(X * Y), np.mean(X) * np.mean(Y)

(-0.017161211871450432, 0.006127874981459084)

In [219]:
np.mean(X * Y) == np.mean(X) * np.mean(Y)

False

In [222]:
# rtol: 相对宽容度
# atol: 绝对宽容度
np.allclose(np.mean(X * Y), np.mean(X) * np.mean(Y), rtol=0.1, atol=0.1)

True

# DX 方差

## 方差的性质

### $D(X) \geq 0 \text { 若 } a \text { 是常数,则 } D(a) = 0$

In [223]:
np.var(X), np.var(Y)

(1.0232594791727416, 8.324325298049954)

In [224]:
np.var(a)

0.0

### $D(X + b) = D(X)， b \text { 是常数 }$

In [225]:
np.var(X + b), np.var(X)

(1.0232594791727416, 1.0232594791727416)

In [226]:
np.var(X + b) == np.var(X)

True

### $D(a X) = a^2 D(X), a \text{ 是常数 }$

In [227]:
np.var(a * X), a ** 2 * np.var(X)

(102.32594791727415, 102.32594791727416)

In [228]:
np.var(a * X) == a ** 2 * np.var(X)

False

In [229]:
np.allclose(np.var(a * X), a ** 2 * np.var(X))

True

### $D(a X + b) = a^2 D(X), a b \text{ 为常数 }$

In [230]:
np.var(a * X + b), a ** 2 * np.var(X)

(102.32594791727414, 102.32594791727416)

In [231]:
np.var(a * X + b) == a ** 2 * np.var(X)

False

In [232]:
np.allclose(np.var(a * X + b), a ** 2 * np.var(X))

True

### $D(a X + b Y) = a^2 D(X) + b^2 D(Y) + 2 a b E[(X - E(X))(Y - E(Y))]$

In [233]:
np.var(a * X + b * Y), a ** 2 * np.var(X) + b ** 2 * np.var(Y) + 2 * a * b * np.mean((X - X.mean()) * (Y - Y.mean()))

(308.105171683232, 308.1051716832321)

In [234]:
np.var(a * X + b * Y) == a ** 2 * np.var(X) + b ** 2 * np.var(Y) + 2 * a * b * np.mean((X - X.mean()) * (Y - Y.mean()))

False

In [235]:
np.allclose(np.var(a * X + b * Y), a ** 2 * np.var(X) + b ** 2 * np.var(Y) + 2 * a * b * np.mean((X - X.mean()) * (Y - Y.mean())))

True

#### $ \text{ 若 } X,Y \text{ 相互独立，则 } D(a X + b Y) = a^2 D(X) + b^2 D(Y)$

In [236]:
np.var(a * X + b * Y), a ** 2 * np.var(X) + b ** 2 * np.var(Y)

(308.105171683232, 310.43408036852304)

In [237]:
np.var(a * X + b * Y) == a ** 2 * np.var(X) + b ** 2 * np.var(Y)

False

In [238]:
np.allclose(np.var(a * X + b * Y), a ** 2 * np.var(X) + b ** 2 * np.var(Y), rtol=0.01, atol=0.01)

True

### $D(X + Y) = D(X) + D(Y) + 2E[(X - E(X))(Y - E(Y))]$

In [244]:
np.var(X + Y), np.var(X) + np.var(Y) + 2 * np.mean((X - X.mean()) * (Y - Y.mean()))

(9.301006603516877, 9.301006603516877)

In [245]:
np.var(X + Y) == np.var(X) + np.var(Y) + 2 * np.mean((X - X.mean()) * (Y - Y.mean()))

True

#### $ \text{ 若 } X,Y \text{ 相互独立，则 } D(X + Y) = D(X) + D(Y)$

In [248]:
np.var(X + Y), np.var(X) + np.var(Y)

(9.301006603516877, 9.347584777222696)

In [264]:
np.var(X + Y) == np.var(X) + np.var(Y)

False

In [266]:
np.allclose(np.var(X + Y), np.var(X) + np.var(Y), rtol=0.01, atol=0.01)

True

### $D(X) = E(X^2) - E^2(X)$

In [258]:
np.var(X) == np.mean(X ** 2) - np.mean(X) ** 2

True

### $D(\sum_{j=1}^t u_j) = \sum_{j=1}^t D(u_j), u_t \text{ 纯随机,服从正态分布的随机变量 }$

### 没有 $D(XY)$ 相关性质