In [69]:
import numpy as np
np.__version__

'1.20.1'

In [70]:
np?

# 一、创建数组

## 1.创建数组

**ndarray类型数组要求其内每个item保持统一类型，不满足则会向上转换，如
整型被转换为浮点型**

In [71]:
np.array([3.14, 4, 2, 3])

array([3.14, 4.  , 2.  , 3.  ])

**用dtype关键字明确指出数组类型**

In [72]:
np.array([1, 2, 3, 4], dtype='float32')

array([1., 2., 3., 4.], dtype=float32)

**多维数组**

In [73]:
np.array([range(i, i+3) for i in [2, 4, 6]])

array([[2, 3, 4],
       [4, 5, 6],
       [6, 7, 8]])

## 2.从头创建数组

In [74]:
np.zeros(10, dtype=int)

array([0, 0, 0, 0, 0, 0, 0, 0, 0, 0])

In [75]:
np.ones((3, 5), dtype=float)

array([[1., 1., 1., 1., 1.],
       [1., 1., 1., 1., 1.],
       [1., 1., 1., 1., 1.]])

In [76]:
np.full((3, 5), 3.14)

array([[3.14, 3.14, 3.14, 3.14, 3.14],
       [3.14, 3.14, 3.14, 3.14, 3.14],
       [3.14, 3.14, 3.14, 3.14, 3.14]])

In [77]:
np.arange(0, 20, 2)

array([ 0,  2,  4,  6,  8, 10, 12, 14, 16, 18])

In [78]:
np.linspace(0, 1, 5)

array([0.  , 0.25, 0.5 , 0.75, 1.  ])

In [79]:
np.random.random((3, 3))

array([[0.65279032, 0.63505887, 0.99529957],
       [0.58185033, 0.41436859, 0.4746975 ],
       [0.6235101 , 0.33800761, 0.67475232]])

**均值为0方差为1的正态分布随机数组**

In [80]:
np.random.normal(0, 1, (3, 3))

array([[ 1.0657892 , -0.69993739,  0.14407911],
       [ 0.3985421 ,  0.02686925,  1.05583713],
       [-0.07318342, -0.66572066, -0.04411241]])

**[0, 10)区间的随机整数数组**

In [81]:
np.random.randint(0, 10, (3, 3))

array([[7, 2, 9],
       [2, 3, 3],
       [2, 3, 4]])

**单位矩阵**

In [82]:
np.eye(3)

array([[1., 0., 0.],
       [0., 1., 0.],
       [0., 0., 1.]])

**创建一个由3个浮点数组成的未初始化的数组（np.empty默认dtype为float64，数组的值是内存中原有的任意内容）**

In [83]:
np.empty(3)

array([1., 1., 1.])

# 二、Numpy数据基础

## 1.Numpy数组的属性

**设置一组种子值，以保证每次程序执行时生成同样的随机数组**

In [84]:
np.random.seed(0) # seed NumPy's global random generator

x1 = np.random.randint(10, size=6) # one-dimensional array
x2 = np.random.randint(10, size=(3, 4)) # two-dimensional array
x3 = np.random.randint(10, size=(3, 4, 5)) # three-dimensional array

In [85]:
print("x3 ndim:", x3.ndim)
print("x3 shape", x3.shape)
print("x3 size", x3.size)

x3 ndim: 3
x3 shape (3, 4, 5)
x3 size 60


In [86]:
print("dtype:", x3.dtype)

dtype: int64


In [87]:
print("itemsize", x3.itemsize, "bytes")
print("nbytes:", x3.nbytes, "bytes")
# total bytes = itemsize * size = 8 * 60

itemsize 8 bytes
nbytes: 480 bytes


## 2.数组的索引：获取单个元素

In [88]:
x1

array([5, 0, 3, 3, 7, 9])

In [89]:
x1[0]

5

In [90]:
x1[-1]

9

In [91]:
x2

array([[3, 5, 2, 4],
       [7, 6, 8, 8],
       [1, 6, 7, 7]])

In [92]:
x2[2, 0] # third row, first column (indices are zero-based)

1

In [93]:
x2[0, 0] = 12
x2

array([[12,  5,  2,  4],
       [ 7,  6,  8,  8],
       [ 1,  6,  7,  7]])

**Numpy数组为固定类型，若将float插入int类型的数组，会导致浮点型  
被截断为整型**

In [94]:
x1

array([5, 0, 3, 3, 7, 9])

In [95]:
x1[0] = 3.14159
x1

array([3, 0, 3, 3, 7, 9])

## 3.数组切片：获取子数组

**x[start: stop: step], step可省略**

### 3.1 一维子数组

In [96]:
x = np.arange(10)

In [97]:
x

array([0, 1, 2, 3, 4, 5, 6, 7, 8, 9])

In [98]:
x[:5] # first five elements

array([0, 1, 2, 3, 4])

In [99]:
x[5:] # elements from index 5 onward (index 5 itself is included)

array([5, 6, 7, 8, 9])

In [100]:
x[4:7]

array([4, 5, 6])

In [101]:
x[::2] # every second element, starting at index 0

array([0, 2, 4, 6, 8])

In [102]:
x[1::2] # every second element, starting at index 1

array([1, 3, 5, 7, 9])

**step为负值时，start参数和stop参数的默认值会被交换**

In [103]:
x

array([0, 1, 2, 3, 4, 5, 6, 7, 8, 9])

In [104]:
x[::-1]

array([9, 8, 7, 6, 5, 4, 3, 2, 1, 0])

In [105]:
x[5::-2] # every second element in reverse order, starting at index 5

array([5, 3, 1])

### 3.2 多维子数组

In [106]:
x2

array([[12,  5,  2,  4],
       [ 7,  6,  8,  8],
       [ 1,  6,  7,  7]])

In [107]:
x2[:2, :3] # first two rows, first three columns

array([[12,  5,  2],
       [ 7,  6,  8]])

In [108]:
x2[:3, ::2] # first three rows, every second column

array([[12,  2],
       [ 7,  8],
       [ 1,  7]])

In [109]:
x2[::-1, ::-1] # sub-array with both the row order and the column order reversed

array([[ 7,  7,  6,  1],
       [ 8,  8,  6,  7],
       [ 4,  2,  5, 12]])

### 3.3 获取数组的行和列

In [110]:
x2

array([[12,  5,  2,  4],
       [ 7,  6,  8,  8],
       [ 1,  6,  7,  7]])

In [111]:
print("x2的第一列", x2[:, 0])

x2的第一列 [12  7  1]


In [112]:
print("x2的第一行：", x2[0, :])

x2的第一行： [12  5  2  4]


**可省略空的切片**

In [113]:
print(x2[0]) #equal to x2[0, :]

[12  5  2  4]


### 3.4非副本视图的子数组

一般情况下，数组切片返回的是数组数据的视图，而普通Python列表  
切片返回的是副本

In [114]:
print(x2)

[[12  5  2  4]
 [ 7  6  8  8]
 [ 1  6  7  7]]


In [115]:
x2_sub = x2[:2, :2]
print(x2_sub)

[[12  5]
 [ 7  6]]


**如果修改x2_sub，则x2也被修改了**

In [116]:
x2_sub[0, 0] = 99
print(x2_sub)

[[99  5]
 [ 7  6]]


In [117]:
print(x2)

[[99  5  2  4]
 [ 7  6  8  8]
 [ 1  6  7  7]]


### 3.5创建数组的副本

In [118]:
x2_sub_copy = x2[:2, :2].copy()
print(x2_sub_copy)

[[99  5]
 [ 7  6]]


**修改子数组的副本时，原始的数组不会改变**

In [119]:
x2_sub_copy[0, 0] = 42
print(x2_sub_copy)
print(x2_sub)
print(x2)

[[42  5]
 [ 7  6]]
[[99  5]
 [ 7  6]]
[[99  5  2  4]
 [ 7  6  8  8]
 [ 1  6  7  7]]


## 4.数组的变形

**最简单的方式通过reshape实现**

In [120]:
grid = np.arange(1, 10).reshape((3, 3))
print(grid)

[[1 2 3]
 [4 5 6]
 [7 8 9]]


**将一维数组变成二维的行或列矩阵**

In [121]:
x = np.array([1, 2, 3])

In [122]:
# Row vector (shape (1, 3)) obtained via reshape
x.reshape((1, 3))

array([[1, 2, 3]])

In [123]:
# Row vector obtained by inserting a new leading axis with np.newaxis
x[np.newaxis, : ]

array([[1, 2, 3]])

In [124]:
# Column vector (shape (3, 1)) obtained via reshape
x.reshape((3, 1))

array([[1],
       [2],
       [3]])

In [125]:
# Column vector obtained by adding a trailing axis with np.newaxis;
# only its shape is displayed here
x[:, np.newaxis].shape

(3, 1)

## 5.数组的拼接和分裂

### 5.1数组的拼接

**np.concatenate, np.vstack, np.hstack**

**一维数组的拼接**

In [126]:
x = np.array([1, 2, 3])
y = np.array([3, 2, 1])
np.concatenate([x, y])

array([1, 2, 3, 3, 2, 1])

In [127]:
z = [99, 99, 99]
print(np.concatenate([x, y, z]))

[ 1  2  3  3  2  1 99 99 99]


**二维数组的拼接**

In [128]:
grid = np.array([[1, 2, 3],
                 [4, 5, 6]])

In [129]:
# Concatenate along the first axis (axis=0 is the default)
np.concatenate([grid, grid])

array([[1, 2, 3],
       [4, 5, 6],
       [1, 2, 3],
       [4, 5, 6]])

In [130]:
# Concatenate along the second axis (axis=1)
np.concatenate([grid, grid], axis=1)

array([[1, 2, 3, 1, 2, 3],
       [4, 5, 6, 4, 5, 6]])

**沿固定维度处理数组时，使用np.vstack(垂直栈), np.hstack(水平栈)**

In [131]:
# Vertically stack a 1-D array on top of a 2-D array
x = np.array([1, 2, 3])
grid = np.array([[9, 8, 7],
                 [6, 5, 4]])
np.vstack([x, grid])

array([[1, 2, 3],
       [9, 8, 7],
       [6, 5, 4]])

In [132]:
# Horizontally stack: append the two-row, one-column array y to the right of grid
y = np.array([[99],
             [99]])
np.hstack([grid, y])

array([[ 9,  8,  7, 99],
       [ 6,  5,  4, 99]])

与之类似的是，np.dstack将沿着第三个维度拼接数组

### 5.2 数组的分裂

**np.split, np.hsplit, np.vsplit**

向np.split传入一个索引列表作为参数，用来指定分裂点的位置

In [133]:
# Split at indices 3 and 5, giving three pieces: x[:3], x[3:5] and x[5:]
# NOTE(review): this rebinds x1, x2 and x3, which earlier cells defined as
# random arrays; re-running those earlier cells after this one will show
# different values. Consider distinct names if nothing later relies on them.
x = [1, 2, 3, 99, 99, 3, 2, 1]
x1, x2, x3 = np.split(x, [3, 5])
print(x1, x2, x3)

[1 2 3] [99 99] [3 2 1]


In [134]:
grid = np.arange(16).reshape((4, 4))
grid

array([[ 0,  1,  2,  3],
       [ 4,  5,  6,  7],
       [ 8,  9, 10, 11],
       [12, 13, 14, 15]])

In [135]:
upper, lower = np.vsplit(grid, [2])
print(upper)
print(lower)

[[0 1 2 3]
 [4 5 6 7]]
[[ 8  9 10 11]
 [12 13 14 15]]


In [136]:
left, right = np.hsplit(grid, [2])
print(left)
print(right)

[[ 0  1]
 [ 4  5]
 [ 8  9]
 [12 13]]
[[ 2  3]
 [ 6  7]
 [10 11]
 [14 15]]


**同样，np.dsplit将沿着数组的第三个维度分裂**