# 数据操作

In [5]:
import torch

x = torch.arange(12)
x.shape

torch.Size([12])

In [6]:
x.numel()
# number of elements

12

In [8]:
X = x.reshape(3,4)
X

tensor([[ 0,  1,  2,  3],
        [ 4,  5,  6,  7],
        [ 8,  9, 10, 11]])

### 常见的标准算术运算符（+、-、*、/、和**）都可以被升级为按元素运算

In [10]:
x = torch.tensor([1.0, 2, 4, 8])
y = torch.tensor([2,2,2,2])
x+y, x-y, x*y, x/y, x**y

(tensor([ 3.,  4.,  6., 10.]),
 tensor([-1.,  0.,  2.,  6.]),
 tensor([ 2.,  4.,  8., 16.]),
 tensor([0.5000, 1.0000, 2.0000, 4.0000]),
 tensor([ 1.,  4., 16., 64.]))

### 把多个张量连结在一起

In [11]:
x = torch.arange(12, dtype = torch.float32).reshape((3,4))
y = torch.tensor([[2.0,1,4,3],[1,2,3,4],[4,3,2,1]])
torch.cat((x,y), dim = 0),torch.cat((x,y),dim = 1)

(tensor([[ 0.,  1.,  2.,  3.],
         [ 4.,  5.,  6.,  7.],
         [ 8.,  9., 10., 11.],
         [ 2.,  1.,  4.,  3.],
         [ 1.,  2.,  3.,  4.],
         [ 4.,  3.,  2.,  1.]]),
 tensor([[ 0.,  1.,  2.,  3.,  2.,  1.,  4.,  3.],
         [ 4.,  5.,  6.,  7.,  1.,  2.,  3.,  4.],
         [ 8.,  9., 10., 11.,  4.,  3.,  2.,  1.]]))

### 即使形状不同，我们仍然可以通过调用 *广播机制* （broadcasting mechanism）来执行按元素操作

In [13]:
a = torch.arange(3).reshape((3,1))
b = torch.arange(2).reshape((1,2))
a, b

(tensor([[0],
         [1],
         [2]]),
 tensor([[0, 1]]))

In [15]:
a+b

tensor([[0, 1],
        [1, 2],
        [2, 3]])

### 可以用[-1]选择最后一个元素，可以用[1:3]选择第二个和第三个元素

In [19]:
X[-1], X[1:3]

(tensor([ 8,  9, 10, 11]),
 tensor([[ 4,  5,  9,  7],
         [ 8,  9, 10, 11]]))

### 除读取外，我们还可以通过指定索引来将元素写入矩阵

In [20]:
X[1, 2] = 9
X

tensor([[ 0,  1,  2,  3],
        [ 4,  5,  9,  7],
        [ 8,  9, 10, 11]])

### 为多个元素赋值相同的值， 我们只需要索引所有元素，然后为他们赋值

In [21]:
X[0:2,:] = 2
X

tensor([[ 2,  2,  2,  2],
        [ 2,  2,  2,  2],
        [ 8,  9, 10, 11]])

### 转换为Numpy张量

In [22]:
A = X.numpy()
B = torch.tensor(A)
type(A), type(B)

(numpy.ndarray, torch.Tensor)

In [23]:
a = torch.tensor([3.5])
a, a.item(),float(a),int(a)

(tensor([3.5000]), 3.5, 3.5, 3)

# 数据预处理

In [25]:
import os
os.makedirs(os.path.join("..","data"),exist_os = True)
data_file = os.path.join("..","data","house_tiny.csv")
with open(data_file,'w') as f:
    f.write("")

TypeError: makedirs() got an unexpected keyword argument 'exist_os'

In [None]:
# pip install pandas
import pandas as pd

data = pd.read_csv(data_file)
inputs, outputs = data.iloc[:, 0:2], data.iloc[:,2]
inputs = inputs.fillna(inputs.mean())