In [12]:
import torch
from torch.autograd import Variable
import matplotlib.pyplot as plt
 
# 假数据
n_data = torch.ones(100, 2)         # 数据的基本形态
x0 = torch.normal(2*n_data, 1)      # 类型0 x data (tensor), shape=(100, 2)
y0 = torch.zeros(100)               # 类型0 y data (tensor), shape=(100, 1)
x1 = torch.normal(-2*n_data, 1)     # 类型1 x data (tensor), shape=(100, 1)
y1 = torch.ones(100)                # 类型1 y data (tensor), shape=(100, 1)
 
# 注意 x, y 数据的数据形式是一定要像下面一样 (torch.cat 是在合并数据)
x = torch.cat((x0, x1), 0).type(torch.FloatTensor)  # FloatTensor = 32-bit floating
y = torch.cat((y0, y1), ).type(torch.LongTensor)    # LongTensor = 64-bit integer
 
# torch 只能在 Variable 上训练, 所以把它们变成 Variable
x, y = Variable(x), Variable(y)
 
# plt.scatter(x.data.numpy()[:, 0], x.data.numpy()[:, 1], c=y.data.numpy(), s=100, lw=0, cmap=\'RdYlGn\')
# plt.show()
 
print(x.data.size())
print(y.data.size())

torch.Size([200, 2])
torch.Size([200])


In [13]:
import torch
import torch.nn.functional as F     # 激励函数都在这
 
class Net(torch.nn.Module):     # 继承 torch 的 Module
    def __init__(self, n_feature, n_hidden, n_output):
        super(Net, self).__init__()     # 继承 __init__ 功能
        self.hidden = torch.nn.Linear(n_feature, n_hidden)   # 隐藏层线性输出
        self.out = torch.nn.Linear(n_hidden, n_output)       # 输出层线性输出
 
    def forward(self, x):
        # 正向传播输入值, 神经网络分析出输出值
        x = F.relu(self.hidden(x))      # 激励函数(隐藏层的线性值)
        x = self.out(x)                 # 输出值, 但是这个不是预测值, 预测值还需要再另外计算
        return x
 
net = Net(n_feature=2, n_hidden=10, n_output=2) # 几个类别就几个 output
 
print(net)  # net 的结构

Net(
  (hidden): Linear(in_features=2, out_features=10, bias=True)
  (out): Linear(in_features=10, out_features=2, bias=True)
)


In [14]:
# optimizer 是训练的工具
optimizer = torch.optim.SGD(net.parameters(), lr=0.02)  # 传入 net 的所有参数, 学习率
# 算误差的时候, 注意真实值!不是! one-hot 形式的, 而是1D Tensor, (batch,)
# 但是预测值是2D tensor (batch, n_classes)
loss_func = torch.nn.CrossEntropyLoss()
 
for t in range(200):
    out = net(x)     # 喂给 net 训练数据 x, 输出分析值
 
    loss = loss_func(out, y)     # 计算两者的误差
    print(loss)
 
    optimizer.zero_grad()   # 清空上一步的残余更新参数值
    loss.backward()         # 误差反向传播, 计算参数更新值
    optimizer.step()        # 将参数更新值施加到 net 的 parameters 上

tensor(0.6471, grad_fn=<NllLossBackward>)
tensor(0.6123, grad_fn=<NllLossBackward>)
tensor(0.5805, grad_fn=<NllLossBackward>)
tensor(0.5515, grad_fn=<NllLossBackward>)
tensor(0.5248, grad_fn=<NllLossBackward>)
tensor(0.5003, grad_fn=<NllLossBackward>)
tensor(0.4777, grad_fn=<NllLossBackward>)
tensor(0.4568, grad_fn=<NllLossBackward>)
tensor(0.4374, grad_fn=<NllLossBackward>)
tensor(0.4195, grad_fn=<NllLossBackward>)
tensor(0.4028, grad_fn=<NllLossBackward>)
tensor(0.3872, grad_fn=<NllLossBackward>)
tensor(0.3726, grad_fn=<NllLossBackward>)
tensor(0.3590, grad_fn=<NllLossBackward>)
tensor(0.3463, grad_fn=<NllLossBackward>)
tensor(0.3343, grad_fn=<NllLossBackward>)
tensor(0.3230, grad_fn=<NllLossBackward>)
tensor(0.3124, grad_fn=<NllLossBackward>)
tensor(0.3024, grad_fn=<NllLossBackward>)
tensor(0.2929, grad_fn=<NllLossBackward>)
tensor(0.2840, grad_fn=<NllLossBackward>)
tensor(0.2755, grad_fn=<NllLossBackward>)
tensor(0.2675, grad_fn=<NllLossBackward>)
tensor(0.2599, grad_fn=<NllLossBac