In [19]:
import numpy as np
import torch
from torch.utils import data
from d2l import torch as d2l

In [20]:
# Reference weight vector and bias; both are handed to the data generator
# below and compared against the learned parameters at the end of the notebook.
true_w = torch.tensor([2, -3.4])
true_b = 4.2
# NOTE(review): d2l.synthetic_data is defined outside this notebook. Presumably
# it returns 1000 examples with labels = features @ true_w + true_b + noise --
# confirm against the d2l source.
features, labels = d2l.synthetic_data(true_w, true_b, 1000)

我们将features和labels作为API的参数传递（即data_arrays），
并通过数据迭代器指定batch_size。
此外，布尔值is_train表示是否希望数据迭代器对象在每个迭代周期内打乱数据。

In [21]:
def load_array(data_arrays, batch_size, is_train=True):  #@save
    """Build a PyTorch data iterator over a group of tensors.

    Args:
        data_arrays: Iterable of tensors; it is unpacked into
            ``data.TensorDataset`` so each dataset item holds one entry
            from every tensor.
        batch_size: Number of examples per mini-batch.
        is_train: Forwarded as ``shuffle`` to the ``DataLoader``; when True
            the data is reshuffled on every pass.

    Returns:
        A ``data.DataLoader`` yielding mini-batches of the wrapped tensors.
    """
    return data.DataLoader(
        data.TensorDataset(*data_arrays),
        batch_size=batch_size,
        shuffle=is_train,
    )

In [22]:
# Mini-batch size used when iterating over the synthetic dataset.
batch_size = 10
# is_train is left at its default (True), so batches are shuffled.
data_iter = load_array(data_arrays=(features, labels), batch_size=batch_size)

In [23]:
# Build a fresh iterator over data_iter and display its first mini-batch.
next(iter(data_iter))

[tensor([[-0.6738,  0.0325],
         [ 0.4292,  0.8551],
         [ 0.0618,  0.0283],
         [ 1.6027, -1.1969],
         [ 0.3030,  0.2727],
         [ 0.1923, -1.1584],
         [ 0.6275,  0.7320],
         [-0.6998, -0.5226],
         [ 0.0558, -1.4260],
         [ 0.0160,  1.1050]]),
 tensor([[ 2.7392],
         [ 2.1400],
         [ 4.2152],
         [11.4881],
         [ 3.8805],
         [ 8.5037],
         [ 2.9686],
         [ 4.5913],
         [ 9.1532],
         [ 0.4598]])]

In [24]:
# `nn` is short for "neural networks".
from torch import nn

# Linear regression expressed as a one-layer network: 2 inputs -> 1 output.
net = nn.Sequential(nn.Linear(2, 1))

# Initialise the model parameters in place: the weight w is sampled from a
# normal distribution (mean 0, std 0.01) and the bias b is set to zero.
net[0].weight.data.normal_(mean=0, std=0.01)
net[0].bias.data.fill_(0)

tensor([0.])

计算均方误差使用的是MSELoss类，也称为平方L2范数。
默认情况下，它返回所有样本损失的平均值。

In [25]:
# Mean squared error; 'mean' (the default reduction) averages the squared
# error over all elements.
loss = nn.MSELoss(reduction='mean')

In [26]:
# Stochastic gradient descent over every parameter of `net`, learning rate 0.03.
trainer = torch.optim.SGD(net.parameters(), lr=0.03)

In [27]:
# Train the model: for each epoch, take one optimiser step per mini-batch and
# then report the loss over the full dataset.
num_epochs = 3
for epoch in range(num_epochs):
    for X, y in data_iter:
        l = loss(net(X), y)      # forward pass on the current mini-batch
        trainer.zero_grad()      # drop gradients accumulated by the previous step
        l.backward()
        trainer.step()
    # The full-dataset loss is only reported, never back-propagated, so skip
    # autograd bookkeeping for this forward pass.
    with torch.no_grad():
        l = loss(net(features), labels)
    # NOTE(review): 'epoh' is a typo for 'epoch'; left unchanged so the
    # recorded cell output below still matches what this cell prints.
    print(f'epoh {epoch + 1},loss {l:f}')

epoh 1,loss 0.000166
epoh 2,loss 0.000097
epoh 3,loss 0.000097


In [28]:
# Read the learned parameters out of the single linear layer.
w = net[0].weight.data
b = net[0].bias.data

# Report how far each learned parameter is from the reference value; the
# weight is reshaped to true_w's shape so the subtraction is element-wise.
print('w的估计误差：', true_w - w.reshape(true_w.shape))
print('b的估计误差：', true_b - b)

w的估计误差： tensor([-6.2132e-04, -6.3419e-05])
b的估计误差： tensor([0.0001])
