Linear Regression: Concise Implementation

In [1]:
import numpy as np
import torch
from torch.utils import data
from d2l import torch as d2l

# Ground-truth parameters that the model is later compared against.
true_w = torch.tensor([2, -3.4])
true_b = 4.2

# Generate a synthetic dataset from the ground-truth parameters.
# NOTE(review): d2l.synthetic_data presumably returns y = Xw + b plus noise —
# confirm against the d2l source.
num_examples = 1000
features, labels = d2l.synthetic_data(true_w, true_b, num_examples)

In [2]:
def load_array(data_arrays, batch_size, is_train=True):
    """Wrap aligned tensors in a mini-batch ``DataLoader``.

    Args:
        data_arrays: Sequence of tensors (e.g. ``(features, labels)``) that
            is unpacked into ``data.TensorDataset``.
        batch_size: Number of examples per mini-batch.
        is_train: Passed to the loader as ``shuffle``; when true the examples
            are reshuffled on each pass, when false they keep their stored
            order.

    Returns:
        A ``data.DataLoader`` over the wrapped dataset.
    """
    tensor_dataset = data.TensorDataset(*data_arrays)
    loader = data.DataLoader(
        tensor_dataset,
        batch_size=batch_size,
        shuffle=is_train,
    )
    return loader

# Serve the dataset in mini-batches of 10 examples (shuffled, since
# is_train is left at its default of True).
batch_size = 10
data_iter = load_array(data_arrays=(features, labels), batch_size=batch_size)

# Peek at the first mini-batch drawn from a fresh iterator over data_iter.
next(iter(data_iter))

[tensor([[-0.0750,  1.7610],
         [ 0.3987,  1.0873],
         [ 0.7198, -0.8363],
         [-0.9120, -1.0509],
         [ 0.5244,  0.6419],
         [ 0.4225,  1.2222],
         [ 0.9591,  1.3644],
         [ 0.1329,  0.9615],
         [ 0.6141,  1.6781],
         [-0.3028,  1.5671]]),
 tensor([[-1.9333],
         [ 1.3062],
         [ 8.4846],
         [ 5.9551],
         [ 3.0693],
         [ 0.8845],
         [ 1.4841],
         [ 1.2021],
         [-0.2798],
         [-1.7189]])]

In [3]:
"""Define model layers"""
from torch import nn

# A single fully connected layer (2 input features -> 1 output) wrapped in a
# Sequential container, so the layer is reachable as net[0].
net = nn.Sequential(nn.Linear(in_features=2, out_features=1))

In [4]:
"""Initialize model parameters"""
first_layer = net[0]
# Overwrite the weights in place with draws from N(mean=0, std=0.01).
first_layer.weight.data.normal_(mean=0, std=0.01)
# Zero the bias in place; as the cell's last expression, its value is displayed.
first_layer.bias.data.fill_(0)

tensor([0.])

In [5]:
"""MSE Loss = L2 loss"""
# Squared error averaged over all elements ('mean' is the default reduction,
# spelled out here for clarity).
loss = nn.MSELoss(reduction='mean')

In [6]:
"""Initialize SGD instance"""
# Optimize every parameter of net with plain SGD at a learning rate of 0.03.
trainer = torch.optim.SGD(params=net.parameters(), lr=0.03)

In [7]:
# Train with mini-batch SGD for a fixed number of passes over the dataset.
num_epochs = 3
for epoch in range(num_epochs):
    for X, y in data_iter:
        # 1. Clear gradients from the previous step; backward() accumulates
        #    into .grad rather than overwriting it.
        trainer.zero_grad()
        # 2. Forward pass: loss between predictions and ground truth.
        l = loss(net(X), y)
        # 3. Backward pass: compute gradients of the loss w.r.t. the parameters.
        l.backward()
        # 4. Update the parameters using those gradients.
        trainer.step()
    # Report the loss over the full dataset after each epoch. This is
    # evaluation only, so autograd is disabled to avoid building and holding
    # a computation graph that is never back-propagated through.
    with torch.no_grad():
        l = loss(net(features), labels)
    print(f'epoch {epoch + 1}, loss {l:f}')

epoch 1, loss 0.000206
epoch 2, loss 0.000096
epoch 3, loss 0.000097


In [8]:
# Compare the learned parameters with the ground truth.
w = net[0].weight.data
b = net[0].bias.data

# Reshape the learned weight to true_w's shape so the difference is element-wise.
w_error = true_w - w.reshape(true_w.shape)
b_error = true_b - b

print('expected error of w: ', w_error)
print('expected error of b: ', b_error)

expected error of w:  tensor([ 0.0009, -0.0006])
expected error of b:  tensor([0.0005])
