In [1]:
# Training pipeline
# 1) Design model (input, output, forward pass)
# 2) Construct loss and optimizer 
# 3) Training loop
#   - forward pass: compute prediction
#   - backward pass: compute gradients
#   - update weights, then zero the gradients

In [2]:
import torch
import torch.nn as nn
# Goal: learn the single weight w of the linear map f(x) = w * x.
# The data below follows f(x) = 2 * x, so training should drive w towards 2.
X = torch.tensor([[1], [2], [3], [4]], dtype=torch.float32)
y = torch.tensor([[2], [4], [6], [8]], dtype=torch.float32)

# Rows of X are samples, columns are features.
n_samples, n_features = X.shape
print(n_samples, n_features)
input_size = n_features
# The output width is a property of the targets, not of the inputs.
output_size = y.shape[1]
# bias=False leaves the weight as the only parameter, matching f(x) = w * x.
model = nn.Linear(input_size, output_size, bias=False)

X_test = torch.tensor([5], dtype=torch.float32)
# nn.Linear starts from a randomly initialised weight and no seed is set,
# so this "before" value differs from run to run.
# Pure evaluation does not need an autograd graph, hence no_grad().
with torch.no_grad():
    print(f'Prediction before training: f(5) = {model(X_test).item():.3f}')

# Training
lr = 0.01
n_iters = 100
loss = nn.MSELoss()
optimizer = torch.optim.SGD(model.parameters(), lr=lr)
for epoch in range(n_iters):
    # Forward pass: compute predictions for the whole batch.
    y_pred = model(X)
    # nn.MSELoss is called as (input, target): prediction first, label second.
    l = loss(y_pred, y)
    # Backward pass: accumulate dl/dw into the parameter's .grad.
    l.backward()
    # Update weights
    optimizer.step()
    # Reset gradients so the next backward() does not add to stale values.
    optimizer.zero_grad()
    if epoch % 10 == 0:
        # With bias=False the weight matrix is the model's only parameter.
        w = model.weight
        # w is read after step(), while l was computed before it, so the
        # printed loss belongs to the weight of the previous iteration.
        print(f'epoch {epoch + 1}: w = {w[0][0].item():.3f}, loss={l.item():.8f}')

with torch.no_grad():
    print(f'Predicted after training: f(5) = {model(X_test).item():.3f}')

4 1
Prediction before training: f(5) = -4.948
epoch 1: w = -0.541, loss=67.03077698
epoch 11: w = 1.500, loss=2.59808135
epoch 21: w = 1.902, loss=0.10070032
epoch 31: w = 1.981, loss=0.00390310
epoch 41: w = 1.996, loss=0.00015128
epoch 51: w = 1.999, loss=0.00000586
epoch 61: w = 2.000, loss=0.00000023
epoch 71: w = 2.000, loss=0.00000001
epoch 81: w = 2.000, loss=0.00000000
epoch 91: w = 2.000, loss=0.00000000
Predicted after training: f(5) = 10.000
