In [28]:
# 1) Design model (input, output size, forward pass)
# 2) Construct loss and optimizer
# 3) Training loop
#   - forward pass: compute prediction and loss
#   - backward pass: gradients
#   - update weights

import torch
import torch.nn as nn # nn -> neural networks

# Fit a linear model f(x) = w * x + b to samples of the target function
# f = 2 * x, using PyTorch's built-in layer, loss and optimizer.

# Training data: one row per sample, one column per feature / target value.
X = torch.tensor([[1], [2], [3], [4]], dtype=torch.float32)
Y = torch.tensor([[2], [4], [6], [8]], dtype=torch.float32)

# Single input used to probe the model before and after training.
X_test = torch.tensor([5], dtype=torch.float32)

num_samples, num_features = X.shape  # 4 samples, 1 feature
input_size = num_features
# The output width comes from the targets, not from the input feature count
# (both happen to be 1 here).
output_size = Y.shape[1]

model = nn.Linear(in_features=input_size, out_features=output_size)

# get predictions before training with x = 5
# no_grad: this is pure inference, so skip building an autograd graph.
with torch.no_grad():
    print("prediction before training: ", model(X_test).item())

# training
learning_rate = 0.01
n_iters = 100

loss = nn.MSELoss()  # mean squared error loss
optimizer = torch.optim.SGD(model.parameters(), lr=learning_rate)  # stochastic gradient descent

for epoch in range(n_iters):
    # prediction = forward pass
    y_pred = model(X)

    # loss: nn.MSELoss expects (input, target), i.e. prediction first.
    l = loss(y_pred, Y)

    # gradients = backward pass
    l.backward()  # dl/dw

    # update weights
    optimizer.step()

    # zero gradients so they do not accumulate into the next iteration
    optimizer.zero_grad()

    if epoch % 10 == 0:
        # w is read after the update above; l is the loss measured before it.
        w, b = model.parameters()
        print(f'epoch {epoch + 1}: w = {w[0][0].item():.3f}, loss = {l.item():.8f}')

with torch.no_grad():
    print("prediction after training: ", model(X_test).item())


prediction before training:  -2.686307430267334
epoch 1: w = 0.031, loss = 52.83644104
epoch 11: w = 1.695, loss = 1.36730385
epoch 21: w = 1.963, loss = 0.03565737
epoch 31: w = 2.005, loss = 0.00118809
epoch 41: w = 2.012, loss = 0.00028086
epoch 51: w = 2.013, loss = 0.00024283
epoch 61: w = 2.012, loss = 0.00022813
epoch 71: w = 2.012, loss = 0.00021484
epoch 81: w = 2.012, loss = 0.00020233
epoch 91: w = 2.011, loss = 0.00019056
prediction after training:  10.022966384887695
