In [1]:
# 1) Design the model (input size, output size, forward pass)
# 2) Construct the loss and the optimizer
# 3) Training loop:
#    - forward pass: compute the prediction
#    - backward pass: compute the gradients
#    - update the weights, then repeat for a number of iterations

![image.png](attachment:image.png)

In [2]:
import torch
import torch.nn as nn

In [3]:
# Training inputs and their targets; every target is exactly 2 * input,
# so the weight the model should learn is 2.
X = torch.tensor(
    [1.0, 2.0, 3.0, 4.0],
    dtype=torch.float32,
)
Y = torch.tensor(
    [2.0, 4.0, 6.0, 8.0],
    dtype=torch.float32,
)

# The single trainable weight (a 0-dim tensor), started at 0.
# requires_grad=True makes autograd track operations on it.
w = torch.tensor(
    0.0,
    dtype=torch.float32,
    requires_grad=True,
)

In [4]:
def forward(x):
    """Linear model without a bias term.

    Multiplies the input ``x`` by the notebook-level weight ``w`` and
    returns the product.
    """
    prediction = w * x
    return prediction

In [5]:
# Sanity check before any training: show what the model predicts for x = 5
# with the initial weight.
print(
    f'Prediction before training: f(5) = {forward(5):.3f}'
)

Prediction before training: f(5) = 0.000


In [6]:
# Training
learning_rate = 0.01
n_iters = 100
loss = nn.MSELoss()
optimizer = torch.optim.SGD([w], lr=learning_rate)

In [7]:
for epoch in range(n_iters):
    # Forward pass: compute predictions for the whole training set.
    y_pred = forward(X)

    # Loss: nn.MSELoss is called as loss(input, target), so the prediction
    # goes first and the ground truth second. MSE is symmetric, so the value
    # is the same either way, but the conventional order keeps this loop
    # correct if the criterion is ever swapped for an asymmetric one.
    l = loss(y_pred, Y)

    # Backward pass: autograd computes dl/dw and accumulates it into w.grad.
    l.backward()

    # Update step: the optimizer adjusts w from w.grad, so no manual
    # weight update is needed.
    optimizer.step()

    # backward() accumulates into w.grad rather than overwriting it, so the
    # gradient has to be cleared before the next iteration.
    optimizer.zero_grad()

    # Report every 10th epoch. Note that w has already been updated here,
    # while l is the loss that was computed before the update.
    if epoch % 10 == 0:
        print(f'epoch {epoch+1}:w = {w:.3f}, loss = {l:.8f}')

# Final check: the targets are 2 * x, so f(5) should now be close to 10.
print(f'Prediction after training: f(5) = {forward(5):.3f}')

epoch 1:w = 0.300, loss = 30.00000000
epoch 11:w = 1.665, loss = 1.16278565
epoch 21:w = 1.934, loss = 0.04506890
epoch 31:w = 1.987, loss = 0.00174685
epoch 41:w = 1.997, loss = 0.00006770
epoch 51:w = 1.999, loss = 0.00000262
epoch 61:w = 2.000, loss = 0.00000010
epoch 71:w = 2.000, loss = 0.00000000
epoch 81:w = 2.000, loss = 0.00000000
epoch 91:w = 2.000, loss = 0.00000000
Prediction after training: f(5) = 10.000
