#### We will work through 4 steps
1. Prediction - PyTorch Model
2. Gradients Computation - Autograd
3. Loss Computation - PyTorch Loss
4. Parameter Updates - PyTorch Optimizer

<ol>
    <li>Design the model (input size, output size, forward pass)</li>
    <li>Construct the loss and optimizer</li>
    <li>Training loop - iterate n times
        <ol>
            <li>Forward pass: compute the prediction</li>
            <li>Backward pass: compute the gradients</li>
            <li>Update the weights</li>
        </ol>
    </li>
</ol>

In [1]:
import torch
import torch.nn as nn

In [2]:
# Toy dataset following y = w * x with w = 2 (the data contain no bias term).
# After training, the learned weight w should therefore approach 2.
# Each tensor is a column: one row per sample, one value per row.
X = torch.tensor([1, 2, 3, 4], dtype=torch.float32).unsqueeze(1)
Y = torch.tensor([2, 4, 6, 8], dtype=torch.float32).unsqueeze(1)

In [3]:
# Single probe input used to compare predictions before and after training.
X_test = torch.tensor([5.0], dtype=torch.float32)

In [4]:
# X is two-dimensional: rows are samples, columns are features.
n_samples, n_features = X.size()

In [5]:
# Display the dataset dimensions as (samples, features).
(n_samples, n_features)

(4, 1)

#### Model Prediction

In [6]:
# Layer dimensions are derived from the data instead of being tied together:
# the input width is the number of feature columns in X, while the output
# width is the number of target columns in Y.
input_size = n_features
output_size = Y.shape[1]

# The built-in layer could be used directly instead of a custom module:
# model = nn.Linear(input_size, output_size)

In [7]:
# Dummy example: a custom module that wraps a single linear layer
class LinearRegression(nn.Module):
    """Linear regression model backed by one ``nn.Linear`` layer."""

    def __init__(self, input_dim, output_dim):
        """Build the model.

        Args:
            input_dim: Number of features in each input sample.
            output_dim: Number of values predicted for each sample.
        """
        super().__init__()

        # The model's only layer; it owns the weight and bias parameters.
        self.lin = nn.Linear(input_dim, output_dim)

    def forward(self, x):
        """Return the linear layer's output for input tensor ``x``."""
        prediction = self.lin(x)
        return prediction
    
# Instantiate the custom model with the dimensions chosen above.
model = LinearRegression(input_dim=input_size, output_dim=output_size)

In [8]:
# Baseline prediction from the untrained model. This is inference only, so
# gradient tracking is switched off for the forward pass.
with torch.no_grad():
    print(f'Prediction before training: f(5) = {model(X_test).item():.3f}')

Prediction before training: f(5) = -1.103


#### Training

In [9]:
# Hyperparameters
learning_rate = 0.01  # step size passed to the optimizer
n_iters = 100         # number of training iterations

# Mean-squared-error criterion, and SGD over every parameter of the model
loss = nn.MSELoss()
optimizer = torch.optim.SGD(params=model.parameters(), lr=learning_rate)

In [10]:
for epoch in range(n_iters):

    # Forward pass: predictions for the whole training set
    y_pred = model(X)

    # Loss: the criterion is called as (input, target), i.e. predictions first
    l = loss(y_pred, Y)

    # Backward pass: compute d(loss)/d(param) for every model parameter
    l.backward()

    # Parameter update: one optimizer step using the gradients just computed
    optimizer.step()

    # Reset gradients; backward() accumulates into .grad, so stale values
    # would otherwise carry over into the next iteration
    optimizer.zero_grad()

    # Progress report every 10th iteration. The loss shown was computed
    # before this iteration's update, while w is read after it.
    if epoch % 10 == 0:
        w, b = model.parameters()
        print(f'epoch {epoch+1}: w = {w[0][0].item():.3f}, loss = {l.item():.8f}')

epoch 1: w = -0.091, loss = 33.13217163
epoch 11: w = 1.235, loss = 1.23066711
epoch 21: w = 1.461, loss = 0.38356215
epoch 31: w = 1.509, loss = 0.34117323
epoch 41: w = 1.529, loss = 0.32079607
epoch 51: w = 1.544, loss = 0.30211076
epoch 61: w = 1.557, loss = 0.28452599
epoch 71: w = 1.570, loss = 0.26796505
epoch 81: w = 1.583, loss = 0.25236800
epoch 91: w = 1.595, loss = 0.23767877


In [11]:
# Prediction from the trained model. This is inference only, so gradient
# tracking is switched off for the forward pass.
with torch.no_grad():
    print(f'Prediction after training: f(5) = {model(X_test).item():.3f}')

Prediction after training: f(5) = 9.189
