In [1]:
import torch
import torch.nn as nn
import torch.nn.functional as F
import torch.optim as optim

Linear Regression using Numpy

In [None]:
import numpy as np 

# Compute every step manually

# Linear regression
# f = w * x 

# here : f = 2 * x
X = np.array([1, 2, 3, 4], dtype=np.float32)
Y = np.array([2, 4, 6, 8], dtype=np.float32)

w = 0.0

# model output
def forward(x):
    return w * x

# loss = MSE
def loss(y, y_pred):
    return ((y_pred - y)**2).mean()

# J = MSE = 1/N * (w*x - y)**2
# dJ/dw = 1/N * 2x(w*x - y)
def gradient(x, y, y_pred):
    return np.mean(2*x*(y_pred - y))

print(f'Prediction before training: f(5) = {forward(5):.3f}')

# Training
learning_rate = 0.01
n_iters = 20

for epoch in range(n_iters):
    # predict = forward pass
    y_pred = forward(X)

    # loss
    l = loss(Y, y_pred)
    
    # calculate gradients
    dw = gradient(X, Y, y_pred)

    # update weights
    w -= learning_rate * dw

    if epoch % 2 == 0:
        print(f'epoch {epoch+1}: w = {w:.3f}, loss = {l:.8f}')
     
print(f'Prediction after training: f(5) = {forward(5):.3f}')

Linear Regression using torch

In [2]:

# 1) Design model (input, output, forward pass with different layers)
# 2) Construct loss and optimizer
# 3) Training loop
#       - Forward = compute prediction and loss
#       - Backward = compute gradients
#       - Update weights

import torch
import torch.nn as nn

# Linear regression
# f = w * x 

# here : f = 2 * x

# 0) Training samples, watch the shape!
X = torch.tensor([[1], [2], [3], [4]], dtype=torch.float32)
Y = torch.tensor([[2], [4], [6], [8]], dtype=torch.float32)

n_samples, n_features = X.shape
print(f'#samples: {n_samples}, #features: {n_features}')
# 0) create a test sample
X_test = torch.tensor([5], dtype=torch.float32)

# 1) Design Model, the model has to implement the forward pass!
# Here we can use a built-in model from PyTorch
input_size = n_features
output_size = n_features

# we can call this model with samples X
model = nn.Linear(input_size, output_size)

'''
class LinearRegression(nn.Module):
    def __init__(self, input_dim, output_dim):
        super(LinearRegression, self).__init__()
        # define diferent layers
        self.lin = nn.Linear(input_dim, output_dim)
    def forward(self, x):
        return self.lin(x)
model = LinearRegression(input_size, output_size)
'''

print(f'Prediction before training: f(5) = {model(X_test).item():.3f}')

# 2) Define loss and optimizer
learning_rate = 0.01
n_iters = 100

loss = nn.MSELoss()
optimizer = torch.optim.SGD(model.parameters(), lr=learning_rate)

# 3) Training loop
for epoch in range(n_iters):
    # predict = forward pass with our model
    y_predicted = model(X)

    # loss
    l = loss(Y, y_predicted)

    # calculate gradients = backward pass
    l.backward()

    # update weights
    optimizer.step()

    # zero the gradients after updating
    optimizer.zero_grad()

    if epoch % 10 == 0:
        [w, b] = model.parameters() # unpack parameters
        print('epoch ', epoch+1, ': w = ', w[0][0].item(), ' loss = ', l)



#samples: 4, #features: 1
Prediction before training: f(5) = 0.475
epoch  1 : w =  0.35713064670562744  loss =  tensor(26.8138, grad_fn=<MseLossBackward0>)
epoch  11 : w =  1.5481270551681519  loss =  tensor(0.7652, grad_fn=<MseLossBackward0>)
epoch  21 : w =  1.7452396154403687  loss =  tensor(0.0871, grad_fn=<MseLossBackward0>)
epoch  31 : w =  1.7823233604431152  loss =  tensor(0.0656, grad_fn=<MseLossBackward0>)
epoch  41 : w =  1.793507695198059  loss =  tensor(0.0614, grad_fn=<MseLossBackward0>)
epoch  51 : w =  1.8003720045089722  loss =  tensor(0.0578, grad_fn=<MseLossBackward0>)
epoch  61 : w =  1.8063918352127075  loss =  tensor(0.0544, grad_fn=<MseLossBackward0>)
epoch  71 : w =  1.8121305704116821  loss =  tensor(0.0513, grad_fn=<MseLossBackward0>)
epoch  81 : w =  1.8176833391189575  loss =  tensor(0.0483, grad_fn=<MseLossBackward0>)
epoch  91 : w =  1.8230690956115723  loss =  tensor(0.0455, grad_fn=<MseLossBackward0>)


In [4]:
torch.__version__

'1.13.1+cu116'