### 3. Loss and optimizer -> torch

In [None]:
# model
# loss, optim
# training
# plot

import torch
import torch.nn as nn

# model:           f = w * x

# target function: f = 2 * x

# Training data: inputs 1..4 and the matching targets 2, 4, 6, 8
X = torch.arange(1, 5, dtype=torch.float32)
Y = torch.arange(2, 10, 2, dtype=torch.float32)

# Scalar (0-dim) weight, initialised to zero and tracked by autograd
w = torch.zeros((), dtype=torch.float32, requires_grad=True)

# model prediction
def forward(x):
    """Return the model output ``w * x``, using the module-level weight ``w``."""
    prediction = w * x
    return prediction
    
# loss
# def loss(y, y_predicted):
#     return ((y_predicted-y)**2).mean()

# gradient
# MSE:   J = 1/N * sum((w*x - y)**2)
# dJ/dw  = 1/N * sum(2*x * (w*x - y))
def gradient(x, y, y_predicted):
    """Return the analytic gradient dJ/dw of the MSE loss for the model f = w * x.

    Args:
        x: Input samples.
        y: Target values, broadcastable against ``x``.
        y_predicted: Model outputs for ``x``, broadcastable against ``x``.

    Returns:
        The mean over all elements of ``2 * x * (y_predicted - y)``.
    """
    # Element-wise product followed by a mean. A dot product would already sum
    # over the samples, making the result N times larger than the gradient.
    return (2 * x * (y_predicted - y)).mean()
    
print(f'predcition before training: f(5) = {forward(5):.3f}')

# Training
learning_rate = 0.01
n_iters = 100

# Mean-squared-error criterion and plain SGD over the single parameter w
loss = nn.MSELoss()
optimizer = torch.optim.SGD([w], lr=learning_rate)

for epoch in range(n_iters):
    # prediction = forward pass
    y_pred = forward(X)

    # loss: nn.MSELoss is called as (input, target), i.e. prediction first
    l = loss(y_pred, Y)

    # gradients: the backward pass stores dl/dw in w.grad
    l.backward()

    # update weights from w.grad
    optimizer.step()

    # zero gradients so the next backward pass does not accumulate onto them
    optimizer.zero_grad()

    if epoch % 10 == 0:
        print(f'epoch {epoch+1}: w = {w:.3f}, loss = {l:.8f}')

print(f'predcition after training: f(5) = {forward(5):.3f}')

# Observation: as w increases from 0 toward 2, the loss decreases

### 4. Everything PyTorch

In [1]:
# model
# loss, optim
# training
# plot

import torch
import torch.nn as nn

# model:           f = w * x

# target function: f = 2 * x

# Training data as column vectors: one row per sample, one column per feature
X = torch.tensor([1, 2, 3, 4], dtype=torch.float32).reshape(-1, 1)
Y = torch.tensor([2, 4, 6, 8], dtype=torch.float32).reshape(-1, 1)

# Dataset dimensions (rows = samples, columns = features)
n_samples, n_features = X.size()
print(f'#samples: {n_samples}, #features: {n_features}')

# 0) create a test sample
X_test = torch.tensor([5.0], dtype=torch.float32)


# 1) Design Model, the model has to implement the forward pass!
input_size = n_features
# The output width comes from the targets, not from the inputs; the two only
# coincide here because X and Y both have a single column.
output_size = Y.shape[1]

# model prediction: a single linear layer replaces the hand-written forward();
# we can call this model with samples X
model = nn.Linear(input_size, output_size)

# class LinearRegression(nn.Module):
    
#     def __init__(self, input_dim, output_dim):
#         super(LinearRegression, self).__init__()
#         self.lin = nn.Linear(input_dim, output_dim)
    
#     def forward(self, x):
#         return self.lin(x)

# model = LinearRegression(input_size, output_size)


# loss
# def loss(y, y_predicted):
#     return ((y_predicted-y)**2).mean()

# gradient
# MSE = 1/N * (w*x - y)**2
# dJ/dw = 1/N 2x (w*x -y)
# def gradient(x, y, y_predicted):
#         return np.dot(2*x, y_predicted-y).mean()

print(f'Prediction before training: f(5) = {model(X_test).item():.3f}')

# Training
learning_rate = 0.01
n_iters = 100

# Mean-squared-error criterion and plain SGD over all parameters of the model
loss = nn.MSELoss()
optimizer = torch.optim.SGD(model.parameters(), lr=learning_rate)

for epoch in range(n_iters):
    # prediction = forward pass
    y_pred = model(X)

    # loss: nn.MSELoss is called as (input, target), i.e. prediction first
    l = loss(y_pred, Y)

    # gradients: the backward pass fills .grad on the model parameters
    l.backward()

    # update weights from the stored gradients
    optimizer.step()

    # zero gradients so the next backward pass does not accumulate onto them
    optimizer.zero_grad()

    if epoch % 10 == 0:
        # unpack the layer's two parameters: weight matrix and bias
        [w, b] = model.parameters()
        print(f'epoch {epoch+1}: w = {w[0][0].item():.3f}, loss = {l.item():.8f}')

print(f'Prediction after training: f(5) = {model(X_test).item():.3f}')

# Observation: as w moves toward 2, the loss decreases

#samples: 4, #features: 1
Prediction before training: f(5) = -5.226
epoch 1: w = -0.379, loss = 75.62565613
epoch 11: w = 1.613, loss = 1.95665741
epoch 21: w = 1.933, loss = 0.05066319
epoch 31: w = 1.985, loss = 0.00134826
epoch 41: w = 1.993, loss = 0.00007017
epoch 51: w = 1.995, loss = 0.00003506
epoch 61: w = 1.995, loss = 0.00003221
epoch 71: w = 1.995, loss = 0.00003032
epoch 81: w = 1.996, loss = 0.00002855
epoch 91: w = 1.996, loss = 0.00002689
Prediction after training: f(5) = 9.991
