In [1]:
import torch

# Typical PyTorch training pipeline:
# 1) design the model (input size, output size, forward pass)
# 2) construct the loss and the optimizer
# 3) run the training loop
##  - forward pass: compute the prediction
##  - backward pass: compute the gradients
##  - update the weights

In [3]:
import torch.nn as nn
# Toy regression task: fit f(x) = w * x to data generated by f(x) = 2 * x.
X = torch.tensor([1.0, 2.0, 3.0, 4.0], dtype=torch.float32)
# Targets are exactly twice the inputs: 2, 4, 6, 8.
Y = 2 * X
# Scalar weight starting at zero; requires_grad=True lets autograd track it.
w = torch.tensor(0.0, requires_grad=True, dtype=torch.float32)

# model prediction
def forward(x):
    """Return the linear model's prediction ``w * x``.

    ``w`` is read from module scope (the trainable weight); ``x`` may be a
    tensor or a plain number.
    """
    prediction = w * x
    return prediction

# Prediction with the untrained weight. This is inference only, so skip
# building an autograd graph.
with torch.no_grad():
    print(f'prediction before training:  f(5) = {forward(5).item():.3f}')

# training
learning_rate = 0.01
n_iters = 100

loss = nn.MSELoss()
# SGD updates exactly the tensors it is given; here that is the single weight w.
optimizer = torch.optim.SGD([w], lr=learning_rate)

for epoch in range(n_iters):
    # forward pass: compute the prediction
    y_pred = forward(X)

    # nn.MSELoss takes (input, target): prediction first, ground truth second.
    l = loss(y_pred, Y)

    # backward pass: compute dl/dw into w.grad
    l.backward()
    # update weights
    optimizer.step()
    # zero gradient: clear w.grad so the next backward() does not accumulate
    # on top of this iteration's gradient
    optimizer.zero_grad()

    if epoch % 10 == 0:
        # w is reported after this iteration's update; l was computed before it.
        print(f'epoch {epoch+1}: w = {w.item():.3f}, loss = {l.item():.8f}')

with torch.no_grad():
    print(f'Prediction after training: f(5) = {forward(5).item():.3f}')

prediction before training:  f(5) = 0.000
epoch 1: w = 0.300, loss = 30.00000000
epoch 11: w = 1.665, loss = 1.16278565
epoch 21: w = 1.934, loss = 0.04506890
epoch 31: w = 1.987, loss = 0.00174685
epoch 41: w = 1.997, loss = 0.00006770
epoch 51: w = 1.999, loss = 0.00000262
epoch 61: w = 2.000, loss = 0.00000010
epoch 71: w = 2.000, loss = 0.00000000
epoch 81: w = 2.000, loss = 0.00000000
epoch 91: w = 2.000, loss = 0.00000000
Prediction after training: f(5) = 10.000


In [33]:
import torch.nn as nn
# Fit f(x) = w * x to data generated by f(x) = 2 * x.
# Data is 2-D here: one row per sample, one column per feature/target.
X = torch.tensor([[1],[2],[3],[4]], dtype=torch.float32)
Y = torch.tensor([[2],[4],[6],[8]], dtype=torch.float32)

# Single input used to probe the model before and after training.
X_test = torch.tensor([5], dtype=torch.float32)
n_samples, n_features = X.shape
print(f'#samples: {n_samples}, #features: {n_features}')

input_size = n_features
# The output width is the number of target columns in Y, not the number of
# input features; the two only happen to coincide (both 1) for this dataset.
output_size = Y.shape[1]

# Equivalent shortcut without a custom class: model = nn.Linear(input_size, output_size)

class LinearRegression(nn.Module):
    """Linear regression model consisting of a single ``nn.Linear`` layer."""

    def __init__(self, input_dim, output_dim):
        """Build the layer mapping ``input_dim`` inputs to ``output_dim`` outputs."""
        super().__init__()
        # Define the layers here; nn.Linear is the fully connected layer.
        self.lin = nn.Linear(input_dim, output_dim)

    def forward(self, x):
        """Pass ``x`` through the linear layer and return the prediction."""
        prediction = self.lin(x)
        return prediction

# model is an instance of LinearRegression; calling model(x) runs its forward pass
model = LinearRegression(input_size, output_size)

# Prediction with the freshly initialised model. This is inference only, so
# skip building an autograd graph.
with torch.no_grad():
    print(f'prediction before training:  f(5) = {model(X_test).item():.3f}')

# training
learning_rate = 0.01
n_iters = 100

loss = nn.MSELoss()
# The optimizer updates every parameter the model exposes.
optimizer = torch.optim.SGD(model.parameters(), lr=learning_rate)

for epoch in range(n_iters):
    # forward pass: compute the prediction
    y_pred = model(X)

    # nn.MSELoss takes (input, target): prediction first, ground truth second.
    l = loss(y_pred, Y)

    # backward pass: compute gradients for the model parameters
    l.backward()
    # optimizer.step(): update the parameters from their gradients
    optimizer.step()
    # zero gradient: clear the stored gradients so the next backward() does
    # not accumulate on top of them
    optimizer.zero_grad()

    if epoch % 10 == 0:
        # NOTE: this rebinds the module-level name `w` (a scalar tensor in the
        # earlier cell) to the layer's weight matrix; `b` is the bias.
        [w, b] = model.parameters()
        # The weight is reported after this iteration's update; l was computed before it.
        print(f'epoch {epoch+1}: w = {w[0][0].item():.3f}, loss = {l.item():.8f}')

with torch.no_grad():
    print(f'Prediction after training: f(5) = {model(X_test).item():.3f}')

#samples: 4, #features: 1
prediction before training:  f(5) = -0.913
epoch 1: w = 0.315, loss = 39.27354431
epoch 11: w = 1.749, loss = 1.01692224
epoch 21: w = 1.979, loss = 0.02708483
epoch 31: w = 2.016, loss = 0.00143027
epoch 41: w = 2.021, loss = 0.00072406
epoch 51: w = 2.021, loss = 0.00066580
epoch 61: w = 2.021, loss = 0.00062663
epoch 71: w = 2.020, loss = 0.00059014
epoch 81: w = 2.020, loss = 0.00055579
epoch 91: w = 2.019, loss = 0.00052344
Prediction after training: f(5) = 10.038
