In [1]:
# Import Numpy & PyTorch
import numpy as np
import torch

## Linear Regression Model using PyTorch built-ins

Let's re-implement the same model using some built-in functions and classes from PyTorch.

This time the model predicts two targets at once: the yields of apples and oranges.

In [2]:
# Imports
import torch.nn as nn

In [3]:
# Input (temp, rainfall, humidity): five distinct observations, tiled three
# times along the row axis to give 15 samples
inputs = np.tile(
    np.array([[73, 67, 43],
              [91, 88, 64],
              [87, 134, 58],
              [102, 43, 37],
              [69, 96, 70]], dtype='float32'),
    (3, 1),
)
# Targets (apples, oranges): the five matching rows, tiled in the same order
targets = np.tile(
    np.array([[56, 70],
              [81, 101],
              [119, 133],
              [22, 37],
              [103, 119]], dtype='float32'),
    (3, 1),
)

In [4]:
# Convert the NumPy arrays to tensors. `torch.as_tensor` shares memory with a
# NumPy array just like `torch.from_numpy`, but it also accepts a tensor, so
# re-running this cell once `inputs`/`targets` are already tensors is a no-op
# instead of a TypeError.
inputs = torch.as_tensor(inputs)
targets = torch.as_tensor(targets)

### Dataset and DataLoader

We'll create a `TensorDataset`, which allows access to rows from `inputs` and `targets` as tuples. We'll also create a `DataLoader` to split the data into batches while training; it also provides utilities such as shuffling and sampling.

In [5]:
# Import tensor dataset & data loader
from torch.utils.data import TensorDataset, DataLoader

In [6]:
# Pair every input row with its target row
dataset = TensorDataset(inputs, targets)
# Peek at the first three (inputs, targets) rows
dataset[:3]

(tensor([[ 73.,  67.,  43.],
         [ 91.,  88.,  64.],
         [ 87., 134.,  58.]]),
 tensor([[ 56.,  70.],
         [ 81., 101.],
         [119., 133.]]))

In [7]:

# Serve the dataset in shuffled mini-batches of five rows
batch_size = 5
DL = DataLoader(dataset, batch_size=batch_size, shuffle=True)
# Pull a single batch to inspect its structure
next(iter(DL))

[tensor([[ 73.,  67.,  43.],
         [ 73.,  67.,  43.],
         [ 87., 134.,  58.],
         [ 87., 134.,  58.],
         [102.,  43.,  37.]]),
 tensor([[ 56.,  70.],
         [ 56.,  70.],
         [119., 133.],
         [119., 133.],
         [ 22.,  37.]])]

### nn.Linear
Instead of initializing the weights & biases manually, we can define the model using `nn.Linear`.

In [8]:
# Linear layer mapping 3 input features to 2 outputs; its weight and bias
# are created (randomly initialised) by `nn.Linear` itself
final_model = nn.Linear(in_features=3, out_features=2)
print(final_model.weight, end="\n---------\n")
print(final_model.bias)

Parameter containing:
tensor([[ 0.5308,  0.3008, -0.5706],
        [ 0.4220, -0.2781, -0.2469]], requires_grad=True)
---------
Parameter containing:
tensor([-0.2845,  0.2698], requires_grad=True)


### Optimizer
Instead of manually manipulating the weights & biases using gradients, we can use the optimizer `optim.SGD`.

In [9]:
# Stochastic gradient descent over the layer's parameters
opt = torch.optim.SGD(params=final_model.parameters(), lr=1e-5)

### Loss Function
Instead of defining a loss function manually, we can use the built-in loss function `mse_loss`.

In [10]:
# Import nn.functional
import torch.nn.functional as F

In [11]:
# Define loss function
# The function object itself is bound (not called), so it can be invoked
# later as `loss_fn(predictions, targets)`.
loss_fn = F.mse_loss

In [12]:
# Loss of the freshly initialised model over the full dataset
initial_preds = final_model(inputs)
loss = loss_fn(initial_preds, targets)
print(loss)

tensor(6830.4658, grad_fn=<MseLossBackward>)


### Train the model

We are ready to train the model now. We can define a utility function `fit` which trains the model for a given number of epochs.

In [13]:
# Define a utility function to train the model
def fit(num_epochs, final_model, loss_fn, opt, train_dl=None):
    """Train `final_model` with mini-batch gradient descent, then print its loss.

    Args:
        num_epochs: Number of full passes over the data loader.
        final_model: Callable model (e.g. an `nn.Linear`) whose parameters
            `opt` updates.
        loss_fn: Callable `loss_fn(pred, target)` returning a scalar tensor.
            The reported loss weights each batch by its size, which assumes
            `loss_fn` averages over the batch (as `F.mse_loss` does by default).
        opt: Optimizer built over `final_model`'s parameters.
        train_dl: Iterable yielding `(xb, yb)` batches. When omitted, the
            notebook-level `DL` is used, so four-argument calls keep working.

    Returns:
        None. The final loss is printed; nothing is printed if the loader
        yields no batches.
    """
    if train_dl is None:
        train_dl = DL

    for epoch in range(num_epochs):
        for xb, yb in train_dl:
            # Generate predictions
            pred = final_model(xb)
            loss = loss_fn(pred, yb)
            # Perform gradient descent
            loss.backward()
            opt.step()
            # Reset gradients so the next batch does not accumulate onto them
            opt.zero_grad()

    # Report the loss over the data that was trained on. It is read from the
    # loader rather than from notebook globals (which later cells rebind), and
    # computed under no_grad because the value is only displayed.
    total, count = 0.0, 0
    with torch.no_grad():
        for xb, yb in train_dl:
            total = total + loss_fn(final_model(xb), yb) * len(xb)
            count += len(xb)
    if count:
        print('Training loss: ', total / count)


In [14]:

# Run 100 training epochs; `fit` prints the resulting training loss
fit(num_epochs=100, final_model=final_model, loss_fn=loss_fn, opt=opt)

Training loss:  tensor(74.6290, grad_fn=<MseLossBackward>)


In [15]:

# Generate predictions
# Run the trained layer on every input row; the bare `preds` on the last line
# makes the notebook display the resulting tensor.
preds = final_model(inputs)
preds

tensor([[ 59.1765,  72.4023],
        [ 77.3886,  97.6060],
        [126.5622, 136.5799],
        [ 32.3130,  48.4546],
        [ 86.9168, 107.1836],
        [ 59.1765,  72.4023],
        [ 77.3886,  97.6060],
        [126.5622, 136.5799],
        [ 32.3130,  48.4546],
        [ 86.9168, 107.1836],
        [ 59.1765,  72.4023],
        [ 77.3886,  97.6060],
        [126.5622, 136.5799],
        [ 32.3130,  48.4546],
        [ 86.9168, 107.1836]], grad_fn=<AddmmBackward>)

In [16]:
# Compare with targets
# Display the ground-truth values so they can be read against `preds`.
targets

tensor([[ 56.,  70.],
        [ 81., 101.],
        [119., 133.],
        [ 22.,  37.],
        [103., 119.],
        [ 56.,  70.],
        [ 81., 101.],
        [119., 133.],
        [ 22.,  37.],
        [103., 119.],
        [ 56.,  70.],
        [ 81., 101.],
        [119., 133.],
        [ 22.,  37.],
        [103., 119.]])

The model, optimizer and loss function are defined exactly as before, so we can simply keep training the same model for another 100 epochs to reduce the loss further.

In [17]:
# Train for a further 100 epochs, continuing from the current parameters
fit(num_epochs=100, final_model=final_model, loss_fn=loss_fn, opt=opt)

Training loss:  tensor(30.9783, grad_fn=<MseLossBackward>)


## Exercise 1:
 Try linear regression using only NumPy (without TensorFlow, PyTorch, or any other deep-learning library). You may optionally use scikit-learn.
 
 
## Exercise 2:
 Try linear regression on the same data using TensorFlow.

 

In [18]:
# Input (temp, rainfall, humidity): the five distinct observations, stacked
# three times to form 15 NumPy rows
inputs = np.tile(
    np.array([[73, 67, 43],
              [91, 88, 64],
              [87, 134, 58],
              [102, 43, 37],
              [69, 96, 70]], dtype='float32'),
    (3, 1),
)
# Targets (apples, oranges): the matching five rows, stacked the same way
targets = np.tile(
    np.array([[56, 70],
              [81, 101],
              [119, 133],
              [22, 37],
              [103, 119]], dtype='float32'),
    (3, 1),
)

# (n_samples, n_features); later cells divide by x_shape[0]
x_shape = inputs.shape

In [19]:

# weights and biases
# Draw the starting parameters from a seeded generator so that
# Restart & Run All reproduces the same initial values (and losses) each time.
rng = np.random.default_rng(42)
# One row per output (apples, oranges), one column per input feature
weights = rng.random((2, 3))
# NOTE(review): one bias row per training sample (15 x 2), matching the shape
# of `targets`. The gradient and update cells below rely on this shape; a
# conventional linear model would share a single bias per output, but changing
# that requires editing those cells together.
biases = rng.random((15, 2))
print("Weights:",weights,sep='\n')
print("Biases:",biases,sep="\n")

Weights:
[[0.12596533 0.62409758 0.18406869]
 [0.89527824 0.15662874 0.72851021]]
Biases:
[[0.71687701 0.78010178]
 [0.26797523 0.33826072]
 [0.96269716 0.90093092]
 [0.77980285 0.14769618]
 [0.51185647 0.18716205]
 [0.77718148 0.272468  ]
 [0.83991725 0.3393861 ]
 [0.2295112  0.46223362]
 [0.67177959 0.19421075]
 [0.35713336 0.19674661]
 [0.12734    0.07940858]
 [0.56644807 0.2378777 ]
 [0.67144469 0.04354616]
 [0.95352633 0.09169035]
 [0.59077171 0.22279846]]


In [20]:
# Define the model
def model(x):
    """Return `x` times the transposed global `weights`, plus the global `biases`."""
    projected = x @ weights.T
    return projected + biases

In [21]:

# Generate predictions
# Uses the randomly initialised `weights` and `biases`, before any update step.
preds = model(inputs)

In [22]:
# Compare with targets
# `sep="\n"` puts each label on its own line above the array it describes.
print("Predictions : ", preds, sep="\n")
print("Targets : ",targets, sep="\n")

Predictions : 
[[ 59.64183783 107.95547842]
 [ 78.43180367 142.2165638 ]
 [106.22674084 142.03198199]
 [ 47.27500434 125.15599066]
 [ 82.00164031 127.99343506]
 [ 59.7021423  107.44784463]
 [ 79.00374569 142.21768919]
 [105.49355489 141.59328469]
 [ 47.16698108 125.20250522]
 [ 81.84691719 128.00301963]
 [ 59.05230083 107.25478522]
 [ 78.73027651 142.11618078]
 [105.93548838 141.17459724]
 [ 47.44872782 125.09998483]
 [ 82.08055555 128.02907148]]
Targets : 
[[ 56.  70.]
 [ 81. 101.]
 [119. 133.]
 [ 22.  37.]
 [103. 119.]
 [ 56.  70.]
 [ 81. 101.]
 [119. 133.]
 [ 22.  37.]
 [103. 119.]
 [ 56.  70.]
 [ 81. 101.]
 [119. 133.]
 [ 22.  37.]
 [103. 119.]]


In [23]:
# MSE loss
def mse(t1, t2):
    """Sum of squared differences between `t1` and `t2`, divided by `len` of the difference.

    Note that the divisor is the length of the first axis (the number of
    rows), not the total number of elements.
    """
    residual = t1 - t2
    squared = np.square(residual)
    return np.sum(squared) / len(residual)

In [24]:
# Compute loss
# Loss of the initial predictions, before any parameter update.
loss = mse(preds, targets)
print(loss)

2460.781496581987


In [25]:
# compute gradients
# Prediction error, shared by both gradient expressions
error = preds - targets
n_samples = x_shape[0]
# Gradient w.r.t. each bias entry: 2 * error / number of rows
biases_grad = error * 2 / n_samples
# Gradient w.r.t. the weights: error^T @ inputs, scaled the same way
weights_grad = (error.T @ inputs) * 2 / n_samples

print("weights_grad:",weights_grad, sep="\n")
print("biases_grad:",biases_grad, sep="\n")

weights_grad:
[[   13.7377909  -1062.46478765  -517.24230427]
 [ 6740.16611682  4779.1837832   3456.62255232]]
biases_grad:
[[ 0.48557838  5.06073046]
 [-0.34242618  5.49554184]
 [-1.70310122  1.20426427]
 [ 3.37000058 11.75413209]
 [-2.79978129  1.19912468]
 [ 0.49361897  4.99304595]
 [-0.26616724  5.49569189]
 [-1.80085935  1.14577129]
 [ 3.35559748 11.76033403]
 [-2.82041104  1.20040262]
 [ 0.40697344  4.9673047 ]
 [-0.3026298   5.48215744]
 [-1.74193488  1.0899463 ]
 [ 3.39316371 11.74666464]
 [-2.78925926  1.2038762 ]]


Adjust the weights and biases by taking a small step against their gradients

In [26]:
# Step both parameter arrays against their gradients, in place
learning_rate = 1e-5
weights -= learning_rate * weights_grad
biases -= learning_rate * biases_grad

In [27]:
# Show the parameters after the single update step above
print("Weights:",weights,sep='\n')
print("Biases:",biases,sep="\n")

Weights:
[[0.12582796 0.63472223 0.18924111]
 [0.82787658 0.10883691 0.69394399]]
Biases:
[[0.71687216 0.78005118]
 [0.26797865 0.33820576]
 [0.96271419 0.90091888]
 [0.77976915 0.14757864]
 [0.51188447 0.18715006]
 [0.77717654 0.27241807]
 [0.83991991 0.33933115]
 [0.22952921 0.46222216]
 [0.67174604 0.19409315]
 [0.35716156 0.19673461]
 [0.12733593 0.07935891]
 [0.5664511  0.23782288]
 [0.67146211 0.04353526]
 [0.9534924  0.09157289]
 [0.59079961 0.22278642]]


In [28]:
# Calculate loss
# Re-run the forward pass with the updated parameters and measure the loss again.
preds = model(inputs)
loss = mse(preds, targets)
print(loss)

1784.8966030762442


In [29]:
# Repeat the gradient-descent step 200 more times
for step in range(200):
    # Forward pass through `model`, reused for both the loss and the
    # gradients so the two can never drift apart
    preds = model(inputs)
    loss = mse(preds, targets)

    # Gradients of `mse` (sum of squared errors / number of rows)
    error = preds - targets
    biases_grad = error * 2 / x_shape[0]
    weights_grad = np.matmul(np.transpose(error), inputs) * 2 / x_shape[0]

    # In-place update with learning rate 1e-5
    weights -= weights_grad * 1e-5
    biases -= biases_grad * 1e-5

In [30]:
# Calculate loss
# Forward pass and loss with the parameters left by the 200-step loop.
preds = model(inputs)
loss = mse(preds, targets)
print(loss)

21.66265757735055


In [31]:
# Print predictions
# `preds` was recomputed in the previous cell, after the training loop.
print(preds)

[[ 57.98892842  71.76988012]
 [ 79.7953977  100.40364218]
 [122.66834403 132.62208658]
 [ 24.51684708  42.2187479 ]
 [ 96.43250042 115.43226239]
 [ 58.04921672  71.26238236]
 [ 80.36718646 100.40476727]
 [121.93535455 132.18350683]
 [ 24.40885277  42.26525   ]
 [ 96.27781876 115.44184439]
 [ 57.39954938  71.06937468]
 [ 80.09379056 100.30328607]
 [122.37716961 131.76493157]
 [ 24.69052401  42.16275708]
 [ 96.51139451 115.46788926]]


In [32]:
# Print targets
# Ground-truth values, for comparison with the predictions printed above.
print(targets)

[[ 56.  70.]
 [ 81. 101.]
 [119. 133.]
 [ 22.  37.]
 [103. 119.]
 [ 56.  70.]
 [ 81. 101.]
 [119. 133.]
 [ 22.  37.]
 [103. 119.]
 [ 56.  70.]
 [ 81. 101.]
 [119. 133.]
 [ 22.  37.]
 [103. 119.]]
