In [1]:
import torch
import torch.nn as nn
import torch.nn.functional as F

import torch.optim as optim

def criterion(out, label):
    return (label - out)**2

# (data / label)
# note floating point number *.*
data = [(1.0,3.0), (2.0,6.0), (3.0,9.0), (4.0,12.0), (5.0,15.0), (6.0,18.0)]

# requires_grad turned on
W = torch.tensor([1.0], requires_grad=True)


X,label = data[1]

Y = X*W
loss = criterion(Y,label) 
loss.backward()

## loss = (label-X*W)**2
## d(loss)/dw = 2*(label-X*W)*(-X)=2*4*(-2)

W.grad

tensor([-16.])

In [2]:
### Training with manually updating W with "Backward" ###

import torch
#from torch.autograd import Variable
import torch.nn as nn
import torch.nn.functional as F

import torch.optim as optim

def criterion(out, label):
    return (label - out)**2


data = [(1.0,3.0), (2.0,6.0), (3.0,9.0), (4.0,12.0), (5.0,15.0), (6.0,18.0)]

W = torch.tensor([1.0], requires_grad=True)

lr = 0.01
temp = torch.tensor([0.0])


for epoch in range(20):
    for i, current_data in enumerate(data):

        W = temp
        W.requires_grad = True
        X, Y = current_data
        outputs = X*W
        loss = criterion(outputs, Y)
        loss.backward()
        W = W - lr* W.grad
        temp = W.detach()    # Not to deliver the grad, but just value
        print("Epoch {} - loss: {}".format(epoch, loss))


### Test the trained network ###            
for i, current_data in enumerate(data):
    X, Y = current_data 
    outputs = X*W  
    print("when x = {}, y = {}".format(X, outputs))

Epoch 0 - loss: tensor([9.], grad_fn=<PowBackward0>)
Epoch 0 - loss: tensor([34.5744], grad_fn=<PowBackward0>)
Epoch 0 - loss: tensor([65.8435], grad_fn=<PowBackward0>)
Epoch 0 - loss: tensor([78.7078], grad_fn=<PowBackward0>)
Epoch 0 - loss: tensor([56.8664], grad_fn=<PowBackward0>)
Epoch 0 - loss: tensor([20.4719], grad_fn=<PowBackward0>)
Epoch 1 - loss: tensor([0.0446], grad_fn=<PowBackward0>)
Epoch 1 - loss: tensor([0.1713], grad_fn=<PowBackward0>)
Epoch 1 - loss: tensor([0.3262], grad_fn=<PowBackward0>)
Epoch 1 - loss: tensor([0.3899], grad_fn=<PowBackward0>)
Epoch 1 - loss: tensor([0.2817], grad_fn=<PowBackward0>)
Epoch 1 - loss: tensor([0.1014], grad_fn=<PowBackward0>)
Epoch 2 - loss: tensor([0.0002], grad_fn=<PowBackward0>)
Epoch 2 - loss: tensor([0.0008], grad_fn=<PowBackward0>)
Epoch 2 - loss: tensor([0.0016], grad_fn=<PowBackward0>)
Epoch 2 - loss: tensor([0.0019], grad_fn=<PowBackward0>)
Epoch 2 - loss: tensor([0.0014], grad_fn=<PowBackward0>)
Epoch 2 - loss: tensor([0.0005

In [1]:
### Training with fancier version ###

import torch
import torch.nn as nn
import torch.nn.functional as F

import torch.optim as optim


class Net(nn.Module): ## nn.Module class is used
    def __init__(self):
        super(Net, self).__init__()
        self.fc1 = nn.Linear(1,1,bias=False)  # in dim, out dim
    def forward(self, x):
        x = self.fc1(x)
        return x

net = Net()

print(net)
print(list(net.parameters())) # parameters are randomized

#input = torch.randn(1)
#out = net(input)

#def criterion(out, label):
#    return (label - out)**2
criterion = nn.MSELoss()


optimizer = optim.SGD(net.parameters(), lr=0.01, momentum=0.5)
#optimizer = optim.Adam(net.parameters(), lr=0.005)


data = [(1.0,3.0), (2.0,6.0), (3.0,9.0), (4.0,12.0), (5.0,15.0), (6.0,18.0)]

for epoch in range(20): # 0 - 19
    for i, current_data in enumerate(data):
        X, Y = current_data
        X, Y = torch.FloatTensor([X]), torch.FloatTensor([Y])
        optimizer.zero_grad()   
        outputs = net(X)
        loss = criterion(outputs, Y)
        loss.backward()
        optimizer.step()    ## This line is equivalent to "W = W - lr* W.grad"
        print("Epoch {} - loss: {}".format(epoch, loss))

### Test the trained network ###            
for i, current_data in enumerate(data):
    X, Y = current_data
    X, Y = torch.FloatTensor([X]), torch.FloatTensor([Y])  
    out = net(torch.FloatTensor(X))  
    print("when x = {}, y = {}".format(X, out))
    

Net(
  (fc1): Linear(in_features=1, out_features=1, bias=False)
)
[Parameter containing:
tensor([[-0.5741]], requires_grad=True)]
Epoch 0 - loss: 12.774344444274902
Epoch 0 - loss: 49.07391357421875
Epoch 0 - loss: 91.39473724365234
Epoch 0 - loss: 96.44080352783203
Epoch 0 - loss: 42.489715576171875
Epoch 0 - loss: 0.20864400267601013
Epoch 1 - loss: 0.3510093092918396
Epoch 1 - loss: 3.348212242126465
Epoch 1 - loss: 9.052931785583496
Epoch 1 - loss: 12.011017799377441
Epoch 1 - loss: 6.783707618713379
Epoch 1 - loss: 0.27688172459602356
Epoch 2 - loss: 0.03688310459256172
Epoch 2 - loss: 0.4305545389652252
Epoch 2 - loss: 1.2311245203018188
Epoch 2 - loss: 1.6813257932662964
Epoch 2 - loss: 0.976023256778717
Epoch 2 - loss: 0.045382533222436905
Epoch 3 - loss: 0.005055175628513098
Epoch 3 - loss: 0.06049667298793793
Epoch 3 - loss: 0.17409490048885345
Epoch 3 - loss: 0.2385275512933731
Epoch 3 - loss: 0.13888661563396454
Epoch 3 - loss: 0.006547001656144857
Epoch 4 - loss: 0.0007154

In [2]:
for epoch in range(20):
    print(epoch)

0
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19


In [3]:
W = torch.tensor([1.0], requires_grad=True)
W = W*2
label = 1.0
loss = W*5 - label 
loss.backward()
W.grad

  W.grad
