In [1]:
import torch
import torch.nn as nn
import torch.nn.functional as F

import torch.optim as optim

def criterion(out, label):
    """Return the squared error between a target and a prediction.

    Args:
        out: Predicted value (a plain number or a tensor).
        label: Target value (a plain number or a tensor).

    Returns:
        ``(label - out) ** 2``; elementwise when tensors are passed.
    """
    residual = label - out
    return residual ** 2

# Toy dataset of (input, label) pairs that follow label = 3 * input.
# Every value is built as a Python float so the tensor math stays in floating point.
data = [(float(x), 3.0 * x) for x in range(1, 7)]

# Single trainable weight, initialised to 1.0 with gradient tracking switched on.
W = torch.ones(1, requires_grad=True)

# Work with the second sample only: X = 2.0, label = 6.0.
X, label = data[1]

# Forward pass followed by the squared-error loss for that one sample.
Y = W * X
loss = criterion(Y, label)

# Backpropagate so that W.grad holds d(loss)/dW.
loss.backward()

# Check by hand:
#   loss       = (label - X*W)**2
#   d(loss)/dW = 2*(label - X*W)*(-X) = 2*4*(-2) = -16
W.grad

tensor([-16.])

In [3]:
### Training by manually updating W from gradients computed with backward() ###

import torch
#from torch.autograd import Variable
import torch.nn as nn
import torch.nn.functional as F

import torch.optim as optim

def criterion(out, label):
    """Squared-error loss for one prediction/target pair.

    Args:
        out: Model output (a plain number or a tensor).
        label: Expected value (a plain number or a tensor).

    Returns:
        The square of ``label - out``; elementwise when tensors are passed.
    """
    error = label - out
    return error ** 2


# (input, target) pairs that follow target = 3 * input.
data = [(1.0,3.0), (2.0,6.0), (3.0,9.0), (4.0,12.0), (5.0,15.0), (6.0,18.0)]

# Single trainable weight; training starts from 0.0.
W = torch.tensor([0.0], requires_grad=True)

# Step size of the gradient-descent update.
lr = 0.01


for epoch in range(20):
    for X, Y in data:
        # Forward pass and per-sample squared error.
        outputs = X*W
        loss = criterion(outputs, Y)
        loss.backward()
        # Gradient-descent step. It is done in place under no_grad so that W
        # remains the same gradient-tracking tensor and the update itself is
        # not recorded by autograd.
        with torch.no_grad():
            W -= lr * W.grad
        # backward() accumulates into W.grad, so clear it before the next sample.
        W.grad.zero_()
        print("Epoch {} - loss: {}".format(epoch, loss))


### Test the trained network ###
# Predictions only: no gradients are needed here.
with torch.no_grad():
    for X, Y in data:
        outputs = X*W
        print("when x = {}, y = {}".format(X, outputs))

Epoch 0 - loss: tensor([9.], grad_fn=<PowBackward0>)
Epoch 0 - loss: tensor([34.5744], grad_fn=<PowBackward0>)
Epoch 0 - loss: tensor([65.8435], grad_fn=<PowBackward0>)
Epoch 0 - loss: tensor([78.7078], grad_fn=<PowBackward0>)
Epoch 0 - loss: tensor([56.8664], grad_fn=<PowBackward0>)
Epoch 0 - loss: tensor([20.4719], grad_fn=<PowBackward0>)
Epoch 1 - loss: tensor([0.0446], grad_fn=<PowBackward0>)
Epoch 1 - loss: tensor([0.1713], grad_fn=<PowBackward0>)
Epoch 1 - loss: tensor([0.3262], grad_fn=<PowBackward0>)
Epoch 1 - loss: tensor([0.3899], grad_fn=<PowBackward0>)
Epoch 1 - loss: tensor([0.2817], grad_fn=<PowBackward0>)
Epoch 1 - loss: tensor([0.1014], grad_fn=<PowBackward0>)
Epoch 2 - loss: tensor([0.0002], grad_fn=<PowBackward0>)
Epoch 2 - loss: tensor([0.0008], grad_fn=<PowBackward0>)
Epoch 2 - loss: tensor([0.0016], grad_fn=<PowBackward0>)
Epoch 2 - loss: tensor([0.0019], grad_fn=<PowBackward0>)
Epoch 2 - loss: tensor([0.0014], grad_fn=<PowBackward0>)
Epoch 2 - loss: tensor([0.0005

In [4]:
### Training with fancier version ###

import torch
import torch.nn as nn
import torch.nn.functional as F

import torch.optim as optim


class Net(nn.Module):
    """Minimal model built on nn.Module: one linear layer without a bias term."""

    def __init__(self):
        super().__init__()
        # One input feature, one output feature, no bias.
        self.fc1 = nn.Linear(1, 1, bias=False)

    def forward(self, x):
        """Pass ``x`` through the linear layer and return the result."""
        return self.fc1(x)

net = Net()

print(net)
print(list(net.parameters())) # parameters are randomized

# Built-in mean-squared-error loss, used here in place of the hand-written
# squared-error criterion from the earlier cells.
criterion = nn.MSELoss()


optimizer = optim.SGD(net.parameters(), lr=0.01, momentum=0.5)
#optimizer = optim.Adam(net.parameters(), lr=0.005)


# (input, target) pairs that follow target = 3 * input.
data = [(1.0,3.0), (2.0,6.0), (3.0,9.0), (4.0,12.0), (5.0,15.0), (6.0,18.0)]

for epoch in range(20): # 0 - 19
    for X, Y in data:
        # Wrap the Python floats as one-element float32 tensors for the model.
        X = torch.tensor([X], dtype=torch.float32)
        Y = torch.tensor([Y], dtype=torch.float32)
        # Gradients accumulate across backward() calls, so reset them first.
        optimizer.zero_grad()
        outputs = net(X)
        loss = criterion(outputs, Y)
        loss.backward()
        # Apply the optimizer's update rule. Plain SGD would be
        # "W = W - lr * W.grad"; with momentum=0.5 a velocity term is added,
        # so the step is not exactly that expression.
        optimizer.step()
        print("Epoch {} - loss: {}".format(epoch, loss))

### Test the trained network ###
# Predictions only: targets are not needed and gradient tracking is switched off.
with torch.no_grad():
    for X, Y in data:
        X = torch.tensor([X], dtype=torch.float32)
        out = net(X)
        print("when x = {}, y = {}".format(X, out))
    

Net(
  (fc1): Linear(in_features=1, out_features=1, bias=False)
)
[Parameter containing:
tensor([[-0.0864]], requires_grad=True)]
Epoch 0 - loss: 9.525641441345215
Epoch 0 - loss: 36.59370422363281
Epoch 0 - loss: 68.1517333984375
Epoch 0 - loss: 71.91449737548828
Epoch 0 - loss: 31.683963775634766
Epoch 0 - loss: 0.15558268129825592
Epoch 1 - loss: 0.26174238324165344
Epoch 1 - loss: 2.4967117309570312
Epoch 1 - loss: 6.750637531280518
Epoch 1 - loss: 8.956439018249512
Epoch 1 - loss: 5.058509826660156
Epoch 1 - loss: 0.2064681500196457
Epoch 2 - loss: 0.02750319242477417
Epoch 2 - loss: 0.32105863094329834
Epoch 2 - loss: 0.9180330038070679
Epoch 2 - loss: 1.2537418603897095
Epoch 2 - loss: 0.7278085947036743
Epoch 2 - loss: 0.033841267228126526
Epoch 3 - loss: 0.0037695716600865126
Epoch 3 - loss: 0.0451115146279335
Epoch 3 - loss: 0.12982025742530823
Epoch 3 - loss: 0.17786748707294464
Epoch 3 - loss: 0.10356582701206207
Epoch 3 - loss: 0.004882082808762789
Epoch 4 - loss: 0.000533

In [5]:
# Sanity check: range(20) yields the epoch indices 0 through 19.
for epoch in range(20):
    print(epoch)

0
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19


In [6]:
# Experiment: what does .grad hold after the name W has been rebound?
# Start from a tensor with gradient tracking enabled.
W = torch.tensor([1.0], requires_grad=True)
# Rebinds the name W to the result of W*2; the tensor created on the previous
# line is no longer reachable through this name.
W = W*2
label = 1.0
loss = W*5 - label 
loss.backward()
# NOTE(review): W now names the intermediate product, not the tensor created
# with requires_grad=True, so this reads .grad of that intermediate result.
# Presumably that is the point of the experiment (it mirrors the
# "W = W - lr*W.grad" rebinding in the manual training cell) — confirm.
W.grad

  W.grad


  W.grad
