In [1]:
import torch
import torch.nn as nn
import torch.nn.functional as F

import torch.optim as optim

def criterion(out, label):
    return (label - out)**2

# (data / label)
# note floating point number *.*
data = [(1.0,3.0), (2.0,6.0), (3.0,9.0), (4.0,12.0), (5.0,15.0), (6.0,18.0)]

# requires_grad turned on
W = torch.tensor([1.0], requires_grad=True)


X,label = data[1]

Y = X*W
loss = criterion(Y,label) 
loss.backward()

## loss = (label-X*W)**2
## d(loss)/dw = 2*(label-X*W)*(-X)=2*4*(-2)

W.grad

tensor([-16.])

In [2]:
### Training with manually updating W with "Backward" ###

import torch
#from torch.autograd import Variable
import torch.nn as nn
import torch.nn.functional as F

import torch.optim as optim

def criterion(out, label):
    return (label - out)**2


data = [(1.0,3.0), (2.0,6.0), (3.0,9.0), (4.0,12.0), (5.0,15.0), (6.0,18.0)]

W = torch.tensor([1.0], requires_grad=True)

lr = 0.01
temp = torch.tensor([0.0])


for epoch in range(20):
    for i, current_data in enumerate(data):
        W = torch.randn(1) # This line is for clean start
        W = temp
        W.requires_grad = True
        X, Y = current_data
        outputs = X*W
        loss = criterion(outputs, Y)
        loss.backward()
        W = W - lr* W.grad
        temp = W.detach()    # Not to deliver the grad, but just value
        print("Epoch {} - loss: {}".format(epoch, loss))


### Test the trained network ###            
for i, current_data in enumerate(data):
    X, Y = current_data 
    outputs = X*W  
    print("when x = {}, y = {}".format(X, outputs))

Epoch 0 - loss: tensor([9.], grad_fn=<PowBackward0>)
Epoch 1 - loss: tensor([0.0446], grad_fn=<PowBackward0>)
Epoch 2 - loss: tensor([0.0002], grad_fn=<PowBackward0>)
Epoch 3 - loss: tensor([1.0940e-06], grad_fn=<PowBackward0>)
Epoch 4 - loss: tensor([5.4275e-09], grad_fn=<PowBackward0>)
Epoch 5 - loss: tensor([2.7512e-11], grad_fn=<PowBackward0>)
Epoch 6 - loss: tensor([5.6843e-14], grad_fn=<PowBackward0>)
Epoch 7 - loss: tensor([0.], grad_fn=<PowBackward0>)
Epoch 8 - loss: tensor([0.], grad_fn=<PowBackward0>)
Epoch 9 - loss: tensor([0.], grad_fn=<PowBackward0>)
Epoch 10 - loss: tensor([0.], grad_fn=<PowBackward0>)
Epoch 11 - loss: tensor([0.], grad_fn=<PowBackward0>)
Epoch 12 - loss: tensor([0.], grad_fn=<PowBackward0>)
Epoch 13 - loss: tensor([0.], grad_fn=<PowBackward0>)
Epoch 14 - loss: tensor([0.], grad_fn=<PowBackward0>)
Epoch 15 - loss: tensor([0.], grad_fn=<PowBackward0>)
Epoch 16 - loss: tensor([0.], grad_fn=<PowBackward0>)
Epoch 17 - loss: tensor([0.], grad_fn=<PowBackward0>

In [8]:
### Training with fancier version ###

import torch
import torch.nn as nn
import torch.nn.functional as F

import torch.optim as optim


class Net(nn.Module): ## nn.Module class is used
    def __init__(self):
        super(Net, self).__init__()
        self.fc1 = nn.Linear(1,1,bias=False)  # in dim, out dim
    def forward(self, x):
        x = self.fc1(x)
        return x

net = Net()

print(net)
print(list(net.parameters())) # parameters are randomized

#input = torch.randn(1)
#out = net(input)

#def criterion(out, label):
#    return (label - out)**2
criterion = nn.MSELoss()


optimizer = optim.SGD(net.parameters(), lr=0.01, momentum=0.5)
#optimizer = optim.Adam(net.parameters(), lr=0.005)


data = [(1.0,3.0), (2.0,6.0), (3.0,9.0), (4.0,12.0), (5.0,15.0), (6.0,18.0)]

for epoch in range(20): # 0 - 19
    for i, current_data in enumerate(data):
        X, Y = current_data
        X, Y = torch.FloatTensor([X]), torch.FloatTensor([Y])
        optimizer.zero_grad()   
        outputs = net(X)
        loss = criterion(outputs, Y)
        loss.backward()
        optimizer.step()    ## This line is equivalent to "W = W - lr* W.grad"
        print("Epoch {} - loss: {}".format(epoch, loss))

### Test the trained network ###            
for i, current_data in enumerate(data):
    X, Y = current_data
    X, Y = torch.FloatTensor([X]), torch.FloatTensor([Y])  
    out = net(torch.FloatTensor(X))  
    print("when x = {}, y = {}".format(X, out))
    

Net(
  (fc1): Linear(in_features=1, out_features=1, bias=False)
)
[Parameter containing:
tensor([[0.0291]], requires_grad=True)]
Epoch 0 - loss: 8.826212882995605
Epoch 0 - loss: 33.90678024291992
Epoch 0 - loss: 63.14763259887695
Epoch 0 - loss: 66.63410186767578
Epoch 0 - loss: 29.357547760009766
Epoch 0 - loss: 0.14416028559207916
Epoch 1 - loss: 0.2425241470336914
Epoch 1 - loss: 2.3133928775787354
Epoch 1 - loss: 6.254979133605957
Epoch 1 - loss: 8.298823356628418
Epoch 1 - loss: 4.68709659576416
Epoch 1 - loss: 0.19130779802799225
Epoch 2 - loss: 0.025483811274170876
Epoch 2 - loss: 0.29748523235321045
Epoch 2 - loss: 0.8506273627281189
Epoch 2 - loss: 1.1616873741149902
Epoch 2 - loss: 0.6743685007095337
Epoch 2 - loss: 0.03135670721530914
Epoch 3 - loss: 0.003492799587547779
Epoch 3 - loss: 0.04179926961660385
Epoch 3 - loss: 0.1202886551618576
Epoch 3 - loss: 0.16480745375156403
Epoch 3 - loss: 0.09596136212348938
Epoch 3 - loss: 0.004523750860244036
Epoch 4 - loss: 0.00049435

In [6]:
for epoch in range(20):
    print(epoch)

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19


In [15]:
W = torch.tensor([1.0], requires_grad=True)
W = W*2
label = 1.0
loss = W*5 - label 
loss.backward()
W.grad

  W.grad


  W.grad
