In [5]:
import torch
#from torch.autograd import Variable

x_data = [1.0, 2.0, 3.0]
y_data = [2.0, 4.0, 6.0]


w = torch.tensor([1.0], requires_grad=True)

In [6]:
def forward(x):
    return x * w

# Loss function
def loss(x, y):
    y_pred = forward(x)
    return (y_pred - y) * (y_pred - y)

# Before training
print("predict (before training)",  4, forward(4).data[0])


predict (before training) 4 tensor(4.)


In [7]:
# Training loop
for epoch in range(10):
    for x_val, y_val in zip(x_data, y_data):
        l = loss(x_val, y_val)
        l.backward()
        print("\tgrad: ", x_val, y_val, w.grad.data[0])
        w.data = w.data - 0.01 * w.grad.data

        # Manually zero the gradients after updating weights
        w.grad.data.zero_()

    print("progress:", epoch, l.data[0])

# After training
print("predict (after training)",  4, forward(4).data[0])


	grad:  1.0 2.0 tensor(-2.)
	grad:  2.0 4.0 tensor(-7.8400)
	grad:  3.0 6.0 tensor(-16.2288)
progress: 0 tensor(7.3159)
	grad:  1.0 2.0 tensor(-1.4786)
	grad:  2.0 4.0 tensor(-5.7962)
	grad:  3.0 6.0 tensor(-11.9981)
progress: 1 tensor(3.9988)
	grad:  1.0 2.0 tensor(-1.0932)
	grad:  2.0 4.0 tensor(-4.2852)
	grad:  3.0 6.0 tensor(-8.8704)
progress: 2 tensor(2.1857)
	grad:  1.0 2.0 tensor(-0.8082)
	grad:  2.0 4.0 tensor(-3.1681)
	grad:  3.0 6.0 tensor(-6.5580)
progress: 3 tensor(1.1946)
	grad:  1.0 2.0 tensor(-0.5975)
	grad:  2.0 4.0 tensor(-2.3422)
	grad:  3.0 6.0 tensor(-4.8484)
progress: 4 tensor(0.6530)
	grad:  1.0 2.0 tensor(-0.4417)
	grad:  2.0 4.0 tensor(-1.7316)
	grad:  3.0 6.0 tensor(-3.5845)
progress: 5 tensor(0.3569)
	grad:  1.0 2.0 tensor(-0.3266)
	grad:  2.0 4.0 tensor(-1.2802)
	grad:  3.0 6.0 tensor(-2.6500)
progress: 6 tensor(0.1951)
	grad:  1.0 2.0 tensor(-0.2414)
	grad:  2.0 4.0 tensor(-0.9465)
	grad:  3.0 6.0 tensor(-1.9592)
progress: 7 tensor(0.1066)
	grad:  1.0 2.0 te

# [Online Derivatives](https://www.derivative-calculator.net/)

## Multiple weights

In [5]:
import numpy as np
import matplotlib.pyplot as plt
x_data = [1.0, 2.0, 3.0]
y_data = [2.0, 4.0, 6.0]


w1 = 1.0  # a random guess: random value, 1.0
w2 = 1.0
b = 1.0

# our model for the forward pass
def forward(x):
    return x ** 2 * w2 + x * w1 +b

# Loss function
def loss(x, y):
    y_pred = forward(x)
    return (y_pred - y) * (y_pred - y)

# compute gradient
def gradientb(x, y):  # d_loss/d_w
    return 2 * (b - y + w2 * x **2 + w1 * x)

# compute gradient
def gradientw1(x, y):  # d_loss/d_w
    return 2 * x * (x * w1 - y + w2 * x ** 2 + b)

# compute gradient
def gradientw2(x, y):  # d_loss/d_w
    return 2 * x ** 2 * (x ** 2 * w2 - y + w1 * x + b)



# Before training
print("predict (before training)",  4, forward(4))

# Training loop
for epoch in range(10):
    for x_val, y_val in zip(x_data, y_data):
        gradb = gradientb(x_val, y_val)
        gradw1 = gradientw1(x_val, y_val)
        gradw2 = gradientw2(x_val, y_val)
        b = w - 0.01 * gradb
        w1 = w1 - 0.01 * gradw1
        w2 = w2 - 0.01 * gradw2
        print("\tgradb: ", x_val, y_val, gradb)
        l = loss(x_val, y_val)

    print("progress:", epoch, "w=", w, "loss=", l)

# After training
print("predict (after training)",  "4 hours", forward(4))


predict (before training) 4 21.0
	gradb:  1.0 2.0 2.0
	gradb:  2.0 4.0 tensor([7.6224], grad_fn=<MulBackward>)
	gradb:  3.0 6.0 tensor([8.8671], grad_fn=<MulBackward>)
progress: 0 w= tensor([1.9512], requires_grad=True) loss= tensor([12.6686], grad_fn=<ThMulBackward>)
	gradb:  1.0 2.0 tensor([0.6023], grad_fn=<MulBackward>)
	gradb:  2.0 4.0 tensor([-2.9193], grad_fn=<MulBackward>)
	gradb:  3.0 6.0 tensor([-4.5753], grad_fn=<MulBackward>)
progress: 1 w= tensor([1.9512], requires_grad=True) loss= tensor([3.4102], grad_fn=<ThMulBackward>)
	gradb:  1.0 2.0 tensor([2.2954], grad_fn=<MulBackward>)
	gradb:  2.0 4.0 tensor([1.7823], grad_fn=<MulBackward>)
	gradb:  3.0 6.0 tensor([1.5181], grad_fn=<MulBackward>)
progress: 2 w= tensor([1.9512], requires_grad=True) loss= tensor([0.3655], grad_fn=<ThMulBackward>)
	gradb:  1.0 2.0 tensor([1.5035], grad_fn=<MulBackward>)
	gradb:  2.0 4.0 tensor([-0.3704], grad_fn=<MulBackward>)
	gradb:  3.0 6.0 tensor([-1.2211], grad_fn=<MulBackward>)
progress: 3 w=