In [0]:
import torch
import torchvision
import torch.nn as nn
import numpy as np
import torchvision.transforms as transforms

In [0]:
# Three scalar leaf tensors (x=1, w=2, b=3). requires_grad=True asks autograd
# to track operations on them so gradients can be computed for each later.
x, w, b = (torch.tensor(value, requires_grad=True) for value in (1., 2., 3.))

In [0]:
# Record the affine expression y = w*x + b in the autograd graph:
# first the product of w and x, then the addition of b.
y = torch.add(torch.mul(w, x), b)

In [0]:
# compute gradients: backpropagate from y (a scalar, since x, w and b are
# scalars) and fill in .grad on the tensors created with requires_grad=True
y.backward()

In [6]:
# Show dy/dx, dy/dw and dy/db, one per line.
# For y = w*x + b these are w, x and 1 respectively.
print(x.grad, w.grad, b.grad, sep="\n")

tensor(2.)
tensor(1.)
tensor(1.)


In [0]:
# Seed PyTorch's global RNG so the random data drawn here (and any random
# initialisation performed after it) is identical on every
# Restart Kernel -> Run All. The value 0 is arbitrary; any fixed integer works.
torch.manual_seed(0)

# create tensors of shape (10, 3) and (10, 2), drawn from a standard normal
# distribution: x is fed to the linear layer below and y is the target its
# predictions are compared against
x = torch.randn(10, 3)
y = torch.randn(10, 2)

In [8]:
# Fully connected layer mapping 3 input features to 2 output features;
# nn.Linear creates its own weight matrix and bias vector.
linear = nn.Linear(in_features=3, out_features=2)

# Inspect the freshly created parameters.
print('w: ', linear.weight)
print('b: ', linear.bias)

w:  Parameter containing:
tensor([[-0.4549, -0.2026, -0.4567],
        [ 0.1771,  0.0871,  0.4816]], requires_grad=True)
b:  Parameter containing:
tensor([-0.3535,  0.4477], requires_grad=True)


In [0]:
# Mean-squared-error objective (averaged over all elements, which is the
# default reduction), and plain SGD over the layer's weight and bias.
criterion = nn.MSELoss(reduction='mean')
optimizer = torch.optim.SGD(params=linear.parameters(), lr=1e-2)

In [0]:
# forward pass: apply the linear layer to the (10, 3) input batch, giving one
# 2-feature prediction per row
pred = linear(x)

In [11]:
# Score the predictions against the targets with the criterion and report
# the resulting scalar as a plain Python float.
loss = criterion(input=pred, target=y)
print('loss: ', loss.item())

loss:  2.172520399093628


In [0]:
# backward pass
# Clear any gradients left over from an earlier backward() first: autograd
# accumulates into .grad, so re-running the forward / loss / backward cells
# would otherwise add the new gradients onto the old ones and the optimizer
# would step with the wrong values. On a fresh kernel this is a no-op because
# no gradients exist yet.
optimizer.zero_grad()
loss.backward()

In [13]:
# print out the gradients of the loss with respect to the layer's weight
# (dL/dw) and bias (dL/db), as populated by loss.backward()
print('dL/dw: ', linear.weight.grad)
print('dL/db: ', linear.bias.grad)

dL/dw:  tensor([[-0.5859, -0.4575, -0.1959],
        [ 0.0080,  0.0669,  0.1434]])
dL/db:  tensor([0.6162, 0.9035])


In [0]:
# 1-step gradient descent: the SGD optimizer (lr=0.01) updates the layer's
# weight and bias in place using the gradients stored in their .grad fields
optimizer.step()

In [15]:
# Re-run the forward pass with the updated parameters and report the new
# loss, for comparison with the value printed before the optimizer step.
pred = linear(x)
loss = criterion(input=pred, target=y)
print('loss after 1 step optimization: ', loss.item())

loss after 1 step optimization:  2.1544740200042725


In [0]:
# NumPy <-> PyTorch round trip on a small 2x2 integer matrix.
x = np.array([
    [1, 2],
    [3, 4],
])

# ndarray -> tensor. from_numpy wraps the array's buffer instead of copying,
# so writes through either object are visible through the other.
y = torch.from_numpy(x)

# tensor -> ndarray. Again a view onto the same underlying memory.
z = y.numpy()