# PyTorch Basics

https://github.com/yunjey/pytorch-tutorial/blob/master/tutorials/01-basics/pytorch_basics/main.py

In [1]:
import torch
import torchvision
import torch.nn as nn
import numpy as np
import torchvision.transforms as transforms

## Basic autograd example 1

In [2]:
# Three scalar leaf tensors; requires_grad=True asks autograd to track them.
x, w, b = (torch.tensor(value, requires_grad=True) for value in (1., 2., 3.))

# Forward pass: y is an affine function of x, recorded in the autograd graph.
y = torch.add(torch.mul(w, x), b)

# Backward pass: fills in x.grad, w.grad and b.grad.
y.backward()

In [3]:
# Gradient of y with respect to x: d(w*x + b)/dx = w = 2
x.grad

tensor(2.)

In [4]:
# Gradient of y with respect to w: d(w*x + b)/dw = x = 1
w.grad

tensor(1.)

In [5]:
# Gradient of y with respect to b: d(w*x + b)/db = 1
b.grad

tensor(1.)

## Basic autograd example 2  

In [11]:
# Random inputs of shape (10, 3) and random targets of shape (10, 2).
x, y = torch.randn(10, 3), torch.randn(10, 2)

# Fully connected layer mapping 3 input features to 2 output features.
linear = nn.Linear(in_features=3, out_features=2)

# Show the freshly initialized parameters.
print('w: ', linear.weight)
print('b: ', linear.bias)

w:  Parameter containing:
tensor([[ 0.4193,  0.4437, -0.5060],
        [ 0.2475,  0.5320,  0.2883]], requires_grad=True)
b:  Parameter containing:
tensor([ 0.4067, -0.3276], requires_grad=True)


In [12]:
# Mean-squared-error objective, and plain SGD over the layer's parameters.
criterion = nn.MSELoss()
optimizer = torch.optim.SGD(params=linear.parameters(), lr=0.01)

# Run the inputs through the layer to get predictions.
pred = linear(x)

# Score the predictions against the targets and report the scalar loss.
loss = criterion(input=pred, target=y)
print('loss: ', loss.item())

loss:  1.6126983165740967


In [15]:
# Backward pass: compute gradients of the loss for the layer's parameters.
loss.backward()

In [16]:
# Gradients of the loss with respect to the layer's weight and bias.
print('dL/dw: ', linear.weight.grad)
print('dL/db: ', linear.bias.grad)

dL/dw:  tensor([[ 1.2357, -0.1020, -0.3568],
        [ 0.1118,  0.3095,  0.5238]])
dL/db:  tensor([ 0.8207, -0.2463])


In [17]:
# 1-step gradient descent: apply one optimizer update to the layer's parameters
optimizer.step()

# Forward pass again, now with the updated parameters
pred = linear(x)

# Recompute the loss so it can be compared with the value before the step
loss = criterion(pred, y)
print('loss after 1 step optimization: ', loss.item())

loss after 1 step optimization:  1.5850390195846558


## Loading data from numpy   

In [18]:
# Build a 2x2 integer array row by row.
x = np.array([
    [1, 2],
    [3, 4],
])
x

array([[1, 2],
       [3, 4]])

In [19]:
# Convert the NumPy array to a torch tensor.
# NOTE(review): torch.from_numpy is documented to share memory with the source
# array — confirm before mutating either side.
y = torch.from_numpy(x)
y

tensor([[1, 2],
        [3, 4]])

In [20]:
# Convert the torch tensor back to a NumPy array.
z = y.numpy()
z

array([[1, 2],
       [3, 4]])

## Input pipeline

In [21]:
# Download and construct CIFAR-10 dataset
# CIFAR-10 training split stored under ./data/; download=True fetches the
# archive there, and ToTensor() turns each image into a tensor.
train_dataset = torchvision.datasets.CIFAR10(
    root='./data/',
    train=True,
    transform=transforms.ToTensor(),
    download=True,
)

# Indexing the dataset yields one (image, label) pair.
image, label = train_dataset[0]
print(image.size())
print(label)

Downloading https://www.cs.toronto.edu/~kriz/cifar-10-python.tar.gz to ./data/cifar-10-python.tar.gz
torch.Size([3, 32, 32])
6


In [23]:
# Wrap the dataset in a DataLoader that yields shuffled mini-batches of 64 samples.
train_loader = torch.utils.data.DataLoader(
    dataset=train_dataset,
    batch_size=64,
    shuffle=True,
)

# Create an iterator over the loader.
data_iter = iter(train_loader)

# Pull one mini-batch with the built-in next(); the iterator's Python-2-style
# .next() method is not available in current PyTorch releases.
images, labels = next(data_iter)

In [25]:
# Inspect one mini-batch: the stacked image tensor's size and the label tensor.
print(images.size())
print(labels)

torch.Size([64, 3, 32, 32])
tensor([2, 0, 5, 9, 9, 9, 9, 5, 7, 2, 5, 8, 4, 5, 7, 9, 0, 1, 0, 6, 4, 3, 2, 8,
        7, 9, 6, 4, 3, 8, 2, 2, 3, 9, 1, 1, 1, 0, 9, 1, 0, 2, 9, 3, 4, 7, 1, 8,
        4, 2, 7, 9, 7, 7, 6, 6, 3, 8, 6, 2, 9, 8, 4, 0])


## Input pipeline for custom dataset

In [None]:
# Template for a user-defined dataset: fill in the three methods below.
class CustomDataset(torch.utils.data.Dataset):
    """Skeleton dataset in which every method is still a placeholder."""

    def __init__(self):
        # TODO: initialize file paths or a list of file names.
        return None

    def __getitem__(self, index):
        # TODO:
        #   1. Read one sample from file (e.g. using numpy.fromfile, PIL.Image.open).
        #   2. Preprocess the sample (e.g. with torchvision transforms).
        #   3. Return a data pair (e.g. image and label).
        return None

    def __len__(self):
        # Placeholder: replace 0 with the total size of your dataset.
        return 0

# Wrap the custom dataset in the prebuilt DataLoader (batches of 64, shuffled).
custom_dataset = CustomDataset()
train_loader = torch.utils.data.DataLoader(
    dataset=custom_dataset,
    batch_size=64,
    shuffle=True,
)

## Pretrained model

In [27]:
# Start from a ResNet-18 created with pretrained=True.
resnet = torchvision.models.resnet18(pretrained=True)

# Fine-tune only the top layer: turn off gradients for every existing parameter.
for weight in resnet.parameters():
    weight.requires_grad = False

# Replace the final fully connected layer with a new 100-output one. It is
# created after the freeze loop above, so that loop does not touch it.
resnet.fc = nn.Linear(in_features=resnet.fc.in_features, out_features=100)

# Forward pass on a random batch to check the output size.
images = torch.randn(64, 3, 224, 224)
outputs = resnet(images)
print(outputs.size())

torch.Size([64, 100])


## Save and load the model

In [29]:
# Save and load the entire model.
# NOTE(review): this stores the whole module object, and torch.load unpickles
# it — only load checkpoints from a trusted source. Recent PyTorch releases
# reportedly default torch.load to weights_only=True, which may reject a fully
# pickled model; confirm against the installed version.
torch.save(resnet, './data/model.ckpt')
model = torch.load('./data/model.ckpt')

In [31]:
# Persist only the model parameters (recommended), then restore them into the
# same model.
torch.save(obj=resnet.state_dict(), f='params.ckpt')
resnet.load_state_dict(torch.load(f='params.ckpt'))