In [0]:
import torch 
import torchvision
import torch.nn as nn
import numpy as np
import torchvision.transforms as transforms

# Create tensors

In [0]:
# Three scalar tensors (1, 2 and 3), each created with requires_grad=True so
# that autograd records the operations applied to them.
x, w, b = (torch.tensor(value, requires_grad=True) for value in (1.0, 2.0, 3.0))

# Print out the gradients

In [0]:
# Show the gradient currently stored on `x`. When the cells are run top to
# bottom, no backward pass has happened yet at this point, so `.grad` has not
# been populated and this prints `None`.
print(x.grad) 

# Compute gradients

In [0]:
# Build the computational graph first. `y` was not defined by any earlier cell,
# so calling `y.backward()` on a fresh kernel raised a NameError.
y = w * x + b    # y = 2 * x + 3

# Back-propagate from the scalar `y`; this populates `.grad` on the leaf
# tensors `x`, `w` and `b`.
y.backward()

# Gradients are only available once the backward pass has run.
print(x.grad)    # dy/dx = w = 2
print(w.grad)    # dy/dw = x = 1
print(b.grad)    # dy/db = 1

# Create tensors of shape (10, 3) and (10, 2)

In [0]:
# Random inputs of shape (10, 3) and random targets of shape (10, 2),
# used by the linear-regression example in the following cells.
x = torch.randn((10, 3))
y = torch.randn((10, 2))

# Build a fully connected layer

In [0]:
# Fully connected layer mapping 3 input features to 2 output features.
linear = nn.Linear(in_features=3, out_features=2)

# Build loss function and optimizer.

In [0]:
# Mean-squared-error loss for comparing predictions with targets.
criterion = nn.MSELoss()

# Plain SGD over the parameters of `linear` with a learning rate of 0.01.
# Other optimizers can be swapped in with the same arguments, e.g.:
#   torch.optim.Adam(linear.parameters(), lr=0.01)
#   torch.optim.RMSprop(linear.parameters(), lr=0.01)
optimizer = torch.optim.SGD(params=linear.parameters(), lr=0.01)

# Forward pass

In [0]:
# Run the input batch `x` through the linear layer; `pred` holds the layer's
# output and is compared against `y` in the next cell.
pred = linear(x)

# Compute loss.

In [0]:
# Score the predictions against the targets with the MSE criterion and report
# the resulting scalar as a plain Python number.
loss = criterion(input=pred, target=y)
initial_loss = loss.item()
print('loss: ', initial_loss)

# Backward pass.

In [0]:
# Back-propagate from `loss`. This is what fills in the `.grad` attributes of
# `linear.weight` and `linear.bias` that are printed in the next cell.
loss.backward()

# Print out the gradients.

In [0]:
# Gradients of the loss with respect to the layer's weight and bias.
weight_grad, bias_grad = linear.weight.grad, linear.bias.grad
print('dL/dw: ', weight_grad)
print('dL/db: ', bias_grad)

# 1-step gradient descent.

In [0]:
# Apply one SGD update (learning rate 0.01) to the parameters of `linear`,
# using the gradients produced by the preceding `loss.backward()` call.
optimizer.step()

# Print out the loss after 1-step gradient descent.

In [0]:
# Repeat the forward pass with the updated parameters and re-evaluate the loss
# so it can be compared with the value printed before the optimizer step.
pred = linear(x)
loss = criterion(input=pred, target=y)
updated_loss = loss.item()
print('loss after 1 step optimization: ', updated_loss)

# Loading data from NumPy

In [0]:
# Start from a 2x2 integer NumPy array.
x = np.array(((1, 2), (3, 4)))

# NumPy -> torch: wrap the array as a tensor.
y = torch.from_numpy(x)

# torch -> NumPy: get an array back from the tensor.
z = y.numpy()

# Input pipeline

In [0]:
# Download (download=True) and construct the CIFAR-10 training split under
# `root`; each sample is passed through transforms.ToTensor() when accessed.
train_dataset = torchvision.datasets.CIFAR10(root='../../data/',
                                             train=True,
                                             transform=transforms.ToTensor(),
                                             download=True)

# Fetch a single (image, label) pair by index and inspect it.
image, label = train_dataset[0]
print(image.size())
print(label)

# Data loader that serves the dataset in shuffled mini-batches of 64 samples.
train_loader = torch.utils.data.DataLoader(dataset=train_dataset,
                                           batch_size=64,
                                           shuffle=True)

# Create an iterator over the loader.
data_iter = iter(train_loader)

# Pull one mini-batch of images and labels. Use the built-in next(): the
# iterator's `.next()` method is not part of the Python iterator protocol and
# is missing from current PyTorch DataLoader iterators (AttributeError).
images, labels = next(data_iter)

# Actual usage of the data loader is as below.
for images, labels in train_loader:
    # Training code should be written here.
    pass

# Pretrained model

In [0]:
# Download and load ResNet-18 with pretrained weights.
# NOTE(review): newer torchvision releases deprecate `pretrained=` in favour of
# a `weights=` argument — confirm against the installed version before changing.
resnet = torchvision.models.resnet18(pretrained=True)

# Freeze every existing parameter so that only the layer added below is trained.
for param in resnet.parameters():
    param.requires_grad_(False)

# Swap the final fully connected layer for a fresh one that keeps the same
# number of input features and has 100 outputs (100 is an example).
num_features = resnet.fc.in_features
resnet.fc = nn.Linear(num_features, 100)

# Forward pass on a random batch shaped (64, 3, 224, 224).
images = torch.randn(64, 3, 224, 224)
outputs = resnet(images)
print(outputs.size())     # (64, 100)

# Save and load the model

In [0]:
# Option 1: serialize the whole model object and read it back.
# NOTE(review): this goes through pickle, so only load files you trust; recent
# PyTorch releases may also require `weights_only=False` here — confirm against
# the installed version.
torch.save(obj=resnet, f='model.pt')
model = torch.load(f='model.pt')

# Option 2 (recommended): persist only the parameters and load them back into
# the existing model.
torch.save(resnet.state_dict(), f='params.pt')
state_dict = torch.load(f='params.pt')
resnet.load_state_dict(state_dict)