# Pytorch Tutorial

Pytorch is a popular deep learning framework and it's easy to get started.

In [14]:
import torch
import torch.nn as nn
import torch.nn.functional as F
import torch.utils.data as data
import torchvision
import torchvision.transforms as transforms
from tqdm import tqdm
import numpy as np

BATCH_SIZE = 128
NUM_EPOCHS = 10

First, we read the mnist data, preprocess them and encapsulate them into dataloader form.

In [15]:
# preprocessing
normalize = transforms.Normalize(mean=[.5], std=[.5])
transform = transforms.Compose([transforms.ToTensor(), normalize])

# download and load the data
train_dataset = torchvision.datasets.MNIST(root='./mnist/', train=True, transform=transform, download=True)
test_dataset = torchvision.datasets.MNIST(root='./mnist/', train=False, transform=transform, download=False)

# encapsulate them into dataloader form
train_loader = data.DataLoader(train_dataset, batch_size=BATCH_SIZE, shuffle=True, drop_last=True)
test_loader = data.DataLoader(test_dataset, batch_size=BATCH_SIZE, shuffle=False, drop_last=True)

Then, we define the model, object function and optimizer that we use to classify.

In [16]:
class SimpleNet(nn.Module):
    
# TODO:define model
    def __init__(self):
        super(SimpleNet, self).__init__()
        self.conv1 = nn.Conv2d(1, 6, 5)
        self.conv2 = nn.Conv2d(6, 16, 5)
        self.fc1 = nn.Linear(256, 120) 
        self.fc2 = nn.Linear(120, 84)
        self.fc3 = nn.Linear(84, 10)
    
    def forward(self, x):
        x = F.relu(self.conv1(x))
        x = F.max_pool2d(x, 2, 2)
        x = F.relu(self.conv2(x))
        x = F.max_pool2d(x, 2, 2)
        x = x.view(x.shape[0],-1)
        x = F.relu(self.fc1(x))
        x = F.relu(self.fc2(x))
        x = self.fc3(x)
        x = F.log_softmax(x, dim=1)
        return x

    
model = SimpleNet()
# TODO:define loss function and optimiter
criterion = nn.CrossEntropyLoss()
optimizer = torch.optim.SGD(model.parameters(), lr=.1, momentum=0.9)

Next, we can start to train and evaluate!

In [17]:
train_acc=[]
# train and evaluate
for epoch in range(NUM_EPOCHS):
    for images, labels in tqdm(train_loader):
        # TODO:forward + backward + optimize
        predictions = model(images)
        loss=criterion(predictions,labels)
        optimizer.zero_grad()
        loss.backward()
        optimizer.step()     
        acc=(predictions.argmax(-1)==labels).float().mean().item()
        train_acc.append(acc)
        Training_accuracy=100*np.mean(train_acc)
    print('Training accuracy=%.2f%%.'% Training_accuracy)
    test_acc=[]
    for images, labels in tqdm(train_loader):
        predictions = model(images)     
        acc=(predictions.argmax(-1)==labels).float().mean().item()
        test_acc.append(acc)
        Testing_accuracy=100*np.mean(test_acc)
    # TODO:calculate the accuracy using traning and testing dataset
    print('Testing accuracy= %.2f%%.'% Testing_accuracy)

100%|██████████| 468/468 [00:31<00:00, 14.87it/s]
  0%|          | 2/468 [00:00<00:25, 18.48it/s]Training accuracy=86.76%.
100%|██████████| 468/468 [00:24<00:00, 19.43it/s]
  0%|          | 2/468 [00:00<00:34, 13.64it/s]Testing accuracy= 97.06%.
100%|██████████| 468/468 [00:33<00:00, 14.07it/s]
  0%|          | 2/468 [00:00<00:28, 16.63it/s]Training accuracy=92.03%.
100%|██████████| 468/468 [00:24<00:00, 19.42it/s]
  0%|          | 2/468 [00:00<00:35, 12.99it/s]Testing accuracy= 97.98%.
100%|██████████| 468/468 [00:33<00:00, 13.90it/s]
  0%|          | 2/468 [00:00<00:30, 15.48it/s]Training accuracy=94.00%.
100%|██████████| 468/468 [00:22<00:00, 20.36it/s]
  0%|          | 2/468 [00:00<00:32, 14.52it/s]Testing accuracy= 98.48%.
100%|██████████| 468/468 [00:31<00:00, 14.85it/s]
  0%|          | 2/468 [00:00<00:27, 16.85it/s]Training accuracy=95.04%.
100%|██████████| 468/468 [00:23<00:00, 19.58it/s]
  0%|          | 2/468 [00:00<00:33, 13.75it/s]Testing accuracy= 98.27%.
100%|██████████|

#### Q5:
Please print the training and testing accuracy.