# Simple CNN with MNIST dataset

In [107]:
import torch
import torch.nn as nn
import torch.nn.functional as F
from torch.utils.data import DataLoader
from torchvision import datasets, transforms
from torchvision.utils import make_grid

import numpy as np
import pandas as pd
from sklearn.metrics import confusion_matrix
import matplotlib.pyplot as plt
%matplotlib inline

## Load Dataset

In [108]:
# Convert each MNIST image to a tensor. A single sample is 3-dimensional:
# (Color Channel, Height, Width). The leading "# Images" (batch) dimension is
# not produced by this transform; it is added separately.
transform = transforms.ToTensor()

In [109]:
# Training split of MNIST, stored under ./cnn_data
train_data = datasets.MNIST(
    root="./cnn_data",
    train=True,
    transform=transform,
    download=True,
)

# Test split of MNIST, stored under the same root
test_data = datasets.MNIST(
    root="./cnn_data",
    train=False,
    transform=transform,
    download=True,
)

In [110]:
# Show the training set summary (number of datapoints, root, split, transform)
train_data

Dataset MNIST
    Number of datapoints: 60000
    Root location: ./cnn_data
    Split: Train
    StandardTransform
Transform: ToTensor()

In [111]:
# Show the test set summary (number of datapoints, root, split, transform)
test_data

Dataset MNIST
    Number of datapoints: 10000
    Root location: ./cnn_data
    Split: Test
    StandardTransform
Transform: ToTensor()

## Dataloader

In [112]:
# Wrap both splits in loaders that serve mini-batches of 10 samples.
# Only the training loader shuffles; the test loader keeps the dataset order.
train_loader = DataLoader(dataset=train_data, batch_size=10, shuffle=True)
test_loader = DataLoader(dataset=test_data, batch_size=10, shuffle=False)

## Convolutional Layer

In [113]:
# Two convolutional layers, both using 3x3 kernels with stride 1:
#   conv1: 1 input channel  -> 6 output channels (kernels)
#   conv2: 6 input channels -> 16 output channels (kernels)
conv1 = nn.Conv2d(in_channels=1, out_channels=6, kernel_size=3, stride=1)
conv2 = nn.Conv2d(in_channels=6, out_channels=16, kernel_size=3, stride=1)

In [114]:
# Grab the first MNIST sample as an (image, label) pair.
# Indexing the dataset directly replaces the previous loop-and-break, which
# iterated only to fetch element 0 and left an unused loop index behind.
X_train, y_train = train_data[0]

In [115]:
# Shape of a single sample: (channels, height, width)
X_train.shape

torch.Size([1, 28, 28])

In [116]:
# Class label that accompanies X_train
y_train

5

In [117]:
# Add a leading dimension so the single image becomes a 4-D batch of one:
# (images, channels, height, width) = (1, 1, 28, 28)
x = X_train.view(1, 1, 28, 28)

In [118]:
# Perform our first convolution, then apply the ReLU activation.
# NOTE(review): x is overwritten in place, so this cell is not idempotent --
# conv1 takes 1 input channel but its output has 6, so re-running the cell
# without re-creating x first should fail.
x = F.relu(conv1(x))

In [119]:
# Shape is (images, filters, height, width): 1 image, 6 filters, new image size 26x26
# size = (input + 2*padding - K_size)/stride + 1 = (28 + 2*0 - 3)/1 + 1 = 26
x.shape

torch.Size([1, 6, 26, 26])

## Pooling Layer

In [120]:
# Downsample with max pooling: 2x2 window, moved 2 pixels at a time
x = F.max_pool2d(x, kernel_size=2, stride=2)

In [121]:
# Stride of 2 and kernel size of 2 -> each spatial dimension is halved
# input = 26, padding = 0, K_size = 2, stride = 2
# size = (input + 2*padding - K_size)/stride + 1 = (26 + 2*0 - 2)/2 + 1 = 13
x.shape

torch.Size([1, 6, 13, 13])

## 2nd Convolutional Layer

In [122]:
# Perform the second convolution, then apply the ReLU activation
x = F.relu(conv2(x))

In [124]:
# Shape is (images, filters, height, width): 1 image, 16 filters, new image size 11x11
# input = 13, padding = 0, K_size = 3, stride = 1
# size = (input + 2*padding - K_size)/stride + 1 = (13 + 2*0 - 3)/1 + 1 = 11
x.shape

torch.Size([1, 16, 11, 11])

## 2nd Pooling Layer

In [125]:
# Downsample again with max pooling: 2x2 window, moved 2 pixels at a time
x = F.max_pool2d(x, kernel_size=2, stride=2)

In [None]:
# Stride of 2 and kernel size of 2 -> each spatial dimension is halved, rounding down
# input = 11, padding = 0, K_size = 2, stride = 2
# size = floor((input + 2*padding - K_size)/stride + 1) = floor((11 + 2*0 - 2)/2 + 1) = floor(5.5) = 5
x.shape

torch.Size([1, 16, 5, 5])

## Model