In [1]:
import torch
import torch.nn as nn
import torch.nn.functional as F
from torch.utils.data import DataLoader
from torchvision import datasets, transforms
from torchvision.utils import make_grid

import numpy as np
import pandas as pd
from sklearn.metrics import confusion_matrix
import matplotlib.pyplot as plt

In [2]:
# Convert each image to a tensor as it is loaded from the dataset.
transform = transforms.ToTensor()

In [3]:
# Training split of MNIST; downloaded into ../Data/ when it is not already there.
train_data = datasets.MNIST(
    root='../Data/',
    train=True,
    download=True,
    transform=transform,
)

In [4]:
# Held-out test split of MNIST, stored under the same root as the training split.
test_data = datasets.MNIST(
    root='../Data/',
    train=False,
    download=True,
    transform=transform,
)

In [5]:
# Display the training set summary (number of datapoints, root, split, transform).
train_data

Dataset MNIST
    Number of datapoints: 60000
    Root location: ../Data/
    Split: Train
    StandardTransform
Transform: ToTensor()

In [6]:
# Display the test set summary (number of datapoints, root, split, transform).
test_data

Dataset MNIST
    Number of datapoints: 10000
    Root location: ../Data/
    Split: Test
    StandardTransform
Transform: ToTensor()

In [7]:
# Mini-batches of 10 images: the training order is reshuffled,
# the test order is kept fixed.
train_loader = DataLoader(
    dataset=train_data,
    batch_size=10,
    shuffle=True,
)
test_loader = DataLoader(
    dataset=test_data,
    batch_size=10,
    shuffle=False,
)

In [8]:
# First layer: 1 input channel (grayscale) -> 6 feature maps (arbitrary choice),
# 3x3 kernel, stride 1. Pipeline: image -> conv1 -> pooling -> conv2.
conv1 = nn.Conv2d(in_channels=1, out_channels=6, kernel_size=3, stride=1)

# Second layer: takes the 6 feature maps from conv1 -> 16 feature maps
# (arbitrary choice), 3x3 kernel, stride 1.
conv2 = nn.Conv2d(in_channels=6, out_channels=16, kernel_size=3, stride=1)

In [9]:
# Take the first (image, label) pair of the training set so the layer shapes
# can be traced by hand on a single example. Indexing fetches the same sample
# a loop that breaks on its first iteration would, without a leftover counter.
X_train, y_train = train_data[0]

In [10]:
# Reshape the single image into a 4D batch of one:
# (batch=1, channels=1, height=28, width=28).
x = X_train.view(1, 1, 28, 28) # convert to a 4D batch (batch of 1 image)

In [11]:
# First convolution followed by ReLU.
# NOTE: x is overwritten, so this cell cannot be re-run on its own -- conv1
# takes 1 input channel but produces 6. Rebuild x from X_train first.
x = F.relu(conv1(x))

In [12]:
# Expect (1 image, 6 filters, 26, 26): with a 3x3 kernel and no padding, each
# spatial dimension loses its border pixels (28 -> 26).
x.shape

torch.Size([1, 6, 26, 26])

In [13]:
# Max pooling over the conv1 feature maps: 2x2 window, moved 2 pixels at a time.
x = F.max_pool2d(x, kernel_size=2, stride=2)

In [15]:
# A 2x2 kernel with stride 2 halves each spatial dimension (26 -> 13).
x.shape

torch.Size([1, 6, 13, 13])

In [16]:
# Second convolution followed by ReLU.
# NOTE: x is overwritten, so this cell cannot be re-run on its own -- conv2
# expects 6 input channels but produces 16.
x = F.relu(conv2(x))

In [17]:
# Expect (1, 16, 11, 11): the unpadded 3x3 kernel trims 13 -> 11.
x.shape

torch.Size([1, 16, 11, 11])

In [18]:
# Max pooling over the conv2 feature maps: 2x2 window, moved 2 pixels at a time.
x = F.max_pool2d(x, kernel_size=2, stride=2)

In [19]:
# Expect (1, 16, 5, 5): 11 / 2 = 5.5 is rounded down by the pooling step.
x.shape

torch.Size([1, 16, 5, 5])

In [21]:
# How to get 5: each unpadded 3x3 convolution removes 2 pixels, and each 2x2
# pooling with stride 2 halves the size and rounds down, so the arithmetic
# must use floor division: 28 -> 26 -> 13 -> 11 -> 5.
((28 - 2) // 2 - 2) // 2

5

In [23]:
# Flatten each image's feature maps: -1 lets view infer the batch dimension,
# and 16*5*5 = 400 values come from 16 channels of 5x5 maps.
x.view(-1,16*5*5).shape

torch.Size([1, 400])