<a href="https://colab.research.google.com/github/LuhemRevorg/Deep-Learning/blob/main/MNIST_CNN's.ipynb" target="_parent"><img src="https://colab.research.google.com/assets/colab-badge.svg" alt="Open In Colab"/></a>

In [1]:
import torch
import torch.nn as nn
import torch.nn.functional as F
from torch.utils.data import DataLoader
from torchvision import datasets, transforms
from torchvision.utils import make_grid

import numpy as np
import pandas as pd
from sklearn.metrics import confusion_matrix
import itertools
import matplotlib.pyplot as plt
import seaborn as sns

In [2]:
# Convert each MNIST image into a float tensor. A single image is 3-D
# (channel, height, width); the 4th (batch) dimension only appears once images
# are batched or explicitly reshaped, e.g. with .view(1, 1, 28, 28).
transform = transforms.ToTensor()

In [3]:
# Training split of MNIST, fetched into ./data if it is not already there;
# every image goes through `transform` when it is read.
train_data = datasets.MNIST(
    root='data',
    train=True,
    download=True,
    transform=transform,
)

100%|██████████| 9.91M/9.91M [00:00<00:00, 18.2MB/s]
100%|██████████| 28.9k/28.9k [00:00<00:00, 508kB/s]
100%|██████████| 1.65M/1.65M [00:00<00:00, 4.50MB/s]
100%|██████████| 4.54k/4.54k [00:00<00:00, 10.9MB/s]


In [4]:
# Held-out test split of MNIST (train=False), stored next to the training
# files and passed through the same `transform`.
test_data = datasets.MNIST(
    root='data',
    train=False,
    download=True,
    transform=transform,
)

In [5]:
# Mini-batches of 10 images for both splits; only the training stream is
# reshuffled, the test stream keeps dataset order.
BATCH_SIZE = 10
train_loader = DataLoader(train_data, batch_size=BATCH_SIZE, shuffle=True)
test_loader = DataLoader(test_data, batch_size=BATCH_SIZE, shuffle=False)

In [6]:
# Stand-alone convolution layers used to walk through the shapes step by step
# before the real model is defined.
# conv1: 1 input channel -> 6 feature maps, 3x3 kernel, stride 1
# conv2: 6 input channels -> 16 feature maps, 3x3 kernel, stride 1

conv1 = nn.Conv2d(in_channels=1, out_channels=6, kernel_size=3, stride=1)
conv2 = nn.Conv2d(in_channels=6, out_channels=16, kernel_size=3, stride=1)

In [7]:
# Grab the first (image, label) pair. Indexing the dataset directly replaces
# the loop-and-break idiom and does not leave a stray loop counter behind.
X_train, y_train = train_data[0]


In [8]:
# Display the raw pixel tensor of the sampled image (float values; the
# background pixels print as 0.0000). NOTE(review): this dumps the whole
# tensor — `X_train.shape` would be a lighter way to inspect it.
X_train

tensor([[[0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
          0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
          0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
          0.0000, 0.0000, 0.0000, 0.0000],
         [0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
          0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
          0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
          0.0000, 0.0000, 0.0000, 0.0000],
         [0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
          0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
          0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
          0.0000, 0.0000, 0.0000, 0.0000],
         [0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
          0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
          0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,

In [9]:
# Conv2d wants a 4-D (batch, channels, height, width) input, so view the
# single image as a batch containing one 1-channel 28x28 picture.
single_batch_shape = (1, 1, 28, 28)
x = X_train.view(single_batch_shape)
x

tensor([[[[0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
           0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
           0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
           0.0000, 0.0000, 0.0000, 0.0000],
          [0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
           0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
           0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
           0.0000, 0.0000, 0.0000, 0.0000],
          [0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
           0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
           0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
           0.0000, 0.0000, 0.0000, 0.0000],
          [0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
           0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000,
           0.0000, 0.0000, 0.0000, 0.0000, 

In [10]:
# First convolution followed by ReLU: the 3x3 kernel without padding trims one
# pixel from every border (28x28 -> 26x26) and produces 6 feature maps.
conv1_out = conv1(x)
x = F.relu(conv1_out)
x.shape

torch.Size([1, 6, 26, 26])

In [11]:
# 2x2 max-pooling with stride 2 halves the spatial size of each feature map.
x = F.max_pool2d(x, kernel_size=2, stride=2)
x.shape

torch.Size([1, 6, 13, 13])

In [12]:
# Second convolution followed by ReLU: 6 -> 16 feature maps, and the unpadded
# 3x3 kernel again removes a one-pixel border.
conv2_out = conv2(x)
x = F.relu(conv2_out)
x.shape

torch.Size([1, 16, 11, 11])

In [13]:
# Second 2x2 / stride-2 max-pool; an odd spatial size is floored when halved.
x = F.max_pool2d(x, kernel_size=2, stride=2)
x.shape

torch.Size([1, 16, 5, 5])

In [14]:
# Model Class

class CNNModel(nn.Module):
    """Two conv/pool stages followed by three fully connected layers.

    Built for 1-channel 28x28 inputs: after conv(3x3) -> pool(2) -> conv(3x3)
    -> pool(2) each image is reduced to 16 feature maps of 5x5, which is the
    5*5*16 input size of the first linear layer.
    """

    def __init__(self):
        super().__init__()
        # Feature extractor: 1 -> 6 -> 16 channels, 3x3 kernels, stride 1.
        self.conv1 = nn.Conv2d(1, 6, 3, 1)
        self.conv2 = nn.Conv2d(6, 16, 3, 1)
        # Classifier head: 400 -> 120 -> 84 -> 10 class scores.
        self.fc1 = nn.Linear(5*5*16, 120)
        self.fc2 = nn.Linear(120, 84)
        self.fc3 = nn.Linear(84, 10)

    def forward(self, X):
        """Return per-class log-probabilities for a batch of images.

        Args:
            X: tensor of shape (batch, 1, 28, 28).

        Returns:
            Tensor of shape (batch, 10) holding log-softmax scores over the
            class dimension.

        Raises:
            RuntimeError: if the spatial size of X does not reduce to 5x5, so
                the flattened features do not match fc1's input size.
        """
        X = F.relu(self.conv1(X))
        X = F.max_pool2d(X, 2, 2)
        X = F.relu(self.conv2(X))
        X = F.max_pool2d(X, 2, 2)
        # Flatten everything except the batch axis. A hard-coded
        # view(-1, 5*5*16) could silently regroup values from different
        # samples into rows when the input size is wrong; keeping the batch
        # axis fixed makes fc1 raise a shape error instead.
        X = torch.flatten(X, start_dim=1)
        X = F.relu(self.fc1(X))
        X = F.relu(self.fc2(X))
        X = self.fc3(X)
        return F.log_softmax(X, dim=1)


In [15]:
# Fix torch's global RNG so weight initialisation and shuffling are repeatable.
SEED = 41
torch.manual_seed(SEED)

<torch._C.Generator at 0x7d61a3fea610>

In [21]:
# Build a fresh CNNModel with newly initialised weights.
# NOTE(review): the execution counter jumps from 15 to 21 at this cell, so the
# saved outputs may not come from a clean Restart & Run All — confirm.
model=CNNModel()

In [22]:
# CNNModel.forward() already ends in log_softmax, so the matching loss is
# NLLLoss. CrossEntropyLoss applies log_softmax internally as well, which
# would normalise the model's output a second time for no benefit.
criterion = nn.NLLLoss()
# Adam over all model parameters with a learning rate of 1e-3.
optimizer = torch.optim.Adam(model.parameters(), lr=0.001)

In [23]:
# Train for a fixed number of epochs and evaluate on the test set after each.
# Every history list receives exactly ONE entry per epoch, so the train and
# test curves line up when plotted against each other:
#   train_losses / test_losses   -> sample-weighted mean loss (Python floats)
#   train_correct / test_correct -> number of correct predictions (0-d tensors)
epochs = 5
train_losses = []
test_losses = []
train_correct = []
test_correct = []

for i in range(epochs):
    trn_corr = 0
    tst_corr = 0
    trn_loss_sum = 0.0
    trn_seen = 0

    # ---- training pass -----------------------------------------------------
    model.train()
    for b, (X_train, y_train) in enumerate(train_loader, start=1):
        y_pred = model(X_train)
        loss = criterion(y_pred, y_train)

        predicted = y_pred.detach().argmax(dim=1)
        # Out-of-place add: `+=` on a tensor mutates it in place, which would
        # make every stored reference to the running count alias one object.
        trn_corr = trn_corr + (predicted == y_train).sum()

        optimizer.zero_grad()
        loss.backward()
        optimizer.step()

        # `loss` is a per-batch mean (default reduction of the criterion), so
        # weight it by the batch size to get a true per-sample epoch mean.
        batch_size = y_train.size(0)
        trn_loss_sum += loss.item() * batch_size
        trn_seen += batch_size

        if b % 600 == 0:
            print(f'Epoch: {i} Batch: {b} Loss: {loss.item()}')

    train_losses.append(trn_loss_sum / max(trn_seen, 1))
    train_correct.append(trn_corr)

    # ---- evaluation pass ---------------------------------------------------
    model.eval()
    tst_loss_sum = 0.0
    tst_seen = 0
    with torch.no_grad():
        for X_test, y_test in test_loader:
            y_val = model(X_test)
            batch_size = y_test.size(0)
            # Accumulate over ALL test batches; scoring only the final batch
            # gives a loss based on a handful of samples.
            tst_loss_sum += criterion(y_val, y_test).item() * batch_size
            tst_seen += batch_size
            tst_corr = tst_corr + (y_val.argmax(dim=1) == y_test).sum()

    test_losses.append(tst_loss_sum / max(tst_seen, 1))
    test_correct.append(tst_corr)

Epoch: 0 Batch: 600 Loss: 0.16749794781208038
Epoch: 0 Batch: 1200 Loss: 0.15739747881889343
Epoch: 0 Batch: 1800 Loss: 0.059995800256729126
Epoch: 0 Batch: 2400 Loss: 0.0036465569864958525
Epoch: 0 Batch: 3000 Loss: 0.011178890243172646
Epoch: 0 Batch: 3600 Loss: 0.5766130685806274
Epoch: 0 Batch: 4200 Loss: 0.019300587475299835
Epoch: 0 Batch: 4800 Loss: 0.058529071509838104
Epoch: 0 Batch: 5400 Loss: 0.154725581407547
Epoch: 0 Batch: 6000 Loss: 0.02564663626253605
Epoch: 1 Batch: 600 Loss: 0.0035729079972952604
Epoch: 1 Batch: 1200 Loss: 0.03066287375986576
Epoch: 1 Batch: 1800 Loss: 0.12798944115638733
Epoch: 1 Batch: 2400 Loss: 0.05707661435008049
Epoch: 1 Batch: 3000 Loss: 0.009029540233314037
Epoch: 1 Batch: 3600 Loss: 0.3632652163505554
Epoch: 1 Batch: 4200 Loss: 0.015015484765172005
Epoch: 1 Batch: 4800 Loss: 6.57513301121071e-05
Epoch: 1 Batch: 5400 Loss: 0.13657617568969727
Epoch: 1 Batch: 6000 Loss: 0.0011966913007199764
Epoch: 2 Batch: 600 Loss: 0.0002664932399056852
Epoch