<a href="https://colab.research.google.com/github/Khanyecebani/Pytorch-/blob/main/CNN.ipynb" target="_parent"><img src="https://colab.research.google.com/assets/colab-badge.svg" alt="Open In Colab"/></a>

In [1]:
import torch
import torch.nn as nn
import torch.nn.functional as F
from torch.utils.data import DataLoader
from torchvision import datasets, transforms
from torchvision.utils import make_grid

import numpy as np
import pandas as pd
from sklearn.metrics import confusion_matrix
import matplotlib.pyplot as plt
%matplotlib inline

In [2]:
# Before loading the data we define how each image file is converted to a tensor.
# ToTensor() turns one image into a 3-D tensor (channels, height, width); the
# 4th (batch) dimension the CNN layers work with is added later, when images are batched.

# Use the `transforms` module imported from torchvision.
transform = transforms.ToTensor()


In [3]:
# Set up the training and test datasets.

# Training split: torchvision's `datasets` module loads MNIST (downloading it if
# needed), stores it locally under /cnn_data and applies `transform` to every image.
train_data = datasets.MNIST(
    root='/cnn_data',
    train=True,
    download=True,
    transform=transform,
)

Downloading http://yann.lecun.com/exdb/mnist/train-images-idx3-ubyte.gz
Failed to download (trying next):
HTTP Error 404: Not Found

Downloading https://ossci-datasets.s3.amazonaws.com/mnist/train-images-idx3-ubyte.gz
Downloading https://ossci-datasets.s3.amazonaws.com/mnist/train-images-idx3-ubyte.gz to /cnn_data/MNIST/raw/train-images-idx3-ubyte.gz


100%|██████████| 9.91M/9.91M [00:00<00:00, 16.4MB/s]


Extracting /cnn_data/MNIST/raw/train-images-idx3-ubyte.gz to /cnn_data/MNIST/raw

Downloading http://yann.lecun.com/exdb/mnist/train-labels-idx1-ubyte.gz
Failed to download (trying next):
HTTP Error 404: Not Found

Downloading https://ossci-datasets.s3.amazonaws.com/mnist/train-labels-idx1-ubyte.gz
Downloading https://ossci-datasets.s3.amazonaws.com/mnist/train-labels-idx1-ubyte.gz to /cnn_data/MNIST/raw/train-labels-idx1-ubyte.gz


100%|██████████| 28.9k/28.9k [00:00<00:00, 513kB/s]


Extracting /cnn_data/MNIST/raw/train-labels-idx1-ubyte.gz to /cnn_data/MNIST/raw

Downloading http://yann.lecun.com/exdb/mnist/t10k-images-idx3-ubyte.gz
Failed to download (trying next):
HTTP Error 404: Not Found

Downloading https://ossci-datasets.s3.amazonaws.com/mnist/t10k-images-idx3-ubyte.gz
Downloading https://ossci-datasets.s3.amazonaws.com/mnist/t10k-images-idx3-ubyte.gz to /cnn_data/MNIST/raw/t10k-images-idx3-ubyte.gz


100%|██████████| 1.65M/1.65M [00:00<00:00, 3.90MB/s]


Extracting /cnn_data/MNIST/raw/t10k-images-idx3-ubyte.gz to /cnn_data/MNIST/raw

Downloading http://yann.lecun.com/exdb/mnist/t10k-labels-idx1-ubyte.gz
Failed to download (trying next):
HTTP Error 404: Not Found

Downloading https://ossci-datasets.s3.amazonaws.com/mnist/t10k-labels-idx1-ubyte.gz
Downloading https://ossci-datasets.s3.amazonaws.com/mnist/t10k-labels-idx1-ubyte.gz to /cnn_data/MNIST/raw/t10k-labels-idx1-ubyte.gz


100%|██████████| 4.54k/4.54k [00:00<00:00, 10.5MB/s]

Extracting /cnn_data/MNIST/raw/t10k-labels-idx1-ubyte.gz to /cnn_data/MNIST/raw






In [4]:
# Test split: same dataset class, storage location and transform as the
# training split, but with train=False to select the test images.
test_data = datasets.MNIST(
    root='/cnn_data',
    train=False,
    download=True,
    transform=transform,
)

In [5]:
# Display the training dataset summary (number of datapoints, root location, split, transform).
train_data

Dataset MNIST
    Number of datapoints: 60000
    Root location: /cnn_data
    Split: Train
    StandardTransform
Transform: ToTensor()

In [6]:
# Display the test dataset summary (number of datapoints, root location, split, transform).
test_data

Dataset MNIST
    Number of datapoints: 10000
    Root location: /cnn_data
    Split: Test
    StandardTransform
Transform: ToTensor()

In [7]:
# Wrap both datasets in DataLoaders that yield small mini-batches of 10 images.
# Only the training data is shuffled, so every pass over it sees the batches in a
# new order. The test loader keeps a fixed order: shuffling is not needed there
# (presumably it is only used for evaluation) and a fixed order keeps runs repeatable.
train_loader = DataLoader(train_data, batch_size=10, shuffle=True)
test_loader = DataLoader(test_data, batch_size=10, shuffle=False)


In [8]:
# Define the building blocks of our CNN: two convolutional layers.
# Layer 1: 1 input channel -> 6 feature maps (filters), 3x3 kernel, stride of 1.
conv1 = nn.Conv2d(in_channels=1, out_channels=6, kernel_size=3, stride=1)
# Layer 2: the 6 feature maps from layer 1 are its input -> 16 feature maps, 3x3 kernel, stride of 1.
conv2 = nn.Conv2d(in_channels=6, out_channels=16, kernel_size=3, stride=1)


In [9]:
# Grab one MNIST record (image tensor and its label) by indexing the dataset
# directly, rather than starting a loop only to break out of it. Indexing also
# fails loudly (instead of silently leaving the names undefined) if the dataset
# is empty.
i = 0  # index of the sampled record
X_Train, y_train = train_data[i]

In [10]:
# Shape of a single image tensor: 1 channel of 28x28 pixels.
X_Train.shape

torch.Size([1, 28, 28])

In [11]:
# The convolution layers work on 4-D input, so turn the single image into
# a batch that contains exactly one 1-channel 28x28 image.
x = X_Train.reshape(1, 1, 28, 28)

In [12]:
# Perform the first convolution, followed by a ReLU (Rectified Linear Unit) activation.
# NOTE: this overwrites x, replacing the 1-channel input with conv1's 6-channel
# output, so re-running only this cell would feed that output back into conv1
# (which expects 1 input channel). Re-run from the cell that creates x instead.
x = F.relu(conv1(x))

In [13]:
# conv1 has run: our single image is now 6 feature maps (one per filter) of 26x26.
# No padding was defined, so the 3x3 kernel drops the border pixels (28 - 3 + 1 = 26).
x.shape


torch.Size([1, 6, 26, 26])

In [14]:
# Pooling layer: max-pool over a 2x2 window that moves 2 pixels at a time.
x = F.max_pool2d(x, kernel_size=2, stride=2)

In [15]:
# The 2x2 kernel with a stride of 2 halves each spatial dimension: 26x26 -> 13x13.
x.shape


torch.Size([1, 6, 13, 13])

In [16]:
# Second convolutional layer, again followed by a ReLU activation.
# NOTE: this overwrites x, replacing conv2's 6-channel input with its 16-channel
# output, so re-running only this cell would fail; re-run the preceding cells first.
x = F.relu(conv2(x))

In [17]:
# Now 16 feature maps of 11x11: without padding the 3x3 kernel again costs
# 2 pixels per dimension (13 - 3 + 1 = 11).
x.shape



torch.Size([1, 16, 11, 11])

In [18]:
# Second pooling layer: the same 2x2 max-pool with a stride of 2.
x = F.max_pool2d(x, kernel_size=2, stride=2)

In [19]:
# The feature maps are now 5x5: 11 / 2 = 5.5 is rounded down, because a 2x2 window
# with a stride of 2 only fits 5 times into 11 pixels, so the last row and column
# are left out (max_pool2d rounds down unless ceil_mode=True is passed).
x.shape

torch.Size([1, 16, 5, 5])

In [None]:
#We now have to create a model for all the images instead of just 1

In [21]:
class ConvolutionalNetwork(nn.Module):
  """CNN that maps batches of 1-channel images to log-probabilities over 10 classes.

  Two unpadded 3x3 convolutions, each followed by ReLU and 2x2 max-pooling,
  produce 16 feature maps. The first fully connected layer expects those maps
  to be 5x5 (400 values per image), which is what a 28x28 input yields.
  Three fully connected layers (400 -> 120 -> 84 -> 10) produce the class scores.
  """

  def __init__(self):
    super().__init__()
    # Convolutional stages: 1 input channel -> 6 feature maps -> 16 feature maps.
    self.conv1 = nn.Conv2d(in_channels=1, out_channels=6, kernel_size=3, stride=1)
    self.conv2 = nn.Conv2d(in_channels=6, out_channels=16, kernel_size=3, stride=1)

    # Fully connected stages: flattened 16 x 5 x 5 feature maps down to 10 outputs.
    self.fc1 = nn.Linear(in_features=16 * 5 * 5, out_features=120)
    self.fc2 = nn.Linear(in_features=120, out_features=84)
    self.fc3 = nn.Linear(in_features=84, out_features=10)

  def forward(self, X):
    """Push a batch of images X through the network.

    Returns a (batch, 10) tensor of log-probabilities (log_softmax over dim 1).
    """
    features = X
    # Each convolutional stage: convolution -> ReLU -> 2x2 max-pool with stride 2.
    for conv in (self.conv1, self.conv2):
      features = F.max_pool2d(F.relu(conv(features)), kernel_size=2, stride=2)

    # Flatten every image's feature maps into one row; -1 lets the batch size vary.
    flat = features.view(-1, 16 * 5 * 5)

    # Fully connected layers; the last one has no activation of its own.
    hidden = F.relu(self.fc1(flat))
    hidden = F.relu(self.fc2(hidden))
    scores = self.fc3(hidden)
    return F.log_softmax(scores, dim=1)


In [22]:
# Create an instance of the model.
# The seed is set immediately before construction so that the model's
# weight initialisation is reproducible from run to run.
torch.manual_seed(41)
model = ConvolutionalNetwork()
model  # display the layer summary

ConvolutionalNetwork(
  (conv1): Conv2d(1, 6, kernel_size=(3, 3), stride=(1, 1))
  (conv2): Conv2d(6, 16, kernel_size=(3, 3), stride=(1, 1))
  (fc1): Linear(in_features=400, out_features=120, bias=True)
  (fc2): Linear(in_features=120, out_features=84, bias=True)
  (fc3): Linear(in_features=84, out_features=10, bias=True)
)

In [24]:
# Loss function and optimizer.
# The model's forward() already ends in log_softmax, i.e. it returns
# log-probabilities. NLLLoss is the loss that consumes log-probabilities directly;
# CrossEntropyLoss expects raw scores and would apply log_softmax a second time.
criterion = nn.NLLLoss()
# Adam updates all of the model's parameters with a learning rate of 0.001.
optimizer = torch.optim.Adam(model.parameters(), lr=0.001)