# Convolutional Neural Network
- MNIST data
- 4 convolutional layers
- 2 fully connected layers

[MNIST](https://en.wikipedia.org/wiki/MNIST_database)

## 1. Settings
### 1) Import required libraries

In [1]:
import numpy as np
import torch
import torch.nn as nn
import torch.optim as optim
import torch.nn.init as init
import torchvision.datasets as dset
import torchvision.transforms as transforms
from torch.utils.data import DataLoader

### 2) Set hyperparameters

In [2]:
# Training hyperparameters.
batch_size = 16          # samples per mini-batch
learning_rate = 0.0002   # step size handed to the optimizer
num_epoch = 10           # number of passes over the training loader

# Set to False to force CPU execution even when a GPU is present.
use_cuda = True
# Use the GPU only when it is both requested and actually available.
device = torch.device("cuda" if use_cuda and torch.cuda.is_available() else "cpu")


## 2. Data

### 1) Download Data

In [3]:
# Fetch MNIST into the current directory (downloaded only if missing) and
# convert every image to a tensor on access. Labels are left untouched.
mnist_train = dset.MNIST(
    root="./",
    train=True,
    transform=transforms.ToTensor(),
    target_transform=None,
    download=True,
)
mnist_test = dset.MNIST(
    root="./",
    train=False,
    transform=transforms.ToTensor(),
    target_transform=None,
    download=True,
)

### 2) Check Dataset

In [4]:
# Show the tensor shape of the first image and the number of samples per split.
print(mnist_train[0][0].size(), len(mnist_train))
mnist_test[0][0].size(), len(mnist_test)

torch.Size([1, 28, 28]) 60000


(torch.Size([1, 28, 28]), 10000)

### 3) Set DataLoader

In [5]:
# Batch both splits with two worker processes each. Only the training data is
# shuffled. drop_last=True discards a trailing partial batch, so every batch
# holds exactly `batch_size` samples.
train_loader = DataLoader(
    mnist_train,
    batch_size=batch_size,
    shuffle=True,
    num_workers=2,
    drop_last=True,
)
test_loader = DataLoader(
    mnist_test,
    batch_size=batch_size,
    shuffle=False,
    num_workers=2,
    drop_last=True,
)

## 3. Model & Optimizer

### 1) CNN Model

In [13]:
class CNN(nn.Module):
    """Convolutional classifier for single-channel 28x28 images.

    Four 3x3 convolutions (each followed by batch normalisation and ReLU) with
    two 2x2 max-pool stages reduce a (N, 1, 28, 28) input to (N, 512, 7, 7).
    Two fully connected layers then map the flattened features to 10 scores.
    """

    def __init__(self):
        super(CNN, self).__init__()
        # Feature extractor. Every conv uses kernel 3, stride 1, padding 1, so
        # only the max-pool layers change the spatial size (28 -> 14 -> 7).
        self.layer = nn.Sequential(
            nn.Conv2d(1, 64, 3, 1, 1),  # Conv2d(in_channels, out_channels, kernel_size, stride, padding)
            nn.BatchNorm2d(64),
            nn.ReLU(),
            nn.Conv2d(64, 128, 3, 1, 1),
            nn.BatchNorm2d(128),
            nn.ReLU(),
            nn.MaxPool2d(2, 2),
            nn.Conv2d(128, 256, 3, 1, 1),
            nn.BatchNorm2d(256),
            nn.ReLU(),
            nn.Conv2d(256, 512, 3, 1, 1),
            nn.BatchNorm2d(512),
            nn.ReLU(),
            nn.MaxPool2d(2, 2)
        )
        # Classifier head: 512*7*7 flattened features -> 400 -> 10 outputs.
        self.fc_layer = nn.Sequential(
            nn.Linear(512*7*7, 400),
            nn.ReLU(),
            nn.Linear(400, 10)
        )

    def forward(self, x):
        """Return one row of 10 unnormalised class scores per input image.

        Args:
            x: image batch of shape (N, 1, 28, 28).

        Returns:
            Tensor of shape (N, 10).
        """
        out = self.layer(x)
        # Flatten using the batch dimension of the tensor itself rather than a
        # global batch size, so any number of images can be passed in.
        out = out.view(out.size(0), -1)
        out = self.fc_layer(out)

        return out

# Build the network and place its parameters on the selected device.
model = CNN().to(device)

### 2) Loss func & Optimizer

In [14]:
# Cross-entropy over the model's raw class scores, minimised with plain SGD.
loss_func = nn.CrossEntropyLoss()
optimizer = optim.SGD(params=model.parameters(), lr=learning_rate)

## 4. Train 

In [None]:
# Make sure BatchNorm layers normalise with per-batch statistics, even if the
# model was left in evaluation mode by an earlier cell run.
model.train()

for epoch in range(num_epoch):
    for step, (image, label) in enumerate(train_loader):
        x = image.to(device)
        y_ = label.to(device)

        # Clear gradients first so an interrupted or re-run cell never
        # accumulates stale gradients into this step.
        optimizer.zero_grad()

        # Call the module itself (not .forward) so nn.Module hooks are run.
        output = model(x)
        loss = loss_func(output, y_)

        loss.backward()
        optimizer.step()

        # Report the current mini-batch loss every 1000 steps.
        if step % 1000 == 0:
            print(loss)

tensor(1.3633, grad_fn=<NllLossBackward>)
tensor(0.5055, grad_fn=<NllLossBackward>)
tensor(0.3060, grad_fn=<NllLossBackward>)
tensor(0.2310, grad_fn=<NllLossBackward>)
tensor(0.2023, grad_fn=<NllLossBackward>)


In [None]:
#param_list = list(model.parameters())
#print(param_list)

## 5. Test

In [None]:
correct = 0
total = 0

# Evaluate in eval mode so BatchNorm uses its running statistics and does not
# update them from test batches. The previous mode is restored afterwards so
# re-running the training cell behaves as before.
was_training = model.training
model.eval()

with torch.no_grad():
    for image, label in test_loader:

        x = image.to(device)
        y_ = label.to(device)

        # Call the module itself (not .forward) so nn.Module hooks are run.
        output = model(x)
        # Predicted class = index of the largest score in each row.
        _, output_index = torch.max(output, 1)
        total += label.size(0)
        # .item() keeps the running count a plain Python number, so the
        # accuracy prints as a number instead of a tensor repr.
        correct += (output_index == y_).sum().item()

model.train(was_training)

print("Accuracy of Test Data: {}".format(100*correct/total))