In [5]:
import torch
import torch.nn.functional as F
import torch.nn as nn
import torch.utils.data as Data
import torchvision
import matplotlib.pyplot as plt

In [3]:
# Hyperparameters
EPOCH = 1          # number of full passes over the training set
BATCH_SIZE = 50    # samples per optimisation step
LR = 0.001         # learning rate handed to the optimizer
# Keep this True so the notebook runs from a fresh checkout: torchvision skips
# the download when the files are already present under the dataset root, and
# raises an error when they are missing and download is disabled.
DOWNLOAD_MNIST = True

In [8]:
# Data
# Training split of MNIST rooted at ./mnist. Every image goes through
# ToTensor() on access; DOWNLOAD_MNIST decides whether files may be fetched.
train_data = torchvision.datasets.MNIST(
    root='./mnist',
    download=DOWNLOAD_MNIST,
    transform=torchvision.transforms.ToTensor(),
    train=True,
)

Downloading http://yann.lecun.com/exdb/mnist/train-images-idx3-ubyte.gz
Downloading http://yann.lecun.com/exdb/mnist/train-labels-idx1-ubyte.gz
Downloading http://yann.lecun.com/exdb/mnist/t10k-images-idx3-ubyte.gz
Downloading http://yann.lecun.com/exdb/mnist/t10k-labels-idx1-ubyte.gz
Processing...
Done!


In [94]:
# Mini-batch iterator over the training set, reshuffled on every pass.
train_loader = Data.DataLoader(
    dataset=train_data,
    batch_size=BATCH_SIZE,
    shuffle=True,
)

In [95]:
# Held-out MNIST split from the same root. No transform is attached: the
# following cells read the stored tensors directly and rescale them by hand.
test_data = torchvision.datasets.MNIST(root='./mnist', train=False)

In [96]:
# Evaluation images: the first 2000 test samples, with a channel axis inserted
# at dim 1, cast to float and divided by 255. Slicing happens before the cast
# so only the 2000 kept images are converted instead of the whole split; the
# resulting values are identical.
test_x = torch.unsqueeze(test_data.test_data[:2000], dim=1).type(torch.FloatTensor) / 255.

In [97]:
# Labels for the same first 2000 test samples that make up test_x.
test_y = test_data.test_labels[:2000]

In [98]:
#Build CNN
class CNN(nn.Module):
    """Two conv/ReLU/max-pool stages followed by a linear layer with 10 outputs.

    Both convolutions use 5x5 kernels with stride 1 and padding 2, so they keep
    the spatial size; each 2x2 max-pool halves it. The linear layer expects
    32*7*7 flattened features, which is what a 1x28x28 input produces
    (28 -> 14 -> 7 per side).
    """

    def __init__(self):
        super().__init__()
        # Stage 1: 1 -> 16 channels, then halve height and width.
        self.conv1 = nn.Sequential(
            nn.Conv2d(1, 16, kernel_size=5, stride=1, padding=2),
            nn.ReLU(),
            nn.MaxPool2d(2),
        )
        # Stage 2: 16 -> 32 channels, then halve height and width again.
        self.conv2 = nn.Sequential(
            nn.Conv2d(
                in_channels=16,
                out_channels=32,
                kernel_size=5,
                stride=1,
                padding=2,
            ),
            nn.ReLU(),
            nn.MaxPool2d(kernel_size=2),
        )
        # Maps the flattened 32*7*7 feature vector to 10 scores.
        self.out = nn.Linear(32 * 7 * 7, 10)

    def forward(self, x):
        """Return the 10 raw output scores for each sample in the batch ``x``."""
        features = self.conv1(x)
        features = self.conv2(features)
        # Collapse everything except the batch axis before the linear layer.
        flattened = features.view(features.size(0), -1)
        scores = self.out(flattened)
        return scores

In [117]:
# Instantiate the network; its parameters are handed to the optimizer below.
cnn = CNN()

In [118]:
#loss function and optimizer
# Cross-entropy is applied to the network's raw output scores and the targets.
loss_func = nn.CrossEntropyLoss()
# Adam updates every parameter of `cnn` using the configured learning rate.
optimizer = torch.optim.Adam(params=cnn.parameters(), lr=LR)

In [120]:
# Train for EPOCH passes over train_loader and, every 50 steps, report the
# current batch loss together with the accuracy on the held-out test_x/test_y.
for epoch in range(EPOCH):
    for step, (x, y) in enumerate(train_loader):
        output = cnn(x)
        loss = loss_func(output, y)

        # Clear gradients left from the previous step, backpropagate, update.
        optimizer.zero_grad()
        loss.backward()
        optimizer.step()

        if step % 50 == 0:
            # Evaluation needs no gradients: disabling autograd avoids building
            # a graph over the whole evaluation batch on every report.
            cnn.eval()
            with torch.no_grad():
                test_output = cnn(test_x)
            cnn.train()
            # Index of the largest score along dim 1 is the predicted class.
            pred_y = torch.max(test_output, 1)[1]
            # Count matches on the tensors directly instead of iterating a
            # NumPy array with the Python builtin sum().
            accuracy = (pred_y == test_y).sum().item() / float(test_y.size(0))
            print('Epoch: ',epoch, '| train loss: %.4f' % loss.item(), '| test accuracy:', accuracy)

Epoch:  0 | train loss: 2.3311 | test accuracy: 0.1625
Epoch:  0 | train loss: 0.5621 | test accuracy: 0.7995
Epoch:  0 | train loss: 0.5041 | test accuracy: 0.8435
Epoch:  0 | train loss: 0.1679 | test accuracy: 0.9145
Epoch:  0 | train loss: 0.1244 | test accuracy: 0.9345
Epoch:  0 | train loss: 0.1764 | test accuracy: 0.9345
Epoch:  0 | train loss: 0.3054 | test accuracy: 0.952
Epoch:  0 | train loss: 0.0714 | test accuracy: 0.953
Epoch:  0 | train loss: 0.1616 | test accuracy: 0.963
Epoch:  0 | train loss: 0.1301 | test accuracy: 0.969
Epoch:  0 | train loss: 0.0768 | test accuracy: 0.965
Epoch:  0 | train loss: 0.1418 | test accuracy: 0.9675
Epoch:  0 | train loss: 0.1583 | test accuracy: 0.9745
Epoch:  0 | train loss: 0.1841 | test accuracy: 0.9685
Epoch:  0 | train loss: 0.1515 | test accuracy: 0.9715
Epoch:  0 | train loss: 0.1311 | test accuracy: 0.975
Epoch:  0 | train loss: 0.0455 | test accuracy: 0.9715


KeyboardInterrupt: 