In [1]:
import torch
import torch.nn as nn
import torch.nn.functional as F
import dataloader as dl
from torchvision import datasets, transforms
from torch.utils.data import DataLoader
import numpy as np

In [2]:
class Net(nn.Module):
    """Small CNN classifier: two conv + max-pool stages, then two linear layers.

    The hard-coded ``4*4*50`` flatten size corresponds to single-channel
    28x28 inputs (28 -> 24 -> 12 -> 8 -> 4 through the 5x5 convolutions and
    2x2 poolings). The network emits log-probabilities over 10 classes.
    """

    def __init__(self):
        super().__init__()
        # Layers are created in the order they are applied.
        self.conv1 = nn.Conv2d(in_channels=1, out_channels=20, kernel_size=5, stride=1)
        self.conv2 = nn.Conv2d(in_channels=20, out_channels=50, kernel_size=5, stride=1)
        self.fc1 = nn.Linear(in_features=4 * 4 * 50, out_features=500)
        self.fc2 = nn.Linear(in_features=500, out_features=10)

    def forward(self, x):
        """Return per-class log-probabilities of shape (batch, 10)."""
        # Both feature stages share the same shape: conv -> ReLU -> 2x2 max-pool.
        for conv in (self.conv1, self.conv2):
            x = F.max_pool2d(F.relu(conv(x)), kernel_size=2, stride=2)
        # Flatten to whatever width the first linear layer expects (4*4*50).
        flat = x.view(-1, self.fc1.in_features)
        hidden = F.relu(self.fc1(flat))
        return F.log_softmax(self.fc2(hidden), dim=1)

In [3]:
def count_correct(output,y):
    """Count how many rows of ``output`` have their arg-max equal to the label.

    Args:
        output: tensor whose first dimension indexes samples; each sample's
            scores are flattened before taking the arg-max.
        y: labels, one per sample (tensor or sequence of ints; a trailing
            singleton dimension such as ``(N, 1)`` is accepted).

    Returns:
        int: number of samples whose predicted class equals the label.

    Raises:
        ValueError: if the number of labels differs from the number of samples.
    """
    n_samples = len(output)
    if n_samples == 0:
        return 0
    # One vectorised arg-max instead of a Python loop over samples; the
    # reshape mirrors the per-row flattening of ``output[i].argmax()``.
    predicted = output.reshape(n_samples, -1).argmax(dim=1)
    targets = torch.as_tensor(y, device=predicted.device).reshape(-1)
    if targets.numel() != n_samples:
        # Guard against silent broadcasting of mismatched shapes.
        raise ValueError(
            f"expected {n_samples} labels, got {targets.numel()}"
        )
    return int((predicted == targets).sum().item())

In [4]:
def train(model_conv,epoch,learning_rate=0.001,momentum=0.9,batch_size=60):
    """Train ``model_conv`` on the ``dl.Ocr("train")`` dataset with SGD and NLL loss.

    Prints one ``-`` per optimisation step and, after every epoch, the
    accuracy measured on the training set itself.

    Args:
        model_conv: the network to optimise; it is updated in place.
        epoch: number of passes over the training data.
        learning_rate: SGD learning rate (default 0.001).
        momentum: SGD momentum (default 0.9).
        batch_size: mini-batch size for the shuffled loader (default 60).

    Returns:
        tuple: ``(model_conv, optimizer)`` so the caller can checkpoint both.
    """
    data_set = dl.Ocr("train")
    loss_fn = F.nll_loss
    optimizer = torch.optim.SGD(model_conv.parameters(),learning_rate,momentum=momentum)
    dataloader = DataLoader(data_set, batch_size=batch_size,shuffle=True)

    model_conv.train()
    for i in range(epoch):
        # Re-assert training mode every epoch: the accuracy evaluation at the
        # end of the previous epoch may have left the model in eval mode.
        model_conv.train()
        for x,y in dataloader:
            optimizer.zero_grad()
            output = model_conv(x.float())
            loss = loss_fn(output,y)
            print("-",end="")
            loss.backward()
            optimizer.step()
        # Accuracy is computed on the training data, not on a held-out set.
        acc = get_accuracy(model_conv,data_set)
        print(f"   epoch: {i+1} accuracy: {acc}")
    return (model_conv,optimizer)

In [5]:
# saving the model:
def save_checkpoint(model,optimizer,num_epoch,epoch_prev,save_path='../resources/checkpoint.pth'):
    """Serialise model and optimizer state, plus the cumulative epoch count.

    Args:
        model: module whose ``state_dict()`` is stored under ``'state_dict'``.
        optimizer: optimizer whose ``state_dict()`` is stored under ``'optimizer'``.
        num_epoch: epochs trained in the current run.
        epoch_prev: epochs trained before the current run.
        save_path: destination file handed to ``torch.save``.
    """
    total_epochs = num_epoch + epoch_prev
    model_state = model.state_dict()
    optimizer_state = optimizer.state_dict()
    torch.save(
        dict(epoch=total_epochs, state_dict=model_state, optimizer=optimizer_state),
        save_path,
    )

In [6]:
def get_accuracy(model,dat_set,batch_size=100):
    """Return the classification accuracy of ``model`` on ``dat_set`` in percent.

    The model is evaluated in eval mode with autograd disabled, and its
    previous train/eval mode is restored afterwards, so the function can be
    called safely from inside a training loop.

    Args:
        model: module mapping a float batch to per-class scores.
        dat_set: dataset yielding ``(x, y)`` pairs; must support ``len()``.
        batch_size: evaluation batch size (default 100).

    Returns:
        float: percentage of correctly classified samples, or ``0.0`` when
        the dataset is empty.
    """
    total = len(dat_set)
    if total == 0:
        # Nothing to evaluate; avoid dividing by zero below.
        return 0.0

    data = DataLoader(dat_set, batch_size=batch_size)
    was_training = model.training
    model.eval()
    correct = 0
    try:
        # No gradients are needed for evaluation; skipping the autograd
        # graph saves memory and time.
        with torch.no_grad():
            for x,y in data:
                predictions = model(x.float())
                correct += count_correct(predictions,y)
    finally:
        # Put the model back in whatever mode the caller had it in.
        model.train(was_training)
    return (correct/total)*100

In [10]:
# Instantiate a fresh, untrained network; no random seed is set in the
# visible cells, so the initial weights differ from run to run.
model = Net()

In [11]:
# Train for 15 epochs; train() returns the model together with its SGD
# optimizer so both can be checkpointed later.
(model,optimizer) = train(model,15)

------------------------   epoch: 1 accuracy: 32.150461320085164
------------------------   epoch: 2 accuracy: 89.3541518807665
------------------------   epoch: 3 accuracy: 93.54151880766501
------------------------   epoch: 4 accuracy: 98.93541518807665
------------------------   epoch: 5 accuracy: 99.14833215046131
------------------------   epoch: 6 accuracy: 96.23846699787083
------------------------   epoch: 7 accuracy: 99.57416607523066
------------------------   epoch: 8 accuracy: 99.78708303761533
------------------------   epoch: 9 accuracy: 99.9290276792051
------------------------   epoch: 10 accuracy: 99.78708303761533
------------------------   epoch: 11 accuracy: 100.0
------------------------   epoch: 12 accuracy: 100.0
------------------------   epoch: 13 accuracy: 99.9290276792051
------------------------   epoch: 14 accuracy: 99.9290276792051
------------------------   epoch: 15 accuracy: 100.0


In [12]:
# Evaluate the trained model on the dl.Ocr("test") dataset; the bare last
# expression displays the accuracy as a percentage.
data_set = dl.Ocr("test")
get_accuracy(model,data_set)

99.69909729187563

In [13]:
# Record the 15 epochs actually run by train(model,15); the previous value
# of 10 under-reported the training done. epoch_prev is 0 because the model
# was trained from scratch in this notebook.
save_checkpoint(model,optimizer,15,0,save_path="../Data/checkpoint2.pth")