In [1]:
#importing different libraries
from __future__ import print_function, division
import os
import torch
import pandas as pd
from skimage import io, transform
import numpy as np
import matplotlib.pyplot as plt
from torch.utils.data import Dataset, DataLoader
from torchvision import transforms, utils
import torch.nn as nn
from torch.autograd import Variable

# Ignore warnings
import warnings
warnings.filterwarnings("ignore")

plt.ion()   # interactive mode

In [2]:
#changing the dataset(csv file) to the torch.tensor form
class FashionMNIST(Dataset):
    def __init__(self, csv_file, root_dir, transform=None, transform1=None):
        """
        Args:
            csv_file (string): Path to the csv file with annotations.
            root_dir (string): Directory with all the images.
            transform (callable, optional): Optional transform to be applied
                on a sample.
        """
        self.landmarks_frame = pd.read_csv(csv_file)
        self.root_dir = root_dir
        self.transform = transform
        self.transform1 = transform1

    def __len__(self):
        return len(self.landmarks_frame)

    def __getitem__(self, idx):
    
        image = torch.Tensor(self.landmarks_frame.iloc[idx, 1:].values.reshape(1,28,28))
        label = self.landmarks_frame.iloc[idx, 0].reshape(1)
        label = torch.LongTensor(label)
        image =self.transform1(image)
        
        image = self.transform(image)
        label = label[0]
        landmarks = (image, label)
        
        return landmarks


In [3]:
#creating the train dataset and test dataset
transform = transforms.Compose(
    [transforms.ToTensor(),
     transforms.Normalize((0.5, 0.5, 0.5), (0.5, 0.5, 0.5))])
train_dataset = FashionMNIST(csv_file='fdata/fashion-mnist_train.csv',
                             root_dir='fdata/',
                             transform=transform,
                             transform1=transforms.ToPILImage())

In [4]:
test_dataset = FashionMNIST(csv_file='fdata/fashion-mnist_test.csv',
                            root_dir='fdata/',
                            transform=transform,
                            transform1=transforms.ToPILImage())

In [5]:
#loading the train and test dataset
batch_size = 100
n_iters = 6000
num_epochs = 10

train_load = torch.utils.data.DataLoader(dataset=train_dataset,
                                        batch_size=batch_size,
                                        shuffle=True)

test_load = torch.utils.data.DataLoader(dataset=test_dataset,
                                        batch_size=batch_size,
                                        shuffle=False)

In [6]:
#Swish activation function
def swish(x):
    return x * F.sigmoid(x)

In [17]:
#creating the model class
torch.manual_seed(0)
class CNNModel(nn.Module):
    def __init__(self):
        super(CNNModel, self).__init__()
        
        self.cnn1 = nn.Conv2d(in_channels=1, out_channels=16, kernel_size=5, stride=1, padding=2)
        nn.init.xavier_uniform(self.cnn1.weight)
        self.bn1 = nn.BatchNorm2d(16)
        #self.dr1 = nn.Dropout2d(0.07)
        self.relu1 = nn.ReLU()
        
        self.pool1 = nn.MaxPool2d(kernel_size=2)
        
        self.cnn2 = nn.Conv2d(in_channels=16, out_channels=32, kernel_size=5, stride=1, padding=2)
        nn.init.xavier_uniform(self.cnn2.weight)
        self.bn2 = nn.BatchNorm2d(32)
        #self.dr2 = nn.Dropout2d(0.07)
        self.relu2 = nn.ReLU()
        
        self.pool2 = nn.MaxPool2d(kernel_size=2)
        
        self.cnn3 = nn.Conv2d(in_channels=32, out_channels=32, kernel_size=5, stride=1, padding=2)
        nn.init.xavier_uniform(self.cnn3.weight)
        self.bn3 = nn.BatchNorm2d(32)
        #self.dr3 = nn.Dropout2d(0.07)
        self.relu3 = nn.ReLU()
        
        #self.cnn4 = nn.Conv2d(in_channels=32, out_channels=32, kernel_size=5, stride=1, padding=2)
        #nn.init.xavier_uniform(self.cnn4.weight)
        #self.bn4 = nn.BatchNorm1d(32)
        #self.dr4 = nn.Dropout2d(0.07)
        #self.relu4 = nn.ReLU()
        
        self.fc = nn.Linear(32*7*7, 10)
        self.bn5 = nn.BatchNorm1d(10)
        nn.init.xavier_uniform(self.fc.weight)
        
    def forward(self, x):
        
        out = self.cnn1(x)
        out = self.bn1(out)
        #out = self.dr1(out)
        out = self.relu1(out)
        
        out = self.pool1(out)
        
        out = self.cnn2(out)
        out = self.bn2(out)
        #out = self.dr2(out)
        out = self.relu2(out)
        
        out = self.pool2(out)
        
        out = self.cnn3(out)
        out = self.bn3(out)
        #out = self.dr3(out)
        out = self.relu3(out)
        
        #out = self.cnn4(out)
        #out = self.bn4(out)
        #out = self.dr4(out)
        #out = self.relu4(out)
        
        out = out.view(out.size(0),-1)
        
        out = self.fc(out)
        out = self.bn5(out)
        
        return out

In [18]:
#instantiating the model class
model = CNNModel()

In [19]:
#instantiating the loss class
criterion = nn.CrossEntropyLoss()

In [20]:
#instantiating the optimizer class
learing_rate = 0.06

optimizer = torch.optim.Adagrad(model.parameters(), lr=learing_rate)

print(len(list(model.parameters())))

16


In [21]:
#training the model
iter = 0

for epoch in range(num_epochs):
    for i,(images, labels) in enumerate(train_load):
        images = Variable(images)
        labels = Variable(labels)
        
        optimizer.zero_grad()
        
        outputs = model(images)
        
        loss = criterion(outputs, labels)
        
        loss.backward()
        
        optimizer.step()
        
        iter += 1
        
        #testing the model
        if (iter%500) == 0:
            total = 0
            correct = 0
            for images, labels in test_load:
                images = Variable(images)
            
                outputs = model(images)
                _, predicts = torch.max(outputs.data, 1)
                
                total += labels.size(0)
                
                correct += (predicts == labels).sum()
            accuracy = 100 * (correct.item() / total)
                
            print('iterations {}, loss {}, accuracy {}'.format(iter, loss.data[0], accuracy))

iterations 500, loss 0.3865665793418884, accuracy 88.31
iterations 1000, loss 0.32070326805114746, accuracy 89.69
iterations 1500, loss 0.3125731647014618, accuracy 90.71000000000001
iterations 2000, loss 0.31422320008277893, accuracy 90.24
iterations 2500, loss 0.2363504022359848, accuracy 90.91
iterations 3000, loss 0.30532631278038025, accuracy 90.94
iterations 3500, loss 0.13100895285606384, accuracy 91.07
iterations 4000, loss 0.1430157721042633, accuracy 90.89
iterations 4500, loss 0.06790616363286972, accuracy 91.0
iterations 5000, loss 0.18560124933719635, accuracy 91.13
iterations 5500, loss 0.08033032715320587, accuracy 91.05
iterations 6000, loss 0.15602754056453705, accuracy 90.9


In [None]:
#Max accuracy = 91.13%