In [116]:
import pandas as pd
import numpy as np
import matplotlib.pyplot as plt
import torch
import torchvision
from torchvision import transforms
import torch.nn as nn
import torch.nn.functional as F
from scipy.io import loadmat
from torch.utils.data import DataLoader, Dataset
from torch.autograd import Variable

In [131]:
!wget http://ufldl.stanford.edu/housenumbers/train_32x32.mat
!wget http://ufldl.stanford.edu/housenumbers/test_32x32.mat

--2021-04-21 15:16:46--  http://ufldl.stanford.edu/housenumbers/train_32x32.mat
Resolving ufldl.stanford.edu (ufldl.stanford.edu)... 171.64.68.10
Connecting to ufldl.stanford.edu (ufldl.stanford.edu)|171.64.68.10|:80... connected.
HTTP request sent, awaiting response... 200 OK
Length: 182040794 (174M) [text/plain]
Saving to: ‘train_32x32.mat’


2021-04-21 15:16:49 (67.0 MB/s) - ‘train_32x32.mat’ saved [182040794/182040794]

--2021-04-21 15:16:49--  http://ufldl.stanford.edu/housenumbers/test_32x32.mat
Resolving ufldl.stanford.edu (ufldl.stanford.edu)... 171.64.68.10
Connecting to ufldl.stanford.edu (ufldl.stanford.edu)|171.64.68.10|:80... connected.
HTTP request sent, awaiting response... 200 OK
Length: 64275384 (61M) [text/plain]
Saving to: ‘test_32x32.mat’


2021-04-21 15:16:50 (56.3 MB/s) - ‘test_32x32.mat’ saved [64275384/64275384]



In [117]:
class SVHN_dataset(Dataset):

    def __init__(self, data,transform):
        # Transform data to Torch Tensors
        self.images = torch.tensor(data['X']).permute([3,2,0,1])
        self.labels = torch.tensor(data['y'])
        self.size = self.labels.shape[0]

        # replace label 10 with label 0
        self.labels[self.labels==10] = 0
        # convert to float and normalize images to 0..1 range
        self.images = torch.FloatTensor(self.images/255.)
        self.transform = transform

    def __len__(self):
        return self.size

    def __getitem__(self, idx):
        return self.images[idx], self.labels[idx]

In [118]:
class CNN(nn.Module):
  def __init__(self):
    super(CNN, self).__init__()

    self.layer1 = nn.Sequential(
        nn.Conv2d(3,6,(5,5),padding=2,stride=1),
        nn.BatchNorm2d(6),
        nn.ReLU(),
        nn.MaxPool2d(kernel_size=2, stride=2)
    )
    self.layer2 = nn.Sequential(
        nn.Conv2d(6,12,(3,3),padding=1,stride=1),
        nn.BatchNorm2d(12),
        nn.ReLU(),
        nn.MaxPool2d(kernel_size=2, stride=2)
    )
    self.layer3 = nn.Sequential(
        nn.Conv2d(12,24,(3,3),padding=1,stride=1),
        nn.BatchNorm2d(24),
        nn.ReLU(),
        nn.MaxPool2d(kernel_size=2, stride=2)
    )

    self.fc1 = nn.Linear(in_features=24*4*4, out_features=120)
    self.fc2 = nn.Linear(in_features=120, out_features=60)
    self.out = nn.Linear(in_features=60, out_features=10)
  

  def forward(self, x):
    out = self.layer1(x)
    # print(out.shape)

    out = self.layer2(out)
    # print(out.shape)

    out = self.layer3(out)
    # print(out.shape)

    out = out.reshape(-1, 24 * 4 * 4)
    out = self.fc1(out)
    out = F.relu(out)

    out = self.fc2(out)
    out = F.relu(out)

    out = self.out(out)
    out = F.softmax(out)
    # print(out.shape)

    return out

In [119]:
# initialize weights of CNN layers
def init_weights(m):
  mean = 0.0
  std = 0.001
  if isinstance(m, nn.Conv2d):
    m.weight.data.normal_(mean,std)
    if m.bias is not None:
      nn.init.constant_(m.bias.data, 0)
  elif isinstance(m, nn.BatchNorm2d):
    m.weight.data.normal_(mean,std)
    if m.bias is not None:
      nn.init.constant_(m.bias.data, 0)
  elif isinstance(m, nn.Linear):
    m.weight.data.normal_(mean,std)
    if m.bias is not None:
      nn.init.constant_(m.bias.data, 0)


In [120]:
transform = transforms.Compose(
      [
        transforms.ToTensor(),
        transforms.Normalize([0.5, 0.5, 0.5], [0.5, 0.5, 0.5])
        ]
    )

In [121]:
train = loadmat('train_32x32.mat')
test = loadmat('test_32x32.mat')

In [122]:
print(train['X'].shape)

(32, 32, 3, 73257)


In [123]:
train_SVHNdataset = SVHN_dataset(data = train, transform = transform)
test_SVHNdataset = SVHN_dataset(data = test, transform = transform)

In [124]:
params = {'batch_size': 512,
          'shuffle': True,
          'num_workers': 1,
          'pin_memory':True}

In [126]:
trainSVHN_loader = DataLoader(train_SVHNdataset, **params)
testSVHN_loader = DataLoader(test_SVHNdataset, **params)

In [127]:
model = CNN()
model.apply(init_weights)
device = torch.device("cuda:0" if torch.cuda.is_available() else cpu)
print(device)

cuda:0


In [128]:
model.to(device)

CNN(
  (layer1): Sequential(
    (0): Conv2d(3, 6, kernel_size=(5, 5), stride=(1, 1), padding=(2, 2))
    (1): BatchNorm2d(6, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
    (2): ReLU()
    (3): MaxPool2d(kernel_size=2, stride=2, padding=0, dilation=1, ceil_mode=False)
  )
  (layer2): Sequential(
    (0): Conv2d(6, 12, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1))
    (1): BatchNorm2d(12, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
    (2): ReLU()
    (3): MaxPool2d(kernel_size=2, stride=2, padding=0, dilation=1, ceil_mode=False)
  )
  (layer3): Sequential(
    (0): Conv2d(12, 24, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1))
    (1): BatchNorm2d(24, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
    (2): ReLU()
    (3): MaxPool2d(kernel_size=2, stride=2, padding=0, dilation=1, ceil_mode=False)
  )
  (fc1): Linear(in_features=384, out_features=120, bias=True)
  (fc2): Linear(in_features=120, out_features=60, bias=True)


In [129]:
learning_rate = 0.001
lossfunc = nn.CrossEntropyLoss()
optimizer = torch.optim.Adam(model.parameters(),lr=learning_rate)

In [130]:
num_epochs = 10
loss_values = list()
for epoch in range(num_epochs):
    # Training
    for X_train, y_train in trainSVHN_loader:
      # Transfer to GPU
      X_train_tensor = torch.tensor(X_train, dtype = torch.float)
      y_train_tensor = torch.tensor(y_train, dtype = torch.long)

      images, labels = Variable(X_train_tensor).to(device), Variable(y_train_tensor).to(device)

      # model computation
      outputs = model(images)
      target = torch.argmax(labels, dim=1)
      loss = lossfunc(outputs, target)
      optimizer.zero_grad()
      loss.backward()
      optimizer.step()

      print('Epoch -',epoch, 'loss - ', loss.item())
      loss_values.append(loss.item())


  import sys
  


Epoch - 0 loss -  2.3025848865509033
Epoch - 0 loss -  2.302403211593628
Epoch - 0 loss -  2.3022148609161377
Epoch - 0 loss -  2.3020172119140625
Epoch - 0 loss -  2.301811456680298
Epoch - 0 loss -  2.3015966415405273
Epoch - 0 loss -  2.301368474960327
Epoch - 0 loss -  2.3011248111724854
Epoch - 0 loss -  2.30086612701416
Epoch - 0 loss -  2.3005897998809814
Epoch - 0 loss -  2.300288438796997
Epoch - 0 loss -  2.299961805343628
Epoch - 0 loss -  2.29960298538208
Epoch - 0 loss -  2.299206495285034
Epoch - 0 loss -  2.2987663745880127
Epoch - 0 loss -  2.298271894454956
Epoch - 0 loss -  2.297717332839966
Epoch - 0 loss -  2.297088861465454
Epoch - 0 loss -  2.2963714599609375
Epoch - 0 loss -  2.2955477237701416
Epoch - 0 loss -  2.2945940494537354
Epoch - 0 loss -  2.2934820652008057
Epoch - 0 loss -  2.2921714782714844
Epoch - 0 loss -  2.290613889694214
Epoch - 0 loss -  2.288745641708374
Epoch - 0 loss -  2.286487579345703
Epoch - 0 loss -  2.2837417125701904
Epoch - 0 loss - 