In [1]:
import torch
import torch.nn as nn
import torch.nn.functional as F
import torchvision
import torchvision.transforms as transforms
import matplotlib.pyplot as plt
import numpy as np

# Device configuration
# NOTE: a torch.device object is always truthy, so testing
# `if torch.device("cuda"):` picks CUDA even on machines without a GPU and
# later `.to(device)` calls fail. Ask the runtime whether CUDA is usable.
device = torch.device('cuda' if torch.cuda.is_available() else 'cpu')
print(device)
# Hyper-parameters
num_epochs = 1
batch_size = 4
learning_rate = 0.001

# Preprocessing: convert each image to a tensor, then normalize every channel
# with mean 0.5 and std 0.5 so values in [0, 1] end up in [-1, 1].
to_tensor = transforms.ToTensor()
normalize = transforms.Normalize((0.5, 0.5, 0.5), (0.5, 0.5, 0.5))
transform = transforms.Compose([to_tensor, normalize])

# CIFAR-100 train/test splits (100 classes), downloaded into ./data on first use.
dataset_kwargs = dict(root='./data', download=True, transform=transform)
train_dataset = torchvision.datasets.CIFAR100(train=True, **dataset_kwargs)
test_dataset = torchvision.datasets.CIFAR100(train=False, **dataset_kwargs)

# Only the training batches are shuffled; the test order stays fixed.
train_loader = torch.utils.data.DataLoader(
    train_dataset, batch_size=batch_size, shuffle=True)
test_loader = torch.utils.data.DataLoader(
    test_dataset, batch_size=batch_size, shuffle=False)


def conv_block(in_channels, out_channels, pool=False):
    """Build one convolution stage as an ``nn.Sequential``.

    The stage is Conv2d (3x3 kernel, padding 1) -> BatchNorm2d -> in-place ELU,
    optionally followed by a 2x2 max-pool.

    Args:
        in_channels: Number of channels of the incoming feature map.
        out_channels: Number of channels produced by the convolution.
        pool: When true, append ``nn.MaxPool2d(2)`` as the last layer.

    Returns:
        An ``nn.Sequential`` with three layers, or four when ``pool`` is set.
    """
    conv = nn.Conv2d(in_channels, out_channels, kernel_size=3, padding=1)
    norm = nn.BatchNorm2d(out_channels)
    act = nn.ELU(inplace=True)
    # The pooling layer is the only optional member of the stage.
    optional = (nn.MaxPool2d(2),) if pool else ()
    return nn.Sequential(conv, norm, act, *optional)

def fcn_block(in_neuron, out_neuron, activation=True):
    """Build one fully connected stage as an ``nn.Sequential``.

    The stage is BatchNorm1d over the inputs -> Linear, optionally followed by
    an in-place ELU.

    Args:
        in_neuron: Number of input features.
        out_neuron: Number of output features.
        activation: When true, append ``nn.ELU(inplace=True)`` after the linear
            layer; pass false for a final layer that should emit raw scores.

    Returns:
        An ``nn.Sequential`` with two layers, or three when ``activation`` is set.
    """
    core = [nn.BatchNorm1d(in_neuron), nn.Linear(in_neuron, out_neuron)]
    tail = [nn.ELU(inplace=True)] if activation else []
    return nn.Sequential(*core, *tail)


class ConvNet(nn.Module):
    """Residual-style CNN classifier built from ``conv_block`` / ``fcn_block``.

    The convolutional trunk contains five pooled stages (each halves the
    spatial size) and three two-layer residual branches whose output is added
    back to their input. The flattened trunk output is fed to three fully
    connected stages ending in ``num_classes`` raw scores (logits).

    Note: ``fc1`` expects exactly 1024 flattened features, which corresponds
    to a 1x1 spatial map after the five 2x2 pools, i.e. 32x32 inputs.

    Args:
        num_classes: Size of the output layer. Defaults to 100, the value that
            was previously hard-coded.
    """

    def __init__(self, num_classes=100):
        super().__init__()
        self.conv1 = conv_block(3, 64)
        self.conv2 = conv_block(64, 128, pool=True)
        self.res1 = nn.Sequential(conv_block(128, 128), conv_block(128, 128))
        self.conv3 = conv_block(128, 256, pool=True)
        self.conv4 = conv_block(256, 512, pool=True)
        self.res2 = nn.Sequential(conv_block(512, 512), conv_block(512, 512))
        self.conv5 = conv_block(512, 1024, pool=True)
        self.conv6 = conv_block(1024, 1024, pool=True)
        self.res3 = nn.Sequential(conv_block(1024, 1024), conv_block(1024, 1024))
        # Fully connected head; the last stage has no activation so it emits logits.
        self.fc1 = fcn_block(1024, 512)
        self.fc2 = fcn_block(512, 256)
        self.fc3 = fcn_block(256, num_classes, activation=False)

    def forward(self, x):
        """Compute class scores for a batch of images.

        Args:
            x: Image batch with 3 channels (``conv1`` takes 3 input channels).

        Returns:
            Tensor with one row per input sample and ``num_classes`` columns.
        """
        # Convolutional trunk; each ``resN`` branch is summed with its own input.
        out = self.conv1(x)
        out = self.conv2(out)
        out = self.res1(out) + out
        out = self.conv3(out)
        out = self.conv4(out)
        out = self.res2(out) + out
        out = self.conv5(out)
        out = self.conv6(out)
        out = self.res3(out) + out

        # Collapse everything except the batch dimension.
        out = torch.flatten(out, 1)

        # Fully connected head.
        out = self.fc1(out)
        out = self.fc2(out)
        out = self.fc3(out)

        return out

# Build the network on the selected device, together with its loss and optimizer.
model = ConvNet().to(device)

criterion = nn.CrossEntropyLoss()
optimizer = torch.optim.SGD(model.parameters(), lr=learning_rate)

n_total_steps = len(train_loader)
for epoch in range(num_epochs):
    for i, (images, labels) in enumerate(train_loader):
        # Move the batch to the same device as the model.
        images, labels = images.to(device), labels.to(device)

        # Clear stale gradients, then forward -> loss -> backward -> update.
        optimizer.zero_grad()
        outputs = model(images)
        loss = criterion(outputs, labels)
        loss.backward()
        optimizer.step()

        # Only report the current batch loss on every 2000th step.
        if (i+1) % 2000 != 0:
            continue
        print (f'Epoch [{epoch+1}/{num_epochs}], Step [{i+1}/{n_total_steps}], Loss: {loss.item():.4f}')

print('Finished Training')

# Persist the learned parameters (state_dict) to disk.
PATH = './cnn.pth'
torch.save(model.state_dict(), PATH)

# Switch to inference mode before testing: the network contains BatchNorm
# layers, which in training mode normalize with the statistics of the current
# (4-sample) batch and keep updating their running averages. Note that the
# model stays in eval mode afterwards; call model.train() before training again.
model.eval()

with torch.no_grad():
    n_correct = 0
    n_samples = 0
    n_class_correct = [0 for i in range(100)]
    n_class_samples = [0 for i in range(100)]
    for images, labels in test_loader:
        images = images.to(device)
        labels = labels.to(device)
        outputs = model(images)
        # max returns (value ,index); the index is the predicted class
        _, predicted = torch.max(outputs, 1)
        n_samples += labels.size(0)
        n_correct += (predicted == labels).sum().item()
        # Convert each tensor to Python ints once per batch instead of calling
        # .item() on every element.
        for label, pred in zip(labels.tolist(), predicted.tolist()):
            n_class_correct[label] += (label == pred)
            n_class_samples[label] += 1


    acc = 100.0 * n_correct / n_samples
    print(f'Accuracy of the network: {acc} %')

    # Per-class report, left disabled. NOTE(review): `Classes` is not defined in
    # the visible code; presumably the dataset's class-name list is intended
    # (e.g. test_dataset.classes) -- confirm before enabling.
    # for i in range(100):
    #     acc = 100.0 * n_class_correct[i] / n_class_samples[i]
    #     print(f'Accuracy of {Classes[i]}: {acc} %')

cpu
Downloading https://www.cs.toronto.edu/~kriz/cifar-100-python.tar.gz to ./data\cifar-100-python.tar.gz


 49%|████▊     | 82214912/169001437 [00:23<00:24, 3552029.39it/s]


KeyboardInterrupt: 