In [1]:
## Loading libs
import torch
from torch import nn
import torchvision
import torchvision.transforms as transforms


In [2]:
## Setting up Hyperparameters
batch_size = 64
num_classes = 10
lr = 0.001
num_epochs = 50 



In [3]:
## Device Agnostic codes
device = "cuda" if torch.cuda.is_available() else "cpu"
device

'cuda'

In [4]:
## Since we're goisng to use CIFAR-10 Dataset
## We need to create certain types of transforms

all_transforms = transforms.Compose([
    transforms.ToTensor(),
    transforms.Normalize(mean=[0.4914,0.4822, 0.4465],std=[0.2023, 0.1994, 0.2010])
    
])



In [5]:
## Loading datasets
train_datasets = torchvision.datasets.CIFAR10(root="./data",
                                             train=True,
                                             transform = all_transforms,
                                             download= True)


Downloading https://www.cs.toronto.edu/~kriz/cifar-10-python.tar.gz to ./data/cifar-10-python.tar.gz


100%|██████████| 170498071/170498071 [00:04<00:00, 34505159.47it/s]


Extracting ./data/cifar-10-python.tar.gz to ./data


In [6]:
## Creating test dataset

test_datasets = torchvision.datasets.CIFAR10(root='./data',
                                            train = False,
                                            transform = all_transforms,
                                            download = True)


Files already downloaded and verified


In [7]:
## Time to put dataset into dataloaders

train_loader = torch.utils.data.DataLoader(dataset = train_datasets,
                                          batch_size = batch_size,
                                          shuffle= True)

test_loader = torch.utils.data.DataLoader(dataset = test_datasets,
                                         batch_size = batch_size,
                                         shuffle = True)

In [8]:
# ## Creating a blue print of the Model
# class CNN(nn.Module):
#     def __init__(self, num_classes):
#         super(CNN, self).__init__()
        
#         self.layer_1 = nn.Conv2d(3,32,3)
#         self.layer_2 = nn.Conv2d(32,32,3)
#         self.max_pool1 = nn.MaxPool2d(2,2)
        
#         self.layer_3 = nn.Conv2d(32,64,3)
#         self.layer_4 = nn.Conv2d(64,64,3)
#         self.max_pool2 = nn.MaxPool2d(2,2)
        
#         self.fc1 = nn.Linear(1600, 28)
#         self.relu1 = nn.ReLU()
#         self.fc2 = nn.Linear(128, num_classes)
        
#     def forward(self,x):
#         out = self.layer_1(x)
#         out = self.layer_2(out)
#         out = self.max_pool1(out)
#         out = self.layer_3(out)
#         out = self.layer_4(out)
#         out = self.max_pool2(out)
        
#         ## reshape before feeding the ip into FCs
#         out = out.reshape(out.size(0), -1)
        
#         out = self.fc1(out)
#         out = self.relu1(out)
#         out = self.fc2(out)
        
#         return out
        
# Creating a CNN class
class CNN(nn.Module):
	#  Determine what layers and their order in CNN object 
    def __init__(self, num_classes):
        super(CNN, self).__init__()
        self.conv_layer1 = nn.Conv2d(in_channels=3, out_channels=32, kernel_size=3)
        self.conv_layer2 = nn.Conv2d(in_channels=32, out_channels=32, kernel_size=3)
        self.max_pool1 = nn.MaxPool2d(kernel_size = 2, stride = 2)
        
        self.conv_layer3 = nn.Conv2d(in_channels=32, out_channels=64, kernel_size=3)
        self.conv_layer4 = nn.Conv2d(in_channels=64, out_channels=64, kernel_size=3)
        self.max_pool2 = nn.MaxPool2d(kernel_size = 2, stride = 2)
        
        self.fc1 = nn.Linear(1600, 128)
        self.relu1 = nn.ReLU()
        self.fc2 = nn.Linear(128, num_classes)
    
    # Progresses data across layers    
    def forward(self, x):
        out = self.conv_layer1(x)
        out = self.conv_layer2(out)
        out = self.max_pool1(out)
        
        out = self.conv_layer3(out)
        out = self.conv_layer4(out)
        out = self.max_pool2(out)
                
        out = out.reshape(out.size(0), -1)
        
        out = self.fc1(out)
        out = self.relu1(out)
        out = self.fc2(out)
        return out

In [9]:
## Lets instantiate our model
model = CNN(num_classes)

model.to(device)

criterion = nn.CrossEntropyLoss()

optimizer = torch.optim.SGD(model.parameters(), lr = lr, weight_decay = 0.005, momentum = 0.9)


total_step = len(train_loader)



In [10]:
device

'cuda'

In [11]:
# We use the pre-defined number of epochs to determine how many iterations to train the network on
for epoch in range(num_epochs):
	#Load in the data in batches using the train_loader object
    for i, (images, labels) in enumerate(train_loader):  
        # Move tensors to the configured device
        images = images.to(device)
        labels = labels.to(device)
        
        # Forward pass
        outputs = model(images)
        loss = criterion(outputs, labels)
        
        # Backward and optimize
        optimizer.zero_grad()
        loss.backward()
        optimizer.step()

    print('Epoch [{}/{}], Loss: {:.4f}'.format(epoch+1, num_epochs, loss.item()))

            
            


Epoch [1/50], Loss: 1.7405
Epoch [2/50], Loss: 1.3588
Epoch [3/50], Loss: 1.6455
Epoch [4/50], Loss: 0.8769
Epoch [5/50], Loss: 1.3026
Epoch [6/50], Loss: 0.7920
Epoch [7/50], Loss: 0.9983
Epoch [8/50], Loss: 0.9312
Epoch [9/50], Loss: 0.5768
Epoch [10/50], Loss: 0.8994
Epoch [11/50], Loss: 1.1246
Epoch [12/50], Loss: 0.6203
Epoch [13/50], Loss: 0.7026
Epoch [14/50], Loss: 0.7538
Epoch [15/50], Loss: 0.5328
Epoch [16/50], Loss: 0.6767
Epoch [17/50], Loss: 0.5164
Epoch [18/50], Loss: 0.4878
Epoch [19/50], Loss: 0.9593
Epoch [20/50], Loss: 0.9969
Epoch [21/50], Loss: 0.9304
Epoch [22/50], Loss: 0.7156
Epoch [23/50], Loss: 0.6729
Epoch [24/50], Loss: 0.5601
Epoch [25/50], Loss: 0.8471
Epoch [26/50], Loss: 0.3296
Epoch [27/50], Loss: 0.3021
Epoch [28/50], Loss: 0.4058
Epoch [29/50], Loss: 0.4386
Epoch [30/50], Loss: 0.3073
Epoch [31/50], Loss: 0.6906
Epoch [32/50], Loss: 0.2270
Epoch [33/50], Loss: 0.3979
Epoch [34/50], Loss: 0.7494
Epoch [35/50], Loss: 0.0876
Epoch [36/50], Loss: 0.4830
E

In [12]:
with torch.no_grad():
    correct = 0
    total = 0
    for images, labels in train_loader:
        images = images.to(device)
        labels = labels.to(device)
        outputs = model(images)
        _, predicted = torch.max(outputs.data, 1)
        total += labels.size(0)
        correct += (predicted == labels).sum().item()
    
    print('Accuracy of the network on the {} train images: {} %'.format(50000, 100 * correct / total))




Accuracy of the network on the 50000 train images: 96.046 %
