In [1]:
import torch
import torch.nn as nn
import matplotlib.pyplot as plt

from torch.autograd import Variable

# Torchvision module contains various utilities, classes, models and datasets 
# used towards computer vision usecases
from torchvision import datasets
from torchvision import transforms
import torchvision

# Functional module contains helper functions
import torch.nn.functional as F

In [15]:
# Preprocessing applied to every image, in order: resize to 256, center-crop
# to 224x224, convert to a tensor, then normalize the three channels with the
# per-channel mean/std below.
# NOTE(review): the mean/std values look like the standard ImageNet statistics
# expected by torchvision's pretrained models -- confirm.
transform = transforms.Compose(
    [
        transforms.Resize(256),
        transforms.CenterCrop(224),
        transforms.ToTensor(),
        transforms.Normalize(
            mean=[0.485, 0.456, 0.406],
            std=[0.229, 0.224, 0.225],
        ),
    ]
)

# Mini-batch size shared by the train and test loaders.
batch_size = 4

# Training split of CIFAR-10 (downloaded into ./data when missing); the loader
# reshuffles it on every pass.
trainset = datasets.CIFAR10(
    root='./data',
    train=True,
    download=True,
    transform=transform,
)
trainloader = torch.utils.data.DataLoader(
    trainset,
    batch_size=batch_size,
    shuffle=True,
    num_workers=2,
)

# Held-out test split; iterated in a fixed order (no shuffling).
testset = datasets.CIFAR10(
    root='./data',
    train=False,
    download=True,
    transform=transform,
)
testloader = torch.utils.data.DataLoader(
    testset,
    batch_size=batch_size,
    shuffle=False,
    num_workers=2,
)

# Human-readable class names; later cells index this tuple with the integer
# labels produced by the dataset.
classes = (
    'plane', 'car', 'bird', 'cat', 'deer',
    'dog', 'frog', 'horse', 'ship', 'truck',
)


Files already downloaded and verified
Files already downloaded and verified


In [3]:
# Model: AlexNet with pretrained weights, loaded through torch.hub from the
# torchvision v0.6.0 tag.
# (Alternative that was tried: net = torchvision.models.resnet50())
net = torch.hub.load('pytorch/vision:v0.6.0', 'alexnet', pretrained=True)

# Replace the tail of the classifier head. Index 4 becomes a narrower
# 4096 -> 1024 layer, and index 6 (the output layer) maps those 1024 features
# to 10 logits -- one per class label the model should predict.
net.classifier[4] = nn.Linear(in_features=4096, out_features=1024)
net.classifier[6] = nn.Linear(in_features=1024, out_features=10)

# Loss: cross-entropy between the 10 output logits and the integer labels.
criterion = nn.CrossEntropyLoss()

# Optimizer: SGD with momentum over all of the network's parameters.
learning_rate = 0.001
optimizer = torch.optim.SGD(
    net.parameters(),
    lr=learning_rate,
    momentum=0.9,
)

Using cache found in C:\Users\merna/.cache\torch\hub\pytorch_vision_v0.6.0


In [5]:
# Fine-tune `net` on the training loader with the loss and optimizer defined
# in the previous cell, printing the mean loss every `log_every` mini-batches.
num_epochs = 10    # full passes over the training set
log_every = 2000   # mini-batches per progress report

# Put the network in training mode explicitly. Mode-dependent layers (e.g.
# dropout) must be active while fitting, and this cell may be re-run after
# some other cell has switched the model to eval mode.
net.train()

for epoch in range(num_epochs):  # loop over the dataset multiple times

    running_loss = 0.0
    for i, (inputs, labels) in enumerate(trainloader):
        # Gradients accumulate across backward() calls, so clear them first.
        optimizer.zero_grad()

        # forward + backward + optimize
        outputs = net(inputs)
        loss = criterion(outputs, labels)
        loss.backward()
        optimizer.step()

        # Accumulate the loss and report its mean over the last window.
        running_loss += loss.item()
        if (i + 1) % log_every == 0:
            print('[%d, %5d] loss: %.3f' %
                  (epoch + 1, i + 1, running_loss / log_every))
            running_loss = 0.0

print('Finished Training')

[1,  2000] loss: 1.368
[1,  4000] loss: 1.040
[1,  6000] loss: 0.946
[1,  8000] loss: 0.869
[1, 10000] loss: 0.824
[1, 12000] loss: 0.784
[2,  2000] loss: 0.686
[2,  4000] loss: 0.679
[2,  6000] loss: 0.667
[2,  8000] loss: 0.701
[2, 10000] loss: 0.673
[2, 12000] loss: 0.637
[3,  2000] loss: 0.546
[3,  4000] loss: 0.546
[3,  6000] loss: 0.566
[3,  8000] loss: 0.555
[3, 10000] loss: 0.563
[3, 12000] loss: 0.574
[4,  2000] loss: 0.456
[4,  4000] loss: 0.467
[4,  6000] loss: 0.485
[4,  8000] loss: 0.493
[4, 10000] loss: 0.504
[4, 12000] loss: 0.503
[5,  2000] loss: 0.401
[5,  4000] loss: 0.412
[5,  6000] loss: 0.468
[5,  8000] loss: 0.436
[5, 10000] loss: 0.455
[5, 12000] loss: 0.462
[6,  2000] loss: 0.375
[6,  4000] loss: 0.375
[6,  6000] loss: 0.383
[6,  8000] loss: 0.401
[6, 10000] loss: 0.400
[6, 12000] loss: 0.436
[7,  2000] loss: 0.346
[7,  4000] loss: 0.369
[7,  6000] loss: 0.375
[7,  8000] loss: 0.384
[7, 10000] loss: 0.409
[7, 12000] loss: 0.405
[8,  2000] loss: 0.314
[8,  4000] 

In [6]:
# Overall top-1 accuracy of `net` on the test loader.
correct = 0
total = 0

# Evaluate in eval mode: otherwise mode-dependent layers such as dropout stay
# active and randomly perturb the predictions, making the reported accuracy
# noisy and pessimistic. The previous mode is restored afterwards so that
# re-running the training cell later behaves exactly as before.
was_training = net.training
net.eval()
try:
    # Since we're not training, no gradients are needed for the outputs.
    with torch.no_grad():
        for images, labels in testloader:
            # Calculate outputs by running images through the network.
            outputs = net(images)
            # The class with the highest score is the prediction.
            _, predicted = torch.max(outputs, 1)
            total += labels.size(0)
            correct += (predicted == labels).sum().item()
finally:
    net.train(was_training)

print('Accuracy of the network on the 10000 test images: %d %%' % (
    100 * correct / total))

Accuracy of the network on the 10000 test images: 79 %


In [None]:
# Per-class accuracy of `net` on the test loader.
# Prepare to count predictions for each class.
correct_pred = {classname: 0 for classname in classes}
total_pred = {classname: 0 for classname in classes}

# Evaluate in eval mode so mode-dependent layers such as dropout do not
# randomly perturb the predictions; restore the previous mode afterwards so
# other cells (e.g. the training loop) are unaffected.
was_training = net.training
net.eval()
try:
    # Again, no gradients needed.
    with torch.no_grad():
        for images, labels in testloader:
            outputs = net(images)
            _, predictions = torch.max(outputs, 1)
            # Convert to plain Python ints once per batch, so the class tuple
            # is indexed with ints rather than 0-dim tensors.
            for label, prediction in zip(labels.tolist(), predictions.tolist()):
                classname = classes[label]
                if label == prediction:
                    correct_pred[classname] += 1
                total_pred[classname] += 1
finally:
    net.train(was_training)


# Print accuracy for each class.
for classname, correct_count in correct_pred.items():
    accuracy = 100 * float(correct_count) / total_pred[classname]
    print("Accuracy for class {:5s} is: {:.1f} %".format(classname,
                                                   accuracy))

In [14]:
# Optional: uncomment the next line to save the fine-tuned weights (state_dict) to disk.
#torch.save(net.state_dict(), "./2.model.path")