# CNN para classificação - CIFAR10

Como criar e treinar uma rede usando CNN em Pythorch.
Nesse script iremos usaro dataset CIFAR10.

In [1]:
# Import libraries
import torch
import numpy as np
import matplotlib.pyplot as plt
%matplotlib inline

# PyTorch dataset
from torchvision import datasets
import torchvision.transforms as transforms
from torch.utils.data.sampler import SubsetRandomSampler

# PyTorch model
import torch.nn as nn
import torch.nn.functional as F
import torch.optim as optim

In [2]:
device = 'cuda' if torch.cuda.is_available() else 'cpu'
device

'cuda'

## Dataset

In [3]:
batch_size = 32
valid_size = 0.2 # proporção da divisão do banco de treinamento em train e valid 

In [4]:
train_transform = transforms.Compose([
    transforms.RandomHorizontalFlip(),
    transforms.RandomRotation(30),
    transforms.RandomAutocontrast(0.1),
    transforms.ToTensor(),
    transforms.Normalize((0.5, 0.5, 0.5), (0.5, 0.5, 0.5))
    ])

test_transform = transforms.Compose([
    transforms.ToTensor(),
    transforms.Normalize((0.5, 0.5, 0.5), (0.5, 0.5, 0.5))
    ])

In [5]:
# Baixar os datasets
train_data = datasets.CIFAR10('data', train=True,
                              download=True, transform=train_transform)
test_data = datasets.CIFAR10('data', train=False,
                             download=True, transform=test_transform)

Files already downloaded and verified
Files already downloaded and verified


- Dividir o dataset de treinamento  em em treinamento e validação

In [6]:
num_train = len(train_data)
indices = list(range(num_train))
np.random.shuffle(indices)
split = int(np.floor(valid_size * num_train))
train_idx, valid_idx = indices[split:], indices[:split]

In [7]:
train_sampler = SubsetRandomSampler(train_idx)
valid_sampler = SubsetRandomSampler(valid_idx)

Loaders

In [8]:
train_loader = torch.utils.data.DataLoader(train_data, batch_size=batch_size,sampler=train_sampler)
valid_loader = torch.utils.data.DataLoader(train_data, batch_size=batch_size, sampler=valid_sampler)

test_loader = torch.utils.data.DataLoader(test_data, batch_size=batch_size)

In [9]:
classes = ['airplane', 'automobile', 'bird', 'cat', 'deer', 'dog', 'frog', 'horse', 'ship', 'truck']
classes

['airplane',
 'automobile',
 'bird',
 'cat',
 'deer',
 'dog',
 'frog',
 'horse',
 'ship',
 'truck']

## Definindo a arquitetura

In [10]:

class Net(nn.Module):
    def __init__(self):
        super(Net, self).__init__()
        self.conv1 = nn.Conv2d(3, 16, 3, padding=1)
        self.conv2 = nn.Conv2d(16, 32, 3, padding=1)
        
        self.max = nn.MaxPool2d(2, 2)
        
        self.dropout = nn.Dropout(0.2)
        self.relu = nn.ReLU()
        
        self.flatten = nn.Flatten()
        
        self.linear = nn.Linear( 8*8*32, 256)
        self.output = nn.Linear( 256, 10)

    def forward(self, x):
        # 32,32,3
        x = self.relu(self.conv1(x))  # 32,32,16
        x = self.max(x) # 16,16,3
        x = self.dropout(x)
        
        x = self.relu(self.conv2(x)) # 16,16,32
        x = self.max(x) # 8, 8, 32
        x = self.dropout(x)
        
        x = self.flatten(x)
        
        x = self.dropout(self.linear(x))
        x = self.output(x)     
        
        return x

- Criar a rede

In [11]:
model = Net()
model

Net(
  (conv1): Conv2d(3, 16, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1))
  (conv2): Conv2d(16, 32, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1))
  (max): MaxPool2d(kernel_size=2, stride=2, padding=0, dilation=1, ceil_mode=False)
  (dropout): Dropout(p=0.2, inplace=False)
  (relu): ReLU()
  (flatten): Flatten(start_dim=1, end_dim=-1)
  (linear): Linear(in_features=2048, out_features=256, bias=True)
  (output): Linear(in_features=256, out_features=10, bias=True)
)

In [12]:
model.to(device)

Net(
  (conv1): Conv2d(3, 16, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1))
  (conv2): Conv2d(16, 32, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1))
  (max): MaxPool2d(kernel_size=2, stride=2, padding=0, dilation=1, ceil_mode=False)
  (dropout): Dropout(p=0.2, inplace=False)
  (relu): ReLU()
  (flatten): Flatten(start_dim=1, end_dim=-1)
  (linear): Linear(in_features=2048, out_features=256, bias=True)
  (output): Linear(in_features=256, out_features=10, bias=True)
)

- função de perda e otimizador

In [13]:
criterion = nn.CrossEntropyLoss()

In [14]:
optimizer = optim.SGD(model.parameters(), 0.01)

## Treinamento

In [15]:
n_epochs = 30

valid_loss_min = np.Inf 

In [17]:
for epoch in range(1, n_epochs):

    # keep track of training and validation loss
    train_loss = 0.0
    valid_loss = 0.0
    
    ###################
    # train the model #
    ###################
    model.train()
    for data, target in train_loader:
        # move tensors to GPU if CUDA is available
        data = data.to(device)
        target = target.to(device)
        
        optimizer.zero_grad()
        
        #print('debug devices: ', 
        output = model(data)

        loss = criterion(output, target)
        loss.backward()
        optimizer.step()

        train_loss += loss.item()*data.size(0)
        
    ######################    
    # validate the model #
    ######################
    model.eval() # não usar os dados para treinamento e otimiza o calculo
    for data, target in valid_loader:
        # move tensors to GPU if CUDA is available
        data = data.to(device)
        target = target.to(device)

        output = model(data)
        loss = criterion(output, target)
        valid_loss += loss.item()*data.size(0)
    
    # calculate average losses
    train_loss = train_loss/len(train_loader.sampler)
    valid_loss = valid_loss/len(valid_loader.sampler)
        
    # print training/validation statistics 
    print('Epoch: {} \tTraining Loss: {:.6f} \tValidation Loss: {:.6f}'.format(
        epoch, train_loss, valid_loss))
    
    # save model if validation loss has decreased
    if valid_loss <= valid_loss_min:
        print('Validation loss decreased ({:.6f} --> {:.6f}).  Saving model ...'.format(
        valid_loss_min,
        valid_loss))
        torch.save(model.state_dict(), 'model_cifar.pt')
        valid_loss_min = valid_loss

Epoch: 1 	Training Loss: 2.023996 	Validation Loss: 1.843944
Validation loss decreased (inf --> 1.843944).  Saving model ...
Epoch: 2 	Training Loss: 1.726765 	Validation Loss: 1.595590
Validation loss decreased (1.843944 --> 1.595590).  Saving model ...
Epoch: 3 	Training Loss: 1.570242 	Validation Loss: 1.526904
Validation loss decreased (1.595590 --> 1.526904).  Saving model ...
Epoch: 4 	Training Loss: 1.493770 	Validation Loss: 1.449503
Validation loss decreased (1.526904 --> 1.449503).  Saving model ...
Epoch: 5 	Training Loss: 1.445041 	Validation Loss: 1.390101
Validation loss decreased (1.449503 --> 1.390101).  Saving model ...
Epoch: 6 	Training Loss: 1.406915 	Validation Loss: 1.385088
Validation loss decreased (1.390101 --> 1.385088).  Saving model ...
Epoch: 7 	Training Loss: 1.370771 	Validation Loss: 1.312195
Validation loss decreased (1.385088 --> 1.312195).  Saving model ...
Epoch: 8 	Training Loss: 1.340893 	Validation Loss: 1.305970
Validation loss decreased (1.31219

## Teste do resultado

- carregar o modelo

In [18]:
model.load_state_dict(torch.load('model_cifar.pt'))


<All keys matched successfully>

In [23]:

test_loss = 0.0
class_correct = list(0. for i in range(10))
class_total = list(0. for i in range(10))

model.eval()  # não mudar pesos e ser otimizado


for data, target in test_loader:
    
    data = data.to(device)
    target = target.to(device)
    
    output = model(data)
    loss = criterion(output, target)
    test_loss += loss.item()*data.size(0)
    
    # convert output probabilities to predicted class
    _, pred = torch.max(output, 1)    
    # compare predictions to true label
    correct_tensor = pred.eq(target.data.view_as(pred))
    
    correct = np.squeeze(correct_tensor.numpy()) if device=='cpu' else np.squeeze(correct_tensor.cpu().numpy())
    
    # calculate test accuracy for each object class
    for i in range(len(target)):
        label = target.data[i]
        class_correct[label] += correct[i].item()
        class_total[label] += 1

# average test loss
test_loss = test_loss/len(test_loader.dataset)
print('Test Loss: {:.6f}\n'.format(test_loss))

for i in range(10):
    if class_total[i] > 0:
        print('Test Accuracy of %5s: %2d%% (%2d/%2d)' % (
            classes[i], 100 * class_correct[i] / class_total[i],
            np.sum(class_correct[i]), np.sum(class_total[i])))
    else:
        print('Test Accuracy of %5s: N/A (no training examples)' % (classes[i]))

print('\nTest Accuracy (Overall): %2d%% (%2d/%2d)' % (
    100. * np.sum(class_correct) / np.sum(class_total),
    np.sum(class_correct), np.sum(class_total)))

Test Loss: 0.980434

Test Accuracy of airplane: 68% (684/1000)
Test Accuracy of automobile: 77% (779/1000)
Test Accuracy of  bird: 47% (479/1000)
Test Accuracy of   cat: 46% (469/1000)
Test Accuracy of  deer: 64% (648/1000)
Test Accuracy of   dog: 55% (556/1000)
Test Accuracy of  frog: 75% (751/1000)
Test Accuracy of horse: 70% (705/1000)
Test Accuracy of  ship: 82% (820/1000)
Test Accuracy of truck: 69% (692/1000)

Test Accuracy (Overall): 65% (6583/10000)
