# CIFAR-10 Challange - 김영인

1. wide resnet 50-2
2. \+ Data Augmentation(RandomResizedCrop, RandomHorizontalFlip)
3. \+ Data Normalize
5. \+ Optimizer(momentum, scheduler)


In [2]:
import random

import torch
import numpy as np
from matplotlib import pyplot as plt

import torch.nn as nn
import torch.nn.functional as F
import torch.optim as optim

from torch.utils.data import Dataset, DataLoader
from torchvision import transforms, models, datasets

random_seed = 4332
torch.manual_seed(random_seed)
torch.cuda.manual_seed(random_seed)
torch.cuda.manual_seed_all(random_seed) # if use multi-GPU
torch.backends.cudnn.deterministic = True
torch.backends.cudnn.benchmark = False
np.random.seed(random_seed)
random.seed(random_seed)

device0 = torch.device("cuda:0" if torch.cuda.is_available() else "cpu")
device1 = torch.device("cuda:1" if torch.cuda.is_available() else "cpu")

device = device0
print(f"device: {device}") if torch.cuda.is_available() else print("device: cpu")

device: cuda:0


## Hyper parameter Setting 

In [3]:
learning_rate = 0.1
scheduler_step = 30
scheduler_gamma = 0.2
training_epochs = 100
batch_size = 64
momentum = 0.9
dropout_rate = 0.3

## Load & Preprocess Data

In [4]:
transform_train = transforms.Compose(
    [transforms.RandomResizedCrop(224), # data augmentation, 224: image size, ImageNet pretrained model에 맞추기 위해서 224 size로 설정
     transforms.RandomHorizontalFlip(), # data augmentation, 좌우로 대칭
     transforms.ToTensor(), # numpy array를 pytorch tensor로 바꿔주는 역할
     transforms.Normalize((0.4914, 0.4822, 0.4465), (0.2023, 0.1994, 0.2010)) # dataset의 mean, std를 이용해서 -1~1 로 normalize
    ])

transform_test = transforms.Compose([
    transforms.RandomResizedCrop(224),
    transforms.ToTensor(),
    transforms.Normalize((0.4914, 0.4822, 0.4465), (0.2023, 0.1994, 0.2010)),
])

trainset = datasets.CIFAR10(root='./data', train=True,
                                      download=True, transform=transforms.ToTensor())
trainloader = DataLoader(trainset, batch_size=batch_size,
                                         shuffle=True, num_workers=2)

testset = datasets.CIFAR10(root='./data', train=False,
                                      download=True, transform=transforms.ToTensor())
testloader = DataLoader(testset, batch_size=4,
                                        shuffle=False, num_workers=2)

classes = ('plane', 'car', 'bird', 'cat', 'deer', 'dog', 'frog', 'horse', 'ship', 'truck')

Files already downloaded and verified
Files already downloaded and verified


## Load and Define pretrained model and fine-tuning

In [5]:
print(models.wide_resnet50_2(pretrained=True).fc)

Linear(in_features=2048, out_features=1000, bias=True)


In [6]:
class WideResNet(nn.Module):
    def __init__ (self):
        super(WideResNet, self).__init__()
        self.resnet = models.wide_resnet50_2(pretrained=True)
        num_ftrs = self.resnet.fc.in_features
        self.resnet.fc = nn.Linear(num_ftrs, 10)
        
    def forward(self, x):
        x = self.resnet(x)
        return x

## Load Model

In [7]:
net = WideResNet()
net = net.to(device)

criterion = nn.CrossEntropyLoss() 
optimizer = optim.SGD(net.parameters(), lr=learning_rate, momentum=momentum)
scheduler = optim.lr_scheduler.StepLR(optimizer, 
                                      step_size = scheduler_step,
                                      gamma = scheduler_gamma)

## Train

In [8]:
net.train()

for epoch in range(training_epochs):
    running_loss = 0.0
    for i, data in enumerate(trainloader, 0):
        inputs, labels = data
        inputs, labels = inputs.to(device), labels.to(device)
        
        optimizer.zero_grad()

        outputs = net(inputs) 
        loss =  criterion(outputs, labels)
        loss.backward()
        
        optimizer.step()
        
        running_loss += loss.item()
        if i % 100 == 99:
            print('[%d, %5d] loss: %.3f' % (epoch + 1, i + 1, running_loss / 100))
            running_loss = 0.0
        
print('Finished Training')

[1,   100] loss: 4.876
[1,   200] loss: 2.744
[1,   300] loss: 2.191
[1,   400] loss: 2.072
[1,   500] loss: 2.014
[1,   600] loss: 1.993
[1,   700] loss: 1.944
[2,   100] loss: 1.865
[2,   200] loss: 1.825
[2,   300] loss: 1.798
[2,   400] loss: 1.759
[2,   500] loss: 1.705
[2,   600] loss: 1.702
[2,   700] loss: 1.663
[3,   100] loss: 2.043
[3,   200] loss: 1.727
[3,   300] loss: 1.662
[3,   400] loss: 1.624
[3,   500] loss: 1.603
[3,   600] loss: 1.582
[3,   700] loss: 1.592
[4,   100] loss: 1.502
[4,   200] loss: 1.530
[4,   300] loss: 1.504
[4,   400] loss: 1.479
[4,   500] loss: 1.458
[4,   600] loss: 1.476
[4,   700] loss: 1.468
[5,   100] loss: 1.390
[5,   200] loss: 1.426
[5,   300] loss: 1.393
[5,   400] loss: 1.377
[5,   500] loss: 1.359
[5,   600] loss: 1.386
[5,   700] loss: 1.352
[6,   100] loss: 1.352
[6,   200] loss: 1.311
[6,   300] loss: 1.330
[6,   400] loss: 1.290
[6,   500] loss: 1.341
[6,   600] loss: 1.316
[6,   700] loss: 1.292
[7,   100] loss: 1.248
[7,   200] 

[50,   200] loss: 0.079
[50,   300] loss: 0.084
[50,   400] loss: 0.082
[50,   500] loss: 0.089
[50,   600] loss: 0.099
[50,   700] loss: 0.102
[51,   100] loss: 0.098
[51,   200] loss: 0.072
[51,   300] loss: 0.066
[51,   400] loss: 0.071
[51,   500] loss: 0.099
[51,   600] loss: 0.088
[51,   700] loss: 0.095
[52,   100] loss: 0.092
[52,   200] loss: 0.092
[52,   300] loss: 0.086
[52,   400] loss: 0.074
[52,   500] loss: 0.099
[52,   600] loss: 0.094
[52,   700] loss: 0.074
[53,   100] loss: 0.055
[53,   200] loss: 0.066
[53,   300] loss: 0.080
[53,   400] loss: 0.079
[53,   500] loss: 0.079
[53,   600] loss: 0.086
[53,   700] loss: 0.081
[54,   100] loss: 0.127
[54,   200] loss: 0.097
[54,   300] loss: 0.074
[54,   400] loss: 0.072
[54,   500] loss: 0.074
[54,   600] loss: 0.073
[54,   700] loss: 0.081
[55,   100] loss: 0.058
[55,   200] loss: 0.063
[55,   300] loss: 0.065
[55,   400] loss: 0.080
[55,   500] loss: 0.064
[55,   600] loss: 0.063
[55,   700] loss: 0.086
[56,   100] loss

[99,   100] loss: 0.008
[99,   200] loss: 0.012
[99,   300] loss: 0.012
[99,   400] loss: 0.012
[99,   500] loss: 0.022
[99,   600] loss: 0.016
[99,   700] loss: 0.009
[100,   100] loss: 0.020
[100,   200] loss: 0.012
[100,   300] loss: 0.018
[100,   400] loss: 0.017
[100,   500] loss: 0.015
[100,   600] loss: 0.023
[100,   700] loss: 0.029
Finished Training


## Test

In [9]:
class_correct = np.zeros(10)
class_total = np.zeros(10)

net.eval()

with torch.no_grad():
    for data in testloader:
        images, labels = data
        images = images.to(device)
        labels = labels.to(device)
        outputs = net(images)
        _, predicted = torch.max(outputs, 1)
        c = (predicted == labels).squeeze()
        for i in range(4):
            label = labels[i]
            class_correct[label] += c[i].item()
            class_total[label] += 1


for i in range(10):
    print('Accuracy of %5s : %2f %%' % (
        classes[i], 100 * class_correct[i] / class_total[i]))
print('Mean Accuracy : ', 100*np.sum(class_correct)/np.sum(class_total))

Accuracy of plane : 79.900000 %
Accuracy of   car : 89.500000 %
Accuracy of  bird : 75.400000 %
Accuracy of   cat : 56.500000 %
Accuracy of  deer : 71.900000 %
Accuracy of   dog : 59.800000 %
Accuracy of  frog : 80.100000 %
Accuracy of horse : 81.200000 %
Accuracy of  ship : 88.200000 %
Accuracy of truck : 71.900000 %
Mean Accuracy :  75.44
