# CIFAR-10 Challange - 김영인

1. wide resnet 50-2
2. \+ Data Augmentation(RandomResizedCrop, RandomHorizontalFlip)
3. \+ Data Normalize
4. \+ regularization(weight decay)
5. \+ Optimizer(momentum, scheduler)


In [1]:
import random

import torch
import numpy as np
from matplotlib import pyplot as plt

import torch.nn as nn
import torch.nn.functional as F
import torch.optim as optim

from torch.utils.data import Dataset, DataLoader
from torchvision import transforms, models, datasets

random_seed = 4332
torch.manual_seed(random_seed)
torch.cuda.manual_seed(random_seed)
torch.cuda.manual_seed_all(random_seed) # if use multi-GPU
torch.backends.cudnn.deterministic = True
torch.backends.cudnn.benchmark = False
np.random.seed(random_seed)
random.seed(random_seed)

device0 = torch.device("cuda:0" if torch.cuda.is_available() else "cpu")
device1 = torch.device("cuda:1" if torch.cuda.is_available() else "cpu")

device = device0
print(f"device: {device}") if torch.cuda.is_available() else print("device: cpu")

device: cuda:0


## Hyper parameter Setting 

In [2]:
learning_rate = 0.1
scheduler_step = 30
scheduler_gamma = 0.2
training_epochs = 100
batch_size = 64
momentum = 0.9
weight_decay = 5e-4
dropout_rate = 0.3

## Load & Preprocess Data

In [3]:
transform_train = transforms.Compose(
    [transforms.RandomResizedCrop(224), # data augmentation, 224: image size, ImageNet pretrained model에 맞추기 위해서 224 size로 설정
     transforms.RandomHorizontalFlip(), # data augmentation, 좌우로 대칭
     transforms.ToTensor(), # numpy array를 pytorch tensor로 바꿔주는 역할
     transforms.Normalize((0.4914, 0.4822, 0.4465), (0.2023, 0.1994, 0.2010)) # dataset의 mean, std를 이용해서 -1~1 로 normalize
    ])

transform_test = transforms.Compose([
    transforms.RandomResizedCrop(224),
    transforms.ToTensor(),
    transforms.Normalize((0.4914, 0.4822, 0.4465), (0.2023, 0.1994, 0.2010)),
])

trainset = datasets.CIFAR10(root='./data', train=True,
                                      download=True, transform=transforms.ToTensor())
trainloader = DataLoader(trainset, batch_size=batch_size,
                                         shuffle=True, num_workers=2)

testset = datasets.CIFAR10(root='./data', train=False,
                                      download=True, transform=transforms.ToTensor())
testloader = DataLoader(testset, batch_size=4,
                                        shuffle=False, num_workers=2)

classes = ('plane', 'car', 'bird', 'cat', 'deer', 'dog', 'frog', 'horse', 'ship', 'truck')

Files already downloaded and verified
Files already downloaded and verified


## Load and Define pretrained model and fine-tuning

In [4]:
print(models.wide_resnet50_2(pretrained=True).fc)

Linear(in_features=2048, out_features=1000, bias=True)


In [5]:
class WideResNet(nn.Module):
    def __init__ (self):
        super(WideResNet, self).__init__()
        self.resnet = models.wide_resnet50_2(pretrained=True)
        num_ftrs = self.resnet.fc.in_features
        self.resnet.fc = nn.Linear(num_ftrs, 10)
        
    def forward(self, x):
        x = self.resnet(x)
        return x

## Load Model

In [6]:
net = WideResNet()
net = net.to(device)

criterion = nn.CrossEntropyLoss() 
optimizer = optim.SGD(net.parameters(), lr=learning_rate, momentum=momentum, weight_decay=weight_decay)
scheduler = optim.lr_scheduler.StepLR(optimizer, 
                                      step_size = scheduler_step,
                                      gamma = scheduler_gamma)

## Train

In [7]:
net.train()

for epoch in range(training_epochs):
    running_loss = 0.0
    for i, data in enumerate(trainloader, 0):
        inputs, labels = data
        inputs, labels = inputs.to(device), labels.to(device)
        
        optimizer.zero_grad()

        outputs = net(inputs) 
        loss =  criterion(outputs, labels)
        loss.backward()
        
        optimizer.step()
        
        running_loss += loss.item()
        if i % 100 == 99:
            print('[%d, %5d] loss: %.3f' % (epoch + 1, i + 1, running_loss / 100))
            running_loss = 0.0
        
print('Finished Training')

[1,   100] loss: 5.464
[1,   200] loss: 2.750
[1,   300] loss: 2.271
[1,   400] loss: 2.183
[1,   500] loss: 2.108
[1,   600] loss: 2.056
[1,   700] loss: 2.004
[2,   100] loss: 1.896
[2,   200] loss: 1.890
[2,   300] loss: 1.845
[2,   400] loss: 1.841
[2,   500] loss: 1.798
[2,   600] loss: 1.814
[2,   700] loss: 1.902
[3,   100] loss: 1.789
[3,   200] loss: 1.730
[3,   300] loss: 1.694
[3,   400] loss: 1.660
[3,   500] loss: 1.638
[3,   600] loss: 1.607
[3,   700] loss: 1.601
[4,   100] loss: 1.535
[4,   200] loss: 1.532
[4,   300] loss: 1.510
[4,   400] loss: 1.486
[4,   500] loss: 1.455
[4,   600] loss: 1.469
[4,   700] loss: 1.447
[5,   100] loss: 1.388
[5,   200] loss: 1.400
[5,   300] loss: 1.396
[5,   400] loss: 1.362
[5,   500] loss: 1.345
[5,   600] loss: 1.389
[5,   700] loss: 1.321
[6,   100] loss: 1.325
[6,   200] loss: 1.283
[6,   300] loss: 1.289
[6,   400] loss: 1.263
[6,   500] loss: 1.287
[6,   600] loss: 1.268
[6,   700] loss: 1.245
[7,   100] loss: 1.213
[7,   200] 

[50,   200] loss: 0.771
[50,   300] loss: 0.728
[50,   400] loss: 0.752
[50,   500] loss: 0.774
[50,   600] loss: 0.780
[50,   700] loss: 0.759
[51,   100] loss: 0.726
[51,   200] loss: 0.738
[51,   300] loss: 0.770
[51,   400] loss: 0.748
[51,   500] loss: 0.747
[51,   600] loss: 0.774
[51,   700] loss: 0.778
[52,   100] loss: 0.745
[52,   200] loss: 0.745
[52,   300] loss: 0.772
[52,   400] loss: 0.775
[52,   500] loss: 0.740
[52,   600] loss: 0.744
[52,   700] loss: 0.751
[53,   100] loss: 0.722
[53,   200] loss: 0.731
[53,   300] loss: 0.745
[53,   400] loss: 0.742
[53,   500] loss: 0.774
[53,   600] loss: 0.773
[53,   700] loss: 0.773
[54,   100] loss: 0.753
[54,   200] loss: 0.749
[54,   300] loss: 0.732
[54,   400] loss: 0.739
[54,   500] loss: 0.755
[54,   600] loss: 0.781
[54,   700] loss: 0.765
[55,   100] loss: 0.709
[55,   200] loss: 0.739
[55,   300] loss: 0.764
[55,   400] loss: 0.772
[55,   500] loss: 0.767
[55,   600] loss: 0.778
[55,   700] loss: 0.766
[56,   100] loss

[99,   100] loss: 0.668
[99,   200] loss: 0.686
[99,   300] loss: 0.695
[99,   400] loss: 0.726
[99,   500] loss: 0.739
[99,   600] loss: 0.756
[99,   700] loss: 0.763
[100,   100] loss: 0.707
[100,   200] loss: 0.715
[100,   300] loss: 0.714
[100,   400] loss: 0.732
[100,   500] loss: 0.736
[100,   600] loss: 0.748
[100,   700] loss: 0.725
Finished Training


## Test

In [8]:
class_correct = np.zeros(10)
class_total = np.zeros(10)

net.eval()

with torch.no_grad():
    for data in testloader:
        images, labels = data
        images = images.to(device)
        labels = labels.to(device)
        outputs = net(images)
        _, predicted = torch.max(outputs, 1)
        c = (predicted == labels).squeeze()
        for i in range(4):
            label = labels[i]
            class_correct[label] += c[i].item()
            class_total[label] += 1


for i in range(10):
    print('Accuracy of %5s : %2f %%' % (
        classes[i], 100 * class_correct[i] / class_total[i]))
print('Mean Accuracy : ', 100*np.sum(class_correct)/np.sum(class_total))

Accuracy of plane : 94.500000 %
Accuracy of   car : 75.000000 %
Accuracy of  bird : 47.500000 %
Accuracy of   cat : 38.000000 %
Accuracy of  deer : 64.000000 %
Accuracy of   dog : 10.400000 %
Accuracy of  frog : 58.100000 %
Accuracy of horse : 75.300000 %
Accuracy of  ship : 45.600000 %
Accuracy of truck : 64.700000 %
Mean Accuracy :  57.31
