In [1]:
import torch
import torch.nn as nn
import torch.nn.functional as F
import torchvision.transforms as transforms
import torchvision.datasets as datasets
import matplotlib.pyplot as plt
import numpy as np
import os
import time
import shutil
import torch.distributed as dist
import math
from PIL import Image
from tqdm import tqdm
from glob import glob
from sklearn.model_selection import train_test_split
from torch.utils.data import Dataset, DataLoader
from typing import Type, Any, Callable, Union, List, Optional
from torch import Tensor
from torch.hub import load_state_dict_from_url
from torch.utils.data.dataloader import default_collate
from torch.utils.data.sampler import BatchSampler
from collections.abc import Mapping, Sequence

os.environ["CUDA_DEVICE_ORDER"]="PCI_BUS_ID"   
os.environ["CUDA_VISIBLE_DEVICES"]="3"


In [2]:
train_path_path= f"{os.getcwd()}/data/split_train/train"
test_path_path= f"{os.getcwd()}/data/split_train/val"

In [3]:
batch_size=128
num_gpus=4
num_workers=8
lr=0.001

In [4]:
normalize = transforms.Normalize(mean=[0.507, 0.487, 0.441],
                                     std=[0.267, 0.256, 0.276])

In [5]:
dataset = datasets.ImageFolder(
        train_path_path,
        transforms.Compose([
        transforms.RandomRotation(degrees=45),
            
        transforms.RandomResizedCrop(96),
        transforms.ColorJitter(.3,.3,.3,.3),
        transforms.RandomHorizontalFlip(),
            transforms.RandomHorizontalFlip(),
            transforms.ToTensor(),
            normalize,
        ]))
for _ in range (19):
    aug_data = datasets.ImageFolder(
        train_path_path,
        transforms.Compose([
        transforms.RandomRotation(degrees=45),
            
        transforms.RandomResizedCrop(96),
        transforms.ColorJitter(.3,.3,.3,.3),
        transforms.RandomHorizontalFlip(),
            transforms.RandomHorizontalFlip(),
            transforms.ToTensor(),
            normalize,
        ]))
    dataset=torch.utils.data.ConcatDataset([dataset,aug_data])
valset = datasets.ImageFolder(
        test_path_path,
        transforms.Compose([
        transforms.RandomRotation(degrees=45),
            
        transforms.RandomResizedCrop(96),
        transforms.ColorJitter(.3,.3,.3,.3),
        transforms.RandomHorizontalFlip(),
            transforms.RandomHorizontalFlip(),
            transforms.ToTensor(),
            normalize,
        ]))
for _ in range (19):
    aug_data = datasets.ImageFolder(
        test_path_path,
        transforms.Compose([
        transforms.RandomRotation(degrees=45),
            
        transforms.RandomResizedCrop(96),
        transforms.ColorJitter(.3,.3,.3,.3),
        transforms.RandomHorizontalFlip(),
            transforms.RandomHorizontalFlip(),
            transforms.ToTensor(),
            normalize,
        ]))
    valset=torch.utils.data.ConcatDataset([valset,aug_data])

In [6]:
print(len(dataset))
print(len(valset))

80000
20000


In [7]:
train_loader = torch.utils.data.DataLoader(
        dataset, batch_size=batch_size, shuffle=True,
        num_workers=8, pin_memory=True,drop_last=True)

test_loader = torch.utils.data.DataLoader(
        valset, batch_size=batch_size, shuffle=True,
        num_workers=8, pin_memory=True,drop_last=True)

In [8]:
class Model(torch.nn.Module):
    def __init__(self):
        super(Model, self).__init__()
        self.layer_1 = nn.Conv2d(in_channels=3,out_channels=64,kernel_size=5,
                                 stride=2,padding=3)
        self.act_1 = nn.LeakyReLU(0.1)
        self.conv2_bn1 = nn.BatchNorm2d(64)
        self.max_1=nn.MaxPool2d(2,2)
        
        self.layer_2 = nn.Conv2d(in_channels=64,out_channels=128,kernel_size=4,
                                 stride=1,padding=2)
        self.act_2 = nn.LeakyReLU(0.1)
        self.conv2_bn2 = nn.BatchNorm2d(128)
        
        self.layer_3 = nn.Conv2d(in_channels=128,out_channels=128,kernel_size=4,
                                 stride=1,padding=2)
        self.act_3 = nn.LeakyReLU(0.1)
        self.conv2_bn3 = nn.BatchNorm2d(128)
        
        self.layer_4 = nn.Conv2d(in_channels=128,out_channels=128,kernel_size=1,
                                 stride=1)
        self.act_4 = nn.LeakyReLU(0.1)
        self.conv2_bn4 = nn.BatchNorm2d(128)
        
        self.max_1=nn.MaxPool2d(2,2)
        
        self.layer_5 = nn.Conv2d(in_channels=128,out_channels=256,kernel_size=3,
                                 stride=1,padding=2)
        self.act_5 = nn.LeakyReLU(0.1)
        self.conv2_bn5 = nn.BatchNorm2d(256)
        
        self.layer_6 = nn.Conv2d(in_channels=256,out_channels=256,kernel_size=3,
                                 stride=1,padding=2)
        self.act_6 = nn.LeakyReLU(0.1)
        self.conv2_bn6 = nn.BatchNorm2d(256)
        
        self.layer_7 = nn.Conv2d(in_channels=256,out_channels=256,kernel_size=1,
                                 stride=1)
        self.act_7 = nn.LeakyReLU(0.1)
        self.conv2_bn7 = nn.BatchNorm2d(256)
        
        self.max_2=nn.MaxPool2d(2,2)
        
        self.layer_8 = nn.Conv2d(in_channels=256,out_channels=512,kernel_size=2,
                                 stride=1,padding=2)
        self.act_8 = nn.LeakyReLU(0.1)
        self.conv2_bn8 = nn.BatchNorm2d(512)
        
        
        self.avgpool = nn.AdaptiveAvgPool2d((1, 1))
        
        self.fc_layer_1 = nn.Linear(512,10)
        self.act_9 = nn.LeakyReLU(0.1)
        
        for m in self.modules():
            if isinstance(m, nn.Conv2d):
                nn.init.kaiming_normal_(m.weight, mode='fan_out', nonlinearity='relu')
        
        

    def forward(self, x):
        out = self.layer_1(x)
        out = self.act_1(out)
        for module in list(self.modules())[2:-2]:
            out = module(out)
        out = torch.flatten(out,1)
        for module in list(self.modules())[-2:]:
            out = module(out)
        return out

In [9]:
model = Model()
model = model.cuda()
criterion = nn.CrossEntropyLoss().cuda()

In [10]:
# for name, param in model.named_parameters():
#     if param.requires_grad:
#         print (name, param.data)

In [11]:
from torchsummary import summary
summary(model,(3,96,96))

----------------------------------------------------------------
        Layer (type)               Output Shape         Param #
            Conv2d-1           [-1, 64, 49, 49]           4,864
         LeakyReLU-2           [-1, 64, 49, 49]               0
         LeakyReLU-3           [-1, 64, 49, 49]               0
       BatchNorm2d-4           [-1, 64, 49, 49]             128
         MaxPool2d-5           [-1, 64, 24, 24]               0
            Conv2d-6          [-1, 128, 25, 25]         131,200
         LeakyReLU-7          [-1, 128, 25, 25]               0
       BatchNorm2d-8          [-1, 128, 25, 25]             256
            Conv2d-9          [-1, 128, 26, 26]         262,272
        LeakyReLU-10          [-1, 128, 26, 26]               0
      BatchNorm2d-11          [-1, 128, 26, 26]             256
           Conv2d-12          [-1, 128, 26, 26]          16,512
        LeakyReLU-13          [-1, 128, 26, 26]               0
      BatchNorm2d-14          [-1, 128,

In [12]:
optimizer = torch.optim.Adam(model.parameters(), lr=lr, weight_decay=1e-4)
scheduler = torch.optim.lr_scheduler.StepLR(optimizer, step_size=50)

In [13]:
%cd /home/jupyter-deeplearning/res_model

/home/jupyter-deeplearning/res_model


In [None]:
trn_loss_list = []
val_loss_list = []
val_acc_list = []
total_epoch=500
model_char="2.0"
model_name=""
patience=10
start_early_stop_check=0
saving_start_epoch=10

for epoch in range(total_epoch):
    trn_loss = 0.0
    for i, data in enumerate(train_loader, 0):
        inputs, labels = data
        if torch.cuda.is_available():
            inputs=inputs.cuda()
            labels=labels.cuda()
        # grad init
        optimizer.zero_grad()
        # forward propagation
        output= model(inputs)
        # calculate loss
        loss=criterion(output, labels)
        # back propagation 
        loss.backward()
        # weight update
        optimizer.step()
        
        # trn_loss summary
        trn_loss += loss.item()
        # del (memory issue)
        del loss
        del output
    with torch.no_grad():
        val_loss = 0.0
        cor_match = 0
        for j, val in enumerate(test_loader):
            val_x, val_label = val
            if torch.cuda.is_available():
                val_x = val_x.cuda()
                val_label =val_label.cuda()
            val_output = model(val_x)
            v_loss = criterion(val_output, val_label)
            val_loss += v_loss
            _, predicted=torch.max(val_output,1)
            cor_match+=np.count_nonzero(predicted.cpu().detach()==val_label.cpu().detach())
    del val_output
    del v_loss
    del predicted
    
    scheduler.step()
    
    
    
    trn_loss_list.append(trn_loss/len(train_loader))
    val_loss_list.append(val_loss/len(test_loader))
    val_acc=cor_match/(len(test_loader)*batch_size)
    val_acc_list.append(val_acc)
    now = time.localtime()
    print ("%04d/%02d/%02d %02d:%02d:%02d" % (now.tm_year, now.tm_mon, now.tm_mday, now.tm_hour, now.tm_min, now.tm_sec))

    print("epoch: {}/{} | trn loss: {:.4f} | val loss: {:.4f} | val accuracy: {:.4f}% \n".format(
                epoch+1, total_epoch, trn_loss / len(train_loader), val_loss / len(test_loader), val_acc*100
            ))
    
    
    if epoch+1>2:
        if val_loss_list[-1]>val_loss_list[-2]:
            start_early_stop_check=1
    else:
        val_loss_min=val_loss_list[-1]
        
    if start_early_stop_check:
        early_stop_temp=val_loss_list[-patience:]
        if all(early_stop_temp[i]<early_stop_temp[i+1] for i in range (len(early_stop_temp)-1)):
            print("Early stop!")
            break
            
    if epoch+1>saving_start_epoch:
        if val_loss_list[-1]<val_loss_min:
            if os.path.isfile(model_name):
                os.remove(model_name)
            val_loss_min=val_loss_list[-1]
            model_name="Custom_model_"+model_char+"_{:.3f}".format(val_loss_min)
            torch.save(model, model_name)
            print("Model replaced and saved as ",model_name)

2020/11/10 03:55:13
epoch: 1/500 | trn loss: 1.8327 | val loss: 1.6520 | val accuracy: 39.7536% 

2020/11/10 03:56:21
epoch: 2/500 | trn loss: 1.5610 | val loss: 1.4856 | val accuracy: 46.1939% 

2020/11/10 03:57:30
epoch: 3/500 | trn loss: 1.4185 | val loss: 1.4234 | val accuracy: 48.8782% 

2020/11/10 03:58:40
epoch: 4/500 | trn loss: 1.3165 | val loss: 1.3355 | val accuracy: 52.2636% 

2020/11/10 03:59:49
epoch: 5/500 | trn loss: 1.2081 | val loss: 1.2359 | val accuracy: 55.5088% 

2020/11/10 04:00:58
epoch: 6/500 | trn loss: 1.1201 | val loss: 1.2536 | val accuracy: 56.1599% 

2020/11/10 04:02:07
epoch: 7/500 | trn loss: 1.0436 | val loss: 1.1960 | val accuracy: 58.0429% 

2020/11/10 04:03:18
epoch: 8/500 | trn loss: 0.9770 | val loss: 1.1775 | val accuracy: 58.9243% 

2020/11/10 04:04:25
epoch: 9/500 | trn loss: 0.9250 | val loss: 1.1690 | val accuracy: 59.1046% 

2020/11/10 04:05:36
epoch: 10/500 | trn loss: 0.8675 | val loss: 1.1541 | val accuracy: 60.2865% 

2020/11/10 04:06:49

2020/11/10 05:28:57
epoch: 81/500 | trn loss: 0.2079 | val loss: 1.0793 | val accuracy: 68.9503% 

2020/11/10 05:30:07
epoch: 82/500 | trn loss: 0.2066 | val loss: 1.0631 | val accuracy: 69.1306% 

2020/11/10 05:31:16
epoch: 83/500 | trn loss: 0.2061 | val loss: 1.0672 | val accuracy: 68.9153% 

2020/11/10 05:32:27
epoch: 84/500 | trn loss: 0.2018 | val loss: 1.0759 | val accuracy: 69.2808% 

2020/11/10 05:33:37
epoch: 85/500 | trn loss: 0.1982 | val loss: 1.0745 | val accuracy: 68.7750% 

2020/11/10 05:34:48
epoch: 86/500 | trn loss: 0.2018 | val loss: 1.0789 | val accuracy: 68.7600% 

2020/11/10 05:35:56
epoch: 87/500 | trn loss: 0.2016 | val loss: 1.0859 | val accuracy: 68.6749% 

2020/11/10 05:37:03
epoch: 88/500 | trn loss: 0.1998 | val loss: 1.1091 | val accuracy: 68.2592% 

2020/11/10 05:38:13
epoch: 89/500 | trn loss: 0.1961 | val loss: 1.0965 | val accuracy: 67.9688% 

2020/11/10 05:39:22
epoch: 90/500 | trn loss: 0.1992 | val loss: 1.0692 | val accuracy: 68.9453% 

2020/11/10

2020/11/10 07:06:45
epoch: 164/500 | trn loss: 0.1607 | val loss: 1.0798 | val accuracy: 69.5513% 

2020/11/10 07:07:49
epoch: 165/500 | trn loss: 0.1610 | val loss: 1.0558 | val accuracy: 70.1072% 

2020/11/10 07:08:51
epoch: 166/500 | trn loss: 0.1591 | val loss: 1.0649 | val accuracy: 69.4762% 

2020/11/10 07:09:55
epoch: 167/500 | trn loss: 0.1598 | val loss: 1.0746 | val accuracy: 69.3159% 

2020/11/10 07:10:59
epoch: 168/500 | trn loss: 0.1604 | val loss: 1.0753 | val accuracy: 69.5162% 

2020/11/10 07:12:03
epoch: 169/500 | trn loss: 0.1571 | val loss: 1.0675 | val accuracy: 69.7266% 

2020/11/10 07:13:07
epoch: 170/500 | trn loss: 0.1601 | val loss: 1.0761 | val accuracy: 69.6314% 

2020/11/10 07:14:11
epoch: 171/500 | trn loss: 0.1600 | val loss: 1.0708 | val accuracy: 69.2358% 

2020/11/10 07:15:14
epoch: 172/500 | trn loss: 0.1582 | val loss: 1.0789 | val accuracy: 69.4862% 

2020/11/10 07:16:18
epoch: 173/500 | trn loss: 0.1584 | val loss: 1.0727 | val accuracy: 69.5312% 



2020/11/10 08:34:43
epoch: 246/500 | trn loss: 0.1552 | val loss: 1.0608 | val accuracy: 69.9569% 

2020/11/10 08:35:48
epoch: 247/500 | trn loss: 0.1600 | val loss: 1.0714 | val accuracy: 69.2558% 

2020/11/10 08:36:53
epoch: 248/500 | trn loss: 0.1551 | val loss: 1.0656 | val accuracy: 69.3910% 

2020/11/10 08:37:58
epoch: 249/500 | trn loss: 0.1562 | val loss: 1.0498 | val accuracy: 69.8117% 

2020/11/10 08:39:03
epoch: 250/500 | trn loss: 0.1567 | val loss: 1.0634 | val accuracy: 69.4361% 

2020/11/10 08:40:08
epoch: 251/500 | trn loss: 0.1584 | val loss: 1.0492 | val accuracy: 70.1773% 

2020/11/10 08:41:13
epoch: 252/500 | trn loss: 0.1564 | val loss: 1.0665 | val accuracy: 69.4862% 

2020/11/10 08:42:18
epoch: 253/500 | trn loss: 0.1609 | val loss: 1.0688 | val accuracy: 69.3109% 

2020/11/10 08:43:23
epoch: 254/500 | trn loss: 0.1572 | val loss: 1.0588 | val accuracy: 69.6965% 

2020/11/10 08:44:28
epoch: 255/500 | trn loss: 0.1569 | val loss: 1.0831 | val accuracy: 69.2758% 



2020/11/10 10:03:06
epoch: 328/500 | trn loss: 0.1591 | val loss: 1.0528 | val accuracy: 70.0070% 

2020/11/10 10:04:12
epoch: 329/500 | trn loss: 0.1559 | val loss: 1.0682 | val accuracy: 69.3309% 

2020/11/10 10:05:18
epoch: 330/500 | trn loss: 0.1564 | val loss: 1.0717 | val accuracy: 69.4511% 

2020/11/10 10:06:25
epoch: 331/500 | trn loss: 0.1593 | val loss: 1.0813 | val accuracy: 69.4261% 

2020/11/10 10:07:30
epoch: 332/500 | trn loss: 0.1589 | val loss: 1.0657 | val accuracy: 70.0120% 

2020/11/10 10:08:36
epoch: 333/500 | trn loss: 0.1558 | val loss: 1.0641 | val accuracy: 69.7867% 

2020/11/10 10:09:40
epoch: 334/500 | trn loss: 0.1572 | val loss: 1.0760 | val accuracy: 69.6514% 

2020/11/10 10:10:45
epoch: 335/500 | trn loss: 0.1591 | val loss: 1.0526 | val accuracy: 69.6965% 

2020/11/10 10:11:52
epoch: 336/500 | trn loss: 0.1604 | val loss: 1.0767 | val accuracy: 69.0355% 

2020/11/10 10:12:56
epoch: 337/500 | trn loss: 0.1597 | val loss: 1.0614 | val accuracy: 69.9720% 



2020/11/10 11:24:40
epoch: 410/500 | trn loss: 0.1556 | val loss: 1.0632 | val accuracy: 69.8117% 

2020/11/10 11:25:38
epoch: 411/500 | trn loss: 0.1581 | val loss: 1.0668 | val accuracy: 69.7065% 

2020/11/10 11:26:37
epoch: 412/500 | trn loss: 0.1545 | val loss: 1.0582 | val accuracy: 69.5913% 

2020/11/10 11:27:35
epoch: 413/500 | trn loss: 0.1563 | val loss: 1.0588 | val accuracy: 69.8117% 

2020/11/10 11:28:33
epoch: 414/500 | trn loss: 0.1578 | val loss: 1.0831 | val accuracy: 69.2258% 

2020/11/10 11:29:32
epoch: 415/500 | trn loss: 0.1562 | val loss: 1.0656 | val accuracy: 69.5012% 

2020/11/10 11:30:31
epoch: 416/500 | trn loss: 0.1583 | val loss: 1.0453 | val accuracy: 70.0321% 

2020/11/10 11:31:30
epoch: 417/500 | trn loss: 0.1584 | val loss: 1.0748 | val accuracy: 69.5312% 

2020/11/10 11:32:28
epoch: 418/500 | trn loss: 0.1596 | val loss: 1.0601 | val accuracy: 70.0070% 

2020/11/10 11:33:27
epoch: 419/500 | trn loss: 0.1557 | val loss: 1.0612 | val accuracy: 69.6264% 



In [None]:
plt.figure(figsize=(15,15))
plt.ylabel("val_accuracy")
plt.xlabel("epoch")
plt.plot(val_acc_list)
plt.grid()

In [None]:
val_acc_list=np.array(val_acc_list)
np.savetxt("ver_2.0.txt", val_acc_list, delimiter=',')

### Evaluation

In [None]:
import torch
import pandas as pd
import argparse
import time
import torchvision
import torchvision.transforms as transforms
from torch.utils.data import Dataset, DataLoader

In [None]:
model.eval()

In [None]:
%cd /home/jupyter-deeplearning/Organize

In [None]:
normalize = transforms.Normalize(mean=[0.507, 0.487, 0.441],
                                     std=[0.267, 0.256, 0.276])
test_transform = transforms.Compose([
        transforms.ToTensor(),
        normalize
    ])

In [None]:
test_dataset = torchvision.datasets.ImageFolder('./data/test', transform=test_transform)

In [None]:
test_loader = DataLoader(test_dataset, batch_size=batch_size, num_workers=4, shuffle=False)

In [None]:
Category = []
for input, _ in test_loader:
    input = input.cuda()
    output = model(input)
    output = torch.argmax(output, dim=1)
    Category = Category + output.tolist()

In [None]:
Id = list(range(0, 8000))
samples = {
   'Id': Id,
   'Category': Category 
}
df = pd.DataFrame(samples, columns=['Id', 'Category'])

df.to_csv('submission_2.0_2.csv', index=False)
print('Done!!')