# [모의 캐글-의료] 흉부 CT 코로나 감염 여부 분류
- 이미지 binary 분류 과제
- 담당: 이녕민M

## Import Libraries

In [None]:
# !apt-get update && apt-get install -y python3-opencv

In [519]:
# !pip install sklearn
# ! pip install mxnet
# !pip install albumentations

In [134]:
import os, torch, copy, cv2, sys, random
# from datetime import datetime, timezone, timedelta
from PIL import Image
import numpy as np
import pandas as pd
from tqdm import tqdm
import torch
import torch.nn as nn
import torch.optim as optim
from torch.utils.data import DataLoader, Dataset,TensorDataset,random_split,SubsetRandomSampler, ConcatDataset
import torchvision.transforms as transforms
import matplotlib.pyplot as plt
import torchvision.utils
from sklearn.model_selection import KFold


import mxnet as mx
import random
import albumentations
from albumentations.pytorch import ToTensorV2

## Set Arguments & hyperparameters

In [135]:
# 시드(seed) 설정

RANDOM_SEED = 2022

torch.manual_seed(RANDOM_SEED)
torch.backends.cudnn.deterministic = True
torch.backends.cudnn.benchmark = False
np.random.seed(RANDOM_SEED)
random.seed(RANDOM_SEED)

In [136]:
# parameters

### 데이터 디렉토리 설정 ###
DATA_DIR= 'data'
NUM_CLS = 2

EPOCHS = 30
BATCH_SIZE = 32
LEARNING_RATE = 0.005
EARLY_STOPPING_PATIENCE = 15
INPUT_SHAPE = 512 # 크게하는게 좋다고 함

k = 5

os.environ["CUDA_VISIBLE_DEVICES"]="0"
DEVICE = torch.device('cuda' if torch.cuda.is_available() else 'cpu')

## Dataloader

#### Train & Validation Set loader

In [158]:
class CustomDataset(Dataset):
    def __init__(self, data_dir, mode, input_shape):
        self.data_dir = data_dir
        self.mode = mode
        self.input_shape = input_shape
        
        # Loading dataset
        self.db = self.data_loader()
        
        # Dataset split
        if self.mode == 'train':
            self.db = self.db[:int(len(self.db) * 0.8)]
        elif self.mode == 'val':
            self.db = self.db[int(len(self.db) * 0.8):]
            self.db.reset_index(inplace=True)
        else:
            print(f'!!! Invalid split {self.mode}... !!!')
            
        # Transform function
        # self.transform = transforms.Compose([transforms.Resize(self.input_shape),
        #                                      transforms.RandomHorizontalFlip(p=0.5),
        #                                      transforms.ToTensor(),
        #                                      transforms.Normalize([0.485, 0.456, 0.406], [0.229, 0.224, 0.225])])
        self.transform = albumentations.Compose([albumentations.Resize(512, 512), 
                                                 albumentations.RandomCrop(500, 500),
                                                 albumentations.HorizontalFlip(), # Same with transforms.RandomHorizontalFlip()
                                                 albumentations.VerticalFlip(),
                                                albumentations.Normalize([0.485, 0.456, 0.406], [0.229, 0.224, 0.225]),
                                                albumentations.pytorch.transforms.ToTensorV2()])
        
        
    def data_loader(self):
        print('Loading ' + self.mode + ' dataset..')
        if not os.path.isdir(self.data_dir):
            print(f'!!! Cannot find {self.data_dir}... !!!')
            sys.exit()
        
        # (COVID : 1, No : 0)
        db = pd.read_csv(os.path.join(self.data_dir, 'train.csv'))
        
        return db

    def __len__(self):
        return len(self.db)

    def __getitem__(self, index):
        data = copy.deepcopy(self.db.loc[index])

        # Loading image
        cvimg = cv2.imread(os.path.join(self.data_dir,'train',data['file_name']), cv2.IMREAD_COLOR | cv2.IMREAD_IGNORE_ORIENTATION)
        if not isinstance(cvimg, np.ndarray):
            raise IOError("Fail to read %s" % data['file_name'])

        # Preprocessing images
        image = cv2.cvtColor(cvimg, cv2.COLOR_BGR2RGB)
        trans_image = self.transform(image = image)
        trans_image = trans_image['image']
        
        
        # trans_image = self.transform(Image.fromarray(cvimg))
        

        return trans_image, data['COVID']


In [7]:
#이미지를 구현, hide-and-seek구현 함수(사용x)
def imshow(inp, title=None):
    """Imshow for Tensor."""
    inp = inp.numpy().transpose((1, 2, 0))
    mean = np.array([0.485, 0.456, 0.406])
    std = np.array([0.229, 0.224, 0.225])
    inp = std * inp + mean
    inp = np.clip(inp, 0, 1)
    plt.imshow(inp)
    if title is not None:
        plt.title(title)
    plt.pause(0.001)  # 갱신이 될 때까지 잠시 기다립니다.

def hide_patch(img):
    # get width and height of the image
    s = img.shape
    wd = s[0]
    ht = s[1]

    # possible grid size, 0 means no hiding
    # grid_sizes=[0,16,32,44,56]
    grid_sizes=[0,16,32,44,56]

    # hiding probability
    hide_prob = 0.5
 
    # randomly choose one grid size
    grid_size= grid_sizes[random.randint(0,len(grid_sizes)-1)]
    # print(grid_size)
    # hide the patches
    # if(grid_size<>0):
    if(grid_size!=0):
         for x in range(0,wd,grid_size):
             for y in range(0,ht,grid_size):
                 x_end = min(wd, x+grid_size)  
                 y_end = min(ht, y+grid_size)
                 if(random.random() <=  hide_prob):
                       img[x:x_end,y:y_end,:]=0

    return img


## Model

In [138]:
import torch.nn.functional as F

class custom_CNN(nn.Module):
    def __init__(self, num_classes):
        super(custom_CNN, self).__init__()
        self.conv1 = nn.Conv2d(in_channels=3, out_channels=8, kernel_size=5)
        self.pool = nn.MaxPool2d(kernel_size=2)
        self.conv2 = nn.Conv2d(in_channels=8, out_channels=25, kernel_size=5)
        
        self.fc1 = nn.Linear(in_features=25*29*29, out_features=128)
        self.fc2 = nn.Linear(in_features=128, out_features=num_classes)
        self.softmax = nn.Softmax(dim=1)
        
    def forward(self, x):
        x = self.pool(F.relu(self.conv1(x))) # (32, 3, 128, 128) -> (32, 8, 62, 62)
        x = self.pool(F.relu(self.conv2(x))) # (32, 8, 62, 62) -> (32, 25, 29, 29)
        
        x = torch.flatten(x,1)
        x = F.relu(self.fc1(x))
        x = F.relu(self.fc2(x))
        
        output = self.softmax(x)
        
        return output

In [159]:
import torchvision.models as models

class resnet(nn.Module):
    def __init__(self, numclasses):
        super(resnet, self).__init__()
        self.model = models.resnet34(pretrained=False)
        self.model.fc = nn.Linear(self.model.fc.in_features, numclasses)
        self.softmax = nn.Softmax(dim=1)
        
    def forward(self, input_img):
        x = self.model(input_img)
        x = self.softmax(x)
        return x

## Utils
### EarlyStopper

In [140]:
class LossEarlyStopper():
    """Early stopper
    
    Attributes:
        patience (int): loss가 줄어들지 않아도 학습할 epoch 수
        patience_counter (int): loss 가 줄어들지 않을 때 마다 1씩 증가, 감소 시 0으로 리셋
        min_loss (float): 최소 loss
        stop (bool): True 일 때 학습 중단

    """

    def __init__(self, patience: int)-> None:
        self.patience = patience

        self.patience_counter = 0
        self.min_loss = np.Inf
        self.stop = False
        self.save_model = False

    def check_early_stopping(self, loss: float)-> None:
        """Early stopping 여부 판단"""  

        if self.min_loss == np.Inf:
            self.min_loss = loss
            return None

        elif loss > self.min_loss:
            self.patience_counter += 1
            msg = f"Early stopping counter {self.patience_counter}/{self.patience}"

            if self.patience_counter == self.patience:
                self.stop = True
                
        elif loss <= self.min_loss:
            self.patience_counter = 0
            self.save_model = True
            msg = f"Validation loss decreased {self.min_loss} -> {loss}"
            self.min_loss = loss
        
        print(msg)

### Trainer

In [141]:
class Trainer():
    """ epoch에 대한 학습 및 검증 절차 정의"""
    
    def __init__(self, loss_fn, model, device, metric_fn, optimizer=None, scheduler=None):
        """ 초기화
        """
        self.loss_fn = loss_fn
        self.model = model
        self.device = device
        self.optimizer = optimizer
        self.scheduler = scheduler
        self.metric_fn = metric_fn

    def train_epoch(self, dataloader, epoch_index):
        """ 한 epoch에서 수행되는 학습 절차"""
        
        self.model.train()
        train_total_loss = 0
        target_lst = []
        pred_lst = []
        prob_lst = []

        for batch_index, (img, label) in enumerate(dataloader):
            img = img.to(self.device)
            label = label.to(self.device).float()
            
            pred = self.model(img)
            
            loss = self.loss_fn(pred[:,1], label)
            self.optimizer.zero_grad()
            loss.backward()
            self.optimizer.step()
            self.scheduler.step()
            
            train_total_loss += loss.item()
            prob_lst.extend(pred[:, 1].cpu().tolist())
            target_lst.extend(label.cpu().tolist())
            pred_lst.extend(pred.argmax(dim=1).cpu().tolist())
        self.train_mean_loss = train_total_loss / batch_index
        self.train_score, f1 = self.metric_fn(y_pred=pred_lst, y_answer=target_lst)
        msg = f'Epoch {epoch_index}, Train loss: {self.train_mean_loss}, Acc: {self.train_score}, F1-Macro: {f1}'
        print(msg)

    def validate_epoch(self, dataloader, epoch_index):
        """ 한 epoch에서 수행되는 검증 절차
        """
        self.model.eval()
        val_total_loss = 0
        target_lst = []
        pred_lst = []
        prob_lst = []

        for batch_index, (img, label) in enumerate(dataloader):
            img = img.to(self.device)
            label = label.to(self.device).float()
            pred = self.model(img)
            
            loss = self.loss_fn(pred[:,1], label)
            val_total_loss += loss.item()
            prob_lst.extend(pred[:, 1].cpu().tolist())
            target_lst.extend(label.cpu().tolist())
            pred_lst.extend(pred.argmax(dim=1).cpu().tolist())
        self.val_mean_loss = val_total_loss / batch_index
        self.validation_score, f1 = self.metric_fn(y_pred=pred_lst, y_answer=target_lst)
        msg = f'Epoch {epoch_index}, Val loss: {self.val_mean_loss}, Acc: {self.validation_score}, F1-Macro: {f1}'
        print(msg)

### Metrics

In [142]:
from sklearn.metrics import accuracy_score, f1_score

def get_metric_fn(y_pred, y_answer):
    """ 성능을 반환하는 함수"""
    
    assert len(y_pred) == len(y_answer), 'The size of prediction and answer are not same.'
    accuracy = accuracy_score(y_answer, y_pred)
    f1 = f1_score(y_answer, y_pred, average='macro')
    return accuracy, f1

## Train
### 학습을 위한 객체 선언

#### Load Dataset & Dataloader

In [492]:
# Load dataset & dataloader
train_dataset = CustomDataset(data_dir=DATA_DIR, mode='train', input_shape=INPUT_SHAPE)
validation_dataset = CustomDataset(data_dir=DATA_DIR, mode='val', input_shape=INPUT_SHAPE)
train_dataloader = DataLoader(train_dataset, batch_size=BATCH_SIZE, shuffle=True)
validation_dataloader = DataLoader(validation_dataset, batch_size=BATCH_SIZE, shuffle=True)
print('Train set samples:',len(train_dataset),  'Val set samples:', len(validation_dataset))

Loading train dataset..
Loading val dataset..
Train set samples: 581 Val set samples: 65


In [160]:
# Load dataset & dataloader (ab)
train_dataset = CustomDataset(data_dir=DATA_DIR, mode='train', input_shape=INPUT_SHAPE)
validation_dataset = CustomDataset(data_dir=DATA_DIR, mode='val', input_shape=INPUT_SHAPE)

dataset = ConcatDataset([train_dataset, validation_dataset])
splits=KFold(n_splits=k,shuffle=True, random_state=42)

train_dataloader = DataLoader(train_dataset, batch_size=BATCH_SIZE, shuffle=True)
validation_dataloader = DataLoader(validation_dataset, batch_size=BATCH_SIZE, shuffle=True)
print('Train set samples:',len(train_dataset),  'Val set samples:', len(validation_dataset))

Loading train dataset..
Loading val dataset..
Train set samples: 516 Val set samples: 130


#### Load model and other utils

In [161]:
# Load Model
# model = custom_CNN(NUM_CLS).to(DEVICE)
model = resnet(NUM_CLS).to(DEVICE)

# # Save Initial Model
# torch.save(model.state_dict(), 'initial.pt')

# Set optimizer, scheduler, loss function, metric function
optimizer = optim.Adam(model.parameters(), lr=LEARNING_RATE)
scheduler =  optim.lr_scheduler.OneCycleLR(optimizer=optimizer, pct_start=0.1, div_factor=1e5, max_lr=0.0001, epochs=EPOCHS, steps_per_epoch=len(train_dataloader))
loss_fn = nn.BCELoss()
metric_fn = get_metric_fn


# Set trainer
trainer = Trainer(loss_fn, model, DEVICE, metric_fn, optimizer, scheduler)

# Set earlystopper
early_stopper = LossEarlyStopper(patience=EARLY_STOPPING_PATIENCE)

In [147]:
model

resnet(
  (model): ResNet(
    (conv1): Conv2d(3, 64, kernel_size=(7, 7), stride=(2, 2), padding=(3, 3), bias=False)
    (bn1): BatchNorm2d(64, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
    (relu): ReLU(inplace=True)
    (maxpool): MaxPool2d(kernel_size=3, stride=2, padding=1, dilation=1, ceil_mode=False)
    (layer1): Sequential(
      (0): BasicBlock(
        (conv1): Conv2d(64, 64, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1), bias=False)
        (bn1): BatchNorm2d(64, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
        (relu): ReLU(inplace=True)
        (conv2): Conv2d(64, 64, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1), bias=False)
        (bn2): BatchNorm2d(64, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
      )
      (1): BasicBlock(
        (conv1): Conv2d(64, 64, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1), bias=False)
        (bn1): BatchNorm2d(64, eps=1e-05, momentum=0.1, affine=True, track_runnin

### epoch 단위 학습 진행

In [67]:
for epoch_index in tqdm(range(EPOCHS)):

    trainer.train_epoch(train_dataloader, epoch_index)
    trainer.validate_epoch(validation_dataloader, epoch_index)

    # early_stopping check
    early_stopper.check_early_stopping(loss=trainer.val_mean_loss)

    if early_stopper.stop:
        print('Early stopped')
        break

    if early_stopper.save_model:
        check_point = {
            'model': model.state_dict(),
            'optimizer': optimizer.state_dict(),
            'scheduler': scheduler.state_dict()
        }
        torch.save(check_point, 'best.pt')


  0% 0/30 [00:00<?, ?it/s]

Epoch 0, Train loss: 0.7290288044346703, Acc: 0.5628227194492255, F1-Macro: 0.5625311262361563


  3% 1/30 [00:43<21:02, 43.55s/it]

Epoch 0, Val loss: 0.9351228773593903, Acc: 0.49230769230769234, F1-Macro: 0.32989690721649484
Epoch 1, Train loss: 0.5783598290549384, Acc: 0.7590361445783133, F1-Macro: 0.7582562590646473
Epoch 1, Val loss: 0.9273214936256409, Acc: 0.6307692307692307, F1-Macro: 0.6285714285714286
Validation loss decreased 0.9351228773593903 -> 0.9273214936256409


  7% 2/30 [01:27<20:26, 43.80s/it]

Epoch 2, Train loss: 0.328860138853391, Acc: 0.9018932874354562, F1-Macro: 0.9012744265080714
Epoch 2, Val loss: 1.0944306552410126, Acc: 0.7230769230769231, F1-Macro: 0.7198275862068966
Early stopping counter 1/10


 10% 3/30 [02:12<19:44, 43.88s/it]

Epoch 3, Train loss: 0.09491647241844071, Acc: 0.9862306368330465, F1-Macro: 0.9861804861804861
Epoch 3, Val loss: 0.6738913916051388, Acc: 0.7384615384615385, F1-Macro: 0.7362138935306756
Validation loss decreased 0.9273214936256409 -> 0.6738913916051388


 13% 4/30 [02:55<18:54, 43.62s/it]

Epoch 4, Train loss: 0.03496186766359541, Acc: 0.9948364888123924, F1-Macro: 0.9948118978095672
Epoch 4, Val loss: 0.7430957239121199, Acc: 0.7692307692307693, F1-Macro: 0.7683535281539557
Early stopping counter 1/10


 17% 5/30 [03:38<18:06, 43.47s/it]

Epoch 5, Train loss: 0.03325988332896183, Acc: 0.9982788296041308, F1-Macro: 0.9982714352442751
Epoch 5, Val loss: 1.1020513474941254, Acc: 0.7076923076923077, F1-Macro: 0.7006060606060607
Early stopping counter 2/10


 20% 6/30 [04:21<17:24, 43.51s/it]

Epoch 6, Train loss: 0.09886101281477346, Acc: 0.9707401032702238, F1-Macro: 0.9705863959475517
Epoch 6, Val loss: 0.6647143638692796, Acc: 0.7384615384615385, F1-Macro: 0.7321212121212122
Validation loss decreased 0.6738913916051388 -> 0.6647143638692796


 23% 7/30 [05:04<16:36, 43.33s/it]

Epoch 7, Train loss: 0.13452754521535504, Acc: 0.9845094664371773, F1-Macro: 0.9844201117318436
Epoch 7, Val loss: 0.8683702635898953, Acc: 0.7076923076923077, F1-Macro: 0.6973780936045086
Early stopping counter 1/10


 27% 8/30 [05:49<16:04, 43.82s/it]

Epoch 8, Train loss: 0.1495537774430381, Acc: 0.9535283993115319, F1-Macro: 0.9533492929683436
Epoch 8, Val loss: 0.5791654512286186, Acc: 0.7384615384615385, F1-Macro: 0.7374673319078165
Validation loss decreased 0.6647143638692796 -> 0.5791654512286186


 30% 9/30 [06:33<15:20, 43.84s/it]

Epoch 9, Train loss: 0.03626256878487766, Acc: 0.9931153184165232, F1-Macro: 0.9930872834570722
Epoch 9, Val loss: 0.8948061764240265, Acc: 0.676923076923077, F1-Macro: 0.656084656084656
Early stopping counter 1/10


 33% 10/30 [07:16<14:32, 43.64s/it]

Epoch 10, Train loss: 0.014182086089729436, Acc: 1.0, F1-Macro: 1.0
Epoch 10, Val loss: 0.6085092797875404, Acc: 0.7538461538461538, F1-Macro: 0.7509578544061302
Early stopping counter 2/10


 37% 11/30 [07:56<13:29, 42.59s/it]

Epoch 11, Train loss: 0.003650686852375252, Acc: 1.0, F1-Macro: 1.0
Epoch 11, Val loss: 0.6245921514928341, Acc: 0.7692307692307693, F1-Macro: 0.767247553115302
Early stopping counter 3/10


 40% 12/30 [08:40<12:54, 43.02s/it]

Epoch 12, Train loss: 0.010709233258643912, Acc: 1.0, F1-Macro: 1.0
Epoch 12, Val loss: 1.0297811329364777, Acc: 0.7538461538461538, F1-Macro: 0.7509578544061302
Early stopping counter 4/10


 43% 13/30 [09:23<12:12, 43.06s/it]

Epoch 13, Train loss: 0.09652600886248466, Acc: 0.9948364888123924, F1-Macro: 0.9948165881075937
Epoch 13, Val loss: 2.568748414516449, Acc: 0.6461538461538462, F1-Macro: 0.6233308138070042
Early stopping counter 5/10


 47% 14/30 [10:07<11:32, 43.27s/it]

Epoch 14, Train loss: 0.3886534674093127, Acc: 0.9345955249569707, F1-Macro: 0.9343573093573092
Epoch 14, Val loss: 1.20190768991597, Acc: 0.7230769230769231, F1-Macro: 0.7075
Early stopping counter 6/10


 50% 15/30 [10:50<10:48, 43.21s/it]

Epoch 15, Train loss: 0.4394403100013733, Acc: 0.8364888123924269, F1-Macro: 0.8346053692200277
Epoch 15, Val loss: 0.7853747298941016, Acc: 0.6615384615384615, F1-Macro: 0.6549227799227799
Early stopping counter 7/10


 53% 16/30 [11:34<10:06, 43.30s/it]

Epoch 16, Train loss: 0.39370400624142754, Acc: 0.8485370051635112, F1-Macro: 0.8466172270621835
Epoch 16, Val loss: 1.6119196712970734, Acc: 0.676923076923077, F1-Macro: 0.656084656084656
Early stopping counter 8/10


 57% 17/30 [12:17<09:22, 43.27s/it]

Epoch 17, Train loss: 0.34664354307783973, Acc: 0.8537005163511188, F1-Macro: 0.8526089279265567
Epoch 17, Val loss: 0.8143983586342074, Acc: 0.676923076923077, F1-Macro: 0.6612062546537603
Early stopping counter 9/10


 60% 18/30 [13:00<08:39, 43.28s/it]

Epoch 18, Train loss: 0.3429244988494449, Acc: 0.8691910499139415, F1-Macro: 0.8683293971707341


 60% 18/30 [13:42<09:08, 45.71s/it]

Epoch 18, Val loss: 2.4883471727371216, Acc: 0.7230769230769231, F1-Macro: 0.7176640926640927
Early stopping counter 10/10
Early stopped





In [162]:
for fold, (train_idx,val_idx) in enumerate(splits.split(np.arange(len(dataset)))):

    print('Fold {}'.format(fold + 1))

    train_sampler = SubsetRandomSampler(train_idx)
    test_sampler = SubsetRandomSampler(val_idx)
    train_loader = DataLoader(dataset, batch_size=BATCH_SIZE, sampler=train_sampler)
    test_loader = DataLoader(dataset, batch_size=BATCH_SIZE, sampler=test_sampler)
    

    for epoch_index in tqdm(range(EPOCHS)):

        trainer.train_epoch(train_dataloader, epoch_index)
        trainer.validate_epoch(validation_dataloader, epoch_index)

        # early_stopping check
        early_stopper.check_early_stopping(loss=trainer.val_mean_loss)

        if early_stopper.stop:
            print('Early stopped')
            break

        if early_stopper.save_model:
            check_point = {
                'model': model.state_dict(),
                'optimizer': optimizer.state_dict(),
                'scheduler': scheduler.state_dict()
            }
            torch.save(check_point, 'best.pt2')


  0% 0/30 [00:00<?, ?it/s]

Fold 1
Epoch 0, Train loss: 0.7682837508618832, Acc: 0.5406976744186046, F1-Macro: 0.3761598930781356


  3% 1/30 [00:32<15:47, 32.68s/it]

Epoch 0, Val loss: 0.9458743780851364, Acc: 0.49230769230769234, F1-Macro: 0.32989690721649484
Epoch 1, Train loss: 0.6835463084280491, Acc: 0.6375968992248062, F1-Macro: 0.621313386209955


  7% 2/30 [01:06<15:22, 32.95s/it]

Epoch 1, Val loss: 1.1238063499331474, Acc: 0.5384615384615384, F1-Macro: 0.46560701562071805
Early stopping counter 1/15
Epoch 2, Train loss: 0.6616939418017864, Acc: 0.6569767441860465, F1-Macro: 0.6527392807035554


 10% 3/30 [01:39<14:54, 33.15s/it]

Epoch 2, Val loss: 0.995417557656765, Acc: 0.6307692307692307, F1-Macro: 0.61
Early stopping counter 2/15
Epoch 3, Train loss: 0.6181009039282799, Acc: 0.7248062015503876, F1-Macro: 0.7217589428115745
Epoch 3, Val loss: 0.8335439115762711, Acc: 0.6538461538461539, F1-Macro: 0.6478237312624164
Validation loss decreased 0.9458743780851364 -> 0.8335439115762711


 13% 4/30 [02:15<14:43, 33.97s/it]

Epoch 4, Train loss: 0.5384135842323303, Acc: 0.7674418604651163, F1-Macro: 0.7669376693766938
Epoch 4, Val loss: 1.2458857595920563, Acc: 0.6538461538461539, F1-Macro: 0.6426608026388125
Early stopping counter 1/15


 17% 5/30 [02:51<14:20, 34.44s/it]

Epoch 5, Train loss: 0.5277879517525434, Acc: 0.7596899224806202, F1-Macro: 0.7587621403148941
Epoch 5, Val loss: 0.6447358205914497, Acc: 0.7076923076923077, F1-Macro: 0.7065811356616774
Validation loss decreased 0.8335439115762711 -> 0.6447358205914497


 20% 6/30 [03:26<13:52, 34.69s/it]

Epoch 6, Train loss: 0.5083114635199308, Acc: 0.7868217054263565, F1-Macro: 0.7856592601543737
Epoch 6, Val loss: 1.5758882761001587, Acc: 0.5461538461538461, F1-Macro: 0.438136400263717
Early stopping counter 1/15


 23% 7/30 [04:02<13:24, 34.98s/it]

Epoch 7, Train loss: 0.49770407285541296, Acc: 0.7829457364341085, F1-Macro: 0.775819265143992
Epoch 7, Val loss: 1.434253841638565, Acc: 0.5692307692307692, F1-Macro: 0.48717948717948717
Early stopping counter 2/15


 27% 8/30 [04:38<13:01, 35.51s/it]

Epoch 8, Train loss: 0.45967961102724075, Acc: 0.812015503875969, F1-Macro: 0.8113345521023766
Epoch 8, Val loss: 0.9111808128654957, Acc: 0.6384615384615384, F1-Macro: 0.6135601796217822
Early stopping counter 3/15


 30% 9/30 [05:14<12:25, 35.51s/it]

Epoch 9, Train loss: 0.4393895398825407, Acc: 0.812015503875969, F1-Macro: 0.8108211282245109
Epoch 9, Val loss: 0.706253245472908, Acc: 0.7, F1-Macro: 0.6999822474702645
Early stopping counter 4/15


 33% 10/30 [05:50<11:50, 35.52s/it]

Epoch 10, Train loss: 0.39461581595242023, Acc: 0.8275193798449613, F1-Macro: 0.8271760114704187
Epoch 10, Val loss: 0.778014287352562, Acc: 0.6692307692307692, F1-Macro: 0.6668454615888908
Early stopping counter 5/15


 37% 11/30 [06:25<11:15, 35.56s/it]

Epoch 11, Train loss: 0.41729013342410326, Acc: 0.8391472868217055, F1-Macro: 0.8368674652903423
Epoch 11, Val loss: 0.8724043658003211, Acc: 0.6538461538461539, F1-Macro: 0.6233339772068764
Early stopping counter 6/15


 40% 12/30 [07:01<10:41, 35.65s/it]

Epoch 12, Train loss: 0.39234778191894293, Acc: 0.8624031007751938, F1-Macro: 0.8614408846966986
Epoch 12, Val loss: 0.7945217937231064, Acc: 0.7, F1-Macro: 0.688479262672811
Early stopping counter 7/15


 43% 13/30 [07:37<10:05, 35.61s/it]

Epoch 13, Train loss: 0.42370548378676176, Acc: 0.872093023255814, F1-Macro: 0.8700945987183399
Epoch 13, Val loss: 0.9107252359390259, Acc: 0.6923076923076923, F1-Macro: 0.6832358674463938
Early stopping counter 8/15


 47% 14/30 [08:12<09:27, 35.48s/it]

Epoch 14, Train loss: 0.43118566647171974, Acc: 0.813953488372093, F1-Macro: 0.8137268173818871
Epoch 14, Val loss: 2.1111379861831665, Acc: 0.5461538461538461, F1-Macro: 0.41801350633583734
Early stopping counter 9/15


 50% 15/30 [08:47<08:50, 35.39s/it]

Epoch 15, Train loss: 0.40662930719554424, Acc: 0.8449612403100775, F1-Macro: 0.8439272265323714
Epoch 15, Val loss: 0.644223190844059, Acc: 0.7230769230769231, F1-Macro: 0.7149122807017543
Validation loss decreased 0.6447358205914497 -> 0.644223190844059


 53% 16/30 [09:22<08:13, 35.25s/it]

Epoch 16, Train loss: 0.33563312143087387, Acc: 0.874031007751938, F1-Macro: 0.8731501057082452
Epoch 16, Val loss: 0.9240188002586365, Acc: 0.7, F1-Macro: 0.6842891836353446
Early stopping counter 1/15


 57% 17/30 [09:57<07:37, 35.21s/it]

Epoch 17, Train loss: 0.3492675945162773, Acc: 0.874031007751938, F1-Macro: 0.8739244674492821
Epoch 17, Val loss: 0.73789381980896, Acc: 0.7461538461538462, F1-Macro: 0.7457777777777779
Early stopping counter 2/15


 60% 18/30 [10:32<07:02, 35.18s/it]

Epoch 18, Train loss: 0.3066897913813591, Acc: 0.8624031007751938, F1-Macro: 0.8611510109719354
Epoch 18, Val loss: 0.7100876197218895, Acc: 0.7076923076923077, F1-Macro: 0.7059523809523809
Early stopping counter 3/15


 63% 19/30 [11:07<06:26, 35.15s/it]

Epoch 19, Train loss: 0.27630001585930586, Acc: 0.9031007751937985, F1-Macro: 0.9022549554464449
Epoch 19, Val loss: 0.5992663186043501, Acc: 0.7384615384615385, F1-Macro: 0.7333494208494209
Validation loss decreased 0.644223190844059 -> 0.5992663186043501


 67% 20/30 [11:42<05:52, 35.21s/it]

Epoch 20, Train loss: 0.3045996753498912, Acc: 0.9011627906976745, F1-Macro: 0.9005348199943305
Epoch 20, Val loss: 0.479233393445611, Acc: 0.7846153846153846, F1-Macro: 0.7845643939393939
Validation loss decreased 0.5992663186043501 -> 0.479233393445611


 70% 21/30 [12:18<05:16, 35.20s/it]

Epoch 21, Train loss: 0.2091509341262281, Acc: 0.9244186046511628, F1-Macro: 0.9241448199174505
Epoch 21, Val loss: 0.5212227269075811, Acc: 0.7538461538461538, F1-Macro: 0.7538461538461539
Early stopping counter 1/15


 73% 22/30 [12:53<04:42, 35.26s/it]

Epoch 22, Train loss: 0.21033362857997417, Acc: 0.9263565891472868, F1-Macro: 0.9259550171442381
Epoch 22, Val loss: 0.7659521102905273, Acc: 0.7769230769230769, F1-Macro: 0.7753143810715775
Early stopping counter 2/15


 77% 23/30 [13:29<04:07, 35.37s/it]

Epoch 23, Train loss: 0.21610141918063164, Acc: 0.9147286821705426, F1-Macro: 0.9141041162227603
Epoch 23, Val loss: 0.6090688835829496, Acc: 0.7384615384615385, F1-Macro: 0.7344388368180726
Early stopping counter 3/15


 80% 24/30 [14:04<03:32, 35.37s/it]

Epoch 24, Train loss: 0.24940579943358898, Acc: 0.9166666666666666, F1-Macro: 0.9162359798706617
Epoch 24, Val loss: 0.6049113869667053, Acc: 0.7923076923076923, F1-Macro: 0.7908099409976758
Early stopping counter 4/15


 83% 25/30 [14:39<02:56, 35.35s/it]

Epoch 25, Train loss: 0.17684346018359065, Acc: 0.939922480620155, F1-Macro: 0.9396447962691157
Epoch 25, Val loss: 0.604477159678936, Acc: 0.7384615384615385, F1-Macro: 0.7321212121212122
Early stopping counter 5/15


 87% 26/30 [15:15<02:21, 35.30s/it]

Epoch 26, Train loss: 0.16784880496561527, Acc: 0.9476744186046512, F1-Macro: 0.9473419635264102
Epoch 26, Val loss: 0.8495041653513908, Acc: 0.7769230769230769, F1-Macro: 0.7739130434782608
Early stopping counter 6/15


 90% 27/30 [15:50<01:45, 35.24s/it]

Epoch 27, Train loss: 0.20689245057292283, Acc: 0.9476744186046512, F1-Macro: 0.9473737888832228
Epoch 27, Val loss: 0.5257819592952728, Acc: 0.7846153846153846, F1-Macro: 0.7813025714972363
Early stopping counter 7/15


 93% 28/30 [16:25<01:10, 35.20s/it]

Epoch 28, Train loss: 0.16314261313527822, Acc: 0.939922480620155, F1-Macro: 0.9394620616051865
Epoch 28, Val loss: 0.6106783226132393, Acc: 0.7615384615384615, F1-Macro: 0.7563335147227765
Early stopping counter 8/15


 97% 29/30 [17:00<00:35, 35.17s/it]

Epoch 29, Train loss: 0.18079140887130052, Acc: 0.9321705426356589, F1-Macro: 0.9317395823490504
Epoch 29, Val loss: 0.5674663316458464, Acc: 0.7307692307692307, F1-Macro: 0.7235555015493043
Early stopping counter 9/15


100% 30/30 [17:35<00:00, 35.18s/it]
  0% 0/30 [00:00<?, ?it/s]

Fold 2


  0% 0/30 [00:01<?, ?it/s]


ValueError: Tried to step 512 times. The specified number of total steps is 510

## Inference
### 모델 로드

In [163]:
TRAINED_MODEL_PATH = 'best.pt2'

### Load dataset

In [164]:
class TestDataset(Dataset):
    def __init__(self, data_dir, input_shape):
        self.data_dir = data_dir
        self.input_shape = input_shape
        
        # Loading dataset
        self.db = self.data_loader()
        
        # Transform function
        # self.transform = transforms.Compose([transforms.Resize(self.input_shape),
        #                                      transforms.ToTensor(),
        #                                      transforms.Normalize([0.485, 0.456, 0.406], [0.229, 0.224, 0.225])])
        self.transform = albumentations.Compose([albumentations.Resize(512, 512), 
                                                 albumentations.RandomCrop(500, 500),
                                                 albumentations.HorizontalFlip(), # Same with transforms.RandomHorizontalFlip()
                                                 albumentations.VerticalFlip(),
                                                albumentations.Normalize([0.485, 0.456, 0.406], [0.229, 0.224, 0.225]),
                                                albumentations.pytorch.transforms.ToTensorV2()])

    def data_loader(self):
        print('Loading test dataset..')
        if not os.path.isdir(self.data_dir):
            print(f'!!! Cannot find {self.data_dir}... !!!')
            sys.exit()
        
        db = pd.read_csv(os.path.join(self.data_dir, 'sample_submission.csv'))
        return db
    
    def __len__(self):
        return len(self.db)
    
    def __getitem__(self, index):
        data = copy.deepcopy(self.db.loc[index])
        
        # Loading image
        cvimg = cv2.imread(os.path.join(self.data_dir,'test',data['file_name']), cv2.IMREAD_COLOR | cv2.IMREAD_IGNORE_ORIENTATION)
        if not isinstance(cvimg, np.ndarray):
            raise IOError("Fail to read %s" % data['file_name'])

        

        # Preprocessing images
        image = cv2.cvtColor(cvimg, cv2.COLOR_BGR2RGB)
        trans_image = self.transform(image = image)
        trans_image = trans_image['image']
        
        
        # trans_image = self.transform(Image.fromarray(cvimg))
        

        # trans_image = self.transform(Image.fromarray(cvimg))

        
        
        
        return trans_image, data['file_name']

In [165]:
# Load dataset & dataloader
test_dataset = TestDataset(data_dir=DATA_DIR, input_shape=INPUT_SHAPE)
test_dataloader = DataLoader(dataset=test_dataset, batch_size=BATCH_SIZE, shuffle=False)

Loading test dataset..


### 추론 진행

In [166]:
model.load_state_dict(torch.load(TRAINED_MODEL_PATH)['model'])

<All keys matched successfully>

In [167]:
model.load_state_dict(torch.load(TRAINED_MODEL_PATH)['model'])

# Prediction
file_lst = []
pred_lst = []
prob_lst = []
model.eval()
with torch.no_grad():
    for batch_index, (img, file_num) in tqdm(enumerate(test_dataloader)):
        img = img.to(DEVICE)
        pred = model(img)
        print(pred)
        file_lst.extend(list(file_num))
        pred_lst.extend(pred.argmax(dim=1).tolist())
        prob_lst.extend(pred[:, 1].tolist())

1it [00:00,  1.33it/s]

tensor([[9.9643e-01, 3.5694e-03],
        [9.9848e-01, 1.5247e-03],
        [9.4987e-01, 5.0131e-02],
        [7.0379e-02, 9.2962e-01],
        [9.9970e-01, 2.9999e-04],
        [4.7412e-03, 9.9526e-01],
        [4.5433e-02, 9.5457e-01],
        [5.0529e-02, 9.4947e-01],
        [9.9214e-01, 7.8635e-03],
        [1.5984e-03, 9.9840e-01],
        [9.9970e-01, 2.9728e-04],
        [6.4048e-01, 3.5952e-01],
        [9.9665e-01, 3.3550e-03],
        [8.8154e-01, 1.1846e-01],
        [9.2237e-01, 7.7632e-02],
        [9.0158e-01, 9.8420e-02],
        [9.8807e-01, 1.1933e-02],
        [9.8912e-01, 1.0878e-02],
        [9.9457e-01, 5.4262e-03],
        [9.9986e-01, 1.4212e-04],
        [9.9979e-01, 2.0895e-04],
        [9.9909e-01, 9.0904e-04],
        [2.6382e-01, 7.3618e-01],
        [9.9630e-01, 3.7042e-03],
        [1.6673e-02, 9.8333e-01],
        [9.9990e-01, 1.0128e-04],
        [9.9802e-01, 1.9762e-03],
        [7.1208e-01, 2.8792e-01],
        [1.3364e-01, 8.6636e-01],
        [2.711

2it [00:01,  1.38it/s]

tensor([[0.0013, 0.9987],
        [0.9966, 0.0034],
        [0.9016, 0.0984],
        [0.4069, 0.5931],
        [0.4772, 0.5228],
        [0.4845, 0.5155],
        [0.1936, 0.8064],
        [0.9617, 0.0383],
        [0.0213, 0.9787],
        [0.6659, 0.3341],
        [0.9261, 0.0739],
        [0.0040, 0.9960],
        [0.2905, 0.7095],
        [0.3863, 0.6137],
        [0.0363, 0.9637],
        [0.8933, 0.1067],
        [0.3067, 0.6933],
        [0.9568, 0.0432],
        [0.1547, 0.8453],
        [0.0035, 0.9965],
        [0.8412, 0.1588],
        [0.4900, 0.5100],
        [0.1730, 0.8270],
        [0.4589, 0.5411],
        [0.6529, 0.3471],
        [0.0040, 0.9960],
        [0.9168, 0.0832],
        [0.6601, 0.3399],
        [0.0182, 0.9818],
        [0.9973, 0.0027],
        [0.9906, 0.0094],
        [0.9553, 0.0447]], device='cuda:0')


4it [00:02,  1.82it/s]

tensor([[7.3598e-04, 9.9926e-01],
        [1.1086e-03, 9.9889e-01],
        [5.1649e-02, 9.4835e-01],
        [3.6460e-02, 9.6354e-01],
        [8.3130e-01, 1.6870e-01],
        [9.9849e-01, 1.5113e-03],
        [9.8914e-01, 1.0857e-02],
        [9.8298e-01, 1.7021e-02],
        [9.7614e-01, 2.3861e-02],
        [9.9857e-01, 1.4312e-03],
        [2.8216e-03, 9.9718e-01],
        [7.7684e-01, 2.2316e-01],
        [9.9993e-01, 7.1884e-05],
        [9.9452e-01, 5.4806e-03],
        [2.2632e-03, 9.9774e-01],
        [1.8441e-02, 9.8156e-01],
        [1.1681e-06, 1.0000e+00],
        [4.9995e-01, 5.0005e-01],
        [8.6279e-01, 1.3721e-01],
        [4.5730e-01, 5.4270e-01],
        [1.3032e-01, 8.6968e-01],
        [2.0276e-01, 7.9724e-01],
        [9.9866e-01, 1.3435e-03],
        [4.6370e-03, 9.9536e-01],
        [9.8784e-01, 1.2164e-02],
        [4.6391e-02, 9.5361e-01],
        [7.4403e-01, 2.5597e-01],
        [9.9238e-01, 7.6187e-03],
        [3.9123e-01, 6.0877e-01],
        [6.911




### 결과 저장

In [168]:
df = pd.DataFrame({'file_name':file_lst, 'COVID':pred_lst})
# df.sort_values(by=['file_name'], inplace=True)
df.to_csv('prediction2.csv', index=False)