## Import

In [1]:
import os
import cv2
from PIL import Image
import pandas as pd
import numpy as np

import torch
import torch.nn as nn
import torch.nn.functional as F
from torch.utils.data import Dataset, DataLoader
from torchvision import transforms
from torch.optim.lr_scheduler import _LRScheduler

from tqdm import tqdm
import albumentations as A
from albumentations.pytorch import ToTensorV2

from torchvision import models
from torchsummary import summary
import torch.nn.functional as F

# GPU 사용이 가능할 경우, GPU를 사용할 수 있게 함.'
os.environ['CUDA_VISIBLE_DEVICES'] = '2'
device = "cuda" if torch.cuda.is_available() else "cpu"
device = torch.device(device)
print(device)

print(os.environ.get('CUDA_VISIBLE_DEVICES'))

  from .autonotebook import tqdm as notebook_tqdm


cuda
2


## Utils

In [2]:
# RLE 인코딩 함수
def rle_encode(mask):
    pixels = mask.flatten()
    pixels = np.concatenate([[0], pixels, [0]])
    runs = np.where(pixels[1:] != pixels[:-1])[0] + 1
    runs[1::2] -= runs[::2]
    return ' '.join(str(x) for x in runs)

# 클래스별 IoU를 계산하기 위한 함수
def calculate_iou_per_class(y_true, y_pred, class_id):
    intersection = np.sum((y_true == class_id) & (y_pred == class_id))
    union = np.sum((y_true == class_id) | (y_pred == class_id))
    iou = intersection / union if union > 0 else 0
    return iou

In [3]:
import torch
import torch.nn as nn
import torch.autograd as autograd

class GradReverseFunction(autograd.Function):
    @staticmethod
    def forward(ctx, x, l):
        ctx.l = l
        return x.view_as(x)

    @staticmethod
    def backward(ctx, grad_output):
        return grad_output.neg() * ctx.l, None

def grad_reverse(x, l):
    return GradReverseFunction.apply(x, l)

class GradReverse(nn.Module):
    def __init__(self, l):
        super(GradReverse, self).__init__()
        self.l = nn.Parameter(torch.tensor(l), requires_grad=False)

    def forward(self, x):
        return grad_reverse(x, self.l)


## Dataset, Data Loader

출력이미지 크기 키우기->ex) resnet 2048->1024->512->256 conv 256->512->1024->2048

In [4]:
class CustomDataset(Dataset):
    def __init__(self, csv_file, transform=None, infer=False):
        self.data = pd.read_csv(csv_file)
        self.transform = transform
        self.infer = infer

    def __len__(self):
        return len(self.data)

    def __getitem__(self, idx):
        directory_path = "/mnt/nas27/Dataset/Samsung_DM"
        img_path = self.data.iloc[idx, 1]
        img_path = os.path.join(directory_path, img_path[2:])
        image = cv2.imread(img_path)
        image = cv2.cvtColor(image, cv2.COLOR_BGR2RGB)
        #image = cv2.cvtColor(image, cv2.COLOR_BGR2GRAY)
        
        if self.infer:
            if self.transform:
                image = self.transform(image=image)['image']
            return image
        
        mask_path = self.data.iloc[idx, 2]
        mask_path = os.path.join(directory_path, mask_path[2:])
        mask = cv2.imread(mask_path)
        #mask = cv2.cvtColor(mask, cv2.COLOR_BGR2RGB)
        mask = cv2.cvtColor(mask, cv2.COLOR_BGR2GRAY)
        mask[mask == 255] = 12 #배경을 픽셀값 12로 간주

        if self.transform:
            augmented = self.transform(image=image, mask=mask)
            image = augmented['image']
            mask = augmented['mask']

        return image, mask

class CustomDataset_target(Dataset):
    def __init__(self, csv_file, transform=None, infer=False):
        self.data = pd.read_csv(csv_file)
        self.transform = transform
        self.infer = infer

    def __len__(self):
        return len(self.data)

    def __getitem__(self, idx):
        directory_path = "/mnt/nas27/Dataset/Samsung_DM"
        img_path = self.data.iloc[idx, 1]
        img_path = os.path.join(directory_path, img_path[2:])
        image = cv2.imread(img_path)
        image = cv2.cvtColor(image, cv2.COLOR_BGR2RGB)
        
        if self.infer:
            if self.transform:
                image = self.transform(image=image)['image']
            return image


        if self.transform:
            augmented = self.transform(image=image)
            image = augmented['image']
            

        return image
     

transform = A.Compose(
    [   
        #A.Resize(224, 224),
        A.Resize(128, 128),
        A.Normalize(),
        
        # 변형
        # A.VerticalFlip(p=0.5),
        # A.RandomRotate90(p=0.5),
        # A.HueSaturationValue(p=0.2),
        
        ToTensorV2()
    ]
)

Warmup

In [5]:
# class WarmUpLR(_LRScheduler):
#     def __init__(self, optimizer, total_iters, last_epoch=-1):
#         self.total_iters = total_iters
#         super(WarmUpLR, self).__init__(optimizer, last_epoch)

#     def get_lr(self):
#         return [base_lr * self.last_epoch / self.total_iters for base_lr in self.base_lrs]


## Define Model

In [6]:
#Unet의 기본이 되는 conv블럭
class ConvBlock(nn.Module):
    def __init__(self, in_channels, out_channels):
        super(ConvBlock, self).__init__()
        self.conv1 = nn.Conv2d(in_channels, out_channels, kernel_size=3, padding=1)
        self.bn1 = nn.BatchNorm2d(out_channels)
        self.relu1 = nn.ReLU()
        
        self.conv2 = nn.Conv2d(out_channels, out_channels, kernel_size=3, padding=1)  # 여기서 in_channels는 out_channels와 동일해야 합니다.
        self.bn2 = nn.BatchNorm2d(out_channels)
        self.relu2 = nn.ReLU()

    def forward(self, x):
        x = self.conv1(x)
        x = self.bn1(x)
        x = self.relu1(x)
        
        x = self.conv2(x)
        x = self.bn2(x)
        x = self.relu2(x)
        return x

#인코더 블럭
class EncoderBlock(nn.Module):
    def __init__(self, in_channels, out_channels):
        super(EncoderBlock,self).__init__()
        self.convblock1 = ConvBlock(in_channels, out_channels)  # 첫 번째 ConvBlock의 in_channels는 입력 이미지의 채널 수와 일치해야 합니다.
        #self.convblock2 = ConvBlock(out_channels, out_channels)  # 두 번째 ConvBlock의 in_channels는 out_channels와 일치해야 합니다.
        self.maxpool = nn.MaxPool2d(kernel_size=2, stride=2)

    def forward(self,x):
        x = self.convblock1(x)
        #x = self.convblock2(x)
        p = self.maxpool(x)
        return x , p
#디코더 블럭
#디코더는 업샘플링 이후 스킵연결과 붙어서 convblock을 통과해야함
#skip보다 작은 x x먼저 업샘플링 32 -> 64 , skip과 결합 6464 
class DecoderBlock(nn.Module):
    def __init__(self, channels):
        super(DecoderBlock,self).__init__()
        self.upsample = nn.ConvTranspose2d(channels*2, channels, kernel_size=4, stride=2, padding=1)#x 업샘플링
        self.convblock1 = ConvBlock(channels*2, channels)#차원감소
        #self.convblock2 = ConvBlock(channels, channels)
    def forward(self,x,skip):
        x = self.upsample(x)
        x = torch.cat([x, skip], dim=1)
        x = self.convblock1(x)
        #x = self.convblock2(x)
        return x
        
#Unet구조 middle의 xm값의 움직임에 주의
class Unet(nn.Module):
    def __init__(self,n_classes):
        super(Unet,self).__init__()
        self.encoder1 = EncoderBlock(3,64)
        self.encoder2 = EncoderBlock(64,128)
        self.encoder3 = EncoderBlock(128,256)
        self.encoder4 = EncoderBlock(256,512)
        
        self.middleconv = ConvBlock(512,1024)
        
        
        self.decoder4 = DecoderBlock(512)
        self.decoder3 = DecoderBlock(256)
        self.decoder2 = DecoderBlock(128)
        self.decoder1 = DecoderBlock(64)
        self.segmap = nn.Conv2d(64,n_classes, kernel_size=1)
        
        ##
        # self.domain_classifier = nn.Sequential(
        #     nn.Conv3d(1024, 64, kernel_size=3, padding=1),
        #     nn.ReLU(),
        #     nn.Conv3d(64, 32, kernel_size=3, padding=1),
        #     nn.ReLU(),
        #     nn.Flatten(),
        #     nn.Linear(32 * 16 * 16 * 16, 1),
        #     nn.Sigmoid()
        # )

        # self.grad_reverse = GradReverse(0.0)
        ##

    def forward(self,x):
        x1,p = self.encoder1(x)#3->64   #P:256,256 x1 :512,512
        x2,p = self.encoder2(p)#64->128 #P:128,128 x2:256,256
        x3,p = self.encoder3(p)#128->256#p:64,64 x3:128,128
        x4,p = self.encoder4(p)#256->512#p:32,32 x4:64,64
        
        xm = self.middleconv(p)#512->1024#32,32
        
        x = self.decoder4(xm,x4)#뉴런:1024->512->512 #출력tensor:64,64
        x = self.decoder3(x,x3)#뉴런:512->256->256 #출력tensor:128,128
        x = self.decoder2(x,x2)#뉴런:256->128->128 #출력tensor:256,256
        x = self.decoder1(x,x1)#뉴런:128->64->64 #출력tensor:512,512
        x = self.segmap(x)

        # 도메인 분류기에 GradReverse 적용
        #feat = self.grad_reverse(x)
        #domain_output = self.domain_classifier(x)

        return x

## ResNet50

In [7]:
# import torch.nn as nn
# import torchvision.models as models

# class UNetWithResnet50Encoder(nn.Module):
#     def __init__(self, n_classes):
#         super().__init__()
        
#         # ResNet50 백본을 불러옵니다.
#         self.resnet = models.resnet50(pretrained=True)
        
#         # 인코더 부분
#         self.encoder0 = nn.Sequential(
#             self.resnet.conv1,
#             self.resnet.bn1,
#             self.resnet.relu,
#             self.resnet.maxpool
#         )
#         self.encoder1 = self.resnet.layer1
#         self.encoder2 = self.resnet.layer2
#         self.encoder3 = self.resnet.layer3
#         self.encoder4 = self.resnet.layer4
        
#         # 중간 컨볼루션
#         self.middle_conv = nn.Sequential(
#             nn.Conv2d(2048, 1024, kernel_size=3, padding=1),
#             nn.ReLU()
#         )
        
#         # 디코더 부분
#         self.decoder3 = nn.Sequential(
#             nn.ConvTranspose2d(1024+1024, 512, kernel_size=2, stride=2),
#             nn.ReLU()
#         )
#         self.decoder2 = nn.Sequential(
#             nn.ConvTranspose2d(512+512, 256, kernel_size=2, stride=2),
#             nn.ReLU()
#         )
#         # 디코더 부분
#         self.decoder1 = nn.Sequential(
#             nn.ConvTranspose2d(256+256, 128, kernel_size=2, stride=2),  # 출력 채널 수를 128로 변경
#             nn.ReLU()
#         )
#         self.decoder0 = nn.Sequential(
#             nn.ConvTranspose2d(128+64, n_classes, kernel_size=2, stride=2),  # 입력 채널 수를 192로 변경
#             nn.ReLU()
#         )
        
#     def forward(self, x):
#         # 인코더 부분
#         x0 = self.encoder0(x)
#         x1 = self.encoder1(x0)
#         x2 = self.encoder2(x1)
#         x3 = self.encoder3(x2)
#         x4 = self.encoder4(x3)
        
#         # 중간 컨볼루션 후 업샘플링
#         middle = self.middle_conv(x4)
#         middle_upsampled = nn.functional.interpolate(middle, scale_factor=2, mode='bilinear', align_corners=True)

#         # 디코더 부분 (skip connection 추가)
#         d3 = self.decoder3(torch.cat([middle_upsampled, x3], dim=1))
#         d2 = self.decoder2(torch.cat([d3, x2], dim=1))
#         d1 = self.decoder1(torch.cat([d2, x1], dim=1))
#         out = self.decoder0(torch.cat([d1, x0], dim=1))
        
#         return out


In [8]:
LR = 0.001
EP = 5
BATCH_SIZE = 64
ACCMULATION_STEP = 1 
N_CLASSES = 13 #IoU 점수측정하기 위한 클래스의 개수
# WUP_ITERS = 10  # 웜업을 위한 반복 횟수
# model 초기화
#model = Unet_resnet18(n_classes = N_CLASSES).to(device)
#model = ResNet50(num_classes=N_CLASSES).to(device)
model = Unet(n_classes = N_CLASSES).to(device)

# loss function과 optimizer 정의

criterion =nn.CrossEntropyLoss()
domain_criterion = nn.BCELoss()
optimizer = torch.optim.Adam(model.parameters(), lr=LR)
optimizer.zero_grad() 
#optimizer = torch.optim.SGD(model.parameters(), lr=LR, momentum=0.9, nesterov=True)
# Warmup을 위한 스케줄러 설정
# scheduler_warmup = WarmUpLR(optimizer, WUP_ITERS)

dataset = CustomDataset(csv_file=os.path.join("/mnt/nas27/Dataset/Samsung_DM",'./train_source.csv'), transform=transform)
dataloader = DataLoader(dataset, batch_size=BATCH_SIZE, shuffle=True, num_workers=8)
valid_dataset = CustomDataset(csv_file=os.path.join("/mnt/nas27/Dataset/Samsung_DM",'./val_source.csv'), transform=transform)
valid_dataloader = DataLoader(valid_dataset, batch_size=BATCH_SIZE, shuffle=False, num_workers=8)
target_dataset = CustomDataset_target(csv_file=os.path.join("/mnt/nas27/Dataset/Samsung_DM",'./train_target.csv'), transform=transform)
target_dataloader = DataLoader(target_dataset, batch_size=BATCH_SIZE, shuffle=False, num_workers=8)
test_dataset = CustomDataset(csv_file=os.path.join("/mnt/nas27/Dataset/Samsung_DM",'./test.csv'), transform=transform, infer=True)
test_dataloader = DataLoader(test_dataset, batch_size=BATCH_SIZE, shuffle=False, num_workers=8)

In [9]:
# import pandas as pd
# import os

# # 데이터셋을 불러옵니다.
# csv_file = os.path.join("/mnt/nas27/Dataset/Samsung_DM", './train_source.csv')
# data = pd.read_csv(csv_file)

# # 클래스별 샘플 수를 저장할 리스트를 초기화합니다.
# class_sample_counts = [0] * N_CLASSES  # num_classes는 클래스의 총 개수입니다.

# # 데이터셋을 순회하면서 클래스별 샘플 수를 세고 저장합니다.
# for idx in range(len(data)):
#     mask_path = os.path.join("/mnt/nas27/Dataset/Samsung_DM", data.iloc[idx, 2][2:])  # 마스크 이미지 경로
#     mask = cv2.imread(mask_path, cv2.IMREAD_GRAYSCALE)
#     mask[mask == 255] = 12  # 배경 클래스로 처리

#     # 각 클래스의 샘플 수를 카운트합니다.
#     for class_id in range(N_CLASSES):
#         class_sample_counts[class_id] += (mask == class_id).sum()

# # 클래스별 가중치를 계산합니다.
# total_samples = sum(class_sample_counts)
# class_weights = [total_samples / count for count in class_sample_counts]

# # 클래스별 가중치를 텐서로 변환합니다.
# class_weights = torch.tensor(class_weights).to(device)

In [10]:
# print(class_sample_counts)
# print(class_weights)

In [11]:
# import matplotlib.pyplot as plt

# # 데이터로더에서 배치 하나를 가져옵니다.
# dataiter = iter(dataloader)
# images, masks = next(dataiter)

# # 이미지를 시각화합니다.
# for i in range(images.size(0)):
#     image = images[i].permute(1, 2, 0).numpy()  # 이미지를 CHW에서 HWC로 변환
#     mask = masks[i].numpy()

#     plt.figure(figsize=(8, 8))
#     plt.subplot(1, 2, 1)
#     plt.imshow(image)
#     plt.title("Image")

#     plt.subplot(1, 2, 2)
#     plt.imshow(mask, cmap='gray')
#     plt.title("Mask")

#     plt.show()


In [12]:
# for images, masks in tqdm(dataloader):
#     a = images.float().to(device)
#     b = masks.long().to(device)
#     break

# # PyTorch Tensor를 NumPy 배열로 변환
# a_numpy = a[3].cpu().numpy()  # 첫 번째 이미지만 선택하거나 필요한 이미지를 선택하세요.
# a_numpy = np.transpose(a_numpy, (1, 2, 0))
# b_numpy = b[3].cpu().numpy()
# b_numpy = b_numpy*12

# # 이미지를 저장
# cv2.imwrite('image_source.png', a_numpy)  # 이미지 저장
# cv2.imwrite('image_mask.png', b_numpy)   # 마스크 저장

In [13]:

# for epoch in range(2):  # 5 에폭 동안 학습합니다.
          
#     # 클래스별 IoU를 누적할 리스트 초기화
#     train_class_ious = []
    
#     # 학습
#     model.train()
#     epoch_loss = 0
    
#     for images, masks in tqdm(dataloader):
#         images = images.float().to(device)
#         masks = masks.long().to(device)

#         optimizer.zero_grad()
#         outputs = model(images)
#         mask_spueeze = masks.squeeze(1)
#         loss = criterion(outputs, masks.squeeze(1))
#         loss.backward()
#         optimizer.step()

#         epoch_loss += loss.item()

## Model Train

In [14]:
import random
torch.cuda.empty_cache()

for epoch in range(EP):
    # 클래스별 IoU를 누적할 리스트 초기화
    train_class_ious = []
    # 학습
    model.train()
    epoch_loss = 0
    for images, masks in tqdm(dataloader):
        images = images.float().to(device)
        masks = masks.long().to(device)

        optimizer.zero_grad()
        outputs = model(images)
        loss = criterion(outputs, masks.squeeze(1))
        loss.backward()
        optimizer.step()
        # if (epoch+1) % ACCMULATION_STEP == 0:
        #     optimizer.step()
        #     optimizer.zero_grad()
            # # Warmup 스케줄러 업데이트
            # if epoch < WUP_ITERS:
            #     scheduler_warmup.step()
        
        epoch_loss += loss.item()

        # train 클래스별 IoU 계산
        outputs = torch.softmax(outputs, dim=1).cpu()
        outputs = torch.argmax(outputs, dim=1).numpy()

        for class_id in range(N_CLASSES):
            iou = calculate_iou_per_class(np.array(masks.cpu()), np.array(outputs), class_id)
            train_class_ious.append(iou)

    train_class_ious = np.array(train_class_ious).reshape(N_CLASSES, -1)
    train_class_ious = np.mean(train_class_ious, axis=1)
    print("--IoU Scores Train--")
    for class_id, iou in enumerate(train_class_ious):
        print(f'Class{class_id}: {iou:.4f}', end=" ")
        if (class_id+1) % 7 == 0:
            print()

    # mIoU 계산
    train_mIoU = np.mean(train_class_ious)

    # validation
    val_loss = 0
    val_class_ious = []  # 클래스별 IoU를 누적할 리스트 초기화
    with torch.no_grad():
        model.eval()
        for images, masks in tqdm(valid_dataloader):
            images = images.float().to(device)
            masks = masks.long().to(device)
            outputs = model(images)

            # validation loss 계산
            val_loss += criterion(outputs, masks.squeeze(1)).item()

            # validation 클래스별 IoU 계산
            outputs = torch.softmax(outputs, dim=1).cpu()
            outputs = torch.argmax(outputs, dim=1).numpy()

            for class_id in range(N_CLASSES):
                iou = calculate_iou_per_class(np.array(masks.cpu()), np.array(outputs), class_id)
                val_class_ious.append(iou)

    val_class_ious = np.array(val_class_ious).reshape(N_CLASSES, -1)
    val_class_ious = np.mean(val_class_ious, axis=1)
    print("--IoU Scores Valid--")
    for class_id, iou in enumerate(val_class_ious):
        print(f'Class{class_id}: {iou:.4f}', end=" ")
        if (class_id+1) % 7 == 0:
            print("")

    # mIoU 계산
    val_mIoU = np.mean(val_class_ious)

    # 에폭마다 결과 출력 
    print(f"\nEpoch{epoch+1}")
    print(f"Train Loss: {(epoch_loss/len(dataloader))}, Train mIoU Score: {train_mIoU:.4f}")
    print(f"Validation Loss: {val_loss/len(valid_dataloader)}, Validation mIoU Score: {val_mIoU:.4f}")
    print("___________________________________________________________________________________________\n")


100%|██████████| 35/35 [02:20<00:00,  4.01s/it]


--IoU Scores Train--
Class0: 0.0919 Class1: 0.1953 Class2: 0.2588 Class3: 0.2539 Class4: 0.2671 Class5: 0.3098 Class6: 0.2792 
Class7: 0.2973 Class8: 0.3514 Class9: 0.2943 Class10: 0.3301 Class11: 0.3522 Class12: 0.3387 

100%|██████████| 8/8 [00:30<00:00,  3.87s/it]


--IoU Scores Valid--
Class0: 0.2100 Class1: 0.3960 Class2: 0.1967 Class3: 0.2884 Class4: 0.4174 Class5: 0.2735 Class6: 0.2752 
Class7: 0.2285 Class8: 0.2304 Class9: 0.4168 Class10: 0.2455 Class11: 0.2834 Class12: 0.3153 
Epoch1
Train Loss: 1.1496937922069004, Train mIoU Score: 0.2785
Validation Loss: 0.9325250685214996, Validation mIoU Score: 0.2905
___________________________________________________________________________________________



100%|██████████| 35/35 [02:00<00:00,  3.44s/it]


--IoU Scores Train--
Class0: 0.3349 Class1: 0.3334 Class2: 0.3635 Class3: 0.3202 Class4: 0.3398 Class5: 0.3738 Class6: 0.3326 
Class7: 0.3451 Class8: 0.4009 Class9: 0.3274 Class10: 0.3527 Class11: 0.3792 Class12: 0.3678 

100%|██████████| 8/8 [00:24<00:00,  3.08s/it]


--IoU Scores Valid--
Class0: 0.2096 Class1: 0.4105 Class2: 0.1666 Class3: 0.3302 Class4: 0.4321 Class5: 0.2306 Class6: 0.3139 
Class7: 0.1982 Class8: 0.2690 Class9: 0.4354 Class10: 0.2218 Class11: 0.3274 Class12: 0.3184 
Epoch2
Train Loss: 0.5872848442622594, Train mIoU Score: 0.3516
Validation Loss: 0.8319521546363831, Validation mIoU Score: 0.2972
___________________________________________________________________________________________



100%|██████████| 35/35 [02:16<00:00,  3.91s/it]


--IoU Scores Train--
Class0: 0.3530 Class1: 0.3603 Class2: 0.3838 Class3: 0.3360 Class4: 0.3627 Class5: 0.3906 Class6: 0.3512 
Class7: 0.3870 Class8: 0.4249 Class9: 0.3828 Class10: 0.3882 Class11: 0.4303 Class12: 0.3925 

100%|██████████| 8/8 [00:33<00:00,  4.13s/it]


--IoU Scores Valid--
Class0: 0.2625 Class1: 0.4658 Class2: 0.2133 Class3: 0.3709 Class4: 0.4845 Class5: 0.3010 Class6: 0.3618 
Class7: 0.2447 Class8: 0.3052 Class9: 0.4970 Class10: 0.2803 Class11: 0.3739 Class12: 0.3800 
Epoch3
Train Loss: 0.4564221177782331, Train mIoU Score: 0.3803
Validation Loss: 0.5285428613424301, Validation mIoU Score: 0.3493
___________________________________________________________________________________________



100%|██████████| 35/35 [02:24<00:00,  4.14s/it]


--IoU Scores Train--
Class0: 0.4049 Class1: 0.4071 Class2: 0.4243 Class3: 0.3877 Class4: 0.4170 Class5: 0.4360 Class6: 0.3935 
Class7: 0.4225 Class8: 0.4634 Class9: 0.4129 Class10: 0.4515 Class11: 0.4668 Class12: 0.4268 

100%|██████████| 8/8 [00:23<00:00,  2.88s/it]


--IoU Scores Valid--
Class0: 0.2615 Class1: 0.3927 Class2: 0.2104 Class3: 0.3339 Class4: 0.4309 Class5: 0.2779 Class6: 0.3187 
Class7: 0.2011 Class8: 0.2966 Class9: 0.4364 Class10: 0.2497 Class11: 0.3480 Class12: 0.3574 
Epoch4
Train Loss: 0.3920575669833592, Train mIoU Score: 0.4242
Validation Loss: 0.824469156563282, Validation mIoU Score: 0.3166
___________________________________________________________________________________________



100%|██████████| 35/35 [02:23<00:00,  4.11s/it]


--IoU Scores Train--
Class0: 0.4640 Class1: 0.4520 Class2: 0.4653 Class3: 0.4362 Class4: 0.4554 Class5: 0.4798 Class6: 0.4417 
Class7: 0.4778 Class8: 0.5077 Class9: 0.4431 Class10: 0.4922 Class11: 0.4966 Class12: 0.4487 

100%|██████████| 8/8 [00:28<00:00,  3.62s/it]

--IoU Scores Valid--
Class0: 0.3095 Class1: 0.4807 Class2: 0.2571 Class3: 0.3852 Class4: 0.5061 Class5: 0.3378 Class6: 0.3876 
Class7: 0.2689 Class8: 0.3391 Class9: 0.4990 Class10: 0.2983 Class11: 0.4052 Class12: 0.4349 
Epoch5
Train Loss: 0.35549231001308984, Train mIoU Score: 0.4662
Validation Loss: 0.5135640799999237, Validation mIoU Score: 0.3776
___________________________________________________________________________________________






In [15]:
# with torch.no_grad():
#     model.eval()
#     result = []
#     for images in tqdm(valid_dataloader):
#         images = images.float().to(device)
#         outputs = model(images)
#         outputs = torch.softmax(outputs, dim=1).cpu()
#         outputs = torch.argmax(outputs, dim=1).numpy()
#         for class_id in range(N_CLASSES):
#             iou = calculate_iou_per_class(np.array(masks.cpu()), np.array(outputs), class_id)
#             result.append(iou)

#     result = np.array(result).reshape(N_CLASSES, -1)
#     result = np.mean(result, axis=1)

In [16]:
# import random
# torch.cuda.empty_cache()

# for epoch in range(EP):
#     # 클래스별 IoU를 누적할 리스트 초기화
#     train_class_ious = []
#     # 학습
#     model.train()
#     epoch_loss = 0
#     for images in tqdm(target_dataloader):
#         images = images.float().to(device)

#         optimizer.zero_grad()
#         _, outputs = model(images)
#         target_domain = torch.zeros_like(outputs).to(device)
#         loss = domain_criterion(outputs, target_domain)
#         loss.backward()
#         optimizer.step()
        
#         epoch_loss += loss.item()

#         avg_domain_loss = epoch_loss / len(target_dataloader)
#     print(f"Epoch [{epoch + 1}/{EP}] - Domain Loss: {avg_domain_loss:.4f}")


In [17]:
# with torch.no_grad():
#     model.eval()
#     result = []
#     for images in tqdm(valid_dataloader):
#         images = images.float().to(device)
#         outputs = model(images)
#         outputs = torch.softmax(outputs, dim=1).cpu()
#         outputs = torch.argmax(outputs, dim=1).numpy()
#         for class_id in range(N_CLASSES):
#             iou = calculate_iou_per_class(np.array(masks.cpu()), np.array(outputs), class_id)
#             result.append(iou)

#     result = np.array(result).reshape(N_CLASSES, -1)
#     result = np.mean(result, axis=1)

## Inference

In [18]:
# test_dataset = CustomDataset(csv_file='./test.csv', transform=transform, infer=True)
# test_dataloader = DataLoader(test_dataset, batch_size=16, shuffle=False, num_workers=4)

In [19]:
# with torch.no_grad():
#     model.eval()
#     result = []
#     for images in tqdm(test_dataloader):
#         images = images.float().to(device)
#         outputs = model(images)
#         outputs = torch.softmax(outputs, dim=1).cpu()
#         outputs = torch.argmax(outputs, dim=1).numpy()
#         # batch에 존재하는 각 이미지에 대해서 반복
#         for pred in outputs:
#             pred = pred.astype(np.uint8)
#             pred = Image.fromarray(pred) # 이미지로 변환
#             pred = pred.resize((960, 540), Image.NEAREST) # 960 x 540 사이즈로 변환
#             pred = np.array(pred) # 다시 수치로 변환
#             # class 0 ~ 11에 해당하는 경우에 마스크 형성 / 12(배경)는 제외하고 진행
#             for class_id in range(12):
#                 class_mask = (pred == class_id).astype(np.uint8)
#                 if np.sum(class_mask) > 0: # 마스크가 존재하는 경우 encode
#                     mask_rle = rle_encode(class_mask)
#                     result.append(mask_rle)
#                 else: # 마스크가 존재하지 않는 경우 -1
#                     result.append(-1)
        

## Submission

In [20]:
# submit = pd.read_csv('./sample_submission.csv')
# submit['mask_rle'] = result
# submit

In [21]:
# submit.to_csv('./baseline_submit.csv', index=False)