<a href="https://colab.research.google.com/github/R12942159/DeepLearning/blob/main/DLCV_hw1_p3_deeplabv3.ipynb" target="_parent"><img src="https://colab.research.google.com/assets/colab-badge.svg" alt="Open In Colab"/></a>

In [1]:
from google.colab import drive
drive.mount('/content/drive')

Mounted at /content/drive


In [2]:
import torch


# Get cuda from GPU device for training.
device = "cuda" if torch.cuda.is_available() else "cpu"
print(f"Using: {device}")

Using: cuda


In [3]:
import os


train_paths = '/content/drive/MyDrive/NTU_DLCV/hw1/p3_data/train'
img_paths_train = sorted([os.path.join(train_paths, i) for i in os.listdir(train_paths) if i.endswith('.jpg')])
mask_paths_train = sorted([os.path.join(train_paths, i) for i in os.listdir(train_paths) if i.endswith('.png')])

val_paths = '/content/drive/MyDrive/NTU_DLCV/hw1/p3_data/validation'
img_paths_val = sorted([os.path.join(val_paths, i) for i in os.listdir(val_paths) if i.endswith('.jpg')])
mask_paths_val = sorted([os.path.join(val_paths, i) for i in os.listdir(val_paths) if i.endswith('.png')])

In [4]:
len(img_paths_train), len(mask_paths_train), len(img_paths_val), len(mask_paths_val)

(2000, 2000, 257, 257)

In [5]:
import torch
import random
import numpy as np
from PIL import Image
from copy import deepcopy
from torchvision.transforms.functional import hflip, vflip, to_tensor, normalize


class LandDataset(torch.utils.data.Dataset):
    def __init__(self, img_paths, mask_paths, transform, mode, augment=False):
        self.img_paths = img_paths
        self.mask_paths = mask_paths
        self.transform = transform
        self.mode = mode

        # Data Augmentation
        def original(x): return x
        if augment:
            self.augment = [original, hflip, vflip]
        else:
            self.augment = [original]

        # double check the len of img and mask.
        assert len(self.img_paths) == len(self.mask_paths)

    def __len__(self):
        return len(self.img_paths)

    def __getitem__(self, idx):
        # get img path
        img_path = self.img_paths[idx]
        # Read img
        img = Image.open(img_path).convert('RGB')
        # Normalize Image with VGG16's mean and std
        # (H, W, C) -> (C, H, W)
        img = self.transform(img)

        if self.mode != 'test':
            # get mask path
            mask_path = self.mask_paths[idx]
            mask = Image.open(mask_path).convert('RGB')
            mask = np.array(mask)
            # Binarize mask from [0~255] to (0 or 1)
            mask = (mask >= 128).astype(int)

            # squeeze [a,b,c] into [x,y] with 7 category(6 classes + 1 background)
            mask = 100 * mask[:, :, 0] + 10 * mask[:, :, 1] + 1 * mask[:, :, 2]
            raw_mask = deepcopy(mask) # Only perform numerical conversion on the most original data
            mask[raw_mask == 11] = 0  # (Cyan: 011) Urban land
            mask[raw_mask == 110] = 1  # (Yellow: 110) Agriculture land
            mask[raw_mask == 101] = 2  # (Purple: 101) Rangeland
            mask[raw_mask == 10] = 3  # (Green: 010) Forest land
            mask[raw_mask == 1] = 4  # (Blue: 001) Water
            mask[raw_mask == 111] = 5  # (White: 111) Barren land
            mask[raw_mask == 0] = 6  # (Black: 000) Unknown
            mask = torch.tensor(mask)

            # random Data Augmentation
            augmentor = random.choice(self.augment)
            img = augmentor(img)
            mask = augmentor(mask)

            # mask = mask.to(torch.float)  # 将目标标签转换为浮点数类型
            return img, mask
        else:
            return img

In [6]:
import torchvision.transforms as tr


# IMG_SIZE : 512*512
BATCH_SIZE = 4

# https://pytorch.org/vision/main/models/generated/torchvision.models.segmentation.deeplabv3_resnet50.html#torchvision.models.segmentation.deeplabv3_resnet50
mean=[0.485, 0.456, 0.406]
std=[0.229, 0.224, 0.225]

train_ds = LandDataset(img_paths_train,
                       mask_paths_train,
                       transform = tr.Compose([
                          tr.ToTensor(),
                          tr.Normalize(mean=mean, std=std),
                          ]),
                       mode = 'train',
                       augment = True,)
val_ds = LandDataset(img_paths_val,
                     mask_paths_val,
                     transform = tr.Compose([
                          tr.ToTensor(),
                          tr.Normalize(mean=mean, std=std),
                          ]),
                     mode = 'val',
                     augment = False,)

# num_workers > 0: accelerate loading data by muli-process
train_loader = torch.utils.data.DataLoader(train_ds, BATCH_SIZE, shuffle=True, num_workers=6)
val_loader = torch.utils.data.DataLoader(val_ds, BATCH_SIZE*2, shuffle=False, num_workers=6)

In [7]:
from torchvision.models.segmentation.deeplabv3 import deeplabv3_resnet50, deeplabv3_resnet101, DeepLabHead, FCNHead


# https://pytorch.org/hub/pytorch_vision_deeplabv3_resnet101/
# output['out'] contains the semantic masks, and output['aux'] contains the auxiliary loss values per-pixel
# https://pytorch.org/vision/main/_modules/torchvision/models/segmentation/deeplabv3.html#deeplabv3_resnet50
def deeplabv3(mode, num_classes=7):
    if mode == 'resnet101':
        model =  deeplabv3_resnet101(pretrained=True)
        # DeepLabHead在处理复杂场景、小物体和物体边缘时通常表现更好,
        # ASPP-Conv2d(256, 256, 3, padding=1, bias=False)-nn.BatchNorm2d(256)-nn.ReLU()-nn.Conv2d(256, num_classes, 1)
        model.aux_classifier = FCNHead(1024, num_classes)
        model.classifier = DeepLabHead(2048, num_classes)
    elif mode == 'resnet50':
        model = deeplabv3_resnet50(pretrained=True)
        model.aux_classifier = FCNHead(1024, num_classes)
        model.classifier = DeepLabHead(2048, num_classes)

    return model

In [8]:
def mean_iou_score(pred, labels, num_classes=6):
    '''
    Compute mean IoU score over 6 classes
    '''
    mean_iou = []
    for i in range(num_classes):
        tp_fp = torch.sum(pred == i)
        tp_fn = torch.sum(labels == i)
        tp = torch.sum((pred == i) * (labels == i))
        # avoid nan
        if (tp_fp + tp_fn - tp) == 0:
            # iou = 0.
            continue
        else:
            iou = tp / (tp_fp + tp_fn - tp)
        mean_iou.append(iou)

    return sum(mean_iou) / len(mean_iou)

In [9]:
from tqdm import tqdm


def train(dataloader, model, loss_fn, optimizer):
    size = len(dataloader.dataset) # number of samples
    num_batches = len(dataloader) # batches per epoch
    model.train() # to training mode.
    epoch_loss, epoch_iou = 0, 0
    for batch_i, (x, y) in enumerate(tqdm(dataloader, leave=False)):
        x, y = x.to(device, non_blocking=True), y.to(device, non_blocking=True) # move data to GPU

        # Compute prediction loss
        pred = model(x)
        pred_out, pred_aux = pred['out'], pred['aux']
        loss = loss_fn(pred_out, y) + loss_fn(pred_aux, y)
        # Optimization by gradients
        optimizer.zero_grad() # set prevision gradient to 0
        loss.backward() # backpropagation to compute gradients
        optimizer.step() # update model params
        # scheduler.step()

        pred_out = torch.argmax(pred_out, dim=1) # 沿着通道维度选择具有最高分数的通道
        pred_out = pred_out.to(torch.float)  # 将目标标签转换为浮点数类型
        # log
        epoch_loss += loss.item() # tensor -> python value
        epoch_iou += mean_iou_score(pred_out, y).item()

    # return avg loss of epoch, iou of epoch
    return epoch_loss/num_batches, epoch_iou/num_batches


def test(dataloader, model, loss_fn):
    size = len(dataloader.dataset) # number of samples
    num_batches = len(dataloader) # batches per epoch

    model.eval() # model to test mode.
    epoch_loss = 0
    epoch_iou = 0
    # No gradient for test data
    with torch.no_grad():
        for batch_i, (x, y) in enumerate(dataloader):
            x, y = x.to(device), y.to(device)

            # Compute prediction loss
            pred = model(x)
            pred = pred['out']
            loss = loss_fn(pred, y)

            pred = torch.argmax(pred, dim=1) # 沿着通道维度选择具有最高分数的通道
            pred = pred.to(torch.float)  # 将目标标签转换为浮点数类型

            # write to logs
            epoch_loss += loss.item()
            epoch_iou += mean_iou_score(pred, y).item()

    return epoch_loss/num_batches, epoch_iou/num_batches

#### Cross Entropy Loss

\begin{align}
L_{ce,i} \quad = \quad
\begin{cases}
  & -log(p_i)   \qquad, \text{ if } y_i= 1\\
  & -log(1-p_i) \; \;    ,\text{ if } y_i=0
\end{cases}
    \end{align}
#### Focal Loss

\begin{align}
L_{focal,i} \quad = \quad
\begin{cases}
  & -\alpha (1-p_i)^rlog(p_i)   \qquad     ,\text{ if } y_i= 1\\
  & -(1-\alpha)p_i^rlog(1-p_i)  \ \ \ \,   ,\text{ if } y_i=0
\end{cases}
    \end{align}

In [10]:
# ref. https://blog.csdn.net/qq_39732684/article/details/105794637
from torch import nn


class focal_loss(nn.Module):
    def __init__(self, alpha=0.25, gamma=2): # Assume that the positive and negative sample ratio is 3:1
        super(focal_loss, self).__init__()
        self.alpha = alpha
        self.gamma = gamma
        self.CrossEntropyLoss = nn.CrossEntropyLoss(ignore_index=6) # 用于指定在计算损失时应忽略的类别索引,参数被设置为背景类别的索引，以确保这些像素不会影响模型的训练

    def forward(self, preds, labels):
        Lce = -self.CrossEntropyLoss(preds, labels) # log(pi) or log(1-pi)
        Lfocal = -1 * (self.alpha) * ((1-torch.exp(Lce)) ** self.gamma) * Lce

        return Lfocal

In [11]:
from torch.optim.lr_scheduler import StepLR


EPOCHS = 100
logs = {
    'train_loss': [], 'val_loss': [],
    'train_mean_iou': [], 'val_mean_iou': [],
}

model = deeplabv3(mode='resnet101')
model = model.to(device)
loss_fn = focal_loss()
optimizer = torch.optim.Adam(model.parameters(), lr=5e-5)
# citaion: Encoder-Decoder with Atrous Separable Convolution for Semantic Image Segmentation(Liang-Chieh Chen, Yukun Zhu, George Papandreou, Florian Schroff, and Hartwig Adam)
# optimizer = torch.optim.SGD(model.parameters(), lr=0.05, momentum=0.9, weight_decay=4e-5)
# scheduler = StepLR(optimizer, step_size=2, gamma=0.94) # 每2个周期衰减一次, 衰减率为0.94


# Earlystopping
patience = 5
counter = 0
best_IOU = 0

for epoch in tqdm(range(EPOCHS)):
    train_loss, train_mean_iou = train(train_loader, model, loss_fn, optimizer)
    val_loss, val_mean_iou = test(val_loader, model, loss_fn)
    logs['train_loss'].append(train_loss)
    logs['val_loss'].append(val_loss)
    logs['train_mean_iou'].append(train_mean_iou)
    logs['val_mean_iou'].append(val_mean_iou)

    print(f'EPOCH: {(epoch+1):04d} train_loss: {train_loss:.4f} val_loss: {val_loss:.4f}, train_mean_iou: {train_mean_iou:.3f}, val_mean_iou: {val_mean_iou:.3f}')

    # On epoch end
    torch.save(model.state_dict(), f"/content/drive/MyDrive/NTU_DLCV/hw1/p3_data/deeplabv3_result/restnet101_{epoch+1}model.pth")
    # check improvement
    if best_IOU < val_mean_iou:
        counter = 0
        best_IOU = val_mean_iou
        torch.save(model.state_dict(), "deeplabv3_restnet101_BestIOU.pth")
        print('Best_IOU saved!')
    else:
        counter += 1
    if counter >= patience:
        print("Earlystop!")
        break

Downloading: "https://download.pytorch.org/models/deeplabv3_resnet101_coco-586e9e4e.pth" to /root/.cache/torch/hub/checkpoints/deeplabv3_resnet101_coco-586e9e4e.pth
100%|██████████| 233M/233M [00:00<00:00, 356MB/s]
  0%|          | 0/100 [00:00<?, ?it/s]
  0%|          | 0/500 [00:00<?, ?it/s][A
  0%|          | 1/500 [00:13<1:48:20, 13.03s/it][A
  0%|          | 2/500 [00:13<47:27,  5.72s/it]  [A
  1%|          | 3/500 [00:14<28:01,  3.38s/it][A
  1%|          | 4/500 [00:14<18:53,  2.29s/it][A
  1%|          | 5/500 [00:15<13:50,  1.68s/it][A
  1%|          | 6/500 [00:16<10:48,  1.31s/it][A
  1%|▏         | 7/500 [00:16<08:53,  1.08s/it][A
  2%|▏         | 8/500 [00:17<07:37,  1.08it/s][A
  2%|▏         | 9/500 [00:17<06:46,  1.21it/s][A
  2%|▏         | 10/500 [00:18<06:11,  1.32it/s][A
  2%|▏         | 11/500 [00:19<05:47,  1.41it/s][A
  2%|▏         | 12/500 [00:19<05:30,  1.48it/s][A
  3%|▎         | 13/500 [00:44<1:03:46,  7.86s/it][A
  3%|▎         | 14/500 [00:4

EPOCH: 0001 train_loss: 0.2161 val_loss: 0.0212, train_mean_iou: 0.300, val_mean_iou: 0.457


  1%|          | 1/100 [06:18<10:25:20, 378.99s/it]

Best_IOU saved!



  0%|          | 0/500 [00:00<?, ?it/s][A
  0%|          | 1/500 [00:00<08:01,  1.04it/s][A
  0%|          | 2/500 [00:01<06:14,  1.33it/s][A
  1%|          | 3/500 [00:02<05:40,  1.46it/s][A
  1%|          | 4/500 [00:02<05:24,  1.53it/s][A
  1%|          | 5/500 [00:03<05:15,  1.57it/s][A
  1%|          | 6/500 [00:04<05:10,  1.59it/s][A
  1%|▏         | 7/500 [00:04<05:06,  1.61it/s][A
  2%|▏         | 8/500 [00:05<05:04,  1.62it/s][A
  2%|▏         | 9/500 [00:05<05:02,  1.63it/s][A
  2%|▏         | 10/500 [00:06<04:59,  1.63it/s][A
  2%|▏         | 11/500 [00:07<04:59,  1.63it/s][A
  2%|▏         | 12/500 [00:07<04:57,  1.64it/s][A
  3%|▎         | 13/500 [00:08<04:56,  1.64it/s][A
  3%|▎         | 14/500 [00:08<04:56,  1.64it/s][A
  3%|▎         | 15/500 [00:09<04:56,  1.64it/s][A
  3%|▎         | 16/500 [00:10<04:55,  1.64it/s][A
  3%|▎         | 17/500 [00:10<04:54,  1.64it/s][A
  4%|▎         | 18/500 [00:11<04:53,  1.64it/s][A
  4%|▍         | 19/500 [00:1

EPOCH: 0002 train_loss: 0.0965 val_loss: 0.0176, train_mean_iou: 0.377, val_mean_iou: 0.485


  2%|▏         | 2/100 [11:38<9:21:57, 344.05s/it] 

Best_IOU saved!



  0%|          | 0/500 [00:00<?, ?it/s][A
  0%|          | 1/500 [00:00<07:56,  1.05it/s][A
  0%|          | 2/500 [00:01<06:15,  1.33it/s][A
  1%|          | 3/500 [00:02<05:42,  1.45it/s][A
  1%|          | 4/500 [00:02<05:25,  1.52it/s][A
  1%|          | 5/500 [00:03<05:16,  1.56it/s][A
  1%|          | 6/500 [00:04<05:10,  1.59it/s][A
  1%|▏         | 7/500 [00:04<05:06,  1.61it/s][A
  2%|▏         | 8/500 [00:05<05:04,  1.62it/s][A
  2%|▏         | 9/500 [00:05<05:01,  1.63it/s][A
  2%|▏         | 10/500 [00:06<05:00,  1.63it/s][A
  2%|▏         | 11/500 [00:07<04:58,  1.64it/s][A
  2%|▏         | 12/500 [00:07<04:57,  1.64it/s][A
  3%|▎         | 13/500 [00:08<04:56,  1.64it/s][A
  3%|▎         | 14/500 [00:08<04:55,  1.64it/s][A
  3%|▎         | 15/500 [00:09<04:55,  1.64it/s][A
  3%|▎         | 16/500 [00:10<04:55,  1.64it/s][A
  3%|▎         | 17/500 [00:10<04:54,  1.64it/s][A
  4%|▎         | 18/500 [00:11<04:53,  1.64it/s][A
  4%|▍         | 19/500 [00:1

EPOCH: 0003 train_loss: 0.0717 val_loss: 0.0241, train_mean_iou: 0.393, val_mean_iou: 0.479


  3%|▎         | 3/100 [16:57<8:57:32, 332.50s/it]
  0%|          | 0/500 [00:00<?, ?it/s][A
  0%|          | 1/500 [00:00<07:56,  1.05it/s][A
  0%|          | 2/500 [00:01<06:14,  1.33it/s][A
  1%|          | 3/500 [00:02<05:39,  1.46it/s][A
  1%|          | 4/500 [00:02<05:24,  1.53it/s][A
  1%|          | 5/500 [00:03<05:16,  1.57it/s][A
  1%|          | 6/500 [00:03<05:10,  1.59it/s][A
  1%|▏         | 7/500 [00:04<05:06,  1.61it/s][A
  2%|▏         | 8/500 [00:05<05:04,  1.62it/s][A
  2%|▏         | 9/500 [00:05<05:02,  1.63it/s][A
  2%|▏         | 10/500 [00:06<05:00,  1.63it/s][A
  2%|▏         | 11/500 [00:07<04:58,  1.64it/s][A
  2%|▏         | 12/500 [00:07<04:57,  1.64it/s][A
  3%|▎         | 13/500 [00:08<04:57,  1.64it/s][A
  3%|▎         | 14/500 [00:08<04:56,  1.64it/s][A
  3%|▎         | 15/500 [00:09<04:56,  1.64it/s][A
  3%|▎         | 16/500 [00:10<04:55,  1.64it/s][A
  3%|▎         | 17/500 [00:10<04:54,  1.64it/s][A
  4%|▎         | 18/500 [00:11<

EPOCH: 0004 train_loss: 0.0604 val_loss: 0.0113, train_mean_iou: 0.411, val_mean_iou: 0.521


  4%|▍         | 4/100 [22:16<8:43:41, 327.31s/it]

Best_IOU saved!



  0%|          | 0/500 [00:00<?, ?it/s][A
  0%|          | 1/500 [00:00<07:42,  1.08it/s][A
  0%|          | 2/500 [00:01<06:08,  1.35it/s][A
  1%|          | 3/500 [00:02<05:37,  1.47it/s][A
  1%|          | 4/500 [00:02<05:23,  1.53it/s][A
  1%|          | 5/500 [00:03<05:15,  1.57it/s][A
  1%|          | 6/500 [00:03<05:09,  1.59it/s][A
  1%|▏         | 7/500 [00:04<05:06,  1.61it/s][A
  2%|▏         | 8/500 [00:05<05:03,  1.62it/s][A
  2%|▏         | 9/500 [00:05<05:01,  1.63it/s][A
  2%|▏         | 10/500 [00:06<05:00,  1.63it/s][A
  2%|▏         | 11/500 [00:07<04:59,  1.63it/s][A
  2%|▏         | 12/500 [00:07<04:57,  1.64it/s][A
  3%|▎         | 13/500 [00:08<04:56,  1.64it/s][A
  3%|▎         | 14/500 [00:08<04:55,  1.64it/s][A
  3%|▎         | 15/500 [00:09<04:54,  1.65it/s][A
  3%|▎         | 16/500 [00:10<04:54,  1.64it/s][A
  3%|▎         | 17/500 [00:10<04:54,  1.64it/s][A
  4%|▎         | 18/500 [00:11<04:53,  1.64it/s][A
  4%|▍         | 19/500 [00:1

EPOCH: 0005 train_loss: 0.0496 val_loss: 0.0220, train_mean_iou: 0.433, val_mean_iou: 0.522


  5%|▌         | 5/100 [27:36<8:33:55, 324.59s/it]

Best_IOU saved!



  0%|          | 0/500 [00:00<?, ?it/s][A
  0%|          | 1/500 [00:00<07:54,  1.05it/s][A
  0%|          | 2/500 [00:01<06:15,  1.33it/s][A
  1%|          | 3/500 [00:02<05:42,  1.45it/s][A
  1%|          | 4/500 [00:02<05:26,  1.52it/s][A
  1%|          | 5/500 [00:03<05:17,  1.56it/s][A
  1%|          | 6/500 [00:04<05:11,  1.59it/s][A
  1%|▏         | 7/500 [00:04<05:07,  1.60it/s][A
  2%|▏         | 8/500 [00:05<05:05,  1.61it/s][A
  2%|▏         | 9/500 [00:05<05:02,  1.62it/s][A
  2%|▏         | 10/500 [00:06<05:00,  1.63it/s][A
  2%|▏         | 11/500 [00:07<04:59,  1.63it/s][A
  2%|▏         | 12/500 [00:07<04:58,  1.64it/s][A
  3%|▎         | 13/500 [00:08<04:57,  1.64it/s][A
  3%|▎         | 14/500 [00:08<04:57,  1.64it/s][A
  3%|▎         | 15/500 [00:09<04:56,  1.64it/s][A
  3%|▎         | 16/500 [00:10<04:56,  1.63it/s][A
  3%|▎         | 17/500 [00:10<04:56,  1.63it/s][A
  4%|▎         | 18/500 [00:11<04:55,  1.63it/s][A
  4%|▍         | 19/500 [00:1

EPOCH: 0006 train_loss: 0.0456 val_loss: 0.1840, train_mean_iou: 0.433, val_mean_iou: 0.411


  6%|▌         | 6/100 [32:55<8:25:42, 322.79s/it]
  0%|          | 0/500 [00:00<?, ?it/s][A
  0%|          | 1/500 [00:00<08:05,  1.03it/s][A
  0%|          | 2/500 [00:01<06:18,  1.32it/s][A
  1%|          | 3/500 [00:02<05:43,  1.45it/s][A
  1%|          | 4/500 [00:02<05:27,  1.51it/s][A
  1%|          | 5/500 [00:03<05:17,  1.56it/s][A
  1%|          | 6/500 [00:04<05:11,  1.59it/s][A
  1%|▏         | 7/500 [00:04<05:08,  1.60it/s][A
  2%|▏         | 8/500 [00:05<05:05,  1.61it/s][A
  2%|▏         | 9/500 [00:05<05:03,  1.62it/s][A
  2%|▏         | 10/500 [00:06<05:01,  1.62it/s][A
  2%|▏         | 11/500 [00:07<04:59,  1.63it/s][A
  2%|▏         | 12/500 [00:07<04:58,  1.63it/s][A
  3%|▎         | 13/500 [00:08<04:57,  1.64it/s][A
  3%|▎         | 14/500 [00:08<04:56,  1.64it/s][A
  3%|▎         | 15/500 [00:09<04:55,  1.64it/s][A
  3%|▎         | 16/500 [00:10<04:54,  1.64it/s][A
  3%|▎         | 17/500 [00:10<04:54,  1.64it/s][A
  4%|▎         | 18/500 [00:11<

EPOCH: 0007 train_loss: 0.0393 val_loss: 0.0355, train_mean_iou: 0.443, val_mean_iou: 0.508


  7%|▋         | 7/100 [38:14<8:18:29, 321.61s/it]
  0%|          | 0/500 [00:00<?, ?it/s][A
  0%|          | 1/500 [00:01<08:18,  1.00it/s][A
  0%|          | 2/500 [00:01<06:23,  1.30it/s][A
  1%|          | 3/500 [00:02<05:46,  1.43it/s][A
  1%|          | 4/500 [00:02<05:29,  1.51it/s][A
  1%|          | 5/500 [00:03<05:18,  1.56it/s][A
  1%|          | 6/500 [00:04<05:12,  1.58it/s][A
  1%|▏         | 7/500 [00:04<05:08,  1.60it/s][A
  2%|▏         | 8/500 [00:05<05:05,  1.61it/s][A
  2%|▏         | 9/500 [00:05<05:02,  1.62it/s][A
  2%|▏         | 10/500 [00:06<05:01,  1.63it/s][A
  2%|▏         | 11/500 [00:07<04:59,  1.64it/s][A
  2%|▏         | 12/500 [00:07<04:58,  1.64it/s][A
  3%|▎         | 13/500 [00:08<04:57,  1.64it/s][A
  3%|▎         | 14/500 [00:08<04:56,  1.64it/s][A
  3%|▎         | 15/500 [00:09<04:55,  1.64it/s][A
  3%|▎         | 16/500 [00:10<04:55,  1.64it/s][A
  3%|▎         | 17/500 [00:10<04:54,  1.64it/s][A
  4%|▎         | 18/500 [00:11<

EPOCH: 0008 train_loss: 0.0385 val_loss: 0.1338, train_mean_iou: 0.450, val_mean_iou: 0.445


  8%|▊         | 8/100 [43:34<8:11:57, 320.85s/it]
  0%|          | 0/500 [00:00<?, ?it/s][A
  0%|          | 1/500 [00:00<07:56,  1.05it/s][A
  0%|          | 2/500 [00:01<06:15,  1.32it/s][A
  1%|          | 3/500 [00:02<05:42,  1.45it/s][A
  1%|          | 4/500 [00:02<05:24,  1.53it/s][A
  1%|          | 5/500 [00:03<05:15,  1.57it/s][A
  1%|          | 6/500 [00:03<05:09,  1.59it/s][A
  1%|▏         | 7/500 [00:04<05:07,  1.60it/s][A
  2%|▏         | 8/500 [00:05<05:04,  1.62it/s][A
  2%|▏         | 9/500 [00:05<05:01,  1.63it/s][A
  2%|▏         | 10/500 [00:06<05:00,  1.63it/s][A
  2%|▏         | 11/500 [00:07<04:59,  1.63it/s][A
  2%|▏         | 12/500 [00:07<04:58,  1.64it/s][A
  3%|▎         | 13/500 [00:08<04:57,  1.64it/s][A
  3%|▎         | 14/500 [00:08<04:56,  1.64it/s][A
  3%|▎         | 15/500 [00:09<04:55,  1.64it/s][A
  3%|▎         | 16/500 [00:10<04:56,  1.63it/s][A
  3%|▎         | 17/500 [00:10<04:54,  1.64it/s][A
  4%|▎         | 18/500 [00:11<

EPOCH: 0009 train_loss: 0.0338 val_loss: 0.0150, train_mean_iou: 0.462, val_mean_iou: 0.538


  9%|▉         | 9/100 [48:53<8:06:03, 320.48s/it]

Best_IOU saved!



  0%|          | 0/500 [00:00<?, ?it/s][A
  0%|          | 1/500 [00:00<07:54,  1.05it/s][A
  0%|          | 2/500 [00:01<06:14,  1.33it/s][A
  1%|          | 3/500 [00:02<05:41,  1.45it/s][A
  1%|          | 4/500 [00:02<05:25,  1.52it/s][A
  1%|          | 5/500 [00:03<05:15,  1.57it/s][A
  1%|          | 6/500 [00:03<05:10,  1.59it/s][A
  1%|▏         | 7/500 [00:04<05:07,  1.60it/s][A
  2%|▏         | 8/500 [00:05<05:03,  1.62it/s][A
  2%|▏         | 9/500 [00:05<05:02,  1.63it/s][A
  2%|▏         | 10/500 [00:06<05:00,  1.63it/s][A
  2%|▏         | 11/500 [00:07<04:59,  1.64it/s][A
  2%|▏         | 12/500 [00:07<04:58,  1.64it/s][A
  3%|▎         | 13/500 [00:08<04:57,  1.64it/s][A
  3%|▎         | 14/500 [00:08<04:56,  1.64it/s][A
  3%|▎         | 15/500 [00:09<04:56,  1.63it/s][A
  3%|▎         | 16/500 [00:10<04:55,  1.64it/s][A
  3%|▎         | 17/500 [00:10<04:54,  1.64it/s][A
  4%|▎         | 18/500 [00:11<04:53,  1.64it/s][A
  4%|▍         | 19/500 [00:1

EPOCH: 0010 train_loss: 0.0357 val_loss: 0.0205, train_mean_iou: 0.459, val_mean_iou: 0.520


 10%|█         | 10/100 [54:12<8:00:06, 320.07s/it]
  0%|          | 0/500 [00:00<?, ?it/s][A
  0%|          | 1/500 [00:00<07:52,  1.06it/s][A
  0%|          | 2/500 [00:01<06:12,  1.34it/s][A
  1%|          | 3/500 [00:02<05:39,  1.46it/s][A
  1%|          | 4/500 [00:02<05:24,  1.53it/s][A
  1%|          | 5/500 [00:03<05:15,  1.57it/s][A
  1%|          | 6/500 [00:03<05:10,  1.59it/s][A
  1%|▏         | 7/500 [00:04<05:06,  1.61it/s][A
  2%|▏         | 8/500 [00:05<05:04,  1.62it/s][A
  2%|▏         | 9/500 [00:05<05:02,  1.62it/s][A
  2%|▏         | 10/500 [00:06<05:00,  1.63it/s][A
  2%|▏         | 11/500 [00:07<04:59,  1.63it/s][A
  2%|▏         | 12/500 [00:07<04:58,  1.64it/s][A
  3%|▎         | 13/500 [00:08<04:58,  1.63it/s][A
  3%|▎         | 14/500 [00:08<04:56,  1.64it/s][A
  3%|▎         | 15/500 [00:09<04:56,  1.64it/s][A
  3%|▎         | 16/500 [00:10<04:55,  1.64it/s][A
  3%|▎         | 17/500 [00:10<04:55,  1.64it/s][A
  4%|▎         | 18/500 [00:11

EPOCH: 0011 train_loss: 0.0304 val_loss: 0.0077, train_mean_iou: 0.465, val_mean_iou: 0.571


 11%|█         | 11/100 [59:32<7:54:34, 319.94s/it]

Best_IOU saved!



  0%|          | 0/500 [00:00<?, ?it/s][A
  0%|          | 1/500 [00:00<07:59,  1.04it/s][A
  0%|          | 2/500 [00:01<06:15,  1.33it/s][A
  1%|          | 3/500 [00:02<05:43,  1.45it/s][A
  1%|          | 4/500 [00:02<05:26,  1.52it/s][A
  1%|          | 5/500 [00:03<05:16,  1.56it/s][A
  1%|          | 6/500 [00:04<05:11,  1.59it/s][A
  1%|▏         | 7/500 [00:04<05:07,  1.60it/s][A
  2%|▏         | 8/500 [00:05<05:04,  1.62it/s][A
  2%|▏         | 9/500 [00:05<05:02,  1.62it/s][A
  2%|▏         | 10/500 [00:06<05:00,  1.63it/s][A
  2%|▏         | 11/500 [00:07<04:59,  1.63it/s][A
  2%|▏         | 12/500 [00:07<04:59,  1.63it/s][A
  3%|▎         | 13/500 [00:08<04:57,  1.64it/s][A
  3%|▎         | 14/500 [00:08<04:56,  1.64it/s][A
  3%|▎         | 15/500 [00:09<04:56,  1.64it/s][A
  3%|▎         | 16/500 [00:10<04:55,  1.64it/s][A
  3%|▎         | 17/500 [00:10<04:54,  1.64it/s][A
  4%|▎         | 18/500 [00:11<04:53,  1.64it/s][A
  4%|▍         | 19/500 [00:1

EPOCH: 0012 train_loss: 0.0252 val_loss: 0.0203, train_mean_iou: 0.476, val_mean_iou: 0.527


 12%|█▏        | 12/100 [1:04:51<7:48:53, 319.70s/it]
  0%|          | 0/500 [00:00<?, ?it/s][A
  0%|          | 1/500 [00:00<08:05,  1.03it/s][A
  0%|          | 2/500 [00:01<06:19,  1.31it/s][A
  1%|          | 3/500 [00:02<05:43,  1.45it/s][A
  1%|          | 4/500 [00:02<05:26,  1.52it/s][A
  1%|          | 5/500 [00:03<05:16,  1.57it/s][A
  1%|          | 6/500 [00:04<05:10,  1.59it/s][A
  1%|▏         | 7/500 [00:04<05:07,  1.60it/s][A
  2%|▏         | 8/500 [00:05<05:04,  1.62it/s][A
  2%|▏         | 9/500 [00:05<05:02,  1.62it/s][A
  2%|▏         | 10/500 [00:06<05:01,  1.63it/s][A
  2%|▏         | 11/500 [00:07<04:59,  1.63it/s][A
  2%|▏         | 12/500 [00:07<04:59,  1.63it/s][A
  3%|▎         | 13/500 [00:08<04:58,  1.63it/s][A
  3%|▎         | 14/500 [00:08<04:57,  1.63it/s][A
  3%|▎         | 15/500 [00:09<04:57,  1.63it/s][A
  3%|▎         | 16/500 [00:10<04:56,  1.63it/s][A
  3%|▎         | 17/500 [00:10<04:55,  1.64it/s][A
  4%|▎         | 18/500 [00:

EPOCH: 0013 train_loss: 0.0225 val_loss: 0.0117, train_mean_iou: 0.487, val_mean_iou: 0.570


 13%|█▎        | 13/100 [1:10:10<7:43:14, 319.48s/it]
  0%|          | 0/500 [00:00<?, ?it/s][A
  0%|          | 1/500 [00:00<07:49,  1.06it/s][A
  0%|          | 2/500 [00:01<06:09,  1.35it/s][A
  1%|          | 3/500 [00:02<05:39,  1.46it/s][A
  1%|          | 4/500 [00:02<05:24,  1.53it/s][A
  1%|          | 5/500 [00:03<05:15,  1.57it/s][A
  1%|          | 6/500 [00:03<05:09,  1.60it/s][A
  1%|▏         | 7/500 [00:04<05:05,  1.61it/s][A
  2%|▏         | 8/500 [00:05<05:03,  1.62it/s][A
  2%|▏         | 9/500 [00:05<05:01,  1.63it/s][A
  2%|▏         | 10/500 [00:06<04:59,  1.64it/s][A
  2%|▏         | 11/500 [00:07<04:58,  1.64it/s][A
  2%|▏         | 12/500 [00:07<04:57,  1.64it/s][A
  3%|▎         | 13/500 [00:08<04:56,  1.64it/s][A
  3%|▎         | 14/500 [00:08<04:56,  1.64it/s][A
  3%|▎         | 15/500 [00:09<04:56,  1.64it/s][A
  3%|▎         | 16/500 [00:10<04:54,  1.64it/s][A
  3%|▎         | 17/500 [00:10<04:54,  1.64it/s][A
  4%|▎         | 18/500 [00:

EPOCH: 0014 train_loss: 0.0253 val_loss: 0.0410, train_mean_iou: 0.483, val_mean_iou: 0.498


 14%|█▍        | 14/100 [1:15:29<7:37:32, 319.21s/it]
  0%|          | 0/500 [00:00<?, ?it/s][A
  0%|          | 1/500 [00:00<07:52,  1.06it/s][A
  0%|          | 2/500 [00:01<06:13,  1.34it/s][A
  1%|          | 3/500 [00:02<05:40,  1.46it/s][A
  1%|          | 4/500 [00:02<05:24,  1.53it/s][A
  1%|          | 5/500 [00:03<05:15,  1.57it/s][A
  1%|          | 6/500 [00:03<05:10,  1.59it/s][A
  1%|▏         | 7/500 [00:04<05:06,  1.61it/s][A
  2%|▏         | 8/500 [00:05<05:04,  1.62it/s][A
  2%|▏         | 9/500 [00:05<05:03,  1.62it/s][A
  2%|▏         | 10/500 [00:06<05:00,  1.63it/s][A
  2%|▏         | 11/500 [00:07<04:58,  1.64it/s][A
  2%|▏         | 12/500 [00:07<04:57,  1.64it/s][A
  3%|▎         | 13/500 [00:08<04:57,  1.64it/s][A
  3%|▎         | 14/500 [00:08<04:55,  1.64it/s][A
  3%|▎         | 15/500 [00:09<04:55,  1.64it/s][A
  3%|▎         | 16/500 [00:10<04:54,  1.64it/s][A
  3%|▎         | 17/500 [00:10<04:54,  1.64it/s][A
  4%|▎         | 18/500 [00:

EPOCH: 0015 train_loss: 0.0210 val_loss: 0.0068, train_mean_iou: 0.491, val_mean_iou: 0.583


 15%|█▌        | 15/100 [1:20:48<7:32:17, 319.26s/it]

Best_IOU saved!



  0%|          | 0/500 [00:00<?, ?it/s][A
  0%|          | 1/500 [00:00<08:08,  1.02it/s][A
  0%|          | 2/500 [00:01<06:18,  1.32it/s][A
  1%|          | 3/500 [00:02<05:43,  1.45it/s][A
  1%|          | 4/500 [00:02<05:26,  1.52it/s][A
  1%|          | 5/500 [00:03<05:17,  1.56it/s][A
  1%|          | 6/500 [00:04<05:11,  1.58it/s][A
  1%|▏         | 7/500 [00:04<05:07,  1.60it/s][A
  2%|▏         | 8/500 [00:05<05:05,  1.61it/s][A
  2%|▏         | 9/500 [00:05<05:04,  1.61it/s][A
  2%|▏         | 10/500 [00:06<05:01,  1.63it/s][A
  2%|▏         | 11/500 [00:07<04:59,  1.63it/s][A
  2%|▏         | 12/500 [00:07<04:59,  1.63it/s][A
  3%|▎         | 13/500 [00:08<04:57,  1.63it/s][A
  3%|▎         | 14/500 [00:08<04:56,  1.64it/s][A
  3%|▎         | 15/500 [00:09<04:55,  1.64it/s][A
  3%|▎         | 16/500 [00:10<04:55,  1.64it/s][A
  3%|▎         | 17/500 [00:10<04:54,  1.64it/s][A
  4%|▎         | 18/500 [00:11<04:53,  1.64it/s][A
  4%|▍         | 19/500 [00:1

EPOCH: 0016 train_loss: 0.0166 val_loss: 0.0148, train_mean_iou: 0.506, val_mean_iou: 0.559


 16%|█▌        | 16/100 [1:26:07<7:26:50, 319.18s/it]
  0%|          | 0/500 [00:00<?, ?it/s][A
  0%|          | 1/500 [00:01<08:18,  1.00it/s][A
  0%|          | 2/500 [00:01<06:23,  1.30it/s][A
  1%|          | 3/500 [00:02<05:46,  1.44it/s][A
  1%|          | 4/500 [00:02<05:28,  1.51it/s][A
  1%|          | 5/500 [00:03<05:17,  1.56it/s][A
  1%|          | 6/500 [00:04<05:12,  1.58it/s][A
  1%|▏         | 7/500 [00:04<05:08,  1.60it/s][A
  2%|▏         | 8/500 [00:05<05:04,  1.61it/s][A
  2%|▏         | 9/500 [00:05<05:02,  1.62it/s][A
  2%|▏         | 10/500 [00:06<05:00,  1.63it/s][A
  2%|▏         | 11/500 [00:07<04:58,  1.64it/s][A
  2%|▏         | 12/500 [00:07<04:58,  1.63it/s][A
  3%|▎         | 13/500 [00:08<04:57,  1.64it/s][A
  3%|▎         | 14/500 [00:08<04:56,  1.64it/s][A
  3%|▎         | 15/500 [00:09<04:56,  1.64it/s][A
  3%|▎         | 16/500 [00:10<04:55,  1.64it/s][A
  3%|▎         | 17/500 [00:10<04:54,  1.64it/s][A
  4%|▎         | 18/500 [00:

EPOCH: 0017 train_loss: 0.0174 val_loss: 0.0225, train_mean_iou: 0.504, val_mean_iou: 0.534


 17%|█▋        | 17/100 [1:31:26<7:21:30, 319.16s/it]
  0%|          | 0/500 [00:00<?, ?it/s][A
  0%|          | 1/500 [00:00<08:01,  1.04it/s][A
  0%|          | 2/500 [00:01<06:16,  1.32it/s][A
  1%|          | 3/500 [00:02<05:42,  1.45it/s][A
  1%|          | 4/500 [00:02<05:26,  1.52it/s][A
  1%|          | 5/500 [00:03<05:16,  1.56it/s][A
  1%|          | 6/500 [00:04<05:10,  1.59it/s][A
  1%|▏         | 7/500 [00:04<05:07,  1.61it/s][A
  2%|▏         | 8/500 [00:05<05:04,  1.62it/s][A
  2%|▏         | 9/500 [00:05<05:02,  1.62it/s][A
  2%|▏         | 10/500 [00:06<05:00,  1.63it/s][A
  2%|▏         | 11/500 [00:07<04:59,  1.63it/s][A
  2%|▏         | 12/500 [00:07<04:58,  1.64it/s][A
  3%|▎         | 13/500 [00:08<04:57,  1.64it/s][A
  3%|▎         | 14/500 [00:08<04:55,  1.64it/s][A
  3%|▎         | 15/500 [00:09<04:55,  1.64it/s][A
  3%|▎         | 16/500 [00:10<04:55,  1.64it/s][A
  3%|▎         | 17/500 [00:10<04:54,  1.64it/s][A
  4%|▎         | 18/500 [00:

EPOCH: 0018 train_loss: 0.0142 val_loss: 0.0127, train_mean_iou: 0.508, val_mean_iou: 0.574


 18%|█▊        | 18/100 [1:36:45<7:16:02, 319.05s/it]
  0%|          | 0/500 [00:00<?, ?it/s][A
  0%|          | 1/500 [00:00<07:57,  1.05it/s][A
  0%|          | 2/500 [00:01<06:13,  1.33it/s][A
  1%|          | 3/500 [00:02<05:40,  1.46it/s][A
  1%|          | 4/500 [00:02<05:24,  1.53it/s][A
  1%|          | 5/500 [00:03<05:15,  1.57it/s][A
  1%|          | 6/500 [00:03<05:10,  1.59it/s][A
  1%|▏         | 7/500 [00:04<05:07,  1.60it/s][A
  2%|▏         | 8/500 [00:05<05:03,  1.62it/s][A
  2%|▏         | 9/500 [00:05<05:00,  1.63it/s][A
  2%|▏         | 10/500 [00:06<04:59,  1.63it/s][A
  2%|▏         | 11/500 [00:07<04:58,  1.64it/s][A
  2%|▏         | 12/500 [00:07<04:57,  1.64it/s][A
  3%|▎         | 13/500 [00:08<04:56,  1.64it/s][A
  3%|▎         | 14/500 [00:08<04:56,  1.64it/s][A
  3%|▎         | 15/500 [00:09<04:55,  1.64it/s][A
  3%|▎         | 16/500 [00:10<04:55,  1.64it/s][A
  3%|▎         | 17/500 [00:10<04:54,  1.64it/s][A
  4%|▎         | 18/500 [00:

EPOCH: 0019 train_loss: 0.0212 val_loss: 0.1512, train_mean_iou: 0.492, val_mean_iou: 0.531


 19%|█▉        | 19/100 [1:42:04<7:10:35, 318.96s/it]
  0%|          | 0/500 [00:00<?, ?it/s][A
  0%|          | 1/500 [00:00<08:11,  1.02it/s][A
  0%|          | 2/500 [00:01<06:19,  1.31it/s][A
  1%|          | 3/500 [00:02<05:43,  1.44it/s][A
  1%|          | 4/500 [00:02<05:26,  1.52it/s][A
  1%|          | 5/500 [00:03<05:17,  1.56it/s][A
  1%|          | 6/500 [00:04<05:11,  1.59it/s][A
  1%|▏         | 7/500 [00:04<05:07,  1.60it/s][A
  2%|▏         | 8/500 [00:05<05:04,  1.62it/s][A
  2%|▏         | 9/500 [00:05<05:02,  1.62it/s][A
  2%|▏         | 10/500 [00:06<05:00,  1.63it/s][A
  2%|▏         | 11/500 [00:07<04:59,  1.63it/s][A
  2%|▏         | 12/500 [00:07<04:58,  1.64it/s][A
  3%|▎         | 13/500 [00:08<04:57,  1.64it/s][A
  3%|▎         | 14/500 [00:08<04:56,  1.64it/s][A
  3%|▎         | 15/500 [00:09<04:55,  1.64it/s][A
  3%|▎         | 16/500 [00:10<04:55,  1.64it/s][A
  3%|▎         | 17/500 [00:10<04:55,  1.63it/s][A
  4%|▎         | 18/500 [00:

EPOCH: 0020 train_loss: 0.0175 val_loss: 0.0079, train_mean_iou: 0.503, val_mean_iou: 0.577


 19%|█▉        | 19/100 [1:47:23<7:37:48, 339.12s/it]

Earlystop!



