<a href="https://colab.research.google.com/github/R12942159/DeepLearning/blob/main/DLCV_hw1_p3_deeplabv3.ipynb" target="_parent"><img src="https://colab.research.google.com/assets/colab-badge.svg" alt="Open In Colab"/></a>

In [1]:
from google.colab import drive
drive.mount('/content/drive')

Mounted at /content/drive


In [2]:
import torch


# Get cuda from GPU device for training.
device = "cuda" if torch.cuda.is_available() else "cpu"
print(f"Using: {device}")

Using: cuda


In [3]:
import os


train_paths = '/content/drive/MyDrive/NTU_DLCV/p3_data/train'
img_paths_train = sorted([os.path.join(train_paths, i) for i in os.listdir(train_paths) if i.endswith('.jpg')])
mask_paths_train = sorted([os.path.join(train_paths, i) for i in os.listdir(train_paths) if i.endswith('.png')])

val_paths = '/content/drive/MyDrive/NTU_DLCV/p3_data/validation'
img_paths_val = sorted([os.path.join(val_paths, i) for i in os.listdir(val_paths) if i.endswith('.jpg')])
mask_paths_val = sorted([os.path.join(val_paths, i) for i in os.listdir(val_paths) if i.endswith('.png')])

In [4]:
len(img_paths_train), len(mask_paths_train), len(img_paths_val), len(mask_paths_val)

(2000, 2000, 257, 257)

In [5]:
import torch
import random
import numpy as np
from PIL import Image
from copy import deepcopy
from torchvision.transforms.functional import hflip, vflip, to_tensor, normalize


class LandDataset(torch.utils.data.Dataset):
    def __init__(self, img_paths, mask_paths, transform, mode, augment=False):
        self.img_paths = img_paths
        self.mask_paths = mask_paths
        self.transform = transform
        self.mode = mode

        # Data Augmentation
        def original(x): return x
        if augment:
            self.augment = [original, hflip, vflip]
        else:
            self.augment = [original]

        # double check the len of img and mask.
        assert len(self.img_paths) == len(self.mask_paths)

    def __len__(self):
        return len(self.img_paths)

    def __getitem__(self, idx):
        # get img path
        img_path = self.img_paths[idx]
        # Read img
        img = Image.open(img_path).convert('RGB')
        # Normalize Image with VGG16's mean and std
        # (H, W, C) -> (C, H, W)
        img = self.transform(img)

        if self.mode != 'test':
            # get mask path
            mask_path = self.mask_paths[idx]
            mask = Image.open(mask_path).convert('RGB')
            mask = np.array(mask)
            # Binarize mask from [0~255] to (0 or 1)
            mask = (mask >= 128).astype(int)

            # squeeze [a,b,c] into [x,y] with 7 category(6 classes + 1 background)
            mask = 100 * mask[:, :, 0] + 10 * mask[:, :, 1] + 1 * mask[:, :, 2]
            raw_mask = deepcopy(mask) # Only perform numerical conversion on the most original data
            mask[raw_mask == 11] = 0  # (Cyan: 011) Urban land
            mask[raw_mask == 110] = 1  # (Yellow: 110) Agriculture land
            mask[raw_mask == 101] = 2  # (Purple: 101) Rangeland
            mask[raw_mask == 10] = 3  # (Green: 010) Forest land
            mask[raw_mask == 1] = 4  # (Blue: 001) Water
            mask[raw_mask == 111] = 5  # (White: 111) Barren land
            mask[raw_mask == 0] = 6  # (Black: 000) Unknown
            mask = torch.tensor(mask)

            # random Data Augmentation
            augmentor = random.choice(self.augment)
            img = augmentor(img)
            mask = augmentor(mask)

            # mask = mask.to(torch.float)  # 将目标标签转换为浮点数类型
            return img, mask
        else:
            return img

In [6]:
import torchvision.transforms as tr


# IMG_SIZE : 512*512
BATCH_SIZE = 4

# https://pytorch.org/vision/main/models/generated/torchvision.models.segmentation.deeplabv3_resnet50.html#torchvision.models.segmentation.deeplabv3_resnet50
mean=[0.485, 0.456, 0.406]
std=[0.229, 0.224, 0.225]

train_ds = LandDataset(img_paths_train,
                       mask_paths_train,
                       transform = tr.Compose([
                          tr.ToTensor(),
                          tr.Normalize(mean=mean, std=std),
                          ]),
                       mode = 'train',
                       augment = True,)
val_ds = LandDataset(img_paths_val,
                     mask_paths_val,
                     transform = tr.Compose([
                          tr.ToTensor(),
                          tr.Normalize(mean=mean, std=std),
                          ]),
                     mode = 'val',
                     augment = False,)

# num_workers > 0: accelerate loading data by muli-process
train_loader = torch.utils.data.DataLoader(train_ds, BATCH_SIZE, shuffle=True, num_workers=4)
val_loader = torch.utils.data.DataLoader(val_ds, BATCH_SIZE*2, shuffle=False, num_workers=4)

In [7]:
from torchvision.models.segmentation.deeplabv3 import deeplabv3_resnet101, DeepLabHead, FCNHead


# https://pytorch.org/hub/pytorch_vision_deeplabv3_resnet101/
# output['out'] contains the semantic masks, and output['aux'] contains the auxiliary loss values per-pixel
def deeplabv3(mode):
    if mode == 'resnet101':
        model =  deeplabv3_resnet101(pretrained=True)
    elif mode == 'resnet50':
        model = deeplabv3_resnet50(pretrained=True)

    return model

In [8]:
def mean_iou_score(pred, labels, num_classes=6):
    '''
    Compute mean IoU score over 6 classes
    '''
    mean_iou = []
    for i in range(num_classes):
        tp_fp = torch.sum(pred == i)
        tp_fn = torch.sum(labels == i)
        tp = torch.sum((pred == i) * (labels == i))
        # avoid nan
        if (tp_fp + tp_fn - tp) == 0:
            iou = 0.
        else:
            iou = tp / (tp_fp + tp_fn - tp)
        mean_iou.append(iou)

    return sum(mean_iou) / len(mean_iou)

In [9]:
from tqdm import tqdm


def train(dataloader, model, loss_fn, optimizer):
    size = len(dataloader.dataset) # number of samples
    num_batches = len(dataloader) # batches per epoch
    model.train() # to training mode.
    epoch_loss, epoch_iou = 0, 0
    for batch_i, (x, y) in enumerate(tqdm(dataloader, leave=False)):
        x, y = x.to(device, non_blocking=True), y.to(device, non_blocking=True) # move data to GPU

        # Compute prediction loss
        pred = model(x)
        pred_out, pred_aux = pred['out'], pred['aux']
        loss = loss_fn(pred_out, y) + loss_fn(pred_aux, y)
        # Optimization by gradients
        optimizer.zero_grad() # set prevision gradient to 0
        loss.backward() # backpropagation to compute gradients
        optimizer.step() # update model params
        scheduler.step()

        pred_out = torch.argmax(pred_out, dim=1) # 沿着通道维度选择具有最高分数的通道
        pred_out = pred_out.to(torch.float)  # 将目标标签转换为浮点数类型
        # log
        epoch_loss += loss.item() # tensor -> python value
        epoch_iou += mean_iou_score(pred_out, y).item()

    # return avg loss of epoch, iou of epoch
    return epoch_loss/num_batches, epoch_iou/num_batches


def test(dataloader, model, loss_fn):
    size = len(dataloader.dataset) # number of samples
    num_batches = len(dataloader) # batches per epoch

    model.eval() # model to test mode.
    epoch_loss = 0
    epoch_iou = 0
    # No gradient for test data
    with torch.no_grad():
        for batch_i, (x, y) in enumerate(dataloader):
            x, y = x.to(device), y.to(device)

            # Compute prediction loss
            pred = model(x)
            pred = pred['out']
            loss = loss_fn(pred, y)

            pred = torch.argmax(pred, dim=1) # 沿着通道维度选择具有最高分数的通道
            pred = pred.to(torch.float)  # 将目标标签转换为浮点数类型

            # write to logs
            epoch_loss += loss.item()
            epoch_iou += mean_iou_score(pred, y).item()

    return epoch_loss/num_batches, epoch_iou/num_batches

#### Cross Entropy Loss

\begin{align}
L_{ce,i} \quad = \quad
\begin{cases}
  & -log(p_i)   \qquad, \text{ if } y_i= 1\\
  & -log(1-p_i) \; \;    ,\text{ if } y_i=0
\end{cases}
    \end{align}
#### Focal Loss

\begin{align}
L_{focal,i} \quad = \quad
\begin{cases}
  & -\alpha (1-p_i)^rlog(p_i)   \qquad     ,\text{ if } y_i= 1\\
  & -(1-\alpha)p_i^rlog(1-p_i)  \ \ \ \,   ,\text{ if } y_i=0
\end{cases}
    \end{align}

In [10]:
# ref. https://blog.csdn.net/qq_39732684/article/details/105794637
from torch import nn


class focal_loss(nn.Module):
    def __init__(self, alpha=0.25, gamma=2): # Assume that the positive and negative sample ratio is 3:1
        super(focal_loss, self).__init__()
        self.alpha = alpha
        self.gamma = gamma
        self.CrossEntropyLoss = nn.CrossEntropyLoss()

    def forward(self, preds, labels):
        Lce = -self.CrossEntropyLoss(preds, labels) # log(pi) or log(1-pi)
        Lfocal = -1 * (self.alpha) * ((1-torch.exp(Lce)) ** self.gamma) * Lce

        return Lfocal

In [11]:
from torch.optim.lr_scheduler import StepLR


EPOCHS = 100
logs = {
    'train_loss': [], 'val_loss': [],
    'train_mean_iou': [], 'val_mean_iou': [],
}

model = deeplabv3(mode='resnet101')
model = model.to(device)
loss_fn = focal_loss()
# citaion: Encoder-Decoder with Atrous Separable Convolution for Semantic Image Segmentation(Liang-Chieh Chen, Yukun Zhu, George Papandreou, Florian Schroff, and Hartwig Adam)
optimizer = torch.optim.SGD(model.parameters(), lr=0.05, momentum=0.9, weight_decay=4e-5)
scheduler = StepLR(optimizer, step_size=2, gamma=0.94) # 每2个周期衰减一次, 衰减率为0.94


# Earlystopping
patience = 7
counter = 0
best_IOU = 0

for epoch in tqdm(range(EPOCHS)):
    train_loss, train_mean_iou = train(train_loader, model, loss_fn, optimizer)
    val_loss, val_mean_iou = test(val_loader, model, loss_fn)
    logs['train_loss'].append(train_loss)
    logs['val_loss'].append(val_loss)
    logs['train_mean_iou'].append(train_mean_iou)
    logs['val_mean_iou'].append(val_mean_iou)

    print(f'EPOCH: {(epoch+1):04d} train_loss: {train_loss:.4f} val_loss: {val_loss:.4f}, train_mean_iou: {train_mean_iou:.3f}, val_mean_iou: {val_mean_iou:.3f}')

    # On epoch end
    torch.save(model.state_dict(), "deeplabv3_restnet101_lastmodel.pth")
    # check improvement
    if best_IOU < val_mean_iou:
        counter = 0
        best_IOU = val_mean_iou
        torch.save(model.state_dict(), "deeplabv3_restnet101_BestIOU.pth")
        print('Best_IOU saved!')
    else:
        counter += 1
    if counter >= patience:
        print("Earlystop!")
        break

Downloading: "https://download.pytorch.org/models/deeplabv3_resnet101_coco-586e9e4e.pth" to /root/.cache/torch/hub/checkpoints/deeplabv3_resnet101_coco-586e9e4e.pth
100%|██████████| 233M/233M [00:01<00:00, 228MB/s]
  0%|          | 0/100 [00:00<?, ?it/s]
  0%|          | 0/500 [00:00<?, ?it/s][A
  0%|          | 1/500 [00:17<2:24:31, 17.38s/it][A
  0%|          | 2/500 [00:19<1:07:53,  8.18s/it][A
  1%|          | 3/500 [00:20<43:27,  5.25s/it]  [A
  1%|          | 4/500 [00:22<31:58,  3.87s/it][A
  1%|          | 5/500 [00:24<25:38,  3.11s/it][A
  1%|          | 6/500 [00:26<21:49,  2.65s/it][A
  1%|▏         | 7/500 [00:27<19:23,  2.36s/it][A
  2%|▏         | 8/500 [00:29<17:48,  2.17s/it][A
  2%|▏         | 9/500 [01:06<1:45:48, 12.93s/it][A
  2%|▏         | 10/500 [01:08<1:17:31,  9.49s/it][A
  2%|▏         | 11/500 [01:09<58:13,  7.14s/it]  [A
  2%|▏         | 12/500 [01:11<44:57,  5.53s/it][A
  3%|▎         | 13/500 [01:13<35:46,  4.41s/it][A
  3%|▎         | 14/500

EPOCH: 0001 train_loss: 0.3500 val_loss: 0.1553, train_mean_iou: 0.196, val_mean_iou: 0.242


  1%|          | 1/100 [18:28<30:29:19, 1108.68s/it]

Best_IOU saved!



  0%|          | 0/500 [00:00<?, ?it/s][A
  0%|          | 1/500 [00:02<18:24,  2.21s/it][A
  0%|          | 2/500 [00:04<16:59,  2.05s/it][A
  1%|          | 3/500 [00:06<16:31,  1.99s/it][A
  1%|          | 4/500 [00:08<16:20,  1.98s/it][A
  1%|          | 5/500 [00:09<16:15,  1.97s/it][A
  1%|          | 6/500 [00:11<16:11,  1.97s/it][A
  1%|▏         | 7/500 [00:13<16:09,  1.97s/it][A
  2%|▏         | 8/500 [00:15<16:06,  1.97s/it][A
  2%|▏         | 9/500 [00:17<16:03,  1.96s/it][A
  2%|▏         | 10/500 [00:19<16:00,  1.96s/it][A
  2%|▏         | 11/500 [00:21<15:57,  1.96s/it][A
  2%|▏         | 12/500 [00:23<15:52,  1.95s/it][A
  3%|▎         | 13/500 [00:25<15:49,  1.95s/it][A
  3%|▎         | 14/500 [00:27<15:42,  1.94s/it][A
  3%|▎         | 15/500 [00:29<15:38,  1.94s/it][A
  3%|▎         | 16/500 [00:31<15:33,  1.93s/it][A
  3%|▎         | 17/500 [00:33<15:30,  1.93s/it][A
  4%|▎         | 18/500 [00:35<15:28,  1.93s/it][A
  4%|▍         | 19/500 [00:3

EPOCH: 0002 train_loss: 0.2713 val_loss: 0.1517, train_mean_iou: 0.211, val_mean_iou: 0.245


  2%|▏         | 2/100 [34:59<28:17:52, 1039.52s/it]

Best_IOU saved!



  0%|          | 0/500 [00:00<?, ?it/s][A
  0%|          | 1/500 [00:02<17:47,  2.14s/it][A
  0%|          | 2/500 [00:04<16:32,  1.99s/it][A
  1%|          | 3/500 [00:05<16:07,  1.95s/it][A
  1%|          | 4/500 [00:07<15:58,  1.93s/it][A
  1%|          | 5/500 [00:09<15:51,  1.92s/it][A
  1%|          | 6/500 [00:11<15:46,  1.92s/it][A
  1%|▏         | 7/500 [00:13<15:39,  1.91s/it][A
  2%|▏         | 8/500 [00:15<15:37,  1.91s/it][A
  2%|▏         | 9/500 [00:17<15:36,  1.91s/it][A
  2%|▏         | 10/500 [00:19<15:35,  1.91s/it][A
  2%|▏         | 11/500 [00:21<15:34,  1.91s/it][A
  2%|▏         | 12/500 [00:23<15:31,  1.91s/it][A
  3%|▎         | 13/500 [00:24<15:27,  1.91s/it][A
  3%|▎         | 14/500 [00:26<15:24,  1.90s/it][A
  3%|▎         | 15/500 [00:28<15:22,  1.90s/it][A
  3%|▎         | 16/500 [00:30<15:23,  1.91s/it][A
  3%|▎         | 17/500 [00:32<15:23,  1.91s/it][A
  4%|▎         | 18/500 [00:34<15:20,  1.91s/it][A
  4%|▍         | 19/500 [00:3

EPOCH: 0003 train_loss: 0.2817 val_loss: 0.1394, train_mean_iou: 0.209, val_mean_iou: 0.245


  3%|▎         | 3/100 [51:30<27:24:33, 1017.26s/it]
  0%|          | 0/500 [00:00<?, ?it/s][A
  0%|          | 1/500 [00:02<17:50,  2.15s/it][A
  0%|          | 2/500 [00:04<16:34,  2.00s/it][A
  1%|          | 3/500 [00:05<16:09,  1.95s/it][A
  1%|          | 4/500 [00:07<16:01,  1.94s/it][A
  1%|          | 5/500 [00:09<15:54,  1.93s/it][A
  1%|          | 6/500 [00:11<15:48,  1.92s/it][A
  1%|▏         | 7/500 [00:13<15:42,  1.91s/it][A
  2%|▏         | 8/500 [00:15<15:39,  1.91s/it][A
  2%|▏         | 9/500 [00:17<15:39,  1.91s/it][A
  2%|▏         | 10/500 [00:19<15:35,  1.91s/it][A
  2%|▏         | 11/500 [00:21<15:30,  1.90s/it][A
  2%|▏         | 12/500 [00:23<15:28,  1.90s/it][A
  3%|▎         | 13/500 [00:24<15:26,  1.90s/it][A
  3%|▎         | 14/500 [00:26<15:24,  1.90s/it][A
  3%|▎         | 15/500 [00:28<15:23,  1.90s/it][A
  3%|▎         | 16/500 [00:30<15:22,  1.91s/it][A
  3%|▎         | 17/500 [00:32<15:17,  1.90s/it][A
  4%|▎         | 18/500 [00:3

EPOCH: 0004 train_loss: 0.2780 val_loss: 0.1070, train_mean_iou: 0.210, val_mean_iou: 0.251


  4%|▍         | 4/100 [1:08:01<26:51:12, 1007.00s/it]

Best_IOU saved!



  0%|          | 0/500 [00:00<?, ?it/s][A
  0%|          | 1/500 [00:02<17:50,  2.15s/it][A
  0%|          | 2/500 [00:04<16:33,  1.99s/it][A
  1%|          | 3/500 [00:05<16:14,  1.96s/it][A
  1%|          | 4/500 [00:07<16:00,  1.94s/it][A
  1%|          | 5/500 [00:09<15:49,  1.92s/it][A
  1%|          | 6/500 [00:11<15:45,  1.91s/it][A
  1%|▏         | 7/500 [00:13<15:42,  1.91s/it][A
  2%|▏         | 8/500 [00:15<15:39,  1.91s/it][A
  2%|▏         | 9/500 [00:17<15:39,  1.91s/it][A
  2%|▏         | 10/500 [00:19<15:35,  1.91s/it][A
  2%|▏         | 11/500 [00:21<15:31,  1.90s/it][A
  2%|▏         | 12/500 [00:23<15:31,  1.91s/it][A
  3%|▎         | 13/500 [00:24<15:28,  1.91s/it][A
  3%|▎         | 14/500 [00:26<15:26,  1.91s/it][A
  3%|▎         | 15/500 [00:28<15:25,  1.91s/it][A
  3%|▎         | 16/500 [00:30<15:22,  1.91s/it][A
  3%|▎         | 17/500 [00:32<15:19,  1.90s/it][A
  4%|▎         | 18/500 [00:34<15:16,  1.90s/it][A
  4%|▍         | 19/500 [00:3

EPOCH: 0005 train_loss: 0.2786 val_loss: 0.1251, train_mean_iou: 0.210, val_mean_iou: 0.247


  5%|▌         | 5/100 [1:24:33<26:25:30, 1001.37s/it]
  0%|          | 0/500 [00:00<?, ?it/s][A
  0%|          | 1/500 [00:02<17:49,  2.14s/it][A
  0%|          | 2/500 [00:04<16:36,  2.00s/it][A
  1%|          | 3/500 [00:05<16:12,  1.96s/it][A
  1%|          | 4/500 [00:07<15:55,  1.93s/it][A
  1%|          | 5/500 [00:09<15:50,  1.92s/it][A
  1%|          | 6/500 [00:11<15:46,  1.92s/it][A
  1%|▏         | 7/500 [00:13<15:41,  1.91s/it][A
  2%|▏         | 8/500 [00:15<15:39,  1.91s/it][A
  2%|▏         | 9/500 [00:17<15:37,  1.91s/it][A
  2%|▏         | 10/500 [00:19<15:37,  1.91s/it][A
  2%|▏         | 11/500 [00:21<15:33,  1.91s/it][A
  2%|▏         | 12/500 [00:23<15:30,  1.91s/it][A
  3%|▎         | 13/500 [00:24<15:28,  1.91s/it][A
  3%|▎         | 14/500 [00:26<15:29,  1.91s/it][A
  3%|▎         | 15/500 [00:28<15:26,  1.91s/it][A
  3%|▎         | 16/500 [00:30<15:25,  1.91s/it][A
  3%|▎         | 17/500 [00:32<15:21,  1.91s/it][A
  4%|▎         | 18/500 [00

EPOCH: 0006 train_loss: 0.2875 val_loss: 0.1636, train_mean_iou: 0.200, val_mean_iou: 0.237


  6%|▌         | 6/100 [1:41:03<26:02:49, 997.55s/it] 
  0%|          | 0/500 [00:00<?, ?it/s][A
  0%|          | 1/500 [00:02<18:12,  2.19s/it][A
  0%|          | 2/500 [00:04<16:46,  2.02s/it][A
  1%|          | 3/500 [00:05<16:12,  1.96s/it][A
  1%|          | 4/500 [00:07<15:55,  1.93s/it][A
  1%|          | 5/500 [00:09<15:47,  1.91s/it][A
  1%|          | 6/500 [00:11<15:43,  1.91s/it][A
  1%|▏         | 7/500 [00:13<15:39,  1.91s/it][A
  2%|▏         | 8/500 [00:15<15:34,  1.90s/it][A
  2%|▏         | 9/500 [00:17<15:33,  1.90s/it][A
  2%|▏         | 10/500 [00:19<15:30,  1.90s/it][A
  2%|▏         | 11/500 [00:21<15:29,  1.90s/it][A
  2%|▏         | 12/500 [00:23<15:27,  1.90s/it][A
  3%|▎         | 13/500 [00:24<15:25,  1.90s/it][A
  3%|▎         | 14/500 [00:26<15:24,  1.90s/it][A
  3%|▎         | 15/500 [00:28<15:23,  1.91s/it][A
  3%|▎         | 16/500 [00:30<15:20,  1.90s/it][A
  3%|▎         | 17/500 [00:32<15:21,  1.91s/it][A
  4%|▎         | 18/500 [00

EPOCH: 0007 train_loss: 0.2790 val_loss: 0.1293, train_mean_iou: 0.211, val_mean_iou: 0.248


  7%|▋         | 7/100 [1:57:33<25:42:12, 994.97s/it]
  0%|          | 0/500 [00:00<?, ?it/s][A
  0%|          | 1/500 [00:02<17:51,  2.15s/it][A
  0%|          | 2/500 [00:04<16:32,  1.99s/it][A
  1%|          | 3/500 [00:05<16:05,  1.94s/it][A
  1%|          | 4/500 [00:07<15:52,  1.92s/it][A
  1%|          | 5/500 [00:09<15:46,  1.91s/it][A
  1%|          | 6/500 [00:11<15:41,  1.90s/it][A
  1%|▏         | 7/500 [00:13<15:35,  1.90s/it][A
  2%|▏         | 8/500 [00:15<15:32,  1.89s/it][A
  2%|▏         | 9/500 [00:17<15:30,  1.89s/it][A
  2%|▏         | 10/500 [00:19<15:28,  1.90s/it][A
  2%|▏         | 11/500 [00:21<15:29,  1.90s/it][A
  2%|▏         | 12/500 [00:22<15:26,  1.90s/it][A
  3%|▎         | 13/500 [00:24<15:24,  1.90s/it][A
  3%|▎         | 14/500 [00:26<15:19,  1.89s/it][A
  3%|▎         | 15/500 [00:28<15:20,  1.90s/it][A
  3%|▎         | 16/500 [00:30<15:18,  1.90s/it][A
  3%|▎         | 17/500 [00:32<15:16,  1.90s/it][A
  4%|▎         | 18/500 [00:

EPOCH: 0008 train_loss: 0.2806 val_loss: 0.1463, train_mean_iou: 0.205, val_mean_iou: 0.246


  8%|▊         | 8/100 [2:14:01<25:22:27, 992.91s/it]
  0%|          | 0/500 [00:00<?, ?it/s][A
  0%|          | 1/500 [00:02<17:56,  2.16s/it][A
  0%|          | 2/500 [00:04<16:34,  2.00s/it][A
  1%|          | 3/500 [00:05<16:10,  1.95s/it][A
  1%|          | 4/500 [00:07<15:59,  1.93s/it][A
  1%|          | 5/500 [00:09<15:54,  1.93s/it][A
  1%|          | 6/500 [00:11<15:48,  1.92s/it][A
  1%|▏         | 7/500 [00:13<15:47,  1.92s/it][A
  2%|▏         | 8/500 [00:15<15:45,  1.92s/it][A
  2%|▏         | 9/500 [00:17<15:40,  1.92s/it][A
  2%|▏         | 10/500 [00:19<15:37,  1.91s/it][A
  2%|▏         | 11/500 [00:21<15:34,  1.91s/it][A
  2%|▏         | 12/500 [00:23<15:32,  1.91s/it][A
  3%|▎         | 13/500 [00:25<15:33,  1.92s/it][A
  3%|▎         | 14/500 [00:26<15:31,  1.92s/it][A
  3%|▎         | 15/500 [00:28<15:30,  1.92s/it][A
  3%|▎         | 16/500 [00:30<15:29,  1.92s/it][A
  3%|▎         | 17/500 [00:32<15:28,  1.92s/it][A
  4%|▎         | 18/500 [00:

EPOCH: 0009 train_loss: 0.2815 val_loss: 0.1458, train_mean_iou: 0.206, val_mean_iou: 0.242


  9%|▉         | 9/100 [2:30:30<25:03:56, 991.61s/it]
  0%|          | 0/500 [00:00<?, ?it/s][A
  0%|          | 1/500 [00:02<17:49,  2.14s/it][A
  0%|          | 2/500 [00:04<16:34,  2.00s/it][A
  1%|          | 3/500 [00:05<16:11,  1.95s/it][A
  1%|          | 4/500 [00:07<15:58,  1.93s/it][A
  1%|          | 5/500 [00:09<15:50,  1.92s/it][A
  1%|          | 6/500 [00:11<15:48,  1.92s/it][A
  1%|▏         | 7/500 [00:13<15:42,  1.91s/it][A
  2%|▏         | 8/500 [00:15<15:38,  1.91s/it][A
  2%|▏         | 9/500 [00:17<15:34,  1.90s/it][A
  2%|▏         | 10/500 [00:19<15:32,  1.90s/it][A
  2%|▏         | 11/500 [00:21<15:30,  1.90s/it][A
  2%|▏         | 12/500 [00:23<15:28,  1.90s/it][A
  3%|▎         | 13/500 [00:24<15:26,  1.90s/it][A
  3%|▎         | 14/500 [00:26<15:22,  1.90s/it][A
  3%|▎         | 15/500 [00:28<15:21,  1.90s/it][A
  3%|▎         | 16/500 [00:30<15:21,  1.90s/it][A
  3%|▎         | 17/500 [00:32<15:19,  1.90s/it][A
  4%|▎         | 18/500 [00:

EPOCH: 0010 train_loss: 0.2811 val_loss: 0.1178, train_mean_iou: 0.206, val_mean_iou: 0.250


 10%|█         | 10/100 [2:47:00<24:46:42, 991.14s/it]
  0%|          | 0/500 [00:00<?, ?it/s][A
  0%|          | 1/500 [00:02<17:55,  2.16s/it][A
  0%|          | 2/500 [00:04<16:39,  2.01s/it][A
  1%|          | 3/500 [00:05<16:12,  1.96s/it][A
  1%|          | 4/500 [00:07<15:59,  1.94s/it][A
  1%|          | 5/500 [00:09<15:51,  1.92s/it][A
  1%|          | 6/500 [00:11<15:44,  1.91s/it][A
  1%|▏         | 7/500 [00:13<15:40,  1.91s/it][A
  2%|▏         | 8/500 [00:15<15:37,  1.91s/it][A
  2%|▏         | 9/500 [00:17<15:33,  1.90s/it][A
  2%|▏         | 10/500 [00:19<15:31,  1.90s/it][A
  2%|▏         | 11/500 [00:21<15:30,  1.90s/it][A
  2%|▏         | 12/500 [00:23<15:28,  1.90s/it][A
  3%|▎         | 13/500 [00:24<15:26,  1.90s/it][A
  3%|▎         | 14/500 [00:26<15:27,  1.91s/it][A
  3%|▎         | 15/500 [00:28<15:23,  1.91s/it][A
  3%|▎         | 16/500 [00:30<15:19,  1.90s/it][A
  3%|▎         | 17/500 [00:32<15:18,  1.90s/it][A
  4%|▎         | 18/500 [00

EPOCH: 0011 train_loss: 0.2750 val_loss: 0.1194, train_mean_iou: 0.211, val_mean_iou: 0.250


 10%|█         | 10/100 [3:03:29<27:31:28, 1100.98s/it]

Earlystop!



