In [1]:
import os
import zarr
import timm
import random
import json
import gc
import warnings
import numpy as np
import pandas as pd
import torch.nn as nn
from pathlib import Path
import matplotlib.pyplot as plt
from torch.utils.data import DataLoader, Dataset
from collections import defaultdict
import sys
import torch
from torch.cuda.amp import autocast, GradScaler

# import torchvision.transforms.functional as F
import random

warnings.filterwarnings("ignore")
sys.path.append("./src/")

from src.config import CFG
from src.dataloader import (
    read_zarr,
    read_info_json,
    scale_coordinates,
    create_dataset,
    create_segmentation_map,
    EziiDataset,
    drop_padding,
)
from src.network import Unet3D
from src.utils import save_images, PadToSize
from src.metric import (
    score,
    create_cls_pos,
    create_cls_pos_sikii,
    create_df,
    SegmentationLoss,
    DiceLoss,
)
from src.kaggle_notebook_metric import compute_lb, extract_particle_results
from src.inference import inference, inference2pos, create_gt_df
from metric import visualize_epoch_results

import wandb
from pathlib import Path

notebook_name = os.path.join(Path().resolve()).split("/")[-1]

param = {
    "model": CFG.model_name,
    "resolution": CFG.resolution,
    "augmentation_prob": CFG.augmentation_prob,
    "slice": CFG.slice_,
    "epochs": CFG.epochs,
    "lr": CFG.lr,
    "batch_size": CFG.batch_size,
    "weight_decay": CFG.weight_decay,
    "num_workers": CFG.num_workers,
    "augment_data_ratio": CFG.augment_data_ratio,
}
wandb.init(project="czii2024", name=notebook_name, config=param)

Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.
[34m[1mwandb[0m: Currently logged in as: [33mtatuya[0m ([33mlatent-walkers[0m). Use [1m`wandb login --relogin`[0m to force relogin


In [2]:
train_dataset = EziiDataset(
    exp_names=CFG.train_exp_names,
    base_dir="../../inputs/train/",
    particles_name=CFG.particles_name,
    resolution=CFG.resolution,
    zarr_type=CFG.train_zarr_types,
    train=True,
    augmentation=True,
    slice=True,
    pre_read=True,
)

# train_nshuffle_dataset = EziiDataset(
#     exp_names=CFG.train_exp_names,
#     base_dir="../../inputs/train/",
#     particles_name=CFG.particles_name,
#     resolution=CFG.resolution,
#     zarr_type=CFG.train_zarr_types,
#     augmentation=False,
#     train=True,
# )

valid_dataset = EziiDataset(
    exp_names=CFG.valid_exp_names,
    base_dir="../../inputs/train/",
    particles_name=CFG.particles_name,
    resolution=CFG.resolution,
    zarr_type=CFG.valid_zarr_types,
    augmentation=False,
    train=True,
    slice=True,
    pre_read=True,
)

from tqdm import tqdm

train_loader = DataLoader(
    train_dataset,
    batch_size=CFG.batch_size,
    shuffle=True,
    drop_last=True,
    pin_memory=True,
    num_workers=CFG.num_workers,
)
# train_nshuffle_loader = DataLoader(
#     train_nshuffle_dataset,
#     batch_size=1,
#     shuffle=True,
#     drop_last=True,
#     pin_memory=True,
#     num_workers=CFG.num_workers,
# )
valid_loader = DataLoader(
    valid_dataset,
    batch_size=1,
    shuffle=False,
    pin_memory=True,
    num_workers=CFG.num_workers,
)

for data in tqdm(train_loader):
    normalized_tomogram = data["normalized_tomogram"]
    segmentation_map = data["segmentation_map"]
    break

normalized_tomogram.shape

100%|██████████| 517/517 [01:24<00:00,  6.11it/s]
100%|██████████| 2/2 [00:03<00:00,  1.64s/it]
  0%|          | 0/258 [00:02<?, ?it/s]


torch.Size([2, 16, 630, 630])

In [3]:
# 学習時のデータパターン

z_list = []

for i in range(len(train_dataset)):
    z = train_dataset[i]["zarr_type"]
    z_list.append(z)

np.unique(np.array(z_list), return_counts=True)

(array(['ctfdeconvolved', 'denoised', 'isonetcorrected', 'none', 'wbp'],
       dtype='<U15'),
 array([ 55,  55,  55, 297,  55]))

In [4]:
encoder = timm.create_model(
    model_name=CFG.model_name,
    pretrained=True,
    in_chans=3,
    num_classes=0,
    global_pool="",
    features_only=True,
)
model = Unet3D(encoder=encoder, num_domains=5).to("cuda")
# model.load_state_dict(torch.load("./pretrained_model.pth"))
# model.load_state_dict(
#     torch.load(
#         "../../../../../../../../mnt/d/kaggle-tmp-models/czii2024/exp059-recreate-baseline-renet34d-dstride-attention/model_4.pth"
#     )
# )
# model.load_state_dict(torch.load("./best_model.pth"))

<All keys matched successfully>

In [5]:
# input-test

x = torch.randn(2, 16, 1, 64, 64).cuda()
model(x, torch.tensor([2, 0]).cuda()).shape

torch.Size([2, 7, 16, 64, 64])

In [6]:
# # "encoder"と名のつくパラメータは学習しない
# for layer, param in model.named_parameters():
#     if "encoder" in layer:
#         param.requires_grad = False

In [7]:
import matplotlib.pyplot as plt
import numpy as np
from matplotlib.colors import ListedColormap
from matplotlib.patches import Patch

# サンプルデータ
num_classes = len(CFG.particles_name)  # クラス数
colors = plt.cm.tab10(
    np.arange(len(CFG.particles_name))
)  # "tab10" カラーマップから色を取得

# ListedColormap を作成
class_colormap = ListedColormap(colors)


# カラーバー付きプロット
def plot_with_colormap(data, title, original_tomogram):
    masked_data = np.ma.masked_where(data <= 0, data)  # クラス0をマスク
    plt.imshow(original_tomogram, cmap="gray")
    im = plt.imshow(masked_data, cmap=class_colormap)
    plt.title(title)
    plt.axis("off")
    return im

In [8]:
import torch
import random
import torchvision.transforms.functional as TF


# 回転
# 3Dテンソルの各軸に対して指定した角度で回転する関数
def rotate_3d(tomogram, segmentation_map, angle):
    """Rotates the 3D tensors tomogram and segmentation_map around the Z-axis."""
    rotated_tomogram = TF.rotate(tomogram, angle, expand=False)
    rotated_segmentation_map = TF.rotate(segmentation_map, angle, expand=False)
    return rotated_tomogram, rotated_segmentation_map


# 平行移動
# 指定された範囲でランダムに平行移動
def translate_3d(tomogram, segmentation_map, max_shift):
    """Translates the 3D tensors by a random shift within max_shift."""
    shift_x = random.randint(-max_shift, max_shift)
    shift_y = random.randint(-max_shift, max_shift)
    translated_tomogram = TF.affine(
        tomogram, angle=0, translate=(shift_x, shift_y), scale=1, shear=0
    )
    translated_segmentation_map = TF.affine(
        segmentation_map, angle=0, translate=(shift_x, shift_y), scale=1, shear=0
    )
    return translated_tomogram, translated_segmentation_map


# フリップ
# 縦横（上下左右）ランダムフリップ
def flip_3d(tomogram, segmentation_map):
    """Randomly flips the 3D tensors along height or width."""
    if random.random() > 0.5:  # Horizontal flip
        tomogram = torch.flip(tomogram, dims=[-1])
        segmentation_map = torch.flip(segmentation_map, dims=[-1])
    if random.random() > 0.5:  # Vertical flip
        tomogram = torch.flip(tomogram, dims=[-2])
        segmentation_map = torch.flip(segmentation_map, dims=[-2])
    return tomogram, segmentation_map


# クロッピング
# 入力テンソルを中心またはランダムクロップで切り取る
def crop_3d(tomogram, segmentation_map, crop_size):
    """Crops the 3D tensors to the specified crop_size."""
    _, depth, height, width = tomogram.size()
    crop_d, crop_h, crop_w = crop_size

    if crop_h > height or crop_w > width:
        raise ValueError("Crop size cannot be larger than the original size.")

    start_h = random.randint(0, height - crop_h)  # Random starting position for height
    start_w = random.randint(0, width - crop_w)  # Random starting position for width

    cropped_tomogram = tomogram[
        :, :, start_h : start_h + crop_h, start_w : start_w + crop_w
    ]
    cropped_segmentation_map = segmentation_map[
        :, :, start_h : start_h + crop_h, start_w : start_w + crop_w
    ]

    return cropped_tomogram, cropped_segmentation_map


# Mixup
# 2つのサンプルを線形補間して混合
def mixup(tomogram, segmentation_map, alpha=0.4):
    """Applies mixup augmentation to the batch."""
    lam = random.betavariate(alpha, alpha)
    batch_size = tomogram.size(0)
    index = torch.randperm(batch_size)

    mixed_tomogram = lam * tomogram + (1 - lam) * tomogram[index, :]
    mixed_segmentation_map = (
        lam * segmentation_map + (1 - lam) * segmentation_map[index, :]
    )

    return mixed_tomogram, mixed_segmentation_map


# Cutmix
# ランダム領域を切り取って別のサンプルに貼り付け
def cutmix(tomogram, segmentation_map, alpha=1.0):
    """Applies cutmix augmentation to the batch."""
    lam = random.betavariate(alpha, alpha)
    batch_size, depth, height, width = tomogram.size()
    index = torch.randperm(batch_size)

    cx = random.randint(0, width)
    cy = random.randint(0, height)
    cw = int(width * (1 - lam))
    ch = int(height * (1 - lam))

    x1 = max(cx - cw // 2, 0)
    x2 = min(cx + cw // 2, width)
    y1 = max(cy - ch // 2, 0)
    y2 = min(cy + ch // 2, height)

    tomogram[:, :, y1:y2, x1:x2] = tomogram[index, :, y1:y2, x1:x2]
    segmentation_map[:, :, y1:y2, x1:x2] = segmentation_map[index, :, y1:y2, x1:x2]

    return tomogram, segmentation_map


# データ拡張の組み合わせ適用
def augment_data(
    tomogram,
    segmentation_map,
    crop_size=(16, 256, 256),
    max_shift=10,
    rotation_angle=30,
    p=0.5,
    mixup_alpha=0.4,
    cutmix_alpha=1.0,
):
    """Applies a combination of rotation, translation, flipping, cropping, mixup, and cutmix to the inputs with probabilities."""
    if random.random() < p:
        tomogram, segmentation_map = rotate_3d(
            tomogram,
            segmentation_map,
            angle=random.uniform(-rotation_angle, rotation_angle),
        )
    if random.random() < p:
        tomogram, segmentation_map = translate_3d(
            tomogram, segmentation_map, max_shift=max_shift
        )
    if random.random() < p:
        tomogram, segmentation_map = flip_3d(tomogram, segmentation_map)
    if random.random() < p:
        tomogram, segmentation_map = crop_3d(
            tomogram, segmentation_map, crop_size=crop_size
        )
    if random.random() < p:
        tomogram, segmentation_map = mixup(
            tomogram, segmentation_map, alpha=mixup_alpha
        )
    # if random.random() < p:
    #     tomogram, segmentation_map = cutmix(
    #         tomogram, segmentation_map, alpha=cutmix_alpha
    #     )
    return tomogram, segmentation_map


# 使用例
# バッチサイズ6, 深さ16, 高さ320, 幅320のランダムテンソル
tomogram = torch.rand((6, 16, 320, 320))
segmentation_map = torch.randint(0, 2, (6, 16, 320, 320))  # ラベルは0または1

# データ拡張の適用
aug_tomogram, aug_segmentation_map = augment_data(tomogram, segmentation_map, p=0.7)
print("Original shape:", tomogram.shape)
print("Augmented shape:", aug_tomogram.shape)

Original shape: torch.Size([6, 16, 320, 320])
Augmented shape: torch.Size([6, 16, 320, 320])


In [9]:
# model.encoderのパラメータを固定

# for param in model.encoder.parameters():
#     param.requires_grad = False

In [10]:
from transformers import get_cosine_schedule_with_warmup

optimizer = torch.optim.Adam(
    model.parameters(), lr=CFG.lr, weight_decay=CFG.weight_decay
)
criterion = nn.CrossEntropyLoss(
    #  weight=torch.tensor([2.0, 32, 32, 32, 32, 32, 32]).to("cuda")
)
# criterion = DiceLoss()
scheduler = get_cosine_schedule_with_warmup(
    optimizer,
    num_warmup_steps=10,
    num_training_steps=CFG.epochs * len(train_loader),
    # * batch_size,
)
scaler = GradScaler()
seg_loss = SegmentationLoss(criterion)
padf = PadToSize(CFG.resolution)

In [11]:
# b, c, d, h, w = CFG.batch_size, 1, 96, 320, 320

In [12]:
def preprocess_tensor(tensor):
    batch_size, depth, height, width = tensor.shape
    tensor = tensor.unsqueeze(2)  # (b, d, h, w) -> (b, d, 1, h, w)
    return tensor

In [13]:
padf = PadToSize(CFG.resolution)
padf(normalized_tomogram).shape

torch.Size([2, 16, 640, 640])

In [None]:
best_model = None
best_constant = 0
best_score = -100
best_particle_score = {}

grand_train_loss = []
grand_valid_loss = []
grand_train_score = []
grand_valid_score = []

for epoch in range(CFG.epochs):
    model.train()
    train_loss = []
    valid_loss = []
    with tqdm(train_loader, desc=f"Epoch {epoch + 1}/{CFG.epochs} [Training]") as tq:
        for data in tq:
            normalized_tomogram = data["normalized_tomogram"]
            segmentation_map = data["segmentation_map"]
            zarr_embedding_idx = data["zarr_type_embedding_idx"]

            normalized_tomogram = padf(normalized_tomogram)
            segmentation_map = padf(segmentation_map)

            # データ拡張
            normalized_tomogram, segmentation_map = augment_data(
                normalized_tomogram, segmentation_map, p=CFG.augmentation_prob
            )
            normalized_tomogram = normalized_tomogram.cuda()
            segmentation_map = segmentation_map.long().cuda()
            zarr_embedding_idx = zarr_embedding_idx.cuda()

            optimizer.zero_grad()

            with autocast():
                pred = model(preprocess_tensor(normalized_tomogram), zarr_embedding_idx)
                loss = seg_loss(pred, segmentation_map)
            # loss.backward()
            # optimizer.step()
            scaler.scale(loss).backward()
            scaler.step(optimizer)
            scaler.update()
            scheduler.step()
            train_loss.append(loss.item())

            # 確率予測
            prob_pred = torch.softmax(pred, dim=1)
            tq.set_postfix({"loss": f"{np.mean(train_loss):.4f}"})

    del normalized_tomogram, segmentation_map, zarr_embedding_idx, pred, loss
    gc.collect()
    torch.cuda.empty_cache()

    with tqdm(valid_loader, desc=f"Epoch {epoch + 1}/{CFG.epochs} [Validation]") as tq:
        with torch.no_grad():
            for data in tq:
                normalized_tomogram = data["normalized_tomogram"].cuda()
                segmentation_map = data["segmentation_map"].long().cuda()
                zarr_embedding_idx = data["zarr_type_embedding_idx"].cuda()

                normalized_tomogram = padf(normalized_tomogram)
                segmentation_map = padf(segmentation_map)

                with autocast():
                    pred = model(
                        preprocess_tensor(normalized_tomogram), zarr_embedding_idx
                    )
                    loss = seg_loss(pred, segmentation_map)
                valid_loss.append(loss.item())

                # 確率予測
                prob_pred = torch.softmax(pred, dim=1)
                tq.set_postfix({"loss": f"{np.mean(valid_loss):.4f}"})

    del normalized_tomogram, segmentation_map, zarr_embedding_idx, pred, loss
    gc.collect()
    torch.cuda.empty_cache()

    # # ############### validation ################
    train_nshuffle_original_tomogram = defaultdict(list)
    train_nshuffle_pred_tomogram = defaultdict(list)
    train_nshuffle_gt_tomogram = defaultdict(list)

    valid_original_tomogram = defaultdict(list)
    valid_pred_tomogram = defaultdict(list)
    valid_gt_tomogram = defaultdict(list)

    train_mean_scores = []
    valid_mean_scores = []

    # モデルの保存
    make_dir_ = (
        f"../../../../../../../../mnt/d/kaggle-tmp-models/czii2024/{notebook_name}/"
    )
    os.makedirs(make_dir_, exist_ok=True)
    torch.save(model.state_dict(), make_dir_ + f"model_{epoch}.pth")

    # ############### validation ################
    train_nshuffle_original_tomogram = defaultdict(list)
    train_nshuffle_pred_tomogram = defaultdict(list)
    train_nshuffle_gt_tomogram = defaultdict(list)

    valid_original_tomogram = defaultdict(list)
    valid_pred_tomogram = defaultdict(list)
    valid_gt_tomogram = defaultdict(list)

    train_mean_scores = []
    valid_mean_scores = []

    train_inferenced_array = {}
    train_pred_array = []
    train_gt_array = []
    valid_inferenced_array = {}
    valid_gt_array = []

    # for exp_name in tqdm(CFG.train_exp_names):
    for exp_name in [CFG.valid_exp_name]:  # 5つのデータで試す
        # inferenced_array = inference(model, exp_name, train=False)
        inferenced_array, n_tomogram, segmentation_map = inference(
            model, exp_name, train=False
        )
        valid_inferenced_array[exp_name] = inferenced_array
        base_dir = "../../inputs/train/overlay/ExperimentRuns/"
        gt_df = create_gt_df(base_dir, [exp_name])
        valid_gt_array.append(gt_df)

    valid_gt_array = pd.concat(valid_gt_array)

    b_constant = 0
    b_score = -100
    b_particle_score = {}
    for constant in tqdm(np.linspace(0.05, 0.9, 15)):
        valid_pred_array = []
        sikii = {
            "apo-ferritin": constant,
            "beta-amylase": constant,
            "beta-galactosidase": constant,
            "ribosome": constant,
            "thyroglobulin": constant,
            "virus-like-particle": constant,
        }
        for exp_name in [CFG.valid_exp_name]:  # 5つのデータで試す
            pred_df = inference2pos(
                pred_segmask=valid_inferenced_array[exp_name],
                exp_name=exp_name,
                sikii_dict=sikii,
            )
            valid_pred_array.append(pred_df)

        valid_pred_array = pd.concat(valid_pred_array)

        if len(valid_pred_array) != 0:
            # score_ = score(
            #     valid_pred_array,
            #     valid_gt_array,
            #     row_id_column_name="index",
            #     distance_multiplier=0.5,
            #     beta=4,
            # )
            result_df, score_ = compute_lb(
                valid_pred_array,
                "../../inputs/train/overlay/ExperimentRuns/",
                CFG.valid_exp_names,
            )
            particle_score = extract_particle_results(result_df)

            if score_ > b_score:
                b_score = score_
                b_constant = constant
                b_particle_score = particle_score

        import gc
        import torch.cuda as cuda

        # del valid_pred_array, valid_gt_array
        gc.collect()
        cuda.empty_cache()

    # print("constant", b_constant, "score", b_score)

    # wandb-log
    train_info = {
        "01_epoch": epoch,
        "02_train_loss": np.mean(train_loss),
        "03_valid_loss": np.mean(valid_loss),
        # "train_score": np.mean(train_mean_scores),
        "04_valid_best_score": b_score,
        "05_valid_best_constant": b_constant,
    }
    train_info = {**train_info, **b_particle_score}
    wandb.log(train_info)

    # score-update
    if b_score > best_score:
        best_constant = b_constant
        best_score = b_score
        # best_score = np.mean(valid_mean_scores)
        best_model = model.state_dict()
        torch.save(best_model, f"./best_model.pth")

    print(
        f"train-epoch-loss:{np.mean(train_loss):.4f}",
        # f"valid-epoch-loss:{np.mean(valid_loss):.4f}",
        # f"train-beta4-score:{np.mean(train_mean_scores):.4f}",
        f"valid-beta4-score:{b_score:.4f}",
    )

    grand_train_loss.append(np.mean(train_loss))
    # grand_valid_loss.append(np.mean(valid_loss))
    # grand_train_score.append(np.mean(train_mean_scores))
    grand_valid_score.append(b_score)

Epoch 1/150 [Training]: 100%|██████████| 258/258 [04:09<00:00,  1.04it/s, loss=0.0327]
Epoch 1/150 [Validation]: 100%|██████████| 2/2 [00:01<00:00,  1.27it/s, loss=0.0049]
100%|██████████| 15/15 [00:32<00:00,  2.14s/it]


train-epoch-loss:0.0327 valid-beta4-score:0.3605


Epoch 2/150 [Training]: 100%|██████████| 258/258 [04:25<00:00,  1.03s/it, loss=0.0304]
Epoch 2/150 [Validation]: 100%|██████████| 2/2 [00:01<00:00,  1.36it/s, loss=0.0027]
100%|██████████| 15/15 [00:33<00:00,  2.24s/it]


train-epoch-loss:0.0304 valid-beta4-score:0.3593


Epoch 3/150 [Training]: 100%|██████████| 258/258 [04:21<00:00,  1.01s/it, loss=0.0283]
Epoch 3/150 [Validation]: 100%|██████████| 2/2 [00:01<00:00,  1.33it/s, loss=0.0013]
100%|██████████| 15/15 [00:34<00:00,  2.30s/it]


train-epoch-loss:0.0283 valid-beta4-score:0.3771


Epoch 4/150 [Training]: 100%|██████████| 258/258 [04:16<00:00,  1.01it/s, loss=0.0286]
Epoch 4/150 [Validation]: 100%|██████████| 2/2 [00:01<00:00,  1.39it/s, loss=0.0300]
100%|██████████| 15/15 [00:33<00:00,  2.26s/it]


train-epoch-loss:0.0286 valid-beta4-score:0.3753


Epoch 5/150 [Training]: 100%|██████████| 258/258 [04:03<00:00,  1.06it/s, loss=0.0274]
Epoch 5/150 [Validation]: 100%|██████████| 2/2 [00:01<00:00,  1.34it/s, loss=0.0172]
100%|██████████| 15/15 [00:35<00:00,  2.36s/it]


train-epoch-loss:0.0274 valid-beta4-score:0.3790


Epoch 6/150 [Training]: 100%|██████████| 258/258 [04:17<00:00,  1.00it/s, loss=0.0276]
Epoch 6/150 [Validation]: 100%|██████████| 2/2 [00:01<00:00,  1.35it/s, loss=0.0191]
100%|██████████| 15/15 [00:35<00:00,  2.35s/it]


train-epoch-loss:0.0276 valid-beta4-score:0.3773


Epoch 7/150 [Training]: 100%|██████████| 258/258 [04:16<00:00,  1.01it/s, loss=0.0266]
Epoch 7/150 [Validation]: 100%|██████████| 2/2 [00:01<00:00,  1.40it/s, loss=0.0270]
100%|██████████| 15/15 [00:34<00:00,  2.29s/it]


train-epoch-loss:0.0266 valid-beta4-score:0.3776


Epoch 8/150 [Training]: 100%|██████████| 258/258 [04:15<00:00,  1.01it/s, loss=0.0260]
Epoch 8/150 [Validation]: 100%|██████████| 2/2 [00:01<00:00,  1.36it/s, loss=0.0152]
100%|██████████| 15/15 [00:33<00:00,  2.26s/it]


train-epoch-loss:0.0260 valid-beta4-score:0.3759


Epoch 9/150 [Training]: 100%|██████████| 258/258 [04:25<00:00,  1.03s/it, loss=0.0254]
Epoch 9/150 [Validation]: 100%|██████████| 2/2 [00:01<00:00,  1.29it/s, loss=0.0270]
100%|██████████| 15/15 [00:31<00:00,  2.12s/it]


train-epoch-loss:0.0254 valid-beta4-score:0.3545


Epoch 10/150 [Training]: 100%|██████████| 258/258 [04:35<00:00,  1.07s/it, loss=0.0271]
Epoch 10/150 [Validation]: 100%|██████████| 2/2 [00:01<00:00,  1.40it/s, loss=0.0070]
100%|██████████| 15/15 [00:35<00:00,  2.34s/it]


train-epoch-loss:0.0271 valid-beta4-score:0.3689


Epoch 11/150 [Training]: 100%|██████████| 258/258 [04:30<00:00,  1.05s/it, loss=0.0243]
Epoch 11/150 [Validation]: 100%|██████████| 2/2 [00:01<00:00,  1.36it/s, loss=0.0260]
100%|██████████| 15/15 [00:34<00:00,  2.32s/it]


train-epoch-loss:0.0243 valid-beta4-score:0.3545


Epoch 12/150 [Training]: 100%|██████████| 258/258 [04:34<00:00,  1.06s/it, loss=0.0244]
Epoch 12/150 [Validation]: 100%|██████████| 2/2 [00:01<00:00,  1.36it/s, loss=0.0213]
100%|██████████| 15/15 [00:34<00:00,  2.30s/it]


train-epoch-loss:0.0244 valid-beta4-score:0.3545


Epoch 13/150 [Training]: 100%|██████████| 258/258 [04:17<00:00,  1.00it/s, loss=0.0247]
Epoch 13/150 [Validation]: 100%|██████████| 2/2 [00:01<00:00,  1.35it/s, loss=0.0014]
100%|██████████| 15/15 [00:35<00:00,  2.37s/it]


train-epoch-loss:0.0247 valid-beta4-score:0.3523


Epoch 14/150 [Training]: 100%|██████████| 258/258 [04:19<00:00,  1.00s/it, loss=0.0251]
Epoch 14/150 [Validation]: 100%|██████████| 2/2 [00:01<00:00,  1.35it/s, loss=0.0387]
100%|██████████| 15/15 [00:34<00:00,  2.30s/it]


train-epoch-loss:0.0251 valid-beta4-score:0.3571


Epoch 15/150 [Training]: 100%|██████████| 258/258 [04:44<00:00,  1.10s/it, loss=0.0244]
Epoch 15/150 [Validation]: 100%|██████████| 2/2 [00:01<00:00,  1.36it/s, loss=0.0177]
100%|██████████| 15/15 [00:35<00:00,  2.34s/it]


train-epoch-loss:0.0244 valid-beta4-score:0.3688


Epoch 16/150 [Training]: 100%|██████████| 258/258 [04:19<00:00,  1.01s/it, loss=0.0268]
Epoch 16/150 [Validation]: 100%|██████████| 2/2 [00:01<00:00,  1.36it/s, loss=0.0097]
100%|██████████| 15/15 [00:36<00:00,  2.41s/it]


train-epoch-loss:0.0268 valid-beta4-score:0.3913


Epoch 17/150 [Training]: 100%|██████████| 258/258 [04:23<00:00,  1.02s/it, loss=0.0288]
Epoch 17/150 [Validation]: 100%|██████████| 2/2 [00:01<00:00,  1.37it/s, loss=0.0301]
100%|██████████| 15/15 [00:34<00:00,  2.31s/it]


train-epoch-loss:0.0288 valid-beta4-score:0.3634


Epoch 18/150 [Training]: 100%|██████████| 258/258 [04:09<00:00,  1.03it/s, loss=0.0256]
Epoch 18/150 [Validation]: 100%|██████████| 2/2 [00:01<00:00,  1.36it/s, loss=0.0045]
100%|██████████| 15/15 [00:32<00:00,  2.17s/it]


train-epoch-loss:0.0256 valid-beta4-score:0.3466


Epoch 19/150 [Training]: 100%|██████████| 258/258 [04:34<00:00,  1.06s/it, loss=0.0271]
Epoch 19/150 [Validation]: 100%|██████████| 2/2 [00:01<00:00,  1.37it/s, loss=0.0138]
100%|██████████| 15/15 [00:34<00:00,  2.31s/it]


train-epoch-loss:0.0271 valid-beta4-score:0.3488


Epoch 20/150 [Training]: 100%|██████████| 258/258 [04:12<00:00,  1.02it/s, loss=0.0225]
Epoch 20/150 [Validation]: 100%|██████████| 2/2 [00:01<00:00,  1.37it/s, loss=0.0021]
100%|██████████| 15/15 [00:35<00:00,  2.35s/it]


train-epoch-loss:0.0225 valid-beta4-score:0.3858


Epoch 21/150 [Training]: 100%|██████████| 258/258 [04:23<00:00,  1.02s/it, loss=0.0261]
Epoch 21/150 [Validation]: 100%|██████████| 2/2 [00:01<00:00,  1.39it/s, loss=0.0223]
100%|██████████| 15/15 [00:34<00:00,  2.28s/it]


train-epoch-loss:0.0261 valid-beta4-score:0.3628


Epoch 22/150 [Training]: 100%|██████████| 258/258 [04:15<00:00,  1.01it/s, loss=0.0236]
Epoch 22/150 [Validation]: 100%|██████████| 2/2 [00:01<00:00,  1.38it/s, loss=0.0044]
100%|██████████| 15/15 [00:35<00:00,  2.40s/it]


train-epoch-loss:0.0236 valid-beta4-score:0.3590


Epoch 23/150 [Training]: 100%|██████████| 258/258 [04:10<00:00,  1.03it/s, loss=0.0275]
Epoch 23/150 [Validation]: 100%|██████████| 2/2 [00:01<00:00,  1.37it/s, loss=0.0193]
100%|██████████| 15/15 [00:35<00:00,  2.35s/it]


train-epoch-loss:0.0275 valid-beta4-score:0.3699


Epoch 24/150 [Training]: 100%|██████████| 258/258 [04:05<00:00,  1.05it/s, loss=0.0273]
Epoch 24/150 [Validation]: 100%|██████████| 2/2 [00:01<00:00,  1.38it/s, loss=0.0303]
100%|██████████| 15/15 [00:40<00:00,  2.70s/it]


train-epoch-loss:0.0273 valid-beta4-score:0.3695


Epoch 25/150 [Training]: 100%|██████████| 258/258 [04:06<00:00,  1.05it/s, loss=0.0244]
Epoch 25/150 [Validation]: 100%|██████████| 2/2 [00:01<00:00,  1.41it/s, loss=0.0008]
100%|██████████| 15/15 [00:34<00:00,  2.33s/it]


train-epoch-loss:0.0244 valid-beta4-score:0.3497


Epoch 26/150 [Training]: 100%|██████████| 258/258 [04:24<00:00,  1.03s/it, loss=0.0237]
Epoch 26/150 [Validation]: 100%|██████████| 2/2 [00:01<00:00,  1.39it/s, loss=0.0046]
100%|██████████| 15/15 [00:34<00:00,  2.33s/it]


train-epoch-loss:0.0237 valid-beta4-score:0.3891


Epoch 27/150 [Training]: 100%|██████████| 258/258 [04:21<00:00,  1.01s/it, loss=0.0234]
Epoch 27/150 [Validation]: 100%|██████████| 2/2 [00:01<00:00,  1.36it/s, loss=0.0234]
100%|██████████| 15/15 [00:35<00:00,  2.36s/it]


train-epoch-loss:0.0234 valid-beta4-score:0.3701


Epoch 28/150 [Training]: 100%|██████████| 258/258 [04:15<00:00,  1.01it/s, loss=0.0236]
Epoch 28/150 [Validation]: 100%|██████████| 2/2 [00:01<00:00,  1.38it/s, loss=0.0132]
100%|██████████| 15/15 [00:35<00:00,  2.36s/it]


train-epoch-loss:0.0236 valid-beta4-score:0.3971


Epoch 29/150 [Training]: 100%|██████████| 258/258 [05:03<00:00,  1.18s/it, loss=0.0251]
Epoch 29/150 [Validation]: 100%|██████████| 2/2 [00:01<00:00,  1.31it/s, loss=0.0024]
100%|██████████| 15/15 [00:34<00:00,  2.32s/it]


train-epoch-loss:0.0251 valid-beta4-score:0.3904


Epoch 30/150 [Training]: 100%|██████████| 258/258 [04:24<00:00,  1.02s/it, loss=0.0240]
Epoch 30/150 [Validation]: 100%|██████████| 2/2 [00:01<00:00,  1.38it/s, loss=0.0014]
100%|██████████| 15/15 [00:35<00:00,  2.38s/it]


train-epoch-loss:0.0240 valid-beta4-score:0.3588


Epoch 31/150 [Training]: 100%|██████████| 258/258 [04:27<00:00,  1.04s/it, loss=0.0229]
Epoch 31/150 [Validation]: 100%|██████████| 2/2 [00:01<00:00,  1.39it/s, loss=0.0264]
100%|██████████| 15/15 [00:36<00:00,  2.41s/it]


train-epoch-loss:0.0229 valid-beta4-score:0.3878


Epoch 32/150 [Training]: 100%|██████████| 258/258 [04:17<00:00,  1.00it/s, loss=0.0235]
Epoch 32/150 [Validation]: 100%|██████████| 2/2 [00:01<00:00,  1.41it/s, loss=0.0141]
100%|██████████| 15/15 [00:35<00:00,  2.39s/it]


train-epoch-loss:0.0235 valid-beta4-score:0.4006


Epoch 33/150 [Training]: 100%|██████████| 258/258 [04:15<00:00,  1.01it/s, loss=0.0239]
Epoch 33/150 [Validation]: 100%|██████████| 2/2 [00:01<00:00,  1.37it/s, loss=0.0363]
100%|██████████| 15/15 [00:35<00:00,  2.37s/it]


train-epoch-loss:0.0239 valid-beta4-score:0.3954


Epoch 34/150 [Training]: 100%|██████████| 258/258 [04:20<00:00,  1.01s/it, loss=0.0232]
Epoch 34/150 [Validation]: 100%|██████████| 2/2 [00:01<00:00,  1.39it/s, loss=0.0009]
100%|██████████| 15/15 [00:35<00:00,  2.39s/it]


train-epoch-loss:0.0232 valid-beta4-score:0.3620


Epoch 35/150 [Training]: 100%|██████████| 258/258 [04:17<00:00,  1.00it/s, loss=0.0240]
Epoch 35/150 [Validation]: 100%|██████████| 2/2 [00:01<00:00,  1.40it/s, loss=0.0024]
100%|██████████| 15/15 [00:35<00:00,  2.37s/it]


train-epoch-loss:0.0240 valid-beta4-score:0.3804


Epoch 36/150 [Training]: 100%|██████████| 258/258 [04:27<00:00,  1.04s/it, loss=0.0245]
Epoch 36/150 [Validation]: 100%|██████████| 2/2 [00:01<00:00,  1.35it/s, loss=0.0171]
100%|██████████| 15/15 [00:35<00:00,  2.39s/it]


train-epoch-loss:0.0245 valid-beta4-score:0.3790


Epoch 37/150 [Training]: 100%|██████████| 258/258 [04:22<00:00,  1.02s/it, loss=0.0227]
Epoch 37/150 [Validation]: 100%|██████████| 2/2 [00:01<00:00,  1.39it/s, loss=0.0148]
100%|██████████| 15/15 [00:35<00:00,  2.38s/it]


train-epoch-loss:0.0227 valid-beta4-score:0.3838


Epoch 38/150 [Training]: 100%|██████████| 258/258 [04:15<00:00,  1.01it/s, loss=0.0239]
Epoch 38/150 [Validation]: 100%|██████████| 2/2 [00:01<00:00,  1.39it/s, loss=0.0411]
100%|██████████| 15/15 [00:36<00:00,  2.41s/it]


train-epoch-loss:0.0239 valid-beta4-score:0.3835


Epoch 39/150 [Training]: 100%|██████████| 258/258 [04:28<00:00,  1.04s/it, loss=0.0254]
Epoch 39/150 [Validation]: 100%|██████████| 2/2 [00:01<00:00,  1.37it/s, loss=0.0212]
100%|██████████| 15/15 [00:36<00:00,  2.42s/it]


train-epoch-loss:0.0254 valid-beta4-score:0.3617


Epoch 40/150 [Training]: 100%|██████████| 258/258 [04:31<00:00,  1.05s/it, loss=0.0229]
Epoch 40/150 [Validation]: 100%|██████████| 2/2 [00:01<00:00,  1.33it/s, loss=0.0180]
100%|██████████| 15/15 [00:36<00:00,  2.43s/it]


train-epoch-loss:0.0229 valid-beta4-score:0.3998


Epoch 41/150 [Training]: 100%|██████████| 258/258 [04:23<00:00,  1.02s/it, loss=0.0229]
Epoch 41/150 [Validation]: 100%|██████████| 2/2 [00:01<00:00,  1.37it/s, loss=0.0011]
100%|██████████| 15/15 [00:36<00:00,  2.41s/it]


train-epoch-loss:0.0229 valid-beta4-score:0.3792


Epoch 42/150 [Training]: 100%|██████████| 258/258 [04:26<00:00,  1.03s/it, loss=0.0212]
Epoch 42/150 [Validation]: 100%|██████████| 2/2 [00:01<00:00,  1.36it/s, loss=0.0098]
100%|██████████| 15/15 [00:36<00:00,  2.41s/it]


train-epoch-loss:0.0212 valid-beta4-score:0.3988


Epoch 43/150 [Training]: 100%|██████████| 258/258 [04:24<00:00,  1.03s/it, loss=0.0206]
Epoch 43/150 [Validation]: 100%|██████████| 2/2 [00:01<00:00,  1.39it/s, loss=0.0054]
100%|██████████| 15/15 [00:36<00:00,  2.40s/it]


train-epoch-loss:0.0206 valid-beta4-score:0.4125


Epoch 44/150 [Training]: 100%|██████████| 258/258 [04:12<00:00,  1.02it/s, loss=0.0218]
Epoch 44/150 [Validation]: 100%|██████████| 2/2 [00:01<00:00,  1.40it/s, loss=0.0025]
100%|██████████| 15/15 [00:36<00:00,  2.40s/it]


train-epoch-loss:0.0218 valid-beta4-score:0.3829


Epoch 45/150 [Training]: 100%|██████████| 258/258 [04:04<00:00,  1.06it/s, loss=0.0197]
Epoch 45/150 [Validation]: 100%|██████████| 2/2 [00:01<00:00,  1.40it/s, loss=0.0299]
100%|██████████| 15/15 [00:35<00:00,  2.40s/it]


train-epoch-loss:0.0197 valid-beta4-score:0.3316


Epoch 46/150 [Training]: 100%|██████████| 258/258 [04:19<00:00,  1.01s/it, loss=0.0209]
Epoch 46/150 [Validation]: 100%|██████████| 2/2 [00:01<00:00,  1.38it/s, loss=0.0268]
100%|██████████| 15/15 [00:36<00:00,  2.40s/it]


train-epoch-loss:0.0209 valid-beta4-score:0.3727


Epoch 47/150 [Training]: 100%|██████████| 258/258 [04:08<00:00,  1.04it/s, loss=0.0224]
Epoch 47/150 [Validation]: 100%|██████████| 2/2 [00:01<00:00,  1.40it/s, loss=0.0145]
100%|██████████| 15/15 [00:35<00:00,  2.36s/it]


train-epoch-loss:0.0224 valid-beta4-score:0.3963


Epoch 48/150 [Training]: 100%|██████████| 258/258 [04:11<00:00,  1.03it/s, loss=0.0233]
Epoch 48/150 [Validation]: 100%|██████████| 2/2 [00:01<00:00,  1.39it/s, loss=0.0298]
100%|██████████| 15/15 [00:35<00:00,  2.37s/it]


train-epoch-loss:0.0233 valid-beta4-score:0.3691


Epoch 49/150 [Training]: 100%|██████████| 258/258 [04:28<00:00,  1.04s/it, loss=0.0237]
Epoch 49/150 [Validation]: 100%|██████████| 2/2 [00:01<00:00,  1.35it/s, loss=0.0271]
100%|██████████| 15/15 [00:35<00:00,  2.38s/it]


train-epoch-loss:0.0237 valid-beta4-score:0.4031


Epoch 50/150 [Training]: 100%|██████████| 258/258 [04:21<00:00,  1.01s/it, loss=0.0237]
Epoch 50/150 [Validation]: 100%|██████████| 2/2 [00:01<00:00,  1.38it/s, loss=0.0251]
100%|██████████| 15/15 [00:35<00:00,  2.40s/it]


train-epoch-loss:0.0237 valid-beta4-score:0.4094


Epoch 51/150 [Training]: 100%|██████████| 258/258 [04:13<00:00,  1.02it/s, loss=0.0239]
Epoch 51/150 [Validation]: 100%|██████████| 2/2 [00:01<00:00,  1.37it/s, loss=0.0015]
100%|██████████| 15/15 [00:36<00:00,  2.42s/it]


train-epoch-loss:0.0239 valid-beta4-score:0.3721


Epoch 52/150 [Training]: 100%|██████████| 258/258 [03:58<00:00,  1.08it/s, loss=0.0243]
Epoch 52/150 [Validation]: 100%|██████████| 2/2 [00:01<00:00,  1.37it/s, loss=0.0199]
100%|██████████| 15/15 [00:36<00:00,  2.41s/it]


train-epoch-loss:0.0243 valid-beta4-score:0.4014


Epoch 53/150 [Training]: 100%|██████████| 258/258 [04:23<00:00,  1.02s/it, loss=0.0208]
Epoch 53/150 [Validation]: 100%|██████████| 2/2 [00:01<00:00,  1.37it/s, loss=0.0153]
100%|██████████| 15/15 [00:35<00:00,  2.38s/it]


train-epoch-loss:0.0208 valid-beta4-score:0.3916


Epoch 54/150 [Training]:  69%|██████▉   | 178/258 [03:13<01:51,  1.39s/it, loss=0.0222]

In [None]:
# train_lossとvalid_lossのプロット

plt.plot(grand_train_loss, label="train_loss")
plt.plot(grand_valid_loss, label="valid_loss")
plt.legend()
plt.show()

In [None]:
# train_scoreとvalid_scoreのプロット
plt.plot(grand_train_score, label="train_score")
plt.plot(grand_valid_score, label="valid_score")
plt.legend()
plt.show()

In [None]:
random.random()