## Carga módulo común

In [1]:
import sys
import os
sys.path.append(os.path.abspath('../../common'))

In [2]:
import torch
import torch.nn as nn
import torch.nn.functional as F

from purrfect.dataset import load_partition,save_partition, create_train_valid_loaders, RandomTransform

from purrfect.training import train_model
import torch.optim as optim

from purrfect.active_learning import create_new_partition, test_model

from sklearn.model_selection import train_test_split
#from purrfect.submission import create_submission

In [3]:
# Prefer CUDA when a GPU is visible; otherwise everything runs on the CPU.
DEVICE = torch.device('cuda') if torch.cuda.is_available() else torch.device('cpu')
# Mini-batch size handed to the data loaders and to test_model.
BATCH_SIZE = 2 * 32
# Forwarded to train_model as use_autocast.
USE_AUTOCAST = True
# Early-stopping settings forwarded to train_model.
EARLY_STOPPING_PATIENCE = 5
EARLY_STOPPING_GRACE_PERIOD = 8

## Definición modelo

In [4]:
class GradientMagnitude(nn.Module):
    """Per-channel Sobel gradient magnitude of a 4-D feature map.

    The two 3x3 Sobel kernels are stored as non-persistent buffers: they
    follow the module through ``.to()`` / ``.cuda()`` / ``.double()`` but add
    no keys to ``state_dict()``, so checkpoints written when the kernels were
    plain attributes still load with strict key matching.
    """

    def __init__(self):
        super(GradientMagnitude, self).__init__()
        # Sobel filters for the horizontal (x) and vertical (y) derivative.
        sobel_x = torch.tensor([[-1, 0, 1], [-2, 0, 2], [-1, 0, 1]], dtype=torch.float32)
        sobel_y = torch.tensor([[-1, -2, -1], [0, 0, 0], [1, 2, 1]], dtype=torch.float32)

        # conv2d weights are (out_channels, in_channels / groups, kH, kW);
        # forward() expands these single filters to one filter per channel.
        self.register_buffer("sobel_x", sobel_x.view(1, 1, 3, 3), persistent=False)
        self.register_buffer("sobel_y", sobel_y.view(1, 1, 3, 3), persistent=False)

    def forward(self, x):
        """Return sqrt(gx**2 + gy**2) for every channel of ``x``.

        Args:
            x: tensor of shape (B, C, H, W).

        Returns:
            Tensor with the same shape as ``x`` (3x3 kernel, padding=1).
        """
        channels = x.shape[1]

        # Match the input's device and dtype so the module also works when the
        # input lives somewhere other than where the module was constructed.
        kernel_x = self.sobel_x.to(device=x.device, dtype=x.dtype).expand(channels, 1, 3, 3)
        kernel_y = self.sobel_y.to(device=x.device, dtype=x.dtype).expand(channels, 1, 3, 3)

        # groups=C applies the same filter to each channel independently.
        grad_x = F.conv2d(x, kernel_x, groups=channels, padding=1)
        grad_y = F.conv2d(x, kernel_y, groups=channels, padding=1)

        return torch.sqrt(grad_x**2 + grad_y**2)
def aggregate_similarity_cosine(tensor):
    """Summarise how each pixel's vector aligns with its four direct neighbours.

    For every position the dot product over the channel dimension is taken
    with the pixel above, below, left and right. Neighbours that fall outside
    the map are zero vectors, so their dot product is 0. When ``tensor`` is
    unit-normalised along dim 1 these dot products are cosine similarities.

    Args:
        tensor: 4-D tensor (B, C, H, W); dim 1 holds the vector components.

    Returns:
        Tensor of shape (B, 2, H, W): channel 0 is the largest and channel 1
        the smallest of the four neighbour dot products.
    """
    # One zero border on every side lets each neighbour be read as a slice.
    padded = F.pad(tensor, (1, 1, 1, 1))
    neighbour_views = (
        padded[:, :, 2:, 1:-1],   # row i + 1
        padded[:, :, :-2, 1:-1],  # row i - 1
        padded[:, :, 1:-1, 2:],   # column j + 1
        padded[:, :, 1:-1, :-2],  # column j - 1
    )

    # (B, 1, H, W, 4): one dot product per neighbour.
    dots = torch.stack(
        [(tensor * neighbour).sum(dim=1, keepdim=True) for neighbour in neighbour_views],
        dim=4,
    )

    strongest = dots.max(dim=4).values  # (B, 1, H, W)
    weakest = dots.min(dim=4).values    # (B, 1, H, W)
    return torch.cat((strongest, weakest), dim=1)
class ChannelAdder(nn.Module):
    """Expand the first two input channels into a 10-channel feature stack.

    Only channels 0 and 1 of the input (called ``e`` below) are used; any
    further input channels are ignored. Output channel layout:

        0-1  e                      (the two components, unchanged)
        2    magnitude              (L2 norm of e over the channel axis)
        3    angle                  (0.5 * atan2(e[0], e[1]))
        4-5  e_norm                 (e divided by its magnitude)
        6-7  Sobel gradient magnitude of each component of e
        8-9  max / min dot product of e_norm with its four neighbours

    Args:
        eps: lower bound applied to the magnitude before dividing, so pixels
            where both components are exactly zero give ``e_norm == 0``
            instead of NaN.
    """

    def __init__(self, eps=1e-12):
        super(ChannelAdder, self).__init__()
        self.eps = eps
        self.grad_magnitude = GradientMagnitude()

    def forward(self, x):
        """Return the (B, 10, H, W) feature stack for ``x`` of shape (B, >=2, H, W)."""
        e = x[:, :2, :, :]  # (B, 2, H, W)

        magnitude = torch.norm(e, dim=1, keepdim=True)  # (B, 1, H, W)

        # NOTE(review): atan2 receives channel 0 as the "y" argument and
        # channel 1 as the "x" argument; confirm this ordering is intended.
        angle = 0.5 * torch.atan2(e[:, 0, :, :], e[:, 1, :, :]).unsqueeze(1)  # (B, 1, H, W)

        # Clamp the divisor: 0 / 0 would put NaNs into every later layer.
        e_norm = e / magnitude.clamp_min(self.eps)

        similarity = aggregate_similarity_cosine(e_norm)  # (B, 2, H, W): max, min

        return torch.cat([
            e,
            magnitude,
            angle,
            e_norm,
            self.grad_magnitude(e),
            similarity,
        ], dim=1)

In [5]:
# Momentum handed to every nn.BatchNorm2d created by ConBnRelu.
BN_MOMENTUM = 0.1


def kaiming_init(module,
                 a=0,
                 mode='fan_out',
                 nonlinearity='relu',
                 bias=0,
                 distribution='normal'):
    """Kaiming-initialise ``module.weight`` and set its bias to a constant.

    Args:
        module: object exposing ``weight`` and, optionally, ``bias``.
        a, mode, nonlinearity: forwarded to the ``nn.init.kaiming_*_`` call.
        bias: constant written into ``module.bias`` when it exists and is not None.
        distribution: ``'uniform'`` or ``'normal'``.

    Raises:
        AssertionError: if ``distribution`` is neither of the two options.
    """
    assert distribution in ['uniform', 'normal']

    initialisers = {
        'uniform': nn.init.kaiming_uniform_,
        'normal': nn.init.kaiming_normal_,
    }
    initialisers[distribution](module.weight, a=a, mode=mode, nonlinearity=nonlinearity)

    bias_param = getattr(module, 'bias', None)
    if bias_param is not None:
        nn.init.constant_(bias_param, bias)
class PA(nn.Module):
    """Attention gate: two sigmoid masks are computed from ``y`` and multiplied onto ``x``.

    ``spatial_pool_mask`` yields one weight per channel ([N, planes, 1, 1]) and
    ``channel_pool_mask`` yields one weight per position ([N, 1, H, W]); note
    that the method names are the reverse of the mask shapes they return.

    Args:
        inplanes: channel count of the tensor the masks are computed from.
        planes: channel count of the per-channel mask; ``planes // 2`` is the
            internal width of the query/value projections.
        kernel_size: stored (together with the derived ``padding``) but not
            used by any layer built here; every convolution is 1x1.
        stride: stride of the four 1x1 query/value convolutions.
            NOTE(review): with stride != 1 the masks would have a smaller
            spatial size than the input; only stride=1 is used in this file.
    """

    def __init__(self, inplanes, planes, kernel_size=1, stride=1):
        super(PA, self).__init__()

        self.inplanes = inplanes
        self.inter_planes = planes // 2
        self.planes = planes
        self.kernel_size = kernel_size
        self.stride = stride
        self.padding = (kernel_size - 1) // 2
        # Channel reduction factor inside conv_up.
        ratio = 4

        # "Right" branch: produces the per-channel mask.
        self.conv_q_right = nn.Conv2d(self.inplanes, 1, kernel_size=1, stride=stride, padding=0, bias=False)
        self.conv_v_right = nn.Conv2d(self.inplanes, self.inter_planes, kernel_size=1, stride=stride, padding=0,
                                      bias=False)
        # Earlier single-conv variant, kept for reference:
        # self.conv_up = nn.Conv2d(self.inter_planes, self.planes, kernel_size=1, stride=1, padding=0, bias=False)
        self.conv_up = nn.Sequential(
            nn.Conv2d(self.inter_planes, self.inter_planes // ratio, kernel_size=1),
            nn.LayerNorm([self.inter_planes // ratio, 1, 1]),
            nn.ReLU(inplace=True),
            nn.Conv2d(self.inter_planes // ratio, self.planes, kernel_size=1)
        )
        # Applied to a [N, 1, H*W] tensor, i.e. normalises over positions.
        self.softmax_right = nn.Softmax(dim=2)
        self.sigmoid = nn.Sigmoid()

        # "Left" branch: produces the per-position mask.
        self.conv_q_left = nn.Conv2d(self.inplanes, self.inter_planes, kernel_size=1, stride=stride, padding=0,
                                     bias=False)  # g
        self.avg_pool = nn.AdaptiveAvgPool2d(1)
        self.conv_v_left = nn.Conv2d(self.inplanes, self.inter_planes, kernel_size=1, stride=stride, padding=0,
                                     bias=False)  # theta
        # Applied to a [N, IC, H*W] tensor, i.e. normalises over positions.
        self.softmax_left = nn.Softmax(dim=2)

        self.reset_parameters()
    def reset_parameters(self):
        """Kaiming-initialise (fan_in) the four bias-free query/value convolutions.

        The layers inside ``conv_up`` keep PyTorch's default initialisation.
        """
        kaiming_init(self.conv_q_right, mode='fan_in')
        kaiming_init(self.conv_v_right, mode='fan_in')
        kaiming_init(self.conv_q_left, mode='fan_in')
        kaiming_init(self.conv_v_left, mode='fan_in')

        # Marker attributes; nothing in this file reads them.
        self.conv_q_right.inited = True
        self.conv_v_right.inited = True
        self.conv_q_left.inited = True
        self.conv_v_left.inited = True

    def spatial_pool_mask(self, x):
        """Return a per-channel sigmoid mask of shape [N, planes, 1, 1] computed from ``x``.

        The value projection is pooled over all positions with softmax
        weights from the query projection, then passed through ``conv_up``.
        """
        input_x = self.conv_v_right(x)

        batch, channel, height, width = input_x.size()

        # [N, IC, H*W]
        input_x = input_x.view(batch, channel, height * width)

        # [N, 1, H, W]
        context_mask = self.conv_q_right(x)

        # [N, 1, H*W]
        context_mask = context_mask.view(batch, 1, height * width)

        # [N, 1, H*W], softmax over the H*W positions
        context_mask = self.softmax_right(context_mask)

        # [N, IC, 1]: softmax-weighted sum of the values over positions
        # context = torch.einsum('ndw,new->nde', input_x, context_mask)
        context = torch.matmul(input_x, context_mask.transpose(1, 2))

        # [N, IC, 1, 1]
        context = context.unsqueeze(-1)

        # [N, OC, 1, 1]
        context = self.conv_up(context)

        # [N, OC, 1, 1]
        mask_ch = self.sigmoid(context)
        return mask_ch

    def channel_pool_mask(self, x):
        """Return a per-position sigmoid mask of shape [N, 1, H, W] computed from ``x``.

        The globally average-pooled query ([N, 1, IC]) is multiplied with the
        position-softmaxed value projection ([N, IC, H*W]).
        """
        # [N, IC, H, W]
        g_x = self.conv_q_left(x)

        batch, channel, height, width = g_x.size()

        # [N, IC, 1, 1]
        avg_x = self.avg_pool(g_x)

        batch, channel, avg_x_h, avg_x_w = avg_x.size()

        # [N, 1, IC]
        avg_x = avg_x.view(batch, channel, avg_x_h * avg_x_w).permute(0, 2, 1)

        # [N, IC, H*W]
        theta_x = self.conv_v_left(x).view(batch, self.inter_planes, height * width)

        # [N, IC, H*W], softmax over the H*W positions of each channel
        theta_x = self.softmax_left(theta_x)

        # [N, 1, H*W]
        # context = torch.einsum('nde,new->ndw', avg_x, theta_x)
        context = torch.matmul(avg_x, theta_x)

        # [N, 1, H, W]
        context = context.view(batch, 1, height, width)

        # [N, 1, H, W]
        mask_sp = self.sigmoid(context)
        return mask_sp
    def forward(self, x, y):
        """Gate ``x`` with the two masks computed from ``y``.

        ``sp_mask`` is the [N, planes, 1, 1] mask and ``ch_mask`` the
        [N, 1, H, W] mask (variable names follow the method names, not the
        shapes). The product relies on broadcasting against ``x``.
        """
        sp_mask = self.spatial_pool_mask(y)
        ch_mask = self.channel_pool_mask(y)
        return x * sp_mask * ch_mask
    

class PSA(nn.Module):
    """Self-attention wrapper around PA: the input gates itself."""

    def __init__(self, inplanes, planes, kernel_size=1, stride=1):
        super().__init__()
        self.pa = PA(inplanes, planes, kernel_size=kernel_size, stride=stride)

    def forward(self, x):
        # The same tensor is both the one being gated and the mask source.
        gated = self.pa(x, x)
        return gated

class ConBnRelu(nn.Module):
    """Conv2d followed by an optional BatchNorm2d and an optional ReLU.

    ``self.output`` is, depending on the flags:
        use_bn and use_relu -> Sequential(BatchNorm2d, ReLU)
        use_bn only         -> BatchNorm2d
        use_relu only       -> ReLU
        neither             -> Identity
    """

    def __init__(self, in_channels, out_channels, kernel_size, stride=1, padding=0, dilation=1,bias=True,use_bn=False,use_relu=True):
        super().__init__()

        self.conv = nn.Conv2d(
            in_channels,
            out_channels,
            kernel_size=kernel_size,
            stride=stride,
            padding=padding,
            dilation=dilation,
            bias=bias,
        )

        if use_bn:
            norm = nn.BatchNorm2d(out_channels, momentum=BN_MOMENTUM)
            self.output = nn.Sequential(norm, nn.ReLU(inplace=True)) if use_relu else norm
        else:
            self.output = nn.ReLU(inplace=True) if use_relu else nn.Identity()

    def forward(self, x):
        convolved = self.conv(x)
        return self.output(convolved)
class ResBlock(nn.Module):
    """1x1 channel rescale followed by two residual 3x3 branches.

    Each branch is ConBnRelu(+ReLU) -> [PSA] -> ConBnRelu(no ReLU); the PSA
    layer is present only when ``use_attention`` is true. The branch output is
    added to its input and passed through ReLU.
    """

    expansion = 1

    def __init__(self, in_channels, out_channels, use_attention=False):
        super().__init__()
        self.rescale = nn.Conv2d(in_channels, out_channels, kernel_size=1, stride=1, padding=0, bias=True)

        # seq1 is built completely before seq2 so parameters are created (and
        # randomly initialised) in the same order as the explicit version.
        self.seq1 = self._make_branch(out_channels, use_attention)
        self.seq2 = self._make_branch(out_channels, use_attention)

    @staticmethod
    def _make_branch(channels, use_attention):
        """Build one residual branch operating at a fixed channel width."""
        conv_kwargs = dict(kernel_size=3, stride=1, padding=1, bias=True)
        layers = [ConBnRelu(channels, channels, **conv_kwargs)]
        if use_attention:
            layers.append(PSA(channels, channels))
        layers.append(ConBnRelu(channels, channels, use_relu=False, **conv_kwargs))
        return nn.Sequential(*layers)

    def forward(self, x):
        out = self.rescale(x)
        for branch in (self.seq1, self.seq2):
            out = F.relu(branch(out) + out, inplace=True)
        return out

class UNetEncoder(nn.Module):
    """Four-stage encoder; each stage is AvgPool2d(2) followed by a ResBlock.

    Channel widths go i_ch -> 2*i_ch -> 4*i_ch -> 8*i_ch -> 16*i_ch while each
    stage's pooling halves the spatial size.
    """

    def __init__(self, i_ch=16):
        super().__init__()
        widths = [i_ch * factor for factor in (1, 2, 4, 8, 16)]
        self.encoder1 = self._stage(widths[0], widths[1])
        self.encoder2 = self._stage(widths[1], widths[2])
        self.encoder3 = self._stage(widths[2], widths[3])
        self.encoder4 = self._stage(widths[3], widths[4])

    @staticmethod
    def _stage(in_ch, out_ch):
        """Downsample by 2, then change the channel width with a ResBlock."""
        return nn.Sequential(nn.AvgPool2d(2), ResBlock(in_ch, out_ch))

    def forward(self, x):
        """Return the outputs of all four stages, shallowest first."""
        skips = []
        features = x
        for stage in (self.encoder1, self.encoder2, self.encoder3, self.encoder4):
            features = stage(features)
            skips.append(features)
        return tuple(skips)
class UNetDecoder(nn.Module):
    """Four-level decoder with attention-gated skip connections.

    At level n (4 down to 1), with w_n = i_ch * (16, 8, 4, 2):
        attention{n}: PA(w_n, w_n)               gates the skip using the decoder features
        upconv{n}:    ConvTranspose2d(2*w_n, w_n) doubles the spatial size
        decoder{n}:   ResBlock(w_n, w_n / 2)      halves the channel width
    """

    # (level number, channel multiplier) from deepest to shallowest.
    _LEVELS = ((4, 16), (3, 8), (2, 4), (1, 2))

    def __init__(self, i_ch=16):
        super().__init__()
        # Modules are registered in the order attention, upconv, decoder for
        # each level, deepest level first.
        for level, mult in self._LEVELS:
            width = i_ch * mult
            setattr(self, f"attention{level}", PA(width, width))
            setattr(self, f"upconv{level}", nn.ConvTranspose2d(width * 2, width, kernel_size=2, stride=2))
            setattr(self, f"decoder{level}", ResBlock(width, i_ch * (mult // 2)))

    def forward(self, x, e1, e2, e3, e4):
        """Decode bottleneck features ``x`` using skips ``e1`` (shallowest) .. ``e4`` (deepest)."""
        features = x
        for (level, _), skip in zip(self._LEVELS, (e4, e3, e2, e1)):
            gated_skip = getattr(self, f"attention{level}")(skip, features)
            merged = torch.cat((gated_skip, features), dim=1)
            upsampled = getattr(self, f"upconv{level}")(merged)
            features = getattr(self, f"decoder{level}")(upsampled)
        return features
class UNetBottleneck(nn.Module):
    """Two stacked ResBlocks at a constant width of ``input_ch * 16`` channels."""

    def __init__(self,input_ch=16):
        super().__init__()
        width = input_ch * 16
        self.bottleneck = nn.Sequential(*(ResBlock(width, width) for _ in range(2)))

    def forward(self, x):
        refined = self.bottleneck(x)
        return refined
class MultiHeadUNet(nn.Module):
    """U-Net with five independent embedder+encoder heads and one shared decoder.

    Each of the five inputs goes through its own ``embedder{k}`` (two
    ResBlocks) and ``encoder{k}`` (UNetEncoder). At each of the four encoder
    levels the five heads are concatenated on the channel axis and reduced
    back to a single head's width by a 1x1 ``compress_e{level}`` convolution.
    The fused features feed the bottleneck, the decoder and a final 1x1
    output convolution.
    """

    _HEADS = (1, 2, 3, 4, 5)

    def __init__(self, in_channels, out_channels, i_ch=16):
        super().__init__()

        # Registration order: all embedders, then all encoders, then the
        # compress convolutions, bottleneck, decoder and output layer.
        for head in self._HEADS:
            setattr(self, f"embedder{head}", nn.Sequential(
                ResBlock(in_channels, i_ch),
                ResBlock(i_ch, i_ch),
            ))
        for head in self._HEADS:
            setattr(self, f"encoder{head}", UNetEncoder(i_ch))

        for level, mult in enumerate((2, 4, 8, 16), start=1):
            setattr(self, f"compress_e{level}", nn.Conv2d(i_ch * mult * 5, i_ch * mult, kernel_size=1))

        self.bottleneck = UNetBottleneck(i_ch)
        self.decoder = UNetDecoder(i_ch)
        self.output = nn.Conv2d(i_ch, out_channels, kernel_size=1)

    def freeze_encoder(self,freeze=True):
        """Set ``requires_grad = not freeze`` on every parameter of the five encoders.

        The embedders, compress convolutions, bottleneck, decoder and output
        layer are not touched.
        """
        trainable = not freeze
        for head in self._HEADS:
            for param in getattr(self, f"encoder{head}").parameters():
                param.requires_grad = trainable

    def forward(self, x1,x2,x3,x4,x5):
        # per_head[k] is the (e1, e2, e3, e4) tuple produced by head k.
        per_head = [
            getattr(self, f"encoder{head}")(getattr(self, f"embedder{head}")(inp))
            for head, inp in zip(self._HEADS, (x1, x2, x3, x4, x5))
        ]

        # zip(*per_head) regroups by level: one 5-tuple of head outputs per level.
        fused = [
            getattr(self, f"compress_e{level}")(torch.cat(level_feats, dim=1))
            for level, level_feats in enumerate(zip(*per_head), start=1)
        ]
        e1, e2, e3, e4 = fused

        b = self.bottleneck(e4)
        d = self.decoder(b, e1, e2, e3, e4)
        return self.output(d)

class KappaPredictor(nn.Module):
    """Full model: ChannelAdder features -> BatchNorm2d(10) -> five-head U-Net.

    The 10 normalised feature channels are split into five consecutive
    2-channel groups, one per U-Net head; the U-Net emits a single channel.
    """

    def __init__(self):
        super().__init__()
        self.channel_adder = ChannelAdder()
        self.bn = nn.BatchNorm2d(10)
        self.unet = MultiHeadUNet(2, 1,i_ch=8)

    def freeze_encoder(self,freeze=True):
        """Freeze or unfreeze the U-Net encoders; freeze the input BatchNorm when freezing.

        NOTE(review): the BatchNorm parameters are only ever switched off
        here. Calling ``freeze_encoder(False)`` after ``freeze_encoder(True)``
        re-enables the encoders but leaves ``bn`` frozen. Confirm that this
        asymmetry is intended.
        """
        if freeze:
            for param in self.bn.parameters():
                param.requires_grad = False
        self.unet.freeze_encoder(freeze)

    def forward(self, x):
        features = self.bn(self.channel_adder(x))
        x1, x2, x3, x4, x5 = features.split(2, dim=1)
        return self.unet(x1, x2, x3, x4, x5)

## Creación partición inicial

In [6]:
def create_next_partitions(current_partition,k=1):
    """Merge ``k`` raw partition files and write an 80/20 train/validation split.

    Reads ``partition_{k*current_partition + 1}.json`` through
    ``partition_{k*current_partition + k}.json`` with ``load_partition``,
    concatenates their entries, splits them with a fixed random seed (42) and
    saves the two halves as ``partition_{current_partition+1}_train.json`` and
    ``partition_{current_partition+1}_val.json`` in the "partitions" folder.
    """
    first_index = k * current_partition + 1
    samples = []
    for index in range(first_index, first_index + k):
        samples.extend(load_partition(f"partition_{index}.json"))

    train_partition, val_partition = train_test_split(samples, test_size=0.2, random_state=42)

    target = current_partition + 1
    save_partition(f"partition_{target}_train.json","partitions",train_partition)
    save_partition(f"partition_{target}_val.json","partitions",val_partition)

In [7]:
def load_best_model_so_far(model, last_saved_partition):
    """Load into ``model`` the best weights among partitions 1..last_saved_partition.

    For every partition that has both a ``last_checkpoint_partition_{n}.pth``
    and a ``best_model_partition_{n}.pth`` file under ``models/``, the
    checkpoint's ``'best_loss'`` entry is compared; the weights of the
    partition with the lowest loss are loaded. Partitions missing either file
    are skipped. If no partition qualifies, a message is printed and the model
    is left unchanged.

    Args:
        model: module whose ``load_state_dict`` receives the selected weights.
        last_saved_partition: highest partition number to consider (inclusive).
    """
    best_loss = float('inf')
    best_partition = None
    for partition in range(1, last_saved_partition + 1):
        checkpoint_path = f"models/last_checkpoint_partition_{partition}.pth"
        weights_path = f"models/best_model_partition_{partition}.pth"
        if not (os.path.exists(checkpoint_path) and os.path.exists(weights_path)):
            continue
        # SECURITY: weights_only=False unpickles arbitrary Python objects; only
        # use this on checkpoint files written by this project.
        # map_location="cpu" keeps the scan off the GPU and lets checkpoints
        # saved on a CUDA machine be read on a CPU-only one.
        checkpoint = torch.load(checkpoint_path, map_location="cpu", weights_only=False)
        if checkpoint['best_loss'] < best_loss:
            best_loss = checkpoint['best_loss']
            best_partition = partition

    if best_partition is None:
        print("There is no best model saved")
        return

    state_dict = torch.load(
        f"models/best_model_partition_{best_partition}.pth",
        map_location="cpu",
        weights_only=True,
    )
    # load_state_dict copies the values into the model's existing parameters,
    # so the model stays on whatever device it already lives on.
    model.load_state_dict(state_dict)
    print(f"Loaded best model from partition {best_partition} with loss {best_loss}")
def load_last_best_model(model, last_saved_partition):
    """Load the most recent ``best_model_partition_{n}.pth`` that exists.

    Partitions are checked from ``last_saved_partition`` down to 1; the first
    weights file found under ``models/`` is loaded into ``model``. If none
    exists a message is printed and the model is left unchanged.
    """
    for partition in range(last_saved_partition, 0, -1):
        weights_path = f"models/best_model_partition_{partition}.pth"
        if os.path.exists(weights_path):
            # map_location="cpu" lets weights saved on a CUDA machine be read
            # anywhere; load_state_dict then copies them onto the model's device.
            state_dict = torch.load(weights_path, map_location="cpu", weights_only=True)
            model.load_state_dict(state_dict)
            print(f"Loaded best model from partition {partition}")
            return
    print("There is no best model saved")

In [8]:
# Write the train/validation split for partition 1 from the first raw partition file.
create_next_partitions(current_partition=0, k=1)

In [9]:
def many_partitions_v2(start,end,model,criterion,transform=None,full_frecuency=5):
    """Train ``model`` on partitions ``start`` .. ``end - 1``, one after another.

    For each partition:
      1. Choose the training mode. Partitions 1, 1 + full_frecuency,
         1 + 2*full_frecuency, ... train with the encoders unfrozen ("full");
         all others call ``model.freeze_encoder(True)`` ("decoder").
      2. Reload the most recent best weights from an earlier partition, if any.
      3. Build the train/validation split and loaders for this partition.
      4. Train with a fresh SGD optimizer via ``train_model``.
      5. If a best-model file was written, reload it and run ``test_model``.

    Args:
        start: first partition number (inclusive).
        end: last partition number (exclusive).
        model: module exposing ``freeze_encoder(bool)``.
        criterion: loss passed to ``train_model`` and ``test_model``.
        transform: forwarded to ``create_train_valid_loaders``.
        full_frecuency: period, in partitions, of the "full" training mode;
            1 trains the full model on every partition.
    """
    for current_partition in range(start,end):
        # Same schedule as `p % f == 1` for f >= 2, but also correct for
        # f == 1, where `p % 1 == 1` is never true.
        train_full = (current_partition - 1) % full_frecuency == 0
        if train_full:
            print(f"Partition {current_partition}: training full")
        else:
            print(f"Partition {current_partition}: training decoder")
        model.freeze_encoder(not train_full)

        load_last_best_model(model,current_partition-1)
        create_next_partitions(current_partition-1)
        train_loader, val_loader = create_train_valid_loaders(
            f"partition_{current_partition}_train.json",
            f"partition_{current_partition}_val.json",
            "partitions",
            batch_size=BATCH_SIZE,
            transform=transform,
        )
        best_model_path = os.path.join(
            "models", f"best_model_partition_{current_partition}.pth"
        )
        last_checkpoint_path = os.path.join(
            "models", f"last_checkpoint_partition_{current_partition}.pth"
        )

        # Hand the optimizer only the parameters that are actually trainable,
        # so a frozen parameter can never be stepped (e.g. through a gradient
        # left over from a previous partition combined with weight decay).
        trainable_params = [p for p in model.parameters() if p.requires_grad]
        optimizer = optim.SGD(trainable_params, lr=0.01, momentum=0.9, weight_decay=0.0001)

        train_model(
            model,
            train_loader,
            val_loader,
            best_model_path,
            last_checkpoint_path,
            criterion,
            optimizer,
            num_epochs=100,
            device=DEVICE,
            early_stopping_patience=EARLY_STOPPING_PATIENCE,
            use_autocast=USE_AUTOCAST,
            early_stopping_grace_period=EARLY_STOPPING_GRACE_PERIOD,
        )
        if os.path.exists(best_model_path):
            model.load_state_dict(torch.load(best_model_path,weights_only=True))
            # NOTE(review): the experiment name says "adamw" although the
            # optimizer above is SGD; left unchanged so result names stay stable.
            test_model(model,criterion,device=DEVICE,batch_size=BATCH_SIZE,experiment_name=f"adamw_atunet_freeze__{current_partition}")
        else:
            print("No best model found in partition",current_partition)
        

## Carga modelo

In [10]:
class L2LogLoss(nn.Module):
    """Mean squared error measured after a signed log1p compression of both inputs."""

    def __init__(self):
        super().__init__()

    def rescale(self, x):
        """Map ``x`` to ``sign(x) * log(1 + |x|)``."""
        return torch.sign(x) * torch.log1p(torch.abs(x))

    def forward(self, y_pred, y_true):
        compressed_pred = self.rescale(y_pred)
        compressed_true = self.rescale(y_true)
        return F.mse_loss(compressed_pred, compressed_true)
class L1LogLoss(nn.Module):
    """Mean absolute error measured after a signed log1p compression of both inputs."""

    def __init__(self):
        super().__init__()

    def rescale(self, x):
        """Map ``x`` to ``sign(x) * log(1 + |x|)``."""
        return torch.sign(x) * torch.log1p(torch.abs(x))

    def forward(self, y_pred, y_true):
        compressed_pred = self.rescale(y_pred)
        compressed_true = self.rescale(y_true)
        return F.l1_loss(compressed_pred, compressed_true)

In [11]:
#Define model
# Build the network and move it to the selected device.
model = KappaPredictor().to(DEVICE)
# Loss used for training, validation and testing: L1 in signed-log space.
criterion = L1LogLoss()
# No transform is passed to the data loaders in this run; RandomTransform()
# is the commented-out alternative.
transform = None#RandomTransform()

In [12]:
# Number of trainable scalar parameters (those with requires_grad=True).
sum(p.numel() for p in model.parameters() if p.requires_grad)

5742735

In [13]:
# Train sequentially on partitions 1 through 10.
many_partitions_v2(start=1, end=11, model=model, criterion=criterion, transform=transform)

Partition 1: training full
There is no best model saved
Epoch [1/100]


Train Epoch 1: 100%|██████████| 77/77 [01:10<00:00,  1.09it/s, WMAPE=9.75, DICE=0.606, DPEAKS=224, Loss=0.04]
Validate Epoch 1: 100%|██████████| 20/20 [00:09<00:00,  2.12it/s, WMAPE=3.77, DICE=0.547, DPEAKS=227, Loss=0.0252]


Saving best model
Epoch [2/100]


Train Epoch 2: 100%|██████████| 77/77 [01:08<00:00,  1.12it/s, WMAPE=2.74, DICE=0.541, DPEAKS=225, Loss=0.0254]
Validate Epoch 2: 100%|██████████| 20/20 [00:09<00:00,  2.13it/s, WMAPE=2.29, DICE=0.528, DPEAKS=229, Loss=0.0251]


Saving best model
Epoch [3/100]


Train Epoch 3: 100%|██████████| 77/77 [01:08<00:00,  1.13it/s, WMAPE=2.65, DICE=0.523, DPEAKS=225, Loss=0.0254]
Validate Epoch 3: 100%|██████████| 20/20 [00:10<00:00,  1.99it/s, WMAPE=3.32, DICE=0.512, DPEAKS=229, Loss=0.0251]


Saving best model
Epoch [4/100]


Train Epoch 4: 100%|██████████| 77/77 [01:09<00:00,  1.10it/s, WMAPE=2.67, DICE=0.508, DPEAKS=224, Loss=0.0253]
Validate Epoch 4: 100%|██████████| 20/20 [00:09<00:00,  2.07it/s, WMAPE=3.02, DICE=0.498, DPEAKS=230, Loss=0.025]


Saving best model
Epoch [5/100]


Train Epoch 5: 100%|██████████| 77/77 [01:09<00:00,  1.11it/s, WMAPE=2.71, DICE=0.503, DPEAKS=224, Loss=0.0254]
Validate Epoch 5: 100%|██████████| 20/20 [00:09<00:00,  2.01it/s, WMAPE=2.29, DICE=0.502, DPEAKS=227, Loss=0.025]


Epoch [6/100]


Train Epoch 6: 100%|██████████| 77/77 [01:08<00:00,  1.12it/s, WMAPE=2.71, DICE=0.506, DPEAKS=224, Loss=0.0253]
Validate Epoch 6: 100%|██████████| 20/20 [00:09<00:00,  2.09it/s, WMAPE=1.92, DICE=0.509, DPEAKS=229, Loss=0.0251]


Epoch [7/100]


Train Epoch 7: 100%|██████████| 77/77 [01:09<00:00,  1.12it/s, WMAPE=2.64, DICE=0.51, DPEAKS=224, Loss=0.0253]
Validate Epoch 7: 100%|██████████| 20/20 [00:09<00:00,  2.07it/s, WMAPE=2.73, DICE=0.505, DPEAKS=227, Loss=0.025]


Saving best model
Epoch [8/100]


Train Epoch 8: 100%|██████████| 77/77 [01:09<00:00,  1.11it/s, WMAPE=2.68, DICE=0.51, DPEAKS=225, Loss=0.0253]
Validate Epoch 8: 100%|██████████| 20/20 [00:10<00:00,  1.99it/s, WMAPE=2.15, DICE=0.511, DPEAKS=228, Loss=0.0251]


Epoch [9/100]


Train Epoch 9: 100%|██████████| 77/77 [01:12<00:00,  1.06it/s, WMAPE=2.65, DICE=0.511, DPEAKS=224, Loss=0.0253]
Validate Epoch 9: 100%|██████████| 20/20 [00:09<00:00,  2.03it/s, WMAPE=3.59, DICE=0.503, DPEAKS=228, Loss=0.0251]


Epoch [10/100]


Train Epoch 10: 100%|██████████| 77/77 [01:13<00:00,  1.05it/s, WMAPE=2.68, DICE=0.513, DPEAKS=224, Loss=0.0253]
Validate Epoch 10: 100%|██████████| 20/20 [00:10<00:00,  1.95it/s, WMAPE=2.99, DICE=0.506, DPEAKS=229, Loss=0.025]


Epoch [11/100]


Train Epoch 11: 100%|██████████| 77/77 [01:10<00:00,  1.10it/s, WMAPE=2.7, DICE=0.513, DPEAKS=224, Loss=0.0253]
Validate Epoch 11: 100%|██████████| 20/20 [00:09<00:00,  2.08it/s, WMAPE=2, DICE=0.514, DPEAKS=230, Loss=0.0251]


Epoch [12/100]


Train Epoch 12: 100%|██████████| 77/77 [01:10<00:00,  1.10it/s, WMAPE=2.65, DICE=0.513, DPEAKS=224, Loss=0.0253]
Validate Epoch 12: 100%|██████████| 20/20 [00:09<00:00,  2.03it/s, WMAPE=2.44, DICE=0.503, DPEAKS=230, Loss=0.025]


early stopping: 5 epochs without improvement
Training complete.


Validate Epoch test: 100%|██████████| 486/486 [02:55<00:00,  2.78it/s, WMAPE=2.77, DICE=0.508, DPEAKS=225, Loss=0.0251]


Partition 2: training decoder
Loaded best model from partition 1
Epoch [1/100]


Train Epoch 1: 100%|██████████| 77/77 [01:09<00:00,  1.10it/s, WMAPE=2.78, DICE=0.51, DPEAKS=224, Loss=0.0251]
Validate Epoch 1: 100%|██████████| 20/20 [00:10<00:00,  1.84it/s, WMAPE=2.63, DICE=0.511, DPEAKS=223, Loss=0.025]


Saving best model
Epoch [2/100]


Train Epoch 2: 100%|██████████| 77/77 [01:05<00:00,  1.18it/s, WMAPE=2.8, DICE=0.512, DPEAKS=224, Loss=0.0251]
Validate Epoch 2: 100%|██████████| 20/20 [00:09<00:00,  2.02it/s, WMAPE=3.45, DICE=0.506, DPEAKS=223, Loss=0.025]


Epoch [3/100]


Train Epoch 3: 100%|██████████| 77/77 [01:06<00:00,  1.16it/s, WMAPE=2.8, DICE=0.512, DPEAKS=225, Loss=0.0251]
Validate Epoch 3: 100%|██████████| 20/20 [00:09<00:00,  2.06it/s, WMAPE=3.06, DICE=0.505, DPEAKS=223, Loss=0.025]


Saving best model
Epoch [4/100]


Train Epoch 4: 100%|██████████| 77/77 [01:07<00:00,  1.15it/s, WMAPE=2.8, DICE=0.513, DPEAKS=225, Loss=0.0252]
Validate Epoch 4: 100%|██████████| 20/20 [00:09<00:00,  2.04it/s, WMAPE=2.81, DICE=0.513, DPEAKS=223, Loss=0.025]


Epoch [5/100]


Train Epoch 5: 100%|██████████| 77/77 [01:07<00:00,  1.15it/s, WMAPE=2.76, DICE=0.513, DPEAKS=225, Loss=0.0252]
Validate Epoch 5: 100%|██████████| 20/20 [00:09<00:00,  2.01it/s, WMAPE=4.3, DICE=0.507, DPEAKS=223, Loss=0.0252]


Epoch [6/100]


Train Epoch 6: 100%|██████████| 77/77 [01:07<00:00,  1.13it/s, WMAPE=2.83, DICE=0.512, DPEAKS=224, Loss=0.0252]
Validate Epoch 6: 100%|██████████| 20/20 [00:09<00:00,  2.00it/s, WMAPE=2.9, DICE=0.518, DPEAKS=223, Loss=0.025]


Saving best model
Epoch [7/100]


Train Epoch 7: 100%|██████████| 77/77 [01:08<00:00,  1.12it/s, WMAPE=2.8, DICE=0.514, DPEAKS=224, Loss=0.0252]
Validate Epoch 7: 100%|██████████| 20/20 [00:10<00:00,  1.99it/s, WMAPE=2.42, DICE=0.503, DPEAKS=223, Loss=0.025]


Epoch [8/100]


Train Epoch 8: 100%|██████████| 77/77 [01:09<00:00,  1.11it/s, WMAPE=2.8, DICE=0.513, DPEAKS=225, Loss=0.0252]
Validate Epoch 8: 100%|██████████| 20/20 [00:10<00:00,  1.97it/s, WMAPE=4.02, DICE=0.517, DPEAKS=224, Loss=0.0251]


Epoch [9/100]


Train Epoch 9: 100%|██████████| 77/77 [01:09<00:00,  1.11it/s, WMAPE=2.79, DICE=0.512, DPEAKS=224, Loss=0.0252]
Validate Epoch 9: 100%|██████████| 20/20 [00:10<00:00,  1.95it/s, WMAPE=2.66, DICE=0.521, DPEAKS=226, Loss=0.025]


Epoch [10/100]


Train Epoch 10: 100%|██████████| 77/77 [01:09<00:00,  1.10it/s, WMAPE=2.79, DICE=0.512, DPEAKS=224, Loss=0.0252]
Validate Epoch 10: 100%|██████████| 20/20 [00:10<00:00,  1.97it/s, WMAPE=1.39, DICE=0.513, DPEAKS=223, Loss=0.0254]


Epoch [11/100]


Train Epoch 11: 100%|██████████| 77/77 [01:10<00:00,  1.09it/s, WMAPE=2.81, DICE=0.512, DPEAKS=225, Loss=0.0252]
Validate Epoch 11: 100%|██████████| 20/20 [00:10<00:00,  1.95it/s, WMAPE=1.89, DICE=0.505, DPEAKS=225, Loss=0.0252]


early stopping: 5 epochs without improvement
Training complete.


Validate Epoch test: 100%|██████████| 486/486 [03:06<00:00,  2.61it/s, WMAPE=2.87, DICE=0.512, DPEAKS=225, Loss=0.0251]


Partition 3: training decoder
Loaded best model from partition 2
Epoch [1/100]


Train Epoch 1: 100%|██████████| 77/77 [01:17<00:00,  1.01s/it, WMAPE=2.66, DICE=0.513, DPEAKS=223, Loss=0.0252]
Validate Epoch 1: 100%|██████████| 20/20 [00:12<00:00,  1.61it/s, WMAPE=1.35, DICE=0.506, DPEAKS=224, Loss=0.0255]


Saving best model
Epoch [2/100]


Train Epoch 2: 100%|██████████| 77/77 [01:14<00:00,  1.04it/s, WMAPE=2.62, DICE=0.512, DPEAKS=225, Loss=0.0252]
Validate Epoch 2: 100%|██████████| 20/20 [00:10<00:00,  1.86it/s, WMAPE=1.8, DICE=0.504, DPEAKS=223, Loss=0.0253]


Saving best model
Epoch [3/100]


Train Epoch 3: 100%|██████████| 77/77 [01:13<00:00,  1.05it/s, WMAPE=2.61, DICE=0.511, DPEAKS=225, Loss=0.0251]
Validate Epoch 3: 100%|██████████| 20/20 [00:10<00:00,  1.88it/s, WMAPE=3, DICE=0.52, DPEAKS=223, Loss=0.0252]


Saving best model
Epoch [4/100]


Train Epoch 4: 100%|██████████| 77/77 [01:12<00:00,  1.06it/s, WMAPE=2.67, DICE=0.511, DPEAKS=224, Loss=0.0252]
Validate Epoch 4: 100%|██████████| 20/20 [00:10<00:00,  1.87it/s, WMAPE=3.27, DICE=0.522, DPEAKS=223, Loss=0.0253]


Epoch [5/100]


Train Epoch 5: 100%|██████████| 77/77 [01:12<00:00,  1.06it/s, WMAPE=2.64, DICE=0.511, DPEAKS=225, Loss=0.0252]
Validate Epoch 5: 100%|██████████| 20/20 [00:10<00:00,  1.86it/s, WMAPE=1.53, DICE=0.514, DPEAKS=223, Loss=0.0254]


Epoch [6/100]


Train Epoch 6: 100%|██████████| 77/77 [01:12<00:00,  1.06it/s, WMAPE=2.63, DICE=0.51, DPEAKS=225, Loss=0.0252]
Validate Epoch 6: 100%|██████████| 20/20 [00:10<00:00,  1.86it/s, WMAPE=2.76, DICE=0.51, DPEAKS=222, Loss=0.0252]


Saving best model
Epoch [7/100]


Train Epoch 7: 100%|██████████| 77/77 [01:12<00:00,  1.06it/s, WMAPE=2.61, DICE=0.51, DPEAKS=225, Loss=0.0252]
Validate Epoch 7: 100%|██████████| 20/20 [00:10<00:00,  1.87it/s, WMAPE=2.55, DICE=0.513, DPEAKS=224, Loss=0.0252]


Saving best model
Epoch [8/100]


Train Epoch 8: 100%|██████████| 77/77 [01:12<00:00,  1.07it/s, WMAPE=2.65, DICE=0.511, DPEAKS=225, Loss=0.0252]
Validate Epoch 8: 100%|██████████| 20/20 [00:10<00:00,  1.87it/s, WMAPE=2.25, DICE=0.511, DPEAKS=225, Loss=0.0252]


Epoch [9/100]


Train Epoch 9: 100%|██████████| 77/77 [01:12<00:00,  1.07it/s, WMAPE=2.61, DICE=0.509, DPEAKS=225, Loss=0.0252]
Validate Epoch 9: 100%|██████████| 20/20 [00:10<00:00,  1.87it/s, WMAPE=4, DICE=0.503, DPEAKS=223, Loss=0.0255]


Epoch [10/100]


Train Epoch 10: 100%|██████████| 77/77 [01:11<00:00,  1.08it/s, WMAPE=2.64, DICE=0.51, DPEAKS=224, Loss=0.0252]
Validate Epoch 10: 100%|██████████| 20/20 [00:10<00:00,  1.88it/s, WMAPE=2.65, DICE=0.509, DPEAKS=225, Loss=0.0252]


Saving best model
Epoch [11/100]


Train Epoch 11: 100%|██████████| 77/77 [01:11<00:00,  1.07it/s, WMAPE=2.63, DICE=0.509, DPEAKS=225, Loss=0.0252]
Validate Epoch 11: 100%|██████████| 20/20 [00:10<00:00,  1.89it/s, WMAPE=2.73, DICE=0.517, DPEAKS=224, Loss=0.0252]


Epoch [12/100]


Train Epoch 12: 100%|██████████| 77/77 [01:10<00:00,  1.09it/s, WMAPE=2.65, DICE=0.51, DPEAKS=225, Loss=0.0252]
Validate Epoch 12: 100%|██████████| 20/20 [00:10<00:00,  1.92it/s, WMAPE=3.13, DICE=0.517, DPEAKS=224, Loss=0.0252]


Epoch [13/100]


Train Epoch 13: 100%|██████████| 77/77 [01:09<00:00,  1.10it/s, WMAPE=2.64, DICE=0.509, DPEAKS=225, Loss=0.0252]
Validate Epoch 13: 100%|██████████| 20/20 [00:10<00:00,  1.93it/s, WMAPE=2.78, DICE=0.521, DPEAKS=223, Loss=0.0252]


Epoch [14/100]


Train Epoch 14: 100%|██████████| 77/77 [01:10<00:00,  1.10it/s, WMAPE=2.62, DICE=0.509, DPEAKS=224, Loss=0.0252]
Validate Epoch 14: 100%|██████████| 20/20 [00:10<00:00,  1.92it/s, WMAPE=3.35, DICE=0.518, DPEAKS=225, Loss=0.0253]


Epoch [15/100]


Train Epoch 15: 100%|██████████| 77/77 [01:09<00:00,  1.10it/s, WMAPE=2.64, DICE=0.509, DPEAKS=224, Loss=0.0252]
Validate Epoch 15: 100%|██████████| 20/20 [00:10<00:00,  1.95it/s, WMAPE=2.82, DICE=0.52, DPEAKS=224, Loss=0.0252]


early stopping: 5 epochs without improvement
Training complete.


Validate Epoch test: 100%|██████████| 486/486 [03:01<00:00,  2.67it/s, WMAPE=2.66, DICE=0.508, DPEAKS=225, Loss=0.0251]


Partition 4: training decoder
Loaded best model from partition 3
Epoch [1/100]


Train Epoch 1: 100%|██████████| 77/77 [01:14<00:00,  1.03it/s, WMAPE=2.72, DICE=0.511, DPEAKS=226, Loss=0.0252]
Validate Epoch 1: 100%|██████████| 20/20 [00:11<00:00,  1.75it/s, WMAPE=2.62, DICE=0.521, DPEAKS=225, Loss=0.025]


Saving best model
Epoch [2/100]


Train Epoch 2: 100%|██████████| 77/77 [01:11<00:00,  1.08it/s, WMAPE=2.76, DICE=0.511, DPEAKS=225, Loss=0.0251]
Validate Epoch 2: 100%|██████████| 20/20 [00:10<00:00,  1.94it/s, WMAPE=1.96, DICE=0.506, DPEAKS=225, Loss=0.0251]


Epoch [3/100]


Train Epoch 3: 100%|██████████| 77/77 [01:09<00:00,  1.11it/s, WMAPE=2.74, DICE=0.512, DPEAKS=225, Loss=0.0252]
Validate Epoch 3: 100%|██████████| 20/20 [00:10<00:00,  1.90it/s, WMAPE=3.78, DICE=0.523, DPEAKS=225, Loss=0.0251]


Epoch [4/100]


Train Epoch 4: 100%|██████████| 77/77 [01:10<00:00,  1.10it/s, WMAPE=2.71, DICE=0.509, DPEAKS=225, Loss=0.0252]
Validate Epoch 4: 100%|██████████| 20/20 [00:09<00:00,  2.05it/s, WMAPE=3.39, DICE=0.523, DPEAKS=225, Loss=0.025]


Epoch [5/100]


Train Epoch 5: 100%|██████████| 77/77 [01:06<00:00,  1.16it/s, WMAPE=2.75, DICE=0.51, DPEAKS=224, Loss=0.0251]
Validate Epoch 5: 100%|██████████| 20/20 [00:09<00:00,  2.06it/s, WMAPE=3.03, DICE=0.517, DPEAKS=225, Loss=0.025]


Saving best model
Epoch [6/100]


Train Epoch 6: 100%|██████████| 77/77 [01:09<00:00,  1.10it/s, WMAPE=2.74, DICE=0.512, DPEAKS=224, Loss=0.0252]
Validate Epoch 6: 100%|██████████| 20/20 [00:10<00:00,  1.91it/s, WMAPE=2.82, DICE=0.5, DPEAKS=226, Loss=0.025]


Saving best model
Epoch [7/100]


Train Epoch 7:  86%|████████▌ | 66/77 [01:00<00:10,  1.06it/s, loss=0.026] 

In [15]:
# Run the partition-wise training loop for partition 10 only: the captured
# output below shows a single "Partition 10" run that first loads the best
# model saved for partition 9.
# NOTE(review): the second argument appears to be an exclusive upper bound
# (10, 11 -> only partition 10 is logged) -- confirm against the definition of
# many_partitions_v2.
# NOTE(review): `criterion` here is whatever an earlier cell bound; it is not
# defined in this cell, so a fresh-kernel run depends on that earlier cell.
many_partitions_v2(10,11,model,criterion,transform=transform)

Partition 10: training decoder
Loaded best model from partition 9
Epoch [1/100]


Train Epoch 1: 100%|██████████| 77/77 [01:14<00:00,  1.03it/s, WMAPE=2.36, DICE=0.0675, DPEAKS=38.4, Loss=8.52e-5]
Validate Epoch 1: 100%|██████████| 20/20 [00:10<00:00,  1.86it/s, WMAPE=1.79, DICE=0.0596, DPEAKS=32.9, Loss=4.94e-5]


Saving best model
Epoch [2/100]


Train Epoch 2: 100%|██████████| 77/77 [01:09<00:00,  1.11it/s, WMAPE=1.9, DICE=0.0585, DPEAKS=30.6, Loss=4.94e-5]
Validate Epoch 2: 100%|██████████| 20/20 [00:10<00:00,  1.88it/s, WMAPE=1.79, DICE=0.0585, DPEAKS=31.8, Loss=4.8e-5]


Saving best model
Epoch [3/100]


Train Epoch 3: 100%|██████████| 77/77 [01:12<00:00,  1.06it/s, WMAPE=1.9, DICE=0.0587, DPEAKS=30.8, Loss=4.98e-5]
Validate Epoch 3: 100%|██████████| 20/20 [00:10<00:00,  1.86it/s, WMAPE=1.82, DICE=0.0583, DPEAKS=31.7, Loss=4.78e-5]


Saving best model
Epoch [4/100]


Train Epoch 4: 100%|██████████| 77/77 [01:14<00:00,  1.04it/s, WMAPE=1.87, DICE=0.0586, DPEAKS=30.1, Loss=4.88e-5]
Validate Epoch 4: 100%|██████████| 20/20 [00:09<00:00,  2.01it/s, WMAPE=1.82, DICE=0.0581, DPEAKS=31, Loss=4.95e-5]


Epoch [5/100]


Train Epoch 5: 100%|██████████| 77/77 [01:11<00:00,  1.08it/s, WMAPE=1.94, DICE=0.059, DPEAKS=31.6, Loss=5.18e-5]
Validate Epoch 5: 100%|██████████| 20/20 [00:10<00:00,  1.89it/s, WMAPE=1.77, DICE=0.0592, DPEAKS=32.3, Loss=4.84e-5]


Epoch [6/100]


Train Epoch 6: 100%|██████████| 77/77 [01:13<00:00,  1.05it/s, WMAPE=1.84, DICE=0.0583, DPEAKS=30.8, Loss=4.7e-5]
Validate Epoch 6: 100%|██████████| 20/20 [00:11<00:00,  1.81it/s, WMAPE=1.74, DICE=0.0583, DPEAKS=30.5, Loss=4.81e-5]


Epoch [7/100]


Train Epoch 7: 100%|██████████| 77/77 [01:15<00:00,  1.01it/s, WMAPE=1.85, DICE=0.058, DPEAKS=31.4, Loss=4.74e-5]
Validate Epoch 7: 100%|██████████| 20/20 [00:10<00:00,  1.82it/s, WMAPE=2.09, DICE=0.059, DPEAKS=32.3, Loss=6.43e-5]


Epoch [8/100]


Train Epoch 8: 100%|██████████| 77/77 [01:10<00:00,  1.10it/s, WMAPE=1.89, DICE=0.0583, DPEAKS=30.4, Loss=4.88e-5]
Validate Epoch 8: 100%|██████████| 20/20 [00:09<00:00,  2.01it/s, WMAPE=1.8, DICE=0.0586, DPEAKS=32.7, Loss=4.86e-5]


early stopping: 5 epochs without improvement
Training complete.


Validate Epoch test: 100%|██████████| 486/486 [03:02<00:00,  2.67it/s, WMAPE=1.87, DICE=0.058, DPEAKS=31.8, Loss=4.86e-5]


In [18]:
# Rebind the loss to L1LogLoss before training the next partitions. The logged
# "Loss" values change scale after this point (about 5e-5 for partition 10
# versus about 5e-3 here), so losses are not comparable across the two cells.
# NOTE(review): execution counts jump from In [15] to In [18]; check that the
# notebook still reproduces this state under Restart Kernel -> Run All.
criterion = L1LogLoss()
# Continue training on partitions 11 through 20 (per the captured output); each
# partition starts from the best model of the previous one. The output labels
# partitions 11 and 16 "training full" and the others "training decoder".
# NOTE(review): that schedule is decided inside many_partitions_v2, which is
# not visible here -- confirm against its definition.
many_partitions_v2(11,21,model,criterion,transform=transform)

Partition 11: training full
Loaded best model from partition 10
Epoch [1/100]


Train Epoch 1: 100%|██████████| 77/77 [01:16<00:00,  1.01it/s, WMAPE=2.81, DICE=0.083, DPEAKS=56.1, Loss=0.00867]
Validate Epoch 1: 100%|██████████| 20/20 [00:11<00:00,  1.81it/s, WMAPE=2.09, DICE=0.0673, DPEAKS=47.8, Loss=0.00631]


Saving best model
Epoch [2/100]


Train Epoch 2: 100%|██████████| 77/77 [01:08<00:00,  1.12it/s, WMAPE=2.26, DICE=0.0655, DPEAKS=41, Loss=0.00671]
Validate Epoch 2: 100%|██████████| 20/20 [00:09<00:00,  2.08it/s, WMAPE=1.91, DICE=0.0608, DPEAKS=38.4, Loss=0.00565]


Saving best model
Epoch [3/100]


Train Epoch 3: 100%|██████████| 77/77 [01:09<00:00,  1.11it/s, WMAPE=2.01, DICE=0.0602, DPEAKS=35.2, Loss=0.00597]
Validate Epoch 3: 100%|██████████| 20/20 [00:10<00:00,  1.88it/s, WMAPE=1.87, DICE=0.0615, DPEAKS=39.6, Loss=0.00572]


Epoch [4/100]


Train Epoch 4: 100%|██████████| 77/77 [01:14<00:00,  1.03it/s, WMAPE=1.99, DICE=0.0601, DPEAKS=33.8, Loss=0.00586]
Validate Epoch 4: 100%|██████████| 20/20 [00:09<00:00,  2.02it/s, WMAPE=2.73, DICE=0.0591, DPEAKS=36.7, Loss=0.00787]


Epoch [5/100]


Train Epoch 5: 100%|██████████| 77/77 [01:09<00:00,  1.10it/s, WMAPE=2.03, DICE=0.0614, DPEAKS=35.9, Loss=0.00603]
Validate Epoch 5: 100%|██████████| 20/20 [00:09<00:00,  2.10it/s, WMAPE=2.07, DICE=0.0593, DPEAKS=33.6, Loss=0.00624]


Epoch [6/100]


Train Epoch 6: 100%|██████████| 77/77 [01:08<00:00,  1.12it/s, WMAPE=2.05, DICE=0.0623, DPEAKS=36.1, Loss=0.00608]
Validate Epoch 6: 100%|██████████| 20/20 [00:09<00:00,  2.06it/s, WMAPE=2, DICE=0.0586, DPEAKS=34, Loss=0.00594]


Epoch [7/100]


Train Epoch 7: 100%|██████████| 77/77 [01:09<00:00,  1.11it/s, WMAPE=1.8, DICE=0.06, DPEAKS=33.9, Loss=0.00537]
Validate Epoch 7: 100%|██████████| 20/20 [00:10<00:00,  1.96it/s, WMAPE=1.9, DICE=0.0585, DPEAKS=34.5, Loss=0.00584]


Epoch [8/100]


Train Epoch 8: 100%|██████████| 77/77 [01:10<00:00,  1.09it/s, WMAPE=1.76, DICE=0.0588, DPEAKS=31.9, Loss=0.00527]
Validate Epoch 8: 100%|██████████| 20/20 [00:10<00:00,  1.88it/s, WMAPE=1.99, DICE=0.0596, DPEAKS=34.6, Loss=0.00606]


early stopping: 6 epochs without improvement
Training complete.


Validate Epoch test: 100%|██████████| 486/486 [03:04<00:00,  2.64it/s, WMAPE=1.93, DICE=0.0609, DPEAKS=34.8, Loss=0.00561]


Partition 12: training decoder
Loaded best model from partition 11
Epoch [1/100]


Train Epoch 1: 100%|██████████| 77/77 [01:17<00:00,  1.01s/it, WMAPE=2.32, DICE=0.0721, DPEAKS=41.5, Loss=0.00707]
Validate Epoch 1: 100%|██████████| 20/20 [00:11<00:00,  1.77it/s, WMAPE=1.92, DICE=0.0604, DPEAKS=34.8, Loss=0.00552]


Saving best model
Epoch [2/100]


Train Epoch 2: 100%|██████████| 77/77 [01:06<00:00,  1.17it/s, WMAPE=1.87, DICE=0.0595, DPEAKS=32.7, Loss=0.00551]
Validate Epoch 2: 100%|██████████| 20/20 [00:10<00:00,  1.91it/s, WMAPE=1.88, DICE=0.0586, DPEAKS=30.6, Loss=0.00542]


Saving best model
Epoch [3/100]


Train Epoch 3: 100%|██████████| 77/77 [01:09<00:00,  1.11it/s, WMAPE=1.89, DICE=0.059, DPEAKS=31.5, Loss=0.00557]
Validate Epoch 3: 100%|██████████| 20/20 [00:10<00:00,  2.00it/s, WMAPE=2.02, DICE=0.0587, DPEAKS=29.9, Loss=0.00585]


Epoch [4/100]


Train Epoch 4: 100%|██████████| 77/77 [01:07<00:00,  1.14it/s, WMAPE=1.85, DICE=0.0586, DPEAKS=31.4, Loss=0.00545]
Validate Epoch 4: 100%|██████████| 20/20 [00:09<00:00,  2.03it/s, WMAPE=1.83, DICE=0.059, DPEAKS=29.6, Loss=0.00539]


Saving best model
Epoch [5/100]


Train Epoch 5: 100%|██████████| 77/77 [01:09<00:00,  1.11it/s, WMAPE=1.9, DICE=0.0588, DPEAKS=32.1, Loss=0.0056]
Validate Epoch 5: 100%|██████████| 20/20 [00:09<00:00,  2.05it/s, WMAPE=2.02, DICE=0.0599, DPEAKS=33.2, Loss=0.00595]


Epoch [6/100]


Train Epoch 6: 100%|██████████| 77/77 [01:05<00:00,  1.18it/s, WMAPE=1.83, DICE=0.0584, DPEAKS=31.3, Loss=0.00539]
Validate Epoch 6: 100%|██████████| 20/20 [00:09<00:00,  2.08it/s, WMAPE=1.82, DICE=0.0582, DPEAKS=30.7, Loss=0.0054]


Epoch [7/100]


Train Epoch 7: 100%|██████████| 77/77 [01:11<00:00,  1.08it/s, WMAPE=1.82, DICE=0.0582, DPEAKS=31.4, Loss=0.00536]
Validate Epoch 7: 100%|██████████| 20/20 [00:09<00:00,  2.04it/s, WMAPE=1.89, DICE=0.0581, DPEAKS=30.8, Loss=0.00536]


Saving best model
Epoch [8/100]


Train Epoch 8: 100%|██████████| 77/77 [01:09<00:00,  1.11it/s, WMAPE=1.8, DICE=0.0583, DPEAKS=32.7, Loss=0.00531]
Validate Epoch 8: 100%|██████████| 20/20 [00:09<00:00,  2.01it/s, WMAPE=1.89, DICE=0.0585, DPEAKS=29.2, Loss=0.00548]


Epoch [9/100]


Train Epoch 9: 100%|██████████| 77/77 [01:06<00:00,  1.16it/s, WMAPE=1.79, DICE=0.0583, DPEAKS=31.9, Loss=0.00528]
Validate Epoch 9: 100%|██████████| 20/20 [00:09<00:00,  2.11it/s, WMAPE=2.02, DICE=0.0584, DPEAKS=27.5, Loss=0.00582]


Epoch [10/100]


Train Epoch 10: 100%|██████████| 77/77 [01:05<00:00,  1.18it/s, WMAPE=1.79, DICE=0.058, DPEAKS=31.4, Loss=0.00524]
Validate Epoch 10: 100%|██████████| 20/20 [00:09<00:00,  2.11it/s, WMAPE=1.89, DICE=0.0587, DPEAKS=28.1, Loss=0.00554]


Epoch [11/100]


Train Epoch 11: 100%|██████████| 77/77 [01:04<00:00,  1.19it/s, WMAPE=1.74, DICE=0.058, DPEAKS=30.9, Loss=0.00516]
Validate Epoch 11: 100%|██████████| 20/20 [00:09<00:00,  2.05it/s, WMAPE=1.91, DICE=0.0584, DPEAKS=28.7, Loss=0.00545]


Epoch [12/100]


Train Epoch 12: 100%|██████████| 77/77 [01:04<00:00,  1.19it/s, WMAPE=1.76, DICE=0.0581, DPEAKS=31.7, Loss=0.00519]
Validate Epoch 12: 100%|██████████| 20/20 [00:09<00:00,  2.07it/s, WMAPE=1.92, DICE=0.0585, DPEAKS=28.6, Loss=0.00552]


early stopping: 5 epochs without improvement
Training complete.


Validate Epoch test: 100%|██████████| 486/486 [02:54<00:00,  2.78it/s, WMAPE=1.87, DICE=0.0581, DPEAKS=32.7, Loss=0.00541]


Partition 13: training decoder
Loaded best model from partition 12
Epoch [1/100]


Train Epoch 1: 100%|██████████| 77/77 [01:11<00:00,  1.08it/s, WMAPE=2.1, DICE=0.0627, DPEAKS=35.7, Loss=0.0062]
Validate Epoch 1: 100%|██████████| 20/20 [00:10<00:00,  1.86it/s, WMAPE=1.8, DICE=0.0576, DPEAKS=31.2, Loss=0.00531]


Saving best model
Epoch [2/100]


Train Epoch 2: 100%|██████████| 77/77 [01:06<00:00,  1.17it/s, WMAPE=1.84, DICE=0.0577, DPEAKS=31.5, Loss=0.00544]
Validate Epoch 2: 100%|██████████| 20/20 [00:09<00:00,  2.06it/s, WMAPE=1.85, DICE=0.0577, DPEAKS=30.6, Loss=0.00532]


Epoch [3/100]


Train Epoch 3: 100%|██████████| 77/77 [01:07<00:00,  1.14it/s, WMAPE=1.88, DICE=0.0582, DPEAKS=32.7, Loss=0.00551]
Validate Epoch 3: 100%|██████████| 20/20 [00:10<00:00,  1.99it/s, WMAPE=1.88, DICE=0.0587, DPEAKS=34.9, Loss=0.00554]


Epoch [4/100]


Train Epoch 4: 100%|██████████| 77/77 [01:06<00:00,  1.15it/s, WMAPE=1.84, DICE=0.0577, DPEAKS=32.2, Loss=0.00545]
Validate Epoch 4: 100%|██████████| 20/20 [00:10<00:00,  2.00it/s, WMAPE=1.83, DICE=0.0573, DPEAKS=31.8, Loss=0.00534]


Epoch [5/100]


Train Epoch 5: 100%|██████████| 77/77 [01:06<00:00,  1.15it/s, WMAPE=1.78, DICE=0.0574, DPEAKS=31.1, Loss=0.00519]
Validate Epoch 5: 100%|██████████| 20/20 [00:09<00:00,  2.03it/s, WMAPE=2.2, DICE=0.0572, DPEAKS=31.1, Loss=0.00608]


Epoch [6/100]


Train Epoch 6: 100%|██████████| 77/77 [01:07<00:00,  1.14it/s, WMAPE=1.8, DICE=0.0577, DPEAKS=31.5, Loss=0.00531]
Validate Epoch 6: 100%|██████████| 20/20 [00:09<00:00,  2.05it/s, WMAPE=1.89, DICE=0.0581, DPEAKS=32.2, Loss=0.00547]


Epoch [7/100]


Train Epoch 7: 100%|██████████| 77/77 [01:06<00:00,  1.16it/s, WMAPE=1.74, DICE=0.0577, DPEAKS=32.4, Loss=0.00516]
Validate Epoch 7: 100%|██████████| 20/20 [00:09<00:00,  2.05it/s, WMAPE=1.94, DICE=0.0577, DPEAKS=31.2, Loss=0.00547]


Epoch [8/100]


Train Epoch 8: 100%|██████████| 77/77 [01:10<00:00,  1.10it/s, WMAPE=1.73, DICE=0.0574, DPEAKS=32, Loss=0.00506]
Validate Epoch 8: 100%|██████████| 20/20 [00:09<00:00,  2.02it/s, WMAPE=1.91, DICE=0.0573, DPEAKS=30.7, Loss=0.00557]


early stopping: 7 epochs without improvement
Training complete.


Validate Epoch test: 100%|██████████| 486/486 [03:00<00:00,  2.69it/s, WMAPE=1.81, DICE=0.0577, DPEAKS=31.5, Loss=0.00542]


Partition 14: training decoder
Loaded best model from partition 13
Epoch [1/100]


Train Epoch 1: 100%|██████████| 77/77 [01:10<00:00,  1.09it/s, WMAPE=2.18, DICE=0.0638, DPEAKS=36.8, Loss=0.00639]
Validate Epoch 1: 100%|██████████| 20/20 [00:10<00:00,  1.86it/s, WMAPE=1.85, DICE=0.0578, DPEAKS=29.4, Loss=0.00549]


Saving best model
Epoch [2/100]


Train Epoch 2: 100%|██████████| 77/77 [01:07<00:00,  1.13it/s, WMAPE=1.89, DICE=0.0579, DPEAKS=32.2, Loss=0.00547]
Validate Epoch 2: 100%|██████████| 20/20 [00:09<00:00,  2.01it/s, WMAPE=1.87, DICE=0.0576, DPEAKS=32, Loss=0.00548]


Saving best model
Epoch [3/100]


Train Epoch 3: 100%|██████████| 77/77 [01:09<00:00,  1.11it/s, WMAPE=1.87, DICE=0.0576, DPEAKS=32.7, Loss=0.00548]
Validate Epoch 3: 100%|██████████| 20/20 [00:09<00:00,  2.04it/s, WMAPE=2.01, DICE=0.0576, DPEAKS=30.6, Loss=0.00604]


Epoch [4/100]


Train Epoch 4: 100%|██████████| 77/77 [01:09<00:00,  1.11it/s, WMAPE=1.86, DICE=0.0581, DPEAKS=32.6, Loss=0.00543]
Validate Epoch 4: 100%|██████████| 20/20 [00:10<00:00,  1.88it/s, WMAPE=1.93, DICE=0.0573, DPEAKS=31.8, Loss=0.00572]


Epoch [5/100]


Train Epoch 5: 100%|██████████| 77/77 [01:09<00:00,  1.11it/s, WMAPE=1.86, DICE=0.0577, DPEAKS=31.2, Loss=0.00537]
Validate Epoch 5: 100%|██████████| 20/20 [00:10<00:00,  1.99it/s, WMAPE=1.9, DICE=0.0576, DPEAKS=30.4, Loss=0.00557]


Epoch [6/100]


Train Epoch 6: 100%|██████████| 77/77 [01:07<00:00,  1.14it/s, WMAPE=1.88, DICE=0.0585, DPEAKS=32.9, Loss=0.00544]
Validate Epoch 6: 100%|██████████| 20/20 [00:09<00:00,  2.02it/s, WMAPE=1.91, DICE=0.0579, DPEAKS=30.8, Loss=0.00571]


Epoch [7/100]


Train Epoch 7: 100%|██████████| 77/77 [01:07<00:00,  1.14it/s, WMAPE=1.84, DICE=0.0579, DPEAKS=32.8, Loss=0.00531]
Validate Epoch 7: 100%|██████████| 20/20 [00:10<00:00,  1.99it/s, WMAPE=2.12, DICE=0.058, DPEAKS=31.4, Loss=0.00614]


Epoch [8/100]


Train Epoch 8: 100%|██████████| 77/77 [01:07<00:00,  1.14it/s, WMAPE=1.78, DICE=0.0578, DPEAKS=32.3, Loss=0.00517]
Validate Epoch 8: 100%|██████████| 20/20 [00:09<00:00,  2.04it/s, WMAPE=1.89, DICE=0.0575, DPEAKS=30.7, Loss=0.0056]


early stopping: 6 epochs without improvement
Training complete.


Validate Epoch test: 100%|██████████| 486/486 [02:58<00:00,  2.72it/s, WMAPE=1.83, DICE=0.0576, DPEAKS=32.1, Loss=0.00536]


Partition 15: training decoder
Loaded best model from partition 14
Epoch [1/100]


Train Epoch 1: 100%|██████████| 77/77 [01:11<00:00,  1.07it/s, WMAPE=2.14, DICE=0.0649, DPEAKS=39.5, Loss=0.00643]
Validate Epoch 1: 100%|██████████| 20/20 [00:10<00:00,  1.83it/s, WMAPE=1.83, DICE=0.0579, DPEAKS=30.1, Loss=0.00538]


Saving best model
Epoch [2/100]


Train Epoch 2: 100%|██████████| 77/77 [01:06<00:00,  1.16it/s, WMAPE=1.85, DICE=0.0574, DPEAKS=31.6, Loss=0.00548]
Validate Epoch 2: 100%|██████████| 20/20 [00:09<00:00,  2.03it/s, WMAPE=1.81, DICE=0.0573, DPEAKS=29.5, Loss=0.00525]


Saving best model
Epoch [3/100]


Train Epoch 3: 100%|██████████| 77/77 [01:06<00:00,  1.16it/s, WMAPE=1.93, DICE=0.059, DPEAKS=32.6, Loss=0.00568]
Validate Epoch 3: 100%|██████████| 20/20 [00:10<00:00,  2.00it/s, WMAPE=1.87, DICE=0.059, DPEAKS=31.1, Loss=0.00547]


Epoch [4/100]


Train Epoch 4: 100%|██████████| 77/77 [01:07<00:00,  1.14it/s, WMAPE=1.86, DICE=0.0576, DPEAKS=31.5, Loss=0.00548]
Validate Epoch 4: 100%|██████████| 20/20 [00:09<00:00,  2.03it/s, WMAPE=1.84, DICE=0.0584, DPEAKS=31, Loss=0.00533]


Epoch [5/100]


Train Epoch 5: 100%|██████████| 77/77 [01:06<00:00,  1.16it/s, WMAPE=1.83, DICE=0.0576, DPEAKS=31.8, Loss=0.00542]
Validate Epoch 5: 100%|██████████| 20/20 [00:09<00:00,  2.07it/s, WMAPE=1.88, DICE=0.0582, DPEAKS=30.7, Loss=0.00551]


Epoch [6/100]


Train Epoch 6: 100%|██████████| 77/77 [01:06<00:00,  1.16it/s, WMAPE=1.8, DICE=0.0573, DPEAKS=31.2, Loss=0.00534]
Validate Epoch 6: 100%|██████████| 20/20 [00:09<00:00,  2.06it/s, WMAPE=1.92, DICE=0.0585, DPEAKS=30.6, Loss=0.00569]


Epoch [7/100]


Train Epoch 7: 100%|██████████| 77/77 [01:06<00:00,  1.16it/s, WMAPE=1.8, DICE=0.0574, DPEAKS=31.7, Loss=0.0053]
Validate Epoch 7: 100%|██████████| 20/20 [00:09<00:00,  2.02it/s, WMAPE=1.85, DICE=0.0572, DPEAKS=29.8, Loss=0.00533]


Epoch [8/100]


Train Epoch 8: 100%|██████████| 77/77 [01:07<00:00,  1.14it/s, WMAPE=1.74, DICE=0.0574, DPEAKS=31.7, Loss=0.00516]
Validate Epoch 8: 100%|██████████| 20/20 [00:10<00:00,  1.97it/s, WMAPE=1.86, DICE=0.0576, DPEAKS=31.5, Loss=0.00548]


early stopping: 6 epochs without improvement
Training complete.


Validate Epoch test: 100%|██████████| 486/486 [02:55<00:00,  2.77it/s, WMAPE=1.82, DICE=0.0571, DPEAKS=31.2, Loss=0.00534]


Partition 16: training full
Loaded best model from partition 15
Epoch [1/100]


Train Epoch 1: 100%|██████████| 77/77 [01:14<00:00,  1.03it/s, WMAPE=2.85, DICE=0.0894, DPEAKS=61.6, Loss=0.0089]
Validate Epoch 1: 100%|██████████| 20/20 [00:10<00:00,  1.85it/s, WMAPE=1.82, DICE=0.0629, DPEAKS=37.8, Loss=0.00592]


Saving best model
Epoch [2/100]


Train Epoch 2: 100%|██████████| 77/77 [01:08<00:00,  1.12it/s, WMAPE=2.03, DICE=0.0607, DPEAKS=35.9, Loss=0.00602]
Validate Epoch 2: 100%|██████████| 20/20 [00:09<00:00,  2.07it/s, WMAPE=1.86, DICE=0.0582, DPEAKS=34.3, Loss=0.00572]


Saving best model
Epoch [3/100]


Train Epoch 3: 100%|██████████| 77/77 [01:09<00:00,  1.10it/s, WMAPE=1.99, DICE=0.0588, DPEAKS=33.5, Loss=0.00589]
Validate Epoch 3: 100%|██████████| 20/20 [00:10<00:00,  1.99it/s, WMAPE=1.78, DICE=0.0585, DPEAKS=33.4, Loss=0.00543]


Saving best model
Epoch [4/100]


Train Epoch 4: 100%|██████████| 77/77 [01:09<00:00,  1.11it/s, WMAPE=1.93, DICE=0.059, DPEAKS=35, Loss=0.00573]
Validate Epoch 4: 100%|██████████| 20/20 [00:09<00:00,  2.05it/s, WMAPE=1.94, DICE=0.0633, DPEAKS=41.6, Loss=0.00613]


Epoch [5/100]


Train Epoch 5: 100%|██████████| 77/77 [01:09<00:00,  1.11it/s, WMAPE=1.89, DICE=0.0598, DPEAKS=36.1, Loss=0.0056]
Validate Epoch 5: 100%|██████████| 20/20 [00:09<00:00,  2.06it/s, WMAPE=1.8, DICE=0.0592, DPEAKS=36.1, Loss=0.0054]


Saving best model
Epoch [6/100]


Train Epoch 6: 100%|██████████| 77/77 [01:09<00:00,  1.11it/s, WMAPE=1.89, DICE=0.0596, DPEAKS=35, Loss=0.00559]
Validate Epoch 6: 100%|██████████| 20/20 [00:09<00:00,  2.02it/s, WMAPE=1.69, DICE=0.0582, DPEAKS=35, Loss=0.00539]


Saving best model
Epoch [7/100]


Train Epoch 7: 100%|██████████| 77/77 [01:10<00:00,  1.10it/s, WMAPE=1.76, DICE=0.0586, DPEAKS=34.3, Loss=0.00527]
Validate Epoch 7: 100%|██████████| 20/20 [00:09<00:00,  2.05it/s, WMAPE=1.73, DICE=0.0575, DPEAKS=35, Loss=0.00536]


Saving best model
Epoch [8/100]


Train Epoch 8: 100%|██████████| 77/77 [01:09<00:00,  1.11it/s, WMAPE=1.81, DICE=0.0595, DPEAKS=36.6, Loss=0.00545]
Validate Epoch 8: 100%|██████████| 20/20 [00:10<00:00,  1.90it/s, WMAPE=1.74, DICE=0.058, DPEAKS=36.3, Loss=0.00534]


Saving best model
Epoch [9/100]


Train Epoch 9: 100%|██████████| 77/77 [01:12<00:00,  1.06it/s, WMAPE=1.63, DICE=0.0573, DPEAKS=31.8, Loss=0.00488]
Validate Epoch 9: 100%|██████████| 20/20 [00:09<00:00,  2.05it/s, WMAPE=1.9, DICE=0.0589, DPEAKS=34.8, Loss=0.00586]


Epoch [10/100]


Train Epoch 10: 100%|██████████| 77/77 [01:09<00:00,  1.11it/s, WMAPE=1.59, DICE=0.0575, DPEAKS=34.2, Loss=0.00478]
Validate Epoch 10: 100%|██████████| 20/20 [00:09<00:00,  2.05it/s, WMAPE=1.86, DICE=0.0569, DPEAKS=31.9, Loss=0.00568]


Epoch [11/100]


Train Epoch 11: 100%|██████████| 77/77 [01:11<00:00,  1.07it/s, WMAPE=1.51, DICE=0.0563, DPEAKS=32, Loss=0.00456]
Validate Epoch 11: 100%|██████████| 20/20 [00:09<00:00,  2.05it/s, WMAPE=1.78, DICE=0.0566, DPEAKS=32.3, Loss=0.00553]


Epoch [12/100]


Train Epoch 12: 100%|██████████| 77/77 [01:11<00:00,  1.08it/s, WMAPE=1.64, DICE=0.0573, DPEAKS=34, Loss=0.00494]
Validate Epoch 12: 100%|██████████| 20/20 [00:09<00:00,  2.01it/s, WMAPE=1.82, DICE=0.0587, DPEAKS=34.2, Loss=0.00571]


Epoch [13/100]


Train Epoch 13: 100%|██████████| 77/77 [01:10<00:00,  1.09it/s, WMAPE=1.5, DICE=0.0564, DPEAKS=31.5, Loss=0.00453]
Validate Epoch 13: 100%|██████████| 20/20 [00:10<00:00,  1.99it/s, WMAPE=1.82, DICE=0.0549, DPEAKS=30.6, Loss=0.00558]


early stopping: 5 epochs without improvement
Training complete.


Validate Epoch test: 100%|██████████| 486/486 [03:01<00:00,  2.68it/s, WMAPE=1.9, DICE=0.0581, DPEAKS=33.4, Loss=0.00549]


Partition 17: training decoder
Loaded best model from partition 16
Epoch [1/100]


Train Epoch 1: 100%|██████████| 77/77 [01:12<00:00,  1.06it/s, WMAPE=2.22, DICE=0.0642, DPEAKS=35.6, Loss=0.0066]
Validate Epoch 1: 100%|██████████| 20/20 [00:11<00:00,  1.77it/s, WMAPE=1.76, DICE=0.0566, DPEAKS=30.1, Loss=0.00541]


Saving best model
Epoch [2/100]


Train Epoch 2: 100%|██████████| 77/77 [01:12<00:00,  1.06it/s, WMAPE=1.87, DICE=0.056, DPEAKS=29.8, Loss=0.0055]
Validate Epoch 2: 100%|██████████| 20/20 [00:10<00:00,  1.92it/s, WMAPE=1.79, DICE=0.0567, DPEAKS=29.4, Loss=0.00536]


Saving best model
Epoch [3/100]


Train Epoch 3: 100%|██████████| 77/77 [01:11<00:00,  1.07it/s, WMAPE=1.84, DICE=0.0561, DPEAKS=29.7, Loss=0.00541]
Validate Epoch 3: 100%|██████████| 20/20 [00:10<00:00,  1.99it/s, WMAPE=1.71, DICE=0.0557, DPEAKS=29.9, Loss=0.00522]


Saving best model
Epoch [4/100]


Train Epoch 4: 100%|██████████| 77/77 [01:08<00:00,  1.12it/s, WMAPE=1.9, DICE=0.0562, DPEAKS=29.8, Loss=0.0055]
Validate Epoch 4: 100%|██████████| 20/20 [00:09<00:00,  2.05it/s, WMAPE=1.73, DICE=0.0565, DPEAKS=29.7, Loss=0.00527]


Epoch [5/100]


Train Epoch 5: 100%|██████████| 77/77 [01:06<00:00,  1.16it/s, WMAPE=1.75, DICE=0.0556, DPEAKS=30.1, Loss=0.00514]
Validate Epoch 5: 100%|██████████| 20/20 [00:09<00:00,  2.02it/s, WMAPE=2.03, DICE=0.056, DPEAKS=30.4, Loss=0.006]


Epoch [6/100]


Train Epoch 6: 100%|██████████| 77/77 [01:08<00:00,  1.12it/s, WMAPE=1.81, DICE=0.0559, DPEAKS=29.8, Loss=0.00528]
Validate Epoch 6: 100%|██████████| 20/20 [00:10<00:00,  1.98it/s, WMAPE=1.86, DICE=0.0561, DPEAKS=29.3, Loss=0.00566]


Epoch [7/100]


Train Epoch 7: 100%|██████████| 77/77 [01:10<00:00,  1.10it/s, WMAPE=1.77, DICE=0.0558, DPEAKS=30.9, Loss=0.00517]
Validate Epoch 7: 100%|██████████| 20/20 [00:10<00:00,  1.97it/s, WMAPE=1.95, DICE=0.0569, DPEAKS=29.1, Loss=0.00603]


Epoch [8/100]


Train Epoch 8: 100%|██████████| 77/77 [01:11<00:00,  1.08it/s, WMAPE=1.73, DICE=0.0559, DPEAKS=30.8, Loss=0.00504]
Validate Epoch 8: 100%|██████████| 20/20 [00:10<00:00,  1.94it/s, WMAPE=1.88, DICE=0.056, DPEAKS=29.7, Loss=0.00562]


early stopping: 5 epochs without improvement
Training complete.


Validate Epoch test: 100%|██████████| 486/486 [03:04<00:00,  2.63it/s, WMAPE=1.79, DICE=0.0555, DPEAKS=31, Loss=0.00525]


Partition 18: training decoder
Loaded best model from partition 17
Epoch [1/100]


Train Epoch 1: 100%|██████████| 77/77 [01:17<00:00,  1.01s/it, WMAPE=2.08, DICE=0.0617, DPEAKS=33.8, Loss=0.00631]
Validate Epoch 1: 100%|██████████| 20/20 [00:11<00:00,  1.75it/s, WMAPE=1.86, DICE=0.0555, DPEAKS=31.7, Loss=0.00545]


Saving best model
Epoch [2/100]


Train Epoch 2: 100%|██████████| 77/77 [01:13<00:00,  1.05it/s, WMAPE=1.89, DICE=0.0572, DPEAKS=29.8, Loss=0.00566]
Validate Epoch 2: 100%|██████████| 20/20 [00:10<00:00,  1.85it/s, WMAPE=2.08, DICE=0.0559, DPEAKS=34.5, Loss=0.00593]


Epoch [3/100]


Train Epoch 3: 100%|██████████| 77/77 [01:14<00:00,  1.04it/s, WMAPE=1.79, DICE=0.0556, DPEAKS=30.4, Loss=0.00536]
Validate Epoch 3: 100%|██████████| 20/20 [00:10<00:00,  1.84it/s, WMAPE=1.86, DICE=0.055, DPEAKS=31.5, Loss=0.00539]


Saving best model
Epoch [4/100]


Train Epoch 4: 100%|██████████| 77/77 [01:12<00:00,  1.06it/s, WMAPE=1.78, DICE=0.0555, DPEAKS=28.7, Loss=0.00529]
Validate Epoch 4: 100%|██████████| 20/20 [00:10<00:00,  1.90it/s, WMAPE=1.89, DICE=0.0551, DPEAKS=31.6, Loss=0.00569]


Epoch [5/100]


Train Epoch 5: 100%|██████████| 77/77 [01:12<00:00,  1.06it/s, WMAPE=1.75, DICE=0.0555, DPEAKS=28.8, Loss=0.00527]
Validate Epoch 5: 100%|██████████| 20/20 [00:10<00:00,  1.88it/s, WMAPE=1.83, DICE=0.0549, DPEAKS=31.9, Loss=0.00542]


Epoch [6/100]


Train Epoch 6: 100%|██████████| 77/77 [01:11<00:00,  1.08it/s, WMAPE=1.72, DICE=0.0555, DPEAKS=29.3, Loss=0.00515]
Validate Epoch 6: 100%|██████████| 20/20 [00:10<00:00,  1.91it/s, WMAPE=1.79, DICE=0.055, DPEAKS=33.3, Loss=0.0054]


Epoch [7/100]


Train Epoch 7: 100%|██████████| 77/77 [01:11<00:00,  1.08it/s, WMAPE=1.72, DICE=0.056, DPEAKS=30.3, Loss=0.00517]
Validate Epoch 7: 100%|██████████| 20/20 [00:10<00:00,  1.98it/s, WMAPE=1.98, DICE=0.0568, DPEAKS=35.5, Loss=0.006]


Epoch [8/100]


Train Epoch 8: 100%|██████████| 77/77 [01:09<00:00,  1.10it/s, WMAPE=1.7, DICE=0.0558, DPEAKS=29.6, Loss=0.00511]
Validate Epoch 8: 100%|██████████| 20/20 [00:10<00:00,  1.98it/s, WMAPE=1.88, DICE=0.0553, DPEAKS=32.2, Loss=0.00552]


early stopping: 5 epochs without improvement
Training complete.


Validate Epoch test: 100%|██████████| 486/486 [02:58<00:00,  2.72it/s, WMAPE=1.83, DICE=0.0552, DPEAKS=31.1, Loss=0.00531]


Partition 19: training decoder
Loaded best model from partition 18
Epoch [1/100]


Train Epoch 1: 100%|██████████| 77/77 [01:13<00:00,  1.05it/s, WMAPE=2.19, DICE=0.0616, DPEAKS=35.2, Loss=0.00661]
Validate Epoch 1: 100%|██████████| 20/20 [00:11<00:00,  1.77it/s, WMAPE=1.7, DICE=0.0557, DPEAKS=31.3, Loss=0.00519]


Saving best model
Epoch [2/100]


Train Epoch 2: 100%|██████████| 77/77 [01:09<00:00,  1.11it/s, WMAPE=1.83, DICE=0.0555, DPEAKS=30, Loss=0.0054]
Validate Epoch 2: 100%|██████████| 20/20 [00:10<00:00,  1.98it/s, WMAPE=1.74, DICE=0.055, DPEAKS=30.5, Loss=0.00541]


Epoch [3/100]


Train Epoch 3: 100%|██████████| 77/77 [01:10<00:00,  1.09it/s, WMAPE=1.81, DICE=0.055, DPEAKS=27.9, Loss=0.00533]
Validate Epoch 3: 100%|██████████| 20/20 [00:10<00:00,  1.98it/s, WMAPE=1.89, DICE=0.0554, DPEAKS=31.5, Loss=0.00558]


Epoch [4/100]


Train Epoch 4: 100%|██████████| 77/77 [01:08<00:00,  1.12it/s, WMAPE=1.77, DICE=0.0552, DPEAKS=29.3, Loss=0.00523]
Validate Epoch 4: 100%|██████████| 20/20 [00:09<00:00,  2.06it/s, WMAPE=1.68, DICE=0.0554, DPEAKS=32.7, Loss=0.00513]


Saving best model
Epoch [5/100]


Train Epoch 5: 100%|██████████| 77/77 [01:05<00:00,  1.18it/s, WMAPE=1.77, DICE=0.0554, DPEAKS=28.5, Loss=0.00521]
Validate Epoch 5: 100%|██████████| 20/20 [00:09<00:00,  2.13it/s, WMAPE=1.7, DICE=0.0562, DPEAKS=31.7, Loss=0.00518]


Epoch [6/100]


Train Epoch 6: 100%|██████████| 77/77 [01:03<00:00,  1.20it/s, WMAPE=1.73, DICE=0.0551, DPEAKS=30.1, Loss=0.00509]
Validate Epoch 6: 100%|██████████| 20/20 [00:09<00:00,  2.13it/s, WMAPE=1.83, DICE=0.0556, DPEAKS=31.9, Loss=0.00534]


Epoch [7/100]


Train Epoch 7: 100%|██████████| 77/77 [01:03<00:00,  1.21it/s, WMAPE=1.81, DICE=0.0563, DPEAKS=31, Loss=0.00534]
Validate Epoch 7: 100%|██████████| 20/20 [00:09<00:00,  2.14it/s, WMAPE=1.87, DICE=0.0573, DPEAKS=31.4, Loss=0.00588]


Epoch [8/100]


Train Epoch 8: 100%|██████████| 77/77 [01:06<00:00,  1.16it/s, WMAPE=1.69, DICE=0.0553, DPEAKS=28.6, Loss=0.00502]
Validate Epoch 8: 100%|██████████| 20/20 [00:10<00:00,  1.91it/s, WMAPE=1.73, DICE=0.0549, DPEAKS=32.1, Loss=0.00524]


Epoch [9/100]


Train Epoch 9: 100%|██████████| 77/77 [01:08<00:00,  1.12it/s, WMAPE=1.65, DICE=0.0551, DPEAKS=28, Loss=0.00487]
Validate Epoch 9: 100%|██████████| 20/20 [00:09<00:00,  2.02it/s, WMAPE=1.81, DICE=0.0555, DPEAKS=30.3, Loss=0.00542]


early stopping: 5 epochs without improvement
Training complete.


Validate Epoch test: 100%|██████████| 486/486 [02:55<00:00,  2.77it/s, WMAPE=1.76, DICE=0.0552, DPEAKS=31.3, Loss=0.00521]


Partition 20: training decoder
Loaded best model from partition 19
Epoch [1/100]


Train Epoch 1: 100%|██████████| 77/77 [01:11<00:00,  1.08it/s, WMAPE=2.19, DICE=0.0644, DPEAKS=38.1, Loss=0.00667]
Validate Epoch 1: 100%|██████████| 20/20 [00:11<00:00,  1.81it/s, WMAPE=1.77, DICE=0.0551, DPEAKS=34.1, Loss=0.00522]


Saving best model
Epoch [2/100]


Train Epoch 2: 100%|██████████| 77/77 [01:08<00:00,  1.13it/s, WMAPE=1.79, DICE=0.0549, DPEAKS=31.5, Loss=0.0054]
Validate Epoch 2: 100%|██████████| 20/20 [00:09<00:00,  2.07it/s, WMAPE=1.78, DICE=0.055, DPEAKS=31.4, Loss=0.00518]


Saving best model
Epoch [3/100]


Train Epoch 3: 100%|██████████| 77/77 [01:04<00:00,  1.19it/s, WMAPE=1.79, DICE=0.0549, DPEAKS=31.9, Loss=0.00539]
Validate Epoch 3: 100%|██████████| 20/20 [00:09<00:00,  2.12it/s, WMAPE=1.85, DICE=0.0546, DPEAKS=31.2, Loss=0.00537]


Epoch [4/100]


Train Epoch 4: 100%|██████████| 77/77 [01:03<00:00,  1.21it/s, WMAPE=1.78, DICE=0.0554, DPEAKS=31.6, Loss=0.00535]
Validate Epoch 4: 100%|██████████| 20/20 [00:09<00:00,  2.14it/s, WMAPE=1.84, DICE=0.056, DPEAKS=33.2, Loss=0.00534]


Epoch [5/100]


Train Epoch 5: 100%|██████████| 77/77 [01:03<00:00,  1.21it/s, WMAPE=1.73, DICE=0.0548, DPEAKS=31.6, Loss=0.0052]
Validate Epoch 5: 100%|██████████| 20/20 [00:09<00:00,  2.03it/s, WMAPE=1.78, DICE=0.0549, DPEAKS=32.5, Loss=0.00518]


Epoch [6/100]


Train Epoch 6: 100%|██████████| 77/77 [01:07<00:00,  1.14it/s, WMAPE=1.74, DICE=0.0549, DPEAKS=31.8, Loss=0.00523]
Validate Epoch 6: 100%|██████████| 20/20 [00:09<00:00,  2.06it/s, WMAPE=1.91, DICE=0.0557, DPEAKS=33.7, Loss=0.00547]


Epoch [7/100]


Train Epoch 7: 100%|██████████| 77/77 [01:06<00:00,  1.17it/s, WMAPE=1.74, DICE=0.0554, DPEAKS=31.7, Loss=0.00525]
Validate Epoch 7: 100%|██████████| 20/20 [00:09<00:00,  2.02it/s, WMAPE=1.83, DICE=0.0551, DPEAKS=32.9, Loss=0.00529]


Epoch [8/100]


Train Epoch 8: 100%|██████████| 77/77 [01:05<00:00,  1.18it/s, WMAPE=1.68, DICE=0.0551, DPEAKS=32.3, Loss=0.00505]
Validate Epoch 8: 100%|██████████| 20/20 [00:09<00:00,  2.10it/s, WMAPE=1.81, DICE=0.0553, DPEAKS=32.5, Loss=0.00525]


early stopping: 6 epochs without improvement
Training complete.


Validate Epoch test: 100%|██████████| 486/486 [02:52<00:00,  2.81it/s, WMAPE=1.78, DICE=0.055, DPEAKS=30.4, Loss=0.00521]
