## Carga modulo comun

In [1]:
import sys
import os
sys.path.append(os.path.abspath('../../common'))

In [2]:
import torch
import torch.nn as nn
import torch.nn.functional as F

from purrfect.dataset import EPKADataset, load_partition,save_partition, create_train_valid_loaders
from torch.utils.data import DataLoader

from purrfect.training import train_model,train_validate
import torch.optim as optim

from purrfect.metrics import MetricAccumulator
from purrfect.active_learning import create_new_partition,create_next_partitions, test_model

from sklearn.model_selection import train_test_split
from purrfect.submission import create_submission

In [3]:
DEVICE = torch.device('cuda' if torch.cuda.is_available() else 'cpu')

## Definición modelo

In [4]:
# Define the double convolution block
class DoubleConv(nn.Module):
    def __init__(self, in_channels, out_channels):
        super(DoubleConv, self).__init__()
        self.conv = nn.Sequential(
            nn.Conv2d(in_channels, out_channels, kernel_size=3, padding=1),
            nn.BatchNorm2d(out_channels),
            nn.ReLU(inplace=True),
            nn.Conv2d(out_channels, out_channels, kernel_size=3, padding=1),
            nn.BatchNorm2d(out_channels),
            nn.ReLU(inplace=True)
        )

    def forward(self, x):
        return self.conv(x)

class ChannelAdder(nn.Module):
    def __init__(self):
        super(ChannelAdder, self).__init__()
        # Define Sobel and Laplacian kernels as tensors
        self.sobel_x = torch.tensor([[-1., 0., 1.],
                                     [-2., 0., 2.],
                                     [-1., 0., 1.]], dtype=torch.float32,device=DEVICE).unsqueeze(0).unsqueeze(0)
        
        self.sobel_y = torch.tensor([[-1., -2., -1.],
                                     [ 0.,  0.,  0.],
                                     [ 1.,  2.,  1.]], dtype=torch.float32,device=DEVICE).unsqueeze(0).unsqueeze(0)
        
        self.laplacian_kernel = torch.tensor([[0.,  1., 0.],
                                              [1., -4., 1.],
                                              [0.,  1., 0.]], dtype=torch.float32,device=DEVICE).unsqueeze(0).unsqueeze(0)

    def forward(self, x):
        epsilon = 1e-8

        # Extract the first, second, and third channels
        first_channel = x[:, 0, :, :].unsqueeze(1)  # e1 (first channel)
        second_channel = x[:, 1, :, :].unsqueeze(1)  # e2 (second channel)
        third_channel = x[:, 2, :, :].unsqueeze(1)  # error (third channel)

        # 1. Compute the first new channel: sqrt(first_channel^2 + second_channel^2)
        new_channel1 = torch.sqrt(first_channel**2 + second_channel**2)

        # 2. Compute the second new channel: 1/2 * arctan(channel2 / channel1)
        new_channel2 = 0.5 * torch.atan(second_channel / (first_channel + epsilon))

        # 3. Compute Sobel gradients and Laplacians for e1 (first_channel)
        grad_e1_x = F.conv2d(first_channel, self.sobel_x, padding=1)
        grad_e1_y = F.conv2d(first_channel, self.sobel_y, padding=1)
        grad_e1_magnitude = torch.sqrt(grad_e1_x**2 + grad_e1_y**2)
        #laplacian_e1 = F.conv2d(first_channel, self.laplacian_kernel, padding=1)

        # 4. Compute Sobel gradients and Laplacians for e2 (second_channel)
        grad_e2_x = F.conv2d(second_channel, self.sobel_x, padding=1)
        grad_e2_y = F.conv2d(second_channel, self.sobel_y, padding=1)
        grad_e2_magnitude = torch.sqrt(grad_e2_x**2 + grad_e2_y**2)
        #laplacian_e2 = F.conv2d(second_channel, self.laplacian_kernel, padding=1)

        # 5. Compute weighted ellipticity channels (e1_weighted, e2_weighted)
        e1_weighted = first_channel / (third_channel + epsilon)
        e2_weighted = second_channel / (third_channel + epsilon)

        # Concatenate all the channels (original and new) into the output tensor
        output = torch.cat([
            x,                 # Original 3 channels
            new_channel1,      # sqrt(channel1^2 + channel2^2)
            new_channel2,      # 1/2 * arctan(channel2 / channel1)
            #grad_e1_x,         # Gradient X of channel1
            #grad_e1_y,         # Gradient Y of channel1
            #grad_e2_x,         # Gradient X of channel2
            #grad_e2_y,         # Gradient Y of channel2
            grad_e1_magnitude, # Gradient magnitude of channel1
            grad_e2_magnitude, # Gradient magnitude of channel2
            #laplacian_e1,      # Laplacian of channel1
            #laplacian_e2,      # Laplacian of channel2
            e1_weighted,       # e1_weighted
            e2_weighted        # e2_weighted
        ], dim=1)

        return output

# Define the U-Net model
class UNet(nn.Module):
    def __init__(self, in_channels, out_channels):
        super(UNet, self).__init__()
        # Channel Adder
        self.channel_adder = ChannelAdder()
        # Encoder
        self.encoder1 = DoubleConv(in_channels+6, 64)
        self.encoder2 = DoubleConv(64, 128)
        self.encoder3 = DoubleConv(128, 256)
        self.encoder4 = DoubleConv(256, 512)

        # Bottleneck
        self.bottleneck = DoubleConv(512, 1024)

        # Decoder
        self.upconv4 = nn.ConvTranspose2d(1024, 512, kernel_size=2, stride=2)
        self.decoder4 = DoubleConv(1024, 512)
        self.upconv3 = nn.ConvTranspose2d(512, 256, kernel_size=2, stride=2)
        self.decoder3 = DoubleConv(512, 256)
        self.upconv2 = nn.ConvTranspose2d(256, 128, kernel_size=2, stride=2)
        self.decoder2 = DoubleConv(256, 128)
        self.upconv1 = nn.ConvTranspose2d(128, 64, kernel_size=2, stride=2)
        self.decoder1 = DoubleConv(128, 64)

        # Final output layer
        self.final_conv = nn.Conv2d(64, out_channels, kernel_size=1)

    def forward(self, x):
        # Agregar features
        x = self.channel_adder(x)
        
        # Encoder
        e1 = self.encoder1(x)
        e2 = self.encoder2(F.max_pool2d(e1, 2))
        e3 = self.encoder3(F.max_pool2d(e2, 2))
        e4 = self.encoder4(F.max_pool2d(e3, 2))

        # Bottleneck
        b = self.bottleneck(F.max_pool2d(e4, 2))

        # Decoder with skip connections
        d4 = self.upconv4(b)
        d4 = torch.cat((e4, d4), dim=1)
        d4 = self.decoder4(d4)

        d3 = self.upconv3(d4)
        d3 = torch.cat((e3, d3), dim=1)
        d3 = self.decoder3(d3)

        d2 = self.upconv2(d3)
        d2 = torch.cat((e2, d2), dim=1)
        d2 = self.decoder2(d2)

        d1 = self.upconv1(d2)
        d1 = torch.cat((e1, d1), dim=1)
        d1 = self.decoder1(d1)

        # Final output
        out = self.final_conv(d1)
        return out

## Creación particion inicial

In [5]:
#Creacion de particiones train y valid
init_partition = load_partition("partition_1.json")
train_partition, val_partition = train_test_split(init_partition, test_size=0.2, random_state=42)
save_partition("partition_1_train.json","partitions",train_partition)
save_partition("partition_1_val.json","partitions",val_partition)

## Carga modelo

In [6]:
#Define model
model = UNet( 3, 1)
model = model.to(DEVICE)

In [7]:

# Define Loss
criterion = torch.nn.L1Loss()
current_partition = 1

In [8]:
train_loader, val_loader = create_train_valid_loaders(
    f"partition_{current_partition}_train.json",
    f"partition_{current_partition}_val.json",
    "partitions",
    batch_size=16,
)
best_model_path = os.path.join(
    "models", f"best_model_partition_{current_partition}.pth"
)
last_checkpoint_path = os.path.join(
    "models", f"last_checkpoint_partition_{current_partition}.pth"
)
optimizer = optim.Adam(model.parameters())
train_model(
    model,
    train_loader,
    val_loader,
    best_model_path,
    last_checkpoint_path,
    criterion,
    optimizer,
    num_epochs=50,
    device=DEVICE,
    early_stopping_patience=3,
)

Epoch [1/50]


Train Epoch 1: 100%|██████████| 307/307 [02:09<00:00,  2.38it/s, WMAPE=5.39, DICE=0.24, DPEAKS=135, Loss=0.021]
Validate Epoch 1: 100%|██████████| 77/77 [00:11<00:00,  6.53it/s, WMAPE=4.17, DICE=0.131, DPEAKS=94.6, Loss=0.013]


Saving best model
Epoch [2/50]


Train Epoch 2: 100%|██████████| 307/307 [02:08<00:00,  2.40it/s, WMAPE=2.85, DICE=0.11, DPEAKS=86.9, Loss=0.00949]
Validate Epoch 2: 100%|██████████| 77/77 [00:11<00:00,  6.55it/s, WMAPE=2.37, DICE=0.103, DPEAKS=87.9, Loss=0.00815]


Saving best model
Epoch [3/50]


Train Epoch 3: 100%|██████████| 307/307 [02:09<00:00,  2.38it/s, WMAPE=2.5, DICE=0.0905, DPEAKS=75.2, Loss=0.00817]
Validate Epoch 3: 100%|██████████| 77/77 [00:11<00:00,  6.56it/s, WMAPE=2.61, DICE=0.133, DPEAKS=83.4, Loss=0.0111]


Epoch [4/50]


Train Epoch 4: 100%|██████████| 307/307 [02:08<00:00,  2.39it/s, WMAPE=2.37, DICE=0.0851, DPEAKS=73, Loss=0.00791]
Validate Epoch 4: 100%|██████████| 77/77 [00:11<00:00,  6.58it/s, WMAPE=1.82, DICE=0.0741, DPEAKS=61.6, Loss=0.00673]


Saving best model
Epoch [5/50]


Train Epoch 5: 100%|██████████| 307/307 [02:08<00:00,  2.38it/s, WMAPE=2.24, DICE=0.0724, DPEAKS=61.4, Loss=0.00725]
Validate Epoch 5: 100%|██████████| 77/77 [00:11<00:00,  6.60it/s, WMAPE=2.72, DICE=0.0708, DPEAKS=65.7, Loss=0.00828]


Epoch [6/50]


Train Epoch 6: 100%|██████████| 307/307 [02:09<00:00,  2.38it/s, WMAPE=2.28, DICE=0.0777, DPEAKS=65.6, Loss=0.00746]
Validate Epoch 6: 100%|██████████| 77/77 [00:11<00:00,  6.57it/s, WMAPE=5.81, DICE=0.215, DPEAKS=144, Loss=0.022]


Epoch [7/50]


Train Epoch 7: 100%|██████████| 307/307 [02:07<00:00,  2.40it/s, WMAPE=2.34, DICE=0.0781, DPEAKS=67.3, Loss=0.0075]
Validate Epoch 7: 100%|██████████| 77/77 [00:10<00:00,  7.06it/s, WMAPE=3.11, DICE=0.074, DPEAKS=61.3, Loss=0.00956]


early stopping: 3 epochs without improvement
Training complete.


In [9]:
#Cargar mejor modelo de la particion actual
model.load_state_dict(torch.load(best_model_path,weights_only=True))
test_model(model,criterion,device=DEVICE,batch_size=16)

Validate Epoch test: 100%|██████████| 1941/1941 [04:42<00:00,  6.87it/s, WMAPE=1.91, DICE=0.0763, DPEAKS=59.1, Loss=0.00697]


In [10]:
create_next_partitions(current_partition,model,criterion,device=DEVICE)

Validate Epoch partition_2_train: 100%|██████████| 307/307 [00:47<00:00,  6.51it/s, WMAPE=1.92, DICE=0.0762, DPEAKS=58.4, Loss=0.00694]
Validate Epoch partition_2_val: 100%|██████████| 77/77 [00:11<00:00,  6.71it/s, WMAPE=1.97, DICE=0.0756, DPEAKS=58.4, Loss=0.00698]


In [11]:
current_partition=2

In [12]:
train_loader, val_loader = create_train_valid_loaders(
    f"partition_{current_partition}_train.json",
    f"partition_{current_partition}_val.json",
    "partitions",
    batch_size=16,
)
best_model_path = os.path.join(
    "models", f"best_model_partition_{current_partition}.pth"
)
last_checkpoint_path = os.path.join(
    "models", f"last_checkpoint_partition_{current_partition}.pth"
)
optimizer = optim.Adam(model.parameters())
train_model(
    model,
    train_loader,
    val_loader,
    best_model_path,
    last_checkpoint_path,
    criterion,
    optimizer,
    num_epochs=50,
    device=DEVICE,
    early_stopping_patience=3,
)

Epoch [1/50]


Train Epoch 1:   0%|          | 0/307 [00:00<?, ?it/s]

Train Epoch 1: 100%|██████████| 307/307 [02:00<00:00,  2.54it/s, WMAPE=2.49, DICE=0.0837, DPEAKS=65.6, Loss=0.0077]
Validate Epoch 1: 100%|██████████| 77/77 [00:10<00:00,  7.03it/s, WMAPE=3.71, DICE=0.15, DPEAKS=95.2, Loss=0.0113]


Saving best model
Epoch [2/50]


Train Epoch 2: 100%|██████████| 307/307 [02:07<00:00,  2.40it/s, WMAPE=2.61, DICE=0.0857, DPEAKS=71, Loss=0.00771]
Validate Epoch 2: 100%|██████████| 77/77 [00:11<00:00,  6.54it/s, WMAPE=8.86, DICE=0.0876, DPEAKS=60.3, Loss=0.023]


Epoch [3/50]


Train Epoch 3: 100%|██████████| 307/307 [02:10<00:00,  2.35it/s, WMAPE=2.45, DICE=0.0774, DPEAKS=62.5, Loss=0.0072]
Validate Epoch 3: 100%|██████████| 77/77 [00:11<00:00,  6.54it/s, WMAPE=11, DICE=0.0909, DPEAKS=82.5, Loss=0.0303]


Epoch [4/50]


Train Epoch 4: 100%|██████████| 307/307 [02:08<00:00,  2.39it/s, WMAPE=2.28, DICE=0.0725, DPEAKS=59.4, Loss=0.00671]
Validate Epoch 4: 100%|██████████| 77/77 [00:11<00:00,  6.62it/s, WMAPE=3.02, DICE=0.12, DPEAKS=80.6, Loss=0.009]


Saving best model
Epoch [5/50]


Train Epoch 5: 100%|██████████| 307/307 [02:11<00:00,  2.34it/s, WMAPE=2.25, DICE=0.0714, DPEAKS=54, Loss=0.00664]
Validate Epoch 5: 100%|██████████| 77/77 [00:11<00:00,  6.48it/s, WMAPE=7.12, DICE=0.0757, DPEAKS=61.2, Loss=0.0202]


Epoch [6/50]


Train Epoch 6: 100%|██████████| 307/307 [02:11<00:00,  2.33it/s, WMAPE=1.99, DICE=0.0635, DPEAKS=49.1, Loss=0.00591]
Validate Epoch 6: 100%|██████████| 77/77 [00:11<00:00,  6.48it/s, WMAPE=2.19, DICE=0.0642, DPEAKS=52.1, Loss=0.0064]


Saving best model
Epoch [7/50]


Train Epoch 7: 100%|██████████| 307/307 [02:10<00:00,  2.35it/s, WMAPE=1.98, DICE=0.0622, DPEAKS=50.4, Loss=0.00586]
Validate Epoch 7: 100%|██████████| 77/77 [00:11<00:00,  6.54it/s, WMAPE=13.7, DICE=0.116, DPEAKS=71.7, Loss=0.0358]


Epoch [8/50]


Train Epoch 8: 100%|██████████| 307/307 [02:10<00:00,  2.36it/s, WMAPE=2.22, DICE=0.0728, DPEAKS=56, Loss=0.00651]
Validate Epoch 8: 100%|██████████| 77/77 [00:11<00:00,  6.56it/s, WMAPE=3.34, DICE=0.0832, DPEAKS=65.5, Loss=0.00917]


Epoch [9/50]


Train Epoch 9: 100%|██████████| 307/307 [02:09<00:00,  2.36it/s, WMAPE=1.9, DICE=0.0587, DPEAKS=48.3, Loss=0.00558]
Validate Epoch 9: 100%|██████████| 77/77 [00:11<00:00,  6.55it/s, WMAPE=2.25, DICE=0.0571, DPEAKS=47.5, Loss=0.00632]


Saving best model
Epoch [10/50]


Train Epoch 10: 100%|██████████| 307/307 [02:10<00:00,  2.36it/s, WMAPE=1.82, DICE=0.0566, DPEAKS=44.2, Loss=0.00534]
Validate Epoch 10: 100%|██████████| 77/77 [00:11<00:00,  6.52it/s, WMAPE=2.39, DICE=0.0609, DPEAKS=55.1, Loss=0.00692]


Epoch [11/50]


Train Epoch 11: 100%|██████████| 307/307 [02:10<00:00,  2.35it/s, WMAPE=1.78, DICE=0.0544, DPEAKS=42.8, Loss=0.00518]
Validate Epoch 11: 100%|██████████| 77/77 [00:11<00:00,  6.54it/s, WMAPE=2.72, DICE=0.0544, DPEAKS=41.4, Loss=0.00744]


Epoch [12/50]


Train Epoch 12: 100%|██████████| 307/307 [02:10<00:00,  2.35it/s, WMAPE=1.79, DICE=0.0539, DPEAKS=42.9, Loss=0.00528]
Validate Epoch 12: 100%|██████████| 77/77 [00:11<00:00,  6.55it/s, WMAPE=3.79, DICE=0.073, DPEAKS=66.4, Loss=0.0108]


early stopping: 3 epochs without improvement
Training complete.


In [13]:
create_next_partitions(current_partition,model,criterion,device=DEVICE)

Validate Epoch partition_3_train: 100%|██████████| 307/307 [00:49<00:00,  6.21it/s, WMAPE=3.61, DICE=0.0725, DPEAKS=61.9, Loss=0.011]
Validate Epoch partition_3_val: 100%|██████████| 77/77 [00:12<00:00,  6.23it/s, WMAPE=3.59, DICE=0.0727, DPEAKS=58.2, Loss=0.0109]


In [14]:
current_partition=3
best_model_path = os.path.join(
    "models", f"best_model_partition_{current_partition}.pth"
)
last_checkpoint_path = os.path.join(
    "models", f"last_checkpoint_partition_{current_partition}.pth"
)

In [15]:
train_loader, val_loader = create_train_valid_loaders(
    f"partition_{current_partition}_train.json",
    f"partition_{current_partition}_val.json",
    "partitions",
    batch_size=16,
)
optimizer = optim.Adam(model.parameters())
train_model(
    model,
    train_loader,
    val_loader,
    best_model_path,
    last_checkpoint_path,
    criterion,
    optimizer,
    num_epochs=50,
    device=DEVICE,
    early_stopping_patience=3,
)

Epoch [1/50]


Train Epoch 1: 100%|██████████| 307/307 [02:08<00:00,  2.38it/s, WMAPE=2.05, DICE=0.0571, DPEAKS=49.1, Loss=0.00587]
Validate Epoch 1: 100%|██████████| 77/77 [00:11<00:00,  6.60it/s, WMAPE=2.08, DICE=0.0622, DPEAKS=54.3, Loss=0.00575]


Saving best model
Epoch [2/50]


Train Epoch 2: 100%|██████████| 307/307 [02:08<00:00,  2.38it/s, WMAPE=2.02, DICE=0.0591, DPEAKS=51.2, Loss=0.00577]
Validate Epoch 2: 100%|██████████| 77/77 [00:11<00:00,  6.64it/s, WMAPE=5.84, DICE=0.0619, DPEAKS=53, Loss=0.0147]


Epoch [3/50]


Train Epoch 3: 100%|██████████| 307/307 [02:08<00:00,  2.38it/s, WMAPE=1.84, DICE=0.0536, DPEAKS=44.1, Loss=0.0053]
Validate Epoch 3: 100%|██████████| 77/77 [00:11<00:00,  6.59it/s, WMAPE=2.04, DICE=0.0609, DPEAKS=56.6, Loss=0.00597]


Epoch [4/50]


Train Epoch 4: 100%|██████████| 307/307 [02:08<00:00,  2.39it/s, WMAPE=1.8, DICE=0.0536, DPEAKS=49.5, Loss=0.00529]
Validate Epoch 4: 100%|██████████| 77/77 [00:11<00:00,  6.59it/s, WMAPE=2.05, DICE=0.0499, DPEAKS=40.8, Loss=0.00534]


Saving best model
Epoch [5/50]


Train Epoch 5: 100%|██████████| 307/307 [02:08<00:00,  2.39it/s, WMAPE=1.71, DICE=0.0497, DPEAKS=42.5, Loss=0.00498]
Validate Epoch 5: 100%|██████████| 77/77 [00:11<00:00,  6.63it/s, WMAPE=3.62, DICE=0.0495, DPEAKS=43.5, Loss=0.00953]


Epoch [6/50]


Train Epoch 6: 100%|██████████| 307/307 [02:08<00:00,  2.40it/s, WMAPE=1.68, DICE=0.0493, DPEAKS=42.1, Loss=0.00488]
Validate Epoch 6: 100%|██████████| 77/77 [00:11<00:00,  6.63it/s, WMAPE=2.08, DICE=0.0511, DPEAKS=46.3, Loss=0.0058]


Epoch [7/50]


Train Epoch 7: 100%|██████████| 307/307 [02:08<00:00,  2.39it/s, WMAPE=1.59, DICE=0.0473, DPEAKS=38.3, Loss=0.00458]
Validate Epoch 7: 100%|██████████| 77/77 [00:11<00:00,  6.59it/s, WMAPE=2.2, DICE=0.0616, DPEAKS=55.9, Loss=0.00639]


early stopping: 3 epochs without improvement
Training complete.


In [16]:
#Cargar mejor modelo de la particion actual
model.load_state_dict(torch.load(best_model_path,weights_only=True))
test_model(model,criterion,device=DEVICE,batch_size=16)
create_next_partitions(current_partition,model,criterion,device=DEVICE)

Validate Epoch test: 100%|██████████| 1941/1941 [04:56<00:00,  6.55it/s, WMAPE=1.85, DICE=0.0492, DPEAKS=34.6, Loss=0.00542]
Validate Epoch partition_4_train: 100%|██████████| 307/307 [00:49<00:00,  6.22it/s, WMAPE=1.82, DICE=0.0491, DPEAKS=35.7, Loss=0.00536]
Validate Epoch partition_4_val: 100%|██████████| 77/77 [00:12<00:00,  6.26it/s, WMAPE=1.87, DICE=0.0494, DPEAKS=32.6, Loss=0.00539]


In [8]:
current_partition=4

In [9]:
train_loader, val_loader = create_train_valid_loaders(
    f"partition_{current_partition}_train.json",
    f"partition_{current_partition}_val.json",
    "partitions",
    batch_size=16,
)
best_model_path = os.path.join(
    "models", f"best_model_partition_{current_partition}.pth"
)
last_checkpoint_path = os.path.join(
    "models", f"last_checkpoint_partition_{current_partition}.pth"
)
optimizer = optim.Adam(model.parameters(), lr=0.00001)
train_model(
    model,
    train_loader,
    val_loader,
    best_model_path,
    last_checkpoint_path,
    criterion,
    optimizer,
    num_epochs=50,
    device=DEVICE,
    early_stopping_patience=3,
)

Epoch [1/50]


Train Epoch 1: 100%|██████████| 307/307 [02:07<00:00,  2.41it/s, loss=0.0474]
Validate Epoch 1: 100%|██████████| 77/77 [00:11<00:00,  6.47it/s, loss=0.0462]


Saving best model
Epoch [2/50]


Train Epoch 2: 100%|██████████| 307/307 [02:03<00:00,  2.49it/s, loss=0.032] 
Validate Epoch 2: 100%|██████████| 77/77 [00:11<00:00,  7.00it/s, loss=0.0335]


Saving best model
Epoch [3/50]


Train Epoch 3: 100%|██████████| 307/307 [02:02<00:00,  2.51it/s, loss=0.0287]
Validate Epoch 3: 100%|██████████| 77/77 [00:11<00:00,  6.50it/s, loss=0.0297]


Saving best model
Epoch [4/50]


Train Epoch 4: 100%|██████████| 307/307 [02:02<00:00,  2.50it/s, loss=0.0232]
Validate Epoch 4: 100%|██████████| 77/77 [00:10<00:00,  7.19it/s, loss=0.0239]


Saving best model
Epoch [5/50]


Train Epoch 5: 100%|██████████| 307/307 [01:58<00:00,  2.59it/s, loss=0.0244]
Validate Epoch 5: 100%|██████████| 77/77 [00:10<00:00,  7.18it/s, loss=0.0213]


Saving best model
Epoch [6/50]


Train Epoch 6: 100%|██████████| 307/307 [01:58<00:00,  2.59it/s, loss=0.021] 
Validate Epoch 6: 100%|██████████| 77/77 [00:10<00:00,  7.18it/s, loss=0.0199]


Saving best model
Epoch [7/50]


Train Epoch 7: 100%|██████████| 307/307 [01:58<00:00,  2.58it/s, loss=0.0179]
Validate Epoch 7: 100%|██████████| 77/77 [00:10<00:00,  7.15it/s, loss=0.0195]


Saving best model
Epoch [8/50]


Train Epoch 8: 100%|██████████| 307/307 [01:58<00:00,  2.59it/s, loss=0.0173]
Validate Epoch 8: 100%|██████████| 77/77 [00:10<00:00,  7.11it/s, loss=0.0225]


Epoch [9/50]


Train Epoch 9: 100%|██████████| 307/307 [02:05<00:00,  2.44it/s, loss=0.017] 
Validate Epoch 9: 100%|██████████| 77/77 [00:11<00:00,  6.55it/s, loss=0.0204]


Epoch [10/50]


Train Epoch 10: 100%|██████████| 307/307 [02:09<00:00,  2.36it/s, loss=0.022] 
Validate Epoch 10: 100%|██████████| 77/77 [00:11<00:00,  6.56it/s, loss=0.0185]


Saving best model
Epoch [11/50]


Train Epoch 11: 100%|██████████| 307/307 [02:10<00:00,  2.36it/s, loss=0.0159]
Validate Epoch 11: 100%|██████████| 77/77 [00:11<00:00,  6.53it/s, loss=0.0174]


Saving best model
Epoch [12/50]


Train Epoch 12: 100%|██████████| 307/307 [02:10<00:00,  2.35it/s, loss=0.0169]
Validate Epoch 12: 100%|██████████| 77/77 [00:11<00:00,  6.52it/s, loss=0.0179]


Saving best model
Epoch [13/50]


Train Epoch 13: 100%|██████████| 307/307 [02:11<00:00,  2.34it/s, loss=0.0475]
Validate Epoch 13: 100%|██████████| 77/77 [00:11<00:00,  6.51it/s, loss=0.0503]


Epoch [14/50]


Train Epoch 14: 100%|██████████| 307/307 [02:11<00:00,  2.33it/s, loss=0.0154]
Validate Epoch 14: 100%|██████████| 77/77 [00:11<00:00,  6.44it/s, loss=0.0178]


Saving best model
Epoch [15/50]


Train Epoch 15: 100%|██████████| 307/307 [02:10<00:00,  2.35it/s, loss=0.0152]
Validate Epoch 15: 100%|██████████| 77/77 [00:10<00:00,  7.04it/s, loss=0.018] 


Epoch [16/50]


Train Epoch 16: 100%|██████████| 307/307 [02:00<00:00,  2.54it/s, loss=0.0164]
Validate Epoch 16: 100%|██████████| 77/77 [00:10<00:00,  7.06it/s, loss=0.018] 


Epoch [17/50]


Train Epoch 17: 100%|██████████| 307/307 [02:00<00:00,  2.54it/s, loss=0.0139]
Validate Epoch 17: 100%|██████████| 77/77 [00:10<00:00,  7.05it/s, loss=0.0181]


early stopping: 3 epochs without improvement
Training complete.


In [10]:
#Cargar mejor modelo de la particion actual
model.load_state_dict(torch.load(best_model_path,weights_only=True))
test_model(model,criterion,device=DEVICE,batch_size=16)
create_next_partitions(current_partition,model,criterion,device=DEVICE)

Validate Epoch test: 100%|██████████| 1941/1941 [04:53<00:00,  6.62it/s, loss=0.0201]
Validate Epoch partition_5_train: 100%|██████████| 307/307 [00:50<00:00,  6.05it/s, loss=0.0164]
Validate Epoch partition_5_val: 100%|██████████| 77/77 [00:12<00:00,  6.09it/s, loss=0.0192]


In [7]:
current_partition=5

In [8]:
train_loader, val_loader = create_train_valid_loaders(
    f"partition_{current_partition}_train.json",
    f"partition_{current_partition}_val.json",
    "partitions",
    batch_size=16,
)
best_model_path = os.path.join(
    "models", f"best_model_partition_{current_partition}.pth"
)
last_checkpoint_path = os.path.join(
    "models", f"last_checkpoint_partition_{current_partition}.pth"
)
optimizer = optim.Adam(model.parameters(), lr=0.00001)
train_model(
    model,
    train_loader,
    val_loader,
    best_model_path,
    last_checkpoint_path,
    criterion,
    optimizer,
    num_epochs=50,
    device=DEVICE,
    early_stopping_patience=3,
)

Epoch [8/50]


Train Epoch 8: 100%|██████████| 307/307 [02:08<00:00,  2.40it/s, WMAPE=4.54, DICE=0.228, DPEAKS=124, Loss=0.013]
Validate Epoch 8: 100%|██████████| 77/77 [00:11<00:00,  6.61it/s, WMAPE=5.91, DICE=0.289, DPEAKS=146, Loss=0.0178]


Epoch [9/50]


Train Epoch 9: 100%|██████████| 307/307 [02:07<00:00,  2.41it/s, WMAPE=4.5, DICE=0.224, DPEAKS=123, Loss=0.0128]
Validate Epoch 9: 100%|██████████| 77/77 [00:11<00:00,  6.56it/s, WMAPE=5.66, DICE=0.289, DPEAKS=150, Loss=0.0196]


early stopping: 3 epochs without improvement
Training complete.


In [9]:
#Cargar mejor modelo de la particion actual
model.load_state_dict(torch.load(best_model_path,weights_only=True))
test_model(model,criterion,device=DEVICE,batch_size=16)
create_next_partitions(current_partition,model,criterion,device=DEVICE)

Validate Epoch test: 100%|██████████| 1941/1941 [04:56<00:00,  6.54it/s, WMAPE=4.41, DICE=0.272, DPEAKS=125, Loss=0.0174]
Validate Epoch partition_6_train: 100%|██████████| 307/307 [00:51<00:00,  5.97it/s, WMAPE=4.37, DICE=0.271, DPEAKS=123, Loss=0.0175]
Validate Epoch partition_6_val: 100%|██████████| 77/77 [00:12<00:00,  6.01it/s, WMAPE=4.67, DICE=0.272, DPEAKS=128, Loss=0.0176]


In [7]:
current_partition=3
best_model_path = os.path.join(
    "models", f"best_model_partition_{current_partition}.pth"
)
model.load_state_dict(torch.load(best_model_path,weights_only=True))
create_submission(model, "partition_3",submission_path="submissions",device=DEVICE)

                                                                                        