# Multi-task SELD (Sound Event Localization and Detection)


In [1]:
import torch
from torchinfo import summary

from datasets import create_dataloaders
from multi_task import MultiTaskSELD, train_model

# --- Configuration shared by the cells below -------------------------------
SAMPLE_RATE = 24000               # audio sample rate (presumably Hz -- confirm against the dataset)
FRAME_LENGTH = SAMPLE_RATE // 10  # one tenth of SAMPLE_RATE, i.e. 2400
MAX_EVENTS = 5                    # forwarded to the model as `num_events`
NUM_CLASSES = 13                  # forwarded to the model as `num_classes`
BATCH_SIZE = 256                  # forwarded to `create_dataloaders`

# Seed PyTorch's global RNG so that a fresh "Restart & Run All" starts every
# run from the same random state. Without this, differences between the
# training runs below cannot be separated from seed-to-seed variance.
# NOTE: this does not force deterministic CUDA kernels; see the PyTorch
# reproducibility notes if bit-exact repeatability is required.
SEED = 42
torch.manual_seed(SEED)

# Prefer the GPU when one is visible, otherwise fall back to the CPU.
device = torch.device('cuda' if torch.cuda.is_available() else 'cpu')
print(f'Using device: {device}')

Using device: cuda


## Model

In [2]:
# Keyword arguments forwarded verbatim to MultiTaskSELD(**model_args).
model_args = dict(
    backbone='seldnet',
    num_classes=NUM_CLASSES,
    num_events=MAX_EVENTS,
    input_dim=7,
    hidden_dim=64,
    dropout=0.05,
    rnn_layers=2,
    mhsa_layers=2,
)

# Only the first returned loader is used here; the second value is ignored.
train_dataloader, _ = create_dataloaders(BATCH_SIZE)
model = MultiTaskSELD(**model_args)

# Pull a single batch and keep its first element as the example input that
# torchinfo runs through the model to report per-layer output shapes.
features, *_ = next(iter(train_dataloader))
summary(model, input_data=[features])

Layer (type:depth-idx)                   Output Shape              Param #
MultiTaskSELD                            [256, 50, 13, 4]          --
├─SELDNetBackbone: 1-1                   [256, 50, 128]            --
│    └─Sequential: 2-1                   [256, 64, 2, 50]          --
│    │    └─ConvBlock: 3-1               [256, 64, 16, 50]         4,224
│    │    └─ConvBlock: 3-2               [256, 64, 4, 50]          37,056
│    │    └─ConvBlock: 3-3               [256, 64, 2, 50]          37,056
│    └─GRU: 2-2                          [256, 50, 256]            494,592
│    └─ModuleList: 2-5                   --                        (recursive)
│    │    └─MultiheadAttention: 3-4      [256, 50, 128]            66,048
│    └─ModuleList: 2-6                   --                        (recursive)
│    │    └─LayerNorm: 3-5               [256, 50, 128]            256
│    └─ModuleList: 2-5                   --                        (recursive)
│    │    └─MultiheadAttention: 3-6  

## Evaluation

In [3]:
# Baseline run: the dataloaders are created without the `normalized` argument.
# The model configuration is the same as in the summary cell above.
model_args = dict(
    backbone='seldnet',
    num_classes=NUM_CLASSES,
    num_events=MAX_EVENTS,
    input_dim=7,
    hidden_dim=64,
    dropout=0.05,
    rnn_layers=2,
    mhsa_layers=2,
)

train_dataloader, test_dataloader = create_dataloaders(BATCH_SIZE)

# NOTE(review): sde_weight=0.0 presumably switches off an auxiliary loss term
# inside train_model -- confirm against multi_task.train_model.
model = train_model(
    model_args, train_dataloader, test_dataloader,
    epochs=250, device=device, sde_weight=0.0,
)

Epoch 1/250: 100%|██████████| 12/12 [00:17<00:00,  1.47s/it, loss=0.0566, test_loss=0.0344]
Epoch 2/250: 100%|██████████| 12/12 [00:17<00:00,  1.44s/it, loss=0.0278, test_loss=0.0308]
Epoch 3/250: 100%|██████████| 12/12 [00:17<00:00,  1.42s/it, loss=0.0256, test_loss=0.0294]
Epoch 4/250: 100%|██████████| 12/12 [00:17<00:00,  1.44s/it, loss=0.0239, test_loss=0.0289]
Epoch 5/250: 100%|██████████| 12/12 [00:17<00:00,  1.43s/it, loss=0.0225, test_loss=0.0293]
Epoch 6/250: 100%|██████████| 12/12 [00:17<00:00,  1.49s/it, loss=0.0213, test_loss=0.0293]
Epoch 7/250: 100%|██████████| 12/12 [00:18<00:00,  1.52s/it, loss=0.0201, test_loss=0.0296]
Epoch 8/250: 100%|██████████| 12/12 [00:19<00:00,  1.59s/it, loss=0.0188, test_loss=0.0294]
Epoch 9/250: 100%|██████████| 12/12 [00:19<00:00,  1.63s/it, loss=0.0177, test_loss=0.0302]
Epoch 10/250: 100%|██████████| 12/12 [00:19<00:00,  1.59s/it, loss=0.0165, test_loss=0.0291]


Macro: ER=0.89, F=0.04, LE=134.01, LR=0.08
Micro: ER=0.89, F=0.10, LE=31.64, LR=0.17


Epoch 11/250: 100%|██████████| 12/12 [00:20<00:00,  1.68s/it, loss=0.0155, test_loss=0.0283]
Epoch 12/250: 100%|██████████| 12/12 [00:20<00:00,  1.72s/it, loss=0.0144, test_loss=0.0297]
Epoch 13/250: 100%|██████████| 12/12 [00:19<00:00,  1.66s/it, loss=0.0137, test_loss=0.0275]
Epoch 14/250: 100%|██████████| 12/12 [00:20<00:00,  1.74s/it, loss=0.013, test_loss=0.0282]
Epoch 15/250: 100%|██████████| 12/12 [00:20<00:00,  1.72s/it, loss=0.0123, test_loss=0.0269]
Epoch 16/250: 100%|██████████| 12/12 [00:20<00:00,  1.72s/it, loss=0.0119, test_loss=0.0277]
Epoch 17/250: 100%|██████████| 12/12 [00:21<00:00,  1.77s/it, loss=0.0114, test_loss=0.0271]
Epoch 18/250: 100%|██████████| 12/12 [00:21<00:00,  1.77s/it, loss=0.0109, test_loss=0.0281]
Epoch 19/250: 100%|██████████| 12/12 [00:21<00:00,  1.78s/it, loss=0.0106, test_loss=0.0273]
Epoch 20/250: 100%|██████████| 12/12 [00:21<00:00,  1.78s/it, loss=0.0102, test_loss=0.0264]


Macro: ER=0.79, F=0.07, LE=134.17, LR=0.16
Micro: ER=0.79, F=0.19, LE=30.97, LR=0.39


Epoch 21/250: 100%|██████████| 12/12 [00:21<00:00,  1.81s/it, loss=0.0099, test_loss=0.0273]
Epoch 22/250: 100%|██████████| 12/12 [00:21<00:00,  1.80s/it, loss=0.0096, test_loss=0.027]
Epoch 23/250: 100%|██████████| 12/12 [00:21<00:00,  1.82s/it, loss=0.00929, test_loss=0.0268]
Epoch 24/250: 100%|██████████| 12/12 [00:21<00:00,  1.82s/it, loss=0.00918, test_loss=0.0262]
Epoch 25/250: 100%|██████████| 12/12 [00:21<00:00,  1.82s/it, loss=0.00899, test_loss=0.0289]
Epoch 26/250: 100%|██████████| 12/12 [00:21<00:00,  1.82s/it, loss=0.00884, test_loss=0.0275]
Epoch 27/250: 100%|██████████| 12/12 [00:21<00:00,  1.79s/it, loss=0.00878, test_loss=0.0268]
Epoch 28/250: 100%|██████████| 12/12 [00:21<00:00,  1.81s/it, loss=0.00847, test_loss=0.0266]
Epoch 29/250: 100%|██████████| 12/12 [00:21<00:00,  1.81s/it, loss=0.00832, test_loss=0.0277]
Epoch 30/250: 100%|██████████| 12/12 [00:21<00:00,  1.80s/it, loss=0.00823, test_loss=0.0259]


Macro: ER=0.77, F=0.09, LE=123.77, LR=0.18
Micro: ER=0.77, F=0.24, LE=31.19, LR=0.44


Epoch 31/250: 100%|██████████| 12/12 [00:21<00:00,  1.78s/it, loss=0.00807, test_loss=0.0256]
Epoch 32/250: 100%|██████████| 12/12 [00:21<00:00,  1.78s/it, loss=0.00812, test_loss=0.0261]
Epoch 33/250: 100%|██████████| 12/12 [00:21<00:00,  1.83s/it, loss=0.00794, test_loss=0.0269]
Epoch 34/250: 100%|██████████| 12/12 [00:21<00:00,  1.79s/it, loss=0.00782, test_loss=0.0263]
Epoch 35/250: 100%|██████████| 12/12 [00:21<00:00,  1.79s/it, loss=0.00777, test_loss=0.0255]
Epoch 36/250: 100%|██████████| 12/12 [00:21<00:00,  1.83s/it, loss=0.00763, test_loss=0.0275]
Epoch 37/250: 100%|██████████| 12/12 [00:21<00:00,  1.78s/it, loss=0.00736, test_loss=0.0257]
Epoch 38/250: 100%|██████████| 12/12 [00:21<00:00,  1.77s/it, loss=0.00715, test_loss=0.0258]
Epoch 39/250: 100%|██████████| 12/12 [00:21<00:00,  1.76s/it, loss=0.00723, test_loss=0.0252]
Epoch 40/250: 100%|██████████| 12/12 [00:21<00:00,  1.77s/it, loss=0.00717, test_loss=0.0263]


Macro: ER=0.75, F=0.10, LE=110.74, LR=0.20
Micro: ER=0.75, F=0.26, LE=32.95, LR=0.47


Epoch 41/250: 100%|██████████| 12/12 [00:21<00:00,  1.77s/it, loss=0.0071, test_loss=0.0262]
Epoch 42/250: 100%|██████████| 12/12 [00:21<00:00,  1.77s/it, loss=0.00692, test_loss=0.0257]
Epoch 43/250: 100%|██████████| 12/12 [00:21<00:00,  1.83s/it, loss=0.0069, test_loss=0.0267]
Epoch 44/250: 100%|██████████| 12/12 [00:20<00:00,  1.75s/it, loss=0.0069, test_loss=0.0266]
Epoch 45/250: 100%|██████████| 12/12 [00:21<00:00,  1.80s/it, loss=0.00673, test_loss=0.0271]
Epoch 46/250: 100%|██████████| 12/12 [00:21<00:00,  1.75s/it, loss=0.00675, test_loss=0.0244]
Epoch 47/250: 100%|██████████| 12/12 [00:21<00:00,  1.83s/it, loss=0.00665, test_loss=0.0243]
Epoch 48/250: 100%|██████████| 12/12 [00:22<00:00,  1.83s/it, loss=0.00656, test_loss=0.0249]
Epoch 49/250: 100%|██████████| 12/12 [00:22<00:00,  1.86s/it, loss=0.00642, test_loss=0.0252]
Epoch 50/250: 100%|██████████| 12/12 [00:22<00:00,  1.88s/it, loss=0.00639, test_loss=0.0274]


Macro: ER=0.75, F=0.11, LE=110.73, LR=0.21
Micro: ER=0.75, F=0.27, LE=34.23, LR=0.49


Epoch 51/250: 100%|██████████| 12/12 [00:22<00:00,  1.85s/it, loss=0.00646, test_loss=0.0254]
Epoch 52/250: 100%|██████████| 12/12 [00:22<00:00,  1.84s/it, loss=0.0063, test_loss=0.025]
Epoch 53/250: 100%|██████████| 12/12 [00:22<00:00,  1.86s/it, loss=0.0063, test_loss=0.025]
Epoch 54/250: 100%|██████████| 12/12 [00:22<00:00,  1.86s/it, loss=0.0062, test_loss=0.0254]
Epoch 55/250: 100%|██████████| 12/12 [00:22<00:00,  1.83s/it, loss=0.00616, test_loss=0.0246]
Epoch 56/250: 100%|██████████| 12/12 [00:22<00:00,  1.88s/it, loss=0.00617, test_loss=0.0264]
Epoch 57/250: 100%|██████████| 12/12 [00:22<00:00,  1.86s/it, loss=0.00605, test_loss=0.0254]
Epoch 58/250: 100%|██████████| 12/12 [00:22<00:00,  1.88s/it, loss=0.0061, test_loss=0.0257]
Epoch 59/250: 100%|██████████| 12/12 [00:21<00:00,  1.82s/it, loss=0.00599, test_loss=0.0257]
Epoch 60/250: 100%|██████████| 12/12 [00:22<00:00,  1.85s/it, loss=0.00597, test_loss=0.0245]


Macro: ER=0.73, F=0.12, LE=101.95, LR=0.21
Micro: ER=0.73, F=0.29, LE=28.79, LR=0.49


Epoch 61/250: 100%|██████████| 12/12 [00:22<00:00,  1.87s/it, loss=0.00589, test_loss=0.0249]
Epoch 62/250: 100%|██████████| 12/12 [00:21<00:00,  1.82s/it, loss=0.0058, test_loss=0.0242]
Epoch 63/250: 100%|██████████| 12/12 [00:22<00:00,  1.87s/it, loss=0.00578, test_loss=0.0262]
Epoch 64/250: 100%|██████████| 12/12 [00:22<00:00,  1.86s/it, loss=0.00569, test_loss=0.0262]
Epoch 65/250: 100%|██████████| 12/12 [00:21<00:00,  1.82s/it, loss=0.00569, test_loss=0.0247]
Epoch 66/250: 100%|██████████| 12/12 [00:22<00:00,  1.83s/it, loss=0.0057, test_loss=0.0253]
Epoch 67/250: 100%|██████████| 12/12 [00:22<00:00,  1.86s/it, loss=0.00562, test_loss=0.0256]
Epoch 68/250: 100%|██████████| 12/12 [00:22<00:00,  1.84s/it, loss=0.00559, test_loss=0.025]
Epoch 69/250: 100%|██████████| 12/12 [00:22<00:00,  1.85s/it, loss=0.00553, test_loss=0.025]
Epoch 70/250: 100%|██████████| 12/12 [00:21<00:00,  1.81s/it, loss=0.00543, test_loss=0.025]


Macro: ER=0.74, F=0.11, LE=101.71, LR=0.21
Micro: ER=0.74, F=0.28, LE=29.15, LR=0.49


Epoch 71/250: 100%|██████████| 12/12 [00:21<00:00,  1.82s/it, loss=0.00539, test_loss=0.024]
Epoch 72/250: 100%|██████████| 12/12 [00:22<00:00,  1.87s/it, loss=0.00546, test_loss=0.0262]
Epoch 73/250: 100%|██████████| 12/12 [00:22<00:00,  1.87s/it, loss=0.00534, test_loss=0.0265]
Epoch 74/250: 100%|██████████| 12/12 [00:21<00:00,  1.83s/it, loss=0.00524, test_loss=0.0253]
Epoch 75/250: 100%|██████████| 12/12 [00:22<00:00,  1.87s/it, loss=0.0052, test_loss=0.0259]
Epoch 76/250: 100%|██████████| 12/12 [00:22<00:00,  1.86s/it, loss=0.00535, test_loss=0.0266]
Epoch 77/250: 100%|██████████| 12/12 [00:22<00:00,  1.86s/it, loss=0.00523, test_loss=0.0247]
Epoch 78/250: 100%|██████████| 12/12 [00:22<00:00,  1.85s/it, loss=0.00518, test_loss=0.0253]
Epoch 79/250: 100%|██████████| 12/12 [00:22<00:00,  1.86s/it, loss=0.00512, test_loss=0.0252]
Epoch 80/250: 100%|██████████| 12/12 [00:22<00:00,  1.84s/it, loss=0.0051, test_loss=0.0247]


Macro: ER=0.74, F=0.11, LE=79.54, LR=0.20
Micro: ER=0.74, F=0.27, LE=28.63, LR=0.48


Epoch 81/250: 100%|██████████| 12/12 [00:22<00:00,  1.89s/it, loss=0.00504, test_loss=0.0249]
Epoch 82/250: 100%|██████████| 12/12 [00:22<00:00,  1.87s/it, loss=0.00504, test_loss=0.0267]
Epoch 83/250: 100%|██████████| 12/12 [00:22<00:00,  1.85s/it, loss=0.00505, test_loss=0.0264]
Epoch 84/250: 100%|██████████| 12/12 [00:22<00:00,  1.84s/it, loss=0.005, test_loss=0.0249]
Epoch 85/250: 100%|██████████| 12/12 [00:22<00:00,  1.87s/it, loss=0.00493, test_loss=0.0246]
Epoch 86/250: 100%|██████████| 12/12 [00:21<00:00,  1.80s/it, loss=0.00486, test_loss=0.0247]
Epoch 87/250: 100%|██████████| 12/12 [00:21<00:00,  1.79s/it, loss=0.00481, test_loss=0.0265]
Epoch 88/250: 100%|██████████| 12/12 [00:21<00:00,  1.81s/it, loss=0.00486, test_loss=0.0259]
Epoch 89/250: 100%|██████████| 12/12 [00:22<00:00,  1.86s/it, loss=0.00484, test_loss=0.0248]
Epoch 90/250: 100%|██████████| 12/12 [00:21<00:00,  1.82s/it, loss=0.00478, test_loss=0.0247]


Macro: ER=0.72, F=0.13, LE=78.75, LR=0.22
Micro: ER=0.72, F=0.29, LE=28.09, LR=0.48


Epoch 91/250: 100%|██████████| 12/12 [00:21<00:00,  1.77s/it, loss=0.00473, test_loss=0.0245]
Epoch 92/250: 100%|██████████| 12/12 [00:21<00:00,  1.79s/it, loss=0.00468, test_loss=0.0259]
Epoch 93/250: 100%|██████████| 12/12 [00:21<00:00,  1.80s/it, loss=0.00468, test_loss=0.0261]
Epoch 94/250: 100%|██████████| 12/12 [00:21<00:00,  1.80s/it, loss=0.00469, test_loss=0.0241]
Epoch 95/250: 100%|██████████| 12/12 [00:21<00:00,  1.78s/it, loss=0.00458, test_loss=0.0249]
Epoch 96/250: 100%|██████████| 12/12 [00:21<00:00,  1.82s/it, loss=0.00455, test_loss=0.0256]
Epoch 97/250: 100%|██████████| 12/12 [00:22<00:00,  1.86s/it, loss=0.00454, test_loss=0.0253]
Epoch 98/250: 100%|██████████| 12/12 [00:21<00:00,  1.82s/it, loss=0.00452, test_loss=0.0253]
Epoch 99/250: 100%|██████████| 12/12 [00:22<00:00,  1.86s/it, loss=0.00447, test_loss=0.0252]
Epoch 100/250: 100%|██████████| 12/12 [00:21<00:00,  1.79s/it, loss=0.00445, test_loss=0.0244]


Macro: ER=0.72, F=0.13, LE=68.53, LR=0.23
Micro: ER=0.72, F=0.29, LE=28.58, LR=0.50


Epoch 101/250: 100%|██████████| 12/12 [00:22<00:00,  1.84s/it, loss=0.00442, test_loss=0.0256]
Epoch 102/250: 100%|██████████| 12/12 [00:22<00:00,  1.86s/it, loss=0.00446, test_loss=0.0257]
Epoch 103/250: 100%|██████████| 12/12 [00:22<00:00,  1.86s/it, loss=0.00442, test_loss=0.0268]
Epoch 104/250: 100%|██████████| 12/12 [00:21<00:00,  1.81s/it, loss=0.00434, test_loss=0.0257]
Epoch 105/250: 100%|██████████| 12/12 [00:22<00:00,  1.85s/it, loss=0.00434, test_loss=0.026]
Epoch 106/250: 100%|██████████| 12/12 [00:22<00:00,  1.86s/it, loss=0.00428, test_loss=0.0253]
Epoch 107/250: 100%|██████████| 12/12 [00:21<00:00,  1.83s/it, loss=0.00432, test_loss=0.025]
Epoch 108/250: 100%|██████████| 12/12 [00:21<00:00,  1.78s/it, loss=0.00426, test_loss=0.0253]
Epoch 109/250: 100%|██████████| 12/12 [00:21<00:00,  1.80s/it, loss=0.00431, test_loss=0.0255]
Epoch 110/250: 100%|██████████| 12/12 [00:21<00:00,  1.77s/it, loss=0.00429, test_loss=0.0246]


Macro: ER=0.72, F=0.13, LE=67.71, LR=0.24
Micro: ER=0.72, F=0.29, LE=29.47, LR=0.50


Epoch 111/250: 100%|██████████| 12/12 [00:21<00:00,  1.83s/it, loss=0.00413, test_loss=0.0262]
Epoch 112/250: 100%|██████████| 12/12 [00:22<00:00,  1.89s/it, loss=0.00415, test_loss=0.0254]
Epoch 113/250: 100%|██████████| 12/12 [00:21<00:00,  1.76s/it, loss=0.00413, test_loss=0.0256]
Epoch 114/250: 100%|██████████| 12/12 [00:21<00:00,  1.81s/it, loss=0.00407, test_loss=0.0271]
Epoch 115/250: 100%|██████████| 12/12 [00:21<00:00,  1.81s/it, loss=0.00406, test_loss=0.0256]
Epoch 116/250: 100%|██████████| 12/12 [00:22<00:00,  1.84s/it, loss=0.00395, test_loss=0.0288]
Epoch 117/250: 100%|██████████| 12/12 [00:22<00:00,  1.84s/it, loss=0.00396, test_loss=0.0271]
Epoch 118/250: 100%|██████████| 12/12 [00:21<00:00,  1.82s/it, loss=0.00393, test_loss=0.026]
Epoch 119/250: 100%|██████████| 12/12 [00:20<00:00,  1.75s/it, loss=0.00391, test_loss=0.0252]
Epoch 120/250: 100%|██████████| 12/12 [00:22<00:00,  1.84s/it, loss=0.00392, test_loss=0.0263]


Macro: ER=0.74, F=0.14, LE=45.53, LR=0.26
Micro: ER=0.74, F=0.28, LE=30.33, LR=0.53


Epoch 121/250: 100%|██████████| 12/12 [00:22<00:00,  1.88s/it, loss=0.00383, test_loss=0.0268]
Epoch 122/250: 100%|██████████| 12/12 [00:23<00:00,  1.95s/it, loss=0.00385, test_loss=0.0275]
Epoch 123/250: 100%|██████████| 12/12 [00:21<00:00,  1.82s/it, loss=0.00387, test_loss=0.0258]
Epoch 124/250: 100%|██████████| 12/12 [00:22<00:00,  1.85s/it, loss=0.00382, test_loss=0.027]
Epoch 125/250: 100%|██████████| 12/12 [00:21<00:00,  1.77s/it, loss=0.00381, test_loss=0.0259]
Epoch 126/250: 100%|██████████| 12/12 [00:21<00:00,  1.79s/it, loss=0.00383, test_loss=0.0266]
Epoch 127/250: 100%|██████████| 12/12 [00:21<00:00,  1.78s/it, loss=0.00379, test_loss=0.0264]
Epoch 128/250: 100%|██████████| 12/12 [00:22<00:00,  1.86s/it, loss=0.00379, test_loss=0.0294]
Epoch 129/250: 100%|██████████| 12/12 [00:21<00:00,  1.79s/it, loss=0.00386, test_loss=0.0247]
Epoch 130/250: 100%|██████████| 12/12 [00:22<00:00,  1.85s/it, loss=0.00377, test_loss=0.0258]


Macro: ER=0.74, F=0.14, LE=44.41, LR=0.26
Micro: ER=0.74, F=0.27, LE=29.53, LR=0.53


Epoch 131/250: 100%|██████████| 12/12 [00:22<00:00,  1.89s/it, loss=0.00365, test_loss=0.0271]
Epoch 132/250: 100%|██████████| 12/12 [00:21<00:00,  1.79s/it, loss=0.00366, test_loss=0.026]
Epoch 133/250: 100%|██████████| 12/12 [00:21<00:00,  1.75s/it, loss=0.00366, test_loss=0.025]
Epoch 134/250: 100%|██████████| 12/12 [00:21<00:00,  1.79s/it, loss=0.00362, test_loss=0.0268]
Epoch 135/250: 100%|██████████| 12/12 [00:21<00:00,  1.79s/it, loss=0.00352, test_loss=0.0265]
Epoch 136/250: 100%|██████████| 12/12 [00:20<00:00,  1.74s/it, loss=0.00356, test_loss=0.0268]
Epoch 137/250: 100%|██████████| 12/12 [00:21<00:00,  1.78s/it, loss=0.00355, test_loss=0.0269]
Epoch 138/250: 100%|██████████| 12/12 [00:21<00:00,  1.76s/it, loss=0.00355, test_loss=0.026]
Epoch 139/250: 100%|██████████| 12/12 [00:21<00:00,  1.79s/it, loss=0.00349, test_loss=0.0272]
Epoch 140/250: 100%|██████████| 12/12 [00:21<00:00,  1.76s/it, loss=0.00347, test_loss=0.0255]


Macro: ER=0.72, F=0.14, LE=43.96, LR=0.26
Micro: ER=0.72, F=0.29, LE=29.21, LR=0.53


Epoch 141/250: 100%|██████████| 12/12 [00:21<00:00,  1.80s/it, loss=0.00344, test_loss=0.0281]
Epoch 142/250: 100%|██████████| 12/12 [00:21<00:00,  1.75s/it, loss=0.00342, test_loss=0.0265]
Epoch 143/250: 100%|██████████| 12/12 [00:20<00:00,  1.74s/it, loss=0.00343, test_loss=0.0258]
Epoch 144/250: 100%|██████████| 12/12 [00:21<00:00,  1.76s/it, loss=0.00338, test_loss=0.0259]
Epoch 145/250: 100%|██████████| 12/12 [00:22<00:00,  1.86s/it, loss=0.00334, test_loss=0.0265]
Epoch 146/250: 100%|██████████| 12/12 [00:22<00:00,  1.85s/it, loss=0.00336, test_loss=0.0257]
Epoch 147/250: 100%|██████████| 12/12 [00:22<00:00,  1.84s/it, loss=0.0033, test_loss=0.0266]
Epoch 148/250: 100%|██████████| 12/12 [00:22<00:00,  1.88s/it, loss=0.00329, test_loss=0.0265]
Epoch 149/250: 100%|██████████| 12/12 [00:21<00:00,  1.80s/it, loss=0.00323, test_loss=0.027]
Epoch 150/250: 100%|██████████| 12/12 [00:21<00:00,  1.78s/it, loss=0.00328, test_loss=0.0264]


Macro: ER=0.74, F=0.15, LE=44.88, LR=0.27
Micro: ER=0.74, F=0.28, LE=29.61, LR=0.53


Epoch 151/250: 100%|██████████| 12/12 [00:21<00:00,  1.80s/it, loss=0.00327, test_loss=0.0283]
Epoch 152/250: 100%|██████████| 12/12 [00:21<00:00,  1.82s/it, loss=0.00327, test_loss=0.0278]
Epoch 153/250: 100%|██████████| 12/12 [00:21<00:00,  1.77s/it, loss=0.00325, test_loss=0.0259]
Epoch 154/250: 100%|██████████| 12/12 [00:21<00:00,  1.78s/it, loss=0.00322, test_loss=0.0262]
Epoch 155/250: 100%|██████████| 12/12 [00:21<00:00,  1.80s/it, loss=0.00312, test_loss=0.0271]
Epoch 156/250: 100%|██████████| 12/12 [00:21<00:00,  1.81s/it, loss=0.00311, test_loss=0.0272]
Epoch 157/250: 100%|██████████| 12/12 [00:21<00:00,  1.80s/it, loss=0.00312, test_loss=0.027]
Epoch 158/250: 100%|██████████| 12/12 [00:21<00:00,  1.81s/it, loss=0.00309, test_loss=0.0267]
Epoch 159/250: 100%|██████████| 12/12 [00:21<00:00,  1.77s/it, loss=0.00308, test_loss=0.0268]
Epoch 160/250: 100%|██████████| 12/12 [00:21<00:00,  1.77s/it, loss=0.0031, test_loss=0.0259]


Macro: ER=0.73, F=0.14, LE=44.80, LR=0.27
Micro: ER=0.73, F=0.29, LE=30.30, LR=0.54


Epoch 161/250: 100%|██████████| 12/12 [00:21<00:00,  1.83s/it, loss=0.00306, test_loss=0.0287]
Epoch 162/250: 100%|██████████| 12/12 [00:21<00:00,  1.78s/it, loss=0.00308, test_loss=0.0253]
Epoch 163/250: 100%|██████████| 12/12 [00:21<00:00,  1.78s/it, loss=0.00303, test_loss=0.026]
Epoch 164/250: 100%|██████████| 12/12 [00:21<00:00,  1.82s/it, loss=0.003, test_loss=0.0267]
Epoch 165/250: 100%|██████████| 12/12 [00:21<00:00,  1.80s/it, loss=0.003, test_loss=0.0289]
Epoch 166/250: 100%|██████████| 12/12 [00:21<00:00,  1.76s/it, loss=0.00302, test_loss=0.0285]
Epoch 167/250: 100%|██████████| 12/12 [00:21<00:00,  1.80s/it, loss=0.00301, test_loss=0.0266]
Epoch 168/250: 100%|██████████| 12/12 [00:21<00:00,  1.83s/it, loss=0.00296, test_loss=0.0274]
Epoch 169/250: 100%|██████████| 12/12 [00:20<00:00,  1.75s/it, loss=0.00296, test_loss=0.0253]
Epoch 170/250: 100%|██████████| 12/12 [00:21<00:00,  1.82s/it, loss=0.0029, test_loss=0.0266]


Macro: ER=0.75, F=0.15, LE=43.53, LR=0.28
Micro: ER=0.75, F=0.28, LE=29.75, LR=0.54


Epoch 171/250: 100%|██████████| 12/12 [00:21<00:00,  1.81s/it, loss=0.0029, test_loss=0.0272]
Epoch 172/250: 100%|██████████| 12/12 [00:21<00:00,  1.82s/it, loss=0.00287, test_loss=0.0274]
Epoch 173/250: 100%|██████████| 12/12 [00:21<00:00,  1.80s/it, loss=0.00285, test_loss=0.0275]
Epoch 174/250: 100%|██████████| 12/12 [00:21<00:00,  1.77s/it, loss=0.00284, test_loss=0.0274]
Epoch 175/250: 100%|██████████| 12/12 [00:21<00:00,  1.78s/it, loss=0.00283, test_loss=0.027]
Epoch 176/250: 100%|██████████| 12/12 [00:21<00:00,  1.83s/it, loss=0.00286, test_loss=0.0279]
Epoch 177/250: 100%|██████████| 12/12 [00:21<00:00,  1.77s/it, loss=0.00284, test_loss=0.0268]
Epoch 178/250: 100%|██████████| 12/12 [00:21<00:00,  1.81s/it, loss=0.00279, test_loss=0.0262]
Epoch 179/250: 100%|██████████| 12/12 [00:21<00:00,  1.79s/it, loss=0.00274, test_loss=0.0277]
Epoch 180/250: 100%|██████████| 12/12 [00:21<00:00,  1.78s/it, loss=0.0027, test_loss=0.0259]


Macro: ER=0.73, F=0.13, LE=45.00, LR=0.28
Micro: ER=0.73, F=0.29, LE=30.01, LR=0.54


Epoch 181/250: 100%|██████████| 12/12 [00:21<00:00,  1.83s/it, loss=0.00271, test_loss=0.026]
Epoch 182/250: 100%|██████████| 12/12 [00:21<00:00,  1.79s/it, loss=0.00268, test_loss=0.027]
Epoch 183/250: 100%|██████████| 12/12 [00:21<00:00,  1.80s/it, loss=0.00268, test_loss=0.0279]
Epoch 184/250: 100%|██████████| 12/12 [00:21<00:00,  1.80s/it, loss=0.00268, test_loss=0.027]
Epoch 185/250: 100%|██████████| 12/12 [00:22<00:00,  1.84s/it, loss=0.00265, test_loss=0.0288]
Epoch 186/250: 100%|██████████| 12/12 [00:21<00:00,  1.78s/it, loss=0.00266, test_loss=0.0274]
Epoch 187/250: 100%|██████████| 12/12 [00:21<00:00,  1.81s/it, loss=0.00269, test_loss=0.0281]
Epoch 188/250: 100%|██████████| 12/12 [00:21<00:00,  1.79s/it, loss=0.00265, test_loss=0.0269]
Epoch 189/250: 100%|██████████| 12/12 [00:21<00:00,  1.82s/it, loss=0.00261, test_loss=0.0273]
Epoch 190/250: 100%|██████████| 12/12 [00:21<00:00,  1.79s/it, loss=0.00257, test_loss=0.0276]


Macro: ER=0.76, F=0.14, LE=45.49, LR=0.30
Micro: ER=0.76, F=0.28, LE=30.97, LR=0.53


Epoch 191/250: 100%|██████████| 12/12 [00:21<00:00,  1.80s/it, loss=0.00259, test_loss=0.0273]
Epoch 192/250: 100%|██████████| 12/12 [00:21<00:00,  1.78s/it, loss=0.0026, test_loss=0.0259]
Epoch 193/250: 100%|██████████| 12/12 [00:21<00:00,  1.79s/it, loss=0.00255, test_loss=0.0264]
Epoch 194/250: 100%|██████████| 12/12 [00:21<00:00,  1.80s/it, loss=0.00256, test_loss=0.0278]
Epoch 195/250: 100%|██████████| 12/12 [00:21<00:00,  1.81s/it, loss=0.00256, test_loss=0.0281]
Epoch 196/250: 100%|██████████| 12/12 [00:21<00:00,  1.81s/it, loss=0.00251, test_loss=0.0294]
Epoch 197/250: 100%|██████████| 12/12 [00:21<00:00,  1.77s/it, loss=0.00258, test_loss=0.0266]
Epoch 198/250: 100%|██████████| 12/12 [00:21<00:00,  1.80s/it, loss=0.00261, test_loss=0.0267]
Epoch 199/250: 100%|██████████| 12/12 [00:21<00:00,  1.78s/it, loss=0.00262, test_loss=0.0272]
Epoch 200/250: 100%|██████████| 12/12 [00:21<00:00,  1.78s/it, loss=0.00251, test_loss=0.027]


Macro: ER=0.74, F=0.15, LE=46.00, LR=0.31
Micro: ER=0.74, F=0.29, LE=30.72, LR=0.55


Epoch 201/250: 100%|██████████| 12/12 [00:21<00:00,  1.77s/it, loss=0.00249, test_loss=0.0262]
Epoch 202/250: 100%|██████████| 12/12 [00:21<00:00,  1.80s/it, loss=0.0025, test_loss=0.0272]
Epoch 203/250: 100%|██████████| 12/12 [00:21<00:00,  1.78s/it, loss=0.00249, test_loss=0.0272]
Epoch 204/250: 100%|██████████| 12/12 [00:21<00:00,  1.82s/it, loss=0.00242, test_loss=0.0279]
Epoch 205/250: 100%|██████████| 12/12 [00:21<00:00,  1.82s/it, loss=0.00238, test_loss=0.0273]
Epoch 206/250: 100%|██████████| 12/12 [00:22<00:00,  1.83s/it, loss=0.00238, test_loss=0.0272]
Epoch 207/250: 100%|██████████| 12/12 [00:21<00:00,  1.82s/it, loss=0.00236, test_loss=0.0277]
Epoch 208/250: 100%|██████████| 12/12 [00:22<00:00,  1.85s/it, loss=0.00234, test_loss=0.0283]
Epoch 209/250: 100%|██████████| 12/12 [00:21<00:00,  1.80s/it, loss=0.00233, test_loss=0.0272]
Epoch 210/250: 100%|██████████| 12/12 [00:21<00:00,  1.81s/it, loss=0.00232, test_loss=0.0281]


Macro: ER=0.78, F=0.13, LE=48.47, LR=0.31
Micro: ER=0.78, F=0.26, LE=31.79, LR=0.56


Epoch 211/250: 100%|██████████| 12/12 [00:21<00:00,  1.78s/it, loss=0.00238, test_loss=0.0274]
Epoch 212/250: 100%|██████████| 12/12 [00:21<00:00,  1.79s/it, loss=0.0024, test_loss=0.0262]
Epoch 213/250: 100%|██████████| 12/12 [00:21<00:00,  1.78s/it, loss=0.00234, test_loss=0.028]
Epoch 214/250: 100%|██████████| 12/12 [00:21<00:00,  1.83s/it, loss=0.00229, test_loss=0.0292]
Epoch 215/250: 100%|██████████| 12/12 [00:21<00:00,  1.79s/it, loss=0.00225, test_loss=0.0285]
Epoch 216/250: 100%|██████████| 12/12 [00:21<00:00,  1.77s/it, loss=0.00223, test_loss=0.0263]
Epoch 217/250: 100%|██████████| 12/12 [00:21<00:00,  1.80s/it, loss=0.00226, test_loss=0.0282]
Epoch 218/250: 100%|██████████| 12/12 [00:21<00:00,  1.80s/it, loss=0.00226, test_loss=0.0279]
Epoch 219/250: 100%|██████████| 12/12 [00:21<00:00,  1.77s/it, loss=0.00224, test_loss=0.0275]
Epoch 220/250: 100%|██████████| 12/12 [00:21<00:00,  1.78s/it, loss=0.0022, test_loss=0.0268]


Macro: ER=0.75, F=0.14, LE=46.12, LR=0.31
Micro: ER=0.75, F=0.28, LE=30.42, LR=0.55


Epoch 221/250: 100%|██████████| 12/12 [00:21<00:00,  1.78s/it, loss=0.00222, test_loss=0.0266]
Epoch 222/250: 100%|██████████| 12/12 [00:21<00:00,  1.77s/it, loss=0.00219, test_loss=0.026]
Epoch 223/250: 100%|██████████| 12/12 [00:21<00:00,  1.81s/it, loss=0.00217, test_loss=0.0283]
Epoch 224/250: 100%|██████████| 12/12 [00:21<00:00,  1.78s/it, loss=0.00224, test_loss=0.0276]
Epoch 225/250: 100%|██████████| 12/12 [00:21<00:00,  1.78s/it, loss=0.00222, test_loss=0.0268]
Epoch 226/250: 100%|██████████| 12/12 [00:21<00:00,  1.78s/it, loss=0.00222, test_loss=0.0267]
Epoch 227/250: 100%|██████████| 12/12 [00:21<00:00,  1.80s/it, loss=0.00218, test_loss=0.0272]
Epoch 228/250: 100%|██████████| 12/12 [00:21<00:00,  1.80s/it, loss=0.00217, test_loss=0.0274]
Epoch 229/250: 100%|██████████| 12/12 [00:21<00:00,  1.82s/it, loss=0.00216, test_loss=0.0268]
Epoch 230/250: 100%|██████████| 12/12 [00:20<00:00,  1.73s/it, loss=0.00212, test_loss=0.0271]


Macro: ER=0.74, F=0.15, LE=46.55, LR=0.30
Micro: ER=0.74, F=0.28, LE=30.40, LR=0.50


Epoch 231/250: 100%|██████████| 12/12 [00:21<00:00,  1.82s/it, loss=0.00215, test_loss=0.0294]
Epoch 232/250: 100%|██████████| 12/12 [00:21<00:00,  1.76s/it, loss=0.00211, test_loss=0.0272]
Epoch 233/250: 100%|██████████| 12/12 [00:21<00:00,  1.80s/it, loss=0.00212, test_loss=0.0283]
Epoch 234/250: 100%|██████████| 12/12 [00:21<00:00,  1.79s/it, loss=0.00214, test_loss=0.0268]
Epoch 235/250: 100%|██████████| 12/12 [00:22<00:00,  1.85s/it, loss=0.00213, test_loss=0.0296]
Epoch 236/250: 100%|██████████| 12/12 [00:21<00:00,  1.76s/it, loss=0.00213, test_loss=0.027]
Epoch 237/250: 100%|██████████| 12/12 [00:21<00:00,  1.81s/it, loss=0.00214, test_loss=0.0274]
Epoch 238/250: 100%|██████████| 12/12 [00:21<00:00,  1.78s/it, loss=0.00207, test_loss=0.0275]
Epoch 239/250: 100%|██████████| 12/12 [00:21<00:00,  1.79s/it, loss=0.00204, test_loss=0.0265]
Epoch 240/250: 100%|██████████| 12/12 [00:21<00:00,  1.79s/it, loss=0.002, test_loss=0.0273]


Macro: ER=0.76, F=0.14, LE=48.73, LR=0.33
Micro: ER=0.76, F=0.29, LE=30.60, LR=0.56


Epoch 241/250: 100%|██████████| 12/12 [00:21<00:00,  1.79s/it, loss=0.002, test_loss=0.0267]
Epoch 242/250: 100%|██████████| 12/12 [00:21<00:00,  1.80s/it, loss=0.00199, test_loss=0.0275]
Epoch 243/250: 100%|██████████| 12/12 [00:21<00:00,  1.80s/it, loss=0.00197, test_loss=0.0271]
Epoch 244/250: 100%|██████████| 12/12 [00:21<00:00,  1.80s/it, loss=0.00194, test_loss=0.0284]
Epoch 245/250: 100%|██████████| 12/12 [00:21<00:00,  1.79s/it, loss=0.00191, test_loss=0.027]
Epoch 246/250: 100%|██████████| 12/12 [00:21<00:00,  1.80s/it, loss=0.00192, test_loss=0.0274]
Epoch 247/250: 100%|██████████| 12/12 [00:21<00:00,  1.81s/it, loss=0.00191, test_loss=0.027]
Epoch 248/250: 100%|██████████| 12/12 [00:21<00:00,  1.79s/it, loss=0.00195, test_loss=0.0273]
Epoch 249/250: 100%|██████████| 12/12 [00:21<00:00,  1.77s/it, loss=0.00196, test_loss=0.0274]
Epoch 250/250: 100%|██████████| 12/12 [00:21<00:00,  1.81s/it, loss=0.00205, test_loss=0.0289]

Macro: ER=0.78, F=0.15, LE=47.33, LR=0.33
Micro: ER=0.78, F=0.27, LE=31.75, LR=0.54
Micro @ epoch 189: ER=0.76, F=0.17, LE=46.21, LR=0.33
Macro @ epoch 189: ER=0.76, F=0.29, LE=30.87, LR=0.57





### Data normalization


In [3]:
# Same model configuration and training call as the previous training cell;
# the only difference is that the dataloaders are requested with
# normalized=True.
model_args = dict(
    backbone='seldnet',
    num_classes=NUM_CLASSES,
    num_events=MAX_EVENTS,
    input_dim=7,
    hidden_dim=64,
    dropout=0.05,
    rnn_layers=2,
    mhsa_layers=2,
)

train_dataloader, test_dataloader = create_dataloaders(
    BATCH_SIZE,
    normalized=True,
)

# NOTE(review): this rebinds `model`, so the model trained in the previous
# cell is no longer reachable by that name after this cell runs.
model = train_model(
    model_args, train_dataloader, test_dataloader,
    epochs=250, device=device, sde_weight=0.0,
)

Epoch 1/250: 100%|██████████| 12/12 [00:18<00:00,  1.52s/it, loss=0.0535, test_loss=0.0322]
Epoch 2/250: 100%|██████████| 12/12 [00:18<00:00,  1.51s/it, loss=0.0253, test_loss=0.0287]
Epoch 3/250: 100%|██████████| 12/12 [00:17<00:00,  1.49s/it, loss=0.0227, test_loss=0.0276]
Epoch 4/250: 100%|██████████| 12/12 [00:17<00:00,  1.46s/it, loss=0.021, test_loss=0.0272]
Epoch 5/250: 100%|██████████| 12/12 [00:18<00:00,  1.51s/it, loss=0.0198, test_loss=0.0273]
Epoch 6/250: 100%|██████████| 12/12 [00:18<00:00,  1.55s/it, loss=0.0185, test_loss=0.0276]
Epoch 7/250: 100%|██████████| 12/12 [00:18<00:00,  1.50s/it, loss=0.0175, test_loss=0.0274]
Epoch 8/250: 100%|██████████| 12/12 [00:18<00:00,  1.55s/it, loss=0.0166, test_loss=0.0281]
Epoch 9/250: 100%|██████████| 12/12 [00:18<00:00,  1.54s/it, loss=0.0157, test_loss=0.0273]
Epoch 10/250: 100%|██████████| 12/12 [00:19<00:00,  1.60s/it, loss=0.0149, test_loss=0.0265]


Macro: ER=0.85, F=0.07, LE=133.06, LR=0.09
Micro: ER=0.85, F=0.16, LE=27.56, LR=0.20


Epoch 11/250: 100%|██████████| 12/12 [00:19<00:00,  1.62s/it, loss=0.0141, test_loss=0.0273]
Epoch 12/250: 100%|██████████| 12/12 [00:19<00:00,  1.63s/it, loss=0.0135, test_loss=0.0269]
Epoch 13/250: 100%|██████████| 12/12 [00:20<00:00,  1.71s/it, loss=0.0128, test_loss=0.0273]
Epoch 14/250: 100%|██████████| 12/12 [00:20<00:00,  1.73s/it, loss=0.0125, test_loss=0.0276]
Epoch 15/250: 100%|██████████| 12/12 [00:19<00:00,  1.66s/it, loss=0.0117, test_loss=0.026]
Epoch 16/250: 100%|██████████| 12/12 [00:20<00:00,  1.71s/it, loss=0.0111, test_loss=0.0264]
Epoch 17/250: 100%|██████████| 12/12 [00:20<00:00,  1.69s/it, loss=0.0105, test_loss=0.0259]
Epoch 18/250: 100%|██████████| 12/12 [00:20<00:00,  1.73s/it, loss=0.0103, test_loss=0.026]
Epoch 19/250: 100%|██████████| 12/12 [00:20<00:00,  1.71s/it, loss=0.0099, test_loss=0.0268]
Epoch 20/250: 100%|██████████| 12/12 [00:20<00:00,  1.74s/it, loss=0.0098, test_loss=0.0267]


Macro: ER=0.79, F=0.08, LE=134.14, LR=0.16
Micro: ER=0.79, F=0.22, LE=31.30, LR=0.39


Epoch 21/250: 100%|██████████| 12/12 [00:20<00:00,  1.70s/it, loss=0.00971, test_loss=0.0271]
Epoch 22/250: 100%|██████████| 12/12 [00:21<00:00,  1.82s/it, loss=0.00939, test_loss=0.0263]
Epoch 23/250: 100%|██████████| 12/12 [00:21<00:00,  1.79s/it, loss=0.00912, test_loss=0.0268]
Epoch 24/250: 100%|██████████| 12/12 [00:21<00:00,  1.80s/it, loss=0.00875, test_loss=0.0262]
Epoch 25/250: 100%|██████████| 12/12 [00:21<00:00,  1.79s/it, loss=0.00849, test_loss=0.0263]
Epoch 26/250: 100%|██████████| 12/12 [00:21<00:00,  1.83s/it, loss=0.00833, test_loss=0.0243]
Epoch 27/250: 100%|██████████| 12/12 [00:21<00:00,  1.83s/it, loss=0.00808, test_loss=0.0255]
Epoch 28/250: 100%|██████████| 12/12 [00:21<00:00,  1.81s/it, loss=0.00808, test_loss=0.0252]
Epoch 29/250: 100%|██████████| 12/12 [00:21<00:00,  1.80s/it, loss=0.00799, test_loss=0.0248]
Epoch 30/250: 100%|██████████| 12/12 [00:20<00:00,  1.72s/it, loss=0.00779, test_loss=0.0253]


Macro: ER=0.76, F=0.09, LE=121.11, LR=0.16
Micro: ER=0.76, F=0.25, LE=28.77, LR=0.40


Epoch 31/250: 100%|██████████| 12/12 [00:21<00:00,  1.76s/it, loss=0.00775, test_loss=0.0256]
Epoch 32/250: 100%|██████████| 12/12 [00:21<00:00,  1.83s/it, loss=0.00774, test_loss=0.0254]
Epoch 33/250: 100%|██████████| 12/12 [00:21<00:00,  1.81s/it, loss=0.0075, test_loss=0.0254]
Epoch 34/250: 100%|██████████| 12/12 [00:22<00:00,  1.84s/it, loss=0.00752, test_loss=0.0249]
Epoch 35/250: 100%|██████████| 12/12 [00:21<00:00,  1.82s/it, loss=0.00731, test_loss=0.0251]
Epoch 36/250: 100%|██████████| 12/12 [00:21<00:00,  1.82s/it, loss=0.00713, test_loss=0.0254]
Epoch 37/250: 100%|██████████| 12/12 [00:21<00:00,  1.83s/it, loss=0.00705, test_loss=0.025]
Epoch 38/250: 100%|██████████| 12/12 [00:21<00:00,  1.81s/it, loss=0.00698, test_loss=0.0247]
Epoch 39/250: 100%|██████████| 12/12 [00:21<00:00,  1.81s/it, loss=0.00693, test_loss=0.0254]
Epoch 40/250: 100%|██████████| 12/12 [00:21<00:00,  1.81s/it, loss=0.0068, test_loss=0.0241]


Macro: ER=0.71, F=0.11, LE=108.56, LR=0.19
Micro: ER=0.71, F=0.30, LE=27.39, LR=0.46


Epoch 41/250: 100%|██████████| 12/12 [00:21<00:00,  1.82s/it, loss=0.00677, test_loss=0.0242]
Epoch 42/250: 100%|██████████| 12/12 [00:21<00:00,  1.83s/it, loss=0.00678, test_loss=0.0241]
Epoch 43/250: 100%|██████████| 12/12 [00:22<00:00,  1.87s/it, loss=0.00664, test_loss=0.0261]
Epoch 44/250: 100%|██████████| 12/12 [00:22<00:00,  1.86s/it, loss=0.00661, test_loss=0.025]
Epoch 45/250: 100%|██████████| 12/12 [00:21<00:00,  1.83s/it, loss=0.00639, test_loss=0.025]
Epoch 46/250: 100%|██████████| 12/12 [00:22<00:00,  1.85s/it, loss=0.00634, test_loss=0.0244]
Epoch 47/250: 100%|██████████| 12/12 [00:22<00:00,  1.88s/it, loss=0.00626, test_loss=0.0245]
Epoch 48/250: 100%|██████████| 12/12 [00:22<00:00,  1.83s/it, loss=0.00627, test_loss=0.0245]
Epoch 49/250: 100%|██████████| 12/12 [00:22<00:00,  1.86s/it, loss=0.00621, test_loss=0.0256]
Epoch 50/250: 100%|██████████| 12/12 [00:22<00:00,  1.87s/it, loss=0.00617, test_loss=0.0246]


Macro: ER=0.72, F=0.11, LE=109.06, LR=0.20
Micro: ER=0.72, F=0.30, LE=27.18, LR=0.48


Epoch 51/250: 100%|██████████| 12/12 [00:22<00:00,  1.85s/it, loss=0.00613, test_loss=0.0249]
Epoch 52/250: 100%|██████████| 12/12 [00:22<00:00,  1.85s/it, loss=0.00605, test_loss=0.0245]
Epoch 53/250: 100%|██████████| 12/12 [00:21<00:00,  1.83s/it, loss=0.00596, test_loss=0.0244]
Epoch 54/250: 100%|██████████| 12/12 [00:22<00:00,  1.86s/it, loss=0.006, test_loss=0.0255]
Epoch 55/250: 100%|██████████| 12/12 [00:22<00:00,  1.86s/it, loss=0.00597, test_loss=0.0248]
Epoch 56/250: 100%|██████████| 12/12 [00:22<00:00,  1.88s/it, loss=0.0058, test_loss=0.0249]
Epoch 57/250: 100%|██████████| 12/12 [00:22<00:00,  1.83s/it, loss=0.00579, test_loss=0.0242]
Epoch 58/250: 100%|██████████| 12/12 [00:21<00:00,  1.83s/it, loss=0.00577, test_loss=0.0239]
Epoch 59/250: 100%|██████████| 12/12 [00:22<00:00,  1.86s/it, loss=0.00564, test_loss=0.0253]
Epoch 60/250: 100%|██████████| 12/12 [00:21<00:00,  1.82s/it, loss=0.00557, test_loss=0.0248]


Macro: ER=0.72, F=0.12, LE=109.16, LR=0.20
Micro: ER=0.72, F=0.30, LE=27.25, LR=0.48


Epoch 61/250: 100%|██████████| 12/12 [00:21<00:00,  1.81s/it, loss=0.00561, test_loss=0.0252]
Epoch 62/250: 100%|██████████| 12/12 [00:22<00:00,  1.85s/it, loss=0.00556, test_loss=0.0245]
Epoch 63/250: 100%|██████████| 12/12 [00:22<00:00,  1.85s/it, loss=0.00556, test_loss=0.0248]
Epoch 64/250: 100%|██████████| 12/12 [00:21<00:00,  1.82s/it, loss=0.00547, test_loss=0.0247]
Epoch 65/250: 100%|██████████| 12/12 [00:21<00:00,  1.80s/it, loss=0.00541, test_loss=0.0247]
Epoch 66/250: 100%|██████████| 12/12 [00:21<00:00,  1.81s/it, loss=0.00537, test_loss=0.0246]
Epoch 67/250: 100%|██████████| 12/12 [00:21<00:00,  1.83s/it, loss=0.00536, test_loss=0.0248]
Epoch 68/250: 100%|██████████| 12/12 [00:21<00:00,  1.78s/it, loss=0.00526, test_loss=0.0247]
Epoch 69/250: 100%|██████████| 12/12 [00:21<00:00,  1.77s/it, loss=0.00519, test_loss=0.0248]
Epoch 70/250: 100%|██████████| 12/12 [00:21<00:00,  1.81s/it, loss=0.00513, test_loss=0.025]


Macro: ER=0.73, F=0.12, LE=96.79, LR=0.20
Micro: ER=0.73, F=0.29, LE=26.81, LR=0.48


Epoch 71/250: 100%|██████████| 12/12 [00:21<00:00,  1.83s/it, loss=0.00508, test_loss=0.0255]
Epoch 72/250: 100%|██████████| 12/12 [00:22<00:00,  1.86s/it, loss=0.00515, test_loss=0.0251]
Epoch 73/250: 100%|██████████| 12/12 [00:21<00:00,  1.82s/it, loss=0.00513, test_loss=0.024]
Epoch 74/250: 100%|██████████| 12/12 [00:21<00:00,  1.81s/it, loss=0.00504, test_loss=0.0251]
Epoch 75/250: 100%|██████████| 12/12 [00:21<00:00,  1.80s/it, loss=0.00495, test_loss=0.0248]
Epoch 76/250: 100%|██████████| 12/12 [00:21<00:00,  1.79s/it, loss=0.00497, test_loss=0.0243]
Epoch 77/250: 100%|██████████| 12/12 [00:21<00:00,  1.80s/it, loss=0.00494, test_loss=0.0243]
Epoch 78/250: 100%|██████████| 12/12 [00:22<00:00,  1.86s/it, loss=0.00495, test_loss=0.0249]
Epoch 79/250: 100%|██████████| 12/12 [00:21<00:00,  1.81s/it, loss=0.00487, test_loss=0.0249]
Epoch 80/250: 100%|██████████| 12/12 [00:22<00:00,  1.90s/it, loss=0.00484, test_loss=0.0254]


Macro: ER=0.73, F=0.12, LE=87.75, LR=0.21
Micro: ER=0.73, F=0.30, LE=26.89, LR=0.48


Epoch 81/250: 100%|██████████| 12/12 [00:22<00:00,  1.90s/it, loss=0.00482, test_loss=0.0242]
Epoch 82/250: 100%|██████████| 12/12 [00:22<00:00,  1.89s/it, loss=0.0048, test_loss=0.0248]
Epoch 83/250: 100%|██████████| 12/12 [00:22<00:00,  1.89s/it, loss=0.00478, test_loss=0.0253]
Epoch 84/250: 100%|██████████| 12/12 [00:22<00:00,  1.88s/it, loss=0.00477, test_loss=0.0251]
Epoch 85/250: 100%|██████████| 12/12 [00:22<00:00,  1.91s/it, loss=0.00469, test_loss=0.0252]
Epoch 86/250: 100%|██████████| 12/12 [00:22<00:00,  1.91s/it, loss=0.00473, test_loss=0.0251]
Epoch 87/250: 100%|██████████| 12/12 [00:22<00:00,  1.87s/it, loss=0.0046, test_loss=0.0248]
Epoch 88/250: 100%|██████████| 12/12 [00:22<00:00,  1.90s/it, loss=0.00454, test_loss=0.0247]
Epoch 89/250: 100%|██████████| 12/12 [00:22<00:00,  1.86s/it, loss=0.00444, test_loss=0.0252]
Epoch 90/250: 100%|██████████| 12/12 [00:22<00:00,  1.88s/it, loss=0.00454, test_loss=0.0249]


Macro: ER=0.72, F=0.12, LE=75.97, LR=0.21
Micro: ER=0.72, F=0.30, LE=25.99, LR=0.48


Epoch 91/250: 100%|██████████| 12/12 [00:22<00:00,  1.89s/it, loss=0.00452, test_loss=0.026]
Epoch 92/250: 100%|██████████| 12/12 [00:22<00:00,  1.91s/it, loss=0.00443, test_loss=0.0247]
Epoch 93/250: 100%|██████████| 12/12 [00:22<00:00,  1.88s/it, loss=0.00438, test_loss=0.0244]
Epoch 94/250: 100%|██████████| 12/12 [00:22<00:00,  1.89s/it, loss=0.0044, test_loss=0.0253]
Epoch 95/250: 100%|██████████| 12/12 [00:22<00:00,  1.91s/it, loss=0.00437, test_loss=0.0248]
Epoch 96/250: 100%|██████████| 12/12 [00:22<00:00,  1.85s/it, loss=0.00434, test_loss=0.0247]
Epoch 97/250: 100%|██████████| 12/12 [00:22<00:00,  1.88s/it, loss=0.00432, test_loss=0.0244]
Epoch 98/250: 100%|██████████| 12/12 [00:22<00:00,  1.89s/it, loss=0.00425, test_loss=0.0247]
Epoch 99/250: 100%|██████████| 12/12 [00:22<00:00,  1.87s/it, loss=0.00424, test_loss=0.0251]
Epoch 100/250: 100%|██████████| 12/12 [00:22<00:00,  1.89s/it, loss=0.00416, test_loss=0.0251]


Macro: ER=0.71, F=0.13, LE=77.63, LR=0.23
Micro: ER=0.71, F=0.32, LE=25.97, LR=0.50


Epoch 101/250: 100%|██████████| 12/12 [00:22<00:00,  1.89s/it, loss=0.00415, test_loss=0.026]
Epoch 102/250: 100%|██████████| 12/12 [00:23<00:00,  1.95s/it, loss=0.00417, test_loss=0.025]
Epoch 103/250: 100%|██████████| 12/12 [00:22<00:00,  1.91s/it, loss=0.00412, test_loss=0.0257]
Epoch 104/250: 100%|██████████| 12/12 [00:22<00:00,  1.88s/it, loss=0.0041, test_loss=0.0251]
Epoch 105/250: 100%|██████████| 12/12 [00:22<00:00,  1.92s/it, loss=0.00408, test_loss=0.0257]
Epoch 106/250: 100%|██████████| 12/12 [00:22<00:00,  1.89s/it, loss=0.0041, test_loss=0.0258]
Epoch 107/250: 100%|██████████| 12/12 [00:22<00:00,  1.91s/it, loss=0.00407, test_loss=0.0252]
Epoch 108/250: 100%|██████████| 12/12 [00:22<00:00,  1.90s/it, loss=0.00405, test_loss=0.0254]
Epoch 109/250: 100%|██████████| 12/12 [00:22<00:00,  1.91s/it, loss=0.00401, test_loss=0.0255]
Epoch 110/250: 100%|██████████| 12/12 [00:22<00:00,  1.90s/it, loss=0.0039, test_loss=0.0262]


Macro: ER=0.73, F=0.14, LE=64.71, LR=0.24
Micro: ER=0.73, F=0.30, LE=26.21, LR=0.50


Epoch 111/250: 100%|██████████| 12/12 [00:22<00:00,  1.89s/it, loss=0.00389, test_loss=0.0253]
Epoch 112/250: 100%|██████████| 12/12 [00:23<00:00,  1.93s/it, loss=0.00393, test_loss=0.0254]
Epoch 113/250: 100%|██████████| 12/12 [00:22<00:00,  1.90s/it, loss=0.00387, test_loss=0.0249]
Epoch 114/250: 100%|██████████| 12/12 [00:22<00:00,  1.90s/it, loss=0.00381, test_loss=0.0253]
Epoch 115/250: 100%|██████████| 12/12 [00:23<00:00,  1.93s/it, loss=0.00379, test_loss=0.0251]
Epoch 116/250: 100%|██████████| 12/12 [00:23<00:00,  1.92s/it, loss=0.00372, test_loss=0.0252]
Epoch 117/250: 100%|██████████| 12/12 [00:23<00:00,  1.98s/it, loss=0.00373, test_loss=0.0261]
Epoch 118/250: 100%|██████████| 12/12 [00:23<00:00,  1.97s/it, loss=0.00373, test_loss=0.0259]
Epoch 119/250: 100%|██████████| 12/12 [00:22<00:00,  1.92s/it, loss=0.00366, test_loss=0.0257]
Epoch 120/250: 100%|██████████| 12/12 [00:22<00:00,  1.90s/it, loss=0.00362, test_loss=0.0254]


Macro: ER=0.72, F=0.15, LE=63.84, LR=0.26
Micro: ER=0.72, F=0.32, LE=26.08, LR=0.51


Epoch 121/250: 100%|██████████| 12/12 [00:23<00:00,  1.93s/it, loss=0.00366, test_loss=0.0265]
Epoch 122/250: 100%|██████████| 12/12 [00:23<00:00,  1.95s/it, loss=0.00369, test_loss=0.026]
Epoch 123/250: 100%|██████████| 12/12 [00:22<00:00,  1.91s/it, loss=0.00364, test_loss=0.0254]
Epoch 124/250: 100%|██████████| 12/12 [00:22<00:00,  1.89s/it, loss=0.00362, test_loss=0.0258]
Epoch 125/250: 100%|██████████| 12/12 [00:23<00:00,  1.94s/it, loss=0.00357, test_loss=0.0257]
Epoch 126/250: 100%|██████████| 12/12 [00:22<00:00,  1.87s/it, loss=0.0035, test_loss=0.0257]
Epoch 127/250: 100%|██████████| 12/12 [00:22<00:00,  1.91s/it, loss=0.00355, test_loss=0.0255]
Epoch 128/250: 100%|██████████| 12/12 [00:23<00:00,  1.93s/it, loss=0.00348, test_loss=0.0262]
Epoch 129/250: 100%|██████████| 12/12 [00:22<00:00,  1.89s/it, loss=0.00346, test_loss=0.0255]
Epoch 130/250: 100%|██████████| 12/12 [00:22<00:00,  1.91s/it, loss=0.00344, test_loss=0.0256]


Macro: ER=0.73, F=0.15, LE=64.33, LR=0.27
Micro: ER=0.73, F=0.31, LE=26.57, LR=0.53


Epoch 131/250: 100%|██████████| 12/12 [00:23<00:00,  1.93s/it, loss=0.00342, test_loss=0.0258]
Epoch 132/250: 100%|██████████| 12/12 [00:23<00:00,  1.92s/it, loss=0.00338, test_loss=0.025]
Epoch 133/250: 100%|██████████| 12/12 [00:23<00:00,  1.96s/it, loss=0.00335, test_loss=0.0264]
Epoch 134/250: 100%|██████████| 12/12 [00:23<00:00,  1.94s/it, loss=0.00332, test_loss=0.0265]
Epoch 135/250: 100%|██████████| 12/12 [00:23<00:00,  1.95s/it, loss=0.00331, test_loss=0.026]
Epoch 136/250: 100%|██████████| 12/12 [00:22<00:00,  1.91s/it, loss=0.00329, test_loss=0.0261]
Epoch 137/250: 100%|██████████| 12/12 [00:23<00:00,  1.95s/it, loss=0.00327, test_loss=0.0269]
Epoch 138/250: 100%|██████████| 12/12 [00:23<00:00,  1.94s/it, loss=0.00329, test_loss=0.0263]
Epoch 139/250: 100%|██████████| 12/12 [00:23<00:00,  1.96s/it, loss=0.00326, test_loss=0.0268]
Epoch 140/250: 100%|██████████| 12/12 [00:22<00:00,  1.91s/it, loss=0.00326, test_loss=0.026]


Macro: ER=0.73, F=0.16, LE=53.97, LR=0.28
Micro: ER=0.73, F=0.32, LE=25.96, LR=0.50


Epoch 141/250: 100%|██████████| 12/12 [00:23<00:00,  1.93s/it, loss=0.00321, test_loss=0.0257]
Epoch 142/250: 100%|██████████| 12/12 [00:22<00:00,  1.90s/it, loss=0.00314, test_loss=0.0254]
Epoch 143/250: 100%|██████████| 12/12 [00:22<00:00,  1.88s/it, loss=0.00313, test_loss=0.0247]
Epoch 144/250: 100%|██████████| 12/12 [00:23<00:00,  1.93s/it, loss=0.00311, test_loss=0.0269]
Epoch 145/250: 100%|██████████| 12/12 [00:22<00:00,  1.89s/it, loss=0.00311, test_loss=0.026]
Epoch 146/250: 100%|██████████| 12/12 [00:23<00:00,  1.94s/it, loss=0.00313, test_loss=0.0269]
Epoch 147/250: 100%|██████████| 12/12 [00:23<00:00,  1.95s/it, loss=0.00307, test_loss=0.0261]
Epoch 148/250: 100%|██████████| 12/12 [00:23<00:00,  1.92s/it, loss=0.00306, test_loss=0.0264]
Epoch 149/250: 100%|██████████| 12/12 [00:22<00:00,  1.89s/it, loss=0.00302, test_loss=0.0263]
Epoch 150/250: 100%|██████████| 12/12 [00:22<00:00,  1.90s/it, loss=0.003, test_loss=0.026]


Macro: ER=0.73, F=0.14, LE=64.91, LR=0.27
Micro: ER=0.73, F=0.32, LE=26.16, LR=0.51


Epoch 151/250: 100%|██████████| 12/12 [00:23<00:00,  1.98s/it, loss=0.00298, test_loss=0.0258]
Epoch 152/250: 100%|██████████| 12/12 [00:24<00:00,  2.05s/it, loss=0.00297, test_loss=0.0266]
Epoch 153/250: 100%|██████████| 12/12 [00:24<00:00,  2.01s/it, loss=0.00294, test_loss=0.0257]
Epoch 154/250: 100%|██████████| 12/12 [00:24<00:00,  2.02s/it, loss=0.00294, test_loss=0.0262]
Epoch 155/250: 100%|██████████| 12/12 [00:24<00:00,  2.01s/it, loss=0.00294, test_loss=0.0266]
Epoch 156/250: 100%|██████████| 12/12 [00:24<00:00,  2.00s/it, loss=0.00291, test_loss=0.0263]
Epoch 157/250: 100%|██████████| 12/12 [00:24<00:00,  2.03s/it, loss=0.00294, test_loss=0.0268]
Epoch 158/250: 100%|██████████| 12/12 [00:24<00:00,  2.03s/it, loss=0.00295, test_loss=0.0271]
Epoch 159/250: 100%|██████████| 12/12 [00:24<00:00,  2.04s/it, loss=0.00278, test_loss=0.0272]
Epoch 160/250: 100%|██████████| 12/12 [00:24<00:00,  2.03s/it, loss=0.0028, test_loss=0.0261]


Macro: ER=0.73, F=0.15, LE=64.85, LR=0.29
Micro: ER=0.73, F=0.31, LE=26.59, LR=0.52


Epoch 161/250: 100%|██████████| 12/12 [00:23<00:00,  1.97s/it, loss=0.00286, test_loss=0.0259]
Epoch 162/250: 100%|██████████| 12/12 [00:23<00:00,  1.98s/it, loss=0.00285, test_loss=0.0265]
Epoch 163/250: 100%|██████████| 12/12 [00:23<00:00,  1.97s/it, loss=0.00289, test_loss=0.0258]
Epoch 164/250: 100%|██████████| 12/12 [00:23<00:00,  1.98s/it, loss=0.0028, test_loss=0.0262]
Epoch 165/250: 100%|██████████| 12/12 [00:23<00:00,  1.97s/it, loss=0.00272, test_loss=0.0262]
Epoch 166/250: 100%|██████████| 12/12 [00:23<00:00,  1.97s/it, loss=0.00274, test_loss=0.0273]
Epoch 167/250: 100%|██████████| 12/12 [00:23<00:00,  1.92s/it, loss=0.00274, test_loss=0.0262]
Epoch 168/250: 100%|██████████| 12/12 [00:23<00:00,  1.93s/it, loss=0.00272, test_loss=0.0277]
Epoch 169/250: 100%|██████████| 12/12 [00:22<00:00,  1.90s/it, loss=0.00275, test_loss=0.0262]
Epoch 170/250: 100%|██████████| 12/12 [00:21<00:00,  1.83s/it, loss=0.00272, test_loss=0.027]


Macro: ER=0.75, F=0.17, LE=52.19, LR=0.31
Micro: ER=0.75, F=0.31, LE=26.58, LR=0.53


Epoch 171/250: 100%|██████████| 12/12 [00:21<00:00,  1.82s/it, loss=0.00272, test_loss=0.026]
Epoch 172/250: 100%|██████████| 12/12 [00:22<00:00,  1.86s/it, loss=0.00279, test_loss=0.0266]
Epoch 173/250: 100%|██████████| 12/12 [00:22<00:00,  1.85s/it, loss=0.00274, test_loss=0.0263]
Epoch 174/250: 100%|██████████| 12/12 [00:21<00:00,  1.82s/it, loss=0.00267, test_loss=0.0264]
Epoch 175/250: 100%|██████████| 12/12 [00:22<00:00,  1.86s/it, loss=0.00264, test_loss=0.0264]
Epoch 176/250: 100%|██████████| 12/12 [00:22<00:00,  1.84s/it, loss=0.00265, test_loss=0.027]
Epoch 177/250: 100%|██████████| 12/12 [00:22<00:00,  1.88s/it, loss=0.0026, test_loss=0.0271]
Epoch 178/250: 100%|██████████| 12/12 [00:22<00:00,  1.86s/it, loss=0.00257, test_loss=0.0265]
Epoch 179/250: 100%|██████████| 12/12 [00:22<00:00,  1.86s/it, loss=0.00257, test_loss=0.0264]
Epoch 180/250: 100%|██████████| 12/12 [00:22<00:00,  1.88s/it, loss=0.00254, test_loss=0.027]


Macro: ER=0.76, F=0.17, LE=51.59, LR=0.31
Micro: ER=0.76, F=0.31, LE=26.87, LR=0.53


Epoch 181/250: 100%|██████████| 12/12 [00:22<00:00,  1.86s/it, loss=0.00249, test_loss=0.0262]
Epoch 182/250: 100%|██████████| 12/12 [00:22<00:00,  1.89s/it, loss=0.00246, test_loss=0.0268]
Epoch 183/250: 100%|██████████| 12/12 [00:22<00:00,  1.87s/it, loss=0.00251, test_loss=0.0271]
Epoch 184/250: 100%|██████████| 12/12 [00:22<00:00,  1.87s/it, loss=0.00252, test_loss=0.0271]
Epoch 185/250: 100%|██████████| 12/12 [00:22<00:00,  1.86s/it, loss=0.00247, test_loss=0.0267]
Epoch 186/250: 100%|██████████| 12/12 [00:22<00:00,  1.87s/it, loss=0.00243, test_loss=0.0276]
Epoch 187/250: 100%|██████████| 12/12 [00:22<00:00,  1.86s/it, loss=0.00244, test_loss=0.0267]
Epoch 188/250: 100%|██████████| 12/12 [00:22<00:00,  1.92s/it, loss=0.0024, test_loss=0.0272]
Epoch 189/250: 100%|██████████| 12/12 [00:22<00:00,  1.88s/it, loss=0.0024, test_loss=0.0275]
Epoch 190/250: 100%|██████████| 12/12 [00:22<00:00,  1.88s/it, loss=0.00241, test_loss=0.0269]


Macro: ER=0.76, F=0.17, LE=52.40, LR=0.32
Micro: ER=0.76, F=0.31, LE=26.90, LR=0.53


Epoch 191/250: 100%|██████████| 12/12 [00:22<00:00,  1.87s/it, loss=0.0024, test_loss=0.0275]
Epoch 192/250: 100%|██████████| 12/12 [00:22<00:00,  1.88s/it, loss=0.00236, test_loss=0.0274]
Epoch 193/250: 100%|██████████| 12/12 [00:21<00:00,  1.83s/it, loss=0.00242, test_loss=0.0267]
Epoch 194/250: 100%|██████████| 12/12 [00:21<00:00,  1.83s/it, loss=0.00245, test_loss=0.0272]
Epoch 195/250: 100%|██████████| 12/12 [00:22<00:00,  1.87s/it, loss=0.00239, test_loss=0.0269]
Epoch 196/250: 100%|██████████| 12/12 [00:22<00:00,  1.84s/it, loss=0.00233, test_loss=0.0266]
Epoch 197/250: 100%|██████████| 12/12 [00:22<00:00,  1.90s/it, loss=0.00234, test_loss=0.028]
Epoch 198/250: 100%|██████████| 12/12 [00:22<00:00,  1.84s/it, loss=0.00232, test_loss=0.0262]
Epoch 199/250: 100%|██████████| 12/12 [00:22<00:00,  1.87s/it, loss=0.00233, test_loss=0.0278]
Epoch 200/250: 100%|██████████| 12/12 [00:22<00:00,  1.86s/it, loss=0.00239, test_loss=0.0268]


Macro: ER=0.75, F=0.16, LE=51.91, LR=0.29
Micro: ER=0.75, F=0.31, LE=27.09, LR=0.53


Epoch 201/250: 100%|██████████| 12/12 [00:22<00:00,  1.85s/it, loss=0.00235, test_loss=0.0263]
Epoch 202/250: 100%|██████████| 12/12 [00:22<00:00,  1.88s/it, loss=0.00227, test_loss=0.0272]
Epoch 203/250: 100%|██████████| 12/12 [00:22<00:00,  1.84s/it, loss=0.00224, test_loss=0.0265]
Epoch 204/250: 100%|██████████| 12/12 [00:22<00:00,  1.87s/it, loss=0.00221, test_loss=0.0274]
Epoch 205/250: 100%|██████████| 12/12 [00:22<00:00,  1.86s/it, loss=0.00221, test_loss=0.0267]
Epoch 206/250: 100%|██████████| 12/12 [00:22<00:00,  1.87s/it, loss=0.00221, test_loss=0.0272]
Epoch 207/250: 100%|██████████| 12/12 [00:22<00:00,  1.89s/it, loss=0.0022, test_loss=0.0273]
Epoch 208/250: 100%|██████████| 12/12 [00:22<00:00,  1.89s/it, loss=0.0022, test_loss=0.0281]
Epoch 209/250: 100%|██████████| 12/12 [00:22<00:00,  1.86s/it, loss=0.00219, test_loss=0.0267]
Epoch 210/250: 100%|██████████| 12/12 [00:22<00:00,  1.90s/it, loss=0.00219, test_loss=0.0273]


Macro: ER=0.77, F=0.16, LE=52.67, LR=0.32
Micro: ER=0.77, F=0.30, LE=28.05, LR=0.54


Epoch 211/250: 100%|██████████| 12/12 [00:22<00:00,  1.86s/it, loss=0.00215, test_loss=0.0269]
Epoch 212/250: 100%|██████████| 12/12 [00:22<00:00,  1.86s/it, loss=0.00214, test_loss=0.0274]
Epoch 213/250: 100%|██████████| 12/12 [00:22<00:00,  1.90s/it, loss=0.00213, test_loss=0.028]
Epoch 214/250: 100%|██████████| 12/12 [00:22<00:00,  1.85s/it, loss=0.00211, test_loss=0.0274]
Epoch 215/250: 100%|██████████| 12/12 [00:22<00:00,  1.85s/it, loss=0.0021, test_loss=0.0275]
Epoch 216/250: 100%|██████████| 12/12 [00:22<00:00,  1.87s/it, loss=0.00207, test_loss=0.0274]
Epoch 217/250: 100%|██████████| 12/12 [00:22<00:00,  1.85s/it, loss=0.0021, test_loss=0.0264]
Epoch 218/250: 100%|██████████| 12/12 [00:22<00:00,  1.87s/it, loss=0.00213, test_loss=0.0272]
Epoch 219/250: 100%|██████████| 12/12 [00:22<00:00,  1.87s/it, loss=0.00215, test_loss=0.0279]
Epoch 220/250: 100%|██████████| 12/12 [00:22<00:00,  1.88s/it, loss=0.00214, test_loss=0.0278]


Macro: ER=0.78, F=0.17, LE=52.43, LR=0.32
Micro: ER=0.78, F=0.29, LE=27.31, LR=0.51


Epoch 221/250: 100%|██████████| 12/12 [00:22<00:00,  1.88s/it, loss=0.00204, test_loss=0.0271]
Epoch 222/250: 100%|██████████| 12/12 [00:24<00:00,  2.07s/it, loss=0.00206, test_loss=0.0276]
Epoch 223/250: 100%|██████████| 12/12 [00:24<00:00,  2.02s/it, loss=0.00204, test_loss=0.0273]
Epoch 224/250: 100%|██████████| 12/12 [00:23<00:00,  1.99s/it, loss=0.00206, test_loss=0.0264]
Epoch 225/250: 100%|██████████| 12/12 [00:24<00:00,  2.00s/it, loss=0.00204, test_loss=0.0274]
Epoch 226/250: 100%|██████████| 12/12 [00:23<00:00,  1.99s/it, loss=0.00201, test_loss=0.0276]
Epoch 227/250: 100%|██████████| 12/12 [00:23<00:00,  1.98s/it, loss=0.00202, test_loss=0.0281]
Epoch 228/250: 100%|██████████| 12/12 [00:23<00:00,  1.96s/it, loss=0.00201, test_loss=0.0259]
Epoch 229/250: 100%|██████████| 12/12 [00:24<00:00,  2.00s/it, loss=0.00199, test_loss=0.0274]
Epoch 230/250: 100%|██████████| 12/12 [00:23<00:00,  1.96s/it, loss=0.002, test_loss=0.027]


Macro: ER=0.76, F=0.18, LE=51.75, LR=0.32
Micro: ER=0.76, F=0.31, LE=26.68, LR=0.51


Epoch 231/250: 100%|██████████| 12/12 [00:23<00:00,  1.98s/it, loss=0.00195, test_loss=0.027]
Epoch 232/250: 100%|██████████| 12/12 [00:23<00:00,  1.95s/it, loss=0.00196, test_loss=0.026]
Epoch 233/250: 100%|██████████| 12/12 [00:23<00:00,  1.96s/it, loss=0.00193, test_loss=0.0274]
Epoch 234/250: 100%|██████████| 12/12 [00:23<00:00,  1.99s/it, loss=0.00191, test_loss=0.0271]
Epoch 235/250: 100%|██████████| 12/12 [00:24<00:00,  2.03s/it, loss=0.0019, test_loss=0.0277]
Epoch 236/250: 100%|██████████| 12/12 [00:23<00:00,  1.95s/it, loss=0.00194, test_loss=0.0276]
Epoch 237/250: 100%|██████████| 12/12 [00:22<00:00,  1.90s/it, loss=0.00194, test_loss=0.0273]
Epoch 238/250: 100%|██████████| 12/12 [00:23<00:00,  1.93s/it, loss=0.0019, test_loss=0.0278]
Epoch 239/250: 100%|██████████| 12/12 [00:23<00:00,  1.92s/it, loss=0.00191, test_loss=0.0279]
Epoch 240/250: 100%|██████████| 12/12 [00:23<00:00,  1.95s/it, loss=0.00189, test_loss=0.0275]


Macro: ER=0.77, F=0.18, LE=52.17, LR=0.32
Micro: ER=0.77, F=0.31, LE=27.34, LR=0.53


Epoch 241/250: 100%|██████████| 12/12 [00:23<00:00,  1.95s/it, loss=0.00191, test_loss=0.0278]
Epoch 242/250: 100%|██████████| 12/12 [00:22<00:00,  1.91s/it, loss=0.0019, test_loss=0.0272]
Epoch 243/250: 100%|██████████| 12/12 [00:23<00:00,  1.92s/it, loss=0.00186, test_loss=0.0277]
Epoch 244/250: 100%|██████████| 12/12 [00:22<00:00,  1.90s/it, loss=0.00188, test_loss=0.0267]
Epoch 245/250: 100%|██████████| 12/12 [00:22<00:00,  1.90s/it, loss=0.00183, test_loss=0.0272]
Epoch 246/250: 100%|██████████| 12/12 [00:23<00:00,  1.97s/it, loss=0.00182, test_loss=0.027]
Epoch 247/250: 100%|██████████| 12/12 [00:23<00:00,  1.95s/it, loss=0.0018, test_loss=0.0269]
Epoch 248/250: 100%|██████████| 12/12 [00:23<00:00,  1.99s/it, loss=0.00178, test_loss=0.0271]
Epoch 249/250: 100%|██████████| 12/12 [00:24<00:00,  2.02s/it, loss=0.00179, test_loss=0.0274]
Epoch 250/250: 100%|██████████| 12/12 [00:24<00:00,  2.01s/it, loss=0.00177, test_loss=0.0277]

Macro: ER=0.77, F=0.16, LE=52.54, LR=0.30
Micro: ER=0.77, F=0.30, LE=27.86, LR=0.52
Micro @ epoch 221: ER=0.76, F=0.18, LE=52.33, LR=0.33
Macro @ epoch 221: ER=0.76, F=0.31, LE=27.10, LR=0.53





### Data augmentation


In [None]:
# Data-augmentation experiment: train the SELDNet-backbone multi-task model on
# the augmented training set and store the resulting weights on disk.
#
# NOTE(review): in the recorded output of this notebook, the final
# "Micro @ epoch N" line carries values that match the periodic "Macro" reports
# and the "Macro @ epoch N" line matches the "Micro" reports, so the labels of
# the best-epoch summary printed by train_model look swapped -- confirm in
# multi_task.train_model before quoting those numbers.
model_args = dict(
    backbone='seldnet',
    num_classes=NUM_CLASSES,
    num_events=MAX_EVENTS,
    input_dim=7,
    hidden_dim=64,
    dropout=0.05,
    rnn_layers=2,
    mhsa_layers=2,
)

# Augmentation ids 0..7 are requested; what each id does is defined in
# datasets.create_dataloaders (not visible here). In the recorded run this
# yields 95 batches per epoch, versus 12 for the runs without `augments`.
train_dataloader, test_dataloader = create_dataloaders(
    BATCH_SIZE,
    augments=list(range(8)),
)

# sde_weight=0.0 presumably switches off the distance-estimation loss term
# (the "Distance estimation" section uses 0.5) -- TODO confirm in multi_task.
model = train_model(
    model_args, train_dataloader, test_dataloader,
    epochs=40, device=device, sde_weight=0.0,
)

# Only the state_dict is written, so loading it back requires rebuilding the
# model from the same `model_args`.
torch.save(model.state_dict(), 'data/seldnet_augmented.pth')

Epoch 1/40: 100%|██████████| 95/95 [02:31<00:00,  1.60s/it, loss=0.0302, test_loss=0.0282]
Epoch 2/40: 100%|██████████| 95/95 [02:29<00:00,  1.58s/it, loss=0.0205, test_loss=0.028]
Epoch 3/40: 100%|██████████| 95/95 [02:26<00:00,  1.54s/it, loss=0.0158, test_loss=0.0259]
Epoch 4/40: 100%|██████████| 95/95 [02:26<00:00,  1.54s/it, loss=0.013, test_loss=0.0229]
Epoch 5/40: 100%|██████████| 95/95 [02:26<00:00,  1.54s/it, loss=0.0113, test_loss=0.024]
Epoch 6/40: 100%|██████████| 95/95 [02:28<00:00,  1.57s/it, loss=0.01, test_loss=0.0239]
Epoch 7/40: 100%|██████████| 95/95 [02:25<00:00,  1.53s/it, loss=0.00936, test_loss=0.0231]
Epoch 8/40: 100%|██████████| 95/95 [02:24<00:00,  1.52s/it, loss=0.00865, test_loss=0.0205]
Epoch 9/40: 100%|██████████| 95/95 [02:25<00:00,  1.53s/it, loss=0.00821, test_loss=0.023]
Epoch 10/40: 100%|██████████| 95/95 [02:24<00:00,  1.52s/it, loss=0.0078, test_loss=0.0215]


Macro: ER=0.68, F=0.13, LE=120.42, LR=0.21
Micro: ER=0.68, F=0.34, LE=25.36, LR=0.53


Epoch 11/40: 100%|██████████| 95/95 [02:24<00:00,  1.52s/it, loss=0.00746, test_loss=0.0203]
Epoch 12/40: 100%|██████████| 95/95 [02:24<00:00,  1.52s/it, loss=0.00727, test_loss=0.0205]
Epoch 13/40: 100%|██████████| 95/95 [02:23<00:00,  1.51s/it, loss=0.00692, test_loss=0.0205]
Epoch 14/40: 100%|██████████| 95/95 [02:22<00:00,  1.49s/it, loss=0.00678, test_loss=0.0214]
Epoch 15/40: 100%|██████████| 95/95 [02:17<00:00,  1.45s/it, loss=0.00659, test_loss=0.0201]
Epoch 16/40: 100%|██████████| 95/95 [02:22<00:00,  1.50s/it, loss=0.00642, test_loss=0.0203]
Epoch 17/40: 100%|██████████| 95/95 [02:23<00:00,  1.51s/it, loss=0.00638, test_loss=0.0218]
Epoch 18/40: 100%|██████████| 95/95 [02:24<00:00,  1.52s/it, loss=0.00619, test_loss=0.0193]
Epoch 19/40: 100%|██████████| 95/95 [02:25<00:00,  1.53s/it, loss=0.00605, test_loss=0.02]
Epoch 20/40: 100%|██████████| 95/95 [02:26<00:00,  1.54s/it, loss=0.00591, test_loss=0.021]


Macro: ER=0.66, F=0.15, LE=118.57, LR=0.23
Micro: ER=0.66, F=0.39, LE=21.51, LR=0.56


Epoch 21/40: 100%|██████████| 95/95 [02:26<00:00,  1.54s/it, loss=0.0058, test_loss=0.0193]
Epoch 22/40: 100%|██████████| 95/95 [02:26<00:00,  1.54s/it, loss=0.00572, test_loss=0.0207]
Epoch 23/40: 100%|██████████| 95/95 [02:26<00:00,  1.54s/it, loss=0.0056, test_loss=0.0194]
Epoch 24/40: 100%|██████████| 95/95 [02:24<00:00,  1.52s/it, loss=0.00554, test_loss=0.0186]
Epoch 25/40: 100%|██████████| 95/95 [02:25<00:00,  1.53s/it, loss=0.00545, test_loss=0.0202]
Epoch 26/40: 100%|██████████| 95/95 [02:27<00:00,  1.55s/it, loss=0.0053, test_loss=0.0202]
Epoch 27/40: 100%|██████████| 95/95 [02:27<00:00,  1.55s/it, loss=0.00526, test_loss=0.0208]
Epoch 28/40: 100%|██████████| 95/95 [02:26<00:00,  1.54s/it, loss=0.00521, test_loss=0.0216]
Epoch 29/40: 100%|██████████| 95/95 [02:22<00:00,  1.50s/it, loss=0.00503, test_loss=0.0194]
Epoch 30/40: 100%|██████████| 95/95 [02:22<00:00,  1.50s/it, loss=0.00493, test_loss=0.0212]


Macro: ER=0.65, F=0.16, LE=108.72, LR=0.25
Micro: ER=0.65, F=0.40, LE=24.21, LR=0.60


Epoch 31/40: 100%|██████████| 95/95 [02:22<00:00,  1.50s/it, loss=0.0048, test_loss=0.0207]
Epoch 32/40: 100%|██████████| 95/95 [02:23<00:00,  1.51s/it, loss=0.00474, test_loss=0.0198]
Epoch 33/40: 100%|██████████| 95/95 [02:22<00:00,  1.50s/it, loss=0.00463, test_loss=0.0201]
Epoch 34/40: 100%|██████████| 95/95 [02:22<00:00,  1.50s/it, loss=0.00457, test_loss=0.0208]
Epoch 35/40: 100%|██████████| 95/95 [02:22<00:00,  1.50s/it, loss=0.00456, test_loss=0.0245]
Epoch 36/40: 100%|██████████| 95/95 [02:22<00:00,  1.50s/it, loss=0.00476, test_loss=0.0199]
Epoch 37/40: 100%|██████████| 95/95 [02:22<00:00,  1.50s/it, loss=0.00434, test_loss=0.0197]
Epoch 38/40: 100%|██████████| 95/95 [02:21<00:00,  1.49s/it, loss=0.00425, test_loss=0.0201]
Epoch 39/40: 100%|██████████| 95/95 [02:23<00:00,  1.51s/it, loss=0.00448, test_loss=0.0205]
Epoch 40/40: 100%|██████████| 95/95 [02:23<00:00,  1.51s/it, loss=0.00412, test_loss=0.0201]

Macro: ER=0.64, F=0.19, LE=49.90, LR=0.32
Micro: ER=0.64, F=0.41, LE=22.30, LR=0.62
Micro @ epoch 37: ER=0.62, F=0.21, LE=48.73, LR=0.30
Macro @ epoch 37: ER=0.62, F=0.44, LE=19.54, LR=0.58





### Distance estimation


In [6]:
# Distance-estimation experiment: same SELDNet-backbone configuration as the
# other runs, trained on the default (non-augmented) loaders with a non-zero
# sde_weight.
model_args = dict(
    backbone='seldnet',
    num_classes=NUM_CLASSES,
    num_events=MAX_EVENTS,
    input_dim=7,
    hidden_dim=64,
    dropout=0.05,
    rnn_layers=2,
    mhsa_layers=2,
)

train_dataloader, test_dataloader = create_dataloaders(BATCH_SIZE)

# sde_weight=0.5 presumably weights the distance-estimation loss term against
# the remaining objectives -- TODO confirm in multi_task.train_model. The
# recorded losses for this run are roughly an order of magnitude larger than
# in the sde_weight=0.0 runs, so loss values are not comparable across them.
#
# NOTE(review): unlike the data-augmentation cell, this cell does not save
# model.state_dict(); the weights from this 250-epoch run exist only in the
# live kernel unless a later cell persists them.
model = train_model(
    model_args, train_dataloader, test_dataloader,
    epochs=250, device=device, sde_weight=0.5,
)

Epoch 1/250: 100%|██████████| 12/12 [00:16<00:00,  1.41s/it, loss=0.152, test_loss=0.183]
Epoch 2/250: 100%|██████████| 12/12 [00:17<00:00,  1.46s/it, loss=0.11, test_loss=0.257]
Epoch 3/250: 100%|██████████| 12/12 [00:17<00:00,  1.49s/it, loss=0.0891, test_loss=0.152]
Epoch 4/250: 100%|██████████| 12/12 [00:16<00:00,  1.41s/it, loss=0.0781, test_loss=0.136]
Epoch 5/250: 100%|██████████| 12/12 [00:18<00:00,  1.57s/it, loss=0.0734, test_loss=0.178]
Epoch 6/250: 100%|██████████| 12/12 [00:18<00:00,  1.53s/it, loss=0.0676, test_loss=0.14]
Epoch 7/250: 100%|██████████| 12/12 [00:19<00:00,  1.59s/it, loss=0.0632, test_loss=0.14]
Epoch 8/250: 100%|██████████| 12/12 [00:20<00:00,  1.73s/it, loss=0.0612, test_loss=0.146]
Epoch 9/250: 100%|██████████| 12/12 [00:21<00:00,  1.76s/it, loss=0.0597, test_loss=0.151]
Epoch 10/250: 100%|██████████| 12/12 [00:20<00:00,  1.68s/it, loss=0.0582, test_loss=0.138]


Macro: ER=0.87, F=0.03, LE=136.22, LR=0.13
Micro: ER=0.87, F=0.09, LE=38.82, LR=0.26


Epoch 11/250: 100%|██████████| 12/12 [00:20<00:00,  1.72s/it, loss=0.0556, test_loss=0.138]
Epoch 12/250: 100%|██████████| 12/12 [00:21<00:00,  1.77s/it, loss=0.0536, test_loss=0.15]
Epoch 13/250: 100%|██████████| 12/12 [00:20<00:00,  1.71s/it, loss=0.0532, test_loss=0.124]
Epoch 14/250: 100%|██████████| 12/12 [00:21<00:00,  1.80s/it, loss=0.0514, test_loss=0.131]
Epoch 15/250: 100%|██████████| 12/12 [00:21<00:00,  1.81s/it, loss=0.0505, test_loss=0.128]
Epoch 16/250: 100%|██████████| 12/12 [00:21<00:00,  1.82s/it, loss=0.0489, test_loss=0.138]
Epoch 17/250: 100%|██████████| 12/12 [00:21<00:00,  1.78s/it, loss=0.0476, test_loss=0.13]
Epoch 18/250: 100%|██████████| 12/12 [00:21<00:00,  1.82s/it, loss=0.0463, test_loss=0.133]
Epoch 19/250: 100%|██████████| 12/12 [00:21<00:00,  1.81s/it, loss=0.0456, test_loss=0.141]
Epoch 20/250: 100%|██████████| 12/12 [00:21<00:00,  1.75s/it, loss=0.0447, test_loss=0.128]


Macro: ER=0.81, F=0.06, LE=136.30, LR=0.18
Micro: ER=0.81, F=0.16, LE=38.13, LR=0.41


Epoch 21/250: 100%|██████████| 12/12 [00:22<00:00,  1.85s/it, loss=0.0441, test_loss=0.142]
Epoch 22/250: 100%|██████████| 12/12 [00:21<00:00,  1.83s/it, loss=0.0439, test_loss=0.14]
Epoch 23/250: 100%|██████████| 12/12 [00:21<00:00,  1.79s/it, loss=0.0435, test_loss=0.128]
Epoch 24/250: 100%|██████████| 12/12 [00:21<00:00,  1.82s/it, loss=0.0433, test_loss=0.135]
Epoch 25/250: 100%|██████████| 12/12 [00:21<00:00,  1.82s/it, loss=0.0427, test_loss=0.133]
Epoch 26/250: 100%|██████████| 12/12 [00:21<00:00,  1.81s/it, loss=0.0424, test_loss=0.129]
Epoch 27/250: 100%|██████████| 12/12 [00:21<00:00,  1.81s/it, loss=0.0419, test_loss=0.126]
Epoch 28/250: 100%|██████████| 12/12 [00:22<00:00,  1.84s/it, loss=0.0421, test_loss=0.128]
Epoch 29/250: 100%|██████████| 12/12 [00:21<00:00,  1.82s/it, loss=0.0414, test_loss=0.128]
Epoch 30/250: 100%|██████████| 12/12 [00:22<00:00,  1.85s/it, loss=0.0409, test_loss=0.133]


Macro: ER=0.81, F=0.07, LE=126.58, LR=0.21
Micro: ER=0.81, F=0.20, LE=37.91, LR=0.50


Epoch 31/250: 100%|██████████| 12/12 [00:21<00:00,  1.82s/it, loss=0.0405, test_loss=0.127]
Epoch 32/250: 100%|██████████| 12/12 [00:22<00:00,  1.84s/it, loss=0.0404, test_loss=0.129]
Epoch 33/250: 100%|██████████| 12/12 [00:22<00:00,  1.84s/it, loss=0.0399, test_loss=0.132]
Epoch 34/250: 100%|██████████| 12/12 [00:22<00:00,  1.85s/it, loss=0.0388, test_loss=0.132]
Epoch 35/250: 100%|██████████| 12/12 [00:21<00:00,  1.80s/it, loss=0.0383, test_loss=0.126]
Epoch 36/250: 100%|██████████| 12/12 [00:22<00:00,  1.86s/it, loss=0.0355, test_loss=0.123]
Epoch 37/250: 100%|██████████| 12/12 [00:21<00:00,  1.82s/it, loss=0.0339, test_loss=0.124]
Epoch 38/250: 100%|██████████| 12/12 [00:22<00:00,  1.86s/it, loss=0.0336, test_loss=0.126]
Epoch 39/250: 100%|██████████| 12/12 [00:22<00:00,  1.86s/it, loss=0.033, test_loss=0.122]
Epoch 40/250: 100%|██████████| 12/12 [00:22<00:00,  1.86s/it, loss=0.0328, test_loss=0.123]


Macro: ER=0.80, F=0.07, LE=126.84, LR=0.21
Micro: ER=0.80, F=0.20, LE=38.63, LR=0.50


Epoch 41/250: 100%|██████████| 12/12 [00:22<00:00,  1.87s/it, loss=0.0326, test_loss=0.132]
Epoch 42/250: 100%|██████████| 12/12 [00:22<00:00,  1.86s/it, loss=0.0321, test_loss=0.127]
Epoch 43/250: 100%|██████████| 12/12 [00:22<00:00,  1.83s/it, loss=0.0317, test_loss=0.132]
Epoch 44/250: 100%|██████████| 12/12 [00:21<00:00,  1.79s/it, loss=0.0316, test_loss=0.132]
Epoch 45/250: 100%|██████████| 12/12 [00:21<00:00,  1.76s/it, loss=0.0311, test_loss=0.133]
Epoch 46/250: 100%|██████████| 12/12 [00:21<00:00,  1.76s/it, loss=0.0309, test_loss=0.128]
Epoch 47/250: 100%|██████████| 12/12 [00:21<00:00,  1.76s/it, loss=0.0306, test_loss=0.131]
Epoch 48/250: 100%|██████████| 12/12 [00:21<00:00,  1.79s/it, loss=0.0302, test_loss=0.136]
Epoch 49/250: 100%|██████████| 12/12 [00:21<00:00,  1.75s/it, loss=0.0298, test_loss=0.125]
Epoch 50/250: 100%|██████████| 12/12 [00:21<00:00,  1.78s/it, loss=0.0296, test_loss=0.131]


Macro: ER=0.80, F=0.07, LE=128.12, LR=0.21
Micro: ER=0.80, F=0.22, LE=38.55, LR=0.50


Epoch 51/250: 100%|██████████| 12/12 [00:21<00:00,  1.79s/it, loss=0.0292, test_loss=0.135]
Epoch 52/250: 100%|██████████| 12/12 [00:21<00:00,  1.77s/it, loss=0.029, test_loss=0.128]
Epoch 53/250: 100%|██████████| 12/12 [00:21<00:00,  1.76s/it, loss=0.0287, test_loss=0.134]
Epoch 54/250: 100%|██████████| 12/12 [00:20<00:00,  1.75s/it, loss=0.0285, test_loss=0.13]
Epoch 55/250: 100%|██████████| 12/12 [00:21<00:00,  1.76s/it, loss=0.0284, test_loss=0.132]
Epoch 56/250: 100%|██████████| 12/12 [00:21<00:00,  1.77s/it, loss=0.0278, test_loss=0.128]
Epoch 57/250: 100%|██████████| 12/12 [00:21<00:00,  1.75s/it, loss=0.0275, test_loss=0.126]
Epoch 58/250: 100%|██████████| 12/12 [00:21<00:00,  1.78s/it, loss=0.0279, test_loss=0.138]
Epoch 59/250: 100%|██████████| 12/12 [00:21<00:00,  1.76s/it, loss=0.0278, test_loss=0.131]
Epoch 60/250: 100%|██████████| 12/12 [00:21<00:00,  1.80s/it, loss=0.0275, test_loss=0.135]


Macro: ER=0.81, F=0.08, LE=118.08, LR=0.22
Micro: ER=0.81, F=0.22, LE=38.17, LR=0.52


Epoch 61/250: 100%|██████████| 12/12 [00:20<00:00,  1.74s/it, loss=0.0271, test_loss=0.13]
Epoch 62/250: 100%|██████████| 12/12 [00:21<00:00,  1.79s/it, loss=0.0264, test_loss=0.129]
Epoch 63/250: 100%|██████████| 12/12 [00:21<00:00,  1.78s/it, loss=0.0265, test_loss=0.132]
Epoch 64/250: 100%|██████████| 12/12 [00:21<00:00,  1.80s/it, loss=0.0268, test_loss=0.139]
Epoch 65/250: 100%|██████████| 12/12 [00:20<00:00,  1.75s/it, loss=0.0264, test_loss=0.132]
Epoch 66/250: 100%|██████████| 12/12 [00:21<00:00,  1.77s/it, loss=0.0257, test_loss=0.126]
Epoch 67/250: 100%|██████████| 12/12 [00:21<00:00,  1.78s/it, loss=0.0255, test_loss=0.13]
Epoch 68/250: 100%|██████████| 12/12 [00:21<00:00,  1.78s/it, loss=0.0252, test_loss=0.133]
Epoch 69/250: 100%|██████████| 12/12 [00:21<00:00,  1.81s/it, loss=0.0256, test_loss=0.135]
Epoch 70/250: 100%|██████████| 12/12 [00:21<00:00,  1.77s/it, loss=0.0256, test_loss=0.132]


Macro: ER=0.80, F=0.08, LE=120.23, LR=0.22
Micro: ER=0.80, F=0.22, LE=37.93, LR=0.52


Epoch 71/250: 100%|██████████| 12/12 [00:21<00:00,  1.79s/it, loss=0.0254, test_loss=0.141]
Epoch 72/250: 100%|██████████| 12/12 [00:21<00:00,  1.78s/it, loss=0.0247, test_loss=0.128]
Epoch 73/250: 100%|██████████| 12/12 [00:22<00:00,  1.86s/it, loss=0.0248, test_loss=0.132]
Epoch 74/250: 100%|██████████| 12/12 [00:22<00:00,  1.90s/it, loss=0.0244, test_loss=0.127]
Epoch 75/250: 100%|██████████| 12/12 [00:22<00:00,  1.86s/it, loss=0.0244, test_loss=0.123]
Epoch 76/250: 100%|██████████| 12/12 [00:23<00:00,  1.93s/it, loss=0.0244, test_loss=0.145]
Epoch 77/250: 100%|██████████| 12/12 [00:22<00:00,  1.87s/it, loss=0.0242, test_loss=0.131]
Epoch 78/250: 100%|██████████| 12/12 [00:22<00:00,  1.89s/it, loss=0.0243, test_loss=0.13]
Epoch 79/250: 100%|██████████| 12/12 [00:22<00:00,  1.89s/it, loss=0.024, test_loss=0.142]
Epoch 80/250: 100%|██████████| 12/12 [00:22<00:00,  1.86s/it, loss=0.0238, test_loss=0.128]


Macro: ER=0.79, F=0.08, LE=120.36, LR=0.22
Micro: ER=0.79, F=0.22, LE=38.13, LR=0.52


Epoch 81/250: 100%|██████████| 12/12 [00:22<00:00,  1.85s/it, loss=0.024, test_loss=0.133]
Epoch 82/250: 100%|██████████| 12/12 [00:22<00:00,  1.86s/it, loss=0.0237, test_loss=0.133]
Epoch 83/250: 100%|██████████| 12/12 [00:22<00:00,  1.90s/it, loss=0.0232, test_loss=0.14]
Epoch 84/250: 100%|██████████| 12/12 [00:22<00:00,  1.89s/it, loss=0.023, test_loss=0.135]
Epoch 85/250: 100%|██████████| 12/12 [00:22<00:00,  1.90s/it, loss=0.0229, test_loss=0.135]
Epoch 86/250: 100%|██████████| 12/12 [00:22<00:00,  1.91s/it, loss=0.0232, test_loss=0.134]
Epoch 87/250: 100%|██████████| 12/12 [00:22<00:00,  1.87s/it, loss=0.0229, test_loss=0.127]
Epoch 88/250: 100%|██████████| 12/12 [00:22<00:00,  1.87s/it, loss=0.0231, test_loss=0.137]
Epoch 89/250: 100%|██████████| 12/12 [00:22<00:00,  1.90s/it, loss=0.0227, test_loss=0.131]
Epoch 90/250: 100%|██████████| 12/12 [00:22<00:00,  1.88s/it, loss=0.0226, test_loss=0.129]


Macro: ER=0.80, F=0.08, LE=121.32, LR=0.22
Micro: ER=0.80, F=0.22, LE=37.03, LR=0.53


Epoch 91/250: 100%|██████████| 12/12 [00:22<00:00,  1.91s/it, loss=0.0225, test_loss=0.138]
Epoch 92/250: 100%|██████████| 12/12 [00:22<00:00,  1.87s/it, loss=0.0227, test_loss=0.133]
Epoch 93/250: 100%|██████████| 12/12 [00:22<00:00,  1.90s/it, loss=0.0226, test_loss=0.129]
Epoch 94/250: 100%|██████████| 12/12 [00:22<00:00,  1.88s/it, loss=0.0223, test_loss=0.132]
Epoch 95/250: 100%|██████████| 12/12 [00:22<00:00,  1.89s/it, loss=0.0222, test_loss=0.145]
Epoch 96/250: 100%|██████████| 12/12 [00:22<00:00,  1.91s/it, loss=0.022, test_loss=0.141]
Epoch 97/250: 100%|██████████| 12/12 [00:22<00:00,  1.89s/it, loss=0.0224, test_loss=0.129]
Epoch 98/250: 100%|██████████| 12/12 [00:22<00:00,  1.91s/it, loss=0.0221, test_loss=0.131]
Epoch 99/250: 100%|██████████| 12/12 [00:22<00:00,  1.90s/it, loss=0.0223, test_loss=0.136]
Epoch 100/250: 100%|██████████| 12/12 [00:22<00:00,  1.88s/it, loss=0.022, test_loss=0.133]


Macro: ER=0.81, F=0.08, LE=117.86, LR=0.22
Micro: ER=0.81, F=0.22, LE=36.11, LR=0.52


Epoch 101/250: 100%|██████████| 12/12 [00:22<00:00,  1.89s/it, loss=0.0221, test_loss=0.133]
Epoch 102/250: 100%|██████████| 12/12 [00:22<00:00,  1.88s/it, loss=0.0218, test_loss=0.137]
Epoch 103/250: 100%|██████████| 12/12 [00:22<00:00,  1.88s/it, loss=0.0216, test_loss=0.132]
Epoch 104/250: 100%|██████████| 12/12 [00:22<00:00,  1.89s/it, loss=0.0216, test_loss=0.129]
Epoch 105/250: 100%|██████████| 12/12 [00:22<00:00,  1.87s/it, loss=0.0215, test_loss=0.133]
Epoch 106/250: 100%|██████████| 12/12 [00:22<00:00,  1.91s/it, loss=0.0214, test_loss=0.138]
Epoch 107/250: 100%|██████████| 12/12 [00:22<00:00,  1.86s/it, loss=0.0211, test_loss=0.132]
Epoch 108/250: 100%|██████████| 12/12 [00:23<00:00,  1.93s/it, loss=0.0215, test_loss=0.137]
Epoch 109/250: 100%|██████████| 12/12 [00:22<00:00,  1.83s/it, loss=0.0214, test_loss=0.138]
Epoch 110/250: 100%|██████████| 12/12 [00:21<00:00,  1.81s/it, loss=0.0211, test_loss=0.129]


Macro: ER=0.81, F=0.08, LE=120.25, LR=0.22
Micro: ER=0.81, F=0.22, LE=37.35, LR=0.52


Epoch 111/250: 100%|██████████| 12/12 [00:21<00:00,  1.81s/it, loss=0.0211, test_loss=0.137]
Epoch 112/250: 100%|██████████| 12/12 [00:21<00:00,  1.80s/it, loss=0.021, test_loss=0.134]
Epoch 113/250: 100%|██████████| 12/12 [00:21<00:00,  1.81s/it, loss=0.0208, test_loss=0.134]
Epoch 114/250: 100%|██████████| 12/12 [00:22<00:00,  1.84s/it, loss=0.0212, test_loss=0.133]
Epoch 115/250: 100%|██████████| 12/12 [00:22<00:00,  1.85s/it, loss=0.0211, test_loss=0.142]
Epoch 116/250: 100%|██████████| 12/12 [00:21<00:00,  1.83s/it, loss=0.0206, test_loss=0.131]
Epoch 117/250: 100%|██████████| 12/12 [00:21<00:00,  1.83s/it, loss=0.0206, test_loss=0.13]
Epoch 118/250: 100%|██████████| 12/12 [00:21<00:00,  1.81s/it, loss=0.0207, test_loss=0.134]
Epoch 119/250: 100%|██████████| 12/12 [00:22<00:00,  1.86s/it, loss=0.0207, test_loss=0.135]
Epoch 120/250: 100%|██████████| 12/12 [00:21<00:00,  1.82s/it, loss=0.0205, test_loss=0.128]


Macro: ER=0.78, F=0.08, LE=118.44, LR=0.22
Micro: ER=0.78, F=0.24, LE=36.12, LR=0.53


Epoch 121/250: 100%|██████████| 12/12 [00:21<00:00,  1.83s/it, loss=0.0204, test_loss=0.132]
Epoch 122/250: 100%|██████████| 12/12 [00:22<00:00,  1.85s/it, loss=0.0205, test_loss=0.128]
Epoch 123/250: 100%|██████████| 12/12 [00:21<00:00,  1.83s/it, loss=0.0203, test_loss=0.133]
Epoch 124/250: 100%|██████████| 12/12 [00:21<00:00,  1.83s/it, loss=0.0204, test_loss=0.132]
Epoch 125/250: 100%|██████████| 12/12 [00:21<00:00,  1.83s/it, loss=0.0204, test_loss=0.131]
Epoch 126/250: 100%|██████████| 12/12 [00:22<00:00,  1.84s/it, loss=0.0203, test_loss=0.127]
Epoch 127/250: 100%|██████████| 12/12 [00:22<00:00,  1.84s/it, loss=0.0203, test_loss=0.141]
Epoch 128/250: 100%|██████████| 12/12 [00:21<00:00,  1.83s/it, loss=0.0204, test_loss=0.141]
Epoch 129/250: 100%|██████████| 12/12 [00:22<00:00,  1.85s/it, loss=0.0205, test_loss=0.136]
Epoch 130/250: 100%|██████████| 12/12 [00:21<00:00,  1.82s/it, loss=0.0203, test_loss=0.138]


Macro: ER=0.81, F=0.08, LE=116.41, LR=0.22
Micro: ER=0.81, F=0.23, LE=35.81, LR=0.53


Epoch 131/250: 100%|██████████| 12/12 [00:22<00:00,  1.91s/it, loss=0.02, test_loss=0.124]
Epoch 132/250: 100%|██████████| 12/12 [00:23<00:00,  1.99s/it, loss=0.0198, test_loss=0.137]
Epoch 133/250: 100%|██████████| 12/12 [00:23<00:00,  1.95s/it, loss=0.0197, test_loss=0.132]
Epoch 134/250: 100%|██████████| 12/12 [00:23<00:00,  2.00s/it, loss=0.0198, test_loss=0.134]
Epoch 135/250: 100%|██████████| 12/12 [00:23<00:00,  2.00s/it, loss=0.0197, test_loss=0.132]
Epoch 136/250: 100%|██████████| 12/12 [00:23<00:00,  1.99s/it, loss=0.0197, test_loss=0.129]
Epoch 137/250: 100%|██████████| 12/12 [00:23<00:00,  1.97s/it, loss=0.0198, test_loss=0.127]
Epoch 138/250: 100%|██████████| 12/12 [00:23<00:00,  1.97s/it, loss=0.0195, test_loss=0.127]
Epoch 139/250: 100%|██████████| 12/12 [00:23<00:00,  1.96s/it, loss=0.0193, test_loss=0.133]
Epoch 140/250: 100%|██████████| 12/12 [00:23<00:00,  1.99s/it, loss=0.0192, test_loss=0.129]


Macro: ER=0.80, F=0.09, LE=117.76, LR=0.23
Micro: ER=0.80, F=0.25, LE=34.72, LR=0.54


Epoch 141/250: 100%|██████████| 12/12 [00:23<00:00,  1.97s/it, loss=0.0195, test_loss=0.131]
Epoch 142/250: 100%|██████████| 12/12 [00:23<00:00,  1.95s/it, loss=0.0192, test_loss=0.129]
Epoch 143/250: 100%|██████████| 12/12 [00:23<00:00,  1.97s/it, loss=0.0191, test_loss=0.132]
Epoch 144/250: 100%|██████████| 12/12 [00:23<00:00,  1.94s/it, loss=0.019, test_loss=0.131]
Epoch 145/250: 100%|██████████| 12/12 [00:23<00:00,  1.95s/it, loss=0.0189, test_loss=0.131]
Epoch 146/250: 100%|██████████| 12/12 [00:23<00:00,  1.97s/it, loss=0.0189, test_loss=0.132]
Epoch 147/250: 100%|██████████| 12/12 [00:23<00:00,  1.97s/it, loss=0.0185, test_loss=0.141]
Epoch 148/250: 100%|██████████| 12/12 [00:23<00:00,  1.95s/it, loss=0.0181, test_loss=0.136]
Epoch 149/250: 100%|██████████| 12/12 [00:23<00:00,  1.95s/it, loss=0.0178, test_loss=0.136]
Epoch 150/250: 100%|██████████| 12/12 [00:23<00:00,  1.98s/it, loss=0.0175, test_loss=0.134]


Macro: ER=0.80, F=0.09, LE=116.80, LR=0.23
Micro: ER=0.80, F=0.24, LE=36.57, LR=0.54


Epoch 151/250: 100%|██████████| 12/12 [00:23<00:00,  1.96s/it, loss=0.0179, test_loss=0.132]
Epoch 152/250: 100%|██████████| 12/12 [00:23<00:00,  1.95s/it, loss=0.0178, test_loss=0.129]
Epoch 153/250: 100%|██████████| 12/12 [00:23<00:00,  1.94s/it, loss=0.0176, test_loss=0.134]
Epoch 154/250: 100%|██████████| 12/12 [00:23<00:00,  1.98s/it, loss=0.0174, test_loss=0.13]
Epoch 155/250: 100%|██████████| 12/12 [00:23<00:00,  1.96s/it, loss=0.0177, test_loss=0.123]
Epoch 156/250: 100%|██████████| 12/12 [00:23<00:00,  1.97s/it, loss=0.0176, test_loss=0.128]
Epoch 157/250: 100%|██████████| 12/12 [00:23<00:00,  1.94s/it, loss=0.0173, test_loss=0.129]
Epoch 158/250: 100%|██████████| 12/12 [00:23<00:00,  1.98s/it, loss=0.0171, test_loss=0.128]
Epoch 159/250: 100%|██████████| 12/12 [00:23<00:00,  1.96s/it, loss=0.0172, test_loss=0.128]
Epoch 160/250: 100%|██████████| 12/12 [00:23<00:00,  1.99s/it, loss=0.0172, test_loss=0.123]


Macro: ER=0.81, F=0.08, LE=106.10, LR=0.23
Micro: ER=0.81, F=0.23, LE=37.10, LR=0.56


Epoch 161/250: 100%|██████████| 12/12 [00:23<00:00,  1.94s/it, loss=0.017, test_loss=0.132]
Epoch 162/250: 100%|██████████| 12/12 [00:23<00:00,  1.98s/it, loss=0.0164, test_loss=0.135]
Epoch 163/250: 100%|██████████| 12/12 [00:23<00:00,  1.98s/it, loss=0.0167, test_loss=0.128]
Epoch 164/250: 100%|██████████| 12/12 [00:23<00:00,  1.96s/it, loss=0.0166, test_loss=0.136]
Epoch 165/250: 100%|██████████| 12/12 [00:23<00:00,  1.99s/it, loss=0.0164, test_loss=0.135]
Epoch 166/250: 100%|██████████| 12/12 [00:23<00:00,  1.97s/it, loss=0.0165, test_loss=0.13]
Epoch 167/250: 100%|██████████| 12/12 [00:23<00:00,  1.98s/it, loss=0.0165, test_loss=0.132]
Epoch 168/250: 100%|██████████| 12/12 [00:23<00:00,  2.00s/it, loss=0.0164, test_loss=0.129]
Epoch 169/250: 100%|██████████| 12/12 [00:23<00:00,  1.95s/it, loss=0.0163, test_loss=0.13]
Epoch 170/250: 100%|██████████| 12/12 [00:23<00:00,  1.95s/it, loss=0.0164, test_loss=0.127]


Macro: ER=0.79, F=0.09, LE=104.52, LR=0.23
Micro: ER=0.79, F=0.24, LE=36.22, LR=0.54


Epoch 171/250: 100%|██████████| 12/12 [00:23<00:00,  1.94s/it, loss=0.0167, test_loss=0.129]
Epoch 172/250: 100%|██████████| 12/12 [00:23<00:00,  2.00s/it, loss=0.0167, test_loss=0.13]
Epoch 173/250: 100%|██████████| 12/12 [00:23<00:00,  1.97s/it, loss=0.0162, test_loss=0.131]
Epoch 174/250: 100%|██████████| 12/12 [00:23<00:00,  1.96s/it, loss=0.0162, test_loss=0.133]
Epoch 175/250: 100%|██████████| 12/12 [00:23<00:00,  1.98s/it, loss=0.0163, test_loss=0.131]
Epoch 176/250: 100%|██████████| 12/12 [00:23<00:00,  1.95s/it, loss=0.016, test_loss=0.133]
Epoch 177/250: 100%|██████████| 12/12 [00:24<00:00,  2.02s/it, loss=0.0163, test_loss=0.136]
Epoch 178/250: 100%|██████████| 12/12 [00:23<00:00,  1.97s/it, loss=0.016, test_loss=0.139]
Epoch 179/250: 100%|██████████| 12/12 [00:23<00:00,  1.97s/it, loss=0.0161, test_loss=0.132]
Epoch 180/250: 100%|██████████| 12/12 [00:23<00:00,  1.97s/it, loss=0.016, test_loss=0.128]


Macro: ER=0.80, F=0.09, LE=104.11, LR=0.24
Micro: ER=0.80, F=0.24, LE=37.08, LR=0.55


Epoch 181/250: 100%|██████████| 12/12 [00:23<00:00,  1.98s/it, loss=0.016, test_loss=0.133]
Epoch 182/250: 100%|██████████| 12/12 [00:23<00:00,  1.95s/it, loss=0.0157, test_loss=0.128]
Epoch 183/250: 100%|██████████| 12/12 [00:24<00:00,  2.01s/it, loss=0.0157, test_loss=0.129]
Epoch 184/250: 100%|██████████| 12/12 [00:23<00:00,  1.93s/it, loss=0.0156, test_loss=0.135]
Epoch 185/250: 100%|██████████| 12/12 [00:23<00:00,  1.92s/it, loss=0.0157, test_loss=0.131]
Epoch 186/250: 100%|██████████| 12/12 [00:22<00:00,  1.90s/it, loss=0.0156, test_loss=0.132]
Epoch 187/250: 100%|██████████| 12/12 [00:22<00:00,  1.89s/it, loss=0.0153, test_loss=0.135]
Epoch 188/250: 100%|██████████| 12/12 [00:22<00:00,  1.91s/it, loss=0.0153, test_loss=0.131]
Epoch 189/250: 100%|██████████| 12/12 [00:22<00:00,  1.91s/it, loss=0.0152, test_loss=0.128]
Epoch 190/250: 100%|██████████| 12/12 [00:23<00:00,  1.94s/it, loss=0.0151, test_loss=0.135]


Macro: ER=0.83, F=0.08, LE=104.15, LR=0.24
Micro: ER=0.83, F=0.23, LE=35.86, LR=0.56


Epoch 191/250: 100%|██████████| 12/12 [00:23<00:00,  1.93s/it, loss=0.0152, test_loss=0.13]
Epoch 192/250: 100%|██████████| 12/12 [00:23<00:00,  1.93s/it, loss=0.0151, test_loss=0.135]
Epoch 193/250: 100%|██████████| 12/12 [00:23<00:00,  1.92s/it, loss=0.0152, test_loss=0.129]
Epoch 194/250: 100%|██████████| 12/12 [00:23<00:00,  1.94s/it, loss=0.0151, test_loss=0.135]
Epoch 195/250: 100%|██████████| 12/12 [00:23<00:00,  1.94s/it, loss=0.0152, test_loss=0.132]
Epoch 196/250: 100%|██████████| 12/12 [00:23<00:00,  1.93s/it, loss=0.0152, test_loss=0.129]
Epoch 197/250: 100%|██████████| 12/12 [00:22<00:00,  1.91s/it, loss=0.0151, test_loss=0.134]
Epoch 198/250: 100%|██████████| 12/12 [00:22<00:00,  1.91s/it, loss=0.0151, test_loss=0.129]
Epoch 199/250: 100%|██████████| 12/12 [00:22<00:00,  1.90s/it, loss=0.0151, test_loss=0.136]
Epoch 200/250: 100%|██████████| 12/12 [00:23<00:00,  1.92s/it, loss=0.0149, test_loss=0.133]


Macro: ER=0.82, F=0.09, LE=103.74, LR=0.23
Micro: ER=0.82, F=0.23, LE=35.65, LR=0.55


Epoch 201/250: 100%|██████████| 12/12 [00:23<00:00,  1.93s/it, loss=0.015, test_loss=0.133]
Epoch 202/250: 100%|██████████| 12/12 [00:23<00:00,  1.93s/it, loss=0.0149, test_loss=0.132]
Epoch 203/250: 100%|██████████| 12/12 [00:23<00:00,  1.96s/it, loss=0.0149, test_loss=0.136]
Epoch 204/250: 100%|██████████| 12/12 [00:23<00:00,  1.93s/it, loss=0.0149, test_loss=0.135]
Epoch 205/250: 100%|██████████| 12/12 [00:22<00:00,  1.88s/it, loss=0.0149, test_loss=0.127]
Epoch 206/250: 100%|██████████| 12/12 [00:22<00:00,  1.90s/it, loss=0.0148, test_loss=0.129]
Epoch 207/250: 100%|██████████| 12/12 [00:22<00:00,  1.90s/it, loss=0.015, test_loss=0.141]
Epoch 208/250: 100%|██████████| 12/12 [00:23<00:00,  1.93s/it, loss=0.0149, test_loss=0.133]
Epoch 209/250: 100%|██████████| 12/12 [00:23<00:00,  1.92s/it, loss=0.0149, test_loss=0.132]
Epoch 210/250: 100%|██████████| 12/12 [00:22<00:00,  1.90s/it, loss=0.0148, test_loss=0.133]


Macro: ER=0.81, F=0.09, LE=92.18, LR=0.24
Micro: ER=0.81, F=0.25, LE=35.22, LR=0.57


Epoch 211/250: 100%|██████████| 12/12 [00:22<00:00,  1.85s/it, loss=0.015, test_loss=0.13]
Epoch 212/250: 100%|██████████| 12/12 [00:22<00:00,  1.84s/it, loss=0.015, test_loss=0.13]
Epoch 213/250: 100%|██████████| 12/12 [00:21<00:00,  1.81s/it, loss=0.015, test_loss=0.134]
Epoch 214/250: 100%|██████████| 12/12 [00:22<00:00,  1.86s/it, loss=0.015, test_loss=0.134]
Epoch 215/250: 100%|██████████| 12/12 [00:22<00:00,  1.86s/it, loss=0.0149, test_loss=0.131]
Epoch 216/250: 100%|██████████| 12/12 [00:22<00:00,  1.86s/it, loss=0.0149, test_loss=0.128]
Epoch 217/250: 100%|██████████| 12/12 [00:22<00:00,  1.84s/it, loss=0.0146, test_loss=0.139]
Epoch 218/250: 100%|██████████| 12/12 [00:22<00:00,  1.84s/it, loss=0.0148, test_loss=0.13]
Epoch 219/250: 100%|██████████| 12/12 [00:22<00:00,  1.84s/it, loss=0.0148, test_loss=0.142]
Epoch 220/250: 100%|██████████| 12/12 [00:21<00:00,  1.82s/it, loss=0.0147, test_loss=0.129]


Macro: ER=0.78, F=0.09, LE=104.72, LR=0.24
Micro: ER=0.78, F=0.26, LE=35.13, LR=0.55


Epoch 221/250: 100%|██████████| 12/12 [00:21<00:00,  1.83s/it, loss=0.0146, test_loss=0.134]
Epoch 222/250: 100%|██████████| 12/12 [00:21<00:00,  1.83s/it, loss=0.0145, test_loss=0.13]
Epoch 223/250: 100%|██████████| 12/12 [00:21<00:00,  1.83s/it, loss=0.0147, test_loss=0.139]
Epoch 224/250: 100%|██████████| 12/12 [00:22<00:00,  1.85s/it, loss=0.0147, test_loss=0.137]
Epoch 225/250: 100%|██████████| 12/12 [00:22<00:00,  1.84s/it, loss=0.0145, test_loss=0.136]
Epoch 226/250: 100%|██████████| 12/12 [00:22<00:00,  1.84s/it, loss=0.0144, test_loss=0.135]
Epoch 227/250: 100%|██████████| 12/12 [00:22<00:00,  1.83s/it, loss=0.0144, test_loss=0.127]
Epoch 228/250: 100%|██████████| 12/12 [00:22<00:00,  1.87s/it, loss=0.0142, test_loss=0.13]
Epoch 229/250: 100%|██████████| 12/12 [00:22<00:00,  1.90s/it, loss=0.0143, test_loss=0.131]
Epoch 230/250: 100%|██████████| 12/12 [00:22<00:00,  1.91s/it, loss=0.0141, test_loss=0.132]


Macro: ER=0.79, F=0.09, LE=94.39, LR=0.24
Micro: ER=0.79, F=0.25, LE=34.63, LR=0.55


Epoch 231/250: 100%|██████████| 12/12 [00:23<00:00,  1.92s/it, loss=0.0141, test_loss=0.128]
Epoch 232/250: 100%|██████████| 12/12 [00:22<00:00,  1.91s/it, loss=0.0142, test_loss=0.13]
Epoch 233/250: 100%|██████████| 12/12 [00:22<00:00,  1.91s/it, loss=0.0142, test_loss=0.129]
Epoch 234/250: 100%|██████████| 12/12 [00:23<00:00,  1.93s/it, loss=0.0142, test_loss=0.133]
Epoch 235/250: 100%|██████████| 12/12 [00:22<00:00,  1.85s/it, loss=0.0143, test_loss=0.132]
Epoch 236/250: 100%|██████████| 12/12 [00:22<00:00,  1.87s/it, loss=0.0143, test_loss=0.129]
Epoch 237/250: 100%|██████████| 12/12 [00:22<00:00,  1.87s/it, loss=0.0144, test_loss=0.135]
Epoch 238/250: 100%|██████████| 12/12 [00:22<00:00,  1.86s/it, loss=0.0143, test_loss=0.133]
Epoch 239/250: 100%|██████████| 12/12 [00:22<00:00,  1.88s/it, loss=0.0143, test_loss=0.131]
Epoch 240/250: 100%|██████████| 12/12 [00:22<00:00,  1.85s/it, loss=0.0143, test_loss=0.132]


Macro: ER=0.79, F=0.09, LE=93.16, LR=0.24
Micro: ER=0.79, F=0.25, LE=35.26, LR=0.56


Epoch 241/250: 100%|██████████| 12/12 [00:22<00:00,  1.84s/it, loss=0.0144, test_loss=0.133]
Epoch 242/250: 100%|██████████| 12/12 [00:22<00:00,  1.85s/it, loss=0.0142, test_loss=0.132]
Epoch 243/250: 100%|██████████| 12/12 [00:22<00:00,  1.87s/it, loss=0.014, test_loss=0.135]
Epoch 244/250: 100%|██████████| 12/12 [00:22<00:00,  1.86s/it, loss=0.014, test_loss=0.134]
Epoch 245/250: 100%|██████████| 12/12 [00:22<00:00,  1.86s/it, loss=0.0142, test_loss=0.127]
Epoch 246/250: 100%|██████████| 12/12 [00:22<00:00,  1.85s/it, loss=0.014, test_loss=0.131]
Epoch 247/250: 100%|██████████| 12/12 [00:22<00:00,  1.85s/it, loss=0.014, test_loss=0.139]
Epoch 248/250: 100%|██████████| 12/12 [00:22<00:00,  1.85s/it, loss=0.0141, test_loss=0.134]
Epoch 249/250: 100%|██████████| 12/12 [00:22<00:00,  1.86s/it, loss=0.0141, test_loss=0.135]
Epoch 250/250: 100%|██████████| 12/12 [00:22<00:00,  1.85s/it, loss=0.0142, test_loss=0.131]

Macro: ER=0.80, F=0.10, LE=94.94, LR=0.25
Micro: ER=0.80, F=0.26, LE=35.13, LR=0.56
Micro @ epoch 246: ER=0.79, F=0.11, LE=93.29, LR=0.24
Macro @ epoch 246: ER=0.79, F=0.26, LE=35.12, LR=0.55



