In [1]:
import os
import random
import pandas as pd
import numpy as np
import mxnet as mx
import torch
import torch.nn as nn
import torch.nn.functional as F
import torch.optim as opt
from torch.utils.data import Dataset, DataLoader
from pytorch_metric_learning import losses
from einops import rearrange, repeat
import optuna
from optuna.trial import TrialState
from tqdm import tqdm

In [2]:
def file_to_embed(embeds, file):
    emb = []
    for f in file:
        emb.append(embeds[f][0])
    return torch.stack(emb)

In [3]:
MIN_NUM_PATCHES = 16

In [4]:
device = torch.device("cuda:1" if torch.cuda.is_available() else "cpu")
device

device(type='cuda', index=1)

In [5]:
class AdienceDataset(Dataset):
    def __init__(self, annot_file, img_dir):
        self.img_lbls = pd.read_csv(annot_file, header=None)
        self.img_dir = img_dir
    
    def __len__(self):
        return len(self.img_lbls)
    
    def __getitem__(self, idx):
        img_file = self.img_lbls.iloc[idx, 0]
        img_path = os.path.join(self.img_dir, img_file)
        image = mx.image.imread(img_path)
        if image.shape[1] != 112:
            image = mx.image.resize_short(image, 112)
        image = mx.nd.transpose(image, axes=(2,0,1))
        image = torch.tensor(image.asnumpy()).type(torch.FloatTensor)
        label = self.img_lbls.iloc[idx, 1]

        return image, label, img_file

In [6]:
train_data = AdienceDataset("../train.csv", "../cropped_Adience/")
val_data = AdienceDataset("../val.csv", "../cropped_Adience/")

In [7]:
class CosFace(nn.Module):
    r"""Implement of CosFace (https://arxiv.org/pdf/1801.09414.pdf):
    Args:
        in_features: size of each input sample
        out_features: size of each output sample
        device_id: the ID of GPU where the model will be trained by model parallel.
                       if device_id=None, it will be trained on CPU without model parallel.
        s: norm of input feature
        m: margin
        cos(theta)-m
    """

    def __init__(self, in_features, out_features, device_id, s=64.0, m=0.35):
        super(CosFace, self).__init__()
        self.in_features = in_features
        self.out_features = out_features
        self.device_id = device_id
        self.s = s
        self.m = m
        print("self.device_id", self.device_id)
        self.weight = nn.Parameter(torch.FloatTensor(out_features, in_features))
        nn.init.xavier_uniform_(self.weight)

    def forward(self, input, label):
        # --------------------------- cos(theta) & phi(theta) ---------------------------

        if self.device_id == None:
            cosine = F.linear(F.normalize(input), F.normalize(self.weight))
        else:
            x = input
            sub_weights = torch.chunk(self.weight, len(self.device_id), dim=0)
            temp_x = x.cuda(self.device_id[0])
            weight = sub_weights[0].cuda(self.device_id[0])
            cosine = F.linear(F.normalize(temp_x), F.normalize(weight))
            for i in range(1, len(self.device_id)):
                temp_x = x.cuda(self.device_id[i])
                weight = sub_weights[i].cuda(self.device_id[i])
                cosine = torch.cat((cosine, F.linear(F.normalize(temp_x), F.normalize(weight)).cuda(self.device_id[0])),
                                   dim=1)
        phi = cosine - self.m
        # --------------------------- convert label to one-hot ---------------------------
        one_hot = torch.zeros(cosine.size())
        if self.device_id != None:
            one_hot = one_hot.cuda(self.device_id[0])
        # one_hot = one_hot.cuda() if cosine.is_cuda else one_hot

        one_hot.scatter_(1, label.view(-1, 1).long(), 1)
        # -------------torch.where(out_i = {x_i if condition_i else y_i) -------------
        output = (one_hot * phi) + (
                    (1.0 - one_hot) * cosine)  # you can use torch.where if your torch.__version__ is 0.4
        output *= self.s

        return output

    def __repr__(self):
        return self.__class__.__name__ + '(' \
               + 'in_features = ' + str(self.in_features) \
               + ', out_features = ' + str(self.out_features) \
               + ', s = ' + str(self.s) \
               + ', m = ' + str(self.m) + ')'

In [8]:
class Residual(nn.Module):
    def __init__(self, fn):
        super().__init__()
        self.fn = fn
    def forward(self, x, **kwargs):
        return self.fn(x, **kwargs) + x

In [9]:
class PreNorm(nn.Module):
    def __init__(self, dim, fn):
        super().__init__()
        self.norm = nn.LayerNorm(dim)
        self.fn = fn
    def forward(self, x, **kwargs):
        return self.fn(self.norm(x), **kwargs)

In [10]:
class FeedForward(nn.Module):
    def __init__(self, dim, hidden_dim, dropout = 0.):
        super().__init__()
        self.net = nn.Sequential(
            nn.Linear(dim, hidden_dim),
            nn.GELU(),
            nn.Dropout(dropout),
            nn.Linear(hidden_dim, dim),
            nn.Dropout(dropout)
        )
    def forward(self, x):
        return self.net(x)

In [11]:
class Attention(nn.Module):
    def __init__(self, dim, heads = 8, dim_head = 64, dropout = 0.):
        super().__init__()
        inner_dim = dim_head *  heads
        self.heads = heads
        self.scale = dim ** -0.5

        self.to_qkv = nn.Linear(dim, inner_dim * 3, bias = False)
        self.to_out = nn.Sequential(
            nn.Linear(inner_dim, dim),
            nn.Dropout(dropout)
        )

    def forward(self, x, mask = None):
        b, n, _, h = *x.shape, self.heads
        qkv = self.to_qkv(x).chunk(3, dim = -1)

        q, k, v = map(lambda t: rearrange(t, 'b n (h d) -> b h n d', h = h), qkv)
        dots = torch.einsum('bhid,bhjd->bhij', q, k) * self.scale
        mask_value = -torch.finfo(dots.dtype).max
        #embed()
        if mask is not None:
            mask = F.pad(mask.flatten(1), (1, 0), value = True)
            assert mask.shape[-1] == dots.shape[-1], 'mask has incorrect dimensions'
            mask = mask[:, None, :] * mask[:, :, None]
            dots.masked_fill_(~mask, mask_value)
            del mask

        attn = dots.softmax(dim=-1)

        out = torch.einsum('bhij,bhjd->bhid', attn, v)
        out = rearrange(out, 'b h n d -> b n (h d)')
        out =  self.to_out(out)

        return out

In [12]:
class Transformer(nn.Module):
    def __init__(self, dim, depth, heads, dim_head, mlp_dim, dropout):
        super().__init__()
        self.layers = nn.ModuleList([])
        for _ in range(depth):
            self.layers.append(nn.ModuleList([
                Residual(PreNorm(dim, Attention(dim, heads = heads, dim_head = dim_head, dropout = dropout))),
                Residual(PreNorm(dim, FeedForward(dim, mlp_dim, dropout = dropout)))
            ]))
    def forward(self, x, mask = None):
        for attn, ff in self.layers:
            x = attn(x, mask = mask)
            #embed()
            x = ff(x)
        return x

In [13]:
class ViTs_face(nn.Module):
    def __init__(self, *, loss_type, GPU_ID, num_class, image_size, patch_size, ac_patch_size,
                         pad, dim, depth, heads, mlp_dim, pool = 'mean', channels = 3, dim_head = 64, dropout = 0., emb_dropout = 0.):
        super().__init__()
        assert image_size % patch_size == 0, 'Image dimensions must be divisible by the patch size.'
        num_patches = (image_size // patch_size) ** 2
        patch_dim = channels * ac_patch_size ** 2
        assert num_patches > MIN_NUM_PATCHES, f'your number of patches ({num_patches}) is way too small for attention to be effective (at least 16). Try decreasing your patch size'
        assert pool in {'cls', 'mean'}, 'pool type must be either cls (cls token) or mean (mean pooling)'

        self.patch_size = patch_size
        self.soft_split = nn.Unfold(kernel_size=(ac_patch_size, ac_patch_size), stride=(self.patch_size, self.patch_size), padding=(pad, pad))


        self.pos_embedding = nn.Parameter(torch.randn(1, num_patches + 1, dim))
        self.patch_to_embedding = nn.Linear(patch_dim, dim)
        self.cls_token = nn.Parameter(torch.randn(1, 1, dim))
        self.dropout = nn.Dropout(emb_dropout)

        self.transformer = Transformer(dim, depth, heads, dim_head, mlp_dim, dropout)

        self.pool = pool
        self.to_latent = nn.Identity()

        self.mlp_head = nn.Sequential(
            nn.LayerNorm(dim),
        )
        self.loss_type = loss_type
        self.GPU_ID = GPU_ID
        if self.loss_type == 'None':
            print("no loss for vit_face")
        else:
            if self.loss_type == 'CosFace':
                self.loss = CosFace(in_features=dim, out_features=num_class, device_id=self.GPU_ID)

    def forward(self, img, label= None , mask = None):
        p = self.patch_size
        x = self.soft_split(img).transpose(1, 2)
        x = self.patch_to_embedding(x)
        b, n, _ = x.shape

        cls_tokens = repeat(self.cls_token, '() n d -> b n d', b = b)
        x = torch.cat((cls_tokens, x), dim=1)
        x += self.pos_embedding[:, :(n + 1)]
        x = self.dropout(x)
        x = self.transformer(x, mask)

        # y = x[:, 0]
        z = x[:, 1:].mean(dim = 1)

        # y = self.to_latent(y)
        # emb_y = self.mlp_head(y)
        z = self.to_latent(z)
        emb_z = self.mlp_head(z)
        # emb = torch.cat((emb_y, emb_z), dim=1)
        emb = emb_z
        if label is not None:
            x = self.loss(emb, label)
            return x, emb
        else:
            return emb

In [14]:
class ViT_plus(nn.Module):
    def __init__(self):
        super(ViT_plus, self).__init__()
        
        self.fc1 = nn.Linear(in_features=512, out_features=512)
        self.fc2 = nn.Linear(in_features=512, out_features=2)
        
    def forward(self, x):
        x = self.fc1(x)
        x_cosface = x
        x_classification = self.fc2(x)
        
        return x_cosface, x_classification

In [15]:
model = ViTs_face(
            loss_type='CosFace',
            GPU_ID=[device],
            num_class=93431,
            image_size=112,
            patch_size=8,
            ac_patch_size=12,
            pad=4,
            dim=512,
            depth=20,
            heads=8,
            mlp_dim=2048,
            dropout=0.1,
            emb_dropout=0.1
        ).to(device)
model.load_state_dict(
    torch.load("../Backbone_VITs_Epoch_2_Batch_12000_Time_2021-03-17-04-05_checkpoint.pth", map_location=device)
)

self.device_id [device(type='cuda', index=1)]


<All keys matched successfully>

In [16]:
for param in model.parameters():
    param.requires_grad = False

In [17]:
embeds = {}
model.eval()

with torch.no_grad():
    for img, label, file in train_data:
        img = img.to(device)
        embeds[file] = model(torch.unsqueeze(img, 0))

    for img, label, file in val_data:
        img = img.to(device)
        embeds[file] = model(torch.unsqueeze(img, 0))

In [18]:
best_accu = 0.0
def objective(trial):
    model_xtr = ViT_plus().to(device)
    
    loss_lr = trial.suggest_float("loss_learning_rate", 1e-4, 1e-2, log=True)
    arc_margin = losses.ArcFaceLoss(2, 512).to(device)
    loss_optimizer = opt.AdamW(arc_margin.parameters(), lr=loss_lr)
    
    lr = trial.suggest_float("learning_rate", 1e-5, 1e-1, log=True)
    wd = trial.suggest_float('weight_decay', 1e-4, 1e-2, log=True)
    eps = trial.suggest_float("epsilon", 1e-9, 1e-7, log=True)
    optimizer = opt.AdamW(model_xtr.parameters(), lr=lr, eps=eps, weight_decay=wd)
    
    criterion = nn.CrossEntropyLoss()
    
    batch_size = trial.suggest_int('batch_size', 50, 300)
    num_epochs = trial.suggest_int('epochs', 10, 100)
    
    print("Learning rate for Loss: "+ str(loss_lr))
    print("Learning rate: "+ str(lr))
    print("Weight decay: "+ str(wd))
    print("Epsilon: "+ str(eps))
    print("Batch size: "+ str(batch_size))
    print("Number of epochs: "+ str(num_epochs))
    
    for epoch in tqdm(range(num_epochs), desc="Epochs"):
        train_loader = DataLoader(train_data, batch_size=batch_size, shuffle=True, num_workers=4)
        val_loader = DataLoader(val_data, batch_size=batch_size, shuffle=False, num_workers=4)
        
        # training loop
        running_loss = []
        running_accu = []
        
        model_xtr.train()
        for img, label, file in tqdm(train_loader, desc="Training", leave=False):
            img, label = img.to(device), label.to(device)

            x = file_to_embed(embeds, file)
            
            optimizer.zero_grad()
            embed, output = model_xtr(x)
            
            pred = torch.argmax(output, 1)
            accuracy = torch.eq(pred, label).sum() / len(img)

            class_loss = criterion(output, label)
            arc_loss = arc_margin(embed, label)
            loss = class_loss + arc_loss
            loss.backward()
            loss_optimizer.step()
            optimizer.step()

            running_accu.append(accuracy.cpu().detach().numpy())
            running_loss.append(loss.cpu().detach().numpy())
        print("Epoch: {}/{} - Loss: {:.4f} - Accuracy: {:.4f}".format(epoch+1, num_epochs, np.mean(running_loss), np.mean(running_accu)))
        
        # validation loop
        val_loss = []
        val_accu = []

        model_xtr.eval()
        with torch.no_grad():
            for img, label, file in tqdm(val_loader):
                img, label = img.to(device), label.to(device)
                
                x = file_to_embed(embeds, file)
                
                embed, output = model_xtr(x)
                
                pred = torch.argmax(output, 1)
                accuracy = torch.eq(pred, label).sum() / len(img)
                
                class_loss = criterion(output, label)
                arc_loss = arc_margin(embed, label)
                loss = class_loss + arc_loss
                
                val_accu.append(accuracy.cpu().detach().numpy())
                val_loss.append(loss.cpu().detach().numpy())
        val_accu = np.mean(val_accu)
        val_loss = np.mean(val_loss)
        print("Val Loss: {:.4f} - Val Accuracy: {:.4f}".format(val_loss, val_accu))
        
        trial.report(val_accu, epoch)
        if trial.should_prune():
            raise optuna.exceptions.TrialPruned()
    
    global best_accu
    if val_accu > best_accu:
        best_accu = val_accu
        print("Saving best model...")
        torch.save(model_xtr.state_dict(), "../vit_12-8_arcface_mean_only.pt")
            
    return val_accu

In [19]:
study = optuna.create_study(direction='maximize',
                            study_name='arcface-12-8-mean-only-vit-study',
                            storage='sqlite:///study1.db',
                            load_if_exists=True)
study.optimize(objective, n_trials=20)

pruned_trials = study.get_trials(deepcopy=False, states=[TrialState.PRUNED])
complete_trials = study.get_trials(deepcopy=False, states=[TrialState.COMPLETE])

# Display the study statistics
print("\nStudy statistics: ")
print("  Number of finished trials: ", len(study.trials))
print("  Number of pruned trials: ", len(pruned_trials))
print("  Number of complete trials: ", len(complete_trials))

[32m[I 2023-12-14 22:16:22,919][0m A new study created in RDB with name: arcface-12-8-mean-only-vit-study[0m


Learning rate for Loss: 0.0005376476220126488
Learning rate: 0.0951473049247803
Weight decay: 0.005325118649485834
Epsilon: 1.5452523761763e-09
Batch size: 123
Number of epochs: 17


Epochs:   0%|          | 0/17 [00:00<?, ?it/s]
Training:   0%|          | 0/114 [00:00<?, ?it/s][A
Training:   1%|          | 1/114 [00:01<02:53,  1.54s/it][A
Training:   4%|▎         | 4/114 [00:01<00:35,  3.08it/s][A
Training:   5%|▌         | 6/114 [00:02<00:38,  2.84it/s][A
Training:   6%|▌         | 7/114 [00:02<00:31,  3.39it/s][A
Training:   8%|▊         | 9/114 [00:03<00:35,  2.94it/s][A
Training:  11%|█         | 12/114 [00:03<00:20,  4.97it/s][A
Training:  12%|█▏        | 14/114 [00:04<00:23,  4.25it/s][A
Training:  15%|█▍        | 17/114 [00:05<00:26,  3.73it/s][A
Training:  18%|█▊        | 21/114 [00:05<00:22,  4.21it/s][A
Training:  20%|██        | 23/114 [00:05<00:17,  5.12it/s][A
Training:  22%|██▏       | 25/114 [00:06<00:20,  4.33it/s][A
Training:  24%|██▎       | 27/114 [00:06<00:16,  5.21it/s][A
Training:  25%|██▌       | 29/114 [00:07<00:19,  4.28it/s][A
Training:  26%|██▋       | 30/114 [00:07<00:20,  4.19it/s][A
Training:  28%|██▊       | 32/114 [00

Epoch: 1/17 - Loss: 182.3364 - Accuracy: 0.7514



  0%|          | 0/15 [00:00<?, ?it/s][A
  7%|▋         | 1/15 [00:01<00:20,  1.45s/it][A
 20%|██        | 3/15 [00:01<00:05,  2.38it/s][A
 33%|███▎      | 5/15 [00:02<00:04,  2.32it/s][A
 47%|████▋     | 7/15 [00:02<00:02,  3.50it/s][A
 60%|██████    | 9/15 [00:03<00:01,  3.23it/s][A
 80%|████████  | 12/15 [00:03<00:00,  5.29it/s][A
100%|██████████| 15/15 [00:04<00:00,  3.60it/s][A
Epochs:   6%|▌         | 1/17 [00:30<08:09, 30.62s/it]

Val Loss: 6.5567 - Val Accuracy: 0.9022



Training:   0%|          | 0/114 [00:00<?, ?it/s][A
Training:   1%|          | 1/114 [00:01<02:18,  1.23s/it][A
Training:   2%|▏         | 2/114 [00:01<01:06,  1.68it/s][A
Training:   4%|▍         | 5/114 [00:01<00:32,  3.35it/s][A
Training:   5%|▌         | 6/114 [00:02<00:31,  3.41it/s][A
Training:   8%|▊         | 9/114 [00:02<00:27,  3.79it/s][A
Training:   9%|▉         | 10/114 [00:03<00:26,  3.90it/s][A
Training:  11%|█         | 12/114 [00:03<00:18,  5.49it/s][A
Training:  11%|█▏        | 13/114 [00:03<00:22,  4.41it/s][A
Training:  12%|█▏        | 14/114 [00:03<00:22,  4.50it/s][A
Training:  13%|█▎        | 15/114 [00:03<00:19,  5.20it/s][A
Training:  15%|█▍        | 17/114 [00:04<00:20,  4.67it/s][A
Training:  16%|█▌        | 18/114 [00:04<00:19,  5.04it/s][A
Training:  17%|█▋        | 19/114 [00:04<00:19,  4.81it/s][A
Training:  18%|█▊        | 21/114 [00:05<00:22,  4.18it/s][A
Training:  19%|█▉        | 22/114 [00:05<00:19,  4.77it/s][A
Training:  20%|██    

Epoch: 2/17 - Loss: 5.5481 - Accuracy: 0.8843



  0%|          | 0/15 [00:00<?, ?it/s][A
  7%|▋         | 1/15 [00:01<00:15,  1.11s/it][A
 20%|██        | 3/15 [00:01<00:04,  2.92it/s][A
 27%|██▋       | 4/15 [00:01<00:02,  3.80it/s][A
 33%|███▎      | 5/15 [00:02<00:04,  2.48it/s][A
 60%|██████    | 9/15 [00:02<00:01,  3.75it/s][A
 80%|████████  | 12/15 [00:02<00:00,  5.72it/s][A
100%|██████████| 15/15 [00:03<00:00,  4.06it/s][A
Epochs:  12%|█▏        | 2/17 [00:59<07:23, 29.57s/it]

Val Loss: 4.5914 - Val Accuracy: 0.9232



Training:   0%|          | 0/114 [00:00<?, ?it/s][A
Training:   1%|          | 1/114 [00:01<02:14,  1.19s/it][A
Training:   2%|▏         | 2/114 [00:01<01:09,  1.61it/s][A
Training:   4%|▎         | 4/114 [00:01<00:31,  3.47it/s][A
Training:   4%|▍         | 5/114 [00:02<00:40,  2.69it/s][A
Training:   5%|▌         | 6/114 [00:02<00:32,  3.32it/s][A
Training:   6%|▌         | 7/114 [00:02<00:27,  3.94it/s][A
Training:   8%|▊         | 9/114 [00:03<00:35,  2.96it/s][A
Training:   9%|▉         | 10/114 [00:03<00:29,  3.49it/s][A
Training:  11%|█▏        | 13/114 [00:04<00:25,  3.89it/s][A
Training:  15%|█▍        | 17/114 [00:04<00:20,  4.71it/s][A
Training:  18%|█▊        | 20/114 [00:04<00:14,  6.61it/s][A
Training:  19%|█▉        | 22/114 [00:05<00:20,  4.46it/s][A
Training:  22%|██▏       | 25/114 [00:06<00:20,  4.40it/s][A
Training:  23%|██▎       | 26/114 [00:06<00:19,  4.53it/s][A
Training:  25%|██▍       | 28/114 [00:06<00:15,  5.63it/s][A
Training:  25%|██▌     

Epoch: 3/17 - Loss: 4.9080 - Accuracy: 0.8923



  0%|          | 0/15 [00:00<?, ?it/s][A
  7%|▋         | 1/15 [00:01<00:20,  1.45s/it][A
 13%|█▎        | 2/15 [00:01<00:08,  1.45it/s][A
 27%|██▋       | 4/15 [00:01<00:03,  3.34it/s][A
 33%|███▎      | 5/15 [00:02<00:04,  2.23it/s][A
 47%|████▋     | 7/15 [00:02<00:02,  3.79it/s][A
 60%|██████    | 9/15 [00:03<00:01,  3.49it/s][A
 73%|███████▎  | 11/15 [00:03<00:00,  4.85it/s][A
 87%|████████▋ | 13/15 [00:04<00:00,  4.19it/s][A
100%|██████████| 15/15 [00:04<00:00,  3.52it/s][A
Epochs:  18%|█▊        | 3/17 [01:29<06:55, 29.67s/it]

Val Loss: 7.0906 - Val Accuracy: 0.9022



Training:   0%|          | 0/114 [00:00<?, ?it/s][A
Training:   1%|          | 1/114 [00:01<02:33,  1.36s/it][A
Training:   4%|▎         | 4/114 [00:01<00:32,  3.41it/s][A
Training:   5%|▌         | 6/114 [00:02<00:39,  2.73it/s][A
Training:   7%|▋         | 8/114 [00:02<00:26,  3.93it/s][A
Training:   9%|▉         | 10/114 [00:03<00:31,  3.32it/s][A
Training:  11%|█         | 12/114 [00:03<00:22,  4.59it/s][A
Training:  12%|█▏        | 14/114 [00:04<00:26,  3.77it/s][A
Training:  14%|█▍        | 16/114 [00:04<00:19,  4.99it/s][A
Training:  16%|█▌        | 18/114 [00:05<00:25,  3.72it/s][A
Training:  17%|█▋        | 19/114 [00:05<00:22,  4.16it/s][A
Training:  18%|█▊        | 21/114 [00:05<00:16,  5.68it/s][A
Training:  20%|██        | 23/114 [00:06<00:23,  3.82it/s][A
Training:  23%|██▎       | 26/114 [00:07<00:25,  3.45it/s][A
Training:  25%|██▍       | 28/114 [00:07<00:19,  4.44it/s][A
Training:  26%|██▋       | 30/114 [00:08<00:21,  3.84it/s][A
Training:  28%|██▊  

Epoch: 4/17 - Loss: 4.8701 - Accuracy: 0.8927



  0%|          | 0/15 [00:00<?, ?it/s][A
  7%|▋         | 1/15 [00:01<00:21,  1.53s/it][A
 20%|██        | 3/15 [00:01<00:05,  2.29it/s][A
 33%|███▎      | 5/15 [00:02<00:03,  2.59it/s][A
 47%|████▋     | 7/15 [00:02<00:02,  3.49it/s][A
 60%|██████    | 9/15 [00:03<00:02,  2.92it/s][A
 73%|███████▎  | 11/15 [00:03<00:00,  4.10it/s][A
100%|██████████| 15/15 [00:04<00:00,  3.36it/s][A
Epochs:  24%|██▎       | 4/17 [01:59<06:28, 29.89s/it]

Val Loss: 5.7914 - Val Accuracy: 0.9073



Training:   0%|          | 0/114 [00:00<?, ?it/s][A
Training:   1%|          | 1/114 [00:01<02:33,  1.35s/it][A
Training:   3%|▎         | 3/114 [00:01<00:47,  2.36it/s][A
Training:   4%|▍         | 5/114 [00:02<00:39,  2.77it/s][A
Training:   6%|▌         | 7/114 [00:02<00:25,  4.19it/s][A
Training:   7%|▋         | 8/114 [00:02<00:24,  4.36it/s][A
Training:   8%|▊         | 9/114 [00:03<00:36,  2.89it/s][A
Training:  10%|▉         | 11/114 [00:03<00:23,  4.32it/s][A
Training:  11%|█▏        | 13/114 [00:04<00:32,  3.13it/s][A
Training:  13%|█▎        | 15/114 [00:04<00:23,  4.20it/s][A
Training:  14%|█▍        | 16/114 [00:04<00:22,  4.28it/s][A
Training:  15%|█▍        | 17/114 [00:05<00:29,  3.28it/s][A
Training:  16%|█▌        | 18/114 [00:05<00:24,  3.90it/s][A
Training:  18%|█▊        | 20/114 [00:05<00:17,  5.38it/s][A
Training:  18%|█▊        | 21/114 [00:06<00:28,  3.29it/s][A
Training:  20%|██        | 23/114 [00:06<00:19,  4.65it/s][A
Training:  22%|██▏    

Epoch: 5/17 - Loss: 3.4672 - Accuracy: 0.9076



  0%|          | 0/15 [00:00<?, ?it/s][A
  7%|▋         | 1/15 [00:01<00:22,  1.61s/it][A
 33%|███▎      | 5/15 [00:02<00:04,  2.29it/s][A
 47%|████▋     | 7/15 [00:02<00:02,  3.42it/s][A
 60%|██████    | 9/15 [00:03<00:01,  3.15it/s][A
100%|██████████| 15/15 [00:04<00:00,  3.45it/s][A
Epochs:  29%|██▉       | 5/17 [02:28<05:56, 29.75s/it]

Val Loss: 2.9648 - Val Accuracy: 0.9241



Training:   0%|          | 0/114 [00:00<?, ?it/s][A
Training:   1%|          | 1/114 [00:01<02:30,  1.33s/it][A
Training:   4%|▎         | 4/114 [00:01<00:30,  3.55it/s][A
Training:   5%|▌         | 6/114 [00:02<00:39,  2.74it/s][A
Training:   7%|▋         | 8/114 [00:02<00:27,  3.81it/s][A
Training:   9%|▉         | 10/114 [00:03<00:28,  3.70it/s][A
Training:  11%|█         | 12/114 [00:03<00:20,  4.88it/s][A
Training:  11%|█▏        | 13/114 [00:03<00:25,  3.92it/s][A
Training:  12%|█▏        | 14/114 [00:03<00:22,  4.48it/s][A
Training:  13%|█▎        | 15/114 [00:04<00:19,  4.99it/s][A
Training:  14%|█▍        | 16/114 [00:04<00:18,  5.18it/s][A
Training:  15%|█▍        | 17/114 [00:04<00:26,  3.67it/s][A
Training:  17%|█▋        | 19/114 [00:04<00:18,  5.10it/s][A
Training:  18%|█▊        | 20/114 [00:05<00:18,  5.08it/s][A
Training:  18%|█▊        | 21/114 [00:05<00:24,  3.76it/s][A
Training:  19%|█▉        | 22/114 [00:05<00:20,  4.47it/s][A
Training:  21%|██   

Epoch: 6/17 - Loss: 4.1501 - Accuracy: 0.8983



  0%|          | 0/15 [00:00<?, ?it/s][A
  7%|▋         | 1/15 [00:01<00:17,  1.27s/it][A
 20%|██        | 3/15 [00:01<00:04,  2.61it/s][A
 33%|███▎      | 5/15 [00:02<00:03,  2.64it/s][A
 53%|█████▎    | 8/15 [00:02<00:01,  4.72it/s][A
 67%|██████▋   | 10/15 [00:03<00:01,  3.84it/s][A
100%|██████████| 15/15 [00:03<00:00,  3.97it/s][A
Epochs:  35%|███▌      | 6/17 [02:58<05:24, 29.53s/it]

Val Loss: 3.5254 - Val Accuracy: 0.5891



Training:   0%|          | 0/114 [00:00<?, ?it/s][A
Training:   1%|          | 1/114 [00:01<01:53,  1.00s/it][A
Training:   4%|▎         | 4/114 [00:01<00:24,  4.53it/s][A
Training:   5%|▌         | 6/114 [00:01<00:30,  3.58it/s][A
Training:   7%|▋         | 8/114 [00:02<00:21,  4.91it/s][A
Training:   9%|▉         | 10/114 [00:02<00:24,  4.26it/s][A
Training:  11%|█         | 12/114 [00:02<00:17,  5.71it/s][A
Training:  12%|█▏        | 14/114 [00:03<00:21,  4.75it/s][A
Training:  14%|█▍        | 16/114 [00:03<00:15,  6.22it/s][A
Training:  16%|█▌        | 18/114 [00:04<00:20,  4.61it/s][A
Training:  18%|█▊        | 20/114 [00:04<00:16,  5.66it/s][A
Training:  18%|█▊        | 21/114 [00:04<00:22,  4.10it/s][A
Training:  20%|██        | 23/114 [00:04<00:16,  5.51it/s][A
Training:  22%|██▏       | 25/114 [00:05<00:21,  4.17it/s][A
Training:  24%|██▎       | 27/114 [00:05<00:16,  5.32it/s][A
Training:  25%|██▌       | 29/114 [00:06<00:19,  4.37it/s][A
Training:  27%|██▋  

Epoch: 7/17 - Loss: 5.4089 - Accuracy: 0.8945



  0%|          | 0/15 [00:00<?, ?it/s][A
  7%|▋         | 1/15 [00:00<00:13,  1.03it/s][A
 33%|███▎      | 5/15 [00:01<00:02,  3.66it/s][A
 40%|████      | 6/15 [00:01<00:02,  4.16it/s][A
 60%|██████    | 9/15 [00:02<00:01,  4.17it/s][A
 67%|██████▋   | 10/15 [00:02<00:01,  4.64it/s][A
 87%|████████▋ | 13/15 [00:03<00:00,  4.84it/s][A
100%|██████████| 15/15 [00:03<00:00,  4.36it/s][A
Epochs:  41%|████      | 7/17 [03:24<04:46, 28.63s/it]

Val Loss: 3.5182 - Val Accuracy: 0.8934



Training:   0%|          | 0/114 [00:00<?, ?it/s][A
Training:   1%|          | 1/114 [00:01<02:06,  1.12s/it][A
Training:   4%|▍         | 5/114 [00:01<00:37,  2.88it/s][A
Training:   7%|▋         | 8/114 [00:02<00:21,  5.04it/s][A
Training:   9%|▉         | 10/114 [00:02<00:24,  4.29it/s][A
Training:  11%|█         | 12/114 [00:02<00:18,  5.37it/s][A
Training:  12%|█▏        | 14/114 [00:03<00:21,  4.70it/s][A
Training:  15%|█▍        | 17/114 [00:04<00:24,  4.00it/s][A
Training:  17%|█▋        | 19/114 [00:04<00:19,  4.92it/s][A
Training:  18%|█▊        | 21/114 [00:04<00:20,  4.56it/s][A
Training:  21%|██        | 24/114 [00:05<00:13,  6.43it/s][A
Training:  23%|██▎       | 26/114 [00:05<00:19,  4.55it/s][A
Training:  25%|██▍       | 28/114 [00:06<00:15,  5.69it/s][A
Training:  26%|██▋       | 30/114 [00:06<00:18,  4.42it/s][A
Training:  27%|██▋       | 31/114 [00:06<00:17,  4.76it/s][A
Training:  29%|██▉       | 33/114 [00:07<00:19,  4.21it/s][A
Training:  30%|██▉ 

Epoch: 8/17 - Loss: 5.9712 - Accuracy: 0.8896



  0%|          | 0/15 [00:00<?, ?it/s][A
  7%|▋         | 1/15 [00:01<00:17,  1.26s/it][A
 20%|██        | 3/15 [00:01<00:04,  2.74it/s][A
 33%|███▎      | 5/15 [00:02<00:03,  2.83it/s][A
 60%|██████    | 9/15 [00:02<00:01,  3.92it/s][A
100%|██████████| 15/15 [00:03<00:00,  4.03it/s][A
Epochs:  47%|████▋     | 8/17 [03:52<04:16, 28.47s/it]

Val Loss: 8.4299 - Val Accuracy: 0.9223



Training:   0%|          | 0/114 [00:00<?, ?it/s][A
Training:   1%|          | 1/114 [00:01<02:32,  1.35s/it][A
Training:   3%|▎         | 3/114 [00:01<00:45,  2.44it/s][A
Training:   4%|▍         | 5/114 [00:02<00:40,  2.67it/s][A
Training:   6%|▌         | 7/114 [00:02<00:25,  4.17it/s][A
Training:   8%|▊         | 9/114 [00:02<00:27,  3.77it/s][A
Training:  10%|▉         | 11/114 [00:03<00:19,  5.15it/s][A
Training:  11%|█▏        | 13/114 [00:03<00:25,  3.96it/s][A
Training:  13%|█▎        | 15/114 [00:04<00:21,  4.71it/s][A
Training:  15%|█▍        | 17/114 [00:04<00:23,  4.11it/s][A
Training:  17%|█▋        | 19/114 [00:04<00:20,  4.58it/s][A
Training:  18%|█▊        | 21/114 [00:05<00:20,  4.62it/s][A
Training:  20%|██        | 23/114 [00:05<00:20,  4.53it/s][A
Training:  22%|██▏       | 25/114 [00:06<00:19,  4.54it/s][A
Training:  24%|██▎       | 27/114 [00:06<00:20,  4.27it/s][A
Training:  25%|██▌       | 29/114 [00:07<00:17,  4.86it/s][A
Training:  26%|██▋   

Epoch: 9/17 - Loss: 12.6010 - Accuracy: 0.8711



  0%|          | 0/15 [00:00<?, ?it/s][A
  7%|▋         | 1/15 [00:01<00:18,  1.29s/it][A
 20%|██        | 3/15 [00:01<00:04,  2.63it/s][A
 33%|███▎      | 5/15 [00:02<00:03,  2.64it/s][A
 47%|████▋     | 7/15 [00:02<00:01,  4.14it/s][A
 60%|██████    | 9/15 [00:02<00:01,  3.83it/s][A
 73%|███████▎  | 11/15 [00:03<00:00,  4.73it/s][A
100%|██████████| 15/15 [00:03<00:00,  3.94it/s][A
Epochs:  53%|█████▎    | 9/17 [04:22<03:50, 28.87s/it]

Val Loss: 33.0737 - Val Accuracy: 0.6736



Training:   0%|          | 0/114 [00:00<?, ?it/s][A
Training:   1%|          | 1/114 [00:01<02:13,  1.18s/it][A
Training:   2%|▏         | 2/114 [00:01<01:03,  1.76it/s][A
Training:   4%|▎         | 4/114 [00:01<00:27,  3.98it/s][A
Training:   4%|▍         | 5/114 [00:02<00:37,  2.87it/s][A
Training:   5%|▌         | 6/114 [00:02<00:31,  3.47it/s][A
Training:   8%|▊         | 9/114 [00:02<00:27,  3.88it/s][A
Training:  10%|▉         | 11/114 [00:03<00:19,  5.23it/s][A
Training:  11%|█▏        | 13/114 [00:03<00:24,  4.07it/s][A
Training:  13%|█▎        | 15/114 [00:03<00:18,  5.38it/s][A
Training:  15%|█▍        | 17/114 [00:04<00:24,  3.99it/s][A
Training:  17%|█▋        | 19/114 [00:04<00:18,  5.13it/s][A
Training:  18%|█▊        | 21/114 [00:05<00:24,  3.82it/s][A
Training:  19%|█▉        | 22/114 [00:05<00:22,  4.12it/s][A
Training:  20%|██        | 23/114 [00:05<00:19,  4.67it/s][A
Training:  22%|██▏       | 25/114 [00:06<00:21,  4.19it/s][A
Training:  23%|██▎    

Epoch: 10/17 - Loss: 8.8986 - Accuracy: 0.8909



  0%|          | 0/15 [00:00<?, ?it/s][A
  7%|▋         | 1/15 [00:01<00:18,  1.33s/it][A
 20%|██        | 3/15 [00:01<00:04,  2.59it/s][A
 33%|███▎      | 5/15 [00:02<00:03,  2.76it/s][A
 47%|████▋     | 7/15 [00:02<00:01,  4.32it/s][A
 60%|██████    | 9/15 [00:02<00:01,  3.66it/s][A
 80%|████████  | 12/15 [00:03<00:00,  5.90it/s][A
100%|██████████| 15/15 [00:03<00:00,  4.11it/s][A
Epochs:  59%|█████▉    | 10/17 [04:52<03:23, 29.06s/it]

Val Loss: 3.5411 - Val Accuracy: 0.9236



Training:   0%|          | 0/114 [00:00<?, ?it/s][A
Training:   1%|          | 1/114 [00:01<02:13,  1.18s/it][A
Training:   4%|▎         | 4/114 [00:01<00:28,  3.82it/s][A
Training:   5%|▌         | 6/114 [00:01<00:27,  3.89it/s][A
Training:   8%|▊         | 9/114 [00:02<00:26,  3.93it/s][A
Training:  10%|▉         | 11/114 [00:02<00:20,  5.06it/s][A
Training:  11%|█▏        | 13/114 [00:03<00:23,  4.35it/s][A
Training:  12%|█▏        | 14/114 [00:03<00:20,  4.79it/s][A
Training:  15%|█▍        | 17/114 [00:04<00:19,  4.85it/s][A
Training:  16%|█▌        | 18/114 [00:04<00:18,  5.29it/s][A
Training:  17%|█▋        | 19/114 [00:04<00:18,  5.22it/s][A
Training:  18%|█▊        | 21/114 [00:04<00:21,  4.31it/s][A
Training:  19%|█▉        | 22/114 [00:05<00:19,  4.77it/s][A
Training:  20%|██        | 23/114 [00:05<00:18,  5.00it/s][A
Training:  22%|██▏       | 25/114 [00:05<00:19,  4.49it/s][A
Training:  24%|██▎       | 27/114 [00:05<00:14,  5.97it/s][A
Training:  25%|██▌  

Epoch: 11/17 - Loss: 11.2609 - Accuracy: 0.8939



  0%|          | 0/15 [00:00<?, ?it/s][A
  7%|▋         | 1/15 [00:01<00:18,  1.29s/it][A
 20%|██        | 3/15 [00:01<00:04,  2.66it/s][A
 33%|███▎      | 5/15 [00:02<00:03,  2.77it/s][A
 60%|██████    | 9/15 [00:02<00:01,  3.69it/s][A
 80%|████████  | 12/15 [00:03<00:00,  5.54it/s][A
100%|██████████| 15/15 [00:03<00:00,  3.75it/s][A
Epochs:  65%|██████▍   | 11/17 [05:21<02:55, 29.20s/it]

Val Loss: 11.2421 - Val Accuracy: 0.8672



Training:   0%|          | 0/114 [00:00<?, ?it/s][A
Training:   1%|          | 1/114 [00:01<02:49,  1.50s/it][A
Training:   4%|▎         | 4/114 [00:01<00:34,  3.16it/s][A
Training:   5%|▌         | 6/114 [00:02<00:31,  3.38it/s][A
Training:   8%|▊         | 9/114 [00:02<00:28,  3.67it/s][A
Training:  11%|█▏        | 13/114 [00:03<00:27,  3.73it/s][A
Training:  13%|█▎        | 15/114 [00:04<00:21,  4.70it/s][A
Training:  15%|█▍        | 17/114 [00:04<00:26,  3.63it/s][A
Training:  17%|█▋        | 19/114 [00:05<00:21,  4.41it/s][A
Training:  18%|█▊        | 21/114 [00:05<00:25,  3.67it/s][A
Training:  20%|██        | 23/114 [00:06<00:19,  4.68it/s][A
Training:  22%|██▏       | 25/114 [00:06<00:23,  3.86it/s][A
Training:  25%|██▍       | 28/114 [00:06<00:15,  5.62it/s][A
Training:  26%|██▋       | 30/114 [00:07<00:19,  4.39it/s][A
Training:  28%|██▊       | 32/114 [00:07<00:14,  5.49it/s][A
Training:  30%|██▉       | 34/114 [00:08<00:17,  4.45it/s][A
Training:  32%|███▏ 

Epoch: 12/17 - Loss: 6.3388 - Accuracy: 0.8991



  0%|          | 0/15 [00:00<?, ?it/s][A
  7%|▋         | 1/15 [00:01<00:19,  1.40s/it][A
 13%|█▎        | 2/15 [00:01<00:08,  1.47it/s][A
 33%|███▎      | 5/15 [00:02<00:03,  3.02it/s][A
 40%|████      | 6/15 [00:02<00:02,  3.56it/s][A
 60%|██████    | 9/15 [00:02<00:01,  4.16it/s][A
 67%|██████▋   | 10/15 [00:03<00:01,  4.67it/s][A
 87%|████████▋ | 13/15 [00:03<00:00,  5.02it/s][A
100%|██████████| 15/15 [00:03<00:00,  3.96it/s][A
Epochs:  71%|███████   | 12/17 [05:51<02:27, 29.47s/it]

Val Loss: 4.4869 - Val Accuracy: 0.9308



Training:   0%|          | 0/114 [00:00<?, ?it/s][A
Training:   1%|          | 1/114 [00:01<03:11,  1.70s/it][A
Training:   3%|▎         | 3/114 [00:01<00:53,  2.08it/s][A
Training:   4%|▍         | 5/114 [00:02<00:40,  2.66it/s][A
Training:   6%|▌         | 7/114 [00:02<00:25,  4.19it/s][A
Training:   8%|▊         | 9/114 [00:03<00:30,  3.48it/s][A
Training:  10%|▉         | 11/114 [00:03<00:21,  4.83it/s][A
Training:  11%|█▏        | 13/114 [00:03<00:24,  4.10it/s][A
Training:  15%|█▍        | 17/114 [00:04<00:20,  4.63it/s][A
Training:  17%|█▋        | 19/114 [00:04<00:16,  5.60it/s][A
Training:  18%|█▊        | 21/114 [00:05<00:20,  4.53it/s][A
Training:  20%|██        | 23/114 [00:05<00:15,  5.75it/s][A
Training:  22%|██▏       | 25/114 [00:06<00:21,  4.21it/s][A
Training:  24%|██▎       | 27/114 [00:06<00:16,  5.43it/s][A
Training:  25%|██▌       | 29/114 [00:07<00:20,  4.11it/s][A
Training:  26%|██▋       | 30/114 [00:07<00:18,  4.50it/s][A
Training:  28%|██▊   

Epoch: 13/17 - Loss: 12.6209 - Accuracy: 0.8893



  0%|          | 0/15 [00:00<?, ?it/s][A
  7%|▋         | 1/15 [00:01<00:19,  1.41s/it][A
 20%|██        | 3/15 [00:01<00:05,  2.40it/s][A
 33%|███▎      | 5/15 [00:02<00:03,  2.53it/s][A
 40%|████      | 6/15 [00:02<00:02,  3.05it/s][A
 53%|█████▎    | 8/15 [00:02<00:01,  4.81it/s][A
 67%|██████▋   | 10/15 [00:03<00:01,  3.31it/s][A
 87%|████████▋ | 13/15 [00:03<00:00,  4.10it/s][A
100%|██████████| 15/15 [00:04<00:00,  3.53it/s][A
Epochs:  76%|███████▋  | 13/17 [06:21<01:58, 29.60s/it]

Val Loss: 11.4038 - Val Accuracy: 0.8921



Training:   0%|          | 0/114 [00:00<?, ?it/s][A
Training:   1%|          | 1/114 [00:01<02:12,  1.17s/it][A
Training:   2%|▏         | 2/114 [00:01<01:01,  1.81it/s][A
Training:   4%|▎         | 4/114 [00:01<00:26,  4.17it/s][A
Training:   5%|▌         | 6/114 [00:02<00:30,  3.59it/s][A
Training:   7%|▋         | 8/114 [00:02<00:20,  5.08it/s][A
Training:   8%|▊         | 9/114 [00:02<00:29,  3.57it/s][A
Training:  10%|▉         | 11/114 [00:02<00:20,  5.14it/s][A
Training:  11%|█▏        | 13/114 [00:03<00:26,  3.78it/s][A
Training:  14%|█▍        | 16/114 [00:03<00:18,  5.25it/s][A
Training:  15%|█▍        | 17/114 [00:04<00:24,  3.89it/s][A
Training:  17%|█▋        | 19/114 [00:04<00:18,  5.13it/s][A
Training:  18%|█▊        | 20/114 [00:04<00:17,  5.44it/s][A
Training:  18%|█▊        | 21/114 [00:05<00:25,  3.67it/s][A
Training:  20%|██        | 23/114 [00:05<00:17,  5.22it/s][A
Training:  22%|██▏       | 25/114 [00:06<00:21,  4.14it/s][A
Training:  24%|██▎    

Epoch: 14/17 - Loss: 17.1170 - Accuracy: 0.8829



  0%|          | 0/15 [00:00<?, ?it/s][A
  7%|▋         | 1/15 [00:01<00:20,  1.49s/it][A
 13%|█▎        | 2/15 [00:01<00:09,  1.38it/s][A
 33%|███▎      | 5/15 [00:02<00:03,  2.88it/s][A
 40%|████      | 6/15 [00:02<00:02,  3.21it/s][A
 60%|██████    | 9/15 [00:03<00:01,  3.97it/s][A
 67%|██████▋   | 10/15 [00:03<00:01,  4.37it/s][A
 80%|████████  | 12/15 [00:03<00:00,  5.75it/s][A
 87%|████████▋ | 13/15 [00:03<00:00,  4.27it/s][A
100%|██████████| 15/15 [00:04<00:00,  3.52it/s][A
Epochs:  82%|████████▏ | 14/17 [06:51<01:29, 29.69s/it]

Val Loss: 40.6657 - Val Accuracy: 0.9158



Training:   0%|          | 0/114 [00:00<?, ?it/s][A
Training:   1%|          | 1/114 [00:01<02:25,  1.29s/it][A
Training:   3%|▎         | 3/114 [00:01<00:41,  2.67it/s][A
Training:   4%|▍         | 5/114 [00:01<00:34,  3.14it/s][A
Training:   6%|▌         | 7/114 [00:02<00:21,  4.87it/s][A
Training:   8%|▊         | 9/114 [00:02<00:23,  4.41it/s][A
Training:  10%|▉         | 11/114 [00:02<00:20,  5.05it/s][A
Training:  11%|█         | 12/114 [00:02<00:18,  5.50it/s][A
Training:  11%|█▏        | 13/114 [00:03<00:21,  4.79it/s][A
Training:  13%|█▎        | 15/114 [00:03<00:22,  4.42it/s][A
Training:  15%|█▍        | 17/114 [00:04<00:19,  4.85it/s][A
Training:  16%|█▌        | 18/114 [00:04<00:17,  5.39it/s][A
Training:  17%|█▋        | 19/114 [00:04<00:19,  4.77it/s][A
Training:  18%|█▊        | 20/114 [00:04<00:17,  5.38it/s][A
Training:  18%|█▊        | 21/114 [00:05<00:21,  4.30it/s][A
Training:  19%|█▉        | 22/114 [00:05<00:19,  4.75it/s][A
Training:  20%|██    

Epoch: 15/17 - Loss: 14.2045 - Accuracy: 0.9024



  0%|          | 0/15 [00:00<?, ?it/s][A
  7%|▋         | 1/15 [00:01<00:14,  1.05s/it][A
 13%|█▎        | 2/15 [00:01<00:07,  1.84it/s][A
 33%|███▎      | 5/15 [00:01<00:02,  3.39it/s][A
 40%|████      | 6/15 [00:01<00:02,  3.85it/s][A
 47%|████▋     | 7/15 [00:02<00:01,  4.48it/s][A
 60%|██████    | 9/15 [00:02<00:01,  4.01it/s][A
 67%|██████▋   | 10/15 [00:02<00:01,  4.07it/s][A
 73%|███████▎  | 11/15 [00:03<00:00,  4.76it/s][A
 87%|████████▋ | 13/15 [00:03<00:00,  4.21it/s][A
100%|██████████| 15/15 [00:03<00:00,  3.89it/s][A
Epochs:  88%|████████▊ | 15/17 [07:20<00:58, 29.35s/it]

Val Loss: 9.6712 - Val Accuracy: 0.8932



Training:   0%|          | 0/114 [00:00<?, ?it/s][A
Training:   1%|          | 1/114 [00:01<02:18,  1.23s/it][A
Training:   3%|▎         | 3/114 [00:01<00:39,  2.79it/s][A
Training:   4%|▍         | 5/114 [00:01<00:36,  2.98it/s][A
Training:   7%|▋         | 8/114 [00:02<00:19,  5.51it/s][A
Training:   9%|▉         | 10/114 [00:02<00:27,  3.84it/s][A
Training:  11%|█▏        | 13/114 [00:03<00:23,  4.27it/s][A
Training:  13%|█▎        | 15/114 [00:03<00:18,  5.30it/s][A
Training:  14%|█▍        | 16/114 [00:03<00:17,  5.46it/s][A
Training:  15%|█▍        | 17/114 [00:04<00:23,  4.09it/s][A
Training:  17%|█▋        | 19/114 [00:04<00:16,  5.60it/s][A
Training:  18%|█▊        | 20/114 [00:04<00:18,  4.97it/s][A
Training:  18%|█▊        | 21/114 [00:05<00:24,  3.78it/s][A
Training:  20%|██        | 23/114 [00:05<00:17,  5.08it/s][A
Training:  21%|██        | 24/114 [00:05<00:18,  4.91it/s][A
Training:  22%|██▏       | 25/114 [00:05<00:19,  4.59it/s][A
Training:  24%|██▎  

Epoch: 16/17 - Loss: 28.6940 - Accuracy: 0.8806



  0%|          | 0/15 [00:00<?, ?it/s][A
  7%|▋         | 1/15 [00:01<00:16,  1.20s/it][A
 13%|█▎        | 2/15 [00:01<00:07,  1.64it/s][A
 33%|███▎      | 5/15 [00:02<00:03,  3.03it/s][A
 40%|████      | 6/15 [00:02<00:02,  3.32it/s][A
 60%|██████    | 9/15 [00:02<00:01,  4.46it/s][A
 67%|██████▋   | 10/15 [00:03<00:01,  3.87it/s][A
 80%|████████  | 12/15 [00:03<00:00,  5.44it/s][A
 87%|████████▋ | 13/15 [00:03<00:00,  5.09it/s][A
100%|██████████| 15/15 [00:03<00:00,  3.76it/s][A
Epochs:  94%|█████████▍| 16/17 [07:49<00:29, 29.26s/it]

Val Loss: 12.1382 - Val Accuracy: 0.9125



Training:   0%|          | 0/114 [00:00<?, ?it/s][A
Training:   1%|          | 1/114 [00:01<02:20,  1.25s/it][A
Training:   3%|▎         | 3/114 [00:01<00:41,  2.71it/s][A
Training:   4%|▍         | 5/114 [00:01<00:33,  3.23it/s][A
Training:   6%|▌         | 7/114 [00:02<00:22,  4.68it/s][A
Training:   8%|▊         | 9/114 [00:02<00:24,  4.26it/s][A
Training:   9%|▉         | 10/114 [00:02<00:22,  4.64it/s][A
Training:  11%|█▏        | 13/114 [00:03<00:19,  5.19it/s][A
Training:  12%|█▏        | 14/114 [00:03<00:18,  5.30it/s][A
Training:  14%|█▍        | 16/114 [00:03<00:14,  6.94it/s][A
Training:  15%|█▍        | 17/114 [00:04<00:21,  4.49it/s][A
Training:  17%|█▋        | 19/114 [00:04<00:17,  5.54it/s][A
Training:  18%|█▊        | 21/114 [00:04<00:20,  4.47it/s][A
Training:  20%|██        | 23/114 [00:05<00:15,  5.88it/s][A
Training:  22%|██▏       | 25/114 [00:05<00:18,  4.84it/s][A
Training:  24%|██▎       | 27/114 [00:05<00:13,  6.25it/s][A
Training:  25%|██▌   

Epoch: 17/17 - Loss: 10.0227 - Accuracy: 0.9042



  0%|          | 0/15 [00:00<?, ?it/s][A
  7%|▋         | 1/15 [00:01<00:16,  1.20s/it][A
 27%|██▋       | 4/15 [00:01<00:03,  3.42it/s][A
 33%|███▎      | 5/15 [00:02<00:03,  2.74it/s][A
 53%|█████▎    | 8/15 [00:02<00:01,  4.92it/s][A
 60%|██████    | 9/15 [00:02<00:01,  3.50it/s][A
 80%|████████  | 12/15 [00:02<00:00,  5.56it/s][A
100%|██████████| 15/15 [00:03<00:00,  4.03it/s][A
Epochs: 100%|██████████| 17/17 [08:16<00:00, 29.23s/it]


Val Loss: 11.4858 - Val Accuracy: 0.9207
Saving best model...


[32m[I 2023-12-14 22:24:40,663][0m Trial 0 finished with value: 0.9206787347793579 and parameters: {'loss_learning_rate': 0.0005376476220126488, 'learning_rate': 0.0951473049247803, 'weight_decay': 0.005325118649485834, 'epsilon': 1.5452523761763e-09, 'batch_size': 123, 'epochs': 17}. Best is trial 0 with value: 0.9206787347793579.[0m


Learning rate for Loss: 0.0017350666898728663
Learning rate: 0.008226302275945433
Weight decay: 0.0019297756421957702
Epsilon: 1.7694055881118126e-09
Batch size: 67
Number of epochs: 46


Epochs:   0%|          | 0/46 [00:00<?, ?it/s]
Training:   0%|          | 0/209 [00:00<?, ?it/s][A
Training:   0%|          | 1/209 [00:00<02:57,  1.17it/s][A
Training:   2%|▏         | 4/209 [00:00<00:38,  5.26it/s][A
Training:   3%|▎         | 6/209 [00:01<00:36,  5.52it/s][A
Training:   4%|▍         | 9/209 [00:01<00:31,  6.38it/s][A
Training:   6%|▌         | 13/209 [00:02<00:26,  7.51it/s][A
Training:   7%|▋         | 15/209 [00:02<00:21,  8.85it/s][A
Training:   8%|▊         | 17/209 [00:02<00:23,  8.19it/s][A
Training:   9%|▉         | 19/209 [00:02<00:19,  9.58it/s][A
Training:  10%|█         | 21/209 [00:03<00:24,  7.82it/s][A
Training:  11%|█▏        | 24/209 [00:03<00:17, 10.72it/s][A
Training:  12%|█▏        | 26/209 [00:03<00:20,  8.92it/s][A
Training:  13%|█▎        | 28/209 [00:03<00:20,  8.99it/s][A
Training:  14%|█▍        | 30/209 [00:03<00:21,  8.25it/s][A
Training:  15%|█▌        | 32/209 [00:04<00:19,  9.01it/s][A
Training:  16%|█▋        | 34/209 [0

Epoch: 1/46 - Loss: 5.0967 - Accuracy: 0.8541



  0%|          | 0/27 [00:00<?, ?it/s][A
  4%|▎         | 1/27 [00:01<00:27,  1.05s/it][A
 19%|█▊        | 5/27 [00:01<00:04,  4.46it/s][A
 33%|███▎      | 9/27 [00:01<00:02,  6.07it/s][A
 48%|████▊     | 13/27 [00:02<00:01,  7.48it/s][A
 56%|█████▌    | 15/27 [00:02<00:01,  8.42it/s][A
 63%|██████▎   | 17/27 [00:02<00:01,  8.21it/s][A
 70%|███████   | 19/27 [00:02<00:00,  8.95it/s][A
 78%|███████▊  | 21/27 [00:03<00:00,  8.19it/s][A
100%|██████████| 27/27 [00:03<00:00,  7.36it/s][A
Epochs:   2%|▏         | 1/46 [00:27<20:43, 27.63s/it]

Val Loss: 2.7249 - Val Accuracy: 0.8992



Training:   0%|          | 0/209 [00:00<?, ?it/s][A
Training:   0%|          | 1/209 [00:00<03:08,  1.11it/s][A
Training:   1%|▏         | 3/209 [00:01<00:57,  3.60it/s][A
Training:   2%|▏         | 5/209 [00:01<00:45,  4.50it/s][A
Training:   3%|▎         | 7/209 [00:01<00:31,  6.51it/s][A
Training:   4%|▍         | 9/209 [00:01<00:28,  7.11it/s][A
Training:   5%|▌         | 11/209 [00:01<00:25,  7.76it/s][A
Training:   6%|▌         | 13/209 [00:02<00:25,  7.79it/s][A
Training:   7%|▋         | 15/209 [00:02<00:21,  9.19it/s][A
Training:   8%|▊         | 17/209 [00:02<00:22,  8.36it/s][A
Training:  10%|█         | 21/209 [00:02<00:19,  9.79it/s][A
Training:  11%|█         | 23/209 [00:03<00:17, 10.80it/s][A
Training:  12%|█▏        | 25/209 [00:03<00:18,  9.87it/s][A
Training:  13%|█▎        | 27/209 [00:03<00:17, 10.14it/s][A
Training:  14%|█▍        | 29/209 [00:03<00:19,  9.29it/s][A
Training:  15%|█▍        | 31/209 [00:03<00:18,  9.41it/s][A
Training:  16%|█▌    

Epoch: 2/46 - Loss: 3.1399 - Accuracy: 0.9229



  0%|          | 0/27 [00:00<?, ?it/s][A
  4%|▎         | 1/27 [00:00<00:17,  1.50it/s][A
 15%|█▍        | 4/27 [00:00<00:03,  6.37it/s][A
 22%|██▏       | 6/27 [00:01<00:02,  7.34it/s][A
 30%|██▉       | 8/27 [00:01<00:01,  9.62it/s][A
 37%|███▋      | 10/27 [00:01<00:02,  7.91it/s][A
 48%|████▊     | 13/27 [00:01<00:02,  6.96it/s][A
 63%|██████▎   | 17/27 [00:02<00:01,  7.30it/s][A
 78%|███████▊  | 21/27 [00:02<00:00,  8.08it/s][A
100%|██████████| 27/27 [00:03<00:00,  8.16it/s][A
Epochs:   4%|▍         | 2/46 [00:54<20:00, 27.28s/it]

Val Loss: 3.7877 - Val Accuracy: 0.8970



Training:   0%|          | 0/209 [00:00<?, ?it/s][A
Training:   0%|          | 1/209 [00:00<02:31,  1.37it/s][A
Training:   2%|▏         | 5/209 [00:01<00:40,  5.09it/s][A
Training:   4%|▍         | 8/209 [00:01<00:24,  8.28it/s][A
Training:   5%|▍         | 10/209 [00:01<00:25,  7.83it/s][A
Training:   6%|▌         | 13/209 [00:01<00:23,  8.21it/s][A
Training:   7%|▋         | 15/209 [00:02<00:21,  8.89it/s][A
Training:   8%|▊         | 17/209 [00:02<00:23,  8.32it/s][A
Training:   9%|▉         | 19/209 [00:02<00:22,  8.42it/s][A
Training:  10%|█         | 21/209 [00:02<00:20,  9.35it/s][A
Training:  11%|█         | 23/209 [00:03<00:23,  7.80it/s][A
Training:  12%|█▏        | 25/209 [00:03<00:20,  9.01it/s][A
Training:  13%|█▎        | 27/209 [00:03<00:21,  8.41it/s][A
Training:  14%|█▍        | 29/209 [00:03<00:19,  9.45it/s][A
Training:  15%|█▍        | 31/209 [00:03<00:20,  8.71it/s][A
Training:  16%|█▋        | 34/209 [00:04<00:17,  9.89it/s][A
Training:  17%|█▋  

Epoch: 3/46 - Loss: 2.7915 - Accuracy: 0.9194



  0%|          | 0/27 [00:00<?, ?it/s][A
  4%|▎         | 1/27 [00:00<00:21,  1.21it/s][A
 15%|█▍        | 4/27 [00:00<00:04,  5.32it/s][A
 22%|██▏       | 6/27 [00:01<00:03,  5.48it/s][A
 30%|██▉       | 8/27 [00:01<00:02,  7.55it/s][A
 37%|███▋      | 10/27 [00:01<00:02,  7.11it/s][A
 44%|████▍     | 12/27 [00:01<00:01,  8.29it/s][A
 52%|█████▏    | 14/27 [00:02<00:01,  8.61it/s][A
 59%|█████▉    | 16/27 [00:02<00:01,  8.56it/s][A
 67%|██████▋   | 18/27 [00:02<00:00,  9.22it/s][A
 74%|███████▍  | 20/27 [00:02<00:00,  8.61it/s][A
 78%|███████▊  | 21/27 [00:02<00:00,  8.40it/s][A
 85%|████████▌ | 23/27 [00:03<00:00,  9.13it/s][A
 89%|████████▉ | 24/27 [00:03<00:00,  8.61it/s][A
100%|██████████| 27/27 [00:03<00:00,  7.75it/s][A
Epochs:   7%|▋         | 3/46 [01:22<19:36, 27.37s/it]

Val Loss: 3.0126 - Val Accuracy: 0.9047



Training:   0%|          | 0/209 [00:00<?, ?it/s][A
Training:   0%|          | 1/209 [00:00<02:33,  1.36it/s][A
Training:   2%|▏         | 4/209 [00:00<00:35,  5.79it/s][A
Training:   3%|▎         | 6/209 [00:01<00:36,  5.55it/s][A
Training:   4%|▍         | 9/209 [00:01<00:25,  7.86it/s][A
Training:   5%|▌         | 11/209 [00:01<00:21,  9.12it/s][A
Training:   6%|▌         | 13/209 [00:01<00:21,  9.21it/s][A
Training:   7%|▋         | 15/209 [00:02<00:20,  9.51it/s][A
Training:   8%|▊         | 17/209 [00:02<00:20,  9.49it/s][A
Training:   9%|▉         | 19/209 [00:02<00:19,  9.71it/s][A
Training:  10%|█         | 21/209 [00:02<00:20,  9.27it/s][A
Training:  11%|█         | 22/209 [00:02<00:20,  9.08it/s][A
Training:  11%|█▏        | 24/209 [00:02<00:18,  9.93it/s][A
Training:  12%|█▏        | 26/209 [00:03<00:20,  8.78it/s][A
Training:  13%|█▎        | 28/209 [00:03<00:18, 10.05it/s][A
Training:  14%|█▍        | 30/209 [00:03<00:20,  8.59it/s][A
Training:  15%|█▌   

Epoch: 4/46 - Loss: 2.5351 - Accuracy: 0.9266



  0%|          | 0/27 [00:00<?, ?it/s][A
  4%|▎         | 1/27 [00:00<00:23,  1.09it/s][A
  7%|▋         | 2/27 [00:01<00:12,  1.93it/s][A
 19%|█▊        | 5/27 [00:01<00:04,  4.75it/s][A
 22%|██▏       | 6/27 [00:01<00:04,  4.68it/s][A
 33%|███▎      | 9/27 [00:01<00:02,  6.90it/s][A
 37%|███▋      | 10/27 [00:02<00:02,  5.71it/s][A
 48%|████▊     | 13/27 [00:02<00:01,  7.64it/s][A
 52%|█████▏    | 14/27 [00:02<00:02,  6.45it/s][A
 63%|██████▎   | 17/27 [00:02<00:01,  9.23it/s][A
 70%|███████   | 19/27 [00:03<00:00,  8.55it/s][A
 78%|███████▊  | 21/27 [00:03<00:00,  7.98it/s][A
 81%|████████▏ | 22/27 [00:03<00:00,  7.62it/s][A
 93%|█████████▎| 25/27 [00:03<00:00,  9.13it/s][A
100%|██████████| 27/27 [00:04<00:00,  6.59it/s][A
Epochs:   9%|▊         | 4/46 [01:50<19:21, 27.65s/it]

Val Loss: 2.5211 - Val Accuracy: 0.9331



Training:   0%|          | 0/209 [00:00<?, ?it/s][A
Training:   0%|          | 1/209 [00:00<02:59,  1.16it/s][A
Training:   2%|▏         | 4/209 [00:01<00:40,  5.04it/s][A
Training:   3%|▎         | 6/209 [00:01<00:34,  5.87it/s][A
Training:   4%|▍         | 8/209 [00:01<00:24,  8.05it/s][A
Training:   5%|▍         | 10/209 [00:01<00:27,  7.23it/s][A
Training:   6%|▌         | 13/209 [00:02<00:28,  6.86it/s][A
Training:   8%|▊         | 17/209 [00:02<00:26,  7.35it/s][A
Training:  10%|▉         | 20/209 [00:02<00:19,  9.65it/s][A
Training:  11%|█         | 22/209 [00:03<00:23,  8.06it/s][A
Training:  12%|█▏        | 25/209 [00:03<00:22,  8.28it/s][A
Training:  13%|█▎        | 27/209 [00:03<00:19,  9.57it/s][A
Training:  14%|█▍        | 29/209 [00:03<00:21,  8.32it/s][A
Training:  15%|█▍        | 31/209 [00:04<00:18,  9.84it/s][A
Training:  16%|█▌        | 33/209 [00:04<00:20,  8.61it/s][A
Training:  17%|█▋        | 36/209 [00:04<00:15, 11.42it/s][A
Training:  18%|█▊   

Epoch: 5/46 - Loss: 2.6262 - Accuracy: 0.9200



  0%|          | 0/27 [00:00<?, ?it/s][A
  4%|▎         | 1/27 [00:00<00:19,  1.34it/s][A
  7%|▋         | 2/27 [00:00<00:09,  2.51it/s][A
 19%|█▊        | 5/27 [00:01<00:04,  5.46it/s][A
 22%|██▏       | 6/27 [00:01<00:03,  5.26it/s][A
 33%|███▎      | 9/27 [00:01<00:02,  7.39it/s][A
 37%|███▋      | 10/27 [00:01<00:02,  6.28it/s][A
 48%|████▊     | 13/27 [00:02<00:01,  8.50it/s][A
 52%|█████▏    | 14/27 [00:02<00:01,  7.27it/s][A
 63%|██████▎   | 17/27 [00:02<00:01,  9.31it/s][A
 67%|██████▋   | 18/27 [00:02<00:01,  7.49it/s][A
 78%|███████▊  | 21/27 [00:03<00:00,  9.61it/s][A
 85%|████████▌ | 23/27 [00:03<00:00,  8.66it/s][A
 93%|█████████▎| 25/27 [00:03<00:00,  8.16it/s][A
100%|██████████| 27/27 [00:03<00:00,  6.97it/s][A
Epochs:  11%|█         | 5/46 [02:17<18:54, 27.67s/it]

Val Loss: 3.4530 - Val Accuracy: 0.8817



Training:   0%|          | 0/209 [00:00<?, ?it/s][A
Training:   0%|          | 1/209 [00:00<03:20,  1.04it/s][A
Training:   1%|          | 2/209 [00:01<01:46,  1.95it/s][A
Training:   2%|▏         | 4/209 [00:01<00:46,  4.43it/s][A
Training:   3%|▎         | 6/209 [00:01<00:51,  3.97it/s][A
Training:   4%|▍         | 9/209 [00:01<00:29,  6.83it/s][A
Training:   5%|▌         | 11/209 [00:02<00:35,  5.50it/s][A
Training:   7%|▋         | 14/209 [00:02<00:34,  5.67it/s][A
Training:   8%|▊         | 16/209 [00:03<00:28,  6.88it/s][A
Training:   9%|▊         | 18/209 [00:03<00:29,  6.41it/s][A
Training:  10%|▉         | 20/209 [00:03<00:24,  7.84it/s][A
Training:  11%|█         | 22/209 [00:03<00:25,  7.29it/s][A
Training:  11%|█▏        | 24/209 [00:04<00:21,  8.62it/s][A
Training:  12%|█▏        | 26/209 [00:04<00:23,  7.75it/s][A
Training:  14%|█▍        | 29/209 [00:04<00:18,  9.70it/s][A
Training:  15%|█▍        | 31/209 [00:04<00:21,  8.34it/s][A
Training:  16%|█▌    

Epoch: 6/46 - Loss: 2.7023 - Accuracy: 0.9203



  0%|          | 0/27 [00:00<?, ?it/s][A
  4%|▎         | 1/27 [00:00<00:24,  1.04it/s][A
 15%|█▍        | 4/27 [00:01<00:04,  4.74it/s][A
 22%|██▏       | 6/27 [00:01<00:04,  4.92it/s][A
 33%|███▎      | 9/27 [00:02<00:03,  5.16it/s][A
 48%|████▊     | 13/27 [00:02<00:02,  5.86it/s][A
 63%|██████▎   | 17/27 [00:03<00:01,  6.85it/s][A
 78%|███████▊  | 21/27 [00:03<00:00,  7.28it/s][A
100%|██████████| 27/27 [00:04<00:00,  6.74it/s][A
Epochs:  13%|█▎        | 6/46 [02:48<19:12, 28.80s/it]

Val Loss: 2.3893 - Val Accuracy: 0.9337



Training:   0%|          | 0/209 [00:00<?, ?it/s][A
Training:   0%|          | 1/209 [00:00<03:03,  1.13it/s][A
Training:   1%|          | 2/209 [00:01<01:29,  2.32it/s][A
Training:   2%|▏         | 4/209 [00:01<00:40,  5.12it/s][A
Training:   3%|▎         | 6/209 [00:01<00:38,  5.22it/s][A
Training:   4%|▍         | 8/209 [00:01<00:27,  7.33it/s][A
Training:   5%|▍         | 10/209 [00:02<00:31,  6.22it/s][A
Training:   6%|▌         | 13/209 [00:02<00:28,  6.98it/s][A
Training:   7%|▋         | 15/209 [00:02<00:22,  8.52it/s][A
Training:   8%|▊         | 17/209 [00:02<00:24,  7.93it/s][A
Training:   9%|▉         | 19/209 [00:02<00:21,  8.68it/s][A
Training:  10%|█         | 21/209 [00:03<00:19,  9.59it/s][A
Training:  11%|█         | 23/209 [00:03<00:19,  9.30it/s][A
Training:  12%|█▏        | 25/209 [00:03<00:19,  9.34it/s][A
Training:  13%|█▎        | 27/209 [00:03<00:20,  9.00it/s][A
Training:  14%|█▍        | 29/209 [00:04<00:23,  7.74it/s][A
Training:  15%|█▍    

Epoch: 7/46 - Loss: 2.4720 - Accuracy: 0.9237



  0%|          | 0/27 [00:00<?, ?it/s][A
  4%|▎         | 1/27 [00:00<00:15,  1.67it/s][A
  7%|▋         | 2/27 [00:00<00:08,  2.94it/s][A
 11%|█         | 3/27 [00:00<00:05,  4.06it/s][A
 22%|██▏       | 6/27 [00:01<00:03,  6.27it/s][A
 33%|███▎      | 9/27 [00:01<00:02,  7.85it/s][A
 37%|███▋      | 10/27 [00:01<00:02,  6.52it/s][A
 48%|████▊     | 13/27 [00:01<00:01,  9.72it/s][A
 56%|█████▌    | 15/27 [00:02<00:01,  7.91it/s][A
 63%|██████▎   | 17/27 [00:02<00:01,  8.77it/s][A
 70%|███████   | 19/27 [00:02<00:00,  8.57it/s][A
 78%|███████▊  | 21/27 [00:02<00:00,  8.51it/s][A
 81%|████████▏ | 22/27 [00:03<00:00,  8.52it/s][A
 89%|████████▉ | 24/27 [00:03<00:00,  9.44it/s][A
100%|██████████| 27/27 [00:03<00:00,  7.52it/s][A
Epochs:  15%|█▌        | 7/46 [03:17<18:37, 28.66s/it]

Val Loss: 2.5630 - Val Accuracy: 0.9138



Training:   0%|          | 0/209 [00:00<?, ?it/s][A
Training:   0%|          | 1/209 [00:00<02:59,  1.16it/s][A
Training:   1%|          | 2/209 [00:00<01:28,  2.34it/s][A
Training:   2%|▏         | 4/209 [00:01<00:40,  5.06it/s][A
Training:   3%|▎         | 6/209 [00:01<00:36,  5.50it/s][A
Training:   4%|▍         | 9/209 [00:01<00:29,  6.82it/s][A
Training:   5%|▍         | 10/209 [00:01<00:27,  7.24it/s][A
Training:   6%|▌         | 12/209 [00:01<00:21,  9.24it/s][A
Training:   7%|▋         | 14/209 [00:02<00:26,  7.41it/s][A
Training:   8%|▊         | 17/209 [00:02<00:21,  9.03it/s][A
Training:   9%|▉         | 19/209 [00:02<00:21,  8.92it/s][A
Training:  10%|█         | 21/209 [00:03<00:21,  8.86it/s][A
Training:  11%|█         | 22/209 [00:03<00:24,  7.56it/s][A
Training:  11%|█▏        | 24/209 [00:03<00:20,  9.21it/s][A
Training:  12%|█▏        | 26/209 [00:03<00:26,  6.82it/s][A
Training:  14%|█▍        | 29/209 [00:04<00:19,  9.31it/s][A
Training:  15%|█▍    

Epoch: 8/46 - Loss: 2.6398 - Accuracy: 0.9182



  0%|          | 0/27 [00:00<?, ?it/s][A
  4%|▎         | 1/27 [00:00<00:21,  1.23it/s][A
  7%|▋         | 2/27 [00:00<00:10,  2.29it/s][A
 15%|█▍        | 4/27 [00:01<00:04,  4.83it/s][A
 19%|█▊        | 5/27 [00:01<00:04,  4.48it/s][A
 30%|██▉       | 8/27 [00:01<00:02,  7.63it/s][A
 37%|███▋      | 10/27 [00:01<00:02,  6.85it/s][A
 44%|████▍     | 12/27 [00:02<00:01,  8.18it/s][A
 52%|█████▏    | 14/27 [00:02<00:01,  7.01it/s][A
 63%|██████▎   | 17/27 [00:02<00:01,  7.12it/s][A
 74%|███████▍  | 20/27 [00:03<00:00,  9.09it/s][A
 81%|████████▏ | 22/27 [00:03<00:00,  8.36it/s][A
 89%|████████▉ | 24/27 [00:03<00:00,  9.59it/s][A
100%|██████████| 27/27 [00:03<00:00,  7.03it/s][A
Epochs:  17%|█▋        | 8/46 [03:46<18:17, 28.88s/it]

Val Loss: 2.8589 - Val Accuracy: 0.8417



Training:   0%|          | 0/209 [00:00<?, ?it/s][A
Training:   0%|          | 1/209 [00:00<03:04,  1.13it/s][A
Training:   1%|▏         | 3/209 [00:01<01:02,  3.30it/s][A
Training:   2%|▏         | 5/209 [00:01<00:46,  4.36it/s][A
Training:   3%|▎         | 7/209 [00:01<00:31,  6.49it/s][A
Training:   4%|▍         | 9/209 [00:01<00:35,  5.69it/s][A
Training:   6%|▌         | 12/209 [00:02<00:23,  8.51it/s][A
Training:   7%|▋         | 14/209 [00:02<00:28,  6.88it/s][A
Training:   8%|▊         | 16/209 [00:02<00:23,  8.31it/s][A
Training:   9%|▊         | 18/209 [00:03<00:28,  6.70it/s][A
Training:  10%|█         | 21/209 [00:03<00:29,  6.31it/s][A
Training:  11%|█         | 23/209 [00:03<00:24,  7.51it/s][A
Training:  12%|█▏        | 25/209 [00:04<00:26,  6.95it/s][A
Training:  14%|█▍        | 29/209 [00:04<00:25,  7.08it/s][A
Training:  15%|█▌        | 32/209 [00:04<00:19,  9.21it/s][A
Training:  16%|█▋        | 34/209 [00:05<00:23,  7.43it/s][A
Training:  17%|█▋    

Epoch: 9/46 - Loss: 2.3361 - Accuracy: 0.9240



  0%|          | 0/27 [00:00<?, ?it/s][A
  4%|▎         | 1/27 [00:00<00:25,  1.02it/s][A
 15%|█▍        | 4/27 [00:01<00:05,  4.58it/s][A
 22%|██▏       | 6/27 [00:01<00:04,  4.77it/s][A
 33%|███▎      | 9/27 [00:01<00:03,  5.84it/s][A
 37%|███▋      | 10/27 [00:02<00:02,  5.86it/s][A
 48%|████▊     | 13/27 [00:02<00:02,  6.89it/s][A
 63%|██████▎   | 17/27 [00:02<00:01,  7.12it/s][A
 78%|███████▊  | 21/27 [00:03<00:00,  8.00it/s][A
100%|██████████| 27/27 [00:03<00:00,  7.08it/s][A
Epochs:  20%|█▉        | 9/46 [04:15<17:52, 28.99s/it]

Val Loss: 2.7511 - Val Accuracy: 0.8412



Training:   0%|          | 0/209 [00:00<?, ?it/s][A
Training:   0%|          | 1/209 [00:00<03:14,  1.07it/s][A
Training:   2%|▏         | 5/209 [00:01<00:51,  3.97it/s][A
Training:   3%|▎         | 7/209 [00:01<00:35,  5.64it/s][A
Training:   4%|▍         | 9/209 [00:01<00:36,  5.50it/s][A
Training:   6%|▌         | 12/209 [00:02<00:24,  8.03it/s][A
Training:   7%|▋         | 14/209 [00:02<00:25,  7.55it/s][A
Training:   8%|▊         | 16/209 [00:02<00:21,  9.16it/s][A
Training:   9%|▊         | 18/209 [00:02<00:26,  7.20it/s][A
Training:  10%|█         | 21/209 [00:03<00:26,  7.06it/s][A
Training:  11%|█         | 23/209 [00:03<00:22,  8.23it/s][A
Training:  12%|█▏        | 25/209 [00:04<00:37,  4.89it/s][A
Training:  12%|█▏        | 26/209 [00:04<00:37,  4.83it/s][A
Training:  13%|█▎        | 28/209 [00:04<00:28,  6.31it/s][A
Training:  14%|█▍        | 30/209 [00:05<00:29,  6.12it/s][A
Training:  16%|█▌        | 33/209 [00:05<00:22,  7.72it/s][A
Training:  17%|█▋   

Epoch: 10/46 - Loss: 2.4544 - Accuracy: 0.9212



  0%|          | 0/27 [00:00<?, ?it/s][A
  4%|▎         | 1/27 [00:00<00:22,  1.15it/s][A
 15%|█▍        | 4/27 [00:01<00:04,  5.07it/s][A
 22%|██▏       | 6/27 [00:01<00:04,  4.68it/s][A
 30%|██▉       | 8/27 [00:01<00:03,  6.21it/s][A
 37%|███▋      | 10/27 [00:02<00:03,  5.62it/s][A
 48%|████▊     | 13/27 [00:02<00:03,  4.62it/s][A
 52%|█████▏    | 14/27 [00:03<00:02,  4.65it/s][A
 63%|██████▎   | 17/27 [00:03<00:01,  6.32it/s][A
 67%|██████▋   | 18/27 [00:03<00:01,  6.64it/s][A
 78%|███████▊  | 21/27 [00:03<00:00,  8.02it/s][A
 81%|████████▏ | 22/27 [00:03<00:00,  8.17it/s][A
100%|██████████| 27/27 [00:04<00:00,  6.25it/s][A
Epochs:  22%|██▏       | 10/46 [04:45<17:27, 29.09s/it]

Val Loss: 2.6379 - Val Accuracy: 0.9337



Training:   0%|          | 0/209 [00:00<?, ?it/s][A
Training:   0%|          | 1/209 [00:00<03:16,  1.06it/s][A
Training:   1%|▏         | 3/209 [00:01<01:00,  3.41it/s][A
Training:   2%|▏         | 5/209 [00:01<00:49,  4.16it/s][A
Training:   4%|▍         | 8/209 [00:01<00:27,  7.34it/s][A
Training:   5%|▍         | 10/209 [00:02<00:33,  5.99it/s][A
Training:   6%|▌         | 12/209 [00:02<00:26,  7.57it/s][A
Training:   7%|▋         | 14/209 [00:02<00:42,  4.55it/s][A
Training:   8%|▊         | 16/209 [00:03<00:34,  5.54it/s][A
Training:   8%|▊         | 17/209 [00:03<00:33,  5.74it/s][A
Training:   9%|▉         | 19/209 [00:03<00:26,  7.14it/s][A
Training:  10%|█         | 21/209 [00:03<00:27,  6.93it/s][A
Training:  11%|█         | 23/209 [00:03<00:21,  8.71it/s][A
Training:  12%|█▏        | 25/209 [00:04<00:22,  8.07it/s][A
Training:  13%|█▎        | 27/209 [00:04<00:18,  9.86it/s][A
Training:  14%|█▍        | 29/209 [00:04<00:22,  8.13it/s][A
Training:  15%|█▍   

Epoch: 11/46 - Loss: 2.3805 - Accuracy: 0.9235



  0%|          | 0/27 [00:00<?, ?it/s][A
  4%|▎         | 1/27 [00:00<00:19,  1.34it/s][A
 11%|█         | 3/27 [00:00<00:05,  4.05it/s][A
 19%|█▊        | 5/27 [00:01<00:03,  5.95it/s][A
 22%|██▏       | 6/27 [00:01<00:04,  4.77it/s][A
 33%|███▎      | 9/27 [00:02<00:04,  4.16it/s][A
 44%|████▍     | 12/27 [00:02<00:02,  6.62it/s][A
 52%|█████▏    | 14/27 [00:02<00:02,  6.09it/s][A
 63%|██████▎   | 17/27 [00:03<00:01,  7.14it/s][A
 78%|███████▊  | 21/27 [00:03<00:00,  8.40it/s][A
100%|██████████| 27/27 [00:03<00:00,  6.91it/s][A
Epochs:  24%|██▍       | 11/46 [05:13<16:52, 28.92s/it]

Val Loss: 2.5810 - Val Accuracy: 0.9154



Training:   0%|          | 0/209 [00:00<?, ?it/s][A
Training:   0%|          | 1/209 [00:00<02:38,  1.31it/s][A
Training:   1%|          | 2/209 [00:00<01:22,  2.50it/s][A
Training:   2%|▏         | 5/209 [00:01<01:05,  3.10it/s][A
Training:   3%|▎         | 6/209 [00:01<00:54,  3.73it/s][A
Training:   4%|▍         | 8/209 [00:02<00:42,  4.78it/s][A
Training:   4%|▍         | 9/209 [00:02<00:36,  5.42it/s][A
Training:   5%|▌         | 11/209 [00:02<00:26,  7.44it/s][A
Training:   6%|▌         | 13/209 [00:02<00:28,  6.89it/s][A
Training:   7%|▋         | 15/209 [00:02<00:22,  8.80it/s][A
Training:   8%|▊         | 17/209 [00:03<00:25,  7.52it/s][A
Training:  10%|▉         | 20/209 [00:03<00:25,  7.44it/s][A
Training:  11%|█         | 23/209 [00:03<00:18, 10.11it/s][A
Training:  12%|█▏        | 25/209 [00:03<00:21,  8.69it/s][A
Training:  13%|█▎        | 28/209 [00:04<00:22,  7.99it/s][A
Training:  15%|█▍        | 31/209 [00:04<00:16, 10.52it/s][A
Training:  16%|█▌     

Epoch: 12/46 - Loss: 2.3143 - Accuracy: 0.9249



  0%|          | 0/27 [00:00<?, ?it/s][A
  4%|▎         | 1/27 [00:00<00:24,  1.07it/s][A
 19%|█▊        | 5/27 [00:01<00:04,  4.83it/s][A
 30%|██▉       | 8/27 [00:01<00:02,  7.96it/s][A
 37%|███▋      | 10/27 [00:01<00:02,  7.56it/s][A
 48%|████▊     | 13/27 [00:01<00:01,  8.29it/s][A
 56%|█████▌    | 15/27 [00:02<00:01,  8.81it/s][A
 63%|██████▎   | 17/27 [00:02<00:01,  8.54it/s][A
 70%|███████   | 19/27 [00:02<00:00,  8.50it/s][A
 78%|███████▊  | 21/27 [00:02<00:00,  8.32it/s][A
 81%|████████▏ | 22/27 [00:03<00:00,  7.88it/s][A
 93%|█████████▎| 25/27 [00:03<00:00,  8.92it/s][A
100%|██████████| 27/27 [00:03<00:00,  7.56it/s][A
Epochs:  26%|██▌       | 12/46 [05:41<16:15, 28.69s/it]

Val Loss: 3.0901 - Val Accuracy: 0.9053



Training:   0%|          | 0/209 [00:00<?, ?it/s][A
Training:   0%|          | 1/209 [00:00<03:02,  1.14it/s][A
Training:   1%|▏         | 3/209 [00:01<00:56,  3.66it/s][A
Training:   2%|▏         | 5/209 [00:01<00:40,  5.08it/s][A
Training:   4%|▍         | 8/209 [00:01<00:23,  8.64it/s][A
Training:   5%|▍         | 10/209 [00:01<00:31,  6.30it/s][A
Training:   6%|▌         | 13/209 [00:02<00:26,  7.39it/s][A
Training:   7%|▋         | 15/209 [00:02<00:25,  7.72it/s][A
Training:   8%|▊         | 17/209 [00:02<00:24,  7.75it/s][A
Training:   9%|▊         | 18/209 [00:02<00:25,  7.60it/s][A
Training:  10%|▉         | 20/209 [00:02<00:20,  9.33it/s][A
Training:  11%|█         | 22/209 [00:03<00:23,  7.83it/s][A
Training:  12%|█▏        | 25/209 [00:03<00:22,  8.28it/s][A
Training:  12%|█▏        | 26/209 [00:03<00:23,  7.83it/s][A
Training:  13%|█▎        | 28/209 [00:03<00:19,  9.37it/s][A
Training:  14%|█▍        | 30/209 [00:04<00:22,  7.87it/s][A
Training:  16%|█▌   

Epoch: 13/46 - Loss: 2.4195 - Accuracy: 0.9194



  0%|          | 0/27 [00:00<?, ?it/s][A
  4%|▎         | 1/27 [00:00<00:21,  1.24it/s][A
 19%|█▊        | 5/27 [00:01<00:04,  4.85it/s][A
 30%|██▉       | 8/27 [00:01<00:02,  7.97it/s][A
 37%|███▋      | 10/27 [00:01<00:02,  7.40it/s][A
 48%|████▊     | 13/27 [00:02<00:01,  7.57it/s][A
 56%|█████▌    | 15/27 [00:02<00:01,  8.42it/s][A
 63%|██████▎   | 17/27 [00:02<00:01,  7.05it/s][A
 78%|███████▊  | 21/27 [00:03<00:00,  7.94it/s][A
 81%|████████▏ | 22/27 [00:03<00:00,  7.92it/s][A
 93%|█████████▎| 25/27 [00:03<00:00,  8.94it/s][A
100%|██████████| 27/27 [00:03<00:00,  7.16it/s][A
Epochs:  28%|██▊       | 13/46 [06:08<15:30, 28.20s/it]

Val Loss: 2.3770 - Val Accuracy: 0.9342



Training:   0%|          | 0/209 [00:00<?, ?it/s][A
Training:   0%|          | 1/209 [00:00<02:38,  1.31it/s][A
Training:   1%|▏         | 3/209 [00:00<00:55,  3.70it/s][A
Training:   2%|▏         | 5/209 [00:01<00:40,  5.08it/s][A
Training:   4%|▍         | 8/209 [00:01<00:24,  8.19it/s][A
Training:   5%|▍         | 10/209 [00:01<00:26,  7.61it/s][A
Training:   6%|▌         | 13/209 [00:02<00:25,  7.76it/s][A
Training:   8%|▊         | 16/209 [00:02<00:18, 10.55it/s][A
Training:   9%|▊         | 18/209 [00:02<00:26,  7.34it/s][A
Training:  10%|▉         | 20/209 [00:02<00:22,  8.57it/s][A
Training:  11%|█         | 22/209 [00:03<00:25,  7.31it/s][A
Training:  11%|█▏        | 24/209 [00:03<00:23,  8.03it/s][A
Training:  12%|█▏        | 26/209 [00:03<00:19,  9.17it/s][A
Training:  13%|█▎        | 28/209 [00:04<00:28,  6.42it/s][A
Training:  15%|█▍        | 31/209 [00:04<00:26,  6.69it/s][A
Training:  16%|█▋        | 34/209 [00:04<00:19,  9.03it/s][A
Training:  17%|█▋   

Epoch: 14/46 - Loss: 2.6728 - Accuracy: 0.9135



  0%|          | 0/27 [00:00<?, ?it/s][A
  4%|▎         | 1/27 [00:00<00:19,  1.30it/s][A
 19%|█▊        | 5/27 [00:01<00:04,  5.08it/s][A
 30%|██▉       | 8/27 [00:01<00:02,  8.07it/s][A
 37%|███▋      | 10/27 [00:01<00:02,  8.08it/s][A
 44%|████▍     | 12/27 [00:01<00:01,  9.37it/s][A
 52%|█████▏    | 14/27 [00:01<00:01,  8.90it/s][A
 59%|█████▉    | 16/27 [00:02<00:01, 10.05it/s][A
 67%|██████▋   | 18/27 [00:02<00:01,  8.77it/s][A
 74%|███████▍  | 20/27 [00:02<00:00,  9.86it/s][A
 81%|████████▏ | 22/27 [00:02<00:00,  8.18it/s][A
 89%|████████▉ | 24/27 [00:02<00:00,  9.60it/s][A
100%|██████████| 27/27 [00:03<00:00,  7.96it/s][A
Epochs:  30%|███       | 14/46 [06:35<14:48, 27.77s/it]

Val Loss: 2.7901 - Val Accuracy: 0.8624



Training:   0%|          | 0/209 [00:00<?, ?it/s][A
Training:   0%|          | 1/209 [00:00<02:40,  1.30it/s][A
Training:   1%|▏         | 3/209 [00:00<00:48,  4.21it/s][A
Training:   2%|▏         | 5/209 [00:01<00:36,  5.64it/s][A
Training:   4%|▍         | 8/209 [00:01<00:22,  9.08it/s][A
Training:   5%|▍         | 10/209 [00:01<00:25,  7.69it/s][A
Training:   6%|▌         | 12/209 [00:01<00:20,  9.55it/s][A
Training:   7%|▋         | 14/209 [00:02<00:24,  7.81it/s][A
Training:   8%|▊         | 16/209 [00:02<00:20,  9.60it/s][A
Training:   9%|▊         | 18/209 [00:02<00:25,  7.56it/s][A
Training:  10%|▉         | 20/209 [00:02<00:22,  8.49it/s][A
Training:  11%|█         | 22/209 [00:03<00:23,  7.92it/s][A
Training:  11%|█         | 23/209 [00:03<00:24,  7.57it/s][A
Training:  12%|█▏        | 25/209 [00:03<00:23,  7.99it/s][A
Training:  13%|█▎        | 27/209 [00:03<00:22,  8.09it/s][A
Training:  14%|█▍        | 29/209 [00:03<00:20,  8.65it/s][A
Training:  15%|█▍   

Epoch: 15/46 - Loss: 2.4706 - Accuracy: 0.9197



  0%|          | 0/27 [00:00<?, ?it/s][A
  4%|▎         | 1/27 [00:00<00:17,  1.52it/s][A
 11%|█         | 3/27 [00:00<00:05,  4.73it/s][A
 19%|█▊        | 5/27 [00:01<00:03,  5.98it/s][A
 26%|██▌       | 7/27 [00:01<00:02,  8.21it/s][A
 33%|███▎      | 9/27 [00:01<00:02,  8.16it/s][A
 41%|████      | 11/27 [00:01<00:01,  9.61it/s][A
 48%|████▊     | 13/27 [00:01<00:01,  9.55it/s][A
 59%|█████▉    | 16/27 [00:01<00:00, 13.14it/s][A
 67%|██████▋   | 18/27 [00:02<00:00, 10.30it/s][A
 74%|███████▍  | 20/27 [00:02<00:00, 10.81it/s][A
 81%|████████▏ | 22/27 [00:02<00:00,  8.46it/s][A
100%|██████████| 27/27 [00:03<00:00,  8.56it/s][A
Epochs:  33%|███▎      | 15/46 [07:02<14:13, 27.54s/it]

Val Loss: 2.6288 - Val Accuracy: 0.8988



Training:   0%|          | 0/209 [00:00<?, ?it/s][A
Training:   0%|          | 1/209 [00:00<02:46,  1.25it/s][A
Training:   1%|▏         | 3/209 [00:00<00:54,  3.79it/s][A
Training:   2%|▏         | 5/209 [00:01<00:41,  4.89it/s][A
Training:   3%|▎         | 7/209 [00:01<00:29,  6.81it/s][A
Training:   4%|▍         | 9/209 [00:01<00:31,  6.44it/s][A
Training:   6%|▌         | 13/209 [00:02<00:27,  7.19it/s][A
Training:   7%|▋         | 15/209 [00:02<00:23,  8.23it/s][A
Training:   8%|▊         | 17/209 [00:02<00:25,  7.44it/s][A
Training:   9%|▉         | 19/209 [00:02<00:21,  8.69it/s][A
Training:  10%|█         | 21/209 [00:03<00:25,  7.47it/s][A
Training:  11%|█▏        | 24/209 [00:03<00:17, 10.39it/s][A
Training:  12%|█▏        | 26/209 [00:03<00:22,  8.15it/s][A
Training:  14%|█▍        | 29/209 [00:03<00:19,  9.19it/s][A
Training:  15%|█▍        | 31/209 [00:04<00:18,  9.80it/s][A
Training:  16%|█▌        | 33/209 [00:04<00:20,  8.53it/s][A
Training:  17%|█▋    

Epoch: 16/46 - Loss: 2.1798 - Accuracy: 0.9295



  0%|          | 0/27 [00:00<?, ?it/s][A
  4%|▎         | 1/27 [00:00<00:19,  1.34it/s][A
 11%|█         | 3/27 [00:00<00:05,  4.23it/s][A
 19%|█▊        | 5/27 [00:01<00:04,  4.98it/s][A
 26%|██▌       | 7/27 [00:01<00:02,  7.12it/s][A
 33%|███▎      | 9/27 [00:01<00:02,  7.91it/s][A
 41%|████      | 11/27 [00:01<00:01,  9.17it/s][A
 48%|████▊     | 13/27 [00:01<00:01, 10.23it/s][A
 56%|█████▌    | 15/27 [00:02<00:01,  9.97it/s][A
 63%|██████▎   | 17/27 [00:02<00:00, 10.85it/s][A
 70%|███████   | 19/27 [00:02<00:00, 10.98it/s][A
 78%|███████▊  | 21/27 [00:02<00:00,  9.82it/s][A
 85%|████████▌ | 23/27 [00:02<00:00, 11.18it/s][A
 93%|█████████▎| 25/27 [00:02<00:00,  9.97it/s][A
100%|██████████| 27/27 [00:03<00:00,  8.33it/s][A
Epochs:  35%|███▍      | 16/46 [07:29<13:43, 27.45s/it]

Val Loss: 2.4864 - Val Accuracy: 0.9114



Training:   0%|          | 0/209 [00:00<?, ?it/s][A
Training:   0%|          | 1/209 [00:00<02:46,  1.25it/s][A
Training:   2%|▏         | 4/209 [00:00<00:38,  5.32it/s][A
Training:   3%|▎         | 6/209 [00:01<00:36,  5.54it/s][A
Training:   4%|▍         | 9/209 [00:01<00:32,  6.13it/s][A
Training:   6%|▌         | 12/209 [00:01<00:22,  8.71it/s][A
Training:   7%|▋         | 14/209 [00:02<00:27,  7.12it/s][A
Training:   8%|▊         | 16/209 [00:02<00:22,  8.59it/s][A
Training:   9%|▊         | 18/209 [00:02<00:25,  7.50it/s][A
Training:  10%|▉         | 20/209 [00:02<00:20,  9.12it/s][A
Training:  11%|█         | 22/209 [00:03<00:25,  7.38it/s][A
Training:  12%|█▏        | 25/209 [00:03<00:25,  7.25it/s][A
Training:  14%|█▍        | 29/209 [00:04<00:22,  7.96it/s][A
Training:  15%|█▌        | 32/209 [00:04<00:18,  9.70it/s][A
Training:  16%|█▋        | 34/209 [00:04<00:22,  7.92it/s][A
Training:  18%|█▊        | 37/209 [00:05<00:25,  6.87it/s][A
Training:  20%|█▉   

Epoch: 17/46 - Loss: 2.2611 - Accuracy: 0.9271



  0%|          | 0/27 [00:00<?, ?it/s][A
  4%|▎         | 1/27 [00:00<00:20,  1.27it/s][A
 19%|█▊        | 5/27 [00:01<00:04,  5.20it/s][A
 33%|███▎      | 9/27 [00:01<00:02,  6.90it/s][A
 48%|████▊     | 13/27 [00:01<00:01,  8.93it/s][A
 63%|██████▎   | 17/27 [00:02<00:01,  9.61it/s][A
 74%|███████▍  | 20/27 [00:02<00:00, 11.21it/s][A
 81%|████████▏ | 22/27 [00:02<00:00, 11.48it/s][A
 89%|████████▉ | 24/27 [00:02<00:00, 11.31it/s][A
100%|██████████| 27/27 [00:02<00:00,  9.16it/s][A
Epochs:  37%|███▋      | 17/46 [07:57<13:13, 27.37s/it]

Val Loss: 2.4198 - Val Accuracy: 0.9309



Training:   0%|          | 0/209 [00:00<?, ?it/s][A
Training:   0%|          | 1/209 [00:00<02:13,  1.55it/s][A
Training:   1%|▏         | 3/209 [00:00<00:44,  4.60it/s][A
Training:   2%|▏         | 5/209 [00:00<00:32,  6.31it/s][A
Training:   3%|▎         | 7/209 [00:01<00:23,  8.60it/s][A
Training:   4%|▍         | 9/209 [00:01<00:26,  7.62it/s][A
Training:   5%|▌         | 11/209 [00:01<00:23,  8.50it/s][A
Training:   6%|▌         | 13/209 [00:02<00:29,  6.71it/s][A
Training:   7%|▋         | 15/209 [00:02<00:23,  8.40it/s][A
Training:   8%|▊         | 17/209 [00:02<00:27,  6.90it/s][A
Training:   9%|▉         | 19/209 [00:02<00:22,  8.58it/s][A
Training:  10%|█         | 21/209 [00:03<00:28,  6.49it/s][A
Training:  12%|█▏        | 25/209 [00:03<00:25,  7.17it/s][A
Training:  14%|█▍        | 29/209 [00:04<00:23,  7.80it/s][A
Training:  15%|█▌        | 32/209 [00:04<00:17,  9.84it/s][A
Training:  16%|█▋        | 34/209 [00:04<00:19,  8.85it/s][A
Training:  18%|█▊    

Epoch: 18/46 - Loss: 2.3995 - Accuracy: 0.9257



  0%|          | 0/27 [00:00<?, ?it/s][A
  4%|▎         | 1/27 [00:00<00:20,  1.25it/s][A
 19%|█▊        | 5/27 [00:01<00:04,  5.08it/s][A
 30%|██▉       | 8/27 [00:01<00:02,  8.37it/s][A
 37%|███▋      | 10/27 [00:01<00:02,  7.97it/s][A
 48%|████▊     | 13/27 [00:02<00:01,  7.26it/s][A
 63%|██████▎   | 17/27 [00:02<00:01,  9.12it/s][A
 78%|███████▊  | 21/27 [00:02<00:00, 10.38it/s][A
 89%|████████▉ | 24/27 [00:02<00:00, 11.29it/s][A
100%|██████████| 27/27 [00:03<00:00,  8.43it/s][A
Epochs:  39%|███▉      | 18/46 [08:24<12:47, 27.42s/it]

Val Loss: 2.2374 - Val Accuracy: 0.9397



Training:   0%|          | 0/209 [00:00<?, ?it/s][A
Training:   0%|          | 1/209 [00:00<02:28,  1.40it/s][A
Training:   1%|▏         | 3/209 [00:00<00:47,  4.30it/s][A
Training:   2%|▏         | 5/209 [00:01<00:42,  4.75it/s][A
Training:   4%|▍         | 9/209 [00:01<00:29,  6.85it/s][A
Training:   6%|▌         | 13/209 [00:02<00:24,  8.01it/s][A
Training:   8%|▊         | 17/209 [00:02<00:23,  8.06it/s][A
Training:   9%|▉         | 19/209 [00:02<00:20,  9.15it/s][A
Training:  10%|█         | 21/209 [00:02<00:21,  8.92it/s][A
Training:  11%|█▏        | 24/209 [00:02<00:15, 11.64it/s][A
Training:  12%|█▏        | 26/209 [00:03<00:19,  9.62it/s][A
Training:  14%|█▍        | 29/209 [00:03<00:18,  9.50it/s][A
Training:  15%|█▍        | 31/209 [00:03<00:18,  9.70it/s][A
Training:  16%|█▌        | 33/209 [00:04<00:19,  9.01it/s][A
Training:  17%|█▋        | 35/209 [00:04<00:18,  9.32it/s][A
Training:  18%|█▊        | 37/209 [00:04<00:17,  9.69it/s][A
Training:  19%|█▊   

Epoch: 19/46 - Loss: 2.6850 - Accuracy: 0.9248



  0%|          | 0/27 [00:00<?, ?it/s][A
  4%|▎         | 1/27 [00:00<00:20,  1.26it/s][A
 19%|█▊        | 5/27 [00:01<00:04,  5.29it/s][A
 33%|███▎      | 9/27 [00:01<00:02,  6.87it/s][A
 37%|███▋      | 10/27 [00:01<00:02,  6.74it/s][A
 48%|████▊     | 13/27 [00:02<00:01,  7.23it/s][A
 63%|██████▎   | 17/27 [00:02<00:01,  8.29it/s][A
 78%|███████▊  | 21/27 [00:02<00:00,  9.28it/s][A
100%|██████████| 27/27 [00:03<00:00,  8.12it/s][A
Epochs:  41%|████▏     | 19/46 [08:51<12:16, 27.28s/it]

Val Loss: 3.6288 - Val Accuracy: 0.9326



Training:   0%|          | 0/209 [00:00<?, ?it/s][A
Training:   0%|          | 1/209 [00:00<02:37,  1.32it/s][A
Training:   1%|▏         | 3/209 [00:00<00:49,  4.17it/s][A
Training:   2%|▏         | 5/209 [00:01<00:37,  5.43it/s][A
Training:   4%|▍         | 8/209 [00:01<00:21,  9.51it/s][A
Training:   5%|▍         | 10/209 [00:01<00:27,  7.30it/s][A
Training:   6%|▌         | 12/209 [00:01<00:21,  9.11it/s][A
Training:   7%|▋         | 14/209 [00:02<00:23,  8.20it/s][A
Training:   8%|▊         | 16/209 [00:02<00:19,  9.95it/s][A
Training:   9%|▊         | 18/209 [00:02<00:26,  7.08it/s][A
Training:  10%|▉         | 20/209 [00:02<00:21,  8.75it/s][A
Training:  11%|█         | 22/209 [00:03<00:23,  8.08it/s][A
Training:  12%|█▏        | 25/209 [00:03<00:23,  7.97it/s][A
Training:  13%|█▎        | 28/209 [00:03<00:16, 10.78it/s][A
Training:  14%|█▍        | 30/209 [00:03<00:20,  8.72it/s][A
Training:  16%|█▌        | 33/209 [00:04<00:21,  8.24it/s][A
Training:  18%|█▊   

Epoch: 20/46 - Loss: 2.3024 - Accuracy: 0.9255



  0%|          | 0/27 [00:00<?, ?it/s][A
  4%|▎         | 1/27 [00:00<00:21,  1.22it/s][A
  7%|▋         | 2/27 [00:01<00:11,  2.14it/s][A
 19%|█▊        | 5/27 [00:01<00:04,  5.38it/s][A
 22%|██▏       | 6/27 [00:01<00:03,  5.57it/s][A
 33%|███▎      | 9/27 [00:01<00:02,  6.38it/s][A
 41%|████      | 11/27 [00:01<00:01,  8.24it/s][A
 48%|████▊     | 13/27 [00:02<00:01,  7.23it/s][A
 59%|█████▉    | 16/27 [00:02<00:01,  9.11it/s][A
 67%|██████▋   | 18/27 [00:02<00:01,  8.63it/s][A
 74%|███████▍  | 20/27 [00:02<00:00, 10.09it/s][A
 81%|████████▏ | 22/27 [00:03<00:00,  9.27it/s][A
 89%|████████▉ | 24/27 [00:03<00:00, 10.68it/s][A
100%|██████████| 27/27 [00:03<00:00,  7.69it/s][A
Epochs:  43%|████▎     | 20/46 [09:18<11:43, 27.04s/it]

Val Loss: 2.7052 - Val Accuracy: 0.9187



Training:   0%|          | 0/209 [00:00<?, ?it/s][A
Training:   0%|          | 1/209 [00:00<02:46,  1.25it/s][A
Training:   1%|▏         | 3/209 [00:00<00:52,  3.96it/s][A
Training:   2%|▏         | 5/209 [00:01<00:35,  5.79it/s][A
Training:   4%|▍         | 8/209 [00:01<00:20,  9.76it/s][A
Training:   5%|▍         | 10/209 [00:01<00:29,  6.81it/s][A
Training:   6%|▌         | 13/209 [00:02<00:26,  7.40it/s][A
Training:   8%|▊         | 17/209 [00:02<00:24,  7.92it/s][A
Training:  10%|▉         | 20/209 [00:02<00:18, 10.07it/s][A
Training:  11%|█         | 22/209 [00:03<00:24,  7.49it/s][A
Training:  12%|█▏        | 25/209 [00:03<00:25,  7.26it/s][A
Training:  13%|█▎        | 28/209 [00:03<00:19,  9.25it/s][A
Training:  14%|█▍        | 30/209 [00:04<00:21,  8.32it/s][A
Training:  16%|█▌        | 33/209 [00:04<00:21,  8.05it/s][A
Training:  18%|█▊        | 37/209 [00:04<00:18,  9.16it/s][A
Training:  20%|█▉        | 41/209 [00:05<00:17,  9.54it/s][A
Training:  21%|██   

Epoch: 21/46 - Loss: 2.3687 - Accuracy: 0.9211



  0%|          | 0/27 [00:00<?, ?it/s][A
  4%|▎         | 1/27 [00:00<00:18,  1.42it/s][A
  7%|▋         | 2/27 [00:00<00:10,  2.44it/s][A
 19%|█▊        | 5/27 [00:01<00:03,  6.39it/s][A
 26%|██▌       | 7/27 [00:01<00:02,  7.18it/s][A
 33%|███▎      | 9/27 [00:01<00:02,  6.85it/s][A
 44%|████▍     | 12/27 [00:01<00:01,  8.92it/s][A
 52%|█████▏    | 14/27 [00:02<00:01,  7.48it/s][A
 59%|█████▉    | 16/27 [00:02<00:01,  8.74it/s][A
 67%|██████▋   | 18/27 [00:02<00:01,  8.16it/s][A
 74%|███████▍  | 20/27 [00:02<00:00,  9.75it/s][A
 81%|████████▏ | 22/27 [00:03<00:00,  8.84it/s][A
100%|██████████| 27/27 [00:03<00:00,  7.99it/s][A
Epochs:  46%|████▌     | 21/46 [09:45<11:16, 27.05s/it]

Val Loss: 2.4546 - Val Accuracy: 0.9071



Training:   0%|          | 0/209 [00:00<?, ?it/s][A
Training:   0%|          | 1/209 [00:00<02:28,  1.40it/s][A
Training:   2%|▏         | 4/209 [00:00<00:33,  6.10it/s][A
Training:   3%|▎         | 6/209 [00:01<00:34,  5.90it/s][A
Training:   4%|▍         | 9/209 [00:01<00:26,  7.52it/s][A
Training:   5%|▌         | 11/209 [00:01<00:23,  8.52it/s][A
Training:   6%|▌         | 13/209 [00:01<00:25,  7.75it/s][A
Training:   8%|▊         | 16/209 [00:02<00:18, 10.60it/s][A
Training:   9%|▊         | 18/209 [00:02<00:20,  9.14it/s][A
Training:  10%|█         | 21/209 [00:02<00:21,  8.59it/s][A
Training:  11%|█▏        | 24/209 [00:02<00:16, 10.91it/s][A
Training:  12%|█▏        | 26/209 [00:03<00:17, 10.30it/s][A
Training:  14%|█▍        | 29/209 [00:03<00:19,  9.09it/s][A
Training:  16%|█▌        | 33/209 [00:03<00:19,  9.20it/s][A
Training:  17%|█▋        | 36/209 [00:04<00:15, 10.91it/s][A
Training:  18%|█▊        | 38/209 [00:04<00:20,  8.54it/s][A
Training:  20%|█▉   

Epoch: 22/46 - Loss: 2.0793 - Accuracy: 0.9294



  0%|          | 0/27 [00:00<?, ?it/s][A
  4%|▎         | 1/27 [00:00<00:16,  1.60it/s][A
  7%|▋         | 2/27 [00:00<00:09,  2.59it/s][A
 19%|█▊        | 5/27 [00:01<00:03,  5.91it/s][A
 26%|██▌       | 7/27 [00:01<00:02,  7.61it/s][A
 33%|███▎      | 9/27 [00:01<00:02,  7.28it/s][A
 37%|███▋      | 10/27 [00:01<00:02,  7.08it/s][A
 48%|████▊     | 13/27 [00:01<00:01,  9.45it/s][A
 56%|█████▌    | 15/27 [00:02<00:01,  9.29it/s][A
 63%|██████▎   | 17/27 [00:02<00:01,  9.95it/s][A
 70%|███████   | 19/27 [00:02<00:00,  9.52it/s][A
 78%|███████▊  | 21/27 [00:02<00:00, 10.02it/s][A
 85%|████████▌ | 23/27 [00:03<00:00,  8.56it/s][A
 93%|█████████▎| 25/27 [00:03<00:00, 10.07it/s][A
100%|██████████| 27/27 [00:03<00:00,  7.87it/s][A
Epochs:  48%|████▊     | 22/46 [10:11<10:40, 26.69s/it]

Val Loss: 2.3663 - Val Accuracy: 0.9397



Training:   0%|          | 0/209 [00:00<?, ?it/s][A
Training:   0%|          | 1/209 [00:00<02:26,  1.42it/s][A
Training:   2%|▏         | 4/209 [00:00<00:32,  6.24it/s][A
Training:   3%|▎         | 6/209 [00:01<00:35,  5.67it/s][A
Training:   4%|▍         | 9/209 [00:01<00:31,  6.33it/s][A
Training:   5%|▌         | 11/209 [00:01<00:25,  7.84it/s][A
Training:   6%|▌         | 13/209 [00:02<00:26,  7.33it/s][A
Training:   7%|▋         | 15/209 [00:02<00:24,  8.05it/s][A
Training:   8%|▊         | 17/209 [00:02<00:22,  8.69it/s][A
Training:   9%|▉         | 19/209 [00:02<00:20,  9.15it/s][A
Training:  10%|█         | 21/209 [00:02<00:22,  8.49it/s][A
Training:  11%|█         | 23/209 [00:03<00:18, 10.18it/s][A
Training:  12%|█▏        | 25/209 [00:03<00:20,  8.96it/s][A
Training:  13%|█▎        | 27/209 [00:03<00:19,  9.25it/s][A
Training:  14%|█▍        | 29/209 [00:03<00:21,  8.35it/s][A
Training:  14%|█▍        | 30/209 [00:03<00:23,  7.51it/s][A
Training:  16%|█▌   

Epoch: 23/46 - Loss: 2.2692 - Accuracy: 0.9237



  0%|          | 0/27 [00:00<?, ?it/s][A
  4%|▎         | 1/27 [00:00<00:18,  1.37it/s][A
  7%|▋         | 2/27 [00:00<00:09,  2.73it/s][A
 19%|█▊        | 5/27 [00:01<00:03,  6.50it/s][A
 22%|██▏       | 6/27 [00:01<00:03,  6.49it/s][A
 33%|███▎      | 9/27 [00:01<00:02,  8.07it/s][A
 37%|███▋      | 10/27 [00:01<00:02,  8.20it/s][A
 41%|████      | 11/27 [00:01<00:01,  8.13it/s][A
 48%|████▊     | 13/27 [00:01<00:01,  9.38it/s][A
 52%|█████▏    | 14/27 [00:02<00:01,  8.85it/s][A
 56%|█████▌    | 15/27 [00:02<00:01,  7.84it/s][A
 63%|██████▎   | 17/27 [00:02<00:01,  9.61it/s][A
 70%|███████   | 19/27 [00:02<00:00,  8.23it/s][A
 78%|███████▊  | 21/27 [00:02<00:00,  9.16it/s][A
 81%|████████▏ | 22/27 [00:02<00:00,  9.15it/s][A
 85%|████████▌ | 23/27 [00:03<00:00,  8.49it/s][A
 93%|█████████▎| 25/27 [00:03<00:00,  9.52it/s][A
100%|██████████| 27/27 [00:03<00:00,  7.77it/s][A
Epochs:  50%|█████     | 23/46 [10:37<10:14, 26.73s/it]

Val Loss: 2.5042 - Val Accuracy: 0.8977



Training:   0%|          | 0/209 [00:00<?, ?it/s][A
Training:   0%|          | 1/209 [00:00<02:58,  1.16it/s][A
Training:   2%|▏         | 4/209 [00:00<00:39,  5.19it/s][A
Training:   3%|▎         | 6/209 [00:01<00:33,  6.07it/s][A
Training:   4%|▍         | 9/209 [00:01<00:28,  7.09it/s][A
Training:   5%|▌         | 11/209 [00:01<00:23,  8.52it/s][A
Training:   6%|▌         | 13/209 [00:02<00:27,  7.24it/s][A
Training:   8%|▊         | 16/209 [00:02<00:20,  9.55it/s][A
Training:   9%|▊         | 18/209 [00:02<00:22,  8.66it/s][A
Training:  10%|█         | 21/209 [00:02<00:20,  9.07it/s][A
Training:  11%|█         | 23/209 [00:03<00:21,  8.61it/s][A
Training:  12%|█▏        | 25/209 [00:03<00:20,  8.96it/s][A
Training:  12%|█▏        | 26/209 [00:03<00:22,  8.13it/s][A
Training:  13%|█▎        | 27/209 [00:03<00:23,  7.76it/s][A
Training:  14%|█▍        | 29/209 [00:03<00:19,  9.34it/s][A
Training:  15%|█▍        | 31/209 [00:04<00:23,  7.51it/s][A
Training:  16%|█▌   

Epoch: 24/46 - Loss: 2.1216 - Accuracy: 0.9351



  0%|          | 0/27 [00:00<?, ?it/s][A
  4%|▎         | 1/27 [00:00<00:17,  1.45it/s][A
 15%|█▍        | 4/27 [00:00<00:03,  6.27it/s][A
 22%|██▏       | 6/27 [00:01<00:03,  6.06it/s][A
 33%|███▎      | 9/27 [00:01<00:02,  6.75it/s][A
 44%|████▍     | 12/27 [00:01<00:01,  9.52it/s][A
 52%|█████▏    | 14/27 [00:02<00:01,  7.39it/s][A
 63%|██████▎   | 17/27 [00:02<00:01,  7.37it/s][A
 74%|███████▍  | 20/27 [00:02<00:00,  9.63it/s][A
 81%|████████▏ | 22/27 [00:02<00:00,  9.19it/s][A
 89%|████████▉ | 24/27 [00:02<00:00, 10.70it/s][A
100%|██████████| 27/27 [00:03<00:00,  8.08it/s][A
Epochs:  52%|█████▏    | 24/46 [11:04<09:50, 26.82s/it]

Val Loss: 2.1451 - Val Accuracy: 0.9403



Training:   0%|          | 0/209 [00:00<?, ?it/s][A
Training:   0%|          | 1/209 [00:00<02:28,  1.41it/s][A
Training:   2%|▏         | 4/209 [00:00<00:35,  5.70it/s][A
Training:   3%|▎         | 6/209 [00:01<00:31,  6.51it/s][A
Training:   4%|▍         | 9/209 [00:01<00:28,  7.00it/s][A
Training:   6%|▌         | 12/209 [00:01<00:20,  9.67it/s][A
Training:   7%|▋         | 14/209 [00:01<00:21,  8.96it/s][A
Training:   8%|▊         | 17/209 [00:02<00:22,  8.51it/s][A
Training:  10%|▉         | 20/209 [00:02<00:18, 10.38it/s][A
Training:  11%|█         | 22/209 [00:02<00:22,  8.33it/s][A
Training:  12%|█▏        | 25/209 [00:03<00:24,  7.50it/s][A
Training:  13%|█▎        | 28/209 [00:03<00:19,  9.24it/s][A
Training:  14%|█▍        | 30/209 [00:03<00:21,  8.49it/s][A
Training:  15%|█▌        | 32/209 [00:03<00:18,  9.81it/s][A
Training:  16%|█▋        | 34/209 [00:04<00:19,  9.04it/s][A
Training:  17%|█▋        | 36/209 [00:04<00:16, 10.38it/s][A
Training:  18%|█▊   

Epoch: 25/46 - Loss: 2.4562 - Accuracy: 0.9212



  0%|          | 0/27 [00:00<?, ?it/s][A
  4%|▎         | 1/27 [00:00<00:18,  1.44it/s][A
 11%|█         | 3/27 [00:00<00:05,  4.43it/s][A
 19%|█▊        | 5/27 [00:01<00:04,  5.25it/s][A
 22%|██▏       | 6/27 [00:01<00:03,  5.83it/s][A
 33%|███▎      | 9/27 [00:01<00:02,  7.53it/s][A
 37%|███▋      | 10/27 [00:01<00:02,  7.35it/s][A
 48%|████▊     | 13/27 [00:01<00:01,  8.92it/s][A
 52%|█████▏    | 14/27 [00:02<00:01,  8.36it/s][A
 63%|██████▎   | 17/27 [00:02<00:01,  9.18it/s][A
 74%|███████▍  | 20/27 [00:02<00:00, 12.06it/s][A
 81%|████████▏ | 22/27 [00:02<00:00,  8.83it/s][A
100%|██████████| 27/27 [00:03<00:00,  8.01it/s][A
Epochs:  54%|█████▍    | 25/46 [11:31<09:19, 26.66s/it]

Val Loss: 2.3274 - Val Accuracy: 0.9436



Training:   0%|          | 0/209 [00:00<?, ?it/s][A
Training:   0%|          | 1/209 [00:00<02:47,  1.24it/s][A
Training:   1%|▏         | 3/209 [00:00<00:51,  3.99it/s][A
Training:   2%|▏         | 5/209 [00:01<00:42,  4.76it/s][A
Training:   4%|▍         | 8/209 [00:01<00:25,  7.94it/s][A
Training:   5%|▍         | 10/209 [00:01<00:27,  7.26it/s][A
Training:   6%|▌         | 12/209 [00:01<00:23,  8.51it/s][A
Training:   7%|▋         | 14/209 [00:02<00:22,  8.67it/s][A
Training:   8%|▊         | 16/209 [00:02<00:20,  9.57it/s][A
Training:   9%|▊         | 18/209 [00:02<00:20,  9.54it/s][A
Training:  10%|▉         | 20/209 [00:02<00:18, 10.25it/s][A
Training:  11%|█         | 22/209 [00:02<00:19,  9.83it/s][A
Training:  11%|█▏        | 24/209 [00:03<00:18, 10.25it/s][A
Training:  12%|█▏        | 26/209 [00:03<00:19,  9.46it/s][A
Training:  13%|█▎        | 28/209 [00:03<00:18,  9.89it/s][A
Training:  14%|█▍        | 30/209 [00:03<00:18,  9.74it/s][A
Training:  15%|█▌   

Epoch: 26/46 - Loss: 2.3397 - Accuracy: 0.9293



  0%|          | 0/27 [00:00<?, ?it/s][A
  4%|▎         | 1/27 [00:00<00:19,  1.30it/s][A
 11%|█         | 3/27 [00:00<00:06,  3.65it/s][A
 19%|█▊        | 5/27 [00:01<00:04,  5.27it/s][A
 26%|██▌       | 7/27 [00:01<00:03,  6.64it/s][A
 33%|███▎      | 9/27 [00:01<00:02,  7.73it/s][A
 41%|████      | 11/27 [00:01<00:01,  8.91it/s][A
 48%|████▊     | 13/27 [00:01<00:01,  8.92it/s][A
 56%|█████▌    | 15/27 [00:02<00:01,  9.26it/s][A
 63%|██████▎   | 17/27 [00:02<00:00, 10.27it/s][A
 70%|███████   | 19/27 [00:02<00:00,  8.64it/s][A
 81%|████████▏ | 22/27 [00:02<00:00, 10.99it/s][A
 89%|████████▉ | 24/27 [00:03<00:00,  9.27it/s][A
100%|██████████| 27/27 [00:03<00:00,  8.15it/s][A
Epochs:  57%|█████▋    | 26/46 [11:57<08:50, 26.54s/it]

Val Loss: 4.0507 - Val Accuracy: 0.9042



Training:   0%|          | 0/209 [00:00<?, ?it/s][A
Training:   0%|          | 1/209 [00:00<03:13,  1.08it/s][A
Training:   2%|▏         | 4/209 [00:01<00:42,  4.81it/s][A
Training:   3%|▎         | 6/209 [00:01<00:38,  5.27it/s][A
Training:   4%|▍         | 8/209 [00:01<00:28,  6.99it/s][A
Training:   5%|▍         | 10/209 [00:01<00:31,  6.42it/s][A
Training:   6%|▌         | 12/209 [00:02<00:24,  8.00it/s][A
Training:   7%|▋         | 14/209 [00:02<00:24,  7.88it/s][A
Training:   8%|▊         | 16/209 [00:02<00:21,  8.99it/s][A
Training:   9%|▊         | 18/209 [00:02<00:20,  9.45it/s][A
Training:  10%|▉         | 20/209 [00:02<00:19,  9.74it/s][A
Training:  11%|█         | 22/209 [00:03<00:23,  7.94it/s][A
Training:  12%|█▏        | 25/209 [00:03<00:23,  7.98it/s][A
Training:  13%|█▎        | 28/209 [00:03<00:17, 10.17it/s][A
Training:  14%|█▍        | 30/209 [00:04<00:22,  8.03it/s][A
Training:  16%|█▌        | 33/209 [00:04<00:23,  7.50it/s][A
Training:  17%|█▋   

Epoch: 27/46 - Loss: 2.2396 - Accuracy: 0.9281



  0%|          | 0/27 [00:00<?, ?it/s][A
  4%|▎         | 1/27 [00:00<00:15,  1.64it/s][A
  7%|▋         | 2/27 [00:00<00:09,  2.57it/s][A
 19%|█▊        | 5/27 [00:00<00:03,  7.05it/s][A
 26%|██▌       | 7/27 [00:01<00:02,  7.61it/s][A
 33%|███▎      | 9/27 [00:01<00:02,  8.70it/s][A
 41%|████      | 11/27 [00:01<00:02,  7.70it/s][A
 48%|████▊     | 13/27 [00:01<00:01,  8.35it/s][A
 52%|█████▏    | 14/27 [00:02<00:01,  7.15it/s][A
 63%|██████▎   | 17/27 [00:02<00:01,  9.14it/s][A
 67%|██████▋   | 18/27 [00:02<00:01,  7.65it/s][A
 78%|███████▊  | 21/27 [00:02<00:00, 10.34it/s][A
 85%|████████▌ | 23/27 [00:03<00:00,  8.49it/s][A
100%|██████████| 27/27 [00:03<00:00,  7.59it/s][A
Epochs:  59%|█████▊    | 27/46 [12:24<08:27, 26.69s/it]

Val Loss: 2.3720 - Val Accuracy: 0.9397



Training:   0%|          | 0/209 [00:00<?, ?it/s][A
Training:   0%|          | 1/209 [00:00<02:16,  1.52it/s][A
Training:   1%|▏         | 3/209 [00:00<00:49,  4.13it/s][A
Training:   2%|▏         | 5/209 [00:01<00:37,  5.39it/s][A
Training:   3%|▎         | 7/209 [00:01<00:30,  6.56it/s][A
Training:   4%|▍         | 9/209 [00:01<00:30,  6.65it/s][A
Training:   5%|▌         | 11/209 [00:01<00:25,  7.75it/s][A
Training:   6%|▌         | 13/209 [00:02<00:26,  7.51it/s][A
Training:   8%|▊         | 16/209 [00:02<00:19,  9.88it/s][A
Training:   9%|▊         | 18/209 [00:02<00:19,  9.56it/s][A
Training:  10%|▉         | 20/209 [00:02<00:17, 10.59it/s][A
Training:  11%|█         | 22/209 [00:02<00:20,  9.06it/s][A
Training:  11%|█▏        | 24/209 [00:03<00:19,  9.71it/s][A
Training:  12%|█▏        | 26/209 [00:03<00:23,  7.78it/s][A
Training:  13%|█▎        | 28/209 [00:03<00:19,  9.33it/s][A
Training:  14%|█▍        | 30/209 [00:03<00:20,  8.71it/s][A
Training:  16%|█▌    

Epoch: 28/46 - Loss: 2.5253 - Accuracy: 0.9208



  0%|          | 0/27 [00:00<?, ?it/s][A
  4%|▎         | 1/27 [00:00<00:19,  1.34it/s][A
  7%|▋         | 2/27 [00:00<00:09,  2.71it/s][A
 15%|█▍        | 4/27 [00:01<00:04,  5.19it/s][A
 19%|█▊        | 5/27 [00:01<00:03,  6.06it/s][A
 22%|██▏       | 6/27 [00:01<00:03,  5.60it/s][A
 33%|███▎      | 9/27 [00:01<00:02,  8.15it/s][A
 37%|███▋      | 10/27 [00:01<00:02,  6.52it/s][A
 48%|████▊     | 13/27 [00:02<00:01,  7.96it/s][A
 52%|█████▏    | 14/27 [00:02<00:01,  7.66it/s][A
 63%|██████▎   | 17/27 [00:02<00:01,  8.70it/s][A
 67%|██████▋   | 18/27 [00:02<00:01,  8.88it/s][A
 78%|███████▊  | 21/27 [00:03<00:00,  8.94it/s][A
 89%|████████▉ | 24/27 [00:03<00:00, 11.14it/s][A
100%|██████████| 27/27 [00:03<00:00,  7.60it/s][A
Epochs:  61%|██████    | 28/46 [12:51<08:02, 26.83s/it]

Val Loss: 3.2901 - Val Accuracy: 0.9025



Training:   0%|          | 0/209 [00:00<?, ?it/s][A
Training:   0%|          | 1/209 [00:01<03:28,  1.00s/it][A
Training:   2%|▏         | 5/209 [00:01<00:49,  4.13it/s][A
Training:   4%|▍         | 8/209 [00:01<00:29,  6.79it/s][A
Training:   5%|▍         | 10/209 [00:01<00:31,  6.41it/s][A
Training:   6%|▌         | 13/209 [00:02<00:28,  6.86it/s][A
Training:   8%|▊         | 16/209 [00:02<00:20,  9.51it/s][A
Training:   9%|▊         | 18/209 [00:02<00:21,  8.99it/s][A
Training:  10%|█         | 21/209 [00:03<00:21,  8.61it/s][A
Training:  11%|█▏        | 24/209 [00:03<00:17, 10.86it/s][A
Training:  12%|█▏        | 26/209 [00:03<00:19,  9.41it/s][A
Training:  14%|█▍        | 29/209 [00:03<00:21,  8.42it/s][A
Training:  15%|█▌        | 32/209 [00:04<00:16, 10.73it/s][A
Training:  16%|█▋        | 34/209 [00:04<00:19,  8.89it/s][A
Training:  18%|█▊        | 37/209 [00:04<00:20,  8.33it/s][A
Training:  19%|█▉        | 40/209 [00:04<00:15, 10.82it/s][A
Training:  20%|██  

Epoch: 29/46 - Loss: 2.1912 - Accuracy: 0.9263



  0%|          | 0/27 [00:00<?, ?it/s][A
  4%|▎         | 1/27 [00:00<00:22,  1.14it/s][A
  7%|▋         | 2/27 [00:01<00:11,  2.15it/s][A
 19%|█▊        | 5/27 [00:01<00:04,  5.46it/s][A
 22%|██▏       | 6/27 [00:01<00:04,  4.93it/s][A
 33%|███▎      | 9/27 [00:01<00:02,  8.14it/s][A
 41%|████      | 11/27 [00:01<00:02,  7.49it/s][A
 48%|████▊     | 13/27 [00:02<00:01,  8.83it/s][A
 56%|█████▌    | 15/27 [00:02<00:01,  7.30it/s][A
 63%|██████▎   | 17/27 [00:02<00:01,  9.01it/s][A
 70%|███████   | 19/27 [00:03<00:01,  7.24it/s][A
 81%|████████▏ | 22/27 [00:03<00:00,  7.94it/s][A
100%|██████████| 27/27 [00:03<00:00,  7.08it/s][A
Epochs:  63%|██████▎   | 29/46 [13:18<07:35, 26.79s/it]

Val Loss: 2.5496 - Val Accuracy: 0.8826



Training:   0%|          | 0/209 [00:00<?, ?it/s][A
Training:   0%|          | 1/209 [00:00<03:24,  1.02it/s][A
Training:   2%|▏         | 4/209 [00:01<00:44,  4.65it/s][A
Training:   3%|▎         | 6/209 [00:01<00:38,  5.33it/s][A
Training:   4%|▍         | 8/209 [00:01<00:29,  6.88it/s][A
Training:   5%|▍         | 10/209 [00:01<00:29,  6.64it/s][A
Training:   6%|▌         | 13/209 [00:02<00:26,  7.46it/s][A
Training:   8%|▊         | 16/209 [00:02<00:18, 10.32it/s][A
Training:   9%|▊         | 18/209 [00:02<00:21,  9.09it/s][A
Training:  10%|█         | 21/209 [00:02<00:20,  9.06it/s][A
Training:  11%|█         | 23/209 [00:03<00:19,  9.63it/s][A
Training:  12%|█▏        | 25/209 [00:03<00:19,  9.35it/s][A
Training:  13%|█▎        | 27/209 [00:03<00:17, 10.44it/s][A
Training:  14%|█▍        | 29/209 [00:03<00:20,  8.77it/s][A
Training:  15%|█▍        | 31/209 [00:03<00:18,  9.64it/s][A
Training:  16%|█▌        | 33/209 [00:04<00:21,  8.26it/s][A
Training:  17%|█▋   

Epoch: 30/46 - Loss: 2.1590 - Accuracy: 0.9251



  0%|          | 0/27 [00:00<?, ?it/s][A
  4%|▎         | 1/27 [00:00<00:21,  1.23it/s][A
 19%|█▊        | 5/27 [00:01<00:04,  4.82it/s][A
 30%|██▉       | 8/27 [00:01<00:02,  7.87it/s][A
 37%|███▋      | 10/27 [00:01<00:02,  7.17it/s][A
 44%|████▍     | 12/27 [00:01<00:01,  8.71it/s][A
 52%|█████▏    | 14/27 [00:02<00:01,  7.76it/s][A
 59%|█████▉    | 16/27 [00:02<00:01,  9.01it/s][A
 67%|██████▋   | 18/27 [00:02<00:01,  7.95it/s][A
 74%|███████▍  | 20/27 [00:02<00:00,  9.69it/s][A
 81%|████████▏ | 22/27 [00:02<00:00,  9.23it/s][A
 89%|████████▉ | 24/27 [00:03<00:00,  9.48it/s][A
100%|██████████| 27/27 [00:03<00:00,  7.74it/s][A
Epochs:  65%|██████▌   | 30/46 [13:45<07:08, 26.76s/it]

Val Loss: 2.4214 - Val Accuracy: 0.9208



Training:   0%|          | 0/209 [00:00<?, ?it/s][A
Training:   0%|          | 1/209 [00:00<02:38,  1.31it/s][A
Training:   2%|▏         | 4/209 [00:00<00:38,  5.39it/s][A
Training:   3%|▎         | 6/209 [00:01<00:34,  5.85it/s][A
Training:   4%|▍         | 9/209 [00:01<00:25,  7.97it/s][A
Training:   5%|▌         | 11/209 [00:01<00:22,  8.69it/s][A
Training:   6%|▌         | 13/209 [00:01<00:22,  8.82it/s][A
Training:   7%|▋         | 15/209 [00:01<00:19,  9.98it/s][A
Training:   8%|▊         | 17/209 [00:02<00:21,  9.07it/s][A
Training:   9%|▉         | 19/209 [00:02<00:18, 10.15it/s][A
Training:  10%|█         | 21/209 [00:02<00:24,  7.77it/s][A
Training:  11%|█         | 23/209 [00:02<00:20,  9.07it/s][A
Training:  12%|█▏        | 25/209 [00:03<00:24,  7.57it/s][A
Training:  13%|█▎        | 28/209 [00:03<00:17, 10.54it/s][A
Training:  14%|█▍        | 30/209 [00:03<00:20,  8.94it/s][A
Training:  15%|█▌        | 32/209 [00:03<00:17, 10.35it/s][A
Training:  16%|█▋   

Epoch: 31/46 - Loss: 2.3817 - Accuracy: 0.9269



  0%|          | 0/27 [00:00<?, ?it/s][A
  4%|▎         | 1/27 [00:00<00:17,  1.49it/s][A
 19%|█▊        | 5/27 [00:01<00:03,  5.79it/s][A
 26%|██▌       | 7/27 [00:01<00:02,  7.79it/s][A
 33%|███▎      | 9/27 [00:01<00:02,  7.35it/s][A
 41%|████      | 11/27 [00:01<00:01,  8.66it/s][A
 48%|████▊     | 13/27 [00:01<00:01,  8.62it/s][A
 56%|█████▌    | 15/27 [00:01<00:01,  9.24it/s][A
 63%|██████▎   | 17/27 [00:02<00:01,  9.31it/s][A
 70%|███████   | 19/27 [00:02<00:00,  9.94it/s][A
 78%|███████▊  | 21/27 [00:02<00:00,  8.17it/s][A
 81%|████████▏ | 22/27 [00:02<00:00,  8.27it/s][A
 93%|█████████▎| 25/27 [00:03<00:00,  8.01it/s][A
100%|██████████| 27/27 [00:03<00:00,  7.79it/s][A
Epochs:  67%|██████▋   | 31/46 [14:12<06:43, 26.89s/it]

Val Loss: 2.0671 - Val Accuracy: 0.9370



Training:   0%|          | 0/209 [00:00<?, ?it/s][A
Training:   0%|          | 1/209 [00:00<03:08,  1.10it/s][A
Training:   2%|▏         | 5/209 [00:01<00:43,  4.72it/s][A
Training:   4%|▍         | 9/209 [00:01<00:34,  5.73it/s][A
Training:   6%|▌         | 12/209 [00:01<00:24,  7.99it/s][A
Training:   7%|▋         | 14/209 [00:02<00:26,  7.31it/s][A
Training:   8%|▊         | 17/209 [00:02<00:25,  7.41it/s][A
Training:  10%|█         | 21/209 [00:03<00:22,  8.40it/s][A
Training:  12%|█▏        | 25/209 [00:03<00:21,  8.61it/s][A
Training:  13%|█▎        | 27/209 [00:03<00:18,  9.67it/s][A
Training:  14%|█▍        | 29/209 [00:03<00:21,  8.42it/s][A
Training:  15%|█▌        | 32/209 [00:04<00:16, 10.70it/s][A
Training:  16%|█▋        | 34/209 [00:04<00:18,  9.49it/s][A
Training:  18%|█▊        | 37/209 [00:04<00:19,  8.77it/s][A
Training:  19%|█▉        | 40/209 [00:04<00:16, 10.56it/s][A
Training:  20%|██        | 42/209 [00:05<00:18,  8.90it/s][A
Training:  21%|██  

Epoch: 32/46 - Loss: 2.0259 - Accuracy: 0.9351



  0%|          | 0/27 [00:00<?, ?it/s][A
  4%|▎         | 1/27 [00:00<00:23,  1.13it/s][A
  7%|▋         | 2/27 [00:01<00:11,  2.26it/s][A
 15%|█▍        | 4/27 [00:01<00:04,  5.05it/s][A
 22%|██▏       | 6/27 [00:01<00:03,  5.26it/s][A
 33%|███▎      | 9/27 [00:01<00:02,  7.49it/s][A
 41%|████      | 11/27 [00:01<00:01,  8.83it/s][A
 48%|████▊     | 13/27 [00:02<00:01,  9.14it/s][A
 56%|█████▌    | 15/27 [00:02<00:01, 10.18it/s][A
 63%|██████▎   | 17/27 [00:02<00:00, 10.51it/s][A
 70%|███████   | 19/27 [00:02<00:00, 10.18it/s][A
 78%|███████▊  | 21/27 [00:02<00:00, 10.56it/s][A
 85%|████████▌ | 23/27 [00:02<00:00, 10.94it/s][A
 93%|█████████▎| 25/27 [00:03<00:00, 10.01it/s][A
100%|██████████| 27/27 [00:03<00:00,  7.73it/s][A
Epochs:  70%|██████▉   | 32/46 [14:39<06:18, 27.06s/it]

Val Loss: 2.9057 - Val Accuracy: 0.9138



Training:   0%|          | 0/209 [00:00<?, ?it/s][A
Training:   0%|          | 1/209 [00:00<02:17,  1.51it/s][A
Training:   1%|▏         | 3/209 [00:00<00:47,  4.31it/s][A
Training:   2%|▏         | 4/209 [00:01<00:45,  4.52it/s][A
Training:   2%|▏         | 5/209 [00:01<00:38,  5.30it/s][A
Training:   3%|▎         | 7/209 [00:01<00:25,  7.83it/s][A
Training:   4%|▍         | 9/209 [00:01<00:26,  7.57it/s][A
Training:   5%|▌         | 11/209 [00:01<00:20,  9.52it/s][A
Training:   6%|▌         | 13/209 [00:01<00:22,  8.61it/s][A
Training:   8%|▊         | 16/209 [00:02<00:22,  8.70it/s][A
Training:   8%|▊         | 17/209 [00:02<00:22,  8.53it/s][A
Training:   9%|▉         | 19/209 [00:02<00:18, 10.35it/s][A
Training:  10%|█         | 21/209 [00:02<00:24,  7.53it/s][A
Training:  11%|█▏        | 24/209 [00:03<00:22,  8.38it/s][A
Training:  12%|█▏        | 25/209 [00:03<00:22,  8.06it/s][A
Training:  13%|█▎        | 28/209 [00:03<00:21,  8.60it/s][A
Training:  14%|█▍     

Epoch: 33/46 - Loss: 2.4725 - Accuracy: 0.9292



  0%|          | 0/27 [00:00<?, ?it/s][A
  4%|▎         | 1/27 [00:00<00:17,  1.45it/s][A
 11%|█         | 3/27 [00:00<00:05,  4.50it/s][A
 19%|█▊        | 5/27 [00:01<00:03,  5.81it/s][A
 26%|██▌       | 7/27 [00:01<00:02,  8.12it/s][A
 33%|███▎      | 9/27 [00:01<00:01,  9.34it/s][A
 41%|████      | 11/27 [00:01<00:01,  9.64it/s][A
 48%|████▊     | 13/27 [00:01<00:01, 10.21it/s][A
 56%|█████▌    | 15/27 [00:01<00:01, 10.07it/s][A
 63%|██████▎   | 17/27 [00:02<00:00, 11.11it/s][A
 70%|███████   | 19/27 [00:02<00:00, 10.13it/s][A
 78%|███████▊  | 21/27 [00:02<00:00, 10.23it/s][A
 85%|████████▌ | 23/27 [00:02<00:00,  8.76it/s][A
100%|██████████| 27/27 [00:03<00:00,  8.65it/s][A
Epochs:  72%|███████▏  | 33/46 [15:06<05:48, 26.84s/it]

Val Loss: 2.3818 - Val Accuracy: 0.9425



Training:   0%|          | 0/209 [00:00<?, ?it/s][A
Training:   0%|          | 1/209 [00:00<02:48,  1.23it/s][A
Training:   1%|▏         | 3/209 [00:00<00:52,  3.95it/s][A
Training:   2%|▏         | 5/209 [00:01<00:40,  5.07it/s][A
Training:   4%|▍         | 9/209 [00:01<00:27,  7.27it/s][A
Training:   6%|▌         | 13/209 [00:02<00:24,  8.10it/s][A
Training:   8%|▊         | 17/209 [00:02<00:21,  9.14it/s][A
Training:  10%|█         | 21/209 [00:02<00:20,  9.39it/s][A
Training:  12%|█▏        | 25/209 [00:03<00:19,  9.52it/s][A
Training:  13%|█▎        | 28/209 [00:03<00:15, 11.60it/s][A
Training:  14%|█▍        | 30/209 [00:03<00:18,  9.91it/s][A
Training:  16%|█▌        | 33/209 [00:03<00:18,  9.39it/s][A
Training:  17%|█▋        | 35/209 [00:04<00:16, 10.55it/s][A
Training:  18%|█▊        | 37/209 [00:04<00:17,  9.58it/s][A
Training:  19%|█▊        | 39/209 [00:04<00:15, 10.89it/s][A
Training:  20%|█▉        | 41/209 [00:04<00:19,  8.48it/s][A
Training:  22%|██▏  

Epoch: 34/46 - Loss: 2.5183 - Accuracy: 0.9283



  0%|          | 0/27 [00:00<?, ?it/s][A
  4%|▎         | 1/27 [00:00<00:21,  1.22it/s][A
 19%|█▊        | 5/27 [00:01<00:03,  5.61it/s][A
 26%|██▌       | 7/27 [00:01<00:02,  6.73it/s][A
 33%|███▎      | 9/27 [00:01<00:02,  7.08it/s][A
 41%|████      | 11/27 [00:01<00:01,  8.51it/s][A
 48%|████▊     | 13/27 [00:01<00:01,  8.02it/s][A
 56%|█████▌    | 15/27 [00:02<00:01,  9.55it/s][A
 63%|██████▎   | 17/27 [00:02<00:01,  8.82it/s][A
 70%|███████   | 19/27 [00:02<00:00, 10.08it/s][A
 78%|███████▊  | 21/27 [00:02<00:00, 10.17it/s][A
 85%|████████▌ | 23/27 [00:02<00:00, 10.61it/s][A
 93%|█████████▎| 25/27 [00:02<00:00, 11.63it/s][A
100%|██████████| 27/27 [00:03<00:00,  8.51it/s][A
Epochs:  74%|███████▍  | 34/46 [15:31<05:18, 26.54s/it]

Val Loss: 2.2240 - Val Accuracy: 0.9353



Training:   0%|          | 0/209 [00:00<?, ?it/s][A
Training:   0%|          | 1/209 [00:00<02:06,  1.64it/s][A
Training:   1%|▏         | 3/209 [00:00<00:41,  4.92it/s][A
Training:   2%|▏         | 5/209 [00:00<00:33,  6.12it/s][A
Training:   3%|▎         | 7/209 [00:01<00:25,  7.97it/s][A
Training:   4%|▍         | 9/209 [00:01<00:24,  8.26it/s][A
Training:   5%|▌         | 11/209 [00:01<00:27,  7.12it/s][A
Training:   6%|▌         | 13/209 [00:01<00:24,  8.02it/s][A
Training:   7%|▋         | 15/209 [00:02<00:26,  7.35it/s][A
Training:   8%|▊         | 17/209 [00:02<00:21,  8.95it/s][A
Training:   9%|▉         | 19/209 [00:02<00:25,  7.44it/s][A
Training:  11%|█         | 22/209 [00:02<00:21,  8.83it/s][A
Training:  11%|█▏        | 24/209 [00:03<00:21,  8.75it/s][A
Training:  12%|█▏        | 26/209 [00:03<00:21,  8.39it/s][A
Training:  13%|█▎        | 27/209 [00:03<00:21,  8.38it/s][A
Training:  14%|█▍        | 29/209 [00:03<00:18,  9.89it/s][A
Training:  15%|█▍    

Epoch: 35/46 - Loss: 2.2012 - Accuracy: 0.9312



  0%|          | 0/27 [00:00<?, ?it/s][A
  4%|▎         | 1/27 [00:00<00:19,  1.33it/s][A
  7%|▋         | 2/27 [00:00<00:10,  2.42it/s][A
 19%|█▊        | 5/27 [00:01<00:03,  5.86it/s][A
 22%|██▏       | 6/27 [00:01<00:03,  5.91it/s][A
 30%|██▉       | 8/27 [00:01<00:02,  7.75it/s][A
 37%|███▋      | 10/27 [00:01<00:02,  7.35it/s][A
 44%|████▍     | 12/27 [00:01<00:01,  8.27it/s][A
 52%|█████▏    | 14/27 [00:02<00:01,  7.89it/s][A
 59%|█████▉    | 16/27 [00:02<00:01,  8.44it/s][A
 67%|██████▋   | 18/27 [00:02<00:01,  8.64it/s][A
 74%|███████▍  | 20/27 [00:02<00:00,  7.89it/s][A
 81%|████████▏ | 22/27 [00:03<00:00,  8.84it/s][A
 89%|████████▉ | 24/27 [00:03<00:00,  8.98it/s][A
100%|██████████| 27/27 [00:03<00:00,  7.50it/s][A
Epochs:  76%|███████▌  | 35/46 [15:58<04:52, 26.60s/it]

Val Loss: 2.4489 - Val Accuracy: 0.9392



Training:   0%|          | 0/209 [00:00<?, ?it/s][A
Training:   0%|          | 1/209 [00:00<02:44,  1.26it/s][A
Training:   2%|▏         | 5/209 [00:01<00:41,  4.95it/s][A
Training:   3%|▎         | 7/209 [00:01<00:29,  6.91it/s][A
Training:   4%|▍         | 9/209 [00:01<00:28,  6.91it/s][A
Training:   6%|▌         | 12/209 [00:01<00:19, 10.29it/s][A
Training:   7%|▋         | 14/209 [00:02<00:25,  7.75it/s][A
Training:   8%|▊         | 17/209 [00:02<00:25,  7.68it/s][A
Training:  10%|█         | 21/209 [00:02<00:23,  7.94it/s][A
Training:  12%|█▏        | 25/209 [00:03<00:21,  8.44it/s][A
Training:  14%|█▍        | 29/209 [00:03<00:20,  8.86it/s][A
Training:  16%|█▌        | 33/209 [00:04<00:17, 10.01it/s][A
Training:  18%|█▊        | 37/209 [00:04<00:16, 10.39it/s][A
Training:  20%|█▉        | 41/209 [00:04<00:16, 10.40it/s][A
Training:  22%|██▏       | 45/209 [00:05<00:15, 10.69it/s][A
Training:  23%|██▎       | 49/209 [00:05<00:15, 10.16it/s][A
Training:  25%|██▍  

Epoch: 36/46 - Loss: 2.0813 - Accuracy: 0.9322



  0%|          | 0/27 [00:00<?, ?it/s][A
  4%|▎         | 1/27 [00:00<00:16,  1.57it/s][A
  7%|▋         | 2/27 [00:00<00:08,  3.00it/s][A
 19%|█▊        | 5/27 [00:01<00:03,  5.82it/s][A
 30%|██▉       | 8/27 [00:01<00:02,  8.05it/s][A
 33%|███▎      | 9/27 [00:01<00:02,  7.48it/s][A
 37%|███▋      | 10/27 [00:01<00:02,  7.86it/s][A
 44%|████▍     | 12/27 [00:01<00:01,  8.78it/s][A
 52%|█████▏    | 14/27 [00:01<00:01,  9.92it/s][A
 59%|█████▉    | 16/27 [00:02<00:01,  8.83it/s][A
 67%|██████▋   | 18/27 [00:02<00:00, 10.66it/s][A
 74%|███████▍  | 20/27 [00:02<00:00,  9.12it/s][A
 81%|████████▏ | 22/27 [00:02<00:00, 10.29it/s][A
 89%|████████▉ | 24/27 [00:02<00:00,  9.42it/s][A
100%|██████████| 27/27 [00:03<00:00,  8.35it/s][A
Epochs:  78%|███████▊  | 36/46 [16:25<04:25, 26.60s/it]

Val Loss: 2.3950 - Val Accuracy: 0.9265



Training:   0%|          | 0/209 [00:00<?, ?it/s][A
Training:   0%|          | 1/209 [00:00<02:32,  1.36it/s][A
Training:   1%|▏         | 3/209 [00:00<00:47,  4.36it/s][A
Training:   2%|▏         | 5/209 [00:01<00:39,  5.12it/s][A
Training:   3%|▎         | 7/209 [00:01<00:28,  7.11it/s][A
Training:   4%|▍         | 9/209 [00:01<00:27,  7.34it/s][A
Training:   5%|▌         | 11/209 [00:01<00:22,  8.90it/s][A
Training:   6%|▌         | 13/209 [00:01<00:23,  8.37it/s][A
Training:   7%|▋         | 15/209 [00:02<00:21,  9.20it/s][A
Training:   8%|▊         | 17/209 [00:02<00:25,  7.52it/s][A
Training:   9%|▉         | 19/209 [00:02<00:21,  9.01it/s][A
Training:  10%|█         | 21/209 [00:02<00:23,  8.00it/s][A
Training:  11%|█         | 23/209 [00:03<00:20,  9.29it/s][A
Training:  12%|█▏        | 25/209 [00:03<00:23,  7.90it/s][A
Training:  13%|█▎        | 27/209 [00:03<00:19,  9.44it/s][A
Training:  14%|█▍        | 29/209 [00:03<00:22,  7.91it/s][A
Training:  15%|█▍    

Epoch: 37/46 - Loss: 2.3064 - Accuracy: 0.9265



  0%|          | 0/27 [00:00<?, ?it/s][A
  4%|▎         | 1/27 [00:01<00:29,  1.12s/it][A
 19%|█▊        | 5/27 [00:01<00:05,  3.99it/s][A
 33%|███▎      | 9/27 [00:02<00:03,  5.55it/s][A
 48%|████▊     | 13/27 [00:02<00:02,  6.49it/s][A
 63%|██████▎   | 17/27 [00:02<00:01,  7.08it/s][A
 78%|███████▊  | 21/27 [00:03<00:00,  7.94it/s][A
100%|██████████| 27/27 [00:03<00:00,  6.91it/s][A
Epochs:  80%|████████  | 37/46 [16:52<04:00, 26.67s/it]

Val Loss: 2.2422 - Val Accuracy: 0.9392



Training:   0%|          | 0/209 [00:00<?, ?it/s][A
Training:   0%|          | 1/209 [00:00<02:49,  1.23it/s][A
Training:   1%|▏         | 3/209 [00:00<00:51,  3.99it/s][A
Training:   2%|▏         | 5/209 [00:01<00:40,  5.08it/s][A
Training:   3%|▎         | 6/209 [00:01<00:34,  5.83it/s][A
Training:   4%|▍         | 9/209 [00:01<00:27,  7.41it/s][A
Training:   5%|▍         | 10/209 [00:01<00:27,  7.25it/s][A
Training:   6%|▌         | 13/209 [00:02<00:24,  8.03it/s][A
Training:   7%|▋         | 15/209 [00:02<00:20,  9.67it/s][A
Training:   8%|▊         | 17/209 [00:02<00:22,  8.65it/s][A
Training:   9%|▉         | 19/209 [00:02<00:19,  9.91it/s][A
Training:  10%|█         | 21/209 [00:02<00:20,  9.14it/s][A
Training:  11%|█         | 23/209 [00:03<00:21,  8.61it/s][A
Training:  12%|█▏        | 25/209 [00:03<00:20,  9.06it/s][A
Training:  12%|█▏        | 26/209 [00:03<00:25,  7.19it/s][A
Training:  14%|█▍        | 29/209 [00:03<00:18,  9.57it/s][A
Training:  15%|█▍    

Epoch: 38/46 - Loss: 2.1965 - Accuracy: 0.9301



  0%|          | 0/27 [00:00<?, ?it/s][A
  4%|▎         | 1/27 [00:01<00:26,  1.00s/it][A
 19%|█▊        | 5/27 [00:01<00:05,  4.25it/s][A
 33%|███▎      | 9/27 [00:01<00:03,  5.87it/s][A
 48%|████▊     | 13/27 [00:02<00:01,  7.09it/s][A
 63%|██████▎   | 17/27 [00:02<00:01,  8.16it/s][A
 74%|███████▍  | 20/27 [00:02<00:00, 10.22it/s][A
 81%|████████▏ | 22/27 [00:03<00:00,  9.14it/s][A
100%|██████████| 27/27 [00:03<00:00,  7.50it/s][A
Epochs:  83%|████████▎ | 38/46 [17:18<03:32, 26.51s/it]

Val Loss: 2.3725 - Val Accuracy: 0.9409



Training:   0%|          | 0/209 [00:00<?, ?it/s][A
Training:   0%|          | 1/209 [00:00<02:06,  1.64it/s][A
Training:   1%|          | 2/209 [00:00<01:11,  2.90it/s][A
Training:   2%|▏         | 5/209 [00:00<00:28,  7.12it/s][A
Training:   3%|▎         | 7/209 [00:01<00:28,  7.01it/s][A
Training:   5%|▍         | 10/209 [00:01<00:26,  7.60it/s][A
Training:   6%|▌         | 12/209 [00:01<00:22,  8.77it/s][A
Training:   7%|▋         | 14/209 [00:02<00:26,  7.49it/s][A
Training:   8%|▊         | 17/209 [00:02<00:19,  9.62it/s][A
Training:   9%|▉         | 19/209 [00:02<00:21,  8.94it/s][A
Training:  11%|█         | 22/209 [00:02<00:19,  9.38it/s][A
Training:  12%|█▏        | 25/209 [00:02<00:15, 12.02it/s][A
Training:  13%|█▎        | 27/209 [00:03<00:16, 11.15it/s][A
Training:  14%|█▍        | 30/209 [00:03<00:17, 10.43it/s][A
Training:  16%|█▌        | 33/209 [00:03<00:15, 11.60it/s][A
Training:  17%|█▋        | 35/209 [00:03<00:17, 10.06it/s][A
Training:  18%|█▊   

Epoch: 39/46 - Loss: 2.1487 - Accuracy: 0.9287



  0%|          | 0/27 [00:00<?, ?it/s][A
  4%|▎         | 1/27 [00:00<00:21,  1.22it/s][A
  7%|▋         | 2/27 [00:00<00:10,  2.34it/s][A
 19%|█▊        | 5/27 [00:01<00:03,  5.63it/s][A
 22%|██▏       | 6/27 [00:01<00:03,  5.87it/s][A
 33%|███▎      | 9/27 [00:01<00:02,  7.51it/s][A
 44%|████▍     | 12/27 [00:01<00:01, 10.91it/s][A
 52%|█████▏    | 14/27 [00:02<00:01,  7.38it/s][A
 63%|██████▎   | 17/27 [00:02<00:01,  9.22it/s][A
 70%|███████   | 19/27 [00:02<00:01,  7.94it/s][A
 78%|███████▊  | 21/27 [00:02<00:00,  8.96it/s][A
 85%|████████▌ | 23/27 [00:03<00:00,  8.27it/s][A
 93%|█████████▎| 25/27 [00:03<00:00,  9.57it/s][A
100%|██████████| 27/27 [00:03<00:00,  7.41it/s][A
Epochs:  85%|████████▍ | 39/46 [17:44<03:05, 26.48s/it]

Val Loss: 2.4245 - Val Accuracy: 0.9226



Training:   0%|          | 0/209 [00:00<?, ?it/s][A
Training:   0%|          | 1/209 [00:00<02:31,  1.37it/s][A
Training:   1%|          | 2/209 [00:00<01:18,  2.64it/s][A
Training:   2%|▏         | 4/209 [00:01<00:38,  5.29it/s][A
Training:   2%|▏         | 5/209 [00:01<00:39,  5.11it/s][A
Training:   3%|▎         | 7/209 [00:01<00:28,  7.11it/s][A
Training:   4%|▍         | 8/209 [00:01<00:26,  7.58it/s][A
Training:   4%|▍         | 9/209 [00:01<00:35,  5.69it/s][A
Training:   6%|▌         | 12/209 [00:01<00:20,  9.44it/s][A
Training:   7%|▋         | 14/209 [00:02<00:27,  7.12it/s][A
Training:   8%|▊         | 16/209 [00:02<00:21,  8.92it/s][A
Training:   9%|▊         | 18/209 [00:02<00:25,  7.59it/s][A
Training:  10%|▉         | 20/209 [00:02<00:20,  9.40it/s][A
Training:  11%|█         | 22/209 [00:03<00:23,  8.09it/s][A
Training:  12%|█▏        | 25/209 [00:03<00:19,  9.21it/s][A
Training:  13%|█▎        | 28/209 [00:03<00:16, 10.97it/s][A
Training:  14%|█▍      

Epoch: 40/46 - Loss: 2.0388 - Accuracy: 0.9314



  0%|          | 0/27 [00:00<?, ?it/s][A
  4%|▎         | 1/27 [00:00<00:21,  1.21it/s][A
 15%|█▍        | 4/27 [00:00<00:04,  5.14it/s][A
 22%|██▏       | 6/27 [00:01<00:04,  4.94it/s][A
 33%|███▎      | 9/27 [00:01<00:03,  5.13it/s][A
 37%|███▋      | 10/27 [00:02<00:03,  5.19it/s][A
 48%|████▊     | 13/27 [00:02<00:02,  5.84it/s][A
 52%|█████▏    | 14/27 [00:02<00:02,  5.95it/s][A
 63%|██████▎   | 17/27 [00:03<00:01,  6.93it/s][A
 74%|███████▍  | 20/27 [00:03<00:00,  9.14it/s][A
 81%|████████▏ | 22/27 [00:03<00:00,  8.02it/s][A
 93%|█████████▎| 25/27 [00:03<00:00,  8.50it/s][A
100%|██████████| 27/27 [00:04<00:00,  6.41it/s][A
Epochs:  87%|████████▋ | 40/46 [18:12<02:41, 26.92s/it]

Val Loss: 2.2738 - Val Accuracy: 0.9425



Training:   0%|          | 0/209 [00:00<?, ?it/s][A
Training:   0%|          | 1/209 [00:01<03:26,  1.01it/s][A
Training:   2%|▏         | 4/209 [00:01<00:44,  4.56it/s][A
Training:   3%|▎         | 6/209 [00:01<00:39,  5.08it/s][A
Training:   4%|▍         | 9/209 [00:01<00:31,  6.44it/s][A
Training:   6%|▌         | 12/209 [00:01<00:21,  9.31it/s][A
Training:   7%|▋         | 14/209 [00:02<00:26,  7.42it/s][A
Training:   8%|▊         | 16/209 [00:02<00:21,  9.02it/s][A
Training:   9%|▊         | 18/209 [00:02<00:24,  7.73it/s][A
Training:  10%|▉         | 20/209 [00:02<00:21,  8.94it/s][A
Training:  11%|█         | 22/209 [00:03<00:22,  8.23it/s][A
Training:  11%|█▏        | 24/209 [00:03<00:19,  9.47it/s][A
Training:  12%|█▏        | 26/209 [00:03<00:19,  9.24it/s][A
Training:  14%|█▍        | 29/209 [00:03<00:21,  8.46it/s][A
Training:  15%|█▍        | 31/209 [00:04<00:17,  9.93it/s][A
Training:  16%|█▌        | 33/209 [00:04<00:22,  7.92it/s][A
Training:  17%|█▋   

Epoch: 41/46 - Loss: 2.0570 - Accuracy: 0.9327



  0%|          | 0/27 [00:00<?, ?it/s][A
  4%|▎         | 1/27 [00:00<00:21,  1.23it/s][A
  7%|▋         | 2/27 [00:01<00:11,  2.20it/s][A
 19%|█▊        | 5/27 [00:01<00:04,  5.44it/s][A
 22%|██▏       | 6/27 [00:01<00:04,  5.12it/s][A
 33%|███▎      | 9/27 [00:01<00:02,  7.05it/s][A
 37%|███▋      | 10/27 [00:01<00:02,  6.41it/s][A
 48%|████▊     | 13/27 [00:02<00:01,  8.29it/s][A
 52%|█████▏    | 14/27 [00:02<00:01,  7.51it/s][A
 63%|██████▎   | 17/27 [00:02<00:01,  8.19it/s][A
 67%|██████▋   | 18/27 [00:02<00:01,  7.76it/s][A
 78%|███████▊  | 21/27 [00:03<00:00,  8.72it/s][A
 81%|████████▏ | 22/27 [00:03<00:00,  8.36it/s][A
100%|██████████| 27/27 [00:03<00:00,  7.15it/s][A
Epochs:  89%|████████▉ | 41/46 [18:40<02:15, 27.17s/it]

Val Loss: 2.5845 - Val Accuracy: 0.9174



Training:   0%|          | 0/209 [00:00<?, ?it/s][A
Training:   0%|          | 1/209 [00:00<02:52,  1.20it/s][A
Training:   1%|          | 2/209 [00:01<01:32,  2.24it/s][A
Training:   2%|▏         | 5/209 [00:01<00:37,  5.49it/s][A
Training:   3%|▎         | 6/209 [00:01<00:35,  5.80it/s][A
Training:   4%|▍         | 8/209 [00:01<00:26,  7.69it/s][A
Training:   4%|▍         | 9/209 [00:01<00:29,  6.71it/s][A
Training:   5%|▍         | 10/209 [00:01<00:29,  6.77it/s][A
Training:   6%|▌         | 13/209 [00:02<00:24,  8.04it/s][A
Training:   7%|▋         | 15/209 [00:02<00:20,  9.60it/s][A
Training:   8%|▊         | 17/209 [00:02<00:21,  8.96it/s][A
Training:   9%|▉         | 19/209 [00:02<00:18, 10.26it/s][A
Training:  10%|█         | 21/209 [00:02<00:20,  9.36it/s][A
Training:  11%|█         | 23/209 [00:03<00:20,  9.11it/s][A
Training:  12%|█▏        | 25/209 [00:03<00:17, 10.52it/s][A
Training:  13%|█▎        | 27/209 [00:03<00:19,  9.24it/s][A
Training:  14%|█▍     

Epoch: 42/46 - Loss: 2.2971 - Accuracy: 0.9292



  0%|          | 0/27 [00:00<?, ?it/s][A
  4%|▎         | 1/27 [00:00<00:20,  1.27it/s][A
  7%|▋         | 2/27 [00:00<00:10,  2.35it/s][A
 19%|█▊        | 5/27 [00:01<00:03,  5.82it/s][A
 22%|██▏       | 6/27 [00:01<00:04,  5.08it/s][A
 33%|███▎      | 9/27 [00:01<00:02,  6.77it/s][A
 37%|███▋      | 10/27 [00:01<00:02,  6.71it/s][A
 48%|████▊     | 13/27 [00:02<00:01,  8.79it/s][A
 52%|█████▏    | 14/27 [00:02<00:01,  7.39it/s][A
 63%|██████▎   | 17/27 [00:02<00:00, 10.03it/s][A
 70%|███████   | 19/27 [00:02<00:00,  8.97it/s][A
 78%|███████▊  | 21/27 [00:02<00:00,  9.56it/s][A
 85%|████████▌ | 23/27 [00:03<00:00,  9.71it/s][A
 93%|█████████▎| 25/27 [00:03<00:00,  8.44it/s][A
100%|██████████| 27/27 [00:03<00:00,  7.25it/s][A
Epochs:  91%|█████████▏| 42/46 [19:08<01:49, 27.38s/it]

Val Loss: 2.1904 - Val Accuracy: 0.9403



Training:   0%|          | 0/209 [00:00<?, ?it/s][A
Training:   0%|          | 1/209 [00:00<03:11,  1.08it/s][A
Training:   1%|▏         | 3/209 [00:01<00:59,  3.48it/s][A
Training:   2%|▏         | 5/209 [00:01<00:43,  4.71it/s][A
Training:   3%|▎         | 6/209 [00:01<00:37,  5.35it/s][A
Training:   4%|▍         | 9/209 [00:01<00:32,  6.13it/s][A
Training:   5%|▍         | 10/209 [00:01<00:30,  6.61it/s][A
Training:   6%|▌         | 13/209 [00:02<00:27,  7.22it/s][A
Training:   7%|▋         | 15/209 [00:02<00:21,  8.98it/s][A
Training:   8%|▊         | 17/209 [00:02<00:25,  7.56it/s][A
Training:  10%|▉         | 20/209 [00:02<00:18, 10.42it/s][A
Training:  11%|█         | 22/209 [00:03<00:18,  9.94it/s][A
Training:  12%|█▏        | 25/209 [00:03<00:18,  9.87it/s][A
Training:  14%|█▍        | 29/209 [00:03<00:18,  9.92it/s][A
Training:  16%|█▌        | 33/209 [00:04<00:19,  9.00it/s][A
Training:  17%|█▋        | 36/209 [00:04<00:15, 11.05it/s][A
Training:  18%|█▊    

Epoch: 43/46 - Loss: 2.0546 - Accuracy: 0.9293



  0%|          | 0/27 [00:00<?, ?it/s][A
  4%|▎         | 1/27 [00:00<00:18,  1.40it/s][A
 11%|█         | 3/27 [00:00<00:05,  4.41it/s][A
 19%|█▊        | 5/27 [00:01<00:03,  5.52it/s][A
 22%|██▏       | 6/27 [00:01<00:03,  5.70it/s][A
 33%|███▎      | 9/27 [00:01<00:02,  8.38it/s][A
 41%|████      | 11/27 [00:01<00:01,  9.92it/s][A
 48%|████▊     | 13/27 [00:01<00:01,  9.87it/s][A
 56%|█████▌    | 15/27 [00:01<00:01, 10.67it/s][A
 63%|██████▎   | 17/27 [00:02<00:01,  9.61it/s][A
 70%|███████   | 19/27 [00:02<00:00, 10.03it/s][A
 78%|███████▊  | 21/27 [00:02<00:00, 10.13it/s][A
 85%|████████▌ | 23/27 [00:02<00:00,  9.59it/s][A
100%|██████████| 27/27 [00:03<00:00,  8.23it/s][A
Epochs:  93%|█████████▎| 43/46 [19:35<01:21, 27.27s/it]

Val Loss: 2.4905 - Val Accuracy: 0.9397



Training:   0%|          | 0/209 [00:00<?, ?it/s][A
Training:   0%|          | 1/209 [00:00<03:07,  1.11it/s][A
Training:   2%|▏         | 5/209 [00:01<00:44,  4.55it/s][A
Training:   3%|▎         | 7/209 [00:01<00:31,  6.32it/s][A
Training:   4%|▍         | 9/209 [00:01<00:33,  6.00it/s][A
Training:   6%|▌         | 12/209 [00:01<00:21,  9.12it/s][A
Training:   7%|▋         | 14/209 [00:02<00:23,  8.19it/s][A
Training:   8%|▊         | 17/209 [00:02<00:27,  7.07it/s][A
Training:  10%|▉         | 20/209 [00:02<00:19,  9.66it/s][A
Training:  11%|█         | 22/209 [00:03<00:24,  7.54it/s][A
Training:  12%|█▏        | 25/209 [00:03<00:25,  7.32it/s][A
Training:  13%|█▎        | 27/209 [00:03<00:21,  8.62it/s][A
Training:  14%|█▍        | 29/209 [00:04<00:23,  7.55it/s][A
Training:  16%|█▌        | 33/209 [00:04<00:20,  8.77it/s][A
Training:  18%|█▊        | 37/209 [00:04<00:19,  8.61it/s][A
Training:  20%|█▉        | 41/209 [00:05<00:18,  9.27it/s][A
Training:  21%|██   

Epoch: 44/46 - Loss: 2.3286 - Accuracy: 0.9334



  0%|          | 0/27 [00:00<?, ?it/s][A
  4%|▎         | 1/27 [00:00<00:23,  1.13it/s][A
 19%|█▊        | 5/27 [00:01<00:04,  5.22it/s][A
 30%|██▉       | 8/27 [00:01<00:02,  8.09it/s][A
 37%|███▋      | 10/27 [00:01<00:02,  7.04it/s][A
 48%|████▊     | 13/27 [00:02<00:02,  6.69it/s][A
 59%|█████▉    | 16/27 [00:02<00:01,  9.01it/s][A
 67%|██████▋   | 18/27 [00:02<00:01,  7.33it/s][A
 78%|███████▊  | 21/27 [00:03<00:00,  7.14it/s][A
100%|██████████| 27/27 [00:03<00:00,  7.25it/s][A
Epochs:  96%|█████████▌| 44/46 [20:02<00:54, 27.40s/it]

Val Loss: 2.8363 - Val Accuracy: 0.8583



Training:   0%|          | 0/209 [00:00<?, ?it/s][A
Training:   0%|          | 1/209 [00:00<02:50,  1.22it/s][A
Training:   2%|▏         | 5/209 [00:01<00:40,  5.04it/s][A
Training:   4%|▍         | 9/209 [00:01<00:27,  7.17it/s][A
Training:   6%|▌         | 13/209 [00:01<00:22,  8.62it/s][A
Training:   8%|▊         | 16/209 [00:02<00:18, 10.62it/s][A
Training:   9%|▊         | 18/209 [00:02<00:20,  9.44it/s][A
Training:  10%|▉         | 20/209 [00:02<00:18, 10.20it/s][A
Training:  11%|█         | 22/209 [00:02<00:22,  8.21it/s][A
Training:  11%|█         | 23/209 [00:03<00:24,  7.71it/s][A
Training:  12%|█▏        | 25/209 [00:03<00:25,  7.22it/s][A
Training:  13%|█▎        | 27/209 [00:03<00:20,  8.88it/s][A
Training:  14%|█▍        | 29/209 [00:03<00:22,  8.17it/s][A
Training:  15%|█▍        | 31/209 [00:03<00:18,  9.61it/s][A
Training:  16%|█▌        | 33/209 [00:04<00:19,  8.90it/s][A
Training:  17%|█▋        | 35/209 [00:04<00:16, 10.68it/s][A
Training:  18%|█▊  

Epoch: 45/46 - Loss: 2.1357 - Accuracy: 0.9292



  0%|          | 0/27 [00:00<?, ?it/s][A
  4%|▎         | 1/27 [00:00<00:25,  1.01it/s][A
 19%|█▊        | 5/27 [00:01<00:05,  4.17it/s][A
 33%|███▎      | 9/27 [00:01<00:03,  5.75it/s][A
 48%|████▊     | 13/27 [00:02<00:01,  7.10it/s][A
 63%|██████▎   | 17/27 [00:02<00:01,  8.20it/s][A
 78%|███████▊  | 21/27 [00:03<00:00,  8.97it/s][A
100%|██████████| 27/27 [00:03<00:00,  7.71it/s][A
Epochs:  98%|█████████▊| 45/46 [20:30<00:27, 27.46s/it]

Val Loss: 2.3379 - Val Accuracy: 0.9348



Training:   0%|          | 0/209 [00:00<?, ?it/s][A
Training:   0%|          | 1/209 [00:00<03:13,  1.07it/s][A
Training:   1%|▏         | 3/209 [00:01<00:57,  3.59it/s][A
Training:   2%|▏         | 5/209 [00:01<00:39,  5.14it/s][A
Training:   3%|▎         | 7/209 [00:01<00:30,  6.56it/s][A
Training:   4%|▍         | 9/209 [00:01<00:30,  6.62it/s][A
Training:   5%|▍         | 10/209 [00:01<00:30,  6.59it/s][A
Training:   6%|▌         | 13/209 [00:02<00:26,  7.34it/s][A
Training:   7%|▋         | 15/209 [00:02<00:22,  8.51it/s][A
Training:   8%|▊         | 17/209 [00:02<00:22,  8.41it/s][A
Training:   9%|▊         | 18/209 [00:02<00:22,  8.61it/s][A
Training:  10%|█         | 21/209 [00:03<00:19,  9.54it/s][A
Training:  11%|█         | 22/209 [00:03<00:20,  9.26it/s][A
Training:  12%|█▏        | 25/209 [00:03<00:18,  9.87it/s][A
Training:  12%|█▏        | 26/209 [00:03<00:18,  9.64it/s][A
Training:  14%|█▍        | 29/209 [00:03<00:19,  9.28it/s][A
Training:  14%|█▍    

Epoch: 46/46 - Loss: 1.9832 - Accuracy: 0.9315



  0%|          | 0/27 [00:00<?, ?it/s][A
  4%|▎         | 1/27 [00:00<00:20,  1.24it/s][A
  7%|▋         | 2/27 [00:00<00:10,  2.48it/s][A
 19%|█▊        | 5/27 [00:01<00:04,  5.44it/s][A
 26%|██▌       | 7/27 [00:01<00:02,  7.63it/s][A
 33%|███▎      | 9/27 [00:01<00:02,  6.77it/s][A
 44%|████▍     | 12/27 [00:01<00:01, 10.10it/s][A
 52%|█████▏    | 14/27 [00:02<00:01,  8.47it/s][A
 63%|██████▎   | 17/27 [00:02<00:01,  7.88it/s][A
 70%|███████   | 19/27 [00:02<00:00,  9.35it/s][A
 78%|███████▊  | 21/27 [00:03<00:00,  7.51it/s][A
100%|██████████| 27/27 [00:03<00:00,  7.59it/s][A
Epochs: 100%|██████████| 46/46 [20:57<00:00, 27.34s/it]


Val Loss: 2.3550 - Val Accuracy: 0.9292
Saving best model...


[32m[I 2023-12-14 22:45:39,073][0m Trial 1 finished with value: 0.9292426705360413 and parameters: {'loss_learning_rate': 0.0017350666898728663, 'learning_rate': 0.008226302275945433, 'weight_decay': 0.0019297756421957702, 'epsilon': 1.7694055881118126e-09, 'batch_size': 67, 'epochs': 46}. Best is trial 1 with value: 0.9292426705360413.[0m


Learning rate for Loss: 0.00043085489957524003
Learning rate: 0.06802471398172366
Weight decay: 0.0004464693466243797
Epsilon: 4.952031792291727e-09
Batch size: 177
Number of epochs: 76


Epochs:   0%|          | 0/76 [00:00<?, ?it/s]
Training:   0%|          | 0/79 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/79 [00:01<02:05,  1.61s/it][A
Training:   4%|▍         | 3/79 [00:01<00:35,  2.17it/s][A
Training:   6%|▋         | 5/79 [00:02<00:38,  1.93it/s][A
Training:  10%|█         | 8/79 [00:02<00:18,  3.76it/s][A
Training:  13%|█▎        | 10/79 [00:03<00:22,  3.07it/s][A
Training:  15%|█▌        | 12/79 [00:03<00:16,  4.17it/s][A
Training:  18%|█▊        | 14/79 [00:04<00:19,  3.37it/s][A
Training:  20%|██        | 16/79 [00:04<00:14,  4.48it/s][A
Training:  23%|██▎       | 18/79 [00:05<00:18,  3.27it/s][A
Training:  25%|██▌       | 20/79 [00:06<00:13,  4.36it/s][A
Training:  28%|██▊       | 22/79 [00:07<00:17,  3.19it/s][A
Training:  30%|███       | 24/79 [00:07<00:13,  4.11it/s][A
Training:  32%|███▏      | 25/79 [00:07<00:17,  3.05it/s][A
Training:  35%|███▌      | 28/79 [00:08<00:10,  4.69it/s][A
Training:  37%|███▋      | 29/79 [00:09<00:17,  2.8

Epoch: 1/76 - Loss: 38.9988 - Accuracy: 0.7601



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:01<00:13,  1.54s/it][A
 30%|███       | 3/10 [00:01<00:03,  2.19it/s][A
 50%|█████     | 5/10 [00:02<00:02,  2.05it/s][A
 60%|██████    | 6/10 [00:02<00:01,  2.50it/s][A
100%|██████████| 10/10 [00:04<00:00,  2.46it/s][A
Epochs:   1%|▏         | 1/76 [00:27<34:58, 27.98s/it]

Val Loss: 11.8739 - Val Accuracy: 0.8990



Training:   0%|          | 0/79 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/79 [00:01<01:57,  1.50s/it][A
Training:   5%|▌         | 4/79 [00:01<00:23,  3.18it/s][A
Training:   8%|▊         | 6/79 [00:02<00:34,  2.14it/s][A
Training:  10%|█         | 8/79 [00:03<00:22,  3.15it/s][A
Training:  13%|█▎        | 10/79 [00:03<00:24,  2.78it/s][A
Training:  15%|█▌        | 12/79 [00:04<00:17,  3.77it/s][A
Training:  16%|█▋        | 13/79 [00:04<00:22,  2.94it/s][A
Training:  19%|█▉        | 15/79 [00:05<00:17,  3.75it/s][A
Training:  22%|██▏       | 17/79 [00:05<00:19,  3.22it/s][A
Training:  23%|██▎       | 18/79 [00:05<00:16,  3.70it/s][A
Training:  24%|██▍       | 19/79 [00:06<00:16,  3.64it/s][A
Training:  27%|██▋       | 21/79 [00:06<00:17,  3.31it/s][A
Training:  29%|██▉       | 23/79 [00:07<00:15,  3.52it/s][A
Training:  32%|███▏      | 25/79 [00:07<00:14,  3.82it/s][A
Training:  34%|███▍      | 27/79 [00:08<00:13,  3.76it/s][A
Training:  35%|███▌      | 28/79 [00

Epoch: 2/76 - Loss: 5.8181 - Accuracy: 0.8908



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:01<00:15,  1.73s/it][A
 20%|██        | 2/10 [00:01<00:06,  1.22it/s][A
 50%|█████     | 5/10 [00:02<00:02,  2.24it/s][A
 60%|██████    | 6/10 [00:03<00:01,  2.17it/s][A
 90%|█████████ | 9/10 [00:04<00:00,  2.89it/s][A
100%|██████████| 10/10 [00:04<00:00,  2.29it/s][A
Epochs:   3%|▎         | 2/76 [00:56<34:42, 28.15s/it]

Val Loss: 5.0947 - Val Accuracy: 0.9208



Training:   0%|          | 0/79 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/79 [00:01<02:13,  1.71s/it][A
Training:   4%|▍         | 3/79 [00:01<00:38,  1.98it/s][A
Training:   6%|▋         | 5/79 [00:02<00:35,  2.06it/s][A
Training:   9%|▉         | 7/79 [00:02<00:23,  3.13it/s][A
Training:  11%|█▏        | 9/79 [00:03<00:24,  2.86it/s][A
Training:  13%|█▎        | 10/79 [00:03<00:20,  3.36it/s][A
Training:  15%|█▌        | 12/79 [00:04<00:13,  4.86it/s][A
Training:  18%|█▊        | 14/79 [00:05<00:20,  3.18it/s][A
Training:  20%|██        | 16/79 [00:05<00:14,  4.41it/s][A
Training:  23%|██▎       | 18/79 [00:06<00:20,  2.93it/s][A
Training:  25%|██▌       | 20/79 [00:06<00:15,  3.86it/s][A
Training:  27%|██▋       | 21/79 [00:07<00:20,  2.88it/s][A
Training:  29%|██▉       | 23/79 [00:07<00:13,  4.03it/s][A
Training:  32%|███▏      | 25/79 [00:08<00:19,  2.77it/s][A
Training:  34%|███▍      | 27/79 [00:08<00:13,  3.74it/s][A
Training:  37%|███▋      | 29/79 [00:

Epoch: 3/76 - Loss: 4.6785 - Accuracy: 0.8959



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:01<00:13,  1.45s/it][A
 20%|██        | 2/10 [00:01<00:05,  1.40it/s][A
 50%|█████     | 5/10 [00:02<00:02,  2.34it/s][A
 60%|██████    | 6/10 [00:02<00:01,  2.67it/s][A
100%|██████████| 10/10 [00:03<00:00,  2.58it/s][A
Epochs:   4%|▍         | 3/76 [01:24<34:10, 28.09s/it]

Val Loss: 5.1502 - Val Accuracy: 0.9056



Training:   0%|          | 0/79 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/79 [00:01<02:03,  1.59s/it][A
Training:   4%|▍         | 3/79 [00:01<00:35,  2.16it/s][A
Training:   6%|▋         | 5/79 [00:02<00:38,  1.93it/s][A
Training:  10%|█         | 8/79 [00:03<00:19,  3.69it/s][A
Training:  13%|█▎        | 10/79 [00:03<00:22,  3.08it/s][A
Training:  16%|█▋        | 13/79 [00:04<00:22,  2.94it/s][A
Training:  22%|██▏       | 17/79 [00:06<00:19,  3.11it/s][A
Training:  23%|██▎       | 18/79 [00:06<00:17,  3.43it/s][A
Training:  27%|██▋       | 21/79 [00:07<00:16,  3.42it/s][A
Training:  30%|███       | 24/79 [00:07<00:11,  4.92it/s][A
Training:  33%|███▎      | 26/79 [00:08<00:13,  3.89it/s][A
Training:  34%|███▍      | 27/79 [00:08<00:12,  4.28it/s][A
Training:  35%|███▌      | 28/79 [00:08<00:10,  4.74it/s][A
Training:  37%|███▋      | 29/79 [00:09<00:17,  2.88it/s][A
Training:  41%|████      | 32/79 [00:09<00:09,  4.95it/s][A
Training:  43%|████▎     | 34/79 [00

Epoch: 4/76 - Loss: 4.0974 - Accuracy: 0.9039



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:01<00:12,  1.41s/it][A
 20%|██        | 2/10 [00:01<00:06,  1.32it/s][A
 40%|████      | 4/10 [00:01<00:02,  3.00it/s][A
 50%|█████     | 5/10 [00:02<00:02,  1.99it/s][A
 60%|██████    | 6/10 [00:02<00:01,  2.51it/s][A
 80%|████████  | 8/10 [00:03<00:00,  4.13it/s][A
100%|██████████| 10/10 [00:03<00:00,  2.53it/s][A
Epochs:   5%|▌         | 4/76 [01:52<33:35, 27.99s/it]

Val Loss: 4.0008 - Val Accuracy: 0.8673



Training:   0%|          | 0/79 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/79 [00:01<02:17,  1.76s/it][A
Training:   4%|▍         | 3/79 [00:01<00:38,  1.95it/s][A
Training:   6%|▋         | 5/79 [00:02<00:35,  2.06it/s][A
Training:   9%|▉         | 7/79 [00:02<00:21,  3.29it/s][A
Training:  11%|█▏        | 9/79 [00:03<00:25,  2.77it/s][A
Training:  15%|█▌        | 12/79 [00:03<00:14,  4.61it/s][A
Training:  18%|█▊        | 14/79 [00:04<00:17,  3.62it/s][A
Training:  22%|██▏       | 17/79 [00:05<00:16,  3.66it/s][A
Training:  24%|██▍       | 19/79 [00:05<00:13,  4.42it/s][A
Training:  27%|██▋       | 21/79 [00:06<00:14,  3.98it/s][A
Training:  28%|██▊       | 22/79 [00:06<00:13,  4.13it/s][A
Training:  29%|██▉       | 23/79 [00:06<00:13,  4.24it/s][A
Training:  32%|███▏      | 25/79 [00:07<00:12,  4.34it/s][A
Training:  33%|███▎      | 26/79 [00:07<00:13,  4.05it/s][A
Training:  34%|███▍      | 27/79 [00:07<00:12,  4.21it/s][A
Training:  37%|███▋      | 29/79 [00:

Epoch: 5/76 - Loss: 5.9647 - Accuracy: 0.8870



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:01<00:14,  1.62s/it][A
 20%|██        | 2/10 [00:01<00:05,  1.38it/s][A
 50%|█████     | 5/10 [00:02<00:02,  2.19it/s][A
 60%|██████    | 6/10 [00:03<00:01,  2.45it/s][A
 80%|████████  | 8/10 [00:03<00:00,  3.84it/s][A
100%|██████████| 10/10 [00:04<00:00,  2.47it/s][A
Epochs:   7%|▋         | 5/76 [02:19<32:45, 27.69s/it]

Val Loss: 4.4346 - Val Accuracy: 0.8978



Training:   0%|          | 0/79 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/79 [00:01<02:03,  1.58s/it][A
Training:   5%|▌         | 4/79 [00:01<00:24,  3.06it/s][A
Training:   8%|▊         | 6/79 [00:02<00:32,  2.28it/s][A
Training:  10%|█         | 8/79 [00:03<00:21,  3.35it/s][A
Training:  13%|█▎        | 10/79 [00:04<00:26,  2.60it/s][A
Training:  15%|█▌        | 12/79 [00:04<00:18,  3.64it/s][A
Training:  18%|█▊        | 14/79 [00:05<00:22,  2.86it/s][A
Training:  20%|██        | 16/79 [00:05<00:16,  3.83it/s][A
Training:  23%|██▎       | 18/79 [00:06<00:19,  3.10it/s][A
Training:  27%|██▋       | 21/79 [00:07<00:18,  3.09it/s][A
Training:  30%|███       | 24/79 [00:07<00:12,  4.54it/s][A
Training:  33%|███▎      | 26/79 [00:08<00:15,  3.53it/s][A
Training:  35%|███▌      | 28/79 [00:08<00:11,  4.43it/s][A
Training:  38%|███▊      | 30/79 [00:09<00:13,  3.50it/s][A
Training:  41%|████      | 32/79 [00:09<00:10,  4.48it/s][A
Training:  43%|████▎     | 34/79 [00

Epoch: 6/76 - Loss: 5.9222 - Accuracy: 0.8980



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:01<00:14,  1.58s/it][A
 30%|███       | 3/10 [00:01<00:03,  2.10it/s][A
 50%|█████     | 5/10 [00:02<00:02,  2.01it/s][A
 70%|███████   | 7/10 [00:02<00:00,  3.23it/s][A
100%|██████████| 10/10 [00:03<00:00,  2.53it/s][A
Epochs:   8%|▊         | 6/76 [02:46<32:04, 27.50s/it]

Val Loss: 4.5755 - Val Accuracy: 0.9331



Training:   0%|          | 0/79 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/79 [00:01<01:57,  1.50s/it][A
Training:   3%|▎         | 2/79 [00:01<00:52,  1.46it/s][A
Training:   4%|▍         | 3/79 [00:01<00:33,  2.25it/s][A
Training:   5%|▌         | 4/79 [00:01<00:23,  3.21it/s][A
Training:   6%|▋         | 5/79 [00:02<00:33,  2.19it/s][A
Training:   9%|▉         | 7/79 [00:02<00:20,  3.53it/s][A
Training:  11%|█▏        | 9/79 [00:03<00:25,  2.74it/s][A
Training:  13%|█▎        | 10/79 [00:03<00:21,  3.27it/s][A
Training:  14%|█▍        | 11/79 [00:04<00:17,  3.81it/s][A
Training:  16%|█▋        | 13/79 [00:05<00:24,  2.69it/s][A
Training:  19%|█▉        | 15/79 [00:05<00:17,  3.75it/s][A
Training:  22%|██▏       | 17/79 [00:06<00:22,  2.80it/s][A
Training:  24%|██▍       | 19/79 [00:06<00:15,  3.85it/s][A
Training:  27%|██▋       | 21/79 [00:07<00:19,  3.02it/s][A
Training:  29%|██▉       | 23/79 [00:07<00:13,  4.08it/s][A
Training:  32%|███▏      | 25/79 [00:08

Epoch: 7/76 - Loss: 11.1106 - Accuracy: 0.8912



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:01<00:14,  1.61s/it][A
 20%|██        | 2/10 [00:01<00:05,  1.38it/s][A
 40%|████      | 4/10 [00:01<00:01,  3.15it/s][A
 50%|█████     | 5/10 [00:02<00:02,  1.83it/s][A
100%|██████████| 10/10 [00:03<00:00,  2.50it/s][A
Epochs:   9%|▉         | 7/76 [03:13<31:37, 27.49s/it]

Val Loss: 43.3860 - Val Accuracy: 0.8197



Training:   0%|          | 0/79 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/79 [00:01<01:50,  1.42s/it][A
Training:   3%|▎         | 2/79 [00:01<00:52,  1.48it/s][A
Training:   5%|▌         | 4/79 [00:01<00:26,  2.86it/s][A
Training:   6%|▋         | 5/79 [00:02<00:36,  2.04it/s][A
Training:   9%|▉         | 7/79 [00:02<00:21,  3.39it/s][A
Training:  10%|█         | 8/79 [00:03<00:20,  3.48it/s][A
Training:  11%|█▏        | 9/79 [00:03<00:28,  2.49it/s][A
Training:  14%|█▍        | 11/79 [00:03<00:17,  3.81it/s][A
Training:  15%|█▌        | 12/79 [00:04<00:19,  3.40it/s][A
Training:  16%|█▋        | 13/79 [00:04<00:21,  3.10it/s][A
Training:  18%|█▊        | 14/79 [00:05<00:20,  3.24it/s][A
Training:  19%|█▉        | 15/79 [00:05<00:16,  3.90it/s][A
Training:  20%|██        | 16/79 [00:05<00:17,  3.51it/s][A
Training:  22%|██▏       | 17/79 [00:06<00:21,  2.90it/s][A
Training:  23%|██▎       | 18/79 [00:06<00:21,  2.87it/s][A
Training:  25%|██▌       | 20/79 [00:06

Epoch: 8/76 - Loss: 8.7930 - Accuracy: 0.8936



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:01<00:14,  1.58s/it][A
 20%|██        | 2/10 [00:01<00:06,  1.33it/s][A
 40%|████      | 4/10 [00:01<00:01,  3.09it/s][A
 50%|█████     | 5/10 [00:02<00:02,  2.08it/s][A
 60%|██████    | 6/10 [00:02<00:01,  2.44it/s][A
 80%|████████  | 8/10 [00:03<00:00,  3.98it/s][A
100%|██████████| 10/10 [00:03<00:00,  2.51it/s][A
Epochs:  11%|█         | 8/76 [03:40<30:59, 27.35s/it]

Val Loss: 24.2109 - Val Accuracy: 0.8846



Training:   0%|          | 0/79 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/79 [00:01<01:45,  1.35s/it][A
Training:   3%|▎         | 2/79 [00:01<01:01,  1.25it/s][A
Training:   4%|▍         | 3/79 [00:01<00:36,  2.07it/s][A
Training:   6%|▋         | 5/79 [00:02<00:31,  2.33it/s][A
Training:   8%|▊         | 6/79 [00:02<00:29,  2.48it/s][A
Training:  10%|█         | 8/79 [00:03<00:18,  3.90it/s][A
Training:  11%|█▏        | 9/79 [00:03<00:22,  3.13it/s][A
Training:  13%|█▎        | 10/79 [00:04<00:24,  2.78it/s][A
Training:  15%|█▌        | 12/79 [00:04<00:15,  4.31it/s][A
Training:  16%|█▋        | 13/79 [00:04<00:18,  3.55it/s][A
Training:  18%|█▊        | 14/79 [00:05<00:25,  2.55it/s][A
Training:  20%|██        | 16/79 [00:05<00:15,  4.01it/s][A
Training:  23%|██▎       | 18/79 [00:06<00:20,  2.91it/s][A
Training:  25%|██▌       | 20/79 [00:06<00:14,  4.04it/s][A
Training:  28%|██▊       | 22/79 [00:07<00:16,  3.40it/s][A
Training:  29%|██▉       | 23/79 [00:07

Epoch: 9/76 - Loss: 10.9081 - Accuracy: 0.8950



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:01<00:14,  1.58s/it][A
 30%|███       | 3/10 [00:01<00:03,  2.03it/s][A
 50%|█████     | 5/10 [00:02<00:02,  2.18it/s][A
 70%|███████   | 7/10 [00:02<00:00,  3.26it/s][A
100%|██████████| 10/10 [00:03<00:00,  2.68it/s][A
Epochs:  12%|█▏        | 9/76 [04:07<30:21, 27.19s/it]

Val Loss: 3.2509 - Val Accuracy: 0.9228



Training:   0%|          | 0/79 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/79 [00:01<02:08,  1.65s/it][A
Training:   4%|▍         | 3/79 [00:01<00:35,  2.13it/s][A
Training:   6%|▋         | 5/79 [00:02<00:38,  1.91it/s][A
Training:  10%|█         | 8/79 [00:03<00:19,  3.63it/s][A
Training:  13%|█▎        | 10/79 [00:03<00:23,  2.99it/s][A
Training:  16%|█▋        | 13/79 [00:04<00:21,  3.08it/s][A
Training:  20%|██        | 16/79 [00:05<00:13,  4.50it/s][A
Training:  23%|██▎       | 18/79 [00:06<00:18,  3.29it/s][A
Training:  25%|██▌       | 20/79 [00:06<00:13,  4.23it/s][A
Training:  28%|██▊       | 22/79 [00:07<00:18,  3.08it/s][A
Training:  29%|██▉       | 23/79 [00:07<00:16,  3.48it/s][A
Training:  32%|███▏      | 25/79 [00:08<00:17,  3.17it/s][A
Training:  33%|███▎      | 26/79 [00:08<00:15,  3.45it/s][A
Training:  35%|███▌      | 28/79 [00:08<00:11,  4.42it/s][A
Training:  37%|███▋      | 29/79 [00:09<00:17,  2.89it/s][A
Training:  41%|████      | 32/79 [00

Epoch: 10/76 - Loss: 15.8961 - Accuracy: 0.8917



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:01<00:14,  1.63s/it][A
 30%|███       | 3/10 [00:01<00:03,  2.09it/s][A
 50%|█████     | 5/10 [00:02<00:02,  2.11it/s][A
 80%|████████  | 8/10 [00:02<00:00,  4.01it/s][A
100%|██████████| 10/10 [00:04<00:00,  2.48it/s][A
Epochs:  13%|█▎        | 10/76 [04:35<30:02, 27.31s/it]

Val Loss: 23.7199 - Val Accuracy: 0.8488



Training:   0%|          | 0/79 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/79 [00:01<02:07,  1.64s/it][A
Training:   3%|▎         | 2/79 [00:01<01:02,  1.24it/s][A
Training:   5%|▌         | 4/79 [00:01<00:24,  3.00it/s][A
Training:   8%|▊         | 6/79 [00:02<00:27,  2.62it/s][A
Training:   9%|▉         | 7/79 [00:03<00:23,  3.04it/s][A
Training:  11%|█▏        | 9/79 [00:03<00:25,  2.74it/s][A
Training:  14%|█▍        | 11/79 [00:04<00:18,  3.64it/s][A
Training:  16%|█▋        | 13/79 [00:04<00:21,  3.07it/s][A
Training:  19%|█▉        | 15/79 [00:05<00:17,  3.74it/s][A
Training:  22%|██▏       | 17/79 [00:06<00:20,  3.09it/s][A
Training:  24%|██▍       | 19/79 [00:06<00:15,  3.90it/s][A
Training:  27%|██▋       | 21/79 [00:07<00:19,  3.02it/s][A
Training:  29%|██▉       | 23/79 [00:07<00:14,  3.82it/s][A
Training:  32%|███▏      | 25/79 [00:08<00:17,  3.10it/s][A
Training:  33%|███▎      | 26/79 [00:08<00:15,  3.53it/s][A
Training:  35%|███▌      | 28/79 [00:0

Epoch: 11/76 - Loss: 10.1544 - Accuracy: 0.9032



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:01<00:12,  1.44s/it][A
 50%|█████     | 5/10 [00:02<00:02,  2.19it/s][A
 80%|████████  | 8/10 [00:02<00:00,  3.90it/s][A
100%|██████████| 10/10 [00:03<00:00,  2.73it/s][A
Epochs:  14%|█▍        | 11/76 [05:02<29:36, 27.32s/it]

Val Loss: 24.7699 - Val Accuracy: 0.8447



Training:   0%|          | 0/79 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/79 [00:01<02:28,  1.91s/it][A
Training:   4%|▍         | 3/79 [00:02<00:42,  1.80it/s][A
Training:   6%|▋         | 5/79 [00:02<00:36,  2.02it/s][A
Training:   9%|▉         | 7/79 [00:03<00:22,  3.23it/s][A
Training:  11%|█▏        | 9/79 [00:03<00:23,  2.94it/s][A
Training:  16%|█▋        | 13/79 [00:04<00:20,  3.20it/s][A
Training:  18%|█▊        | 14/79 [00:05<00:18,  3.56it/s][A
Training:  19%|█▉        | 15/79 [00:05<00:15,  4.02it/s][A
Training:  22%|██▏       | 17/79 [00:06<00:21,  2.95it/s][A
Training:  24%|██▍       | 19/79 [00:06<00:15,  3.93it/s][A
Training:  25%|██▌       | 20/79 [00:06<00:13,  4.40it/s][A
Training:  27%|██▋       | 21/79 [00:07<00:20,  2.83it/s][A
Training:  29%|██▉       | 23/79 [00:07<00:14,  3.85it/s][A
Training:  32%|███▏      | 25/79 [00:08<00:15,  3.41it/s][A
Training:  34%|███▍      | 27/79 [00:08<00:11,  4.49it/s][A
Training:  37%|███▋      | 29/79 [00:

Epoch: 12/76 - Loss: 5.7648 - Accuracy: 0.9060



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:01<00:13,  1.54s/it][A
 20%|██        | 2/10 [00:01<00:06,  1.30it/s][A
 40%|████      | 4/10 [00:01<00:01,  3.11it/s][A
 50%|█████     | 5/10 [00:02<00:02,  2.09it/s][A
 60%|██████    | 6/10 [00:02<00:01,  2.43it/s][A
 80%|████████  | 8/10 [00:03<00:00,  4.04it/s][A
100%|██████████| 10/10 [00:03<00:00,  2.55it/s][A
Epochs:  16%|█▌        | 12/76 [05:28<28:42, 26.91s/it]

Val Loss: 4.7814 - Val Accuracy: 0.9299



Training:   0%|          | 0/79 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/79 [00:01<02:12,  1.70s/it][A
Training:   3%|▎         | 2/79 [00:01<01:02,  1.23it/s][A
Training:   4%|▍         | 3/79 [00:01<00:37,  2.05it/s][A
Training:   6%|▋         | 5/79 [00:02<00:34,  2.14it/s][A
Training:   8%|▊         | 6/79 [00:03<00:26,  2.72it/s][A
Training:  10%|█         | 8/79 [00:03<00:17,  4.17it/s][A
Training:  11%|█▏        | 9/79 [00:04<00:28,  2.45it/s][A
Training:  14%|█▍        | 11/79 [00:04<00:18,  3.73it/s][A
Training:  16%|█▋        | 13/79 [00:05<00:23,  2.80it/s][A
Training:  20%|██        | 16/79 [00:05<00:13,  4.63it/s][A
Training:  23%|██▎       | 18/79 [00:06<00:19,  3.20it/s][A
Training:  25%|██▌       | 20/79 [00:06<00:13,  4.24it/s][A
Training:  28%|██▊       | 22/79 [00:07<00:17,  3.24it/s][A
Training:  32%|███▏      | 25/79 [00:08<00:16,  3.34it/s][A
Training:  34%|███▍      | 27/79 [00:08<00:12,  4.20it/s][A
Training:  37%|███▋      | 29/79 [00:09

Epoch: 13/76 - Loss: 5.6111 - Accuracy: 0.9179



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:01<00:13,  1.53s/it][A
 20%|██        | 2/10 [00:01<00:05,  1.37it/s][A
 40%|████      | 4/10 [00:01<00:01,  3.28it/s][A
 60%|██████    | 6/10 [00:02<00:01,  2.51it/s][A
100%|██████████| 10/10 [00:03<00:00,  2.54it/s][A
Epochs:  17%|█▋        | 13/76 [05:55<28:20, 26.99s/it]

Val Loss: 3.7569 - Val Accuracy: 0.9372



Training:   0%|          | 0/79 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/79 [00:01<02:17,  1.76s/it][A
Training:   5%|▌         | 4/79 [00:01<00:28,  2.66it/s][A
Training:   8%|▊         | 6/79 [00:02<00:31,  2.29it/s][A
Training:  11%|█▏        | 9/79 [00:04<00:28,  2.47it/s][A
Training:  16%|█▋        | 13/79 [00:05<00:23,  2.86it/s][A
Training:  19%|█▉        | 15/79 [00:05<00:17,  3.62it/s][A
Training:  22%|██▏       | 17/79 [00:06<00:20,  3.07it/s][A
Training:  24%|██▍       | 19/79 [00:06<00:15,  3.94it/s][A
Training:  27%|██▋       | 21/79 [00:07<00:19,  2.95it/s][A
Training:  28%|██▊       | 22/79 [00:07<00:17,  3.22it/s][A
Training:  30%|███       | 24/79 [00:07<00:12,  4.40it/s][A
Training:  33%|███▎      | 26/79 [00:08<00:17,  3.08it/s][A
Training:  34%|███▍      | 27/79 [00:08<00:14,  3.51it/s][A
Training:  37%|███▋      | 29/79 [00:09<00:16,  2.94it/s][A
Training:  39%|███▉      | 31/79 [00:10<00:12,  3.90it/s][A
Training:  42%|████▏     | 33/79 [00

Epoch: 14/76 - Loss: 6.9978 - Accuracy: 0.9047



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:01<00:15,  1.69s/it][A
 20%|██        | 2/10 [00:01<00:06,  1.32it/s][A
 50%|█████     | 5/10 [00:02<00:02,  2.38it/s][A
 80%|████████  | 8/10 [00:02<00:00,  4.42it/s][A
100%|██████████| 10/10 [00:03<00:00,  2.62it/s][A
Epochs:  18%|█▊        | 14/76 [06:23<28:06, 27.20s/it]

Val Loss: 10.2541 - Val Accuracy: 0.9103



Training:   0%|          | 0/79 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/79 [00:01<01:57,  1.50s/it][A
Training:   4%|▍         | 3/79 [00:01<00:40,  1.87it/s][A
Training:   6%|▋         | 5/79 [00:02<00:34,  2.13it/s][A
Training:   8%|▊         | 6/79 [00:02<00:29,  2.48it/s][A
Training:   9%|▉         | 7/79 [00:03<00:24,  2.95it/s][A
Training:  11%|█▏        | 9/79 [00:03<00:22,  3.12it/s][A
Training:  13%|█▎        | 10/79 [00:04<00:22,  3.06it/s][A
Training:  14%|█▍        | 11/79 [00:04<00:19,  3.55it/s][A
Training:  15%|█▌        | 12/79 [00:04<00:15,  4.25it/s][A
Training:  16%|█▋        | 13/79 [00:04<00:20,  3.25it/s][A
Training:  18%|█▊        | 14/79 [00:05<00:22,  2.83it/s][A
Training:  22%|██▏       | 17/79 [00:05<00:17,  3.50it/s][A
Training:  23%|██▎       | 18/79 [00:06<00:19,  3.06it/s][A
Training:  24%|██▍       | 19/79 [00:06<00:16,  3.60it/s][A
Training:  27%|██▋       | 21/79 [00:07<00:16,  3.61it/s][A
Training:  28%|██▊       | 22/79 [00:0

Epoch: 15/76 - Loss: 5.6593 - Accuracy: 0.9133



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:01<00:14,  1.56s/it][A
 30%|███       | 3/10 [00:01<00:03,  2.07it/s][A
 50%|█████     | 5/10 [00:02<00:02,  2.06it/s][A
 70%|███████   | 7/10 [00:02<00:00,  3.25it/s][A
 80%|████████  | 8/10 [00:03<00:00,  3.45it/s][A
100%|██████████| 10/10 [00:03<00:00,  2.55it/s][A
Epochs:  20%|█▉        | 15/76 [06:51<27:48, 27.35s/it]

Val Loss: 10.8566 - Val Accuracy: 0.9389



Training:   0%|          | 0/79 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/79 [00:01<02:18,  1.77s/it][A
Training:   3%|▎         | 2/79 [00:01<01:00,  1.27it/s][A
Training:   6%|▋         | 5/79 [00:02<00:32,  2.29it/s][A
Training:   9%|▉         | 7/79 [00:02<00:20,  3.48it/s][A
Training:  11%|█▏        | 9/79 [00:03<00:26,  2.66it/s][A
Training:  14%|█▍        | 11/79 [00:04<00:18,  3.69it/s][A
Training:  16%|█▋        | 13/79 [00:05<00:22,  2.94it/s][A
Training:  18%|█▊        | 14/79 [00:05<00:20,  3.13it/s][A
Training:  20%|██        | 16/79 [00:05<00:14,  4.34it/s][A
Training:  22%|██▏       | 17/79 [00:06<00:21,  2.93it/s][A
Training:  23%|██▎       | 18/79 [00:06<00:18,  3.32it/s][A
Training:  27%|██▋       | 21/79 [00:07<00:18,  3.17it/s][A
Training:  28%|██▊       | 22/79 [00:07<00:15,  3.62it/s][A
Training:  32%|███▏      | 25/79 [00:08<00:16,  3.32it/s][A
Training:  33%|███▎      | 26/79 [00:08<00:17,  3.02it/s][A
Training:  35%|███▌      | 28/79 [00:

Epoch: 16/76 - Loss: 20.1337 - Accuracy: 0.8987



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:01<00:13,  1.55s/it][A
 20%|██        | 2/10 [00:01<00:05,  1.34it/s][A
 40%|████      | 4/10 [00:01<00:01,  3.01it/s][A
 50%|█████     | 5/10 [00:02<00:02,  1.85it/s][A
 60%|██████    | 6/10 [00:03<00:01,  2.21it/s][A
 80%|████████  | 8/10 [00:03<00:00,  3.66it/s][A
100%|██████████| 10/10 [00:04<00:00,  2.33it/s][A
Epochs:  21%|██        | 16/76 [07:19<27:47, 27.78s/it]

Val Loss: 47.8543 - Val Accuracy: 0.9050



Training:   0%|          | 0/79 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/79 [00:01<02:13,  1.71s/it][A
Training:   3%|▎         | 2/79 [00:01<00:58,  1.31it/s][A
Training:   6%|▋         | 5/79 [00:02<00:32,  2.25it/s][A
Training:   8%|▊         | 6/79 [00:02<00:26,  2.71it/s][A
Training:   9%|▉         | 7/79 [00:03<00:22,  3.24it/s][A
Training:  10%|█         | 8/79 [00:03<00:17,  3.96it/s][A
Training:  11%|█▏        | 9/79 [00:03<00:27,  2.56it/s][A
Training:  13%|█▎        | 10/79 [00:04<00:27,  2.50it/s][A
Training:  15%|█▌        | 12/79 [00:04<00:16,  4.02it/s][A
Training:  16%|█▋        | 13/79 [00:05<00:26,  2.50it/s][A
Training:  18%|█▊        | 14/79 [00:05<00:25,  2.54it/s][A
Training:  20%|██        | 16/79 [00:05<00:15,  3.99it/s][A
Training:  22%|██▏       | 17/79 [00:06<00:21,  2.88it/s][A
Training:  23%|██▎       | 18/79 [00:06<00:23,  2.64it/s][A
Training:  25%|██▌       | 20/79 [00:07<00:14,  3.94it/s][A
Training:  27%|██▋       | 21/79 [00:07

Epoch: 17/76 - Loss: 18.6953 - Accuracy: 0.8950



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:01<00:13,  1.50s/it][A
 20%|██        | 2/10 [00:01<00:05,  1.39it/s][A
 40%|████      | 4/10 [00:01<00:01,  3.09it/s][A
 50%|█████     | 5/10 [00:02<00:02,  1.97it/s][A
 60%|██████    | 6/10 [00:03<00:01,  2.34it/s][A
 80%|████████  | 8/10 [00:03<00:00,  3.87it/s][A
 90%|█████████ | 9/10 [00:03<00:00,  2.61it/s][A
100%|██████████| 10/10 [00:04<00:00,  2.37it/s][A
Epochs:  22%|██▏       | 17/76 [07:47<27:20, 27.80s/it]

Val Loss: 7.4036 - Val Accuracy: 0.9302



Training:   0%|          | 0/79 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/79 [00:01<01:58,  1.51s/it][A
Training:   3%|▎         | 2/79 [00:01<00:53,  1.44it/s][A
Training:   5%|▌         | 4/79 [00:01<00:22,  3.28it/s][A
Training:   6%|▋         | 5/79 [00:02<00:39,  1.88it/s][A
Training:  11%|█▏        | 9/79 [00:03<00:25,  2.70it/s][A
Training:  14%|█▍        | 11/79 [00:04<00:18,  3.59it/s][A
Training:  16%|█▋        | 13/79 [00:04<00:21,  3.04it/s][A
Training:  19%|█▉        | 15/79 [00:05<00:15,  4.05it/s][A
Training:  22%|██▏       | 17/79 [00:06<00:20,  3.06it/s][A
Training:  24%|██▍       | 19/79 [00:06<00:15,  3.98it/s][A
Training:  25%|██▌       | 20/79 [00:06<00:13,  4.42it/s][A
Training:  27%|██▋       | 21/79 [00:07<00:21,  2.64it/s][A
Training:  30%|███       | 24/79 [00:07<00:12,  4.51it/s][A
Training:  33%|███▎      | 26/79 [00:08<00:17,  3.03it/s][A
Training:  37%|███▋      | 29/79 [00:09<00:16,  2.97it/s][A
Training:  38%|███▊      | 30/79 [00:

Epoch: 18/76 - Loss: 9.0626 - Accuracy: 0.9174



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:01<00:12,  1.44s/it][A
 30%|███       | 3/10 [00:01<00:03,  2.32it/s][A
 50%|█████     | 5/10 [00:02<00:02,  2.11it/s][A
 70%|███████   | 7/10 [00:02<00:00,  3.25it/s][A
100%|██████████| 10/10 [00:03<00:00,  2.63it/s][A
Epochs:  24%|██▎       | 18/76 [08:15<26:46, 27.71s/it]

Val Loss: 3.4944 - Val Accuracy: 0.8692



Training:   0%|          | 0/79 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/79 [00:01<01:54,  1.46s/it][A
Training:   6%|▋         | 5/79 [00:02<00:36,  2.04it/s][A
Training:   9%|▉         | 7/79 [00:02<00:24,  2.97it/s][A
Training:  11%|█▏        | 9/79 [00:04<00:29,  2.34it/s][A
Training:  14%|█▍        | 11/79 [00:04<00:21,  3.16it/s][A
Training:  16%|█▋        | 13/79 [00:05<00:23,  2.76it/s][A
Training:  19%|█▉        | 15/79 [00:05<00:17,  3.76it/s][A
Training:  22%|██▏       | 17/79 [00:06<00:20,  3.03it/s][A
Training:  23%|██▎       | 18/79 [00:06<00:17,  3.45it/s][A
Training:  25%|██▌       | 20/79 [00:06<00:12,  4.80it/s][A
Training:  28%|██▊       | 22/79 [00:07<00:20,  2.75it/s][A
Training:  30%|███       | 24/79 [00:08<00:15,  3.59it/s][A
Training:  32%|███▏      | 25/79 [00:08<00:20,  2.60it/s][A
Training:  34%|███▍      | 27/79 [00:09<00:14,  3.56it/s][A
Training:  37%|███▋      | 29/79 [00:10<00:20,  2.49it/s][A
Training:  38%|███▊      | 30/79 [00

Epoch: 19/76 - Loss: 15.1815 - Accuracy: 0.9075



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:01<00:15,  1.71s/it][A
 30%|███       | 3/10 [00:01<00:03,  1.96it/s][A
 50%|█████     | 5/10 [00:02<00:02,  1.99it/s][A
 70%|███████   | 7/10 [00:03<00:00,  3.13it/s][A
100%|██████████| 10/10 [00:04<00:00,  2.41it/s][A
Epochs:  25%|██▌       | 19/76 [08:44<26:42, 28.11s/it]

Val Loss: 13.0340 - Val Accuracy: 0.8668



Training:   0%|          | 0/79 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/79 [00:01<02:14,  1.73s/it][A
Training:   3%|▎         | 2/79 [00:01<01:02,  1.24it/s][A
Training:   5%|▌         | 4/79 [00:02<00:25,  2.92it/s][A
Training:   6%|▋         | 5/79 [00:02<00:38,  1.92it/s][A
Training:   8%|▊         | 6/79 [00:03<00:30,  2.39it/s][A
Training:  10%|█         | 8/79 [00:03<00:18,  3.75it/s][A
Training:  11%|█▏        | 9/79 [00:04<00:29,  2.40it/s][A
Training:  13%|█▎        | 10/79 [00:04<00:23,  2.97it/s][A
Training:  15%|█▌        | 12/79 [00:04<00:14,  4.51it/s][A
Training:  16%|█▋        | 13/79 [00:05<00:26,  2.53it/s][A
Training:  19%|█▉        | 15/79 [00:05<00:16,  3.88it/s][A
Training:  22%|██▏       | 17/79 [00:06<00:22,  2.73it/s][A
Training:  24%|██▍       | 19/79 [00:06<00:15,  3.80it/s][A
Training:  27%|██▋       | 21/79 [00:07<00:19,  2.91it/s][A
Training:  28%|██▊       | 22/79 [00:07<00:17,  3.19it/s][A
Training:  30%|███       | 24/79 [00:08

Epoch: 20/76 - Loss: 13.7605 - Accuracy: 0.9138



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:01<00:12,  1.34s/it][A
 30%|███       | 3/10 [00:01<00:02,  2.52it/s][A
 50%|█████     | 5/10 [00:02<00:02,  2.25it/s][A
 60%|██████    | 6/10 [00:02<00:01,  2.77it/s][A
100%|██████████| 10/10 [00:03<00:00,  2.82it/s][A
Epochs:  26%|██▋       | 20/76 [09:13<26:23, 28.28s/it]

Val Loss: 5.8087 - Val Accuracy: 0.9361



Training:   0%|          | 0/79 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/79 [00:01<02:19,  1.79s/it][A
Training:   4%|▍         | 3/79 [00:01<00:39,  1.93it/s][A
Training:   6%|▋         | 5/79 [00:02<00:34,  2.15it/s][A
Training:   8%|▊         | 6/79 [00:02<00:27,  2.70it/s][A
Training:  10%|█         | 8/79 [00:03<00:17,  3.98it/s][A
Training:  11%|█▏        | 9/79 [00:03<00:26,  2.64it/s][A
Training:  13%|█▎        | 10/79 [00:03<00:21,  3.20it/s][A
Training:  15%|█▌        | 12/79 [00:04<00:15,  4.44it/s][A
Training:  16%|█▋        | 13/79 [00:05<00:24,  2.70it/s][A
Training:  18%|█▊        | 14/79 [00:05<00:20,  3.19it/s][A
Training:  20%|██        | 16/79 [00:05<00:13,  4.53it/s][A
Training:  22%|██▏       | 17/79 [00:06<00:23,  2.58it/s][A
Training:  24%|██▍       | 19/79 [00:06<00:15,  3.81it/s][A
Training:  27%|██▋       | 21/79 [00:07<00:21,  2.69it/s][A
Training:  28%|██▊       | 22/79 [00:07<00:18,  3.08it/s][A
Training:  30%|███       | 24/79 [00:0

Epoch: 21/76 - Loss: 9.7922 - Accuracy: 0.9067



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:01<00:13,  1.54s/it][A
 30%|███       | 3/10 [00:01<00:03,  2.06it/s][A
 40%|████      | 4/10 [00:01<00:02,  2.83it/s][A
 50%|█████     | 5/10 [00:02<00:02,  2.14it/s][A
 70%|███████   | 7/10 [00:02<00:00,  3.38it/s][A
100%|██████████| 10/10 [00:03<00:00,  2.75it/s][A
Epochs:  28%|██▊       | 21/76 [09:40<25:47, 28.13s/it]

Val Loss: 11.4116 - Val Accuracy: 0.9030



Training:   0%|          | 0/79 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/79 [00:01<02:11,  1.69s/it][A
Training:   4%|▍         | 3/79 [00:01<00:38,  1.97it/s][A
Training:   5%|▌         | 4/79 [00:01<00:27,  2.72it/s][A
Training:   6%|▋         | 5/79 [00:02<00:35,  2.08it/s][A
Training:   9%|▉         | 7/79 [00:02<00:20,  3.52it/s][A
Training:  11%|█▏        | 9/79 [00:03<00:24,  2.82it/s][A
Training:  13%|█▎        | 10/79 [00:03<00:20,  3.32it/s][A
Training:  14%|█▍        | 11/79 [00:04<00:18,  3.76it/s][A
Training:  16%|█▋        | 13/79 [00:04<00:21,  3.10it/s][A
Training:  18%|█▊        | 14/79 [00:04<00:18,  3.58it/s][A
Training:  19%|█▉        | 15/79 [00:05<00:19,  3.34it/s][A
Training:  22%|██▏       | 17/79 [00:06<00:20,  3.02it/s][A
Training:  24%|██▍       | 19/79 [00:06<00:19,  3.14it/s][A
Training:  27%|██▋       | 21/79 [00:07<00:17,  3.25it/s][A
Training:  29%|██▉       | 23/79 [00:07<00:17,  3.29it/s][A
Training:  32%|███▏      | 25/79 [00:0

Epoch: 22/76 - Loss: 6.9837 - Accuracy: 0.9168



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:01<00:16,  1.78s/it][A
 30%|███       | 3/10 [00:01<00:03,  1.94it/s][A
 50%|█████     | 5/10 [00:02<00:02,  2.03it/s][A
100%|██████████| 10/10 [00:04<00:00,  2.47it/s][A
Epochs:  29%|██▉       | 22/76 [10:09<25:20, 28.16s/it]

Val Loss: 3.5363 - Val Accuracy: 0.9267



Training:   0%|          | 0/79 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/79 [00:01<02:05,  1.61s/it][A
Training:   3%|▎         | 2/79 [00:01<00:57,  1.33it/s][A
Training:   5%|▌         | 4/79 [00:01<00:23,  3.13it/s][A
Training:   6%|▋         | 5/79 [00:02<00:36,  2.04it/s][A
Training:   9%|▉         | 7/79 [00:02<00:20,  3.53it/s][A
Training:  11%|█▏        | 9/79 [00:03<00:25,  2.79it/s][A
Training:  13%|█▎        | 10/79 [00:03<00:20,  3.33it/s][A
Training:  14%|█▍        | 11/79 [00:04<00:18,  3.75it/s][A
Training:  16%|█▋        | 13/79 [00:05<00:26,  2.45it/s][A
Training:  19%|█▉        | 15/79 [00:05<00:18,  3.55it/s][A
Training:  22%|██▏       | 17/79 [00:06<00:22,  2.73it/s][A
Training:  24%|██▍       | 19/79 [00:06<00:16,  3.61it/s][A
Training:  25%|██▌       | 20/79 [00:06<00:14,  4.07it/s][A
Training:  27%|██▋       | 21/79 [00:07<00:20,  2.83it/s][A
Training:  29%|██▉       | 23/79 [00:07<00:16,  3.34it/s][A
Training:  32%|███▏      | 25/79 [00:0

Epoch: 23/76 - Loss: 22.2178 - Accuracy: 0.8970



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:01<00:12,  1.38s/it][A
 20%|██        | 2/10 [00:01<00:05,  1.52it/s][A
 40%|████      | 4/10 [00:01<00:01,  3.42it/s][A
 50%|█████     | 5/10 [00:02<00:02,  2.07it/s][A
 60%|██████    | 6/10 [00:02<00:01,  2.40it/s][A
 80%|████████  | 8/10 [00:03<00:00,  3.85it/s][A
100%|██████████| 10/10 [00:03<00:00,  2.60it/s][A
Epochs:  30%|███       | 23/76 [10:37<24:54, 28.21s/it]

Val Loss: 5.1396 - Val Accuracy: 0.9089



Training:   0%|          | 0/79 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/79 [00:01<02:10,  1.67s/it][A
Training:   4%|▍         | 3/79 [00:01<00:37,  2.05it/s][A
Training:   6%|▋         | 5/79 [00:03<00:40,  1.84it/s][A
Training:   9%|▉         | 7/79 [00:03<00:24,  2.91it/s][A
Training:  11%|█▏        | 9/79 [00:04<00:28,  2.48it/s][A
Training:  13%|█▎        | 10/79 [00:04<00:23,  2.95it/s][A
Training:  14%|█▍        | 11/79 [00:04<00:19,  3.52it/s][A
Training:  16%|█▋        | 13/79 [00:05<00:23,  2.86it/s][A
Training:  19%|█▉        | 15/79 [00:05<00:15,  4.05it/s][A
Training:  20%|██        | 16/79 [00:05<00:13,  4.59it/s][A
Training:  22%|██▏       | 17/79 [00:06<00:24,  2.50it/s][A
Training:  23%|██▎       | 18/79 [00:06<00:19,  3.06it/s][A
Training:  25%|██▌       | 20/79 [00:06<00:13,  4.37it/s][A
Training:  27%|██▋       | 21/79 [00:07<00:21,  2.74it/s][A
Training:  32%|███▏      | 25/79 [00:08<00:18,  2.97it/s][A
Training:  33%|███▎      | 26/79 [00:

Epoch: 24/76 - Loss: 8.1491 - Accuracy: 0.9161



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:01<00:13,  1.52s/it][A
 20%|██        | 2/10 [00:01<00:05,  1.43it/s][A
 40%|████      | 4/10 [00:01<00:01,  3.41it/s][A
 60%|██████    | 6/10 [00:02<00:01,  2.54it/s][A
 80%|████████  | 8/10 [00:02<00:00,  3.85it/s][A
100%|██████████| 10/10 [00:03<00:00,  2.67it/s][A
Epochs:  32%|███▏      | 24/76 [11:04<24:16, 28.02s/it]

Val Loss: 12.9099 - Val Accuracy: 0.9339



Training:   0%|          | 0/79 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/79 [00:01<02:13,  1.71s/it][A
Training:   3%|▎         | 2/79 [00:01<01:00,  1.28it/s][A
Training:   6%|▋         | 5/79 [00:02<00:35,  2.06it/s][A
Training:   8%|▊         | 6/79 [00:03<00:28,  2.54it/s][A
Training:  10%|█         | 8/79 [00:03<00:18,  3.74it/s][A
Training:  11%|█▏        | 9/79 [00:04<00:29,  2.36it/s][A
Training:  14%|█▍        | 11/79 [00:04<00:19,  3.57it/s][A
Training:  16%|█▋        | 13/79 [00:05<00:23,  2.87it/s][A
Training:  18%|█▊        | 14/79 [00:05<00:20,  3.25it/s][A
Training:  20%|██        | 16/79 [00:05<00:14,  4.34it/s][A
Training:  22%|██▏       | 17/79 [00:06<00:23,  2.62it/s][A
Training:  24%|██▍       | 19/79 [00:06<00:15,  3.78it/s][A
Training:  27%|██▋       | 21/79 [00:07<00:21,  2.73it/s][A
Training:  29%|██▉       | 23/79 [00:07<00:15,  3.70it/s][A
Training:  32%|███▏      | 25/79 [00:08<00:17,  3.01it/s][A
Training:  34%|███▍      | 27/79 [00:0

Epoch: 25/76 - Loss: 19.4162 - Accuracy: 0.9157



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:01<00:12,  1.36s/it][A
 30%|███       | 3/10 [00:01<00:02,  2.50it/s][A
 50%|█████     | 5/10 [00:02<00:02,  2.02it/s][A
100%|██████████| 10/10 [00:03<00:00,  2.59it/s][A
Epochs:  33%|███▎      | 25/76 [11:33<23:54, 28.12s/it]

Val Loss: 65.3745 - Val Accuracy: 0.8339



Training:   0%|          | 0/79 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/79 [00:01<02:11,  1.69s/it][A
Training:   3%|▎         | 2/79 [00:01<00:58,  1.32it/s][A
Training:   5%|▌         | 4/79 [00:01<00:23,  3.13it/s][A
Training:   8%|▊         | 6/79 [00:02<00:30,  2.37it/s][A
Training:  10%|█         | 8/79 [00:03<00:20,  3.49it/s][A
Training:  11%|█▏        | 9/79 [00:04<00:31,  2.21it/s][A
Training:  15%|█▌        | 12/79 [00:04<00:16,  3.98it/s][A
Training:  18%|█▊        | 14/79 [00:05<00:21,  3.00it/s][A
Training:  20%|██        | 16/79 [00:05<00:15,  4.05it/s][A
Training:  23%|██▎       | 18/79 [00:06<00:20,  2.91it/s][A
Training:  25%|██▌       | 20/79 [00:06<00:15,  3.87it/s][A
Training:  28%|██▊       | 22/79 [00:07<00:19,  2.95it/s][A
Training:  32%|███▏      | 25/79 [00:08<00:19,  2.84it/s][A
Training:  34%|███▍      | 27/79 [00:08<00:14,  3.66it/s][A
Training:  37%|███▋      | 29/79 [00:09<00:16,  3.00it/s][A
Training:  38%|███▊      | 30/79 [00:1

Epoch: 26/76 - Loss: 10.5503 - Accuracy: 0.9100



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:01<00:14,  1.63s/it][A
 30%|███       | 3/10 [00:01<00:03,  2.16it/s][A
 50%|█████     | 5/10 [00:03<00:02,  1.81it/s][A
 70%|███████   | 7/10 [00:03<00:01,  2.91it/s][A
100%|██████████| 10/10 [00:04<00:00,  2.35it/s][A
Epochs:  34%|███▍      | 26/76 [12:02<23:36, 28.33s/it]

Val Loss: 3.8231 - Val Accuracy: 0.9355



Training:   0%|          | 0/79 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/79 [00:01<02:15,  1.73s/it][A
Training:   4%|▍         | 3/79 [00:01<00:39,  1.93it/s][A
Training:   5%|▌         | 4/79 [00:02<00:28,  2.67it/s][A
Training:   6%|▋         | 5/79 [00:02<00:40,  1.81it/s][A
Training:  10%|█         | 8/79 [00:03<00:18,  3.78it/s][A
Training:  11%|█▏        | 9/79 [00:04<00:30,  2.28it/s][A
Training:  14%|█▍        | 11/79 [00:04<00:20,  3.29it/s][A
Training:  16%|█▋        | 13/79 [00:05<00:24,  2.70it/s][A
Training:  19%|█▉        | 15/79 [00:05<00:16,  3.78it/s][A
Training:  22%|██▏       | 17/79 [00:06<00:22,  2.73it/s][A
Training:  25%|██▌       | 20/79 [00:06<00:13,  4.35it/s][A
Training:  28%|██▊       | 22/79 [00:07<00:17,  3.18it/s][A
Training:  32%|███▏      | 25/79 [00:09<00:19,  2.72it/s][A
Training:  33%|███▎      | 26/79 [00:09<00:17,  3.05it/s][A
Training:  35%|███▌      | 28/79 [00:09<00:12,  3.92it/s][A
Training:  37%|███▋      | 29/79 [00:1

Epoch: 27/76 - Loss: 3.9083 - Accuracy: 0.9234



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:01<00:13,  1.54s/it][A
 40%|████      | 4/10 [00:01<00:01,  3.11it/s][A
 60%|██████    | 6/10 [00:02<00:01,  2.57it/s][A
 80%|████████  | 8/10 [00:02<00:00,  3.82it/s][A
100%|██████████| 10/10 [00:03<00:00,  2.68it/s][A
Epochs:  36%|███▌      | 27/76 [12:31<23:18, 28.55s/it]

Val Loss: 3.2774 - Val Accuracy: 0.8959



Training:   0%|          | 0/79 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/79 [00:01<02:16,  1.75s/it][A
Training:   4%|▍         | 3/79 [00:01<00:40,  1.86it/s][A
Training:   6%|▋         | 5/79 [00:03<00:39,  1.87it/s][A
Training:   8%|▊         | 6/79 [00:03<00:31,  2.32it/s][A
Training:   9%|▉         | 7/79 [00:03<00:27,  2.60it/s][A
Training:  10%|█         | 8/79 [00:03<00:21,  3.25it/s][A
Training:  11%|█▏        | 9/79 [00:04<00:31,  2.23it/s][A
Training:  13%|█▎        | 10/79 [00:04<00:27,  2.50it/s][A
Training:  14%|█▍        | 11/79 [00:04<00:22,  2.97it/s][A
Training:  16%|█▋        | 13/79 [00:05<00:23,  2.78it/s][A
Training:  18%|█▊        | 14/79 [00:05<00:21,  3.06it/s][A
Training:  19%|█▉        | 15/79 [00:06<00:20,  3.09it/s][A
Training:  20%|██        | 16/79 [00:06<00:16,  3.76it/s][A
Training:  22%|██▏       | 17/79 [00:06<00:21,  2.86it/s][A
Training:  23%|██▎       | 18/79 [00:06<00:17,  3.50it/s][A
Training:  24%|██▍       | 19/79 [00:07

Epoch: 28/76 - Loss: 23.8264 - Accuracy: 0.9053



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:01<00:13,  1.53s/it][A
 30%|███       | 3/10 [00:01<00:03,  2.13it/s][A
 50%|█████     | 5/10 [00:02<00:02,  2.09it/s][A
 70%|███████   | 7/10 [00:02<00:00,  3.34it/s][A
100%|██████████| 10/10 [00:03<00:00,  2.53it/s][A
Epochs:  37%|███▋      | 28/76 [13:00<23:07, 28.91s/it]

Val Loss: 14.3497 - Val Accuracy: 0.9215



Training:   0%|          | 0/79 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/79 [00:01<02:30,  1.93s/it][A
Training:   4%|▍         | 3/79 [00:02<00:42,  1.78it/s][A
Training:   6%|▋         | 5/79 [00:03<00:39,  1.87it/s][A
Training:   9%|▉         | 7/79 [00:03<00:24,  2.90it/s][A
Training:  11%|█▏        | 9/79 [00:04<00:27,  2.55it/s][A
Training:  14%|█▍        | 11/79 [00:04<00:18,  3.62it/s][A
Training:  16%|█▋        | 13/79 [00:05<00:24,  2.66it/s][A
Training:  19%|█▉        | 15/79 [00:05<00:17,  3.59it/s][A
Training:  22%|██▏       | 17/79 [00:06<00:22,  2.70it/s][A
Training:  24%|██▍       | 19/79 [00:06<00:16,  3.63it/s][A
Training:  27%|██▋       | 21/79 [00:07<00:19,  2.93it/s][A
Training:  29%|██▉       | 23/79 [00:08<00:14,  3.84it/s][A
Training:  32%|███▏      | 25/79 [00:09<00:17,  3.06it/s][A
Training:  33%|███▎      | 26/79 [00:09<00:15,  3.49it/s][A
Training:  35%|███▌      | 28/79 [00:09<00:10,  4.74it/s][A
Training:  38%|███▊      | 30/79 [00:

Epoch: 29/76 - Loss: 6.4316 - Accuracy: 0.9152



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:01<00:15,  1.78s/it][A
 30%|███       | 3/10 [00:01<00:03,  1.94it/s][A
 50%|█████     | 5/10 [00:02<00:02,  1.90it/s][A
 70%|███████   | 7/10 [00:03<00:01,  2.90it/s][A
100%|██████████| 10/10 [00:04<00:00,  2.38it/s][A
Epochs:  38%|███▊      | 29/76 [13:29<22:37, 28.88s/it]

Val Loss: 7.7120 - Val Accuracy: 0.9195



Training:   0%|          | 0/79 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/79 [00:01<02:17,  1.76s/it][A
Training:   4%|▍         | 3/79 [00:01<00:39,  1.93it/s][A
Training:   5%|▌         | 4/79 [00:02<00:27,  2.68it/s][A
Training:   6%|▋         | 5/79 [00:03<00:45,  1.64it/s][A
Training:  11%|█▏        | 9/79 [00:04<00:30,  2.33it/s][A
Training:  13%|█▎        | 10/79 [00:04<00:25,  2.71it/s][A
Training:  15%|█▌        | 12/79 [00:04<00:18,  3.68it/s][A
Training:  16%|█▋        | 13/79 [00:05<00:25,  2.57it/s][A
Training:  19%|█▉        | 15/79 [00:05<00:17,  3.65it/s][A
Training:  22%|██▏       | 17/79 [00:06<00:19,  3.20it/s][A
Training:  23%|██▎       | 18/79 [00:06<00:16,  3.66it/s][A
Training:  25%|██▌       | 20/79 [00:06<00:12,  4.87it/s][A
Training:  27%|██▋       | 21/79 [00:07<00:18,  3.08it/s][A
Training:  28%|██▊       | 22/79 [00:07<00:18,  3.11it/s][A
Training:  30%|███       | 24/79 [00:08<00:12,  4.50it/s][A
Training:  32%|███▏      | 25/79 [00:

Epoch: 30/76 - Loss: 11.0393 - Accuracy: 0.9163



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:01<00:15,  1.73s/it][A
 30%|███       | 3/10 [00:01<00:03,  1.97it/s][A
 50%|█████     | 5/10 [00:02<00:02,  2.12it/s][A
 70%|███████   | 7/10 [00:02<00:00,  3.25it/s][A
100%|██████████| 10/10 [00:03<00:00,  2.55it/s][A
Epochs:  39%|███▉      | 30/76 [13:57<21:55, 28.60s/it]

Val Loss: 23.2295 - Val Accuracy: 0.9418



Training:   0%|          | 0/79 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/79 [00:01<02:21,  1.82s/it][A
Training:   3%|▎         | 2/79 [00:01<01:02,  1.22it/s][A
Training:   5%|▌         | 4/79 [00:02<00:26,  2.82it/s][A
Training:   6%|▋         | 5/79 [00:03<00:38,  1.90it/s][A
Training:   9%|▉         | 7/79 [00:03<00:22,  3.19it/s][A
Training:  10%|█         | 8/79 [00:03<00:18,  3.83it/s][A
Training:  11%|█▏        | 9/79 [00:04<00:29,  2.40it/s][A
Training:  15%|█▌        | 12/79 [00:04<00:14,  4.47it/s][A
Training:  18%|█▊        | 14/79 [00:05<00:21,  3.04it/s][A
Training:  20%|██        | 16/79 [00:05<00:15,  4.10it/s][A
Training:  23%|██▎       | 18/79 [00:06<00:19,  3.14it/s][A
Training:  25%|██▌       | 20/79 [00:06<00:14,  4.18it/s][A
Training:  28%|██▊       | 22/79 [00:07<00:16,  3.51it/s][A
Training:  29%|██▉       | 23/79 [00:07<00:14,  3.96it/s][A
Training:  30%|███       | 24/79 [00:07<00:12,  4.24it/s][A
Training:  32%|███▏      | 25/79 [00:08

Epoch: 31/76 - Loss: 12.2820 - Accuracy: 0.9185



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:01<00:14,  1.63s/it][A
 30%|███       | 3/10 [00:01<00:03,  2.10it/s][A
 50%|█████     | 5/10 [00:02<00:02,  1.99it/s][A
 80%|████████  | 8/10 [00:02<00:00,  3.78it/s][A
100%|██████████| 10/10 [00:04<00:00,  2.48it/s][A
Epochs:  41%|████      | 31/76 [14:25<21:11, 28.26s/it]

Val Loss: 5.1501 - Val Accuracy: 0.9054



Training:   0%|          | 0/79 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/79 [00:01<02:22,  1.82s/it][A
Training:   4%|▍         | 3/79 [00:02<00:41,  1.84it/s][A
Training:   5%|▌         | 4/79 [00:02<00:29,  2.53it/s][A
Training:   6%|▋         | 5/79 [00:03<00:41,  1.79it/s][A
Training:   9%|▉         | 7/79 [00:03<00:22,  3.13it/s][A
Training:  11%|█▏        | 9/79 [00:04<00:25,  2.75it/s][A
Training:  14%|█▍        | 11/79 [00:04<00:17,  3.94it/s][A
Training:  16%|█▋        | 13/79 [00:05<00:24,  2.72it/s][A
Training:  20%|██        | 16/79 [00:05<00:14,  4.25it/s][A
Training:  23%|██▎       | 18/79 [00:06<00:19,  3.15it/s][A
Training:  25%|██▌       | 20/79 [00:06<00:14,  4.09it/s][A
Training:  27%|██▋       | 21/79 [00:07<00:20,  2.85it/s][A
Training:  29%|██▉       | 23/79 [00:07<00:14,  3.95it/s][A
Training:  32%|███▏      | 25/79 [00:08<00:17,  3.12it/s][A
Training:  34%|███▍      | 27/79 [00:08<00:12,  4.21it/s][A
Training:  37%|███▋      | 29/79 [00:0

Epoch: 32/76 - Loss: 11.2608 - Accuracy: 0.9139



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:01<00:12,  1.44s/it][A
 50%|█████     | 5/10 [00:02<00:02,  2.26it/s][A
 70%|███████   | 7/10 [00:02<00:00,  3.38it/s][A
100%|██████████| 10/10 [00:03<00:00,  2.68it/s][A
Epochs:  42%|████▏     | 32/76 [14:52<20:30, 27.96s/it]

Val Loss: 5.0365 - Val Accuracy: 0.9403



Training:   0%|          | 0/79 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/79 [00:01<02:03,  1.58s/it][A
Training:   5%|▌         | 4/79 [00:01<00:24,  3.07it/s][A
Training:   8%|▊         | 6/79 [00:02<00:30,  2.42it/s][A
Training:  11%|█▏        | 9/79 [00:03<00:24,  2.81it/s][A
Training:  14%|█▍        | 11/79 [00:03<00:17,  3.86it/s][A
Training:  16%|█▋        | 13/79 [00:04<00:22,  2.94it/s][A
Training:  18%|█▊        | 14/79 [00:04<00:19,  3.36it/s][A
Training:  20%|██        | 16/79 [00:04<00:13,  4.64it/s][A
Training:  23%|██▎       | 18/79 [00:05<00:19,  3.21it/s][A
Training:  25%|██▌       | 20/79 [00:06<00:13,  4.37it/s][A
Training:  28%|██▊       | 22/79 [00:07<00:17,  3.32it/s][A
Training:  29%|██▉       | 23/79 [00:07<00:15,  3.65it/s][A
Training:  32%|███▏      | 25/79 [00:08<00:18,  2.92it/s][A
Training:  33%|███▎      | 26/79 [00:08<00:16,  3.27it/s][A
Training:  34%|███▍      | 27/79 [00:08<00:14,  3.65it/s][A
Training:  37%|███▋      | 29/79 [00

Epoch: 33/76 - Loss: 8.9500 - Accuracy: 0.9209



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:01<00:14,  1.62s/it][A
 40%|████      | 4/10 [00:01<00:02,  2.91it/s][A
 60%|██████    | 6/10 [00:02<00:01,  2.44it/s][A
 70%|███████   | 7/10 [00:02<00:01,  2.95it/s][A
100%|██████████| 10/10 [00:03<00:00,  2.55it/s][A
Epochs:  43%|████▎     | 33/76 [15:19<19:54, 27.78s/it]

Val Loss: 4.7516 - Val Accuracy: 0.8952



Training:   0%|          | 0/79 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/79 [00:01<02:14,  1.72s/it][A
Training:   6%|▋         | 5/79 [00:02<00:34,  2.12it/s][A
Training:   9%|▉         | 7/79 [00:02<00:22,  3.17it/s][A
Training:  11%|█▏        | 9/79 [00:03<00:25,  2.76it/s][A
Training:  14%|█▍        | 11/79 [00:03<00:17,  3.85it/s][A
Training:  16%|█▋        | 13/79 [00:04<00:22,  2.96it/s][A
Training:  19%|█▉        | 15/79 [00:05<00:16,  3.97it/s][A
Training:  22%|██▏       | 17/79 [00:06<00:22,  2.81it/s][A
Training:  27%|██▋       | 21/79 [00:07<00:18,  3.14it/s][A
Training:  28%|██▊       | 22/79 [00:07<00:16,  3.47it/s][A
Training:  30%|███       | 24/79 [00:07<00:12,  4.44it/s][A
Training:  32%|███▏      | 25/79 [00:08<00:17,  3.02it/s][A
Training:  34%|███▍      | 27/79 [00:08<00:13,  3.99it/s][A
Training:  35%|███▌      | 28/79 [00:08<00:11,  4.47it/s][A
Training:  37%|███▋      | 29/79 [00:09<00:18,  2.76it/s][A
Training:  39%|███▉      | 31/79 [00

Epoch: 34/76 - Loss: 14.4348 - Accuracy: 0.9216



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:01<00:13,  1.48s/it][A
 50%|█████     | 5/10 [00:02<00:02,  2.20it/s][A
 60%|██████    | 6/10 [00:02<00:01,  2.62it/s][A
 80%|████████  | 8/10 [00:02<00:00,  3.99it/s][A
100%|██████████| 10/10 [00:03<00:00,  2.65it/s][A
Epochs:  45%|████▍     | 34/76 [15:47<19:26, 27.78s/it]

Val Loss: 8.7037 - Val Accuracy: 0.9362



Training:   0%|          | 0/79 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/79 [00:01<02:03,  1.58s/it][A
Training:   5%|▌         | 4/79 [00:01<00:25,  2.97it/s][A
Training:   8%|▊         | 6/79 [00:02<00:28,  2.56it/s][A
Training:  10%|█         | 8/79 [00:02<00:19,  3.73it/s][A
Training:  13%|█▎        | 10/79 [00:03<00:26,  2.65it/s][A
Training:  16%|█▋        | 13/79 [00:05<00:24,  2.66it/s][A
Training:  19%|█▉        | 15/79 [00:05<00:18,  3.51it/s][A
Training:  22%|██▏       | 17/79 [00:06<00:22,  2.73it/s][A
Training:  23%|██▎       | 18/79 [00:06<00:19,  3.12it/s][A
Training:  25%|██▌       | 20/79 [00:06<00:14,  4.20it/s][A
Training:  27%|██▋       | 21/79 [00:07<00:22,  2.62it/s][A
Training:  29%|██▉       | 23/79 [00:07<00:14,  3.74it/s][A
Training:  32%|███▏      | 25/79 [00:08<00:18,  2.99it/s][A
Training:  34%|███▍      | 27/79 [00:08<00:13,  3.94it/s][A
Training:  37%|███▋      | 29/79 [00:09<00:16,  3.08it/s][A
Training:  41%|████      | 32/79 [00

Epoch: 35/76 - Loss: 8.2377 - Accuracy: 0.9164



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:01<00:13,  1.52s/it][A
 20%|██        | 2/10 [00:01<00:05,  1.44it/s][A
 40%|████      | 4/10 [00:01<00:01,  3.41it/s][A
 60%|██████    | 6/10 [00:02<00:01,  2.69it/s][A
 80%|████████  | 8/10 [00:02<00:00,  3.97it/s][A
100%|██████████| 10/10 [00:03<00:00,  2.58it/s][A
Epochs:  46%|████▌     | 35/76 [16:15<19:06, 27.96s/it]

Val Loss: 5.1304 - Val Accuracy: 0.9280



Training:   0%|          | 0/79 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/79 [00:01<02:00,  1.55s/it][A
Training:   3%|▎         | 2/79 [00:01<00:53,  1.43it/s][A
Training:   5%|▌         | 4/79 [00:01<00:21,  3.42it/s][A
Training:   8%|▊         | 6/79 [00:02<00:28,  2.58it/s][A
Training:  11%|█▏        | 9/79 [00:04<00:28,  2.46it/s][A
Training:  14%|█▍        | 11/79 [00:04<00:20,  3.37it/s][A
Training:  16%|█▋        | 13/79 [00:05<00:24,  2.71it/s][A
Training:  22%|██▏       | 17/79 [00:06<00:20,  3.09it/s][A
Training:  24%|██▍       | 19/79 [00:06<00:15,  3.77it/s][A
Training:  25%|██▌       | 20/79 [00:06<00:14,  4.11it/s][A
Training:  27%|██▋       | 21/79 [00:07<00:21,  2.68it/s][A
Training:  28%|██▊       | 22/79 [00:07<00:18,  3.15it/s][A
Training:  30%|███       | 24/79 [00:07<00:12,  4.44it/s][A
Training:  32%|███▏      | 25/79 [00:08<00:18,  2.99it/s][A
Training:  34%|███▍      | 27/79 [00:08<00:12,  4.19it/s][A
Training:  35%|███▌      | 28/79 [00:

Epoch: 36/76 - Loss: 6.0633 - Accuracy: 0.9216



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:01<00:12,  1.34s/it][A
 30%|███       | 3/10 [00:01<00:02,  2.46it/s][A
 50%|█████     | 5/10 [00:02<00:02,  2.29it/s][A
 60%|██████    | 6/10 [00:02<00:01,  2.71it/s][A
100%|██████████| 10/10 [00:03<00:00,  2.77it/s][A
Epochs:  47%|████▋     | 36/76 [16:43<18:32, 27.82s/it]

Val Loss: 3.8369 - Val Accuracy: 0.9335



Training:   0%|          | 0/79 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/79 [00:01<02:09,  1.66s/it][A
Training:   5%|▌         | 4/79 [00:01<00:26,  2.83it/s][A
Training:   8%|▊         | 6/79 [00:02<00:28,  2.57it/s][A
Training:  11%|█▏        | 9/79 [00:03<00:25,  2.77it/s][A
Training:  13%|█▎        | 10/79 [00:03<00:23,  2.94it/s][A
Training:  15%|█▌        | 12/79 [00:04<00:16,  3.98it/s][A
Training:  16%|█▋        | 13/79 [00:04<00:20,  3.15it/s][A
Training:  18%|█▊        | 14/79 [00:05<00:21,  3.00it/s][A
Training:  20%|██        | 16/79 [00:05<00:14,  4.31it/s][A
Training:  22%|██▏       | 17/79 [00:05<00:19,  3.11it/s][A
Training:  23%|██▎       | 18/79 [00:06<00:20,  3.02it/s][A
Training:  25%|██▌       | 20/79 [00:06<00:13,  4.35it/s][A
Training:  27%|██▋       | 21/79 [00:06<00:18,  3.17it/s][A
Training:  28%|██▊       | 22/79 [00:07<00:21,  2.60it/s][A
Training:  32%|███▏      | 25/79 [00:08<00:15,  3.39it/s][A
Training:  33%|███▎      | 26/79 [00

Epoch: 37/76 - Loss: 10.7589 - Accuracy: 0.9195



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:01<00:16,  1.81s/it][A
 40%|████      | 4/10 [00:01<00:02,  2.62it/s][A
 60%|██████    | 6/10 [00:03<00:01,  2.22it/s][A
100%|██████████| 10/10 [00:04<00:00,  2.42it/s][A
Epochs:  49%|████▊     | 37/76 [17:10<17:58, 27.65s/it]

Val Loss: 27.7664 - Val Accuracy: 0.9289



Training:   0%|          | 0/79 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/79 [00:01<02:07,  1.64s/it][A
Training:   5%|▌         | 4/79 [00:01<00:26,  2.88it/s][A
Training:   8%|▊         | 6/79 [00:02<00:31,  2.30it/s][A
Training:  11%|█▏        | 9/79 [00:03<00:27,  2.57it/s][A
Training:  13%|█▎        | 10/79 [00:04<00:23,  2.92it/s][A
Training:  15%|█▌        | 12/79 [00:04<00:16,  4.03it/s][A
Training:  16%|█▋        | 13/79 [00:04<00:22,  2.94it/s][A
Training:  18%|█▊        | 14/79 [00:05<00:21,  3.00it/s][A
Training:  20%|██        | 16/79 [00:05<00:14,  4.36it/s][A
Training:  22%|██▏       | 17/79 [00:06<00:21,  2.90it/s][A
Training:  23%|██▎       | 18/79 [00:06<00:19,  3.12it/s][A
Training:  27%|██▋       | 21/79 [00:07<00:17,  3.22it/s][A
Training:  28%|██▊       | 22/79 [00:07<00:16,  3.42it/s][A
Training:  30%|███       | 24/79 [00:07<00:11,  4.79it/s][A
Training:  32%|███▏      | 25/79 [00:08<00:19,  2.75it/s][A
Training:  33%|███▎      | 26/79 [00

Epoch: 38/76 - Loss: 12.4443 - Accuracy: 0.9204



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:01<00:15,  1.71s/it][A
 50%|█████     | 5/10 [00:02<00:02,  1.94it/s][A
100%|██████████| 10/10 [00:04<00:00,  2.48it/s][A
Epochs:  50%|█████     | 38/76 [17:38<17:37, 27.82s/it]

Val Loss: 5.9914 - Val Accuracy: 0.8563



Training:   0%|          | 0/79 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/79 [00:01<01:45,  1.35s/it][A
Training:   3%|▎         | 2/79 [00:01<00:49,  1.55it/s][A
Training:   5%|▌         | 4/79 [00:01<00:20,  3.61it/s][A
Training:   8%|▊         | 6/79 [00:02<00:30,  2.43it/s][A
Training:   9%|▉         | 7/79 [00:02<00:24,  2.98it/s][A
Training:  11%|█▏        | 9/79 [00:03<00:25,  2.75it/s][A
Training:  13%|█▎        | 10/79 [00:03<00:24,  2.82it/s][A
Training:  14%|█▍        | 11/79 [00:04<00:20,  3.36it/s][A
Training:  16%|█▋        | 13/79 [00:04<00:17,  3.70it/s][A
Training:  18%|█▊        | 14/79 [00:05<00:21,  3.07it/s][A
Training:  20%|██        | 16/79 [00:05<00:14,  4.32it/s][A
Training:  22%|██▏       | 17/79 [00:05<00:16,  3.73it/s][A
Training:  23%|██▎       | 18/79 [00:06<00:20,  2.98it/s][A
Training:  27%|██▋       | 21/79 [00:06<00:15,  3.86it/s][A
Training:  28%|██▊       | 22/79 [00:07<00:17,  3.23it/s][A
Training:  29%|██▉       | 23/79 [00:0

Epoch: 39/76 - Loss: 6.9907 - Accuracy: 0.9192



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:01<00:14,  1.65s/it][A
 30%|███       | 3/10 [00:01<00:03,  1.91it/s][A
 50%|█████     | 5/10 [00:02<00:02,  1.95it/s][A
 70%|███████   | 7/10 [00:03<00:01,  2.95it/s][A
100%|██████████| 10/10 [00:03<00:00,  2.59it/s][A
Epochs:  51%|█████▏    | 39/76 [18:05<16:59, 27.56s/it]

Val Loss: 19.9224 - Val Accuracy: 0.9347



Training:   0%|          | 0/79 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/79 [00:01<02:03,  1.58s/it][A
Training:   4%|▍         | 3/79 [00:01<00:35,  2.16it/s][A
Training:   6%|▋         | 5/79 [00:02<00:38,  1.93it/s][A
Training:   9%|▉         | 7/79 [00:02<00:23,  3.08it/s][A
Training:  11%|█▏        | 9/79 [00:04<00:28,  2.47it/s][A
Training:  14%|█▍        | 11/79 [00:04<00:19,  3.46it/s][A
Training:  16%|█▋        | 13/79 [00:05<00:24,  2.74it/s][A
Training:  19%|█▉        | 15/79 [00:05<00:17,  3.72it/s][A
Training:  20%|██        | 16/79 [00:05<00:15,  4.19it/s][A
Training:  22%|██▏       | 17/79 [00:06<00:23,  2.63it/s][A
Training:  25%|██▌       | 20/79 [00:06<00:13,  4.51it/s][A
Training:  28%|██▊       | 22/79 [00:07<00:17,  3.28it/s][A
Training:  32%|███▏      | 25/79 [00:08<00:18,  2.94it/s][A
Training:  34%|███▍      | 27/79 [00:08<00:13,  3.78it/s][A
Training:  35%|███▌      | 28/79 [00:08<00:12,  4.20it/s][A
Training:  37%|███▋      | 29/79 [00:

Epoch: 40/76 - Loss: 11.0340 - Accuracy: 0.9175



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:01<00:12,  1.37s/it][A
 30%|███       | 3/10 [00:01<00:02,  2.45it/s][A
 50%|█████     | 5/10 [00:02<00:02,  2.22it/s][A
 70%|███████   | 7/10 [00:02<00:00,  3.44it/s][A
100%|██████████| 10/10 [00:03<00:00,  2.83it/s][A
Epochs:  53%|█████▎    | 40/76 [18:33<16:30, 27.51s/it]

Val Loss: 3.6276 - Val Accuracy: 0.9161



Training:   0%|          | 0/79 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/79 [00:01<02:07,  1.63s/it][A
Training:   4%|▍         | 3/79 [00:01<00:36,  2.08it/s][A
Training:   5%|▌         | 4/79 [00:01<00:26,  2.84it/s][A
Training:   6%|▋         | 5/79 [00:02<00:41,  1.79it/s][A
Training:  10%|█         | 8/79 [00:03<00:18,  3.76it/s][A
Training:  11%|█▏        | 9/79 [00:04<00:28,  2.42it/s][A
Training:  15%|█▌        | 12/79 [00:04<00:15,  4.30it/s][A
Training:  18%|█▊        | 14/79 [00:05<00:20,  3.21it/s][A
Training:  20%|██        | 16/79 [00:05<00:15,  4.19it/s][A
Training:  23%|██▎       | 18/79 [00:06<00:20,  3.00it/s][A
Training:  25%|██▌       | 20/79 [00:06<00:14,  4.05it/s][A
Training:  28%|██▊       | 22/79 [00:07<00:18,  3.06it/s][A
Training:  32%|███▏      | 25/79 [00:08<00:17,  3.01it/s][A
Training:  33%|███▎      | 26/79 [00:08<00:15,  3.37it/s][A
Training:  35%|███▌      | 28/79 [00:08<00:11,  4.52it/s][A
Training:  38%|███▊      | 30/79 [00:0

Epoch: 41/76 - Loss: 8.0533 - Accuracy: 0.9192



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:01<00:14,  1.63s/it][A
 20%|██        | 2/10 [00:01<00:06,  1.30it/s][A
 50%|█████     | 5/10 [00:02<00:02,  2.11it/s][A
 60%|██████    | 6/10 [00:03<00:01,  2.39it/s][A
100%|██████████| 10/10 [00:04<00:00,  2.46it/s][A
Epochs:  54%|█████▍    | 41/76 [19:00<16:01, 27.46s/it]

Val Loss: 5.4057 - Val Accuracy: 0.9370



Training:   0%|          | 0/79 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/79 [00:01<02:17,  1.76s/it][A
Training:   4%|▍         | 3/79 [00:01<00:38,  2.00it/s][A
Training:   6%|▋         | 5/79 [00:03<00:41,  1.80it/s][A
Training:   8%|▊         | 6/79 [00:03<00:31,  2.31it/s][A
Training:   9%|▉         | 7/79 [00:03<00:24,  2.94it/s][A
Training:  11%|█▏        | 9/79 [00:04<00:28,  2.42it/s][A
Training:  15%|█▌        | 12/79 [00:04<00:15,  4.29it/s][A
Training:  18%|█▊        | 14/79 [00:05<00:21,  2.97it/s][A
Training:  19%|█▉        | 15/79 [00:05<00:19,  3.35it/s][A
Training:  22%|██▏       | 17/79 [00:06<00:22,  2.78it/s][A
Training:  23%|██▎       | 18/79 [00:06<00:18,  3.23it/s][A
Training:  24%|██▍       | 19/79 [00:06<00:15,  3.77it/s][A
Training:  27%|██▋       | 21/79 [00:07<00:18,  3.16it/s][A
Training:  29%|██▉       | 23/79 [00:07<00:13,  4.22it/s][A
Training:  30%|███       | 24/79 [00:07<00:11,  4.69it/s][A
Training:  32%|███▏      | 25/79 [00:0

Epoch: 42/76 - Loss: 6.9221 - Accuracy: 0.9217



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:01<00:14,  1.56s/it][A
 30%|███       | 3/10 [00:01<00:03,  2.10it/s][A
 50%|█████     | 5/10 [00:02<00:02,  2.18it/s][A
 70%|███████   | 7/10 [00:02<00:00,  3.44it/s][A
100%|██████████| 10/10 [00:03<00:00,  2.61it/s][A
Epochs:  55%|█████▌    | 42/76 [19:28<15:39, 27.63s/it]

Val Loss: 12.4251 - Val Accuracy: 0.9237



Training:   0%|          | 0/79 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/79 [00:01<01:55,  1.49s/it][A
Training:   5%|▌         | 4/79 [00:01<00:23,  3.15it/s][A
Training:   8%|▊         | 6/79 [00:02<00:32,  2.24it/s][A
Training:   9%|▉         | 7/79 [00:02<00:26,  2.68it/s][A
Training:  10%|█         | 8/79 [00:03<00:21,  3.25it/s][A
Training:  11%|█▏        | 9/79 [00:03<00:29,  2.40it/s][A
Training:  14%|█▍        | 11/79 [00:04<00:19,  3.41it/s][A
Training:  15%|█▌        | 12/79 [00:04<00:17,  3.92it/s][A
Training:  16%|█▋        | 13/79 [00:04<00:24,  2.73it/s][A
Training:  18%|█▊        | 14/79 [00:05<00:20,  3.24it/s][A
Training:  19%|█▉        | 15/79 [00:05<00:19,  3.34it/s][A
Training:  20%|██        | 16/79 [00:05<00:17,  3.65it/s][A
Training:  22%|██▏       | 17/79 [00:06<00:22,  2.79it/s][A
Training:  23%|██▎       | 18/79 [00:06<00:21,  2.84it/s][A
Training:  25%|██▌       | 20/79 [00:06<00:17,  3.47it/s][A
Training:  27%|██▋       | 21/79 [00:0

Epoch: 43/76 - Loss: 34.3022 - Accuracy: 0.9019



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:01<00:11,  1.33s/it][A
 20%|██        | 2/10 [00:01<00:05,  1.58it/s][A
 40%|████      | 4/10 [00:01<00:01,  3.67it/s][A
 60%|██████    | 6/10 [00:02<00:01,  2.55it/s][A
100%|██████████| 10/10 [00:03<00:00,  2.73it/s][A
Epochs:  57%|█████▋    | 43/76 [19:56<15:17, 27.80s/it]

Val Loss: 35.2980 - Val Accuracy: 0.8985



Training:   0%|          | 0/79 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/79 [00:01<01:57,  1.50s/it][A
Training:   5%|▌         | 4/79 [00:01<00:23,  3.14it/s][A
Training:   8%|▊         | 6/79 [00:02<00:32,  2.24it/s][A
Training:  10%|█         | 8/79 [00:03<00:21,  3.29it/s][A
Training:  13%|█▎        | 10/79 [00:04<00:27,  2.50it/s][A
Training:  16%|█▋        | 13/79 [00:05<00:25,  2.55it/s][A
Training:  19%|█▉        | 15/79 [00:05<00:19,  3.32it/s][A
Training:  20%|██        | 16/79 [00:05<00:16,  3.75it/s][A
Training:  22%|██▏       | 17/79 [00:06<00:25,  2.43it/s][A
Training:  27%|██▋       | 21/79 [00:07<00:19,  2.94it/s][A
Training:  29%|██▉       | 23/79 [00:07<00:14,  3.75it/s][A
Training:  32%|███▏      | 25/79 [00:08<00:18,  2.91it/s][A
Training:  34%|███▍      | 27/79 [00:09<00:13,  3.76it/s][A
Training:  35%|███▌      | 28/79 [00:09<00:12,  4.17it/s][A
Training:  37%|███▋      | 29/79 [00:10<00:18,  2.67it/s][A
Training:  39%|███▉      | 31/79 [00

Epoch: 44/76 - Loss: 22.4026 - Accuracy: 0.9126



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:01<00:12,  1.38s/it][A
 40%|████      | 4/10 [00:01<00:01,  3.38it/s][A
 60%|██████    | 6/10 [00:02<00:01,  2.60it/s][A
100%|██████████| 10/10 [00:03<00:00,  2.70it/s][A
Epochs:  58%|█████▊    | 44/76 [20:24<14:43, 27.62s/it]

Val Loss: 12.2906 - Val Accuracy: 0.9309



Training:   0%|          | 0/79 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/79 [00:01<02:05,  1.61s/it][A
Training:   4%|▍         | 3/79 [00:01<00:36,  2.11it/s][A
Training:   6%|▋         | 5/79 [00:02<00:37,  1.99it/s][A
Training:   8%|▊         | 6/79 [00:02<00:29,  2.43it/s][A
Training:  11%|█▏        | 9/79 [00:03<00:25,  2.74it/s][A
Training:  13%|█▎        | 10/79 [00:04<00:23,  2.93it/s][A
Training:  15%|█▌        | 12/79 [00:04<00:16,  4.06it/s][A
Training:  16%|█▋        | 13/79 [00:05<00:22,  2.91it/s][A
Training:  18%|█▊        | 14/79 [00:05<00:20,  3.24it/s][A
Training:  20%|██        | 16/79 [00:05<00:13,  4.73it/s][A
Training:  22%|██▏       | 17/79 [00:06<00:21,  2.91it/s][A
Training:  23%|██▎       | 18/79 [00:06<00:20,  2.95it/s][A
Training:  25%|██▌       | 20/79 [00:06<00:13,  4.24it/s][A
Training:  27%|██▋       | 21/79 [00:07<00:20,  2.83it/s][A
Training:  28%|██▊       | 22/79 [00:07<00:20,  2.74it/s][A
Training:  30%|███       | 24/79 [00:

Epoch: 45/76 - Loss: 10.5898 - Accuracy: 0.9224



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:01<00:14,  1.62s/it][A
 30%|███       | 3/10 [00:01<00:03,  2.18it/s][A
 50%|█████     | 5/10 [00:02<00:02,  2.08it/s][A
 80%|████████  | 8/10 [00:02<00:00,  3.93it/s][A
100%|██████████| 10/10 [00:03<00:00,  2.56it/s][A
Epochs:  59%|█████▉    | 45/76 [20:51<14:17, 27.65s/it]

Val Loss: 16.4285 - Val Accuracy: 0.9281



Training:   0%|          | 0/79 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/79 [00:01<02:15,  1.74s/it][A
Training:   5%|▌         | 4/79 [00:01<00:27,  2.76it/s][A
Training:   8%|▊         | 6/79 [00:02<00:31,  2.34it/s][A
Training:   9%|▉         | 7/79 [00:03<00:25,  2.82it/s][A
Training:  11%|█▏        | 9/79 [00:04<00:29,  2.38it/s][A
Training:  14%|█▍        | 11/79 [00:04<00:20,  3.35it/s][A
Training:  16%|█▋        | 13/79 [00:05<00:24,  2.69it/s][A
Training:  19%|█▉        | 15/79 [00:05<00:17,  3.74it/s][A
Training:  22%|██▏       | 17/79 [00:06<00:21,  2.91it/s][A
Training:  27%|██▋       | 21/79 [00:07<00:19,  3.03it/s][A
Training:  29%|██▉       | 23/79 [00:07<00:14,  3.75it/s][A
Training:  32%|███▏      | 25/79 [00:08<00:16,  3.30it/s][A
Training:  37%|███▋      | 29/79 [00:09<00:15,  3.28it/s][A
Training:  41%|████      | 32/79 [00:09<00:10,  4.46it/s][A
Training:  42%|████▏     | 33/79 [00:11<00:15,  2.98it/s][A
Training:  44%|████▍     | 35/79 [00:

Epoch: 46/76 - Loss: 6.1253 - Accuracy: 0.9230



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:01<00:13,  1.48s/it][A
 20%|██        | 2/10 [00:01<00:05,  1.47it/s][A
 40%|████      | 4/10 [00:01<00:01,  3.34it/s][A
 50%|█████     | 5/10 [00:02<00:02,  1.81it/s][A
 80%|████████  | 8/10 [00:02<00:00,  3.87it/s][A
100%|██████████| 10/10 [00:03<00:00,  2.51it/s][A
Epochs:  61%|██████    | 46/76 [21:19<13:47, 27.57s/it]

Val Loss: 9.5102 - Val Accuracy: 0.9084



Training:   0%|          | 0/79 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/79 [00:01<02:06,  1.63s/it][A
Training:   3%|▎         | 2/79 [00:01<00:56,  1.36it/s][A
Training:   5%|▌         | 4/79 [00:01<00:23,  3.15it/s][A
Training:   6%|▋         | 5/79 [00:02<00:38,  1.94it/s][A
Training:  10%|█         | 8/79 [00:02<00:17,  4.02it/s][A
Training:  13%|█▎        | 10/79 [00:04<00:26,  2.65it/s][A
Training:  15%|█▌        | 12/79 [00:04<00:18,  3.72it/s][A
Training:  18%|█▊        | 14/79 [00:05<00:24,  2.63it/s][A
Training:  20%|██        | 16/79 [00:05<00:17,  3.54it/s][A
Training:  23%|██▎       | 18/79 [00:06<00:22,  2.74it/s][A
Training:  27%|██▋       | 21/79 [00:07<00:21,  2.67it/s][A
Training:  29%|██▉       | 23/79 [00:08<00:16,  3.45it/s][A
Training:  32%|███▏      | 25/79 [00:09<00:19,  2.76it/s][A
Training:  35%|███▌      | 28/79 [00:09<00:12,  4.13it/s][A
Training:  38%|███▊      | 30/79 [00:10<00:14,  3.41it/s][A
Training:  39%|███▉      | 31/79 [00:

Epoch: 47/76 - Loss: 5.5681 - Accuracy: 0.9262



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:01<00:15,  1.74s/it][A
 50%|█████     | 5/10 [00:02<00:02,  2.03it/s][A
100%|██████████| 10/10 [00:04<00:00,  2.47it/s][A
Epochs:  62%|██████▏   | 47/76 [21:47<13:22, 27.67s/it]

Val Loss: 4.3489 - Val Accuracy: 0.9375



Training:   0%|          | 0/79 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/79 [00:01<02:07,  1.64s/it][A
Training:   5%|▌         | 4/79 [00:01<00:29,  2.55it/s][A
Training:   6%|▋         | 5/79 [00:02<00:39,  1.88it/s][A
Training:   9%|▉         | 7/79 [00:03<00:24,  2.91it/s][A
Training:  11%|█▏        | 9/79 [00:03<00:26,  2.60it/s][A
Training:  14%|█▍        | 11/79 [00:04<00:18,  3.67it/s][A
Training:  15%|█▌        | 12/79 [00:04<00:16,  4.10it/s][A
Training:  16%|█▋        | 13/79 [00:05<00:28,  2.31it/s][A
Training:  19%|█▉        | 15/79 [00:05<00:18,  3.40it/s][A
Training:  22%|██▏       | 17/79 [00:06<00:24,  2.56it/s][A
Training:  23%|██▎       | 18/79 [00:06<00:20,  2.96it/s][A
Training:  25%|██▌       | 20/79 [00:06<00:13,  4.26it/s][A
Training:  27%|██▋       | 21/79 [00:07<00:22,  2.58it/s][A
Training:  30%|███       | 24/79 [00:07<00:12,  4.42it/s][A
Training:  33%|███▎      | 26/79 [00:08<00:16,  3.16it/s][A
Training:  35%|███▌      | 28/79 [00:

Epoch: 48/76 - Loss: 11.6045 - Accuracy: 0.9215



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:01<00:13,  1.46s/it][A
 20%|██        | 2/10 [00:01<00:05,  1.52it/s][A
 50%|█████     | 5/10 [00:02<00:02,  2.38it/s][A
 70%|███████   | 7/10 [00:02<00:00,  3.62it/s][A
100%|██████████| 10/10 [00:03<00:00,  2.63it/s][A
Epochs:  63%|██████▎   | 48/76 [22:14<12:53, 27.63s/it]

Val Loss: 11.6640 - Val Accuracy: 0.8961



Training:   0%|          | 0/79 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/79 [00:01<01:53,  1.45s/it][A
Training:   4%|▍         | 3/79 [00:01<00:31,  2.42it/s][A
Training:   6%|▋         | 5/79 [00:02<00:36,  2.02it/s][A
Training:   9%|▉         | 7/79 [00:02<00:22,  3.25it/s][A
Training:  11%|█▏        | 9/79 [00:04<00:30,  2.32it/s][A
Training:  13%|█▎        | 10/79 [00:04<00:25,  2.74it/s][A
Training:  16%|█▋        | 13/79 [00:05<00:23,  2.84it/s][A
Training:  19%|█▉        | 15/79 [00:05<00:16,  3.86it/s][A
Training:  22%|██▏       | 17/79 [00:06<00:21,  2.93it/s][A
Training:  25%|██▌       | 20/79 [00:06<00:13,  4.53it/s][A
Training:  28%|██▊       | 22/79 [00:07<00:17,  3.18it/s][A
Training:  32%|███▏      | 25/79 [00:08<00:16,  3.18it/s][A
Training:  34%|███▍      | 27/79 [00:08<00:13,  3.90it/s][A
Training:  37%|███▋      | 29/79 [00:09<00:15,  3.13it/s][A
Training:  39%|███▉      | 31/79 [00:09<00:12,  3.97it/s][A
Training:  42%|████▏     | 33/79 [00:

Epoch: 49/76 - Loss: 10.9831 - Accuracy: 0.9229



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:01<00:14,  1.60s/it][A
 30%|███       | 3/10 [00:01<00:03,  2.21it/s][A
 50%|█████     | 5/10 [00:02<00:02,  2.22it/s][A
 70%|███████   | 7/10 [00:02<00:00,  3.42it/s][A
100%|██████████| 10/10 [00:03<00:00,  2.65it/s][A
Epochs:  64%|██████▍   | 49/76 [22:41<12:21, 27.46s/it]

Val Loss: 27.5170 - Val Accuracy: 0.9381



Training:   0%|          | 0/79 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/79 [00:01<01:57,  1.51s/it][A
Training:   3%|▎         | 2/79 [00:01<00:59,  1.30it/s][A
Training:   5%|▌         | 4/79 [00:01<00:24,  3.09it/s][A
Training:   6%|▋         | 5/79 [00:02<00:34,  2.12it/s][A
Training:   8%|▊         | 6/79 [00:02<00:26,  2.71it/s][A
Training:  10%|█         | 8/79 [00:02<00:16,  4.32it/s][A
Training:  11%|█▏        | 9/79 [00:03<00:29,  2.38it/s][A
Training:  13%|█▎        | 10/79 [00:04<00:23,  2.89it/s][A
Training:  15%|█▌        | 12/79 [00:04<00:14,  4.53it/s][A
Training:  18%|█▊        | 14/79 [00:05<00:21,  2.97it/s][A
Training:  20%|██        | 16/79 [00:05<00:15,  4.01it/s][A
Training:  22%|██▏       | 17/79 [00:06<00:23,  2.64it/s][A
Training:  23%|██▎       | 18/79 [00:06<00:19,  3.13it/s][A
Training:  25%|██▌       | 20/79 [00:06<00:13,  4.42it/s][A
Training:  27%|██▋       | 21/79 [00:07<00:20,  2.82it/s][A
Training:  29%|██▉       | 23/79 [00:07

Epoch: 50/76 - Loss: 11.7781 - Accuracy: 0.9170



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:01<00:14,  1.62s/it][A
 30%|███       | 3/10 [00:01<00:03,  2.12it/s][A
 50%|█████     | 5/10 [00:02<00:02,  2.13it/s][A
 60%|██████    | 6/10 [00:02<00:01,  2.70it/s][A
100%|██████████| 10/10 [00:03<00:00,  2.56it/s][A
Epochs:  66%|██████▌   | 50/76 [23:09<11:59, 27.66s/it]

Val Loss: 6.2466 - Val Accuracy: 0.9374



Training:   0%|          | 0/79 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/79 [00:01<02:08,  1.64s/it][A
Training:   4%|▍         | 3/79 [00:01<00:36,  2.07it/s][A
Training:   6%|▋         | 5/79 [00:02<00:39,  1.88it/s][A
Training:   9%|▉         | 7/79 [00:03<00:24,  2.97it/s][A
Training:  11%|█▏        | 9/79 [00:03<00:24,  2.81it/s][A
Training:  14%|█▍        | 11/79 [00:04<00:17,  3.88it/s][A
Training:  16%|█▋        | 13/79 [00:04<00:21,  3.05it/s][A
Training:  19%|█▉        | 15/79 [00:05<00:17,  3.73it/s][A
Training:  20%|██        | 16/79 [00:05<00:15,  4.14it/s][A
Training:  22%|██▏       | 17/79 [00:06<00:20,  2.98it/s][A
Training:  23%|██▎       | 18/79 [00:06<00:17,  3.47it/s][A
Training:  24%|██▍       | 19/79 [00:06<00:15,  3.85it/s][A
Training:  27%|██▋       | 21/79 [00:07<00:18,  3.07it/s][A
Training:  28%|██▊       | 22/79 [00:07<00:17,  3.30it/s][A
Training:  32%|███▏      | 25/79 [00:08<00:16,  3.28it/s][A
Training:  33%|███▎      | 26/79 [00:

Epoch: 51/76 - Loss: 9.3408 - Accuracy: 0.9212



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:01<00:12,  1.40s/it][A
 40%|████      | 4/10 [00:01<00:01,  3.04it/s][A
 50%|█████     | 5/10 [00:02<00:02,  2.17it/s][A
 80%|████████  | 8/10 [00:02<00:00,  3.85it/s][A
100%|██████████| 10/10 [00:03<00:00,  2.64it/s][A
Epochs:  67%|██████▋   | 51/76 [23:36<11:27, 27.51s/it]

Val Loss: 5.2374 - Val Accuracy: 0.9371



Training:   0%|          | 0/79 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/79 [00:01<02:04,  1.59s/it][A
Training:   3%|▎         | 2/79 [00:01<00:56,  1.36it/s][A
Training:   5%|▌         | 4/79 [00:01<00:24,  3.12it/s][A
Training:   6%|▋         | 5/79 [00:02<00:37,  1.96it/s][A
Training:  11%|█▏        | 9/79 [00:03<00:25,  2.72it/s][A
Training:  13%|█▎        | 10/79 [00:04<00:22,  3.12it/s][A
Training:  15%|█▌        | 12/79 [00:04<00:15,  4.38it/s][A
Training:  18%|█▊        | 14/79 [00:05<00:21,  3.08it/s][A
Training:  20%|██        | 16/79 [00:05<00:15,  4.09it/s][A
Training:  22%|██▏       | 17/79 [00:06<00:22,  2.78it/s][A
Training:  27%|██▋       | 21/79 [00:07<00:18,  3.10it/s][A
Training:  29%|██▉       | 23/79 [00:07<00:14,  3.90it/s][A
Training:  32%|███▏      | 25/79 [00:08<00:17,  3.08it/s][A
Training:  34%|███▍      | 27/79 [00:08<00:13,  3.95it/s][A
Training:  37%|███▋      | 29/79 [00:09<00:16,  3.12it/s][A
Training:  39%|███▉      | 31/79 [00:

Epoch: 52/76 - Loss: 12.6791 - Accuracy: 0.9174



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:01<00:14,  1.56s/it][A
 30%|███       | 3/10 [00:01<00:03,  2.17it/s][A
 50%|█████     | 5/10 [00:02<00:02,  2.02it/s][A
 70%|███████   | 7/10 [00:02<00:00,  3.14it/s][A
 80%|████████  | 8/10 [00:03<00:00,  3.67it/s][A
100%|██████████| 10/10 [00:03<00:00,  2.52it/s][A
Epochs:  68%|██████▊   | 52/76 [24:04<10:58, 27.44s/it]

Val Loss: 10.9713 - Val Accuracy: 0.9237



Training:   0%|          | 0/79 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/79 [00:01<02:01,  1.56s/it][A
Training:   4%|▍         | 3/79 [00:01<00:33,  2.26it/s][A
Training:   6%|▋         | 5/79 [00:02<00:36,  2.04it/s][A
Training:   8%|▊         | 6/79 [00:02<00:28,  2.53it/s][A
Training:  10%|█         | 8/79 [00:03<00:17,  3.96it/s][A
Training:  13%|█▎        | 10/79 [00:04<00:24,  2.82it/s][A
Training:  15%|█▌        | 12/79 [00:04<00:16,  3.95it/s][A
Training:  16%|█▋        | 13/79 [00:05<00:25,  2.59it/s][A
Training:  18%|█▊        | 14/79 [00:05<00:21,  3.06it/s][A
Training:  20%|██        | 16/79 [00:05<00:14,  4.45it/s][A
Training:  22%|██▏       | 17/79 [00:06<00:23,  2.65it/s][A
Training:  24%|██▍       | 19/79 [00:06<00:15,  3.94it/s][A
Training:  27%|██▋       | 21/79 [00:07<00:19,  2.94it/s][A
Training:  29%|██▉       | 23/79 [00:07<00:13,  4.02it/s][A
Training:  32%|███▏      | 25/79 [00:08<00:15,  3.54it/s][A
Training:  33%|███▎      | 26/79 [00:

Epoch: 53/76 - Loss: 5.3111 - Accuracy: 0.9255



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:01<00:14,  1.62s/it][A
 20%|██        | 2/10 [00:01<00:06,  1.29it/s][A
 40%|████      | 4/10 [00:01<00:01,  3.06it/s][A
 50%|█████     | 5/10 [00:02<00:02,  2.04it/s][A
 60%|██████    | 6/10 [00:02<00:01,  2.58it/s][A
 90%|█████████ | 9/10 [00:03<00:00,  3.09it/s][A
100%|██████████| 10/10 [00:03<00:00,  2.50it/s][A
Epochs:  70%|██████▉   | 53/76 [24:31<10:29, 27.38s/it]

Val Loss: 3.9256 - Val Accuracy: 0.9342



Training:   0%|          | 0/79 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/79 [00:01<01:59,  1.54s/it][A
Training:   4%|▍         | 3/79 [00:01<00:34,  2.20it/s][A
Training:   5%|▌         | 4/79 [00:01<00:25,  2.97it/s][A
Training:   6%|▋         | 5/79 [00:02<00:39,  1.88it/s][A
Training:   9%|▉         | 7/79 [00:02<00:22,  3.19it/s][A
Training:  11%|█▏        | 9/79 [00:03<00:27,  2.57it/s][A
Training:  14%|█▍        | 11/79 [00:04<00:18,  3.62it/s][A
Training:  16%|█▋        | 13/79 [00:05<00:24,  2.67it/s][A
Training:  19%|█▉        | 15/79 [00:05<00:17,  3.61it/s][A
Training:  22%|██▏       | 17/79 [00:06<00:22,  2.80it/s][A
Training:  27%|██▋       | 21/79 [00:07<00:19,  2.97it/s][A
Training:  30%|███       | 24/79 [00:07<00:12,  4.27it/s][A
Training:  33%|███▎      | 26/79 [00:08<00:16,  3.21it/s][A
Training:  35%|███▌      | 28/79 [00:09<00:12,  3.97it/s][A
Training:  38%|███▊      | 30/79 [00:09<00:14,  3.37it/s][A
Training:  42%|████▏     | 33/79 [00:1

Epoch: 54/76 - Loss: 36.9886 - Accuracy: 0.9049



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:01<00:14,  1.62s/it][A
 20%|██        | 2/10 [00:01<00:06,  1.28it/s][A
 50%|█████     | 5/10 [00:02<00:02,  2.11it/s][A
 60%|██████    | 6/10 [00:02<00:01,  2.63it/s][A
 80%|████████  | 8/10 [00:03<00:00,  4.08it/s][A
100%|██████████| 10/10 [00:04<00:00,  2.44it/s][A
Epochs:  71%|███████   | 54/76 [24:59<10:04, 27.50s/it]

Val Loss: 14.4098 - Val Accuracy: 0.9412



Training:   0%|          | 0/79 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/79 [00:01<01:55,  1.48s/it][A
Training:   4%|▍         | 3/79 [00:01<00:33,  2.27it/s][A
Training:   6%|▋         | 5/79 [00:02<00:37,  1.97it/s][A
Training:   9%|▉         | 7/79 [00:02<00:22,  3.17it/s][A
Training:  11%|█▏        | 9/79 [00:04<00:28,  2.45it/s][A
Training:  16%|█▋        | 13/79 [00:05<00:21,  3.02it/s][A
Training:  20%|██        | 16/79 [00:05<00:14,  4.21it/s][A
Training:  22%|██▏       | 17/79 [00:06<00:21,  2.91it/s][A
Training:  24%|██▍       | 19/79 [00:06<00:15,  3.87it/s][A
Training:  27%|██▋       | 21/79 [00:07<00:19,  2.94it/s][A
Training:  29%|██▉       | 23/79 [00:07<00:14,  3.76it/s][A
Training:  32%|███▏      | 25/79 [00:08<00:18,  2.92it/s][A
Training:  35%|███▌      | 28/79 [00:08<00:11,  4.36it/s][A
Training:  38%|███▊      | 30/79 [00:09<00:15,  3.17it/s][A
Training:  41%|████      | 32/79 [00:10<00:11,  3.98it/s][A
Training:  42%|████▏     | 33/79 [00:

Epoch: 55/76 - Loss: 10.1753 - Accuracy: 0.9185



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:01<00:14,  1.59s/it][A
 30%|███       | 3/10 [00:01<00:03,  2.13it/s][A
 50%|█████     | 5/10 [00:02<00:02,  2.14it/s][A
 60%|██████    | 6/10 [00:02<00:01,  2.50it/s][A
100%|██████████| 10/10 [00:04<00:00,  2.49it/s][A
Epochs:  72%|███████▏  | 55/76 [25:26<09:35, 27.42s/it]

Val Loss: 3.5493 - Val Accuracy: 0.9015



Training:   0%|          | 0/79 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/79 [00:01<01:55,  1.48s/it][A
Training:   3%|▎         | 2/79 [00:01<00:54,  1.42it/s][A
Training:   5%|▌         | 4/79 [00:01<00:22,  3.29it/s][A
Training:   6%|▋         | 5/79 [00:02<00:36,  2.02it/s][A
Training:   9%|▉         | 7/79 [00:02<00:23,  3.03it/s][A
Training:  10%|█         | 8/79 [00:03<00:19,  3.61it/s][A
Training:  11%|█▏        | 9/79 [00:03<00:28,  2.43it/s][A
Training:  13%|█▎        | 10/79 [00:04<00:27,  2.54it/s][A
Training:  15%|█▌        | 12/79 [00:04<00:16,  3.96it/s][A
Training:  16%|█▋        | 13/79 [00:05<00:23,  2.81it/s][A
Training:  18%|█▊        | 14/79 [00:05<00:21,  3.05it/s][A
Training:  19%|█▉        | 15/79 [00:05<00:17,  3.70it/s][A
Training:  22%|██▏       | 17/79 [00:06<00:19,  3.22it/s][A
Training:  23%|██▎       | 18/79 [00:06<00:18,  3.31it/s][A
Training:  24%|██▍       | 19/79 [00:06<00:15,  3.97it/s][A
Training:  27%|██▋       | 21/79 [00:07

Epoch: 56/76 - Loss: 19.4734 - Accuracy: 0.9191



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:01<00:15,  1.67s/it][A
 30%|███       | 3/10 [00:01<00:03,  2.11it/s][A
 50%|█████     | 5/10 [00:02<00:02,  1.96it/s][A
100%|██████████| 10/10 [00:03<00:00,  2.54it/s][A
Epochs:  74%|███████▎  | 56/76 [25:53<09:08, 27.43s/it]

Val Loss: 21.4098 - Val Accuracy: 0.9450



Training:   0%|          | 0/79 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/79 [00:01<01:52,  1.44s/it][A
Training:   3%|▎         | 2/79 [00:01<01:00,  1.28it/s][A
Training:   5%|▌         | 4/79 [00:01<00:25,  2.99it/s][A
Training:   6%|▋         | 5/79 [00:02<00:30,  2.43it/s][A
Training:   8%|▊         | 6/79 [00:03<00:34,  2.12it/s][A
Training:   9%|▉         | 7/79 [00:03<00:25,  2.78it/s][A
Training:  11%|█▏        | 9/79 [00:03<00:19,  3.59it/s][A
Training:  13%|█▎        | 10/79 [00:04<00:28,  2.39it/s][A
Training:  15%|█▌        | 12/79 [00:04<00:17,  3.75it/s][A
Training:  16%|█▋        | 13/79 [00:04<00:15,  4.15it/s][A
Training:  18%|█▊        | 14/79 [00:05<00:25,  2.60it/s][A
Training:  22%|██▏       | 17/79 [00:05<00:13,  4.51it/s][A
Training:  23%|██▎       | 18/79 [00:06<00:22,  2.75it/s][A
Training:  27%|██▋       | 21/79 [00:06<00:12,  4.52it/s][A
Training:  29%|██▉       | 23/79 [00:07<00:16,  3.38it/s][A
Training:  33%|███▎      | 26/79 [00:08

Epoch: 57/76 - Loss: 15.4066 - Accuracy: 0.9228



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:01<00:15,  1.76s/it][A
 40%|████      | 4/10 [00:01<00:02,  2.72it/s][A
 60%|██████    | 6/10 [00:02<00:01,  2.29it/s][A
100%|██████████| 10/10 [00:04<00:00,  2.43it/s][A
Epochs:  75%|███████▌  | 57/76 [26:21<08:44, 27.61s/it]

Val Loss: 10.9429 - Val Accuracy: 0.9246



Training:   0%|          | 0/79 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/79 [00:01<02:12,  1.70s/it][A
Training:   4%|▍         | 3/79 [00:01<00:37,  2.05it/s][A
Training:   6%|▋         | 5/79 [00:02<00:38,  1.93it/s][A
Training:   9%|▉         | 7/79 [00:03<00:23,  3.04it/s][A
Training:  11%|█▏        | 9/79 [00:04<00:27,  2.51it/s][A
Training:  15%|█▌        | 12/79 [00:04<00:15,  4.20it/s][A
Training:  18%|█▊        | 14/79 [00:05<00:21,  3.09it/s][A
Training:  22%|██▏       | 17/79 [00:06<00:19,  3.17it/s][A
Training:  23%|██▎       | 18/79 [00:06<00:17,  3.53it/s][A
Training:  25%|██▌       | 20/79 [00:06<00:12,  4.69it/s][A
Training:  28%|██▊       | 22/79 [00:07<00:17,  3.18it/s][A
Training:  30%|███       | 24/79 [00:07<00:13,  4.19it/s][A
Training:  33%|███▎      | 26/79 [00:08<00:16,  3.14it/s][A
Training:  35%|███▌      | 28/79 [00:08<00:12,  4.17it/s][A
Training:  38%|███▊      | 30/79 [00:09<00:14,  3.38it/s][A
Training:  41%|████      | 32/79 [00:

Epoch: 58/76 - Loss: 10.6119 - Accuracy: 0.9232



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:01<00:14,  1.58s/it][A
 20%|██        | 2/10 [00:01<00:05,  1.41it/s][A
 40%|████      | 4/10 [00:01<00:01,  3.22it/s][A
 50%|█████     | 5/10 [00:02<00:02,  1.93it/s][A
 70%|███████   | 7/10 [00:03<00:00,  3.14it/s][A
100%|██████████| 10/10 [00:03<00:00,  2.57it/s][A
Epochs:  76%|███████▋  | 58/76 [26:49<08:14, 27.46s/it]

Val Loss: 6.4436 - Val Accuracy: 0.9302



Training:   0%|          | 0/79 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/79 [00:01<02:24,  1.85s/it][A
Training:   4%|▍         | 3/79 [00:01<00:39,  1.90it/s][A
Training:   6%|▋         | 5/79 [00:03<00:39,  1.89it/s][A
Training:   9%|▉         | 7/79 [00:03<00:24,  2.97it/s][A
Training:  11%|█▏        | 9/79 [00:04<00:27,  2.55it/s][A
Training:  14%|█▍        | 11/79 [00:04<00:18,  3.66it/s][A
Training:  16%|█▋        | 13/79 [00:05<00:21,  3.02it/s][A
Training:  19%|█▉        | 15/79 [00:05<00:15,  4.09it/s][A
Training:  22%|██▏       | 17/79 [00:06<00:20,  3.05it/s][A
Training:  24%|██▍       | 19/79 [00:06<00:15,  3.94it/s][A
Training:  27%|██▋       | 21/79 [00:07<00:19,  3.00it/s][A
Training:  29%|██▉       | 23/79 [00:07<00:14,  3.98it/s][A
Training:  32%|███▏      | 25/79 [00:08<00:17,  3.04it/s][A
Training:  34%|███▍      | 27/79 [00:08<00:12,  4.05it/s][A
Training:  37%|███▋      | 29/79 [00:09<00:14,  3.40it/s][A
Training:  39%|███▉      | 31/79 [00:

Epoch: 59/76 - Loss: 4.8814 - Accuracy: 0.9256



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:01<00:13,  1.55s/it][A
 40%|████      | 4/10 [00:01<00:01,  3.08it/s][A
 60%|██████    | 6/10 [00:02<00:01,  2.63it/s][A
100%|██████████| 10/10 [00:03<00:00,  2.65it/s][A
Epochs:  78%|███████▊  | 59/76 [27:16<07:45, 27.37s/it]

Val Loss: 4.2708 - Val Accuracy: 0.9199



Training:   0%|          | 0/79 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/79 [00:01<02:03,  1.59s/it][A
Training:   5%|▌         | 4/79 [00:01<00:24,  3.04it/s][A
Training:   8%|▊         | 6/79 [00:02<00:30,  2.38it/s][A
Training:  10%|█         | 8/79 [00:02<00:20,  3.44it/s][A
Training:  13%|█▎        | 10/79 [00:04<00:27,  2.47it/s][A
Training:  16%|█▋        | 13/79 [00:05<00:24,  2.73it/s][A
Training:  19%|█▉        | 15/79 [00:05<00:17,  3.63it/s][A
Training:  22%|██▏       | 17/79 [00:06<00:21,  2.91it/s][A
Training:  24%|██▍       | 19/79 [00:06<00:15,  3.87it/s][A
Training:  27%|██▋       | 21/79 [00:07<00:20,  2.90it/s][A
Training:  29%|██▉       | 23/79 [00:07<00:14,  3.88it/s][A
Training:  32%|███▏      | 25/79 [00:08<00:17,  3.02it/s][A
Training:  35%|███▌      | 28/79 [00:08<00:11,  4.60it/s][A
Training:  38%|███▊      | 30/79 [00:09<00:14,  3.44it/s][A
Training:  42%|████▏     | 33/79 [00:10<00:14,  3.18it/s][A
Training:  44%|████▍     | 35/79 [00

Epoch: 60/76 - Loss: 6.9676 - Accuracy: 0.9289



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:01<00:15,  1.70s/it][A
 30%|███       | 3/10 [00:01<00:03,  1.98it/s][A
 50%|█████     | 5/10 [00:02<00:02,  2.15it/s][A
 60%|██████    | 6/10 [00:02<00:01,  2.72it/s][A
 70%|███████   | 7/10 [00:03<00:01,  2.93it/s][A
100%|██████████| 10/10 [00:03<00:00,  2.50it/s][A
Epochs:  79%|███████▉  | 60/76 [27:42<07:15, 27.19s/it]

Val Loss: 7.4368 - Val Accuracy: 0.9348



Training:   0%|          | 0/79 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/79 [00:01<01:58,  1.52s/it][A
Training:   6%|▋         | 5/79 [00:02<00:32,  2.26it/s][A
Training:   8%|▊         | 6/79 [00:02<00:26,  2.71it/s][A
Training:  11%|█▏        | 9/79 [00:03<00:23,  2.98it/s][A
Training:  13%|█▎        | 10/79 [00:03<00:20,  3.40it/s][A
Training:  15%|█▌        | 12/79 [00:03<00:14,  4.56it/s][A
Training:  16%|█▋        | 13/79 [00:04<00:21,  3.04it/s][A
Training:  18%|█▊        | 14/79 [00:04<00:18,  3.48it/s][A
Training:  19%|█▉        | 15/79 [00:04<00:15,  4.04it/s][A
Training:  22%|██▏       | 17/79 [00:05<00:20,  3.06it/s][A
Training:  23%|██▎       | 18/79 [00:05<00:17,  3.58it/s][A
Training:  25%|██▌       | 20/79 [00:06<00:11,  5.02it/s][A
Training:  27%|██▋       | 21/79 [00:06<00:19,  2.96it/s][A
Training:  28%|██▊       | 22/79 [00:07<00:18,  3.08it/s][A
Training:  30%|███       | 24/79 [00:07<00:12,  4.53it/s][A
Training:  32%|███▏      | 25/79 [00

Epoch: 61/76 - Loss: 4.2242 - Accuracy: 0.9273



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:01<00:14,  1.62s/it][A
 30%|███       | 3/10 [00:01<00:03,  2.09it/s][A
 50%|█████     | 5/10 [00:02<00:02,  2.24it/s][A
 80%|████████  | 8/10 [00:02<00:00,  4.23it/s][A
100%|██████████| 10/10 [00:03<00:00,  2.63it/s][A
Epochs:  80%|████████  | 61/76 [28:09<06:46, 27.12s/it]

Val Loss: 4.3684 - Val Accuracy: 0.9400



Training:   0%|          | 0/79 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/79 [00:01<02:10,  1.67s/it][A
Training:   3%|▎         | 2/79 [00:01<00:58,  1.32it/s][A
Training:   5%|▌         | 4/79 [00:01<00:24,  3.08it/s][A
Training:   6%|▋         | 5/79 [00:02<00:39,  1.89it/s][A
Training:   9%|▉         | 7/79 [00:03<00:23,  3.12it/s][A
Training:  11%|█▏        | 9/79 [00:04<00:26,  2.60it/s][A
Training:  15%|█▌        | 12/79 [00:04<00:15,  4.47it/s][A
Training:  18%|█▊        | 14/79 [00:05<00:20,  3.10it/s][A
Training:  22%|██▏       | 17/79 [00:06<00:20,  3.03it/s][A
Training:  24%|██▍       | 19/79 [00:06<00:15,  3.83it/s][A
Training:  27%|██▋       | 21/79 [00:07<00:18,  3.06it/s][A
Training:  30%|███       | 24/79 [00:07<00:12,  4.54it/s][A
Training:  33%|███▎      | 26/79 [00:08<00:15,  3.51it/s][A
Training:  35%|███▌      | 28/79 [00:08<00:12,  4.12it/s][A
Training:  37%|███▋      | 29/79 [00:09<00:17,  2.87it/s][A
Training:  39%|███▉      | 31/79 [00:0

Epoch: 62/76 - Loss: 18.9575 - Accuracy: 0.9223



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:01<00:14,  1.66s/it][A
 40%|████      | 4/10 [00:01<00:02,  2.82it/s][A
 60%|██████    | 6/10 [00:02<00:01,  2.33it/s][A
 80%|████████  | 8/10 [00:02<00:00,  3.48it/s][A
100%|██████████| 10/10 [00:03<00:00,  2.58it/s][A
Epochs:  82%|████████▏ | 62/76 [28:37<06:22, 27.32s/it]

Val Loss: 5.9458 - Val Accuracy: 0.9296



Training:   0%|          | 0/79 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/79 [00:01<01:47,  1.38s/it][A
Training:   3%|▎         | 2/79 [00:01<00:52,  1.48it/s][A
Training:   5%|▌         | 4/79 [00:01<00:22,  3.36it/s][A
Training:   6%|▋         | 5/79 [00:02<00:37,  1.95it/s][A
Training:  10%|█         | 8/79 [00:02<00:19,  3.71it/s][A
Training:  11%|█▏        | 9/79 [00:03<00:25,  2.74it/s][A
Training:  13%|█▎        | 10/79 [00:03<00:21,  3.19it/s][A
Training:  15%|█▌        | 12/79 [00:03<00:14,  4.57it/s][A
Training:  16%|█▋        | 13/79 [00:04<00:22,  2.90it/s][A
Training:  18%|█▊        | 14/79 [00:04<00:19,  3.28it/s][A
Training:  20%|██        | 16/79 [00:05<00:14,  4.44it/s][A
Training:  22%|██▏       | 17/79 [00:06<00:23,  2.65it/s][A
Training:  23%|██▎       | 18/79 [00:06<00:20,  2.91it/s][A
Training:  25%|██▌       | 20/79 [00:06<00:13,  4.40it/s][A
Training:  27%|██▋       | 21/79 [00:07<00:18,  3.15it/s][A
Training:  28%|██▊       | 22/79 [00:0

Epoch: 63/76 - Loss: 4.8037 - Accuracy: 0.9249



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:01<00:14,  1.67s/it][A
 30%|███       | 3/10 [00:01<00:03,  2.06it/s][A
 50%|█████     | 5/10 [00:02<00:02,  1.93it/s][A
 70%|███████   | 7/10 [00:03<00:00,  3.05it/s][A
100%|██████████| 10/10 [00:04<00:00,  2.45it/s][A
Epochs:  83%|████████▎ | 63/76 [29:04<05:53, 27.21s/it]

Val Loss: 11.3879 - Val Accuracy: 0.9278



Training:   0%|          | 0/79 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/79 [00:02<02:36,  2.00s/it][A
Training:   4%|▍         | 3/79 [00:02<00:42,  1.79it/s][A
Training:   6%|▋         | 5/79 [00:03<00:41,  1.80it/s][A
Training:  10%|█         | 8/79 [00:03<00:20,  3.42it/s][A
Training:  13%|█▎        | 10/79 [00:04<00:26,  2.61it/s][A
Training:  15%|█▌        | 12/79 [00:04<00:19,  3.51it/s][A
Training:  16%|█▋        | 13/79 [00:05<00:25,  2.55it/s][A
Training:  19%|█▉        | 15/79 [00:05<00:17,  3.59it/s][A
Training:  22%|██▏       | 17/79 [00:06<00:20,  3.08it/s][A
Training:  25%|██▌       | 20/79 [00:06<00:12,  4.73it/s][A
Training:  28%|██▊       | 22/79 [00:07<00:17,  3.32it/s][A
Training:  30%|███       | 24/79 [00:07<00:12,  4.35it/s][A
Training:  33%|███▎      | 26/79 [00:08<00:15,  3.33it/s][A
Training:  34%|███▍      | 27/79 [00:09<00:15,  3.41it/s][A
Training:  37%|███▋      | 29/79 [00:09<00:16,  3.11it/s][A
Training:  39%|███▉      | 31/79 [00

Epoch: 64/76 - Loss: 7.1800 - Accuracy: 0.9274



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:01<00:13,  1.48s/it][A
 50%|█████     | 5/10 [00:02<00:02,  2.26it/s][A
 60%|██████    | 6/10 [00:02<00:01,  2.75it/s][A
100%|██████████| 10/10 [00:03<00:00,  2.68it/s][A
Epochs:  84%|████████▍ | 64/76 [29:31<05:25, 27.16s/it]

Val Loss: 5.3891 - Val Accuracy: 0.9109



Training:   0%|          | 0/79 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/79 [00:01<01:44,  1.35s/it][A
Training:   4%|▍         | 3/79 [00:01<00:30,  2.49it/s][A
Training:   6%|▋         | 5/79 [00:02<00:31,  2.37it/s][A
Training:  10%|█         | 8/79 [00:02<00:16,  4.21it/s][A
Training:  11%|█▏        | 9/79 [00:03<00:25,  2.72it/s][A
Training:  14%|█▍        | 11/79 [00:03<00:17,  3.90it/s][A
Training:  15%|█▌        | 12/79 [00:03<00:16,  4.13it/s][A
Training:  16%|█▋        | 13/79 [00:04<00:21,  3.08it/s][A
Training:  19%|█▉        | 15/79 [00:04<00:16,  3.94it/s][A
Training:  20%|██        | 16/79 [00:04<00:14,  4.27it/s][A
Training:  22%|██▏       | 17/79 [00:05<00:20,  3.07it/s][A
Training:  24%|██▍       | 19/79 [00:05<00:16,  3.74it/s][A
Training:  25%|██▌       | 20/79 [00:05<00:14,  4.15it/s][A
Training:  27%|██▋       | 21/79 [00:06<00:19,  2.94it/s][A
Training:  29%|██▉       | 23/79 [00:07<00:15,  3.56it/s][A
Training:  32%|███▏      | 25/79 [00:

Epoch: 65/76 - Loss: 3.7387 - Accuracy: 0.9252



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:01<00:13,  1.47s/it][A
 40%|████      | 4/10 [00:01<00:01,  3.06it/s][A
 60%|██████    | 6/10 [00:02<00:01,  2.31it/s][A
 80%|████████  | 8/10 [00:02<00:00,  3.40it/s][A
100%|██████████| 10/10 [00:03<00:00,  2.58it/s][A
Epochs:  86%|████████▌ | 65/76 [29:57<04:55, 26.89s/it]

Val Loss: 7.7888 - Val Accuracy: 0.8667



Training:   0%|          | 0/79 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/79 [00:01<02:16,  1.75s/it][A
Training:   3%|▎         | 2/79 [00:02<01:06,  1.16it/s][A
Training:   6%|▋         | 5/79 [00:02<00:30,  2.39it/s][A
Training:   8%|▊         | 6/79 [00:02<00:27,  2.64it/s][A
Training:  11%|█▏        | 9/79 [00:03<00:19,  3.54it/s][A
Training:  13%|█▎        | 10/79 [00:04<00:21,  3.17it/s][A
Training:  15%|█▌        | 12/79 [00:04<00:15,  4.42it/s][A
Training:  16%|█▋        | 13/79 [00:04<00:16,  3.96it/s][A
Training:  18%|█▊        | 14/79 [00:05<00:22,  2.93it/s][A
Training:  19%|█▉        | 15/79 [00:05<00:18,  3.54it/s][A
Training:  22%|██▏       | 17/79 [00:05<00:17,  3.64it/s][A
Training:  23%|██▎       | 18/79 [00:06<00:19,  3.10it/s][A
Training:  25%|██▌       | 20/79 [00:06<00:12,  4.55it/s][A
Training:  27%|██▋       | 21/79 [00:06<00:16,  3.53it/s][A
Training:  28%|██▊       | 22/79 [00:07<00:19,  2.92it/s][A
Training:  32%|███▏      | 25/79 [00:

Epoch: 66/76 - Loss: 6.5306 - Accuracy: 0.9254



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:01<00:12,  1.39s/it][A
 20%|██        | 2/10 [00:01<00:05,  1.50it/s][A
 40%|████      | 4/10 [00:01<00:01,  3.40it/s][A
 50%|█████     | 5/10 [00:02<00:02,  2.28it/s][A
 60%|██████    | 6/10 [00:02<00:01,  2.90it/s][A
 70%|███████   | 7/10 [00:02<00:00,  3.60it/s][A
100%|██████████| 10/10 [00:03<00:00,  2.70it/s][A
Epochs:  87%|████████▋ | 66/76 [30:25<04:30, 27.07s/it]

Val Loss: 10.8177 - Val Accuracy: 0.9301



Training:   0%|          | 0/79 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/79 [00:01<01:56,  1.49s/it][A
Training:   3%|▎         | 2/79 [00:01<00:54,  1.41it/s][A
Training:   6%|▋         | 5/79 [00:02<00:34,  2.13it/s][A
Training:   9%|▉         | 7/79 [00:02<00:21,  3.30it/s][A
Training:  11%|█▏        | 9/79 [00:03<00:27,  2.54it/s][A
Training:  14%|█▍        | 11/79 [00:04<00:19,  3.45it/s][A
Training:  16%|█▋        | 13/79 [00:05<00:24,  2.68it/s][A
Training:  19%|█▉        | 15/79 [00:05<00:17,  3.63it/s][A
Training:  22%|██▏       | 17/79 [00:06<00:21,  2.91it/s][A
Training:  24%|██▍       | 19/79 [00:06<00:15,  3.90it/s][A
Training:  27%|██▋       | 21/79 [00:07<00:18,  3.22it/s][A
Training:  29%|██▉       | 23/79 [00:07<00:13,  4.15it/s][A
Training:  32%|███▏      | 25/79 [00:08<00:18,  2.99it/s][A
Training:  34%|███▍      | 27/79 [00:08<00:13,  3.95it/s][A
Training:  37%|███▋      | 29/79 [00:09<00:17,  2.86it/s][A
Training:  39%|███▉      | 31/79 [00:

Epoch: 67/76 - Loss: 5.4101 - Accuracy: 0.9284



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:01<00:14,  1.64s/it][A
 40%|████      | 4/10 [00:01<00:02,  2.90it/s][A
 60%|██████    | 6/10 [00:02<00:01,  2.52it/s][A
100%|██████████| 10/10 [00:03<00:00,  2.59it/s][A
Epochs:  88%|████████▊ | 67/76 [30:52<04:04, 27.13s/it]

Val Loss: 2.7366 - Val Accuracy: 0.9327



Training:   0%|          | 0/79 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/79 [00:01<02:10,  1.67s/it][A
Training:   3%|▎         | 2/79 [00:01<00:59,  1.30it/s][A
Training:   6%|▋         | 5/79 [00:02<00:32,  2.26it/s][A
Training:   9%|▉         | 7/79 [00:02<00:20,  3.46it/s][A
Training:  11%|█▏        | 9/79 [00:03<00:24,  2.87it/s][A
Training:  13%|█▎        | 10/79 [00:03<00:21,  3.28it/s][A
Training:  16%|█▋        | 13/79 [00:04<00:20,  3.28it/s][A
Training:  18%|█▊        | 14/79 [00:05<00:21,  3.02it/s][A
Training:  20%|██        | 16/79 [00:05<00:15,  4.06it/s][A
Training:  22%|██▏       | 17/79 [00:05<00:18,  3.31it/s][A
Training:  23%|██▎       | 18/79 [00:06<00:18,  3.25it/s][A
Training:  24%|██▍       | 19/79 [00:06<00:15,  3.79it/s][A
Training:  27%|██▋       | 21/79 [00:06<00:14,  3.96it/s][A
Training:  28%|██▊       | 22/79 [00:07<00:17,  3.33it/s][A
Training:  30%|███       | 24/79 [00:07<00:11,  4.87it/s][A
Training:  32%|███▏      | 25/79 [00:

Epoch: 68/76 - Loss: 10.9059 - Accuracy: 0.9226



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:01<00:11,  1.33s/it][A
 20%|██        | 2/10 [00:01<00:05,  1.53it/s][A
 50%|█████     | 5/10 [00:02<00:01,  2.61it/s][A
 60%|██████    | 6/10 [00:02<00:01,  2.94it/s][A
100%|██████████| 10/10 [00:03<00:00,  2.93it/s][A
Epochs:  89%|████████▉ | 68/76 [31:19<03:37, 27.13s/it]

Val Loss: 4.4502 - Val Accuracy: 0.9260



Training:   0%|          | 0/79 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/79 [00:01<02:01,  1.56s/it][A
Training:   4%|▍         | 3/79 [00:01<00:35,  2.13it/s][A
Training:   6%|▋         | 5/79 [00:02<00:36,  2.00it/s][A
Training:   9%|▉         | 7/79 [00:02<00:23,  3.04it/s][A
Training:  11%|█▏        | 9/79 [00:04<00:27,  2.51it/s][A
Training:  15%|█▌        | 12/79 [00:04<00:16,  4.09it/s][A
Training:  16%|█▋        | 13/79 [00:05<00:24,  2.67it/s][A
Training:  18%|█▊        | 14/79 [00:05<00:21,  3.09it/s][A
Training:  19%|█▉        | 15/79 [00:05<00:17,  3.65it/s][A
Training:  20%|██        | 16/79 [00:05<00:14,  4.29it/s][A
Training:  22%|██▏       | 17/79 [00:06<00:22,  2.71it/s][A
Training:  23%|██▎       | 18/79 [00:06<00:19,  3.14it/s][A
Training:  25%|██▌       | 20/79 [00:06<00:12,  4.71it/s][A
Training:  27%|██▋       | 21/79 [00:07<00:22,  2.61it/s][A
Training:  32%|███▏      | 25/79 [00:08<00:18,  2.95it/s][A
Training:  34%|███▍      | 27/79 [00:

Epoch: 69/76 - Loss: 5.4417 - Accuracy: 0.9281



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:01<00:14,  1.57s/it][A
 40%|████      | 4/10 [00:01<00:01,  3.05it/s][A
 60%|██████    | 6/10 [00:02<00:01,  2.43it/s][A
 80%|████████  | 8/10 [00:02<00:00,  3.61it/s][A
100%|██████████| 10/10 [00:03<00:00,  2.52it/s][A
Epochs:  91%|█████████ | 69/76 [31:48<03:12, 27.50s/it]

Val Loss: 6.5547 - Val Accuracy: 0.9193



Training:   0%|          | 0/79 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/79 [00:01<01:53,  1.45s/it][A
Training:   3%|▎         | 2/79 [00:01<00:54,  1.42it/s][A
Training:   5%|▌         | 4/79 [00:01<00:22,  3.35it/s][A
Training:   6%|▋         | 5/79 [00:02<00:34,  2.17it/s][A
Training:   8%|▊         | 6/79 [00:02<00:28,  2.53it/s][A
Training:  11%|█▏        | 9/79 [00:03<00:24,  2.81it/s][A
Training:  13%|█▎        | 10/79 [00:04<00:23,  2.98it/s][A
Training:  16%|█▋        | 13/79 [00:04<00:21,  3.12it/s][A
Training:  18%|█▊        | 14/79 [00:05<00:20,  3.17it/s][A
Training:  19%|█▉        | 15/79 [00:05<00:17,  3.63it/s][A
Training:  20%|██        | 16/79 [00:05<00:14,  4.24it/s][A
Training:  22%|██▏       | 17/79 [00:06<00:22,  2.74it/s][A
Training:  23%|██▎       | 18/79 [00:06<00:20,  3.03it/s][A
Training:  27%|██▋       | 21/79 [00:07<00:20,  2.85it/s][A
Training:  29%|██▉       | 23/79 [00:07<00:14,  3.84it/s][A
Training:  32%|███▏      | 25/79 [00:0

Epoch: 70/76 - Loss: 4.5205 - Accuracy: 0.9287



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:01<00:13,  1.54s/it][A
 50%|█████     | 5/10 [00:02<00:02,  2.29it/s][A
 80%|████████  | 8/10 [00:02<00:00,  3.97it/s][A
100%|██████████| 10/10 [00:03<00:00,  2.82it/s][A
Epochs:  92%|█████████▏| 70/76 [32:15<02:44, 27.49s/it]

Val Loss: 13.1418 - Val Accuracy: 0.9111



Training:   0%|          | 0/79 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/79 [00:01<02:07,  1.64s/it][A
Training:   3%|▎         | 2/79 [00:01<00:57,  1.35it/s][A
Training:   5%|▌         | 4/79 [00:01<00:24,  3.09it/s][A
Training:   6%|▋         | 5/79 [00:02<00:38,  1.90it/s][A
Training:   9%|▉         | 7/79 [00:03<00:22,  3.23it/s][A
Training:  11%|█▏        | 9/79 [00:03<00:25,  2.71it/s][A
Training:  13%|█▎        | 10/79 [00:04<00:25,  2.68it/s][A
Training:  14%|█▍        | 11/79 [00:04<00:21,  3.15it/s][A
Training:  16%|█▋        | 13/79 [00:05<00:22,  2.89it/s][A
Training:  18%|█▊        | 14/79 [00:05<00:22,  2.83it/s][A
Training:  20%|██        | 16/79 [00:05<00:15,  4.04it/s][A
Training:  22%|██▏       | 17/79 [00:06<00:22,  2.78it/s][A
Training:  23%|██▎       | 18/79 [00:06<00:22,  2.68it/s][A
Training:  25%|██▌       | 20/79 [00:07<00:14,  4.07it/s][A
Training:  27%|██▋       | 21/79 [00:07<00:19,  2.98it/s][A
Training:  28%|██▊       | 22/79 [00:0

Epoch: 71/76 - Loss: 6.0694 - Accuracy: 0.9263



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:01<00:13,  1.52s/it][A
 20%|██        | 2/10 [00:01<00:05,  1.43it/s][A
 50%|█████     | 5/10 [00:02<00:01,  2.65it/s][A
 70%|███████   | 7/10 [00:02<00:00,  3.60it/s][A
100%|██████████| 10/10 [00:03<00:00,  2.74it/s][A
Epochs:  93%|█████████▎| 71/76 [32:43<02:18, 27.64s/it]

Val Loss: 5.2112 - Val Accuracy: 0.9093



Training:   0%|          | 0/79 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/79 [00:01<02:13,  1.71s/it][A
Training:   5%|▌         | 4/79 [00:01<00:26,  2.84it/s][A
Training:   8%|▊         | 6/79 [00:02<00:29,  2.44it/s][A
Training:   9%|▉         | 7/79 [00:02<00:24,  2.93it/s][A
Training:  10%|█         | 8/79 [00:03<00:20,  3.50it/s][A
Training:  11%|█▏        | 9/79 [00:04<00:32,  2.14it/s][A
Training:  14%|█▍        | 11/79 [00:04<00:20,  3.29it/s][A
Training:  16%|█▋        | 13/79 [00:05<00:22,  2.88it/s][A
Training:  19%|█▉        | 15/79 [00:05<00:15,  4.06it/s][A
Training:  22%|██▏       | 17/79 [00:06<00:20,  3.03it/s][A
Training:  23%|██▎       | 18/79 [00:06<00:18,  3.35it/s][A
Training:  27%|██▋       | 21/79 [00:07<00:18,  3.17it/s][A
Training:  28%|██▊       | 22/79 [00:07<00:17,  3.28it/s][A
Training:  29%|██▉       | 23/79 [00:07<00:14,  3.79it/s][A
Training:  32%|███▏      | 25/79 [00:08<00:17,  3.04it/s][A
Training:  33%|███▎      | 26/79 [00:0

Epoch: 72/76 - Loss: 9.5993 - Accuracy: 0.9257



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:01<00:14,  1.66s/it][A
 50%|█████     | 5/10 [00:02<00:02,  2.25it/s][A
100%|██████████| 10/10 [00:03<00:00,  2.59it/s][A
Epochs:  95%|█████████▍| 72/76 [33:11<01:50, 27.59s/it]

Val Loss: 4.3089 - Val Accuracy: 0.9322



Training:   0%|          | 0/79 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/79 [00:01<01:53,  1.45s/it][A
Training:   3%|▎         | 2/79 [00:01<00:54,  1.42it/s][A
Training:   4%|▍         | 3/79 [00:01<00:34,  2.18it/s][A
Training:   6%|▋         | 5/79 [00:02<00:29,  2.47it/s][A
Training:   8%|▊         | 6/79 [00:02<00:25,  2.86it/s][A
Training:   9%|▉         | 7/79 [00:02<00:21,  3.39it/s][A
Training:  10%|█         | 8/79 [00:03<00:18,  3.93it/s][A
Training:  11%|█▏        | 9/79 [00:03<00:26,  2.61it/s][A
Training:  13%|█▎        | 10/79 [00:03<00:21,  3.18it/s][A
Training:  14%|█▍        | 11/79 [00:04<00:18,  3.74it/s][A
Training:  15%|█▌        | 12/79 [00:04<00:19,  3.44it/s][A
Training:  16%|█▋        | 13/79 [00:04<00:23,  2.78it/s][A
Training:  19%|█▉        | 15/79 [00:05<00:14,  4.32it/s][A
Training:  20%|██        | 16/79 [00:05<00:18,  3.40it/s][A
Training:  22%|██▏       | 17/79 [00:05<00:19,  3.15it/s][A
Training:  23%|██▎       | 18/79 [00:06<

Epoch: 73/76 - Loss: 5.1728 - Accuracy: 0.9250



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:01<00:14,  1.62s/it][A
 40%|████      | 4/10 [00:01<00:02,  2.99it/s][A
 60%|██████    | 6/10 [00:02<00:01,  2.49it/s][A
 80%|████████  | 8/10 [00:02<00:00,  3.73it/s][A
100%|██████████| 10/10 [00:03<00:00,  2.72it/s][A
Epochs:  96%|█████████▌| 73/76 [33:38<01:22, 27.57s/it]

Val Loss: 2.8154 - Val Accuracy: 0.9075



Training:   0%|          | 0/79 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/79 [00:01<01:49,  1.40s/it][A
Training:   4%|▍         | 3/79 [00:01<00:34,  2.23it/s][A
Training:   5%|▌         | 4/79 [00:01<00:28,  2.62it/s][A
Training:   6%|▋         | 5/79 [00:02<00:37,  1.95it/s][A
Training:   9%|▉         | 7/79 [00:02<00:22,  3.22it/s][A
Training:  10%|█         | 8/79 [00:03<00:22,  3.23it/s][A
Training:  11%|█▏        | 9/79 [00:03<00:26,  2.61it/s][A
Training:  14%|█▍        | 11/79 [00:03<00:17,  3.88it/s][A
Training:  15%|█▌        | 12/79 [00:04<00:19,  3.51it/s][A
Training:  16%|█▋        | 13/79 [00:04<00:22,  2.88it/s][A
Training:  18%|█▊        | 14/79 [00:05<00:20,  3.11it/s][A
Training:  20%|██        | 16/79 [00:05<00:17,  3.60it/s][A
Training:  22%|██▏       | 17/79 [00:05<00:19,  3.14it/s][A
Training:  23%|██▎       | 18/79 [00:06<00:20,  3.04it/s][A
Training:  24%|██▍       | 19/79 [00:06<00:16,  3.64it/s][A
Training:  25%|██▌       | 20/79 [00:06

Epoch: 74/76 - Loss: 18.2173 - Accuracy: 0.9100



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:01<00:15,  1.70s/it][A
 30%|███       | 3/10 [00:01<00:03,  2.07it/s][A
 50%|█████     | 5/10 [00:02<00:02,  2.01it/s][A
100%|██████████| 10/10 [00:03<00:00,  2.65it/s][A
Epochs:  97%|█████████▋| 74/76 [34:06<00:55, 27.59s/it]

Val Loss: 13.7212 - Val Accuracy: 0.9232



Training:   0%|          | 0/79 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/79 [00:01<02:13,  1.71s/it][A
Training:   3%|▎         | 2/79 [00:01<01:04,  1.20it/s][A
Training:   6%|▋         | 5/79 [00:02<00:33,  2.21it/s][A
Training:   8%|▊         | 6/79 [00:03<00:28,  2.59it/s][A
Training:  10%|█         | 8/79 [00:03<00:18,  3.88it/s][A
Training:  11%|█▏        | 9/79 [00:03<00:25,  2.76it/s][A
Training:  13%|█▎        | 10/79 [00:04<00:22,  3.09it/s][A
Training:  15%|█▌        | 12/79 [00:04<00:14,  4.59it/s][A
Training:  16%|█▋        | 13/79 [00:04<00:21,  3.13it/s][A
Training:  18%|█▊        | 14/79 [00:05<00:21,  3.04it/s][A
Training:  20%|██        | 16/79 [00:05<00:14,  4.37it/s][A
Training:  22%|██▏       | 17/79 [00:06<00:22,  2.73it/s][A
Training:  23%|██▎       | 18/79 [00:06<00:20,  2.93it/s][A
Training:  25%|██▌       | 20/79 [00:06<00:13,  4.36it/s][A
Training:  27%|██▋       | 21/79 [00:07<00:21,  2.73it/s][A
Training:  28%|██▊       | 22/79 [00:0

Epoch: 75/76 - Loss: 7.9578 - Accuracy: 0.9220



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:01<00:13,  1.55s/it][A
 30%|███       | 3/10 [00:01<00:03,  2.26it/s][A
 50%|█████     | 5/10 [00:02<00:02,  2.21it/s][A
 60%|██████    | 6/10 [00:02<00:01,  2.64it/s][A
 80%|████████  | 8/10 [00:02<00:00,  4.09it/s][A
 90%|█████████ | 9/10 [00:03<00:00,  3.05it/s][A
100%|██████████| 10/10 [00:03<00:00,  2.70it/s][A
Epochs:  99%|█████████▊| 75/76 [34:34<00:27, 27.64s/it]

Val Loss: 6.5724 - Val Accuracy: 0.8618



Training:   0%|          | 0/79 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/79 [00:01<02:02,  1.57s/it][A
Training:   4%|▍         | 3/79 [00:01<00:42,  1.80it/s][A
Training:   6%|▋         | 5/79 [00:02<00:34,  2.13it/s][A
Training:   8%|▊         | 6/79 [00:02<00:27,  2.66it/s][A
Training:   9%|▉         | 7/79 [00:03<00:25,  2.83it/s][A
Training:  11%|█▏        | 9/79 [00:03<00:26,  2.63it/s][A
Training:  14%|█▍        | 11/79 [00:04<00:19,  3.51it/s][A
Training:  16%|█▋        | 13/79 [00:05<00:21,  3.02it/s][A
Training:  19%|█▉        | 15/79 [00:05<00:19,  3.35it/s][A
Training:  20%|██        | 16/79 [00:05<00:16,  3.81it/s][A
Training:  22%|██▏       | 17/79 [00:06<00:20,  3.06it/s][A
Training:  23%|██▎       | 18/79 [00:06<00:16,  3.65it/s][A
Training:  24%|██▍       | 19/79 [00:06<00:15,  3.98it/s][A
Training:  27%|██▋       | 21/79 [00:07<00:21,  2.74it/s][A
Training:  29%|██▉       | 23/79 [00:07<00:15,  3.64it/s][A
Training:  32%|███▏      | 25/79 [00:0

Epoch: 76/76 - Loss: 9.3747 - Accuracy: 0.9249



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:01<00:12,  1.37s/it][A
 20%|██        | 2/10 [00:01<00:05,  1.54it/s][A
 50%|█████     | 5/10 [00:02<00:02,  2.31it/s][A
 60%|██████    | 6/10 [00:02<00:01,  2.58it/s][A
100%|██████████| 10/10 [00:03<00:00,  2.71it/s][A
Epochs: 100%|██████████| 76/76 [35:00<00:00, 27.64s/it]


Val Loss: 15.3394 - Val Accuracy: 0.9033


[32m[I 2023-12-14 23:20:40,653][0m Trial 2 finished with value: 0.9033117294311523 and parameters: {'loss_learning_rate': 0.00043085489957524003, 'learning_rate': 0.06802471398172366, 'weight_decay': 0.0004464693466243797, 'epsilon': 4.952031792291727e-09, 'batch_size': 177, 'epochs': 76}. Best is trial 1 with value: 0.9292426705360413.[0m


Learning rate for Loss: 0.0008525339180252597
Learning rate: 0.0006513527804929251
Weight decay: 0.0038208248001045425
Epsilon: 3.3362510582155838e-09
Batch size: 237
Number of epochs: 37


Epochs:   0%|          | 0/37 [00:00<?, ?it/s]
Training:   0%|          | 0/59 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/59 [00:02<01:57,  2.02s/it][A
Training:   3%|▎         | 2/59 [00:02<00:51,  1.11it/s][A
Training:   5%|▌         | 3/59 [00:02<00:33,  1.68it/s][A
Training:   8%|▊         | 5/59 [00:03<00:31,  1.73it/s][A
Training:  10%|█         | 6/59 [00:03<00:26,  1.98it/s][A
Training:  12%|█▏        | 7/59 [00:03<00:21,  2.45it/s][A
Training:  14%|█▎        | 8/59 [00:04<00:16,  3.14it/s][A
Training:  15%|█▌        | 9/59 [00:05<00:29,  1.71it/s][A
Training:  17%|█▋        | 10/59 [00:05<00:23,  2.13it/s][A
Training:  19%|█▊        | 11/59 [00:05<00:17,  2.67it/s][A
Training:  20%|██        | 12/59 [00:05<00:13,  3.38it/s][A
Training:  22%|██▏       | 13/59 [00:06<00:23,  1.93it/s][A
Training:  24%|██▎       | 14/59 [00:07<00:20,  2.23it/s][A
Training:  29%|██▉       | 17/59 [00:08<00:17,  2.42it/s][A
Training:  31%|███       | 18/59 [00:08<00:16,  2.53it/

Epoch: 1/37 - Loss: 12.3111 - Accuracy: 0.7720



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:13,  1.94s/it][A
 38%|███▊      | 3/8 [00:02<00:02,  1.83it/s][A
 62%|██████▎   | 5/8 [00:03<00:01,  1.82it/s][A
100%|██████████| 8/8 [00:03<00:00,  2.33it/s][A
Epochs:   3%|▎         | 1/37 [00:27<16:42, 27.85s/it]

Val Loss: 6.6021 - Val Accuracy: 0.8755



Training:   0%|          | 0/59 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/59 [00:02<02:06,  2.19s/it][A
Training:   3%|▎         | 2/59 [00:02<00:54,  1.04it/s][A
Training:   5%|▌         | 3/59 [00:02<00:31,  1.75it/s][A
Training:   8%|▊         | 5/59 [00:03<00:31,  1.69it/s][A
Training:  12%|█▏        | 7/59 [00:03<00:19,  2.61it/s][A
Training:  14%|█▎        | 8/59 [00:04<00:17,  2.91it/s][A
Training:  15%|█▌        | 9/59 [00:05<00:26,  1.90it/s][A
Training:  19%|█▊        | 11/59 [00:05<00:16,  2.83it/s][A
Training:  20%|██        | 12/59 [00:05<00:16,  2.94it/s][A
Training:  22%|██▏       | 13/59 [00:06<00:22,  2.04it/s][A
Training:  25%|██▌       | 15/59 [00:06<00:15,  2.76it/s][A
Training:  27%|██▋       | 16/59 [00:07<00:13,  3.15it/s][A
Training:  29%|██▉       | 17/59 [00:08<00:21,  1.95it/s][A
Training:  31%|███       | 18/59 [00:08<00:16,  2.46it/s][A
Training:  34%|███▍      | 20/59 [00:08<00:14,  2.76it/s][A
Training:  36%|███▌      | 21/59 [00:09

Epoch: 2/37 - Loss: 4.8908 - Accuracy: 0.8933



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:13,  1.90s/it][A
 25%|██▌       | 2/8 [00:02<00:05,  1.09it/s][A
 50%|█████     | 4/8 [00:02<00:01,  2.53it/s][A
100%|██████████| 8/8 [00:03<00:00,  2.25it/s][A
Epochs:   5%|▌         | 2/37 [00:55<16:05, 27.59s/it]

Val Loss: 3.9133 - Val Accuracy: 0.8961



Training:   0%|          | 0/59 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/59 [00:01<01:49,  1.89s/it][A
Training:   5%|▌         | 3/59 [00:02<00:31,  1.80it/s][A
Training:   8%|▊         | 5/59 [00:03<00:34,  1.57it/s][A
Training:  12%|█▏        | 7/59 [00:03<00:20,  2.54it/s][A
Training:  15%|█▌        | 9/59 [00:05<00:25,  1.96it/s][A
Training:  19%|█▊        | 11/59 [00:05<00:17,  2.82it/s][A
Training:  22%|██▏       | 13/59 [00:06<00:21,  2.12it/s][A
Training:  24%|██▎       | 14/59 [00:06<00:18,  2.46it/s][A
Training:  27%|██▋       | 16/59 [00:06<00:13,  3.21it/s][A
Training:  29%|██▉       | 17/59 [00:08<00:20,  2.02it/s][A
Training:  31%|███       | 18/59 [00:08<00:17,  2.38it/s][A
Training:  34%|███▍      | 20/59 [00:08<00:13,  2.99it/s][A
Training:  36%|███▌      | 21/59 [00:09<00:18,  2.09it/s][A
Training:  37%|███▋      | 22/59 [00:09<00:14,  2.53it/s][A
Training:  39%|███▉      | 23/59 [00:09<00:11,  3.12it/s][A
Training:  41%|████      | 24/59 [00:

Epoch: 3/37 - Loss: 3.4142 - Accuracy: 0.9163



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:12,  1.79s/it][A
 25%|██▌       | 2/8 [00:01<00:04,  1.22it/s][A
 38%|███▊      | 3/8 [00:02<00:02,  1.90it/s][A
 62%|██████▎   | 5/8 [00:03<00:01,  1.89it/s][A
100%|██████████| 8/8 [00:03<00:00,  2.26it/s][A
Epochs:   8%|▊         | 3/37 [01:22<15:35, 27.53s/it]

Val Loss: 3.0752 - Val Accuracy: 0.9165



Training:   0%|          | 0/59 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/59 [00:02<01:57,  2.03s/it][A
Training:   5%|▌         | 3/59 [00:02<00:31,  1.75it/s][A
Training:   8%|▊         | 5/59 [00:03<00:37,  1.46it/s][A
Training:  12%|█▏        | 7/59 [00:03<00:22,  2.31it/s][A
Training:  14%|█▎        | 8/59 [00:04<00:18,  2.80it/s][A
Training:  15%|█▌        | 9/59 [00:05<00:28,  1.76it/s][A
Training:  17%|█▋        | 10/59 [00:05<00:22,  2.20it/s][A
Training:  20%|██        | 12/59 [00:05<00:13,  3.48it/s][A
Training:  22%|██▏       | 13/59 [00:06<00:22,  2.08it/s][A
Training:  25%|██▌       | 15/59 [00:06<00:13,  3.19it/s][A
Training:  29%|██▉       | 17/59 [00:08<00:19,  2.20it/s][A
Training:  31%|███       | 18/59 [00:08<00:15,  2.62it/s][A
Training:  32%|███▏      | 19/59 [00:08<00:12,  3.15it/s][A
Training:  34%|███▍      | 20/59 [00:08<00:10,  3.74it/s][A
Training:  36%|███▌      | 21/59 [00:09<00:18,  2.03it/s][A
Training:  37%|███▋      | 22/59 [00:0

Epoch: 4/37 - Loss: 2.8336 - Accuracy: 0.9281



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:02<00:14,  2.04s/it][A
 50%|█████     | 4/8 [00:02<00:01,  2.38it/s][A
100%|██████████| 8/8 [00:03<00:00,  2.18it/s][A
Epochs:  11%|█         | 4/37 [01:49<14:55, 27.15s/it]

Val Loss: 2.7857 - Val Accuracy: 0.9145



Training:   0%|          | 0/59 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/59 [00:01<01:47,  1.86s/it][A
Training:   5%|▌         | 3/59 [00:02<00:29,  1.87it/s][A
Training:   7%|▋         | 4/59 [00:02<00:21,  2.56it/s][A
Training:   8%|▊         | 5/59 [00:03<00:33,  1.59it/s][A
Training:  12%|█▏        | 7/59 [00:03<00:18,  2.81it/s][A
Training:  14%|█▎        | 8/59 [00:03<00:17,  2.97it/s][A
Training:  15%|█▌        | 9/59 [00:04<00:30,  1.64it/s][A
Training:  19%|█▊        | 11/59 [00:05<00:18,  2.65it/s][A
Training:  20%|██        | 12/59 [00:05<00:14,  3.21it/s][A
Training:  22%|██▏       | 13/59 [00:06<00:26,  1.73it/s][A
Training:  25%|██▌       | 15/59 [00:06<00:15,  2.77it/s][A
Training:  29%|██▉       | 17/59 [00:08<00:21,  1.99it/s][A
Training:  31%|███       | 18/59 [00:08<00:17,  2.38it/s][A
Training:  34%|███▍      | 20/59 [00:08<00:11,  3.51it/s][A
Training:  37%|███▋      | 22/59 [00:09<00:15,  2.31it/s][A
Training:  41%|████      | 24/59 [00:10

Epoch: 5/37 - Loss: 2.5754 - Accuracy: 0.9327



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:12,  1.83s/it][A
 50%|█████     | 4/8 [00:02<00:01,  2.51it/s][A
 62%|██████▎   | 5/8 [00:03<00:01,  1.63it/s][A
100%|██████████| 8/8 [00:03<00:00,  2.26it/s][A
Epochs:  14%|█▎        | 5/37 [02:16<14:30, 27.21s/it]

Val Loss: 2.5296 - Val Accuracy: 0.9360



Training:   0%|          | 0/59 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/59 [00:01<01:53,  1.95s/it][A
Training:   3%|▎         | 2/59 [00:02<00:49,  1.16it/s][A
Training:   7%|▋         | 4/59 [00:02<00:20,  2.74it/s][A
Training:   8%|▊         | 5/59 [00:03<00:35,  1.50it/s][A
Training:  12%|█▏        | 7/59 [00:03<00:19,  2.63it/s][A
Training:  15%|█▌        | 9/59 [00:05<00:27,  1.82it/s][A
Training:  20%|██        | 12/59 [00:05<00:15,  3.11it/s][A
Training:  24%|██▎       | 14/59 [00:07<00:20,  2.15it/s][A
Training:  27%|██▋       | 16/59 [00:07<00:14,  2.91it/s][A
Training:  31%|███       | 18/59 [00:08<00:17,  2.30it/s][A
Training:  34%|███▍      | 20/59 [00:08<00:12,  3.10it/s][A
Training:  36%|███▌      | 21/59 [00:09<00:19,  1.96it/s][A
Training:  41%|████      | 24/59 [00:10<00:10,  3.27it/s][A
Training:  44%|████▍     | 26/59 [00:11<00:13,  2.39it/s][A
Training:  46%|████▌     | 27/59 [00:11<00:11,  2.73it/s][A
Training:  47%|████▋     | 28/59 [00:1

Epoch: 6/37 - Loss: 2.4489 - Accuracy: 0.9312



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:11,  1.65s/it][A
 25%|██▌       | 2/8 [00:01<00:04,  1.20it/s][A
 62%|██████▎   | 5/8 [00:03<00:01,  1.88it/s][A
100%|██████████| 8/8 [00:03<00:00,  2.13it/s][A
Epochs:  16%|█▌        | 6/37 [02:44<14:08, 27.36s/it]

Val Loss: 2.3634 - Val Accuracy: 0.9378



Training:   0%|          | 0/59 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/59 [00:01<01:44,  1.80s/it][A
Training:   5%|▌         | 3/59 [00:01<00:29,  1.87it/s][A
Training:   8%|▊         | 5/59 [00:03<00:32,  1.65it/s][A
Training:  12%|█▏        | 7/59 [00:03<00:20,  2.53it/s][A
Training:  15%|█▌        | 9/59 [00:04<00:25,  1.93it/s][A
Training:  20%|██        | 12/59 [00:05<00:14,  3.26it/s][A
Training:  24%|██▎       | 14/59 [00:06<00:20,  2.22it/s][A
Training:  27%|██▋       | 16/59 [00:06<00:14,  2.93it/s][A
Training:  29%|██▉       | 17/59 [00:08<00:20,  2.01it/s][A
Training:  32%|███▏      | 19/59 [00:08<00:14,  2.74it/s][A
Training:  34%|███▍      | 20/59 [00:08<00:12,  3.16it/s][A
Training:  36%|███▌      | 21/59 [00:09<00:19,  1.95it/s][A
Training:  39%|███▉      | 23/59 [00:09<00:12,  2.84it/s][A
Training:  41%|████      | 24/59 [00:09<00:10,  3.27it/s][A
Training:  42%|████▏     | 25/59 [00:11<00:18,  1.83it/s][A
Training:  44%|████▍     | 26/59 [00:

Epoch: 7/37 - Loss: 2.4394 - Accuracy: 0.9328



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:12,  1.78s/it][A
 25%|██▌       | 2/8 [00:01<00:04,  1.23it/s][A
 38%|███▊      | 3/8 [00:02<00:02,  1.99it/s][A
 62%|██████▎   | 5/8 [00:03<00:01,  1.75it/s][A
100%|██████████| 8/8 [00:03<00:00,  2.15it/s][A
Epochs:  19%|█▉        | 7/37 [03:11<13:39, 27.31s/it]

Val Loss: 2.4795 - Val Accuracy: 0.9339



Training:   0%|          | 0/59 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/59 [00:01<01:50,  1.91s/it][A
Training:   5%|▌         | 3/59 [00:02<00:29,  1.87it/s][A
Training:   8%|▊         | 5/59 [00:03<00:30,  1.75it/s][A
Training:  12%|█▏        | 7/59 [00:03<00:18,  2.82it/s][A
Training:  15%|█▌        | 9/59 [00:04<00:25,  1.99it/s][A
Training:  19%|█▊        | 11/59 [00:05<00:17,  2.81it/s][A
Training:  20%|██        | 12/59 [00:05<00:14,  3.23it/s][A
Training:  22%|██▏       | 13/59 [00:06<00:22,  2.02it/s][A
Training:  24%|██▎       | 14/59 [00:06<00:19,  2.25it/s][A
Training:  27%|██▋       | 16/59 [00:06<00:12,  3.44it/s][A
Training:  29%|██▉       | 17/59 [00:07<00:18,  2.26it/s][A
Training:  31%|███       | 18/59 [00:08<00:21,  1.94it/s][A
Training:  34%|███▍      | 20/59 [00:08<00:13,  2.96it/s][A
Training:  36%|███▌      | 21/59 [00:09<00:16,  2.36it/s][A
Training:  37%|███▋      | 22/59 [00:09<00:17,  2.07it/s][A
Training:  41%|████      | 24/59 [00:

Epoch: 8/37 - Loss: 2.3753 - Accuracy: 0.9371



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:12,  1.82s/it][A
 38%|███▊      | 3/8 [00:01<00:02,  1.91it/s][A
100%|██████████| 8/8 [00:03<00:00,  2.21it/s][A
Epochs:  22%|██▏       | 8/37 [03:38<13:08, 27.21s/it]

Val Loss: 2.4920 - Val Accuracy: 0.9254



Training:   0%|          | 0/59 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/59 [00:01<01:54,  1.97s/it][A
Training:   3%|▎         | 2/59 [00:02<00:50,  1.13it/s][A
Training:   5%|▌         | 3/59 [00:02<00:29,  1.89it/s][A
Training:   7%|▋         | 4/59 [00:02<00:20,  2.74it/s][A
Training:   8%|▊         | 5/59 [00:03<00:37,  1.44it/s][A
Training:  10%|█         | 6/59 [00:03<00:26,  2.02it/s][A
Training:  14%|█▎        | 8/59 [00:03<00:14,  3.55it/s][A
Training:  15%|█▌        | 9/59 [00:05<00:30,  1.67it/s][A
Training:  19%|█▊        | 11/59 [00:05<00:17,  2.69it/s][A
Training:  22%|██▏       | 13/59 [00:06<00:22,  2.05it/s][A
Training:  25%|██▌       | 15/59 [00:06<00:14,  2.96it/s][A
Training:  27%|██▋       | 16/59 [00:07<00:12,  3.38it/s][A
Training:  29%|██▉       | 17/59 [00:08<00:24,  1.73it/s][A
Training:  31%|███       | 18/59 [00:08<00:19,  2.15it/s][A
Training:  34%|███▍      | 20/59 [00:08<00:11,  3.34it/s][A
Training:  37%|███▋      | 22/59 [00:10<

Epoch: 9/37 - Loss: 2.4391 - Accuracy: 0.9389



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:12,  1.77s/it][A
 38%|███▊      | 3/8 [00:01<00:02,  1.91it/s][A
 62%|██████▎   | 5/8 [00:03<00:01,  1.75it/s][A
100%|██████████| 8/8 [00:03<00:00,  2.27it/s][A
Epochs:  24%|██▍       | 9/37 [04:05<12:43, 27.28s/it]

Val Loss: 2.5282 - Val Accuracy: 0.9375



Training:   0%|          | 0/59 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/59 [00:01<01:45,  1.82s/it][A
Training:   3%|▎         | 2/59 [00:01<00:47,  1.20it/s][A
Training:   7%|▋         | 4/59 [00:02<00:19,  2.80it/s][A
Training:   8%|▊         | 5/59 [00:03<00:33,  1.60it/s][A
Training:  12%|█▏        | 7/59 [00:03<00:18,  2.75it/s][A
Training:  15%|█▌        | 9/59 [00:04<00:26,  1.92it/s][A
Training:  19%|█▊        | 11/59 [00:05<00:17,  2.82it/s][A
Training:  22%|██▏       | 13/59 [00:06<00:22,  2.03it/s][A
Training:  29%|██▉       | 17/59 [00:08<00:18,  2.31it/s][A
Training:  31%|███       | 18/59 [00:08<00:15,  2.59it/s][A
Training:  32%|███▏      | 19/59 [00:08<00:13,  2.92it/s][A
Training:  34%|███▍      | 20/59 [00:08<00:11,  3.33it/s][A
Training:  36%|███▌      | 21/59 [00:09<00:19,  2.00it/s][A
Training:  39%|███▉      | 23/59 [00:09<00:12,  2.99it/s][A
Training:  41%|████      | 24/59 [00:09<00:10,  3.48it/s][A
Training:  42%|████▏     | 25/59 [00:1

Epoch: 10/37 - Loss: 2.4060 - Accuracy: 0.9426



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:12,  1.74s/it][A
 25%|██▌       | 2/8 [00:01<00:04,  1.25it/s][A
 50%|█████     | 4/8 [00:02<00:01,  2.95it/s][A
 62%|██████▎   | 5/8 [00:03<00:01,  1.59it/s][A
100%|██████████| 8/8 [00:03<00:00,  2.23it/s][A
Epochs:  27%|██▋       | 10/37 [04:33<12:19, 27.39s/it]

Val Loss: 2.4628 - Val Accuracy: 0.9412



Training:   0%|          | 0/59 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/59 [00:01<01:48,  1.87s/it][A
Training:   5%|▌         | 3/59 [00:02<00:30,  1.81it/s][A
Training:   8%|▊         | 5/59 [00:03<00:34,  1.56it/s][A
Training:  10%|█         | 6/59 [00:03<00:27,  1.95it/s][A
Training:  15%|█▌        | 9/59 [00:04<00:22,  2.18it/s][A
Training:  17%|█▋        | 10/59 [00:05<00:21,  2.27it/s][A
Training:  20%|██        | 12/59 [00:05<00:14,  3.30it/s][A
Training:  22%|██▏       | 13/59 [00:06<00:21,  2.11it/s][A
Training:  24%|██▎       | 14/59 [00:06<00:19,  2.27it/s][A
Training:  27%|██▋       | 16/59 [00:07<00:12,  3.34it/s][A
Training:  29%|██▉       | 17/59 [00:08<00:20,  2.07it/s][A
Training:  31%|███       | 18/59 [00:08<00:17,  2.31it/s][A
Training:  34%|███▍      | 20/59 [00:08<00:11,  3.42it/s][A
Training:  36%|███▌      | 21/59 [00:09<00:17,  2.17it/s][A
Training:  37%|███▋      | 22/59 [00:10<00:16,  2.30it/s][A
Training:  41%|████      | 24/59 [00:

Epoch: 11/37 - Loss: 2.4427 - Accuracy: 0.9420



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:12,  1.79s/it][A
 38%|███▊      | 3/8 [00:01<00:02,  1.93it/s][A
 62%|██████▎   | 5/8 [00:03<00:01,  1.83it/s][A
100%|██████████| 8/8 [00:03<00:00,  2.38it/s][A
Epochs:  30%|██▉       | 11/37 [05:00<11:51, 27.35s/it]

Val Loss: 2.4469 - Val Accuracy: 0.9401



Training:   0%|          | 0/59 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/59 [00:01<01:53,  1.96s/it][A
Training:   5%|▌         | 3/59 [00:02<00:32,  1.74it/s][A
Training:   7%|▋         | 4/59 [00:02<00:22,  2.42it/s][A
Training:   8%|▊         | 5/59 [00:03<00:37,  1.45it/s][A
Training:  12%|█▏        | 7/59 [00:03<00:20,  2.57it/s][A
Training:  15%|█▌        | 9/59 [00:05<00:25,  1.96it/s][A
Training:  17%|█▋        | 10/59 [00:05<00:20,  2.39it/s][A
Training:  19%|█▊        | 11/59 [00:05<00:18,  2.64it/s][A
Training:  22%|██▏       | 13/59 [00:06<00:22,  2.07it/s][A
Training:  25%|██▌       | 15/59 [00:06<00:15,  2.77it/s][A
Training:  29%|██▉       | 17/59 [00:08<00:18,  2.23it/s][A
Training:  32%|███▏      | 19/59 [00:08<00:13,  2.99it/s][A
Training:  36%|███▌      | 21/59 [00:09<00:17,  2.17it/s][A
Training:  39%|███▉      | 23/59 [00:09<00:12,  2.97it/s][A
Training:  41%|████      | 24/59 [00:10<00:10,  3.37it/s][A
Training:  42%|████▏     | 25/59 [00:1

Epoch: 12/37 - Loss: 2.4146 - Accuracy: 0.9412



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:13,  1.89s/it][A
 62%|██████▎   | 5/8 [00:03<00:01,  1.72it/s][A
100%|██████████| 8/8 [00:03<00:00,  2.23it/s][A
Epochs:  32%|███▏      | 12/37 [05:28<11:24, 27.37s/it]

Val Loss: 2.5888 - Val Accuracy: 0.9350



Training:   0%|          | 0/59 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/59 [00:02<01:57,  2.03s/it][A
Training:   3%|▎         | 2/59 [00:02<00:53,  1.07it/s][A
Training:   7%|▋         | 4/59 [00:02<00:21,  2.57it/s][A
Training:   8%|▊         | 5/59 [00:03<00:36,  1.48it/s][A
Training:  10%|█         | 6/59 [00:03<00:26,  1.99it/s][A
Training:  12%|█▏        | 7/59 [00:03<00:19,  2.63it/s][A
Training:  15%|█▌        | 9/59 [00:05<00:27,  1.85it/s][A
Training:  17%|█▋        | 10/59 [00:05<00:21,  2.30it/s][A
Training:  20%|██        | 12/59 [00:05<00:13,  3.59it/s][A
Training:  22%|██▏       | 13/59 [00:06<00:24,  1.90it/s][A
Training:  25%|██▌       | 15/59 [00:07<00:15,  2.92it/s][A
Training:  29%|██▉       | 17/59 [00:08<00:20,  2.07it/s][A
Training:  31%|███       | 18/59 [00:08<00:16,  2.42it/s][A
Training:  34%|███▍      | 20/59 [00:08<00:11,  3.48it/s][A
Training:  36%|███▌      | 21/59 [00:09<00:16,  2.34it/s][A
Training:  37%|███▋      | 22/59 [00:09

Epoch: 13/37 - Loss: 2.2817 - Accuracy: 0.9429



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:13,  1.91s/it][A
 50%|█████     | 4/8 [00:02<00:01,  2.53it/s][A
100%|██████████| 8/8 [00:03<00:00,  2.24it/s][A
Epochs:  35%|███▌      | 13/37 [05:55<10:57, 27.40s/it]

Val Loss: 2.5025 - Val Accuracy: 0.9248



Training:   0%|          | 0/59 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/59 [00:01<01:41,  1.76s/it][A
Training:   5%|▌         | 3/59 [00:01<00:28,  1.94it/s][A
Training:   7%|▋         | 4/59 [00:02<00:20,  2.68it/s][A
Training:   8%|▊         | 5/59 [00:03<00:34,  1.55it/s][A
Training:  12%|█▏        | 7/59 [00:03<00:18,  2.74it/s][A
Training:  15%|█▌        | 9/59 [00:04<00:24,  2.00it/s][A
Training:  17%|█▋        | 10/59 [00:04<00:20,  2.44it/s][A
Training:  20%|██        | 12/59 [00:05<00:14,  3.32it/s][A
Training:  22%|██▏       | 13/59 [00:06<00:24,  1.91it/s][A
Training:  24%|██▎       | 14/59 [00:06<00:19,  2.32it/s][A
Training:  27%|██▋       | 16/59 [00:06<00:12,  3.37it/s][A
Training:  29%|██▉       | 17/59 [00:07<00:20,  2.10it/s][A
Training:  34%|███▍      | 20/59 [00:08<00:12,  3.22it/s][A
Training:  36%|███▌      | 21/59 [00:09<00:17,  2.18it/s][A
Training:  39%|███▉      | 23/59 [00:09<00:11,  3.09it/s][A
Training:  41%|████      | 24/59 [00:0

Epoch: 14/37 - Loss: 2.2941 - Accuracy: 0.9432



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:12,  1.80s/it][A
 38%|███▊      | 3/8 [00:01<00:02,  1.94it/s][A
100%|██████████| 8/8 [00:03<00:00,  2.40it/s][A
Epochs:  38%|███▊      | 14/37 [06:23<10:30, 27.43s/it]

Val Loss: 2.3537 - Val Accuracy: 0.9407



Training:   0%|          | 0/59 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/59 [00:02<01:55,  2.00s/it][A
Training:   3%|▎         | 2/59 [00:02<00:50,  1.13it/s][A
Training:   7%|▋         | 4/59 [00:02<00:19,  2.77it/s][A
Training:  10%|█         | 6/59 [00:03<00:28,  1.88it/s][A
Training:  14%|█▎        | 8/59 [00:03<00:17,  2.87it/s][A
Training:  15%|█▌        | 9/59 [00:04<00:23,  2.15it/s][A
Training:  17%|█▋        | 10/59 [00:05<00:24,  1.97it/s][A
Training:  19%|█▊        | 11/59 [00:05<00:19,  2.48it/s][A
Training:  22%|██▏       | 13/59 [00:06<00:18,  2.50it/s][A
Training:  24%|██▎       | 14/59 [00:06<00:21,  2.14it/s][A
Training:  27%|██▋       | 16/59 [00:07<00:13,  3.26it/s][A
Training:  29%|██▉       | 17/59 [00:07<00:15,  2.67it/s][A
Training:  31%|███       | 18/59 [00:08<00:19,  2.10it/s][A
Training:  36%|███▌      | 21/59 [00:08<00:12,  3.07it/s][A
Training:  37%|███▋      | 22/59 [00:10<00:17,  2.08it/s][A
Training:  41%|████      | 24/59 [00:1

Epoch: 15/37 - Loss: 2.1527 - Accuracy: 0.9465



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:02<00:15,  2.24s/it][A
 50%|█████     | 4/8 [00:02<00:01,  2.22it/s][A
100%|██████████| 8/8 [00:03<00:00,  2.14it/s][A
Epochs:  41%|████      | 15/37 [06:50<10:03, 27.43s/it]

Val Loss: 2.2329 - Val Accuracy: 0.9397



Training:   0%|          | 0/59 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/59 [00:02<01:56,  2.02s/it][A
Training:   5%|▌         | 3/59 [00:02<00:32,  1.73it/s][A
Training:   8%|▊         | 5/59 [00:03<00:31,  1.72it/s][A
Training:  10%|█         | 6/59 [00:03<00:24,  2.19it/s][A
Training:  12%|█▏        | 7/59 [00:03<00:18,  2.74it/s][A
Training:  14%|█▎        | 8/59 [00:03<00:14,  3.44it/s][A
Training:  15%|█▌        | 9/59 [00:04<00:28,  1.76it/s][A
Training:  17%|█▋        | 10/59 [00:05<00:22,  2.19it/s][A
Training:  19%|█▊        | 11/59 [00:05<00:16,  2.84it/s][A
Training:  20%|██        | 12/59 [00:05<00:13,  3.46it/s][A
Training:  22%|██▏       | 13/59 [00:06<00:25,  1.83it/s][A
Training:  25%|██▌       | 15/59 [00:06<00:14,  3.01it/s][A
Training:  29%|██▉       | 17/59 [00:07<00:17,  2.41it/s][A
Training:  32%|███▏      | 19/59 [00:07<00:11,  3.46it/s][A
Training:  34%|███▍      | 20/59 [00:08<00:09,  3.99it/s][A
Training:  36%|███▌      | 21/59 [00:09

Epoch: 16/37 - Loss: 2.1647 - Accuracy: 0.9445



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:13,  1.89s/it][A
 50%|█████     | 4/8 [00:02<00:01,  2.59it/s][A
100%|██████████| 8/8 [00:03<00:00,  2.43it/s][A
Epochs:  43%|████▎     | 16/37 [07:17<09:33, 27.31s/it]

Val Loss: 2.1574 - Val Accuracy: 0.9397



Training:   0%|          | 0/59 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/59 [00:01<01:46,  1.83s/it][A
Training:   5%|▌         | 3/59 [00:01<00:28,  1.95it/s][A
Training:   8%|▊         | 5/59 [00:03<00:32,  1.67it/s][A
Training:  12%|█▏        | 7/59 [00:03<00:19,  2.69it/s][A
Training:  15%|█▌        | 9/59 [00:04<00:24,  2.06it/s][A
Training:  19%|█▊        | 11/59 [00:05<00:17,  2.67it/s][A
Training:  20%|██        | 12/59 [00:05<00:15,  3.12it/s][A
Training:  22%|██▏       | 13/59 [00:06<00:23,  1.92it/s][A
Training:  24%|██▎       | 14/59 [00:06<00:18,  2.37it/s][A
Training:  25%|██▌       | 15/59 [00:06<00:15,  2.87it/s][A
Training:  29%|██▉       | 17/59 [00:07<00:18,  2.31it/s][A
Training:  31%|███       | 18/59 [00:07<00:15,  2.70it/s][A
Training:  34%|███▍      | 20/59 [00:08<00:09,  3.91it/s][A
Training:  36%|███▌      | 21/59 [00:09<00:16,  2.24it/s][A
Training:  37%|███▋      | 22/59 [00:09<00:16,  2.29it/s][A
Training:  41%|████      | 24/59 [00:

Epoch: 17/37 - Loss: 2.0843 - Accuracy: 0.9467



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:02<00:14,  2.06s/it][A
 25%|██▌       | 2/8 [00:02<00:05,  1.07it/s][A
 50%|█████     | 4/8 [00:02<00:01,  2.56it/s][A
100%|██████████| 8/8 [00:03<00:00,  2.25it/s][A
Epochs:  46%|████▌     | 17/37 [07:44<09:04, 27.23s/it]

Val Loss: 2.1045 - Val Accuracy: 0.9444



Training:   0%|          | 0/59 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/59 [00:01<01:54,  1.98s/it][A
Training:   3%|▎         | 2/59 [00:02<00:52,  1.08it/s][A
Training:   7%|▋         | 4/59 [00:02<00:22,  2.48it/s][A
Training:   8%|▊         | 5/59 [00:03<00:34,  1.55it/s][A
Training:  12%|█▏        | 7/59 [00:03<00:19,  2.68it/s][A
Training:  15%|█▌        | 9/59 [00:04<00:22,  2.18it/s][A
Training:  17%|█▋        | 10/59 [00:04<00:18,  2.63it/s][A
Training:  20%|██        | 12/59 [00:05<00:12,  3.81it/s][A
Training:  22%|██▏       | 13/59 [00:06<00:22,  2.06it/s][A
Training:  24%|██▎       | 14/59 [00:06<00:18,  2.49it/s][A
Training:  29%|██▉       | 17/59 [00:08<00:18,  2.24it/s][A
Training:  31%|███       | 18/59 [00:08<00:15,  2.63it/s][A
Training:  36%|███▌      | 21/59 [00:09<00:15,  2.50it/s][A
Training:  37%|███▋      | 22/59 [00:09<00:12,  2.87it/s][A
Training:  39%|███▉      | 23/59 [00:09<00:11,  3.25it/s][A
Training:  42%|████▏     | 25/59 [00:1

Epoch: 18/37 - Loss: 2.0580 - Accuracy: 0.9465



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:13,  1.91s/it][A
 25%|██▌       | 2/8 [00:02<00:05,  1.16it/s][A
 62%|██████▎   | 5/8 [00:03<00:01,  1.78it/s][A
100%|██████████| 8/8 [00:03<00:00,  2.15it/s][A
Epochs:  49%|████▊     | 18/37 [08:12<08:39, 27.34s/it]

Val Loss: 2.1993 - Val Accuracy: 0.9422



Training:   0%|          | 0/59 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/59 [00:01<01:40,  1.73s/it][A
Training:   5%|▌         | 3/59 [00:01<00:28,  1.98it/s][A
Training:   7%|▋         | 4/59 [00:02<00:21,  2.58it/s][A
Training:   8%|▊         | 5/59 [00:03<00:38,  1.40it/s][A
Training:  10%|█         | 6/59 [00:03<00:28,  1.86it/s][A
Training:  12%|█▏        | 7/59 [00:03<00:21,  2.47it/s][A
Training:  14%|█▎        | 8/59 [00:03<00:16,  3.13it/s][A
Training:  15%|█▌        | 9/59 [00:04<00:25,  1.98it/s][A
Training:  19%|█▊        | 11/59 [00:04<00:14,  3.38it/s][A
Training:  22%|██▏       | 13/59 [00:06<00:20,  2.25it/s][A
Training:  24%|██▎       | 14/59 [00:06<00:17,  2.63it/s][A
Training:  25%|██▌       | 15/59 [00:06<00:13,  3.18it/s][A
Training:  29%|██▉       | 17/59 [00:07<00:18,  2.29it/s][A
Training:  31%|███       | 18/59 [00:07<00:15,  2.58it/s][A
Training:  34%|███▍      | 20/59 [00:08<00:10,  3.84it/s][A
Training:  36%|███▌      | 21/59 [00:09<

Epoch: 19/37 - Loss: 2.0035 - Accuracy: 0.9469



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:12,  1.85s/it][A
 25%|██▌       | 2/8 [00:02<00:05,  1.03it/s][A
 50%|█████     | 4/8 [00:02<00:01,  2.43it/s][A
 62%|██████▎   | 5/8 [00:03<00:01,  1.62it/s][A
100%|██████████| 8/8 [00:03<00:00,  2.06it/s][A
Epochs:  51%|█████▏    | 19/37 [08:39<08:09, 27.17s/it]

Val Loss: 2.1945 - Val Accuracy: 0.9397



Training:   0%|          | 0/59 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/59 [00:01<01:47,  1.85s/it][A
Training:   5%|▌         | 3/59 [00:02<00:30,  1.82it/s][A
Training:   8%|▊         | 5/59 [00:03<00:33,  1.63it/s][A
Training:  12%|█▏        | 7/59 [00:03<00:21,  2.42it/s][A
Training:  14%|█▎        | 8/59 [00:03<00:17,  2.92it/s][A
Training:  15%|█▌        | 9/59 [00:04<00:23,  2.12it/s][A
Training:  20%|██        | 12/59 [00:04<00:11,  3.98it/s][A
Training:  24%|██▎       | 14/59 [00:06<00:17,  2.60it/s][A
Training:  25%|██▌       | 15/59 [00:06<00:14,  2.97it/s][A
Training:  29%|██▉       | 17/59 [00:07<00:17,  2.45it/s][A
Training:  31%|███       | 18/59 [00:07<00:15,  2.65it/s][A
Training:  34%|███▍      | 20/59 [00:07<00:10,  3.71it/s][A
Training:  36%|███▌      | 21/59 [00:08<00:15,  2.51it/s][A
Training:  37%|███▋      | 22/59 [00:09<00:15,  2.39it/s][A
Training:  39%|███▉      | 23/59 [00:09<00:12,  2.92it/s][A
Training:  41%|████      | 24/59 [00:0

Epoch: 20/37 - Loss: 2.0342 - Accuracy: 0.9484



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:12,  1.86s/it][A
 38%|███▊      | 3/8 [00:02<00:02,  1.87it/s][A
 50%|█████     | 4/8 [00:02<00:01,  2.53it/s][A
100%|██████████| 8/8 [00:03<00:00,  2.24it/s][A
Epochs:  54%|█████▍    | 20/37 [09:06<07:41, 27.14s/it]

Val Loss: 2.0772 - Val Accuracy: 0.9346



Training:   0%|          | 0/59 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/59 [00:01<01:50,  1.90s/it][A
Training:   7%|▋         | 4/59 [00:02<00:21,  2.54it/s][A
Training:  10%|█         | 6/59 [00:03<00:28,  1.84it/s][A
Training:  12%|█▏        | 7/59 [00:03<00:22,  2.27it/s][A
Training:  14%|█▎        | 8/59 [00:03<00:18,  2.82it/s][A
Training:  15%|█▌        | 9/59 [00:04<00:24,  2.00it/s][A
Training:  17%|█▋        | 10/59 [00:04<00:21,  2.24it/s][A
Training:  22%|██▏       | 13/59 [00:06<00:18,  2.50it/s][A
Training:  24%|██▎       | 14/59 [00:06<00:17,  2.55it/s][A
Training:  27%|██▋       | 16/59 [00:06<00:12,  3.55it/s][A
Training:  29%|██▉       | 17/59 [00:07<00:17,  2.37it/s][A
Training:  31%|███       | 18/59 [00:07<00:15,  2.63it/s][A
Training:  34%|███▍      | 20/59 [00:07<00:09,  4.00it/s][A
Training:  36%|███▌      | 21/59 [00:08<00:14,  2.65it/s][A
Training:  37%|███▋      | 22/59 [00:09<00:17,  2.16it/s][A
Training:  41%|████      | 24/59 [00:0

Epoch: 21/37 - Loss: 2.0802 - Accuracy: 0.9467



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:13,  1.95s/it][A
 25%|██▌       | 2/8 [00:02<00:05,  1.10it/s][A
 50%|█████     | 4/8 [00:02<00:01,  2.64it/s][A
 62%|██████▎   | 5/8 [00:03<00:01,  1.67it/s][A
100%|██████████| 8/8 [00:03<00:00,  2.13it/s][A
Epochs:  57%|█████▋    | 21/37 [09:32<07:12, 27.05s/it]

Val Loss: 2.4215 - Val Accuracy: 0.9371



Training:   0%|          | 0/59 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/59 [00:01<01:55,  1.99s/it][A
Training:   5%|▌         | 3/59 [00:02<00:32,  1.73it/s][A
Training:   8%|▊         | 5/59 [00:03<00:31,  1.70it/s][A
Training:  10%|█         | 6/59 [00:03<00:26,  1.99it/s][A
Training:  14%|█▎        | 8/59 [00:03<00:15,  3.24it/s][A
Training:  15%|█▌        | 9/59 [00:04<00:25,  1.94it/s][A
Training:  19%|█▊        | 11/59 [00:05<00:16,  2.93it/s][A
Training:  22%|██▏       | 13/59 [00:06<00:20,  2.26it/s][A
Training:  24%|██▎       | 14/59 [00:06<00:17,  2.64it/s][A
Training:  27%|██▋       | 16/59 [00:06<00:11,  3.60it/s][A
Training:  29%|██▉       | 17/59 [00:07<00:17,  2.35it/s][A
Training:  31%|███       | 18/59 [00:07<00:14,  2.83it/s][A
Training:  34%|███▍      | 20/59 [00:07<00:10,  3.85it/s][A
Training:  36%|███▌      | 21/59 [00:09<00:17,  2.23it/s][A
Training:  37%|███▋      | 22/59 [00:09<00:14,  2.51it/s][A
Training:  39%|███▉      | 23/59 [00:0

Epoch: 22/37 - Loss: 2.0029 - Accuracy: 0.9475



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:02<00:14,  2.10s/it][A
 38%|███▊      | 3/8 [00:02<00:03,  1.58it/s][A
 50%|█████     | 4/8 [00:02<00:01,  2.22it/s][A
 62%|██████▎   | 5/8 [00:03<00:01,  1.50it/s][A
100%|██████████| 8/8 [00:03<00:00,  2.08it/s][A
Epochs:  59%|█████▉    | 22/37 [10:00<06:48, 27.26s/it]

Val Loss: 2.0020 - Val Accuracy: 0.9459



Training:   0%|          | 0/59 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/59 [00:01<01:49,  1.89s/it][A
Training:   5%|▌         | 3/59 [00:02<00:30,  1.81it/s][A
Training:   8%|▊         | 5/59 [00:03<00:32,  1.68it/s][A
Training:  12%|█▏        | 7/59 [00:03<00:19,  2.73it/s][A
Training:  15%|█▌        | 9/59 [00:04<00:22,  2.19it/s][A
Training:  17%|█▋        | 10/59 [00:04<00:19,  2.45it/s][A
Training:  20%|██        | 12/59 [00:05<00:13,  3.43it/s][A
Training:  22%|██▏       | 13/59 [00:06<00:21,  2.15it/s][A
Training:  24%|██▎       | 14/59 [00:06<00:19,  2.28it/s][A
Training:  29%|██▉       | 17/59 [00:07<00:17,  2.34it/s][A
Training:  31%|███       | 18/59 [00:08<00:18,  2.26it/s][A
Training:  34%|███▍      | 20/59 [00:08<00:12,  3.13it/s][A
Training:  36%|███▌      | 21/59 [00:09<00:16,  2.31it/s][A
Training:  37%|███▋      | 22/59 [00:09<00:16,  2.23it/s][A
Training:  41%|████      | 24/59 [00:09<00:10,  3.36it/s][A
Training:  42%|████▏     | 25/59 [00:

Epoch: 23/37 - Loss: 1.9363 - Accuracy: 0.9490



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:02<00:14,  2.14s/it][A
 38%|███▊      | 3/8 [00:02<00:02,  1.68it/s][A
100%|██████████| 8/8 [00:03<00:00,  2.02it/s][A
Epochs:  62%|██████▏   | 23/37 [10:28<06:23, 27.42s/it]

Val Loss: 2.0807 - Val Accuracy: 0.9434



Training:   0%|          | 0/59 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/59 [00:01<01:34,  1.63s/it][A
Training:   5%|▌         | 3/59 [00:01<00:25,  2.16it/s][A
Training:   8%|▊         | 5/59 [00:02<00:26,  2.03it/s][A
Training:  10%|█         | 6/59 [00:02<00:21,  2.50it/s][A
Training:  12%|█▏        | 7/59 [00:03<00:17,  3.04it/s][A
Training:  14%|█▎        | 8/59 [00:03<00:14,  3.60it/s][A
Training:  15%|█▌        | 9/59 [00:04<00:22,  2.19it/s][A
Training:  17%|█▋        | 10/59 [00:04<00:18,  2.59it/s][A
Training:  20%|██        | 12/59 [00:04<00:12,  3.81it/s][A
Training:  22%|██▏       | 13/59 [00:05<00:16,  2.81it/s][A
Training:  24%|██▎       | 14/59 [00:05<00:17,  2.57it/s][A
Training:  27%|██▋       | 16/59 [00:05<00:11,  3.66it/s][A
Training:  29%|██▉       | 17/59 [00:06<00:17,  2.36it/s][A
Training:  31%|███       | 18/59 [00:07<00:19,  2.15it/s][A
Training:  34%|███▍      | 20/59 [00:07<00:11,  3.37it/s][A
Training:  36%|███▌      | 21/59 [00:08

Epoch: 24/37 - Loss: 1.9267 - Accuracy: 0.9494



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:13,  1.92s/it][A
 25%|██▌       | 2/8 [00:02<00:05,  1.10it/s][A
 50%|█████     | 4/8 [00:02<00:01,  2.50it/s][A
 62%|██████▎   | 5/8 [00:03<00:01,  1.63it/s][A
100%|██████████| 8/8 [00:03<00:00,  2.19it/s][A
Epochs:  65%|██████▍   | 24/37 [10:55<05:55, 27.36s/it]

Val Loss: 2.0327 - Val Accuracy: 0.9409



Training:   0%|          | 0/59 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/59 [00:01<01:32,  1.60s/it][A
Training:   3%|▎         | 2/59 [00:01<00:41,  1.38it/s][A
Training:   5%|▌         | 3/59 [00:01<00:25,  2.22it/s][A
Training:   8%|▊         | 5/59 [00:03<00:33,  1.63it/s][A
Training:  12%|█▏        | 7/59 [00:03<00:19,  2.65it/s][A
Training:  15%|█▌        | 9/59 [00:04<00:22,  2.20it/s][A
Training:  19%|█▊        | 11/59 [00:04<00:14,  3.20it/s][A
Training:  22%|██▏       | 13/59 [00:05<00:18,  2.55it/s][A
Training:  25%|██▌       | 15/59 [00:05<00:12,  3.47it/s][A
Training:  29%|██▉       | 17/59 [00:07<00:17,  2.41it/s][A
Training:  34%|███▍      | 20/59 [00:07<00:11,  3.49it/s][A
Training:  36%|███▌      | 21/59 [00:08<00:17,  2.21it/s][A
Training:  39%|███▉      | 23/59 [00:09<00:11,  3.06it/s][A
Training:  41%|████      | 24/59 [00:09<00:10,  3.47it/s][A
Training:  42%|████▏     | 25/59 [00:10<00:17,  1.98it/s][A
Training:  46%|████▌     | 27/59 [00:1

Epoch: 25/37 - Loss: 1.9293 - Accuracy: 0.9485



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:02<00:14,  2.02s/it][A
 25%|██▌       | 2/8 [00:02<00:05,  1.11it/s][A
 38%|███▊      | 3/8 [00:02<00:02,  1.80it/s][A
 50%|█████     | 4/8 [00:02<00:01,  2.60it/s][A
 62%|██████▎   | 5/8 [00:03<00:01,  1.62it/s][A
100%|██████████| 8/8 [00:03<00:00,  2.18it/s][A
Epochs:  68%|██████▊   | 25/37 [11:22<05:27, 27.29s/it]

Val Loss: 2.1168 - Val Accuracy: 0.9360



Training:   0%|          | 0/59 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/59 [00:02<01:58,  2.04s/it][A
Training:   5%|▌         | 3/59 [00:02<00:33,  1.69it/s][A
Training:   8%|▊         | 5/59 [00:03<00:32,  1.66it/s][A
Training:  14%|█▎        | 8/59 [00:03<00:16,  3.10it/s][A
Training:  15%|█▌        | 9/59 [00:05<00:27,  1.83it/s][A
Training:  17%|█▋        | 10/59 [00:05<00:22,  2.23it/s][A
Training:  19%|█▊        | 11/59 [00:05<00:17,  2.73it/s][A
Training:  22%|██▏       | 13/59 [00:06<00:20,  2.29it/s][A
Training:  27%|██▋       | 16/59 [00:06<00:11,  3.81it/s][A
Training:  29%|██▉       | 17/59 [00:07<00:19,  2.14it/s][A
Training:  32%|███▏      | 19/59 [00:08<00:13,  3.06it/s][A
Training:  36%|███▌      | 21/59 [00:09<00:17,  2.12it/s][A
Training:  37%|███▋      | 22/59 [00:09<00:14,  2.48it/s][A
Training:  41%|████      | 24/59 [00:09<00:09,  3.55it/s][A
Training:  44%|████▍     | 26/59 [00:11<00:13,  2.40it/s][A
Training:  46%|████▌     | 27/59 [00:

Epoch: 26/37 - Loss: 1.8775 - Accuracy: 0.9498



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:02<00:14,  2.09s/it][A
 38%|███▊      | 3/8 [00:02<00:03,  1.66it/s][A
 50%|█████     | 4/8 [00:02<00:01,  2.29it/s][A
 62%|██████▎   | 5/8 [00:03<00:01,  1.55it/s][A
100%|██████████| 8/8 [00:03<00:00,  2.18it/s][A
Epochs:  70%|███████   | 26/37 [11:50<05:01, 27.42s/it]

Val Loss: 2.1112 - Val Accuracy: 0.9429



Training:   0%|          | 0/59 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/59 [00:01<01:52,  1.94s/it][A
Training:   5%|▌         | 3/59 [00:02<00:30,  1.82it/s][A
Training:   8%|▊         | 5/59 [00:03<00:32,  1.67it/s][A
Training:  12%|█▏        | 7/59 [00:03<00:19,  2.68it/s][A
Training:  15%|█▌        | 9/59 [00:05<00:25,  1.94it/s][A
Training:  17%|█▋        | 10/59 [00:05<00:20,  2.34it/s][A
Training:  19%|█▊        | 11/59 [00:05<00:17,  2.80it/s][A
Training:  22%|██▏       | 13/59 [00:06<00:21,  2.14it/s][A
Training:  24%|██▎       | 14/59 [00:06<00:17,  2.54it/s][A
Training:  27%|██▋       | 16/59 [00:06<00:11,  3.65it/s][A
Training:  29%|██▉       | 17/59 [00:07<00:17,  2.37it/s][A
Training:  31%|███       | 18/59 [00:07<00:14,  2.88it/s][A
Training:  36%|███▌      | 21/59 [00:09<00:15,  2.44it/s][A
Training:  39%|███▉      | 23/59 [00:09<00:10,  3.38it/s][A
Training:  42%|████▏     | 25/59 [00:10<00:14,  2.34it/s][A
Training:  46%|████▌     | 27/59 [00:

Epoch: 27/37 - Loss: 1.9109 - Accuracy: 0.9480



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:02<00:13,  1.99s/it][A
 38%|███▊      | 3/8 [00:02<00:02,  1.77it/s][A
 62%|██████▎   | 5/8 [00:03<00:01,  1.77it/s][A
100%|██████████| 8/8 [00:03<00:00,  2.30it/s][A
Epochs:  73%|███████▎  | 27/37 [12:17<04:32, 27.21s/it]

Val Loss: 2.0492 - Val Accuracy: 0.9449



Training:   0%|          | 0/59 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/59 [00:01<01:53,  1.96s/it][A
Training:   3%|▎         | 2/59 [00:02<00:50,  1.13it/s][A
Training:   8%|▊         | 5/59 [00:03<00:25,  2.10it/s][A
Training:  10%|█         | 6/59 [00:03<00:20,  2.54it/s][A
Training:  15%|█▌        | 9/59 [00:04<00:22,  2.27it/s][A
Training:  17%|█▋        | 10/59 [00:04<00:18,  2.64it/s][A
Training:  19%|█▊        | 11/59 [00:04<00:15,  3.15it/s][A
Training:  22%|██▏       | 13/59 [00:06<00:20,  2.20it/s][A
Training:  25%|██▌       | 15/59 [00:06<00:14,  3.12it/s][A
Training:  29%|██▉       | 17/59 [00:07<00:17,  2.37it/s][A
Training:  31%|███       | 18/59 [00:07<00:14,  2.75it/s][A
Training:  32%|███▏      | 19/59 [00:07<00:12,  3.25it/s][A
Training:  34%|███▍      | 20/59 [00:07<00:10,  3.82it/s][A
Training:  36%|███▌      | 21/59 [00:09<00:20,  1.81it/s][A
Training:  37%|███▋      | 22/59 [00:09<00:16,  2.29it/s][A
Training:  41%|████      | 24/59 [00:

Epoch: 28/37 - Loss: 1.8990 - Accuracy: 0.9498



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:13,  1.96s/it][A
 25%|██▌       | 2/8 [00:02<00:06,  1.00s/it][A
 50%|█████     | 4/8 [00:02<00:01,  2.44it/s][A
 62%|██████▎   | 5/8 [00:03<00:01,  1.97it/s][A
100%|██████████| 8/8 [00:03<00:00,  2.09it/s][A
Epochs:  76%|███████▌  | 28/37 [12:44<04:04, 27.19s/it]

Val Loss: 2.0442 - Val Accuracy: 0.9445



Training:   0%|          | 0/59 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/59 [00:01<01:54,  1.97s/it][A
Training:   5%|▌         | 3/59 [00:02<00:32,  1.70it/s][A
Training:   8%|▊         | 5/59 [00:03<00:29,  1.85it/s][A
Training:  12%|█▏        | 7/59 [00:03<00:21,  2.40it/s][A
Training:  15%|█▌        | 9/59 [00:04<00:23,  2.16it/s][A
Training:  17%|█▋        | 10/59 [00:04<00:19,  2.55it/s][A
Training:  19%|█▊        | 11/59 [00:05<00:22,  2.16it/s][A
Training:  22%|██▏       | 13/59 [00:06<00:20,  2.21it/s][A
Training:  25%|██▌       | 15/59 [00:07<00:18,  2.35it/s][A
Training:  29%|██▉       | 17/59 [00:07<00:15,  2.76it/s][A
Training:  32%|███▏      | 19/59 [00:08<00:17,  2.27it/s][A
Training:  36%|███▌      | 21/59 [00:09<00:13,  2.78it/s][A
Training:  37%|███▋      | 22/59 [00:09<00:11,  3.15it/s][A
Training:  39%|███▉      | 23/59 [00:10<00:18,  1.94it/s][A
Training:  42%|████▏     | 25/59 [00:10<00:11,  2.84it/s][A
Training:  44%|████▍     | 26/59 [00:

Epoch: 29/37 - Loss: 1.8979 - Accuracy: 0.9489



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:11,  1.67s/it][A
 38%|███▊      | 3/8 [00:01<00:02,  2.08it/s][A
 62%|██████▎   | 5/8 [00:03<00:01,  1.74it/s][A
100%|██████████| 8/8 [00:03<00:00,  2.40it/s][A
Epochs:  78%|███████▊  | 29/37 [13:12<03:39, 27.48s/it]

Val Loss: 2.0915 - Val Accuracy: 0.9413



Training:   0%|          | 0/59 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/59 [00:01<01:43,  1.78s/it][A
Training:   5%|▌         | 3/59 [00:01<00:28,  1.98it/s][A
Training:   8%|▊         | 5/59 [00:03<00:31,  1.71it/s][A
Training:  10%|█         | 6/59 [00:03<00:24,  2.19it/s][A
Training:  12%|█▏        | 7/59 [00:03<00:19,  2.70it/s][A
Training:  14%|█▎        | 8/59 [00:03<00:15,  3.30it/s][A
Training:  15%|█▌        | 9/59 [00:04<00:29,  1.69it/s][A
Training:  19%|█▊        | 11/59 [00:05<00:16,  2.84it/s][A
Training:  22%|██▏       | 13/59 [00:06<00:24,  1.88it/s][A
Training:  27%|██▋       | 16/59 [00:06<00:13,  3.20it/s][A
Training:  31%|███       | 18/59 [00:08<00:18,  2.23it/s][A
Training:  34%|███▍      | 20/59 [00:08<00:13,  2.95it/s][A
Training:  36%|███▌      | 21/59 [00:09<00:18,  2.03it/s][A
Training:  39%|███▉      | 23/59 [00:09<00:12,  2.89it/s][A
Training:  42%|████▏     | 25/59 [00:11<00:16,  2.05it/s][A
Training:  44%|████▍     | 26/59 [00:11

Epoch: 30/37 - Loss: 1.9145 - Accuracy: 0.9498



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:12,  1.81s/it][A
 25%|██▌       | 2/8 [00:01<00:04,  1.23it/s][A
 62%|██████▎   | 5/8 [00:03<00:01,  1.86it/s][A
100%|██████████| 8/8 [00:03<00:00,  2.34it/s][A
Epochs:  81%|████████  | 30/37 [13:39<03:12, 27.44s/it]

Val Loss: 2.0940 - Val Accuracy: 0.9372



Training:   0%|          | 0/59 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/59 [00:01<01:46,  1.83s/it][A
Training:   3%|▎         | 2/59 [00:01<00:47,  1.21it/s][A
Training:   5%|▌         | 3/59 [00:02<00:27,  2.01it/s][A
Training:   7%|▋         | 4/59 [00:02<00:18,  2.93it/s][A
Training:   8%|▊         | 5/59 [00:03<00:33,  1.61it/s][A
Training:  10%|█         | 6/59 [00:03<00:23,  2.21it/s][A
Training:  14%|█▎        | 8/59 [00:03<00:13,  3.85it/s][A
Training:  15%|█▌        | 9/59 [00:05<00:29,  1.67it/s][A
Training:  17%|█▋        | 10/59 [00:05<00:22,  2.14it/s][A
Training:  19%|█▊        | 11/59 [00:05<00:17,  2.72it/s][A
Training:  20%|██        | 12/59 [00:05<00:13,  3.36it/s][A
Training:  22%|██▏       | 13/59 [00:06<00:25,  1.84it/s][A
Training:  29%|██▉       | 17/59 [00:08<00:18,  2.31it/s][A
Training:  34%|███▍      | 20/59 [00:08<00:10,  3.60it/s][A
Training:  36%|███▌      | 21/59 [00:09<00:18,  2.09it/s][A
Training:  39%|███▉      | 23/59 [00:09<

Epoch: 31/37 - Loss: 1.8922 - Accuracy: 0.9498



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:02<00:14,  2.09s/it][A
 38%|███▊      | 3/8 [00:02<00:03,  1.63it/s][A
100%|██████████| 8/8 [00:03<00:00,  2.34it/s][A
Epochs:  84%|████████▍ | 31/37 [14:06<02:43, 27.31s/it]

Val Loss: 2.0603 - Val Accuracy: 0.9449



Training:   0%|          | 0/59 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/59 [00:01<01:51,  1.93s/it][A
Training:   5%|▌         | 3/59 [00:02<00:32,  1.70it/s][A
Training:   8%|▊         | 5/59 [00:03<00:32,  1.66it/s][A
Training:  12%|█▏        | 7/59 [00:03<00:19,  2.61it/s][A
Training:  15%|█▌        | 9/59 [00:04<00:22,  2.18it/s][A
Training:  19%|█▊        | 11/59 [00:04<00:15,  3.16it/s][A
Training:  22%|██▏       | 13/59 [00:06<00:19,  2.42it/s][A
Training:  25%|██▌       | 15/59 [00:06<00:13,  3.25it/s][A
Training:  27%|██▋       | 16/59 [00:06<00:12,  3.53it/s][A
Training:  29%|██▉       | 17/59 [00:07<00:19,  2.17it/s][A
Training:  32%|███▏      | 19/59 [00:07<00:13,  3.07it/s][A
Training:  34%|███▍      | 20/59 [00:07<00:11,  3.55it/s][A
Training:  36%|███▌      | 21/59 [00:08<00:17,  2.15it/s][A
Training:  39%|███▉      | 23/59 [00:09<00:14,  2.52it/s][A
Training:  42%|████▏     | 25/59 [00:10<00:12,  2.72it/s][A
Training:  44%|████▍     | 26/59 [00:

Epoch: 32/37 - Loss: 1.8576 - Accuracy: 0.9514



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:13,  1.88s/it][A
 25%|██▌       | 2/8 [00:02<00:05,  1.19it/s][A
 62%|██████▎   | 5/8 [00:03<00:01,  1.80it/s][A
100%|██████████| 8/8 [00:03<00:00,  2.24it/s][A
Epochs:  86%|████████▋ | 32/37 [14:34<02:16, 27.32s/it]

Val Loss: 2.2241 - Val Accuracy: 0.9387



Training:   0%|          | 0/59 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/59 [00:02<02:01,  2.10s/it][A
Training:   3%|▎         | 2/59 [00:02<00:53,  1.07it/s][A
Training:   7%|▋         | 4/59 [00:02<00:21,  2.60it/s][A
Training:  10%|█         | 6/59 [00:03<00:26,  1.98it/s][A
Training:  14%|█▎        | 8/59 [00:03<00:16,  3.00it/s][A
Training:  15%|█▌        | 9/59 [00:05<00:27,  1.79it/s][A
Training:  19%|█▊        | 11/59 [00:05<00:17,  2.75it/s][A
Training:  22%|██▏       | 13/59 [00:06<00:22,  2.06it/s][A
Training:  25%|██▌       | 15/59 [00:06<00:15,  2.83it/s][A
Training:  29%|██▉       | 17/59 [00:08<00:18,  2.30it/s][A
Training:  32%|███▏      | 19/59 [00:08<00:12,  3.11it/s][A
Training:  36%|███▌      | 21/59 [00:09<00:16,  2.31it/s][A
Training:  37%|███▋      | 22/59 [00:09<00:13,  2.69it/s][A
Training:  39%|███▉      | 23/59 [00:09<00:11,  3.12it/s][A
Training:  42%|████▏     | 25/59 [00:10<00:14,  2.37it/s][A
Training:  44%|████▍     | 26/59 [00:1

Epoch: 33/37 - Loss: 1.9191 - Accuracy: 0.9458



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:12,  1.77s/it][A
 25%|██▌       | 2/8 [00:01<00:04,  1.27it/s][A
 38%|███▊      | 3/8 [00:02<00:02,  2.00it/s][A
 50%|█████     | 4/8 [00:02<00:01,  2.85it/s][A
100%|██████████| 8/8 [00:03<00:00,  2.17it/s][A
Epochs:  89%|████████▉ | 33/37 [15:01<01:49, 27.37s/it]

Val Loss: 2.1367 - Val Accuracy: 0.9347



Training:   0%|          | 0/59 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/59 [00:02<02:14,  2.31s/it][A
Training:   3%|▎         | 2/59 [00:02<00:58,  1.02s/it][A
Training:   5%|▌         | 3/59 [00:02<00:34,  1.60it/s][A
Training:   7%|▋         | 4/59 [00:02<00:23,  2.33it/s][A
Training:   8%|▊         | 5/59 [00:03<00:33,  1.61it/s][A
Training:  10%|█         | 6/59 [00:03<00:24,  2.15it/s][A
Training:  14%|█▎        | 8/59 [00:03<00:13,  3.70it/s][A
Training:  15%|█▌        | 9/59 [00:05<00:24,  2.01it/s][A
Training:  17%|█▋        | 10/59 [00:05<00:22,  2.22it/s][A
Training:  20%|██        | 12/59 [00:05<00:13,  3.43it/s][A
Training:  22%|██▏       | 13/59 [00:06<00:22,  2.08it/s][A
Training:  24%|██▎       | 14/59 [00:06<00:18,  2.49it/s][A
Training:  29%|██▉       | 17/59 [00:08<00:16,  2.48it/s][A
Training:  31%|███       | 18/59 [00:08<00:14,  2.76it/s][A
Training:  34%|███▍      | 20/59 [00:08<00:09,  4.00it/s][A
Training:  36%|███▌      | 21/59 [00:09<

Epoch: 34/37 - Loss: 1.8440 - Accuracy: 0.9533



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:02<00:14,  2.04s/it][A
 38%|███▊      | 3/8 [00:02<00:02,  1.75it/s][A
 62%|██████▎   | 5/8 [00:03<00:01,  1.69it/s][A
100%|██████████| 8/8 [00:03<00:00,  2.17it/s][A
Epochs:  92%|█████████▏| 34/37 [15:29<01:22, 27.61s/it]

Val Loss: 2.0472 - Val Accuracy: 0.9408



Training:   0%|          | 0/59 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/59 [00:02<02:04,  2.15s/it][A
Training:   3%|▎         | 2/59 [00:02<00:54,  1.05it/s][A
Training:   7%|▋         | 4/59 [00:02<00:21,  2.52it/s][A
Training:   8%|▊         | 5/59 [00:03<00:34,  1.58it/s][A
Training:  12%|█▏        | 7/59 [00:03<00:19,  2.71it/s][A
Training:  15%|█▌        | 9/59 [00:05<00:24,  2.04it/s][A
Training:  17%|█▋        | 10/59 [00:05<00:19,  2.46it/s][A
Training:  20%|██        | 12/59 [00:05<00:13,  3.56it/s][A
Training:  22%|██▏       | 13/59 [00:06<00:24,  1.86it/s][A
Training:  24%|██▎       | 14/59 [00:06<00:19,  2.30it/s][A
Training:  27%|██▋       | 16/59 [00:06<00:12,  3.54it/s][A
Training:  31%|███       | 18/59 [00:08<00:17,  2.35it/s][A
Training:  34%|███▍      | 20/59 [00:08<00:11,  3.31it/s][A
Training:  37%|███▋      | 22/59 [00:09<00:16,  2.30it/s][A
Training:  41%|████      | 24/59 [00:10<00:11,  3.12it/s][A
Training:  42%|████▏     | 25/59 [00:1

Epoch: 35/37 - Loss: 1.8529 - Accuracy: 0.9519



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:02<00:14,  2.07s/it][A
 38%|███▊      | 3/8 [00:02<00:02,  1.73it/s][A
 62%|██████▎   | 5/8 [00:03<00:01,  1.56it/s][A
100%|██████████| 8/8 [00:03<00:00,  2.04it/s][A
Epochs:  95%|█████████▍| 35/37 [15:57<00:55, 27.57s/it]

Val Loss: 2.1006 - Val Accuracy: 0.9438



Training:   0%|          | 0/59 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/59 [00:01<01:51,  1.92s/it][A
Training:   3%|▎         | 2/59 [00:02<00:52,  1.09it/s][A
Training:   7%|▋         | 4/59 [00:02<00:21,  2.61it/s][A
Training:   8%|▊         | 5/59 [00:03<00:32,  1.64it/s][A
Training:  10%|█         | 6/59 [00:03<00:25,  2.09it/s][A
Training:  14%|█▎        | 8/59 [00:03<00:14,  3.53it/s][A
Training:  15%|█▌        | 9/59 [00:05<00:28,  1.76it/s][A
Training:  17%|█▋        | 10/59 [00:05<00:22,  2.13it/s][A
Training:  20%|██        | 12/59 [00:05<00:14,  3.21it/s][A
Training:  22%|██▏       | 13/59 [00:06<00:23,  1.98it/s][A
Training:  24%|██▎       | 14/59 [00:06<00:19,  2.25it/s][A
Training:  27%|██▋       | 16/59 [00:07<00:12,  3.51it/s][A
Training:  29%|██▉       | 17/59 [00:08<00:22,  1.89it/s][A
Training:  31%|███       | 18/59 [00:08<00:17,  2.36it/s][A
Training:  32%|███▏      | 19/59 [00:08<00:13,  2.93it/s][A
Training:  36%|███▌      | 21/59 [00:09

Epoch: 36/37 - Loss: 1.8918 - Accuracy: 0.9506



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:13,  1.94s/it][A
 25%|██▌       | 2/8 [00:02<00:05,  1.16it/s][A
 50%|█████     | 4/8 [00:02<00:01,  2.73it/s][A
 62%|██████▎   | 5/8 [00:03<00:01,  1.56it/s][A
100%|██████████| 8/8 [00:03<00:00,  2.13it/s][A
Epochs:  97%|█████████▋| 36/37 [16:24<00:27, 27.56s/it]

Val Loss: 2.1716 - Val Accuracy: 0.9417



Training:   0%|          | 0/59 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/59 [00:01<01:52,  1.94s/it][A
Training:   5%|▌         | 3/59 [00:02<00:30,  1.83it/s][A
Training:   8%|▊         | 5/59 [00:03<00:31,  1.72it/s][A
Training:  12%|█▏        | 7/59 [00:03<00:18,  2.74it/s][A
Training:  14%|█▎        | 8/59 [00:03<00:16,  3.07it/s][A
Training:  15%|█▌        | 9/59 [00:04<00:24,  2.06it/s][A
Training:  17%|█▋        | 10/59 [00:04<00:18,  2.60it/s][A
Training:  19%|█▊        | 11/59 [00:04<00:15,  3.07it/s][A
Training:  20%|██        | 12/59 [00:05<00:17,  2.65it/s][A
Training:  22%|██▏       | 13/59 [00:06<00:23,  1.93it/s][A
Training:  25%|██▌       | 15/59 [00:06<00:15,  2.79it/s][A
Training:  27%|██▋       | 16/59 [00:07<00:17,  2.50it/s][A
Training:  29%|██▉       | 17/59 [00:07<00:19,  2.11it/s][A
Training:  32%|███▏      | 19/59 [00:08<00:13,  3.05it/s][A
Training:  34%|███▍      | 20/59 [00:08<00:14,  2.70it/s][A
Training:  36%|███▌      | 21/59 [00:0

Epoch: 37/37 - Loss: 1.9169 - Accuracy: 0.9517



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:02<00:14,  2.05s/it][A
 38%|███▊      | 3/8 [00:02<00:02,  1.75it/s][A
 62%|██████▎   | 5/8 [00:03<00:01,  1.65it/s][A
100%|██████████| 8/8 [00:03<00:00,  2.18it/s][A
Epochs: 100%|██████████| 37/37 [16:52<00:00, 27.35s/it]


Val Loss: 2.0898 - Val Accuracy: 0.9413
Saving best model...


[32m[I 2023-12-14 23:37:33,481][0m Trial 3 finished with value: 0.9413145780563354 and parameters: {'loss_learning_rate': 0.0008525339180252597, 'learning_rate': 0.0006513527804929251, 'weight_decay': 0.0038208248001045425, 'epsilon': 3.3362510582155838e-09, 'batch_size': 237, 'epochs': 37}. Best is trial 3 with value: 0.9413145780563354.[0m


Learning rate for Loss: 0.0002370798530328366
Learning rate: 0.04652611547988512
Weight decay: 0.0017584196529739696
Epsilon: 2.517132219206721e-09
Batch size: 77
Number of epochs: 24


Epochs:   0%|          | 0/24 [00:00<?, ?it/s]
Training:   0%|          | 0/182 [00:00<?, ?it/s][A
Training:   1%|          | 1/182 [00:01<03:00,  1.00it/s][A
Training:   3%|▎         | 5/182 [00:01<00:45,  3.93it/s][A
Training:   4%|▍         | 7/182 [00:01<00:31,  5.55it/s][A
Training:   5%|▍         | 9/182 [00:01<00:31,  5.46it/s][A
Training:   6%|▌         | 11/182 [00:02<00:24,  7.00it/s][A
Training:   7%|▋         | 13/182 [00:02<00:28,  5.88it/s][A
Training:   8%|▊         | 15/182 [00:02<00:22,  7.49it/s][A
Training:   9%|▉         | 17/182 [00:03<00:27,  6.08it/s][A
Training:  12%|█▏        | 21/182 [00:03<00:23,  6.81it/s][A
Training:  14%|█▎        | 25/182 [00:04<00:19,  8.05it/s][A
Training:  15%|█▍        | 27/182 [00:04<00:16,  9.25it/s][A
Training:  16%|█▌        | 29/182 [00:04<00:20,  7.53it/s][A
Training:  17%|█▋        | 31/182 [00:04<00:17,  8.40it/s][A
Training:  18%|█▊        | 33/182 [00:05<00:20,  7.45it/s][A
Training:  19%|█▊        | 34/182 [0

Epoch: 1/24 - Loss: 15.1249 - Accuracy: 0.8359



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:20,  1.09it/s][A
 22%|██▏       | 5/23 [00:01<00:04,  4.16it/s][A
 39%|███▉      | 9/23 [00:01<00:02,  6.01it/s][A
 48%|████▊     | 11/23 [00:01<00:01,  7.48it/s][A
 57%|█████▋    | 13/23 [00:02<00:01,  6.68it/s][A
 65%|██████▌   | 15/23 [00:02<00:01,  7.76it/s][A
 74%|███████▍  | 17/23 [00:02<00:00,  7.03it/s][A
 83%|████████▎ | 19/23 [00:02<00:00,  8.16it/s][A
100%|██████████| 23/23 [00:03<00:00,  6.57it/s][A
Epochs:   4%|▍         | 1/24 [00:26<10:15, 26.76s/it]

Val Loss: 4.1052 - Val Accuracy: 0.8684



Training:   0%|          | 0/182 [00:00<?, ?it/s][A
Training:   1%|          | 1/182 [00:00<02:25,  1.24it/s][A
Training:   2%|▏         | 4/182 [00:00<00:33,  5.38it/s][A
Training:   3%|▎         | 6/182 [00:01<00:34,  5.13it/s][A
Training:   4%|▍         | 8/182 [00:01<00:24,  7.01it/s][A
Training:   5%|▌         | 10/182 [00:01<00:30,  5.55it/s][A
Training:   7%|▋         | 12/182 [00:02<00:23,  7.30it/s][A
Training:   8%|▊         | 14/182 [00:02<00:26,  6.37it/s][A
Training:   9%|▉         | 17/182 [00:02<00:26,  6.26it/s][A
Training:  10%|█         | 19/182 [00:03<00:21,  7.73it/s][A
Training:  12%|█▏        | 21/182 [00:03<00:24,  6.48it/s][A
Training:  14%|█▎        | 25/182 [00:04<00:24,  6.48it/s][A
Training:  16%|█▌        | 29/182 [00:04<00:21,  7.16it/s][A
Training:  17%|█▋        | 31/182 [00:04<00:18,  8.13it/s][A
Training:  18%|█▊        | 33/182 [00:05<00:20,  7.31it/s][A
Training:  20%|█▉        | 36/182 [00:05<00:15,  9.62it/s][A
Training:  21%|██   

Epoch: 2/24 - Loss: 4.3561 - Accuracy: 0.8918



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:19,  1.15it/s][A
  9%|▊         | 2/23 [00:01<00:09,  2.18it/s][A
 22%|██▏       | 5/23 [00:01<00:03,  4.82it/s][A
 26%|██▌       | 6/23 [00:01<00:03,  5.20it/s][A
 39%|███▉      | 9/23 [00:01<00:02,  6.01it/s][A
 52%|█████▏    | 12/23 [00:02<00:01,  8.73it/s][A
 61%|██████    | 14/23 [00:02<00:01,  6.80it/s][A
 74%|███████▍  | 17/23 [00:02<00:00,  6.86it/s][A
 78%|███████▊  | 18/23 [00:03<00:00,  7.03it/s][A
100%|██████████| 23/23 [00:03<00:00,  6.32it/s][A
Epochs:   8%|▊         | 2/24 [00:53<09:44, 26.58s/it]

Val Loss: 3.8465 - Val Accuracy: 0.9178



Training:   0%|          | 0/182 [00:00<?, ?it/s][A
Training:   1%|          | 1/182 [00:00<02:42,  1.11it/s][A
Training:   2%|▏         | 4/182 [00:01<00:35,  4.98it/s][A
Training:   3%|▎         | 6/182 [00:01<00:33,  5.25it/s][A
Training:   4%|▍         | 8/182 [00:01<00:24,  7.23it/s][A
Training:   5%|▌         | 10/182 [00:01<00:26,  6.51it/s][A
Training:   7%|▋         | 12/182 [00:02<00:22,  7.61it/s][A
Training:   8%|▊         | 14/182 [00:02<00:24,  6.93it/s][A
Training:   9%|▉         | 16/182 [00:02<00:19,  8.30it/s][A
Training:  10%|▉         | 18/182 [00:02<00:24,  6.71it/s][A
Training:  12%|█▏        | 21/182 [00:03<00:26,  6.00it/s][A
Training:  13%|█▎        | 23/182 [00:03<00:21,  7.32it/s][A
Training:  14%|█▎        | 25/182 [00:04<00:24,  6.32it/s][A
Training:  15%|█▌        | 28/182 [00:04<00:17,  8.75it/s][A
Training:  16%|█▋        | 30/182 [00:04<00:22,  6.70it/s][A
Training:  18%|█▊        | 33/182 [00:05<00:22,  6.75it/s][A
Training:  20%|██   

Epoch: 3/24 - Loss: 5.0974 - Accuracy: 0.8864



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:19,  1.12it/s][A
 22%|██▏       | 5/23 [00:01<00:04,  4.05it/s][A
 35%|███▍      | 8/23 [00:01<00:02,  6.82it/s][A
 43%|████▎     | 10/23 [00:01<00:02,  6.32it/s][A
 57%|█████▋    | 13/23 [00:02<00:01,  6.33it/s][A
 74%|███████▍  | 17/23 [00:02<00:00,  6.44it/s][A
 87%|████████▋ | 20/23 [00:03<00:00,  8.53it/s][A
100%|██████████| 23/23 [00:03<00:00,  6.33it/s][A
Epochs:  12%|█▎        | 3/24 [01:20<09:25, 26.91s/it]

Val Loss: 15.1558 - Val Accuracy: 0.8546



Training:   0%|          | 0/182 [00:00<?, ?it/s][A
Training:   1%|          | 1/182 [00:00<02:38,  1.14it/s][A
Training:   1%|          | 2/182 [00:01<01:20,  2.25it/s][A
Training:   2%|▏         | 4/182 [00:01<00:36,  4.85it/s][A
Training:   3%|▎         | 5/182 [00:01<00:38,  4.61it/s][A
Training:   3%|▎         | 6/182 [00:01<00:34,  5.15it/s][A
Training:   5%|▍         | 9/182 [00:01<00:25,  6.77it/s][A
Training:   6%|▌         | 11/182 [00:01<00:19,  8.59it/s][A
Training:   7%|▋         | 13/182 [00:02<00:23,  7.28it/s][A
Training:   8%|▊         | 15/182 [00:02<00:19,  8.44it/s][A
Training:   9%|▉         | 17/182 [00:02<00:22,  7.21it/s][A
Training:  10%|▉         | 18/182 [00:03<00:24,  6.56it/s][A
Training:  11%|█         | 20/182 [00:03<00:19,  8.25it/s][A
Training:  12%|█▏        | 22/182 [00:03<00:23,  6.71it/s][A
Training:  13%|█▎        | 24/182 [00:03<00:19,  7.92it/s][A
Training:  14%|█▍        | 26/182 [00:04<00:24,  6.34it/s][A
Training:  15%|█▌     

Epoch: 4/24 - Loss: 5.6503 - Accuracy: 0.8937



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:20,  1.07it/s][A
 17%|█▋        | 4/23 [00:01<00:04,  4.69it/s][A
 26%|██▌       | 6/23 [00:01<00:03,  5.33it/s][A
 39%|███▉      | 9/23 [00:01<00:02,  5.39it/s][A
 52%|█████▏    | 12/23 [00:02<00:01,  7.90it/s][A
 61%|██████    | 14/23 [00:02<00:01,  6.37it/s][A
 74%|███████▍  | 17/23 [00:03<00:01,  5.66it/s][A
100%|██████████| 23/23 [00:03<00:00,  6.14it/s][A
Epochs:  17%|█▋        | 4/24 [01:48<09:05, 27.26s/it]

Val Loss: 4.5510 - Val Accuracy: 0.8848



Training:   0%|          | 0/182 [00:00<?, ?it/s][A
Training:   1%|          | 1/182 [00:00<02:59,  1.01it/s][A
Training:   2%|▏         | 3/182 [00:01<00:53,  3.35it/s][A
Training:   3%|▎         | 5/182 [00:01<00:41,  4.24it/s][A
Training:   4%|▍         | 8/182 [00:01<00:23,  7.52it/s][A
Training:   5%|▌         | 10/182 [00:02<00:27,  6.23it/s][A
Training:   7%|▋         | 13/182 [00:02<00:27,  6.19it/s][A
Training:   8%|▊         | 15/182 [00:02<00:22,  7.28it/s][A
Training:   9%|▉         | 17/182 [00:02<00:22,  7.23it/s][A
Training:  10%|█         | 19/182 [00:03<00:21,  7.48it/s][A
Training:  12%|█▏        | 21/182 [00:03<00:21,  7.47it/s][A
Training:  13%|█▎        | 23/182 [00:03<00:19,  8.15it/s][A
Training:  14%|█▎        | 25/182 [00:04<00:22,  6.91it/s][A
Training:  15%|█▌        | 28/182 [00:04<00:16,  9.44it/s][A
Training:  16%|█▋        | 30/182 [00:04<00:22,  6.74it/s][A
Training:  18%|█▊        | 33/182 [00:05<00:23,  6.34it/s][A
Training:  20%|█▉   

Epoch: 5/24 - Loss: 5.4300 - Accuracy: 0.8914



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:18,  1.22it/s][A
 17%|█▋        | 4/23 [00:00<00:03,  5.49it/s][A
 26%|██▌       | 6/23 [00:01<00:03,  5.36it/s][A
 39%|███▉      | 9/23 [00:01<00:02,  5.86it/s][A
 48%|████▊     | 11/23 [00:01<00:01,  7.50it/s][A
 57%|█████▋    | 13/23 [00:02<00:01,  6.25it/s][A
 65%|██████▌   | 15/23 [00:02<00:01,  7.69it/s][A
 74%|███████▍  | 17/23 [00:02<00:00,  6.69it/s][A
 78%|███████▊  | 18/23 [00:03<00:00,  6.13it/s][A
 87%|████████▋ | 20/23 [00:03<00:00,  7.35it/s][A
 91%|█████████▏| 21/23 [00:03<00:00,  6.76it/s][A
100%|██████████| 23/23 [00:03<00:00,  6.22it/s][A
Epochs:  21%|██        | 5/24 [02:16<08:42, 27.51s/it]

Val Loss: 13.4321 - Val Accuracy: 0.9336



Training:   0%|          | 0/182 [00:00<?, ?it/s][A
Training:   1%|          | 1/182 [00:00<02:28,  1.22it/s][A
Training:   2%|▏         | 3/182 [00:00<00:47,  3.75it/s][A
Training:   3%|▎         | 5/182 [00:01<00:38,  4.66it/s][A
Training:   4%|▍         | 8/182 [00:01<00:21,  8.14it/s][A
Training:   5%|▌         | 10/182 [00:01<00:28,  6.00it/s][A
Training:   7%|▋         | 12/182 [00:02<00:22,  7.73it/s][A
Training:   8%|▊         | 14/182 [00:02<00:27,  6.16it/s][A
Training:   9%|▉         | 16/182 [00:02<00:22,  7.42it/s][A
Training:  10%|▉         | 18/182 [00:02<00:22,  7.20it/s][A
Training:  11%|█         | 20/182 [00:03<00:18,  8.69it/s][A
Training:  12%|█▏        | 22/182 [00:03<00:24,  6.44it/s][A
Training:  14%|█▎        | 25/182 [00:03<00:23,  6.78it/s][A
Training:  15%|█▌        | 28/182 [00:04<00:17,  8.98it/s][A
Training:  16%|█▋        | 30/182 [00:04<00:18,  8.34it/s][A
Training:  18%|█▊        | 33/182 [00:04<00:19,  7.63it/s][A
Training:  20%|██   

Epoch: 6/24 - Loss: 12.8389 - Accuracy: 0.8885



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:16,  1.34it/s][A
 17%|█▋        | 4/23 [00:00<00:03,  5.69it/s][A
 26%|██▌       | 6/23 [00:01<00:02,  5.78it/s][A
 35%|███▍      | 8/23 [00:01<00:01,  7.79it/s][A
 43%|████▎     | 10/23 [00:01<00:02,  6.18it/s][A
 52%|█████▏    | 12/23 [00:01<00:01,  7.97it/s][A
 61%|██████    | 14/23 [00:02<00:01,  6.71it/s][A
 70%|██████▉   | 16/23 [00:02<00:00,  7.44it/s][A
 78%|███████▊  | 18/23 [00:02<00:00,  6.66it/s][A
 83%|████████▎ | 19/23 [00:03<00:00,  6.64it/s][A
100%|██████████| 23/23 [00:03<00:00,  6.63it/s][A
Epochs:  25%|██▌       | 6/24 [02:42<08:09, 27.21s/it]

Val Loss: 29.3560 - Val Accuracy: 0.8554



Training:   0%|          | 0/182 [00:00<?, ?it/s][A
Training:   1%|          | 1/182 [00:00<02:07,  1.42it/s][A
Training:   1%|          | 2/182 [00:00<01:10,  2.56it/s][A
Training:   3%|▎         | 5/182 [00:01<00:33,  5.30it/s][A
Training:   4%|▍         | 8/182 [00:01<00:19,  9.01it/s][A
Training:   5%|▌         | 10/182 [00:01<00:25,  6.76it/s][A
Training:   7%|▋         | 13/182 [00:02<00:24,  6.94it/s][A
Training:   8%|▊         | 15/182 [00:02<00:20,  8.21it/s][A
Training:   9%|▉         | 17/182 [00:02<00:22,  7.24it/s][A
Training:  10%|▉         | 18/182 [00:02<00:21,  7.50it/s][A
Training:  11%|█         | 20/182 [00:02<00:17,  9.17it/s][A
Training:  12%|█▏        | 22/182 [00:03<00:23,  6.95it/s][A
Training:  13%|█▎        | 24/182 [00:03<00:19,  7.90it/s][A
Training:  14%|█▍        | 26/182 [00:03<00:21,  7.23it/s][A
Training:  15%|█▌        | 28/182 [00:03<00:17,  8.65it/s][A
Training:  16%|█▋        | 30/182 [00:04<00:22,  6.75it/s][A
Training:  18%|█▊   

Epoch: 7/24 - Loss: 6.5128 - Accuracy: 0.9064



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:17,  1.28it/s][A
 22%|██▏       | 5/23 [00:01<00:03,  4.68it/s][A
 35%|███▍      | 8/23 [00:01<00:01,  7.82it/s][A
 43%|████▎     | 10/23 [00:01<00:02,  6.34it/s][A
 52%|█████▏    | 12/23 [00:01<00:01,  7.69it/s][A
 61%|██████    | 14/23 [00:02<00:01,  6.54it/s][A
 74%|███████▍  | 17/23 [00:02<00:01,  5.97it/s][A
 83%|████████▎ | 19/23 [00:03<00:00,  7.34it/s][A
100%|██████████| 23/23 [00:03<00:00,  6.52it/s][A
Epochs:  29%|██▉       | 7/24 [03:09<07:41, 27.14s/it]

Val Loss: 6.2474 - Val Accuracy: 0.9246



Training:   0%|          | 0/182 [00:00<?, ?it/s][A
Training:   1%|          | 1/182 [00:00<02:56,  1.02it/s][A
Training:   1%|          | 2/182 [00:01<01:23,  2.17it/s][A
Training:   2%|▏         | 4/182 [00:01<00:37,  4.80it/s][A
Training:   3%|▎         | 6/182 [00:01<00:29,  5.90it/s][A
Training:   5%|▍         | 9/182 [00:01<00:29,  5.87it/s][A
Training:   6%|▌         | 11/182 [00:02<00:23,  7.23it/s][A
Training:   7%|▋         | 13/182 [00:02<00:26,  6.42it/s][A
Training:   8%|▊         | 15/182 [00:02<00:24,  6.74it/s][A
Training:   9%|▉         | 17/182 [00:03<00:25,  6.51it/s][A
Training:  10%|█         | 19/182 [00:03<00:22,  7.23it/s][A
Training:  12%|█▏        | 21/182 [00:03<00:23,  6.92it/s][A
Training:  13%|█▎        | 23/182 [00:03<00:22,  6.94it/s][A
Training:  14%|█▎        | 25/182 [00:04<00:22,  6.95it/s][A
Training:  15%|█▍        | 27/182 [00:04<00:18,  8.46it/s][A
Training:  16%|█▌        | 29/182 [00:04<00:20,  7.53it/s][A
Training:  17%|█▋    

Epoch: 8/24 - Loss: 11.2202 - Accuracy: 0.8974



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:19,  1.13it/s][A
 17%|█▋        | 4/23 [00:01<00:03,  4.96it/s][A
 26%|██▌       | 6/23 [00:01<00:03,  4.74it/s][A
 39%|███▉      | 9/23 [00:01<00:02,  5.35it/s][A
 57%|█████▋    | 13/23 [00:02<00:01,  5.88it/s][A
 74%|███████▍  | 17/23 [00:03<00:00,  6.41it/s][A
100%|██████████| 23/23 [00:03<00:00,  6.24it/s][A
Epochs:  33%|███▎      | 8/24 [03:37<07:17, 27.34s/it]

Val Loss: 13.2463 - Val Accuracy: 0.8822



Training:   0%|          | 0/182 [00:00<?, ?it/s][A
Training:   1%|          | 1/182 [00:01<03:03,  1.01s/it][A
Training:   1%|          | 2/182 [00:01<01:26,  2.09it/s][A
Training:   2%|▏         | 4/182 [00:01<00:38,  4.59it/s][A
Training:   3%|▎         | 6/182 [00:01<00:35,  4.95it/s][A
Training:   5%|▍         | 9/182 [00:02<00:30,  5.65it/s][A
Training:   6%|▌         | 11/182 [00:02<00:23,  7.26it/s][A
Training:   7%|▋         | 13/182 [00:02<00:27,  6.16it/s][A
Training:   9%|▉         | 16/182 [00:02<00:18,  9.03it/s][A
Training:  10%|▉         | 18/182 [00:03<00:22,  7.36it/s][A
Training:  11%|█         | 20/182 [00:03<00:18,  8.84it/s][A
Training:  12%|█▏        | 22/182 [00:03<00:24,  6.62it/s][A
Training:  14%|█▎        | 25/182 [00:04<00:24,  6.51it/s][A
Training:  15%|█▌        | 28/182 [00:04<00:17,  8.96it/s][A
Training:  16%|█▋        | 30/182 [00:04<00:23,  6.58it/s][A
Training:  18%|█▊        | 32/182 [00:04<00:18,  7.95it/s][A
Training:  19%|█▊    

Epoch: 9/24 - Loss: 5.6538 - Accuracy: 0.9093



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:19,  1.13it/s][A
 13%|█▎        | 3/23 [00:00<00:05,  3.75it/s][A
 22%|██▏       | 5/23 [00:01<00:04,  4.15it/s][A
 39%|███▉      | 9/23 [00:02<00:02,  5.14it/s][A
 52%|█████▏    | 12/23 [00:02<00:01,  7.48it/s][A
 61%|██████    | 14/23 [00:02<00:01,  6.27it/s][A
 74%|███████▍  | 17/23 [00:03<00:00,  6.47it/s][A
100%|██████████| 23/23 [00:03<00:00,  6.15it/s][A
Epochs:  38%|███▊      | 9/24 [04:05<06:51, 27.44s/it]

Val Loss: 3.6608 - Val Accuracy: 0.9201



Training:   0%|          | 0/182 [00:00<?, ?it/s][A
Training:   1%|          | 1/182 [00:00<02:36,  1.16it/s][A
Training:   2%|▏         | 4/182 [00:01<00:36,  4.82it/s][A
Training:   3%|▎         | 6/182 [00:01<00:36,  4.89it/s][A
Training:   5%|▍         | 9/182 [00:01<00:31,  5.55it/s][A
Training:   6%|▌         | 11/182 [00:02<00:24,  6.92it/s][A
Training:   7%|▋         | 13/182 [00:02<00:27,  6.25it/s][A
Training:   8%|▊         | 14/182 [00:02<00:27,  6.21it/s][A
Training:   9%|▉         | 17/182 [00:03<00:26,  6.25it/s][A
Training:  10%|█         | 19/182 [00:03<00:20,  7.79it/s][A
Training:  12%|█▏        | 21/182 [00:03<00:25,  6.42it/s][A
Training:  14%|█▎        | 25/182 [00:04<00:22,  7.12it/s][A
Training:  15%|█▌        | 28/182 [00:04<00:16,  9.38it/s][A
Training:  16%|█▋        | 30/182 [00:04<00:20,  7.60it/s][A
Training:  18%|█▊        | 33/182 [00:05<00:20,  7.35it/s][A
Training:  19%|█▉        | 35/182 [00:05<00:17,  8.60it/s][A
Training:  20%|██   

Epoch: 10/24 - Loss: 6.9451 - Accuracy: 0.9068



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:14,  1.47it/s][A
 13%|█▎        | 3/23 [00:00<00:04,  4.64it/s][A
 22%|██▏       | 5/23 [00:01<00:03,  5.13it/s][A
 30%|███       | 7/23 [00:01<00:02,  7.31it/s][A
 39%|███▉      | 9/23 [00:01<00:02,  6.22it/s][A
 48%|████▊     | 11/23 [00:01<00:01,  8.04it/s][A
 57%|█████▋    | 13/23 [00:02<00:01,  6.04it/s][A
 70%|██████▉   | 16/23 [00:02<00:00,  8.83it/s][A
 78%|███████▊  | 18/23 [00:02<00:00,  6.68it/s][A
100%|██████████| 23/23 [00:03<00:00,  6.60it/s][A
Epochs:  42%|████▏     | 10/24 [04:31<06:20, 27.20s/it]

Val Loss: 7.8517 - Val Accuracy: 0.8952



Training:   0%|          | 0/182 [00:00<?, ?it/s][A
Training:   1%|          | 1/182 [00:00<02:36,  1.16it/s][A
Training:   2%|▏         | 3/182 [00:01<00:52,  3.43it/s][A
Training:   3%|▎         | 5/182 [00:01<00:33,  5.34it/s][A
Training:   3%|▎         | 6/182 [00:01<00:33,  5.25it/s][A
Training:   5%|▍         | 9/182 [00:01<00:24,  7.11it/s][A
Training:   5%|▌         | 10/182 [00:01<00:26,  6.57it/s][A
Training:   7%|▋         | 13/182 [00:02<00:23,  7.28it/s][A
Training:   8%|▊         | 14/182 [00:02<00:24,  6.95it/s][A
Training:   9%|▉         | 16/182 [00:02<00:20,  8.20it/s][A
Training:   9%|▉         | 17/182 [00:02<00:25,  6.59it/s][A
Training:  11%|█         | 20/182 [00:03<00:18,  8.92it/s][A
Training:  12%|█▏        | 21/182 [00:03<00:24,  6.50it/s][A
Training:  13%|█▎        | 23/182 [00:03<00:19,  8.12it/s][A
Training:  14%|█▎        | 25/182 [00:03<00:21,  7.44it/s][A
Training:  14%|█▍        | 26/182 [00:04<00:21,  7.34it/s][A
Training:  15%|█▌    

Epoch: 11/24 - Loss: 9.2746 - Accuracy: 0.8975



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:21,  1.02it/s][A
 22%|██▏       | 5/23 [00:01<00:04,  3.93it/s][A
 39%|███▉      | 9/23 [00:02<00:02,  5.35it/s][A
 52%|█████▏    | 12/23 [00:02<00:01,  7.49it/s][A
 61%|██████    | 14/23 [00:02<00:01,  7.08it/s][A
 74%|███████▍  | 17/23 [00:03<00:01,  5.95it/s][A
100%|██████████| 23/23 [00:03<00:00,  6.06it/s][A
Epochs:  46%|████▌     | 11/24 [04:59<05:54, 27.30s/it]

Val Loss: 4.0288 - Val Accuracy: 0.9187



Training:   0%|          | 0/182 [00:00<?, ?it/s][A
Training:   1%|          | 1/182 [00:00<02:19,  1.29it/s][A
Training:   2%|▏         | 4/182 [00:00<00:30,  5.75it/s][A
Training:   3%|▎         | 6/182 [00:01<00:34,  5.17it/s][A
Training:   4%|▍         | 8/182 [00:01<00:24,  7.12it/s][A
Training:   5%|▌         | 10/182 [00:01<00:30,  5.61it/s][A
Training:   7%|▋         | 12/182 [00:02<00:25,  6.73it/s][A
Training:   8%|▊         | 14/182 [00:02<00:27,  6.21it/s][A
Training:   9%|▉         | 16/182 [00:02<00:21,  7.89it/s][A
Training:  10%|▉         | 18/182 [00:03<00:26,  6.30it/s][A
Training:  11%|█         | 20/182 [00:03<00:20,  7.81it/s][A
Training:  12%|█▏        | 22/182 [00:03<00:25,  6.18it/s][A
Training:  13%|█▎        | 24/182 [00:03<00:20,  7.67it/s][A
Training:  14%|█▍        | 26/182 [00:04<00:21,  7.29it/s][A
Training:  15%|█▌        | 28/182 [00:04<00:18,  8.38it/s][A
Training:  16%|█▋        | 30/182 [00:04<00:18,  8.19it/s][A
Training:  18%|█▊   

Epoch: 12/24 - Loss: 13.1878 - Accuracy: 0.8937



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:16,  1.35it/s][A
  9%|▊         | 2/23 [00:00<00:08,  2.62it/s][A
 22%|██▏       | 5/23 [00:01<00:03,  5.11it/s][A
 26%|██▌       | 6/23 [00:01<00:02,  5.80it/s][A
 39%|███▉      | 9/23 [00:01<00:02,  6.27it/s][A
 43%|████▎     | 10/23 [00:01<00:01,  6.70it/s][A
 57%|█████▋    | 13/23 [00:02<00:01,  6.15it/s][A
 61%|██████    | 14/23 [00:02<00:01,  6.55it/s][A
 74%|███████▍  | 17/23 [00:02<00:00,  6.82it/s][A
 78%|███████▊  | 18/23 [00:03<00:00,  6.73it/s][A
 91%|█████████▏| 21/23 [00:03<00:00,  7.76it/s][A
100%|██████████| 23/23 [00:03<00:00,  6.22it/s][A
Epochs:  50%|█████     | 12/24 [05:27<05:28, 27.36s/it]

Val Loss: 3.2064 - Val Accuracy: 0.9334



Training:   0%|          | 0/182 [00:00<?, ?it/s][A
Training:   1%|          | 1/182 [00:00<02:28,  1.22it/s][A
Training:   2%|▏         | 4/182 [00:01<00:37,  4.78it/s][A
Training:   3%|▎         | 5/182 [00:01<00:38,  4.56it/s][A
Training:   4%|▍         | 7/182 [00:01<00:27,  6.33it/s][A
Training:   4%|▍         | 8/182 [00:01<00:27,  6.38it/s][A
Training:   5%|▍         | 9/182 [00:01<00:28,  6.15it/s][A
Training:   5%|▌         | 10/182 [00:01<00:27,  6.36it/s][A
Training:   6%|▌         | 11/182 [00:02<00:24,  7.05it/s][A
Training:   7%|▋         | 12/182 [00:02<00:24,  6.89it/s][A
Training:   7%|▋         | 13/182 [00:02<00:24,  7.03it/s][A
Training:   8%|▊         | 15/182 [00:02<00:22,  7.50it/s][A
Training:   9%|▉         | 16/182 [00:02<00:21,  7.77it/s][A
Training:   9%|▉         | 17/182 [00:02<00:24,  6.66it/s][A
Training:  10%|█         | 19/182 [00:03<00:21,  7.54it/s][A
Training:  12%|█▏        | 21/182 [00:03<00:22,  7.14it/s][A
Training:  13%|█▎     

Epoch: 13/24 - Loss: 6.6045 - Accuracy: 0.9128



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:19,  1.10it/s][A
 17%|█▋        | 4/23 [00:01<00:03,  5.01it/s][A
 26%|██▌       | 6/23 [00:01<00:03,  4.32it/s][A
 39%|███▉      | 9/23 [00:01<00:02,  5.71it/s][A
 48%|████▊     | 11/23 [00:02<00:01,  6.13it/s][A
 57%|█████▋    | 13/23 [00:02<00:01,  7.31it/s][A
 65%|██████▌   | 15/23 [00:02<00:01,  7.03it/s][A
 74%|███████▍  | 17/23 [00:02<00:00,  7.57it/s][A
 78%|███████▊  | 18/23 [00:03<00:00,  6.52it/s][A
 91%|█████████▏| 21/23 [00:03<00:00,  8.54it/s][A
100%|██████████| 23/23 [00:03<00:00,  6.18it/s][A
Epochs:  54%|█████▍    | 13/24 [05:54<05:00, 27.31s/it]

Val Loss: 5.5943 - Val Accuracy: 0.9325



Training:   0%|          | 0/182 [00:00<?, ?it/s][A
Training:   1%|          | 1/182 [00:00<02:16,  1.33it/s][A
Training:   2%|▏         | 3/182 [00:00<00:43,  4.11it/s][A
Training:   3%|▎         | 5/182 [00:01<00:35,  5.01it/s][A
Training:   3%|▎         | 6/182 [00:01<00:32,  5.39it/s][A
Training:   4%|▍         | 8/182 [00:01<00:23,  7.34it/s][A
Training:   5%|▍         | 9/182 [00:01<00:30,  5.76it/s][A
Training:   5%|▌         | 10/182 [00:02<00:34,  5.04it/s][A
Training:   7%|▋         | 13/182 [00:02<00:23,  7.05it/s][A
Training:   8%|▊         | 14/182 [00:02<00:27,  6.02it/s][A
Training:   9%|▉         | 17/182 [00:02<00:20,  8.19it/s][A
Training:  10%|▉         | 18/182 [00:03<00:30,  5.36it/s][A
Training:  12%|█▏        | 21/182 [00:03<00:19,  8.09it/s][A
Training:  13%|█▎        | 23/182 [00:03<00:23,  6.85it/s][A
Training:  14%|█▍        | 26/182 [00:04<00:24,  6.26it/s][A
Training:  16%|█▋        | 30/182 [00:04<00:21,  7.16it/s][A
Training:  18%|█▊     

Epoch: 14/24 - Loss: 7.0534 - Accuracy: 0.9146



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:17,  1.23it/s][A
 22%|██▏       | 5/23 [00:01<00:04,  4.31it/s][A
 39%|███▉      | 9/23 [00:01<00:02,  5.82it/s][A
 52%|█████▏    | 12/23 [00:01<00:01,  8.26it/s][A
 61%|██████    | 14/23 [00:02<00:01,  7.01it/s][A
 74%|███████▍  | 17/23 [00:02<00:00,  7.10it/s][A
 83%|████████▎ | 19/23 [00:02<00:00,  8.42it/s][A
 91%|█████████▏| 21/23 [00:03<00:00,  8.04it/s][A
100%|██████████| 23/23 [00:03<00:00,  6.62it/s][A
Epochs:  58%|█████▊    | 14/24 [06:20<04:30, 27.05s/it]

Val Loss: 4.1944 - Val Accuracy: 0.9167



Training:   0%|          | 0/182 [00:00<?, ?it/s][A
Training:   1%|          | 1/182 [00:00<02:25,  1.24it/s][A
Training:   2%|▏         | 3/182 [00:00<00:45,  3.91it/s][A
Training:   3%|▎         | 5/182 [00:01<00:42,  4.20it/s][A
Training:   4%|▍         | 8/182 [00:01<00:23,  7.32it/s][A
Training:   5%|▌         | 10/182 [00:02<00:29,  5.80it/s][A
Training:   7%|▋         | 12/182 [00:02<00:24,  7.08it/s][A
Training:   8%|▊         | 14/182 [00:02<00:29,  5.74it/s][A
Training:   9%|▉         | 16/182 [00:02<00:22,  7.34it/s][A
Training:  10%|▉         | 18/182 [00:03<00:24,  6.82it/s][A
Training:  12%|█▏        | 21/182 [00:03<00:22,  7.17it/s][A
Training:  13%|█▎        | 23/182 [00:03<00:19,  8.31it/s][A
Training:  14%|█▎        | 25/182 [00:04<00:25,  6.14it/s][A
Training:  15%|█▌        | 28/182 [00:04<00:18,  8.40it/s][A
Training:  16%|█▋        | 30/182 [00:04<00:23,  6.59it/s][A
Training:  18%|█▊        | 32/182 [00:04<00:18,  8.00it/s][A
Training:  19%|█▊   

Epoch: 15/24 - Loss: 13.1057 - Accuracy: 0.9011



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:21,  1.03it/s][A
 13%|█▎        | 3/23 [00:01<00:05,  3.44it/s][A
 22%|██▏       | 5/23 [00:01<00:04,  3.98it/s][A
 39%|███▉      | 9/23 [00:01<00:02,  5.93it/s][A
 48%|████▊     | 11/23 [00:02<00:01,  7.48it/s][A
 57%|█████▋    | 13/23 [00:02<00:01,  6.74it/s][A
 65%|██████▌   | 15/23 [00:02<00:00,  8.25it/s][A
 74%|███████▍  | 17/23 [00:02<00:00,  7.08it/s][A
 83%|████████▎ | 19/23 [00:03<00:00,  8.43it/s][A
 91%|█████████▏| 21/23 [00:03<00:00,  6.89it/s][A
100%|██████████| 23/23 [00:03<00:00,  6.27it/s][A
Epochs:  62%|██████▎   | 15/24 [06:48<04:04, 27.15s/it]

Val Loss: 4.7383 - Val Accuracy: 0.9170



Training:   0%|          | 0/182 [00:00<?, ?it/s][A
Training:   1%|          | 1/182 [00:00<02:51,  1.05it/s][A
Training:   1%|          | 2/182 [00:01<01:24,  2.14it/s][A
Training:   2%|▏         | 4/182 [00:01<00:37,  4.72it/s][A
Training:   3%|▎         | 6/182 [00:01<00:33,  5.24it/s][A
Training:   5%|▍         | 9/182 [00:01<00:26,  6.47it/s][A
Training:   5%|▌         | 10/182 [00:02<00:26,  6.48it/s][A
Training:   7%|▋         | 13/182 [00:02<00:26,  6.40it/s][A
Training:   8%|▊         | 14/182 [00:02<00:24,  6.76it/s][A
Training:   9%|▉         | 16/182 [00:02<00:19,  8.68it/s][A
Training:  10%|▉         | 18/182 [00:03<00:25,  6.49it/s][A
Training:  11%|█         | 20/182 [00:03<00:19,  8.13it/s][A
Training:  12%|█▏        | 22/182 [00:03<00:25,  6.27it/s][A
Training:  13%|█▎        | 24/182 [00:03<00:20,  7.79it/s][A
Training:  14%|█▍        | 26/182 [00:04<00:25,  6.08it/s][A
Training:  16%|█▌        | 29/182 [00:04<00:26,  5.69it/s][A
Training:  18%|█▊    

Epoch: 16/24 - Loss: 6.1130 - Accuracy: 0.9160



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:01<00:22,  1.01s/it][A
 17%|█▋        | 4/23 [00:01<00:04,  4.54it/s][A
 26%|██▌       | 6/23 [00:01<00:04,  4.05it/s][A
 39%|███▉      | 9/23 [00:02<00:02,  4.91it/s][A
 57%|█████▋    | 13/23 [00:02<00:01,  6.06it/s][A
 70%|██████▉   | 16/23 [00:02<00:00,  7.95it/s][A
 78%|███████▊  | 18/23 [00:03<00:00,  7.24it/s][A
 87%|████████▋ | 20/23 [00:03<00:00,  8.51it/s][A
100%|██████████| 23/23 [00:03<00:00,  6.06it/s][A
Epochs:  67%|██████▋   | 16/24 [07:15<03:39, 27.39s/it]

Val Loss: 5.3986 - Val Accuracy: 0.9119



Training:   0%|          | 0/182 [00:00<?, ?it/s][A
Training:   1%|          | 1/182 [00:00<02:55,  1.03it/s][A
Training:   2%|▏         | 3/182 [00:01<00:53,  3.34it/s][A
Training:   3%|▎         | 5/182 [00:01<00:40,  4.37it/s][A
Training:   4%|▍         | 7/182 [00:01<00:27,  6.48it/s][A
Training:   5%|▍         | 9/182 [00:01<00:30,  5.62it/s][A
Training:   6%|▌         | 11/182 [00:02<00:23,  7.14it/s][A
Training:   7%|▋         | 13/182 [00:02<00:27,  6.16it/s][A
Training:   9%|▉         | 16/182 [00:02<00:18,  9.00it/s][A
Training:  10%|▉         | 18/182 [00:03<00:23,  7.10it/s][A
Training:  12%|█▏        | 21/182 [00:03<00:22,  7.01it/s][A
Training:  14%|█▎        | 25/182 [00:04<00:21,  7.41it/s][A
Training:  15%|█▌        | 28/182 [00:04<00:17,  9.04it/s][A
Training:  16%|█▋        | 30/182 [00:04<00:20,  7.42it/s][A
Training:  18%|█▊        | 32/182 [00:04<00:17,  8.65it/s][A
Training:  19%|█▊        | 34/182 [00:05<00:19,  7.57it/s][A
Training:  20%|█▉    

Epoch: 17/24 - Loss: 13.2674 - Accuracy: 0.9049



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:17,  1.27it/s][A
 22%|██▏       | 5/23 [00:01<00:03,  4.70it/s][A
 35%|███▍      | 8/23 [00:01<00:01,  7.64it/s][A
 43%|████▎     | 10/23 [00:01<00:01,  6.66it/s][A
 57%|█████▋    | 13/23 [00:02<00:01,  6.41it/s][A
 70%|██████▉   | 16/23 [00:02<00:00,  8.86it/s][A
 78%|███████▊  | 18/23 [00:02<00:00,  6.88it/s][A
100%|██████████| 23/23 [00:03<00:00,  6.86it/s][A
Epochs:  71%|███████   | 17/24 [07:43<03:11, 27.31s/it]

Val Loss: 6.2330 - Val Accuracy: 0.9300



Training:   0%|          | 0/182 [00:00<?, ?it/s][A
Training:   1%|          | 1/182 [00:00<02:43,  1.11it/s][A
Training:   1%|          | 2/182 [00:01<01:31,  1.97it/s][A
Training:   3%|▎         | 5/182 [00:01<00:33,  5.21it/s][A
Training:   3%|▎         | 6/182 [00:01<00:36,  4.77it/s][A
Training:   5%|▍         | 9/182 [00:01<00:25,  6.87it/s][A
Training:   5%|▌         | 10/182 [00:02<00:27,  6.23it/s][A
Training:   7%|▋         | 13/182 [00:02<00:20,  8.16it/s][A
Training:   8%|▊         | 14/182 [00:02<00:22,  7.55it/s][A
Training:   9%|▉         | 17/182 [00:02<00:19,  8.51it/s][A
Training:  10%|▉         | 18/182 [00:03<00:23,  7.08it/s][A
Training:  11%|█         | 20/182 [00:03<00:18,  8.98it/s][A
Training:  12%|█▏        | 22/182 [00:03<00:23,  6.85it/s][A
Training:  13%|█▎        | 24/182 [00:03<00:18,  8.59it/s][A
Training:  14%|█▍        | 26/182 [00:04<00:21,  7.15it/s][A
Training:  15%|█▌        | 28/182 [00:04<00:17,  8.59it/s][A
Training:  16%|█▋    

Epoch: 18/24 - Loss: 5.3783 - Accuracy: 0.9136



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:20,  1.06it/s][A
 17%|█▋        | 4/23 [00:01<00:03,  4.82it/s][A
 26%|██▌       | 6/23 [00:01<00:03,  4.82it/s][A
 39%|███▉      | 9/23 [00:01<00:02,  5.56it/s][A
 43%|████▎     | 10/23 [00:02<00:02,  5.93it/s][A
 57%|█████▋    | 13/23 [00:02<00:01,  7.15it/s][A
 61%|██████    | 14/23 [00:02<00:01,  6.24it/s][A
 74%|███████▍  | 17/23 [00:02<00:00,  7.67it/s][A
 78%|███████▊  | 18/23 [00:03<00:00,  6.32it/s][A
 91%|█████████▏| 21/23 [00:03<00:00,  8.72it/s][A
100%|██████████| 23/23 [00:03<00:00,  6.17it/s][A
Epochs:  75%|███████▌  | 18/24 [08:10<02:43, 27.22s/it]

Val Loss: 4.7720 - Val Accuracy: 0.9379



Training:   0%|          | 0/182 [00:00<?, ?it/s][A
Training:   1%|          | 1/182 [00:00<02:03,  1.47it/s][A
Training:   2%|▏         | 3/182 [00:00<00:40,  4.37it/s][A
Training:   3%|▎         | 5/182 [00:01<00:38,  4.60it/s][A
Training:   4%|▍         | 7/182 [00:01<00:25,  6.75it/s][A
Training:   5%|▍         | 9/182 [00:01<00:28,  6.07it/s][A
Training:   6%|▌         | 11/182 [00:01<00:23,  7.36it/s][A
Training:   7%|▋         | 13/182 [00:02<00:25,  6.64it/s][A
Training:   8%|▊         | 15/182 [00:02<00:19,  8.38it/s][A
Training:   9%|▉         | 17/182 [00:02<00:23,  7.14it/s][A
Training:  10%|█         | 19/182 [00:02<00:18,  8.59it/s][A
Training:  12%|█▏        | 21/182 [00:03<00:22,  7.25it/s][A
Training:  13%|█▎        | 23/182 [00:03<00:18,  8.58it/s][A
Training:  14%|█▎        | 25/182 [00:03<00:22,  7.02it/s][A
Training:  15%|█▍        | 27/182 [00:03<00:17,  8.63it/s][A
Training:  16%|█▌        | 29/182 [00:04<00:19,  7.73it/s][A
Training:  17%|█▋    

Epoch: 19/24 - Loss: 16.0206 - Accuracy: 0.9029



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:01<00:22,  1.00s/it][A
 13%|█▎        | 3/23 [00:01<00:06,  3.27it/s][A
 22%|██▏       | 5/23 [00:01<00:04,  4.41it/s][A
 30%|███       | 7/23 [00:01<00:02,  5.84it/s][A
 39%|███▉      | 9/23 [00:01<00:02,  5.85it/s][A
 48%|████▊     | 11/23 [00:02<00:01,  6.69it/s][A
 57%|█████▋    | 13/23 [00:02<00:01,  6.83it/s][A
 65%|██████▌   | 15/23 [00:02<00:01,  6.94it/s][A
 74%|███████▍  | 17/23 [00:02<00:00,  7.75it/s][A
 83%|████████▎ | 19/23 [00:03<00:00,  7.85it/s][A
 91%|█████████▏| 21/23 [00:03<00:00,  8.87it/s][A
100%|██████████| 23/23 [00:03<00:00,  6.29it/s][A
Epochs:  79%|███████▉  | 19/24 [08:36<02:15, 27.08s/it]

Val Loss: 5.7297 - Val Accuracy: 0.9226



Training:   0%|          | 0/182 [00:00<?, ?it/s][A
Training:   1%|          | 1/182 [00:00<02:31,  1.19it/s][A
Training:   2%|▏         | 3/182 [00:00<00:46,  3.85it/s][A
Training:   3%|▎         | 5/182 [00:01<00:40,  4.41it/s][A
Training:   4%|▍         | 8/182 [00:01<00:23,  7.44it/s][A
Training:   5%|▌         | 10/182 [00:01<00:25,  6.74it/s][A
Training:   7%|▋         | 12/182 [00:02<00:21,  7.91it/s][A
Training:   8%|▊         | 14/182 [00:02<00:23,  7.07it/s][A
Training:   9%|▉         | 16/182 [00:02<00:19,  8.44it/s][A
Training:  10%|▉         | 18/182 [00:02<00:23,  6.97it/s][A
Training:  12%|█▏        | 21/182 [00:03<00:25,  6.34it/s][A
Training:  13%|█▎        | 24/182 [00:03<00:18,  8.52it/s][A
Training:  14%|█▍        | 26/182 [00:03<00:21,  7.11it/s][A
Training:  16%|█▌        | 29/182 [00:04<00:21,  7.18it/s][A
Training:  17%|█▋        | 31/182 [00:04<00:17,  8.44it/s][A
Training:  18%|█▊        | 33/182 [00:04<00:20,  7.20it/s][A
Training:  20%|█▉   

Epoch: 20/24 - Loss: 12.6474 - Accuracy: 0.9079



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:16,  1.33it/s][A
  9%|▊         | 2/23 [00:00<00:09,  2.26it/s][A
 22%|██▏       | 5/23 [00:01<00:03,  5.18it/s][A
 26%|██▌       | 6/23 [00:01<00:03,  4.95it/s][A
 39%|███▉      | 9/23 [00:01<00:01,  7.11it/s][A
 43%|████▎     | 10/23 [00:02<00:02,  5.20it/s][A
 57%|█████▋    | 13/23 [00:02<00:01,  7.25it/s][A
 61%|██████    | 14/23 [00:02<00:01,  6.14it/s][A
 74%|███████▍  | 17/23 [00:02<00:00,  7.72it/s][A
 78%|███████▊  | 18/23 [00:03<00:00,  6.72it/s][A
 91%|█████████▏| 21/23 [00:03<00:00,  8.06it/s][A
100%|██████████| 23/23 [00:03<00:00,  6.24it/s][A
Epochs:  83%|████████▎ | 20/24 [09:04<01:48, 27.13s/it]

Val Loss: 8.9219 - Val Accuracy: 0.9161



Training:   0%|          | 0/182 [00:00<?, ?it/s][A
Training:   1%|          | 1/182 [00:00<02:18,  1.30it/s][A
Training:   1%|          | 2/182 [00:00<01:11,  2.52it/s][A
Training:   3%|▎         | 5/182 [00:01<00:33,  5.36it/s][A
Training:   3%|▎         | 6/182 [00:01<00:32,  5.37it/s][A
Training:   4%|▍         | 8/182 [00:01<00:23,  7.27it/s][A
Training:   5%|▍         | 9/182 [00:01<00:27,  6.32it/s][A
Training:   5%|▌         | 10/182 [00:01<00:29,  5.83it/s][A
Training:   7%|▋         | 12/182 [00:02<00:21,  7.84it/s][A
Training:   7%|▋         | 13/182 [00:02<00:25,  6.73it/s][A
Training:   8%|▊         | 14/182 [00:02<00:28,  5.88it/s][A
Training:   9%|▉         | 17/182 [00:02<00:21,  7.64it/s][A
Training:  10%|▉         | 18/182 [00:02<00:21,  7.69it/s][A
Training:  11%|█         | 20/182 [00:03<00:16,  9.85it/s][A
Training:  12%|█▏        | 22/182 [00:03<00:18,  8.68it/s][A
Training:  13%|█▎        | 24/182 [00:03<00:17,  8.93it/s][A
Training:  14%|█▎     

Epoch: 21/24 - Loss: 11.0980 - Accuracy: 0.9160



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:19,  1.14it/s][A
 22%|██▏       | 5/23 [00:01<00:04,  4.09it/s][A
 39%|███▉      | 9/23 [00:01<00:02,  5.60it/s][A
 57%|█████▋    | 13/23 [00:02<00:01,  6.43it/s][A
 74%|███████▍  | 17/23 [00:02<00:00,  7.02it/s][A
 83%|████████▎ | 19/23 [00:03<00:00,  8.16it/s][A
100%|██████████| 23/23 [00:03<00:00,  6.59it/s][A
Epochs:  88%|████████▊ | 21/24 [09:31<01:21, 27.10s/it]

Val Loss: 9.3909 - Val Accuracy: 0.9305



Training:   0%|          | 0/182 [00:00<?, ?it/s][A
Training:   1%|          | 1/182 [00:00<02:54,  1.04it/s][A
Training:   2%|▏         | 3/182 [00:01<00:52,  3.41it/s][A
Training:   3%|▎         | 5/182 [00:01<00:40,  4.33it/s][A
Training:   4%|▍         | 8/182 [00:01<00:24,  7.01it/s][A
Training:   5%|▌         | 10/182 [00:02<00:27,  6.25it/s][A
Training:   7%|▋         | 13/182 [00:02<00:29,  5.83it/s][A
Training:   9%|▉         | 16/182 [00:02<00:20,  8.03it/s][A
Training:  10%|▉         | 18/182 [00:03<00:24,  6.70it/s][A
Training:  12%|█▏        | 21/182 [00:03<00:22,  7.08it/s][A
Training:  14%|█▎        | 25/182 [00:04<00:22,  7.06it/s][A
Training:  16%|█▌        | 29/182 [00:04<00:19,  7.70it/s][A
Training:  18%|█▊        | 32/182 [00:04<00:16,  9.33it/s][A
Training:  19%|█▊        | 34/182 [00:05<00:18,  7.94it/s][A
Training:  20%|██        | 37/182 [00:05<00:21,  6.90it/s][A
Training:  23%|██▎       | 41/182 [00:06<00:20,  7.00it/s][A
Training:  25%|██▍  

Epoch: 22/24 - Loss: 5.3202 - Accuracy: 0.9190



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:20,  1.06it/s][A
 22%|██▏       | 5/23 [00:01<00:04,  4.01it/s][A
 39%|███▉      | 9/23 [00:02<00:02,  5.34it/s][A
 52%|█████▏    | 12/23 [00:02<00:01,  7.53it/s][A
 61%|██████    | 14/23 [00:02<00:01,  6.04it/s][A
 74%|███████▍  | 17/23 [00:03<00:01,  5.96it/s][A
100%|██████████| 23/23 [00:03<00:00,  6.18it/s][A
Epochs:  92%|█████████▏| 22/24 [09:58<00:54, 27.11s/it]

Val Loss: 4.5963 - Val Accuracy: 0.9345



Training:   0%|          | 0/182 [00:00<?, ?it/s][A
Training:   1%|          | 1/182 [00:00<02:58,  1.02it/s][A
Training:   2%|▏         | 3/182 [00:01<00:53,  3.38it/s][A
Training:   3%|▎         | 5/182 [00:01<00:41,  4.31it/s][A
Training:   5%|▍         | 9/182 [00:02<00:31,  5.58it/s][A
Training:   7%|▋         | 12/182 [00:02<00:21,  7.98it/s][A
Training:   8%|▊         | 14/182 [00:02<00:22,  7.56it/s][A
Training:   9%|▉         | 17/182 [00:02<00:21,  7.58it/s][A
Training:  12%|█▏        | 21/182 [00:03<00:19,  8.41it/s][A
Training:  13%|█▎        | 24/182 [00:03<00:15, 10.41it/s][A
Training:  14%|█▍        | 26/182 [00:03<00:16,  9.18it/s][A
Training:  16%|█▌        | 29/182 [00:04<00:18,  8.36it/s][A
Training:  17%|█▋        | 31/182 [00:04<00:16,  9.17it/s][A
Training:  18%|█▊        | 33/182 [00:04<00:18,  8.20it/s][A
Training:  20%|█▉        | 36/182 [00:04<00:13, 10.72it/s][A
Training:  21%|██        | 38/182 [00:05<00:18,  7.77it/s][A
Training:  23%|██▎  

Epoch: 23/24 - Loss: 9.5818 - Accuracy: 0.9134



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:20,  1.08it/s][A
 17%|█▋        | 4/23 [00:01<00:03,  4.95it/s][A
 26%|██▌       | 6/23 [00:01<00:03,  4.28it/s][A
 39%|███▉      | 9/23 [00:02<00:02,  5.12it/s][A
 43%|████▎     | 10/23 [00:02<00:02,  5.50it/s][A
 57%|█████▋    | 13/23 [00:02<00:01,  6.86it/s][A
 61%|██████    | 14/23 [00:02<00:01,  6.69it/s][A
 74%|███████▍  | 17/23 [00:02<00:00,  7.55it/s][A
 78%|███████▊  | 18/23 [00:03<00:00,  7.41it/s][A
100%|██████████| 23/23 [00:03<00:00,  6.30it/s][A
Epochs:  96%|█████████▌| 23/24 [10:24<00:26, 26.95s/it]

Val Loss: 4.0654 - Val Accuracy: 0.9359



Training:   0%|          | 0/182 [00:00<?, ?it/s][A
Training:   1%|          | 1/182 [00:00<02:29,  1.21it/s][A
Training:   1%|          | 2/182 [00:01<01:37,  1.84it/s][A
Training:   3%|▎         | 5/182 [00:01<00:38,  4.63it/s][A
Training:   3%|▎         | 6/182 [00:01<00:36,  4.80it/s][A
Training:   4%|▍         | 8/182 [00:01<00:25,  6.81it/s][A
Training:   5%|▍         | 9/182 [00:02<00:30,  5.73it/s][A
Training:   5%|▌         | 10/182 [00:02<00:27,  6.23it/s][A
Training:   7%|▋         | 12/182 [00:02<00:19,  8.61it/s][A
Training:   8%|▊         | 14/182 [00:02<00:24,  6.73it/s][A
Training:   9%|▉         | 16/182 [00:02<00:19,  8.72it/s][A
Training:  10%|▉         | 18/182 [00:03<00:22,  7.39it/s][A
Training:  11%|█         | 20/182 [00:03<00:17,  9.13it/s][A
Training:  12%|█▏        | 22/182 [00:03<00:24,  6.58it/s][A
Training:  13%|█▎        | 24/182 [00:03<00:19,  8.28it/s][A
Training:  14%|█▍        | 26/182 [00:04<00:23,  6.56it/s][A
Training:  15%|█▌     

Epoch: 24/24 - Loss: 7.7355 - Accuracy: 0.9148



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:17,  1.28it/s][A
 22%|██▏       | 5/23 [00:01<00:04,  4.49it/s][A
 35%|███▍      | 8/23 [00:01<00:01,  7.51it/s][A
 43%|████▎     | 10/23 [00:01<00:02,  6.14it/s][A
 57%|█████▋    | 13/23 [00:02<00:01,  6.07it/s][A
 61%|██████    | 14/23 [00:02<00:01,  6.11it/s][A
 74%|███████▍  | 17/23 [00:02<00:00,  6.32it/s][A
100%|██████████| 23/23 [00:03<00:00,  6.28it/s][A
Epochs: 100%|██████████| 24/24 [10:52<00:00, 27.17s/it]


Val Loss: 11.4136 - Val Accuracy: 0.9277


[32m[I 2023-12-14 23:48:26,399][0m Trial 4 finished with value: 0.9277133345603943 and parameters: {'loss_learning_rate': 0.0002370798530328366, 'learning_rate': 0.04652611547988512, 'weight_decay': 0.0017584196529739696, 'epsilon': 2.517132219206721e-09, 'batch_size': 77, 'epochs': 24}. Best is trial 3 with value: 0.9413145780563354.[0m


Learning rate for Loss: 0.00011285498412772518
Learning rate: 0.0004870321928878792
Weight decay: 0.002212783214071621
Epsilon: 1.0513313545777498e-09
Batch size: 238
Number of epochs: 23


Epochs:   0%|          | 0/23 [00:00<?, ?it/s]
Training:   0%|          | 0/59 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/59 [00:02<01:56,  2.01s/it][A
Training:   3%|▎         | 2/59 [00:02<00:51,  1.11it/s][A
Training:   5%|▌         | 3/59 [00:02<00:30,  1.85it/s][A
Training:   8%|▊         | 5/59 [00:03<00:33,  1.63it/s][A
Training:  10%|█         | 6/59 [00:03<00:25,  2.11it/s][A
Training:  14%|█▎        | 8/59 [00:03<00:15,  3.39it/s][A
Training:  15%|█▌        | 9/59 [00:05<00:27,  1.85it/s][A
Training:  17%|█▋        | 10/59 [00:05<00:21,  2.29it/s][A
Training:  19%|█▊        | 11/59 [00:05<00:17,  2.73it/s][A
Training:  22%|██▏       | 13/59 [00:07<00:24,  1.85it/s][A
Training:  25%|██▌       | 15/59 [00:07<00:15,  2.79it/s][A
Training:  29%|██▉       | 17/59 [00:08<00:22,  1.90it/s][A
Training:  31%|███       | 18/59 [00:08<00:18,  2.24it/s][A
Training:  32%|███▏      | 19/59 [00:09<00:14,  2.68it/s][A
Training:  34%|███▍      | 20/59 [00:09<00:12,  3.18it

Epoch: 1/23 - Loss: 12.4188 - Accuracy: 0.8055



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:02<00:13,  1.98s/it][A
 25%|██▌       | 2/8 [00:02<00:05,  1.13it/s][A
 62%|██████▎   | 5/8 [00:03<00:01,  1.63it/s][A
100%|██████████| 8/8 [00:03<00:00,  2.06it/s][A
Epochs:   0%|          | 0/23 [00:27<?, ?it/s]
[32m[I 2023-12-14 23:48:54,906][0m Trial 5 pruned. [0m


Val Loss: 6.4371 - Val Accuracy: 0.8765
Learning rate for Loss: 0.007580120623994243
Learning rate: 0.04884100913157098
Weight decay: 0.0011280209385660376
Epsilon: 2.849586798033918e-09
Batch size: 99
Number of epochs: 54


Epochs:   0%|          | 0/54 [00:00<?, ?it/s]
Training:   0%|          | 0/142 [00:00<?, ?it/s][A
Training:   1%|          | 1/142 [00:00<02:12,  1.06it/s][A
Training:   2%|▏         | 3/142 [00:01<00:40,  3.47it/s][A
Training:   4%|▎         | 5/142 [00:01<00:36,  3.73it/s][A
Training:   5%|▍         | 7/142 [00:01<00:24,  5.59it/s][A
Training:   6%|▋         | 9/142 [00:02<00:30,  4.41it/s][A
Training:   7%|▋         | 10/142 [00:02<00:27,  4.76it/s][A
Training:   8%|▊         | 12/142 [00:02<00:20,  6.48it/s][A
Training:  10%|▉         | 14/142 [00:03<00:26,  4.87it/s][A
Training:  11%|█         | 15/142 [00:03<00:23,  5.40it/s][A
Training:  12%|█▏        | 17/142 [00:03<00:24,  5.10it/s][A
Training:  13%|█▎        | 18/142 [00:03<00:26,  4.77it/s][A
Training:  15%|█▍        | 21/142 [00:04<00:21,  5.50it/s][A
Training:  15%|█▌        | 22/142 [00:04<00:24,  4.92it/s][A
Training:  18%|█▊        | 25/142 [00:05<00:20,  5.67it/s][A
Training:  18%|█▊        | 26/142 [00

Epoch: 1/54 - Loss: 30.4702 - Accuracy: 0.7879



  0%|          | 0/18 [00:00<?, ?it/s][A
  6%|▌         | 1/18 [00:01<00:17,  1.00s/it][A
 22%|██▏       | 4/18 [00:01<00:03,  4.60it/s][A
 33%|███▎      | 6/18 [00:01<00:02,  4.18it/s][A
 50%|█████     | 9/18 [00:02<00:02,  4.17it/s][A
 61%|██████    | 11/18 [00:02<00:01,  5.47it/s][A
 72%|███████▏  | 13/18 [00:03<00:01,  4.59it/s][A
 83%|████████▎ | 15/18 [00:03<00:00,  5.75it/s][A
100%|██████████| 18/18 [00:03<00:00,  4.68it/s][A
Epochs:   2%|▏         | 1/54 [00:27<24:23, 27.62s/it]

Val Loss: 3.3259 - Val Accuracy: 0.9119



Training:   0%|          | 0/142 [00:00<?, ?it/s][A
Training:   1%|          | 1/142 [00:00<02:14,  1.05it/s][A
Training:   2%|▏         | 3/142 [00:01<00:40,  3.47it/s][A
Training:   4%|▎         | 5/142 [00:01<00:34,  3.97it/s][A
Training:   6%|▌         | 8/142 [00:01<00:18,  7.19it/s][A
Training:   7%|▋         | 10/142 [00:02<00:23,  5.68it/s][A
Training:   8%|▊         | 12/142 [00:02<00:18,  6.98it/s][A
Training:  10%|▉         | 14/142 [00:02<00:22,  5.81it/s][A
Training:  11%|█▏        | 16/142 [00:02<00:17,  7.41it/s][A
Training:  13%|█▎        | 18/142 [00:03<00:25,  4.78it/s][A
Training:  14%|█▍        | 20/142 [00:03<00:19,  6.11it/s][A
Training:  15%|█▌        | 22/142 [00:04<00:23,  5.15it/s][A
Training:  17%|█▋        | 24/142 [00:04<00:17,  6.62it/s][A
Training:  18%|█▊        | 26/142 [00:04<00:20,  5.64it/s][A
Training:  20%|██        | 29/142 [00:05<00:21,  5.24it/s][A
Training:  22%|██▏       | 31/142 [00:05<00:17,  6.38it/s][A
Training:  23%|██▎  

Epoch: 2/54 - Loss: 3.5572 - Accuracy: 0.8918



  0%|          | 0/18 [00:00<?, ?it/s][A
  6%|▌         | 1/18 [00:01<00:20,  1.23s/it][A
 22%|██▏       | 4/18 [00:01<00:03,  3.84it/s][A
 33%|███▎      | 6/18 [00:01<00:03,  3.55it/s][A
 44%|████▍     | 8/18 [00:02<00:01,  5.08it/s][A
 56%|█████▌    | 10/18 [00:02<00:01,  4.22it/s][A
 67%|██████▋   | 12/18 [00:02<00:01,  5.65it/s][A
 78%|███████▊  | 14/18 [00:03<00:00,  4.80it/s][A
 89%|████████▉ | 16/18 [00:03<00:00,  6.30it/s][A
100%|██████████| 18/18 [00:04<00:00,  4.44it/s][A
Epochs:   2%|▏         | 1/54 [00:55<48:42, 55.14s/it]
[32m[I 2023-12-14 23:49:50,703][0m Trial 6 pruned. [0m


Val Loss: 6.0302 - Val Accuracy: 0.5205
Learning rate for Loss: 0.00017237051393809033
Learning rate: 0.005231337095494607
Weight decay: 0.0010085209986501272
Epsilon: 1.0952706936186941e-08
Batch size: 148
Number of epochs: 98


Epochs:   0%|          | 0/98 [00:00<?, ?it/s]
Training:   0%|          | 0/95 [00:00<?, ?it/s][A
Training:   1%|          | 1/95 [00:01<02:26,  1.56s/it][A
Training:   4%|▍         | 4/95 [00:01<00:29,  3.08it/s][A
Training:   6%|▋         | 6/95 [00:02<00:33,  2.65it/s][A
Training:   8%|▊         | 8/95 [00:02<00:23,  3.67it/s][A
Training:   9%|▉         | 9/95 [00:03<00:30,  2.79it/s][A
Training:  11%|█         | 10/95 [00:03<00:25,  3.35it/s][A
Training:  12%|█▏        | 11/95 [00:03<00:22,  3.79it/s][A
Training:  14%|█▎        | 13/95 [00:04<00:27,  2.97it/s][A
Training:  16%|█▌        | 15/95 [00:04<00:18,  4.25it/s][A
Training:  18%|█▊        | 17/95 [00:05<00:22,  3.48it/s][A
Training:  20%|██        | 19/95 [00:05<00:16,  4.53it/s][A
Training:  22%|██▏       | 21/95 [00:06<00:19,  3.73it/s][A
Training:  24%|██▍       | 23/95 [00:06<00:16,  4.27it/s][A
Training:  26%|██▋       | 25/95 [00:07<00:17,  3.96it/s][A
Training:  28%|██▊       | 27/95 [00:07<00:18,  3.74

Epoch: 1/98 - Loss: 11.1684 - Accuracy: 0.8109



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:16,  1.46s/it][A
 17%|█▋        | 2/12 [00:01<00:06,  1.48it/s][A
 33%|███▎      | 4/12 [00:01<00:02,  3.52it/s][A
 50%|█████     | 6/12 [00:02<00:02,  2.72it/s][A
 67%|██████▋   | 8/12 [00:02<00:01,  3.95it/s][A
 75%|███████▌  | 9/12 [00:03<00:01,  2.67it/s][A
100%|██████████| 12/12 [00:03<00:00,  3.16it/s][A
Epochs:   1%|          | 1/98 [00:27<44:18, 27.41s/it]

Val Loss: 4.8096 - Val Accuracy: 0.9088



Training:   0%|          | 0/95 [00:00<?, ?it/s][A
Training:   1%|          | 1/95 [00:01<02:04,  1.33s/it][A
Training:   4%|▍         | 4/95 [00:01<00:26,  3.40it/s][A
Training:   6%|▋         | 6/95 [00:02<00:32,  2.75it/s][A
Training:   9%|▉         | 9/95 [00:03<00:31,  2.70it/s][A
Training:  14%|█▎        | 13/95 [00:04<00:25,  3.26it/s][A
Training:  16%|█▌        | 15/95 [00:04<00:19,  4.11it/s][A
Training:  18%|█▊        | 17/95 [00:05<00:24,  3.18it/s][A
Training:  20%|██        | 19/95 [00:05<00:18,  4.10it/s][A
Training:  22%|██▏       | 21/95 [00:06<00:23,  3.20it/s][A
Training:  24%|██▍       | 23/95 [00:06<00:17,  4.21it/s][A
Training:  26%|██▋       | 25/95 [00:07<00:21,  3.24it/s][A
Training:  28%|██▊       | 27/95 [00:07<00:16,  4.17it/s][A
Training:  31%|███       | 29/95 [00:08<00:18,  3.48it/s][A
Training:  35%|███▍      | 33/95 [00:09<00:16,  3.81it/s][A
Training:  39%|███▉      | 37/95 [00:10<00:14,  3.93it/s][A
Training:  42%|████▏     | 40/95 [00

Epoch: 2/98 - Loss: 3.9307 - Accuracy: 0.9159



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:14,  1.30s/it][A
 25%|██▌       | 3/12 [00:01<00:03,  2.64it/s][A
 42%|████▏     | 5/12 [00:02<00:02,  2.36it/s][A
 58%|█████▊    | 7/12 [00:02<00:01,  3.74it/s][A
 75%|███████▌  | 9/12 [00:03<00:00,  3.20it/s][A
100%|██████████| 12/12 [00:03<00:00,  3.34it/s][A
Epochs:   2%|▏         | 2/98 [00:54<43:41, 27.31s/it]

Val Loss: 3.5265 - Val Accuracy: 0.9210



Training:   0%|          | 0/95 [00:00<?, ?it/s][A
Training:   1%|          | 1/95 [00:01<02:17,  1.46s/it][A
Training:   4%|▍         | 4/95 [00:01<00:29,  3.08it/s][A
Training:   6%|▋         | 6/95 [00:02<00:32,  2.73it/s][A
Training:   8%|▊         | 8/95 [00:02<00:23,  3.76it/s][A
Training:   9%|▉         | 9/95 [00:03<00:28,  3.00it/s][A
Training:  11%|█         | 10/95 [00:03<00:25,  3.30it/s][A
Training:  14%|█▎        | 13/95 [00:04<00:20,  3.96it/s][A
Training:  15%|█▍        | 14/95 [00:04<00:23,  3.52it/s][A
Training:  17%|█▋        | 16/95 [00:04<00:16,  4.82it/s][A
Training:  18%|█▊        | 17/95 [00:05<00:20,  3.89it/s][A
Training:  19%|█▉        | 18/95 [00:05<00:22,  3.45it/s][A
Training:  21%|██        | 20/95 [00:05<00:15,  4.89it/s][A
Training:  22%|██▏       | 21/95 [00:06<00:19,  3.86it/s][A
Training:  23%|██▎       | 22/95 [00:06<00:20,  3.57it/s][A
Training:  25%|██▌       | 24/95 [00:06<00:14,  4.98it/s][A
Training:  26%|██▋       | 25/95 [00:

Epoch: 3/98 - Loss: 3.2840 - Accuracy: 0.9138



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:15,  1.41s/it][A
 17%|█▋        | 2/12 [00:01<00:06,  1.52it/s][A
 33%|███▎      | 4/12 [00:01<00:02,  3.14it/s][A
 42%|████▏     | 5/12 [00:02<00:03,  2.12it/s][A
 58%|█████▊    | 7/12 [00:02<00:01,  3.52it/s][A
 75%|███████▌  | 9/12 [00:03<00:00,  3.16it/s][A
100%|██████████| 12/12 [00:03<00:00,  3.19it/s][A
Epochs:   3%|▎         | 3/98 [01:21<43:00, 27.16s/it]

Val Loss: 3.1341 - Val Accuracy: 0.9246



Training:   0%|          | 0/95 [00:00<?, ?it/s][A
Training:   1%|          | 1/95 [00:01<02:14,  1.43s/it][A
Training:   4%|▍         | 4/95 [00:01<00:27,  3.27it/s][A
Training:   6%|▋         | 6/95 [00:02<00:32,  2.78it/s][A
Training:   9%|▉         | 9/95 [00:03<00:25,  3.32it/s][A
Training:  12%|█▏        | 11/95 [00:03<00:19,  4.33it/s][A
Training:  14%|█▎        | 13/95 [00:04<00:23,  3.55it/s][A
Training:  16%|█▌        | 15/95 [00:04<00:19,  4.21it/s][A
Training:  18%|█▊        | 17/95 [00:05<00:23,  3.37it/s][A
Training:  20%|██        | 19/95 [00:05<00:17,  4.42it/s][A
Training:  22%|██▏       | 21/95 [00:06<00:20,  3.54it/s][A
Training:  24%|██▍       | 23/95 [00:06<00:16,  4.35it/s][A
Training:  26%|██▋       | 25/95 [00:07<00:18,  3.79it/s][A
Training:  28%|██▊       | 27/95 [00:07<00:15,  4.47it/s][A
Training:  31%|███       | 29/95 [00:08<00:18,  3.55it/s][A
Training:  33%|███▎      | 31/95 [00:08<00:15,  4.20it/s][A
Training:  35%|███▍      | 33/95 [00

Epoch: 4/98 - Loss: 2.8671 - Accuracy: 0.9325



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:14,  1.29s/it][A
 25%|██▌       | 3/12 [00:01<00:03,  2.68it/s][A
 42%|████▏     | 5/12 [00:02<00:02,  2.54it/s][A
 50%|█████     | 6/12 [00:02<00:01,  3.15it/s][A
 75%|███████▌  | 9/12 [00:03<00:00,  3.18it/s][A
100%|██████████| 12/12 [00:03<00:00,  3.43it/s][A
Epochs:   4%|▍         | 4/98 [01:48<42:04, 26.86s/it]

Val Loss: 2.6797 - Val Accuracy: 0.9379



Training:   0%|          | 0/95 [00:00<?, ?it/s][A
Training:   1%|          | 1/95 [00:01<02:15,  1.45s/it][A
Training:   3%|▎         | 3/95 [00:01<00:38,  2.37it/s][A
Training:   5%|▌         | 5/95 [00:02<00:36,  2.45it/s][A
Training:   6%|▋         | 6/95 [00:02<00:31,  2.82it/s][A
Training:   9%|▉         | 9/95 [00:03<00:26,  3.24it/s][A
Training:  11%|█         | 10/95 [00:03<00:23,  3.56it/s][A
Training:  12%|█▏        | 11/95 [00:03<00:20,  4.15it/s][A
Training:  13%|█▎        | 12/95 [00:03<00:17,  4.82it/s][A
Training:  14%|█▎        | 13/95 [00:04<00:25,  3.27it/s][A
Training:  15%|█▍        | 14/95 [00:04<00:21,  3.70it/s][A
Training:  16%|█▌        | 15/95 [00:04<00:17,  4.48it/s][A
Training:  18%|█▊        | 17/95 [00:05<00:18,  4.27it/s][A
Training:  19%|█▉        | 18/95 [00:05<00:22,  3.43it/s][A
Training:  21%|██        | 20/95 [00:05<00:15,  4.83it/s][A
Training:  22%|██▏       | 21/95 [00:06<00:18,  3.98it/s][A
Training:  23%|██▎       | 22/95 [00:

Epoch: 5/98 - Loss: 2.9383 - Accuracy: 0.9212



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:16,  1.50s/it][A
 33%|███▎      | 4/12 [00:01<00:02,  3.17it/s][A
 50%|█████     | 6/12 [00:02<00:02,  2.76it/s][A
100%|██████████| 12/12 [00:03<00:00,  3.39it/s][A
Epochs:   5%|▌         | 5/98 [02:15<41:48, 26.97s/it]

Val Loss: 2.6023 - Val Accuracy: 0.9064



Training:   0%|          | 0/95 [00:00<?, ?it/s][A
Training:   1%|          | 1/95 [00:01<02:15,  1.44s/it][A
Training:   2%|▏         | 2/95 [00:01<01:07,  1.37it/s][A
Training:   4%|▍         | 4/95 [00:01<00:28,  3.20it/s][A
Training:   5%|▌         | 5/95 [00:02<00:34,  2.58it/s][A
Training:   6%|▋         | 6/95 [00:02<00:30,  2.95it/s][A
Training:   8%|▊         | 8/95 [00:02<00:18,  4.68it/s][A
Training:   9%|▉         | 9/95 [00:03<00:26,  3.26it/s][A
Training:  11%|█         | 10/95 [00:03<00:25,  3.32it/s][A
Training:  13%|█▎        | 12/95 [00:03<00:16,  5.06it/s][A
Training:  14%|█▎        | 13/95 [00:04<00:24,  3.36it/s][A
Training:  15%|█▍        | 14/95 [00:04<00:22,  3.61it/s][A
Training:  17%|█▋        | 16/95 [00:04<00:14,  5.40it/s][A
Training:  18%|█▊        | 17/95 [00:05<00:26,  2.99it/s][A
Training:  19%|█▉        | 18/95 [00:05<00:21,  3.56it/s][A
Training:  21%|██        | 20/95 [00:05<00:14,  5.14it/s][A
Training:  22%|██▏       | 21/95 [00:06

Epoch: 6/98 - Loss: 2.5319 - Accuracy: 0.9333



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:14,  1.34s/it][A
 25%|██▌       | 3/12 [00:01<00:03,  2.54it/s][A
 42%|████▏     | 5/12 [00:02<00:03,  2.24it/s][A
 67%|██████▋   | 8/12 [00:02<00:00,  4.19it/s][A
 83%|████████▎ | 10/12 [00:03<00:00,  3.32it/s][A
100%|██████████| 12/12 [00:03<00:00,  3.24it/s][A
Epochs:   6%|▌         | 6/98 [02:42<41:35, 27.13s/it]

Val Loss: 2.5147 - Val Accuracy: 0.9379



Training:   0%|          | 0/95 [00:00<?, ?it/s][A
Training:   1%|          | 1/95 [00:01<01:55,  1.23s/it][A
Training:   4%|▍         | 4/95 [00:01<00:25,  3.55it/s][A
Training:   6%|▋         | 6/95 [00:02<00:31,  2.82it/s][A
Training:   7%|▋         | 7/95 [00:02<00:25,  3.40it/s][A
Training:   9%|▉         | 9/95 [00:03<00:27,  3.17it/s][A
Training:  11%|█         | 10/95 [00:03<00:23,  3.68it/s][A
Training:  12%|█▏        | 11/95 [00:03<00:19,  4.35it/s][A
Training:  13%|█▎        | 12/95 [00:03<00:17,  4.73it/s][A
Training:  14%|█▎        | 13/95 [00:04<00:26,  3.12it/s][A
Training:  16%|█▌        | 15/95 [00:04<00:18,  4.44it/s][A
Training:  18%|█▊        | 17/95 [00:05<00:21,  3.59it/s][A
Training:  20%|██        | 19/95 [00:05<00:17,  4.24it/s][A
Training:  22%|██▏       | 21/95 [00:06<00:20,  3.65it/s][A
Training:  24%|██▍       | 23/95 [00:06<00:16,  4.49it/s][A
Training:  26%|██▋       | 25/95 [00:06<00:18,  3.83it/s][A
Training:  27%|██▋       | 26/95 [00:

Epoch: 7/98 - Loss: 2.4265 - Accuracy: 0.9403



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:14,  1.31s/it][A
 25%|██▌       | 3/12 [00:01<00:03,  2.61it/s][A
 42%|████▏     | 5/12 [00:02<00:02,  2.36it/s][A
 67%|██████▋   | 8/12 [00:02<00:00,  4.35it/s][A
100%|██████████| 12/12 [00:03<00:00,  3.30it/s][A
Epochs:   7%|▋         | 7/98 [03:09<40:57, 27.01s/it]

Val Loss: 2.5530 - Val Accuracy: 0.9304



Training:   0%|          | 0/95 [00:00<?, ?it/s][A
Training:   1%|          | 1/95 [00:01<02:32,  1.63s/it][A
Training:   3%|▎         | 3/95 [00:01<00:43,  2.09it/s][A
Training:   5%|▌         | 5/95 [00:02<00:40,  2.21it/s][A
Training:   7%|▋         | 7/95 [00:02<00:25,  3.51it/s][A
Training:   9%|▉         | 9/95 [00:03<00:27,  3.11it/s][A
Training:  11%|█         | 10/95 [00:03<00:23,  3.65it/s][A
Training:  13%|█▎        | 12/95 [00:03<00:16,  5.03it/s][A
Training:  15%|█▍        | 14/95 [00:04<00:19,  4.26it/s][A
Training:  16%|█▌        | 15/95 [00:04<00:17,  4.53it/s][A
Training:  17%|█▋        | 16/95 [00:04<00:15,  5.15it/s][A
Training:  18%|█▊        | 17/95 [00:05<00:22,  3.42it/s][A
Training:  19%|█▉        | 18/95 [00:05<00:18,  4.06it/s][A
Training:  20%|██        | 19/95 [00:05<00:18,  4.16it/s][A
Training:  22%|██▏       | 21/95 [00:06<00:19,  3.72it/s][A
Training:  23%|██▎       | 22/95 [00:06<00:18,  4.05it/s][A
Training:  24%|██▍       | 23/95 [00:

Epoch: 8/98 - Loss: 2.4709 - Accuracy: 0.9357



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:14,  1.31s/it][A
 17%|█▋        | 2/12 [00:01<00:06,  1.49it/s][A
 33%|███▎      | 4/12 [00:01<00:02,  3.53it/s][A
 50%|█████     | 6/12 [00:02<00:02,  2.78it/s][A
 67%|██████▋   | 8/12 [00:02<00:00,  4.10it/s][A
 75%|███████▌  | 9/12 [00:03<00:01,  2.74it/s][A
100%|██████████| 12/12 [00:03<00:00,  3.26it/s][A
Epochs:   8%|▊         | 8/98 [03:36<40:47, 27.19s/it]

Val Loss: 2.4230 - Val Accuracy: 0.9200



Training:   0%|          | 0/95 [00:00<?, ?it/s][A
Training:   1%|          | 1/95 [00:01<02:26,  1.56s/it][A
Training:   5%|▌         | 5/95 [00:02<00:37,  2.37it/s][A
Training:   7%|▋         | 7/95 [00:02<00:24,  3.52it/s][A
Training:   9%|▉         | 9/95 [00:03<00:29,  2.91it/s][A
Training:  12%|█▏        | 11/95 [00:03<00:21,  3.93it/s][A
Training:  14%|█▎        | 13/95 [00:04<00:25,  3.24it/s][A
Training:  16%|█▌        | 15/95 [00:04<00:18,  4.35it/s][A
Training:  18%|█▊        | 17/95 [00:05<00:22,  3.53it/s][A
Training:  22%|██▏       | 21/95 [00:06<00:19,  3.89it/s][A
Training:  26%|██▋       | 25/95 [00:07<00:18,  3.78it/s][A
Training:  28%|██▊       | 27/95 [00:07<00:14,  4.55it/s][A
Training:  31%|███       | 29/95 [00:08<00:17,  3.83it/s][A
Training:  33%|███▎      | 31/95 [00:08<00:13,  4.75it/s][A
Training:  35%|███▍      | 33/95 [00:09<00:15,  3.94it/s][A
Training:  38%|███▊      | 36/95 [00:09<00:11,  5.12it/s][A
Training:  39%|███▉      | 37/95 [00

Epoch: 9/98 - Loss: 2.2132 - Accuracy: 0.9401



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:14,  1.33s/it][A
 25%|██▌       | 3/12 [00:01<00:03,  2.33it/s][A
 42%|████▏     | 5/12 [00:02<00:02,  2.41it/s][A
 58%|█████▊    | 7/12 [00:02<00:01,  3.83it/s][A
100%|██████████| 12/12 [00:03<00:00,  3.46it/s][A
Epochs:   9%|▉         | 9/98 [04:03<40:13, 27.11s/it]

Val Loss: 2.3934 - Val Accuracy: 0.9315



Training:   0%|          | 0/95 [00:00<?, ?it/s][A
Training:   1%|          | 1/95 [00:01<02:04,  1.32s/it][A
Training:   2%|▏         | 2/95 [00:01<01:04,  1.45it/s][A
Training:   4%|▍         | 4/95 [00:01<00:27,  3.29it/s][A
Training:   5%|▌         | 5/95 [00:02<00:35,  2.56it/s][A
Training:   6%|▋         | 6/95 [00:02<00:31,  2.81it/s][A
Training:   8%|▊         | 8/95 [00:02<00:18,  4.65it/s][A
Training:   9%|▉         | 9/95 [00:03<00:27,  3.17it/s][A
Training:  11%|█         | 10/95 [00:03<00:25,  3.35it/s][A
Training:  13%|█▎        | 12/95 [00:03<00:16,  5.06it/s][A
Training:  14%|█▎        | 13/95 [00:04<00:23,  3.48it/s][A
Training:  15%|█▍        | 14/95 [00:04<00:21,  3.73it/s][A
Training:  16%|█▌        | 15/95 [00:04<00:18,  4.41it/s][A
Training:  18%|█▊        | 17/95 [00:05<00:22,  3.49it/s][A
Training:  20%|██        | 19/95 [00:05<00:17,  4.30it/s][A
Training:  22%|██▏       | 21/95 [00:06<00:19,  3.81it/s][A
Training:  23%|██▎       | 22/95 [00:06

Epoch: 10/98 - Loss: 2.1333 - Accuracy: 0.9407



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:15,  1.44s/it][A
 17%|█▋        | 2/12 [00:01<00:06,  1.52it/s][A
 33%|███▎      | 4/12 [00:01<00:02,  3.54it/s][A
 50%|█████     | 6/12 [00:02<00:02,  2.88it/s][A
 67%|██████▋   | 8/12 [00:02<00:00,  4.37it/s][A
100%|██████████| 12/12 [00:03<00:00,  3.30it/s][A
Epochs:  10%|█         | 10/98 [04:31<40:00, 27.28s/it]

Val Loss: 2.2609 - Val Accuracy: 0.9420



Training:   0%|          | 0/95 [00:00<?, ?it/s][A
Training:   1%|          | 1/95 [00:01<02:08,  1.37s/it][A
Training:   3%|▎         | 3/95 [00:01<00:37,  2.48it/s][A
Training:   5%|▌         | 5/95 [00:02<00:34,  2.61it/s][A
Training:   7%|▋         | 7/95 [00:02<00:22,  3.96it/s][A
Training:   9%|▉         | 9/95 [00:03<00:25,  3.39it/s][A
Training:  12%|█▏        | 11/95 [00:03<00:18,  4.63it/s][A
Training:  13%|█▎        | 12/95 [00:03<00:16,  5.18it/s][A
Training:  14%|█▎        | 13/95 [00:04<00:24,  3.31it/s][A
Training:  15%|█▍        | 14/95 [00:04<00:21,  3.74it/s][A
Training:  17%|█▋        | 16/95 [00:04<00:15,  5.07it/s][A
Training:  18%|█▊        | 17/95 [00:05<00:24,  3.22it/s][A
Training:  19%|█▉        | 18/95 [00:05<00:20,  3.70it/s][A
Training:  20%|██        | 19/95 [00:05<00:17,  4.41it/s][A
Training:  22%|██▏       | 21/95 [00:06<00:21,  3.50it/s][A
Training:  24%|██▍       | 23/95 [00:06<00:15,  4.54it/s][A
Training:  26%|██▋       | 25/95 [00:

Epoch: 11/98 - Loss: 2.1811 - Accuracy: 0.9394



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:17,  1.62s/it][A
 25%|██▌       | 3/12 [00:01<00:04,  2.19it/s][A
 42%|████▏     | 5/12 [00:02<00:03,  2.23it/s][A
 75%|███████▌  | 9/12 [00:03<00:01,  2.92it/s][A
100%|██████████| 12/12 [00:03<00:00,  3.08it/s][A
Epochs:  11%|█         | 11/98 [04:58<39:30, 27.25s/it]

Val Loss: 2.4810 - Val Accuracy: 0.9307



Training:   0%|          | 0/95 [00:00<?, ?it/s][A
Training:   1%|          | 1/95 [00:01<01:50,  1.18s/it][A
Training:   2%|▏         | 2/95 [00:01<00:53,  1.73it/s][A
Training:   4%|▍         | 4/95 [00:01<00:22,  3.98it/s][A
Training:   6%|▋         | 6/95 [00:02<00:31,  2.79it/s][A
Training:   8%|▊         | 8/95 [00:02<00:21,  4.14it/s][A
Training:   9%|▉         | 9/95 [00:03<00:27,  3.10it/s][A
Training:  12%|█▏        | 11/95 [00:03<00:18,  4.55it/s][A
Training:  14%|█▎        | 13/95 [00:04<00:23,  3.53it/s][A
Training:  15%|█▍        | 14/95 [00:04<00:20,  3.87it/s][A
Training:  17%|█▋        | 16/95 [00:04<00:14,  5.35it/s][A
Training:  18%|█▊        | 17/95 [00:05<00:22,  3.50it/s][A
Training:  19%|█▉        | 18/95 [00:05<00:19,  3.98it/s][A
Training:  22%|██▏       | 21/95 [00:05<00:18,  3.93it/s][A
Training:  24%|██▍       | 23/95 [00:06<00:13,  5.25it/s][A
Training:  26%|██▋       | 25/95 [00:06<00:17,  3.95it/s][A
Training:  27%|██▋       | 26/95 [00:0

Epoch: 12/98 - Loss: 2.0668 - Accuracy: 0.9418



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:13,  1.24s/it][A
 17%|█▋        | 2/12 [00:01<00:06,  1.65it/s][A
 33%|███▎      | 4/12 [00:01<00:02,  3.63it/s][A
 42%|████▏     | 5/12 [00:02<00:02,  2.43it/s][A
 58%|█████▊    | 7/12 [00:02<00:01,  4.00it/s][A
 75%|███████▌  | 9/12 [00:03<00:00,  3.25it/s][A
100%|██████████| 12/12 [00:03<00:00,  3.32it/s][A
Epochs:  12%|█▏        | 12/98 [05:25<38:50, 27.10s/it]

Val Loss: 2.1985 - Val Accuracy: 0.9401



Training:   0%|          | 0/95 [00:00<?, ?it/s][A
Training:   1%|          | 1/95 [00:01<02:16,  1.45s/it][A
Training:   2%|▏         | 2/95 [00:01<01:01,  1.52it/s][A
Training:   5%|▌         | 5/95 [00:02<00:36,  2.48it/s][A
Training:   7%|▋         | 7/95 [00:02<00:23,  3.68it/s][A
Training:   9%|▉         | 9/95 [00:03<00:26,  3.21it/s][A
Training:  11%|█         | 10/95 [00:03<00:24,  3.43it/s][A
Training:  13%|█▎        | 12/95 [00:03<00:16,  4.88it/s][A
Training:  14%|█▎        | 13/95 [00:04<00:24,  3.32it/s][A
Training:  15%|█▍        | 14/95 [00:04<00:24,  3.37it/s][A
Training:  18%|█▊        | 17/95 [00:05<00:21,  3.69it/s][A
Training:  19%|█▉        | 18/95 [00:05<00:21,  3.56it/s][A
Training:  21%|██        | 20/95 [00:05<00:15,  4.84it/s][A
Training:  22%|██▏       | 21/95 [00:06<00:21,  3.49it/s][A
Training:  23%|██▎       | 22/95 [00:06<00:20,  3.50it/s][A
Training:  26%|██▋       | 25/95 [00:07<00:18,  3.82it/s][A
Training:  27%|██▋       | 26/95 [00:

Epoch: 13/98 - Loss: 2.1061 - Accuracy: 0.9419



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:14,  1.34s/it][A
 25%|██▌       | 3/12 [00:01<00:03,  2.57it/s][A
 42%|████▏     | 5/12 [00:02<00:02,  2.76it/s][A
 50%|█████     | 6/12 [00:02<00:01,  3.25it/s][A
 67%|██████▋   | 8/12 [00:02<00:00,  4.93it/s][A
 75%|███████▌  | 9/12 [00:03<00:00,  3.27it/s][A
100%|██████████| 12/12 [00:03<00:00,  3.48it/s][A
Epochs:  13%|█▎        | 13/98 [05:53<38:41, 27.31s/it]

Val Loss: 2.3867 - Val Accuracy: 0.9246



Training:   0%|          | 0/95 [00:00<?, ?it/s][A
Training:   1%|          | 1/95 [00:01<02:14,  1.43s/it][A
Training:   2%|▏         | 2/95 [00:01<01:01,  1.51it/s][A
Training:   5%|▌         | 5/95 [00:02<00:37,  2.38it/s][A
Training:   7%|▋         | 7/95 [00:02<00:24,  3.56it/s][A
Training:   9%|▉         | 9/95 [00:03<00:29,  2.88it/s][A
Training:  12%|█▏        | 11/95 [00:03<00:21,  3.99it/s][A
Training:  14%|█▎        | 13/95 [00:04<00:25,  3.24it/s][A
Training:  16%|█▌        | 15/95 [00:04<00:18,  4.42it/s][A
Training:  18%|█▊        | 17/95 [00:05<00:22,  3.43it/s][A
Training:  21%|██        | 20/95 [00:05<00:14,  5.21it/s][A
Training:  23%|██▎       | 22/95 [00:06<00:18,  3.90it/s][A
Training:  25%|██▌       | 24/95 [00:06<00:14,  4.88it/s][A
Training:  27%|██▋       | 26/95 [00:07<00:18,  3.67it/s][A
Training:  31%|███       | 29/95 [00:08<00:18,  3.50it/s][A
Training:  33%|███▎      | 31/95 [00:08<00:14,  4.34it/s][A
Training:  35%|███▍      | 33/95 [00:

Epoch: 14/98 - Loss: 2.0376 - Accuracy: 0.9427



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:15,  1.39s/it][A
 42%|████▏     | 5/12 [00:02<00:02,  2.61it/s][A
 58%|█████▊    | 7/12 [00:02<00:01,  3.81it/s][A
 75%|███████▌  | 9/12 [00:03<00:00,  3.15it/s][A
100%|██████████| 12/12 [00:03<00:00,  3.50it/s][A
Epochs:  14%|█▍        | 14/98 [06:20<38:00, 27.14s/it]

Val Loss: 2.0926 - Val Accuracy: 0.9424



Training:   0%|          | 0/95 [00:00<?, ?it/s][A
Training:   1%|          | 1/95 [00:01<02:09,  1.37s/it][A
Training:   3%|▎         | 3/95 [00:01<00:37,  2.42it/s][A
Training:   5%|▌         | 5/95 [00:02<00:37,  2.41it/s][A
Training:   6%|▋         | 6/95 [00:02<00:31,  2.81it/s][A
Training:   8%|▊         | 8/95 [00:02<00:19,  4.46it/s][A
Training:  11%|█         | 10/95 [00:03<00:26,  3.26it/s][A
Training:  14%|█▎        | 13/95 [00:04<00:23,  3.56it/s][A
Training:  15%|█▍        | 14/95 [00:04<00:22,  3.56it/s][A
Training:  18%|█▊        | 17/95 [00:05<00:19,  3.94it/s][A
Training:  19%|█▉        | 18/95 [00:05<00:20,  3.72it/s][A
Training:  21%|██        | 20/95 [00:05<00:14,  5.04it/s][A
Training:  22%|██▏       | 21/95 [00:06<00:18,  4.00it/s][A
Training:  23%|██▎       | 22/95 [00:06<00:19,  3.77it/s][A
Training:  25%|██▌       | 24/95 [00:06<00:14,  4.89it/s][A
Training:  26%|██▋       | 25/95 [00:07<00:17,  4.00it/s][A
Training:  27%|██▋       | 26/95 [00:

Epoch: 15/98 - Loss: 1.9268 - Accuracy: 0.9442



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:13,  1.21s/it][A
 42%|████▏     | 5/12 [00:02<00:02,  2.77it/s][A
 58%|█████▊    | 7/12 [00:02<00:01,  3.82it/s][A
 75%|███████▌  | 9/12 [00:03<00:00,  3.10it/s][A
100%|██████████| 12/12 [00:03<00:00,  3.53it/s][A
Epochs:  15%|█▌        | 15/98 [06:46<37:21, 27.01s/it]

Val Loss: 2.2162 - Val Accuracy: 0.9355



Training:   0%|          | 0/95 [00:00<?, ?it/s][A
Training:   1%|          | 1/95 [00:01<02:08,  1.36s/it][A
Training:   3%|▎         | 3/95 [00:01<00:37,  2.43it/s][A
Training:   5%|▌         | 5/95 [00:02<00:38,  2.34it/s][A
Training:   8%|▊         | 8/95 [00:02<00:19,  4.51it/s][A
Training:  11%|█         | 10/95 [00:03<00:24,  3.53it/s][A
Training:  13%|█▎        | 12/95 [00:03<00:18,  4.37it/s][A
Training:  14%|█▎        | 13/95 [00:03<00:21,  3.80it/s][A
Training:  16%|█▌        | 15/95 [00:04<00:19,  4.06it/s][A
Training:  18%|█▊        | 17/95 [00:04<00:19,  4.10it/s][A
Training:  19%|█▉        | 18/95 [00:04<00:16,  4.62it/s][A
Training:  20%|██        | 19/95 [00:05<00:21,  3.47it/s][A
Training:  22%|██▏       | 21/95 [00:05<00:16,  4.46it/s][A
Training:  24%|██▍       | 23/95 [00:06<00:21,  3.41it/s][A
Training:  26%|██▋       | 25/95 [00:06<00:16,  4.28it/s][A
Training:  27%|██▋       | 26/95 [00:06<00:14,  4.79it/s][A
Training:  28%|██▊       | 27/95 [00

Epoch: 16/98 - Loss: 1.9861 - Accuracy: 0.9419



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:14,  1.31s/it][A
 42%|████▏     | 5/12 [00:02<00:02,  2.68it/s][A
 67%|██████▋   | 8/12 [00:02<00:00,  4.69it/s][A
100%|██████████| 12/12 [00:03<00:00,  3.44it/s][A
Epochs:  16%|█▋        | 16/98 [07:13<36:49, 26.95s/it]

Val Loss: 2.0865 - Val Accuracy: 0.9345



Training:   0%|          | 0/95 [00:00<?, ?it/s][A
Training:   1%|          | 1/95 [00:01<01:54,  1.21s/it][A
Training:   2%|▏         | 2/95 [00:01<00:52,  1.77it/s][A
Training:   4%|▍         | 4/95 [00:01<00:23,  3.89it/s][A
Training:   5%|▌         | 5/95 [00:02<00:32,  2.75it/s][A
Training:   6%|▋         | 6/95 [00:02<00:28,  3.10it/s][A
Training:   7%|▋         | 7/95 [00:02<00:23,  3.77it/s][A
Training:   9%|▉         | 9/95 [00:03<00:28,  3.05it/s][A
Training:  11%|█         | 10/95 [00:03<00:24,  3.44it/s][A
Training:  13%|█▎        | 12/95 [00:03<00:16,  4.89it/s][A
Training:  14%|█▎        | 13/95 [00:04<00:25,  3.19it/s][A
Training:  16%|█▌        | 15/95 [00:04<00:19,  4.17it/s][A
Training:  18%|█▊        | 17/95 [00:05<00:20,  3.83it/s][A
Training:  20%|██        | 19/95 [00:05<00:16,  4.49it/s][A
Training:  22%|██▏       | 21/95 [00:06<00:18,  3.96it/s][A
Training:  24%|██▍       | 23/95 [00:06<00:15,  4.71it/s][A
Training:  26%|██▋       | 25/95 [00:07

Epoch: 17/98 - Loss: 1.8920 - Accuracy: 0.9439



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:16,  1.48s/it][A
 25%|██▌       | 3/12 [00:01<00:03,  2.27it/s][A
 42%|████▏     | 5/12 [00:02<00:02,  2.63it/s][A
 67%|██████▋   | 8/12 [00:02<00:00,  4.54it/s][A
 75%|███████▌  | 9/12 [00:03<00:00,  3.24it/s][A
100%|██████████| 12/12 [00:03<00:00,  3.56it/s][A
Epochs:  17%|█▋        | 17/98 [07:40<36:15, 26.86s/it]

Val Loss: 2.7656 - Val Accuracy: 0.9338



Training:   0%|          | 0/95 [00:00<?, ?it/s][A
Training:   1%|          | 1/95 [00:01<02:28,  1.58s/it][A
Training:   2%|▏         | 2/95 [00:01<01:06,  1.39it/s][A
Training:   4%|▍         | 4/95 [00:01<00:28,  3.21it/s][A
Training:   5%|▌         | 5/95 [00:02<00:38,  2.36it/s][A
Training:   9%|▉         | 9/95 [00:03<00:26,  3.25it/s][A
Training:  12%|█▏        | 11/95 [00:03<00:19,  4.36it/s][A
Training:  14%|█▎        | 13/95 [00:04<00:24,  3.30it/s][A
Training:  16%|█▌        | 15/95 [00:04<00:18,  4.34it/s][A
Training:  18%|█▊        | 17/95 [00:05<00:24,  3.15it/s][A
Training:  21%|██        | 20/95 [00:05<00:15,  4.86it/s][A
Training:  23%|██▎       | 22/95 [00:06<00:19,  3.83it/s][A
Training:  26%|██▋       | 25/95 [00:07<00:20,  3.47it/s][A
Training:  28%|██▊       | 27/95 [00:07<00:15,  4.25it/s][A
Training:  31%|███       | 29/95 [00:08<00:19,  3.46it/s][A
Training:  33%|███▎      | 31/95 [00:08<00:14,  4.37it/s][A
Training:  35%|███▍      | 33/95 [00:

Epoch: 18/98 - Loss: 1.9553 - Accuracy: 0.9423



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:14,  1.29s/it][A
 17%|█▋        | 2/12 [00:01<00:06,  1.56it/s][A
 42%|████▏     | 5/12 [00:02<00:02,  2.83it/s][A
 50%|█████     | 6/12 [00:02<00:01,  3.43it/s][A
100%|██████████| 12/12 [00:03<00:00,  3.66it/s][A
Epochs:  18%|█▊        | 18/98 [08:07<36:07, 27.10s/it]

Val Loss: 2.2149 - Val Accuracy: 0.8747



Training:   0%|          | 0/95 [00:00<?, ?it/s][A
Training:   1%|          | 1/95 [00:01<02:09,  1.38s/it][A
Training:   3%|▎         | 3/95 [00:01<00:37,  2.42it/s][A
Training:   5%|▌         | 5/95 [00:02<00:37,  2.38it/s][A
Training:   6%|▋         | 6/95 [00:02<00:31,  2.80it/s][A
Training:   8%|▊         | 8/95 [00:02<00:20,  4.23it/s][A
Training:   9%|▉         | 9/95 [00:03<00:29,  2.92it/s][A
Training:  11%|█         | 10/95 [00:03<00:28,  2.96it/s][A
Training:  13%|█▎        | 12/95 [00:03<00:18,  4.50it/s][A
Training:  14%|█▎        | 13/95 [00:04<00:23,  3.45it/s][A
Training:  15%|█▍        | 14/95 [00:04<00:24,  3.32it/s][A
Training:  17%|█▋        | 16/95 [00:04<00:15,  4.98it/s][A
Training:  18%|█▊        | 17/95 [00:05<00:21,  3.67it/s][A
Training:  19%|█▉        | 18/95 [00:05<00:24,  3.11it/s][A
Training:  20%|██        | 19/95 [00:05<00:20,  3.72it/s][A
Training:  22%|██▏       | 21/95 [00:06<00:17,  4.26it/s][A
Training:  23%|██▎       | 22/95 [00:0

Epoch: 19/98 - Loss: 1.9440 - Accuracy: 0.9405



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:15,  1.42s/it][A
 17%|█▋        | 2/12 [00:01<00:06,  1.48it/s][A
 42%|████▏     | 5/12 [00:02<00:02,  2.59it/s][A
 58%|█████▊    | 7/12 [00:02<00:01,  4.00it/s][A
100%|██████████| 12/12 [00:03<00:00,  3.69it/s][A
Epochs:  19%|█▉        | 19/98 [08:35<35:43, 27.13s/it]

Val Loss: 2.2325 - Val Accuracy: 0.9273



Training:   0%|          | 0/95 [00:00<?, ?it/s][A
Training:   1%|          | 1/95 [00:01<02:08,  1.37s/it][A
Training:   2%|▏         | 2/95 [00:01<01:00,  1.55it/s][A
Training:   4%|▍         | 4/95 [00:01<00:26,  3.45it/s][A
Training:   5%|▌         | 5/95 [00:02<00:39,  2.29it/s][A
Training:   6%|▋         | 6/95 [00:02<00:29,  2.97it/s][A
Training:   9%|▉         | 9/95 [00:03<00:25,  3.33it/s][A
Training:  13%|█▎        | 12/95 [00:03<00:15,  5.50it/s][A
Training:  15%|█▍        | 14/95 [00:04<00:18,  4.32it/s][A
Training:  17%|█▋        | 16/95 [00:04<00:14,  5.44it/s][A
Training:  19%|█▉        | 18/95 [00:05<00:18,  4.08it/s][A
Training:  21%|██        | 20/95 [00:05<00:14,  5.33it/s][A
Training:  23%|██▎       | 22/95 [00:06<00:19,  3.82it/s][A
Training:  26%|██▋       | 25/95 [00:06<00:18,  3.75it/s][A
Training:  28%|██▊       | 27/95 [00:07<00:14,  4.69it/s][A
Training:  31%|███       | 29/95 [00:07<00:16,  4.07it/s][A
Training:  32%|███▏      | 30/95 [00:0

Epoch: 20/98 - Loss: 1.9174 - Accuracy: 0.9429



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:13,  1.27s/it][A
 17%|█▋        | 2/12 [00:01<00:05,  1.69it/s][A
 33%|███▎      | 4/12 [00:01<00:02,  3.83it/s][A
 42%|████▏     | 5/12 [00:02<00:02,  3.08it/s][A
 50%|█████     | 6/12 [00:02<00:02,  2.77it/s][A
 67%|██████▋   | 8/12 [00:02<00:00,  4.43it/s][A
 75%|███████▌  | 9/12 [00:03<00:00,  3.47it/s][A
100%|██████████| 12/12 [00:03<00:00,  3.37it/s][A
Epochs:  20%|██        | 20/98 [09:02<35:15, 27.12s/it]

Val Loss: 2.0838 - Val Accuracy: 0.9434



Training:   0%|          | 0/95 [00:00<?, ?it/s][A
Training:   1%|          | 1/95 [00:01<01:52,  1.20s/it][A
Training:   3%|▎         | 3/95 [00:01<00:33,  2.71it/s][A
Training:   5%|▌         | 5/95 [00:02<00:34,  2.58it/s][A
Training:   7%|▋         | 7/95 [00:02<00:22,  3.96it/s][A
Training:   9%|▉         | 9/95 [00:03<00:25,  3.33it/s][A
Training:  12%|█▏        | 11/95 [00:03<00:18,  4.65it/s][A
Training:  14%|█▎        | 13/95 [00:04<00:25,  3.23it/s][A
Training:  16%|█▌        | 15/95 [00:04<00:18,  4.43it/s][A
Training:  18%|█▊        | 17/95 [00:05<00:23,  3.27it/s][A
Training:  20%|██        | 19/95 [00:05<00:17,  4.27it/s][A
Training:  22%|██▏       | 21/95 [00:06<00:22,  3.35it/s][A
Training:  24%|██▍       | 23/95 [00:06<00:16,  4.36it/s][A
Training:  26%|██▋       | 25/95 [00:07<00:19,  3.60it/s][A
Training:  28%|██▊       | 27/95 [00:07<00:14,  4.79it/s][A
Training:  31%|███       | 29/95 [00:08<00:17,  3.80it/s][A
Training:  33%|███▎      | 31/95 [00:

Epoch: 21/98 - Loss: 1.9388 - Accuracy: 0.9423



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:15,  1.41s/it][A
 25%|██▌       | 3/12 [00:01<00:03,  2.35it/s][A
 42%|████▏     | 5/12 [00:02<00:03,  2.26it/s][A
 58%|█████▊    | 7/12 [00:02<00:01,  3.60it/s][A
 75%|███████▌  | 9/12 [00:03<00:00,  3.09it/s][A
100%|██████████| 12/12 [00:03<00:00,  3.35it/s][A
Epochs:  21%|██▏       | 21/98 [09:29<34:55, 27.22s/it]

Val Loss: 2.0660 - Val Accuracy: 0.9387



Training:   0%|          | 0/95 [00:00<?, ?it/s][A
Training:   1%|          | 1/95 [00:01<02:05,  1.34s/it][A
Training:   2%|▏         | 2/95 [00:01<01:01,  1.52it/s][A
Training:   4%|▍         | 4/95 [00:01<00:25,  3.59it/s][A
Training:   6%|▋         | 6/95 [00:02<00:29,  2.99it/s][A
Training:   8%|▊         | 8/95 [00:02<00:20,  4.31it/s][A
Training:   9%|▉         | 9/95 [00:03<00:27,  3.18it/s][A
Training:  11%|█         | 10/95 [00:03<00:22,  3.71it/s][A
Training:  14%|█▎        | 13/95 [00:04<00:23,  3.56it/s][A
Training:  16%|█▌        | 15/95 [00:04<00:16,  4.78it/s][A
Training:  18%|█▊        | 17/95 [00:05<00:24,  3.20it/s][A
Training:  21%|██        | 20/95 [00:05<00:15,  4.90it/s][A
Training:  23%|██▎       | 22/95 [00:06<00:20,  3.62it/s][A
Training:  25%|██▌       | 24/95 [00:06<00:15,  4.66it/s][A
Training:  27%|██▋       | 26/95 [00:07<00:18,  3.64it/s][A
Training:  31%|███       | 29/95 [00:08<00:19,  3.40it/s][A
Training:  33%|███▎      | 31/95 [00:0

Epoch: 22/98 - Loss: 1.8770 - Accuracy: 0.9444



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:13,  1.22s/it][A
 17%|█▋        | 2/12 [00:01<00:06,  1.65it/s][A
 33%|███▎      | 4/12 [00:01<00:02,  3.80it/s][A
 42%|████▏     | 5/12 [00:02<00:03,  2.28it/s][A
 75%|███████▌  | 9/12 [00:03<00:00,  3.08it/s][A
100%|██████████| 12/12 [00:03<00:00,  3.27it/s][A
Epochs:  22%|██▏       | 22/98 [09:57<34:35, 27.31s/it]

Val Loss: 1.9669 - Val Accuracy: 0.9418



Training:   0%|          | 0/95 [00:00<?, ?it/s][A
Training:   1%|          | 1/95 [00:01<01:59,  1.27s/it][A
Training:   3%|▎         | 3/95 [00:01<00:35,  2.60it/s][A
Training:   5%|▌         | 5/95 [00:02<00:38,  2.33it/s][A
Training:   7%|▋         | 7/95 [00:02<00:23,  3.67it/s][A
Training:   9%|▉         | 9/95 [00:03<00:29,  2.96it/s][A
Training:  12%|█▏        | 11/95 [00:03<00:20,  4.04it/s][A
Training:  14%|█▎        | 13/95 [00:04<00:26,  3.11it/s][A
Training:  16%|█▌        | 15/95 [00:04<00:19,  4.14it/s][A
Training:  18%|█▊        | 17/95 [00:05<00:21,  3.66it/s][A
Training:  20%|██        | 19/95 [00:05<00:15,  4.88it/s][A
Training:  22%|██▏       | 21/95 [00:06<00:21,  3.44it/s][A
Training:  24%|██▍       | 23/95 [00:06<00:15,  4.59it/s][A
Training:  26%|██▋       | 25/95 [00:07<00:20,  3.44it/s][A
Training:  28%|██▊       | 27/95 [00:07<00:15,  4.53it/s][A
Training:  31%|███       | 29/95 [00:08<00:18,  3.53it/s][A
Training:  33%|███▎      | 31/95 [00:

Epoch: 23/98 - Loss: 1.8930 - Accuracy: 0.9410



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:13,  1.22s/it][A
 17%|█▋        | 2/12 [00:01<00:05,  1.76it/s][A
 42%|████▏     | 5/12 [00:02<00:02,  2.51it/s][A
 50%|█████     | 6/12 [00:02<00:01,  3.07it/s][A
 67%|██████▋   | 8/12 [00:02<00:00,  4.72it/s][A
 83%|████████▎ | 10/12 [00:03<00:00,  3.58it/s][A
100%|██████████| 12/12 [00:03<00:00,  3.40it/s][A
Epochs:  23%|██▎       | 23/98 [10:24<34:14, 27.39s/it]

Val Loss: 2.3059 - Val Accuracy: 0.9405



Training:   0%|          | 0/95 [00:00<?, ?it/s][A
Training:   1%|          | 1/95 [00:01<02:07,  1.36s/it][A
Training:   2%|▏         | 2/95 [00:01<01:02,  1.49it/s][A
Training:   4%|▍         | 4/95 [00:01<00:25,  3.52it/s][A
Training:   6%|▋         | 6/95 [00:02<00:32,  2.70it/s][A
Training:   8%|▊         | 8/95 [00:02<00:22,  3.95it/s][A
Training:   9%|▉         | 9/95 [00:03<00:33,  2.56it/s][A
Training:  12%|█▏        | 11/95 [00:03<00:22,  3.80it/s][A
Training:  14%|█▎        | 13/95 [00:04<00:22,  3.57it/s][A
Training:  15%|█▍        | 14/95 [00:04<00:21,  3.84it/s][A
Training:  17%|█▋        | 16/95 [00:04<00:14,  5.29it/s][A
Training:  18%|█▊        | 17/95 [00:05<00:19,  4.01it/s][A
Training:  19%|█▉        | 18/95 [00:05<00:17,  4.33it/s][A
Training:  22%|██▏       | 21/95 [00:06<00:17,  4.20it/s][A
Training:  23%|██▎       | 22/95 [00:06<00:15,  4.67it/s][A
Training:  24%|██▍       | 23/95 [00:06<00:13,  5.27it/s][A
Training:  26%|██▋       | 25/95 [00:0

Epoch: 24/98 - Loss: 2.0551 - Accuracy: 0.9430



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:16,  1.49s/it][A
 25%|██▌       | 3/12 [00:01<00:03,  2.32it/s][A
 42%|████▏     | 5/12 [00:02<00:02,  2.50it/s][A
 58%|█████▊    | 7/12 [00:02<00:01,  3.78it/s][A
 75%|███████▌  | 9/12 [00:03<00:00,  3.35it/s][A
100%|██████████| 12/12 [00:03<00:00,  3.43it/s][A
Epochs:  24%|██▍       | 24/98 [10:52<33:51, 27.45s/it]

Val Loss: 2.0277 - Val Accuracy: 0.9366



Training:   0%|          | 0/95 [00:00<?, ?it/s][A
Training:   1%|          | 1/95 [00:01<02:28,  1.58s/it][A
Training:   4%|▍         | 4/95 [00:01<00:30,  2.94it/s][A
Training:   6%|▋         | 6/95 [00:02<00:33,  2.68it/s][A
Training:   8%|▊         | 8/95 [00:02<00:22,  3.82it/s][A
Training:   9%|▉         | 9/95 [00:03<00:32,  2.62it/s][A
Training:  13%|█▎        | 12/95 [00:03<00:19,  4.27it/s][A
Training:  14%|█▎        | 13/95 [00:04<00:28,  2.88it/s][A
Training:  17%|█▋        | 16/95 [00:04<00:19,  4.11it/s][A
Training:  18%|█▊        | 17/95 [00:05<00:24,  3.16it/s][A
Training:  20%|██        | 19/95 [00:05<00:17,  4.27it/s][A
Training:  21%|██        | 20/95 [00:05<00:15,  4.75it/s][A
Training:  22%|██▏       | 21/95 [00:06<00:23,  3.10it/s][A
Training:  24%|██▍       | 23/95 [00:06<00:16,  4.34it/s][A
Training:  25%|██▌       | 24/95 [00:06<00:15,  4.60it/s][A
Training:  26%|██▋       | 25/95 [00:07<00:22,  3.14it/s][A
Training:  28%|██▊       | 27/95 [00:

Epoch: 25/98 - Loss: 1.8995 - Accuracy: 0.9379



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:14,  1.31s/it][A
 17%|█▋        | 2/12 [00:01<00:06,  1.56it/s][A
 33%|███▎      | 4/12 [00:01<00:02,  3.59it/s][A
 42%|████▏     | 5/12 [00:02<00:02,  2.68it/s][A
 50%|█████     | 6/12 [00:02<00:02,  2.73it/s][A
 67%|██████▋   | 8/12 [00:02<00:00,  4.50it/s][A
 75%|███████▌  | 9/12 [00:03<00:00,  3.81it/s][A
100%|██████████| 12/12 [00:03<00:00,  3.25it/s][A
Epochs:  26%|██▌       | 25/98 [11:20<33:49, 27.80s/it]

Val Loss: 2.2539 - Val Accuracy: 0.9366



Training:   0%|          | 0/95 [00:00<?, ?it/s][A
Training:   1%|          | 1/95 [00:01<02:10,  1.38s/it][A
Training:   3%|▎         | 3/95 [00:01<00:37,  2.47it/s][A
Training:   5%|▌         | 5/95 [00:02<00:39,  2.30it/s][A
Training:   7%|▋         | 7/95 [00:02<00:24,  3.65it/s][A
Training:   9%|▉         | 9/95 [00:03<00:28,  3.06it/s][A
Training:  12%|█▏        | 11/95 [00:03<00:20,  4.16it/s][A
Training:  14%|█▎        | 13/95 [00:04<00:26,  3.14it/s][A
Training:  17%|█▋        | 16/95 [00:04<00:15,  4.96it/s][A
Training:  19%|█▉        | 18/95 [00:05<00:21,  3.58it/s][A
Training:  22%|██▏       | 21/95 [00:06<00:20,  3.55it/s][A
Training:  26%|██▋       | 25/95 [00:07<00:19,  3.68it/s][A
Training:  29%|██▉       | 28/95 [00:07<00:13,  5.02it/s][A
Training:  32%|███▏      | 30/95 [00:08<00:16,  4.00it/s][A
Training:  33%|███▎      | 31/95 [00:08<00:14,  4.33it/s][A
Training:  35%|███▍      | 33/95 [00:09<00:16,  3.68it/s][A
Training:  37%|███▋      | 35/95 [00:

Epoch: 26/98 - Loss: 1.9083 - Accuracy: 0.9443



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:16,  1.46s/it][A
 33%|███▎      | 4/12 [00:01<00:02,  3.27it/s][A
 50%|█████     | 6/12 [00:02<00:02,  2.99it/s][A
100%|██████████| 12/12 [00:03<00:00,  3.47it/s][A
Epochs:  27%|██▋       | 26/98 [11:48<33:08, 27.61s/it]

Val Loss: 2.2698 - Val Accuracy: 0.9259



Training:   0%|          | 0/95 [00:00<?, ?it/s][A
Training:   1%|          | 1/95 [00:01<02:19,  1.49s/it][A
Training:   3%|▎         | 3/95 [00:01<00:45,  2.04it/s][A
Training:   5%|▌         | 5/95 [00:02<00:37,  2.42it/s][A
Training:   6%|▋         | 6/95 [00:02<00:31,  2.86it/s][A
Training:   7%|▋         | 7/95 [00:02<00:24,  3.55it/s][A
Training:   9%|▉         | 9/95 [00:03<00:25,  3.42it/s][A
Training:  11%|█         | 10/95 [00:03<00:22,  3.73it/s][A
Training:  12%|█▏        | 11/95 [00:03<00:22,  3.71it/s][A
Training:  14%|█▎        | 13/95 [00:04<00:23,  3.43it/s][A
Training:  16%|█▌        | 15/95 [00:04<00:18,  4.27it/s][A
Training:  18%|█▊        | 17/95 [00:05<00:21,  3.55it/s][A
Training:  20%|██        | 19/95 [00:05<00:16,  4.70it/s][A
Training:  22%|██▏       | 21/95 [00:06<00:21,  3.41it/s][A
Training:  24%|██▍       | 23/95 [00:06<00:15,  4.51it/s][A
Training:  26%|██▋       | 25/95 [00:07<00:19,  3.54it/s][A
Training:  28%|██▊       | 27/95 [00:0

Epoch: 27/98 - Loss: 1.8504 - Accuracy: 0.9473



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:16,  1.51s/it][A
 25%|██▌       | 3/12 [00:01<00:03,  2.26it/s][A
 42%|████▏     | 5/12 [00:02<00:02,  2.80it/s][A
 50%|█████     | 6/12 [00:02<00:01,  3.19it/s][A
 75%|███████▌  | 9/12 [00:03<00:00,  3.89it/s][A
100%|██████████| 12/12 [00:03<00:00,  3.36it/s][A
Epochs:  28%|██▊       | 27/98 [12:15<32:32, 27.50s/it]

Val Loss: 2.1294 - Val Accuracy: 0.9410



Training:   0%|          | 0/95 [00:00<?, ?it/s][A
Training:   1%|          | 1/95 [00:01<02:34,  1.65s/it][A
Training:   2%|▏         | 2/95 [00:01<01:08,  1.35it/s][A
Training:   5%|▌         | 5/95 [00:02<00:39,  2.30it/s][A
Training:   6%|▋         | 6/95 [00:02<00:31,  2.84it/s][A
Training:   8%|▊         | 8/95 [00:02<00:20,  4.28it/s][A
Training:   9%|▉         | 9/95 [00:04<00:36,  2.36it/s][A
Training:  12%|█▏        | 11/95 [00:04<00:24,  3.49it/s][A
Training:  13%|█▎        | 12/95 [00:04<00:20,  4.05it/s][A
Training:  14%|█▎        | 13/95 [00:05<00:30,  2.72it/s][A
Training:  16%|█▌        | 15/95 [00:05<00:19,  4.11it/s][A
Training:  18%|█▊        | 17/95 [00:06<00:24,  3.19it/s][A
Training:  20%|██        | 19/95 [00:06<00:17,  4.35it/s][A
Training:  22%|██▏       | 21/95 [00:07<00:22,  3.26it/s][A
Training:  24%|██▍       | 23/95 [00:07<00:16,  4.31it/s][A
Training:  26%|██▋       | 25/95 [00:08<00:21,  3.20it/s][A
Training:  28%|██▊       | 27/95 [00:0

Epoch: 28/98 - Loss: 1.9764 - Accuracy: 0.9477



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:17,  1.55s/it][A
 42%|████▏     | 5/12 [00:02<00:03,  2.31it/s][A
 58%|█████▊    | 7/12 [00:02<00:01,  3.41it/s][A
 75%|███████▌  | 9/12 [00:03<00:00,  3.00it/s][A
100%|██████████| 12/12 [00:03<00:00,  3.27it/s][A
Epochs:  29%|██▊       | 28/98 [12:43<32:21, 27.73s/it]

Val Loss: 2.6668 - Val Accuracy: 0.9398



Training:   0%|          | 0/95 [00:00<?, ?it/s][A
Training:   1%|          | 1/95 [00:01<01:57,  1.25s/it][A
Training:   2%|▏         | 2/95 [00:01<00:58,  1.59it/s][A
Training:   3%|▎         | 3/95 [00:01<00:38,  2.36it/s][A
Training:   5%|▌         | 5/95 [00:02<00:38,  2.33it/s][A
Training:   7%|▋         | 7/95 [00:02<00:24,  3.58it/s][A
Training:   9%|▉         | 9/95 [00:03<00:28,  3.05it/s][A
Training:  12%|█▏        | 11/95 [00:03<00:20,  4.17it/s][A
Training:  14%|█▎        | 13/95 [00:04<00:25,  3.22it/s][A
Training:  16%|█▌        | 15/95 [00:04<00:19,  4.14it/s][A
Training:  17%|█▋        | 16/95 [00:04<00:16,  4.65it/s][A
Training:  18%|█▊        | 17/95 [00:05<00:26,  2.96it/s][A
Training:  22%|██▏       | 21/95 [00:06<00:20,  3.65it/s][A
Training:  25%|██▌       | 24/95 [00:06<00:13,  5.28it/s][A
Training:  27%|██▋       | 26/95 [00:07<00:16,  4.17it/s][A
Training:  28%|██▊       | 27/95 [00:07<00:15,  4.53it/s][A
Training:  29%|██▉       | 28/95 [00:0

Epoch: 29/98 - Loss: 1.9097 - Accuracy: 0.9414



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:15,  1.39s/it][A
 17%|█▋        | 2/12 [00:01<00:06,  1.54it/s][A
 33%|███▎      | 4/12 [00:01<00:02,  3.64it/s][A
 50%|█████     | 6/12 [00:02<00:02,  2.76it/s][A
100%|██████████| 12/12 [00:03<00:00,  3.27it/s][A
Epochs:  30%|██▉       | 29/98 [13:11<31:57, 27.80s/it]

Val Loss: 2.2403 - Val Accuracy: 0.9366



Training:   0%|          | 0/95 [00:00<?, ?it/s][A
Training:   1%|          | 1/95 [00:01<02:00,  1.28s/it][A
Training:   3%|▎         | 3/95 [00:01<00:34,  2.67it/s][A
Training:   5%|▌         | 5/95 [00:02<00:32,  2.75it/s][A
Training:   6%|▋         | 6/95 [00:02<00:28,  3.14it/s][A
Training:   8%|▊         | 8/95 [00:02<00:18,  4.65it/s][A
Training:   9%|▉         | 9/95 [00:03<00:27,  3.13it/s][A
Training:  11%|█         | 10/95 [00:03<00:26,  3.24it/s][A
Training:  13%|█▎        | 12/95 [00:03<00:17,  4.80it/s][A
Training:  14%|█▎        | 13/95 [00:04<00:23,  3.45it/s][A
Training:  15%|█▍        | 14/95 [00:04<00:23,  3.38it/s][A
Training:  18%|█▊        | 17/95 [00:05<00:19,  3.92it/s][A
Training:  19%|█▉        | 18/95 [00:05<00:20,  3.78it/s][A
Training:  20%|██        | 19/95 [00:05<00:18,  4.18it/s][A
Training:  22%|██▏       | 21/95 [00:06<00:18,  3.97it/s][A
Training:  23%|██▎       | 22/95 [00:06<00:19,  3.69it/s][A
Training:  25%|██▌       | 24/95 [00:0

Epoch: 30/98 - Loss: 1.9455 - Accuracy: 0.9425



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:13,  1.24s/it][A
 42%|████▏     | 5/12 [00:02<00:02,  2.79it/s][A
 58%|█████▊    | 7/12 [00:02<00:01,  4.02it/s][A
 75%|███████▌  | 9/12 [00:03<00:01,  2.96it/s][A
100%|██████████| 12/12 [00:03<00:00,  3.43it/s][A
Epochs:  31%|███       | 30/98 [13:38<31:21, 27.67s/it]

Val Loss: 2.1064 - Val Accuracy: 0.9446



Training:   0%|          | 0/95 [00:00<?, ?it/s][A
Training:   1%|          | 1/95 [00:01<02:21,  1.51s/it][A
Training:   4%|▍         | 4/95 [00:01<00:28,  3.17it/s][A
Training:   6%|▋         | 6/95 [00:02<00:32,  2.72it/s][A
Training:   8%|▊         | 8/95 [00:02<00:21,  4.01it/s][A
Training:  11%|█         | 10/95 [00:03<00:28,  2.95it/s][A
Training:  13%|█▎        | 12/95 [00:03<00:20,  4.11it/s][A
Training:  15%|█▍        | 14/95 [00:04<00:25,  3.17it/s][A
Training:  18%|█▊        | 17/95 [00:05<00:23,  3.37it/s][A
Training:  20%|██        | 19/95 [00:05<00:17,  4.27it/s][A
Training:  22%|██▏       | 21/95 [00:06<00:20,  3.64it/s][A
Training:  25%|██▌       | 24/95 [00:06<00:13,  5.09it/s][A
Training:  26%|██▋       | 25/95 [00:07<00:21,  3.30it/s][A
Training:  28%|██▊       | 27/95 [00:07<00:15,  4.33it/s][A
Training:  31%|███       | 29/95 [00:08<00:19,  3.44it/s][A
Training:  33%|███▎      | 31/95 [00:08<00:14,  4.39it/s][A
Training:  35%|███▍      | 33/95 [00

Epoch: 31/98 - Loss: 2.0334 - Accuracy: 0.9414



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:15,  1.44s/it][A
 33%|███▎      | 4/12 [00:01<00:02,  3.22it/s][A
 50%|█████     | 6/12 [00:02<00:02,  2.87it/s][A
 67%|██████▋   | 8/12 [00:02<00:00,  4.22it/s][A
100%|██████████| 12/12 [00:03<00:00,  3.42it/s][A
Epochs:  32%|███▏      | 31/98 [14:06<30:51, 27.63s/it]

Val Loss: 2.2418 - Val Accuracy: 0.9298



Training:   0%|          | 0/95 [00:00<?, ?it/s][A
Training:   1%|          | 1/95 [00:01<02:22,  1.52s/it][A
Training:   2%|▏         | 2/95 [00:01<01:04,  1.45it/s][A
Training:   5%|▌         | 5/95 [00:02<00:37,  2.38it/s][A
Training:   7%|▋         | 7/95 [00:02<00:25,  3.49it/s][A
Training:   9%|▉         | 9/95 [00:03<00:27,  3.13it/s][A
Training:  12%|█▏        | 11/95 [00:03<00:20,  4.03it/s][A
Training:  14%|█▎        | 13/95 [00:04<00:23,  3.54it/s][A
Training:  16%|█▌        | 15/95 [00:04<00:17,  4.57it/s][A
Training:  17%|█▋        | 16/95 [00:04<00:15,  5.08it/s][A
Training:  18%|█▊        | 17/95 [00:05<00:22,  3.42it/s][A
Training:  20%|██        | 19/95 [00:05<00:17,  4.25it/s][A
Training:  22%|██▏       | 21/95 [00:06<00:21,  3.48it/s][A
Training:  24%|██▍       | 23/95 [00:06<00:16,  4.29it/s][A
Training:  25%|██▌       | 24/95 [00:06<00:14,  4.81it/s][A
Training:  26%|██▋       | 25/95 [00:07<00:19,  3.66it/s][A
Training:  28%|██▊       | 27/95 [00:

Epoch: 32/98 - Loss: 2.0001 - Accuracy: 0.9420



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:15,  1.38s/it][A
 25%|██▌       | 3/12 [00:01<00:03,  2.52it/s][A
 42%|████▏     | 5/12 [00:02<00:02,  2.65it/s][A
 50%|█████     | 6/12 [00:02<00:01,  3.29it/s][A
 75%|███████▌  | 9/12 [00:03<00:00,  3.26it/s][A
100%|██████████| 12/12 [00:03<00:00,  3.41it/s][A
Epochs:  33%|███▎      | 32/98 [14:33<30:12, 27.46s/it]

Val Loss: 2.1254 - Val Accuracy: 0.9410



Training:   0%|          | 0/95 [00:00<?, ?it/s][A
Training:   1%|          | 1/95 [00:01<02:14,  1.43s/it][A
Training:   2%|▏         | 2/95 [00:01<01:07,  1.38it/s][A
Training:   4%|▍         | 4/95 [00:01<00:28,  3.24it/s][A
Training:   5%|▌         | 5/95 [00:02<00:33,  2.67it/s][A
Training:   6%|▋         | 6/95 [00:02<00:32,  2.70it/s][A
Training:   9%|▉         | 9/95 [00:03<00:25,  3.39it/s][A
Training:  11%|█         | 10/95 [00:03<00:28,  2.98it/s][A
Training:  13%|█▎        | 12/95 [00:03<00:19,  4.33it/s][A
Training:  14%|█▎        | 13/95 [00:04<00:21,  3.78it/s][A
Training:  15%|█▍        | 14/95 [00:04<00:26,  3.10it/s][A
Training:  18%|█▊        | 17/95 [00:05<00:19,  3.91it/s][A
Training:  19%|█▉        | 18/95 [00:05<00:20,  3.74it/s][A
Training:  22%|██▏       | 21/95 [00:06<00:19,  3.79it/s][A
Training:  23%|██▎       | 22/95 [00:06<00:18,  4.02it/s][A
Training:  25%|██▌       | 24/95 [00:06<00:13,  5.28it/s][A
Training:  26%|██▋       | 25/95 [00:0

Epoch: 33/98 - Loss: 2.0121 - Accuracy: 0.9439



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:14,  1.28s/it][A
 33%|███▎      | 4/12 [00:01<00:02,  3.44it/s][A
 50%|█████     | 6/12 [00:02<00:02,  2.96it/s][A
 67%|██████▋   | 8/12 [00:02<00:00,  4.38it/s][A
100%|██████████| 12/12 [00:03<00:00,  3.57it/s][A
Epochs:  34%|███▎      | 33/98 [15:01<29:53, 27.59s/it]

Val Loss: 2.2319 - Val Accuracy: 0.9438



Training:   0%|          | 0/95 [00:00<?, ?it/s][A
Training:   1%|          | 1/95 [00:01<02:14,  1.43s/it][A
Training:   2%|▏         | 2/95 [00:01<01:07,  1.38it/s][A
Training:   4%|▍         | 4/95 [00:01<00:28,  3.15it/s][A
Training:   5%|▌         | 5/95 [00:02<00:35,  2.53it/s][A
Training:   6%|▋         | 6/95 [00:02<00:29,  3.04it/s][A
Training:   8%|▊         | 8/95 [00:02<00:17,  4.89it/s][A
Training:   9%|▉         | 9/95 [00:03<00:31,  2.75it/s][A
Training:  12%|█▏        | 11/95 [00:03<00:21,  3.95it/s][A
Training:  14%|█▎        | 13/95 [00:04<00:25,  3.19it/s][A
Training:  16%|█▌        | 15/95 [00:04<00:17,  4.50it/s][A
Training:  18%|█▊        | 17/95 [00:05<00:23,  3.28it/s][A
Training:  20%|██        | 19/95 [00:05<00:17,  4.32it/s][A
Training:  22%|██▏       | 21/95 [00:06<00:21,  3.52it/s][A
Training:  24%|██▍       | 23/95 [00:06<00:15,  4.64it/s][A
Training:  26%|██▋       | 25/95 [00:07<00:19,  3.51it/s][A
Training:  28%|██▊       | 27/95 [00:07

Epoch: 34/98 - Loss: 2.0228 - Accuracy: 0.9411



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:13,  1.27s/it][A
 17%|█▋        | 2/12 [00:01<00:05,  1.69it/s][A
 25%|██▌       | 3/12 [00:01<00:03,  2.68it/s][A
 42%|████▏     | 5/12 [00:02<00:02,  2.68it/s][A
 58%|█████▊    | 7/12 [00:02<00:01,  4.02it/s][A
 75%|███████▌  | 9/12 [00:03<00:00,  3.16it/s][A
100%|██████████| 12/12 [00:03<00:00,  3.32it/s][A
Epochs:  35%|███▍      | 34/98 [15:29<29:42, 27.85s/it]

Val Loss: 2.2609 - Val Accuracy: 0.9381



Training:   0%|          | 0/95 [00:00<?, ?it/s][A
Training:   1%|          | 1/95 [00:01<02:02,  1.30s/it][A
Training:   2%|▏         | 2/95 [00:01<00:55,  1.67it/s][A
Training:   4%|▍         | 4/95 [00:01<00:24,  3.78it/s][A
Training:   6%|▋         | 6/95 [00:02<00:30,  2.89it/s][A
Training:   8%|▊         | 8/95 [00:02<00:20,  4.28it/s][A
Training:   9%|▉         | 9/95 [00:03<00:33,  2.54it/s][A
Training:  12%|█▏        | 11/95 [00:03<00:22,  3.80it/s][A
Training:  14%|█▎        | 13/95 [00:04<00:26,  3.11it/s][A
Training:  16%|█▌        | 15/95 [00:04<00:18,  4.27it/s][A
Training:  18%|█▊        | 17/95 [00:05<00:23,  3.35it/s][A
Training:  19%|█▉        | 18/95 [00:05<00:20,  3.83it/s][A
Training:  22%|██▏       | 21/95 [00:06<00:21,  3.51it/s][A
Training:  24%|██▍       | 23/95 [00:06<00:15,  4.64it/s][A
Training:  26%|██▋       | 25/95 [00:07<00:20,  3.34it/s][A
Training:  29%|██▉       | 28/95 [00:07<00:13,  5.05it/s][A
Training:  32%|███▏      | 30/95 [00:0

Epoch: 35/98 - Loss: 2.0020 - Accuracy: 0.9467



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:13,  1.27s/it][A
 33%|███▎      | 4/12 [00:01<00:02,  3.71it/s][A
 50%|█████     | 6/12 [00:02<00:02,  2.65it/s][A
 67%|██████▋   | 8/12 [00:02<00:01,  3.82it/s][A
100%|██████████| 12/12 [00:03<00:00,  3.37it/s][A
Epochs:  36%|███▌      | 35/98 [15:57<29:02, 27.66s/it]

Val Loss: 2.5810 - Val Accuracy: 0.9116



Training:   0%|          | 0/95 [00:00<?, ?it/s][A
Training:   1%|          | 1/95 [00:01<02:09,  1.38s/it][A
Training:   2%|▏         | 2/95 [00:01<01:07,  1.39it/s][A
Training:   3%|▎         | 3/95 [00:01<00:40,  2.25it/s][A
Training:   4%|▍         | 4/95 [00:01<00:28,  3.24it/s][A
Training:   5%|▌         | 5/95 [00:02<00:34,  2.61it/s][A
Training:   6%|▋         | 6/95 [00:02<00:27,  3.26it/s][A
Training:   8%|▊         | 8/95 [00:02<00:17,  4.99it/s][A
Training:   9%|▉         | 9/95 [00:03<00:25,  3.32it/s][A
Training:  12%|█▏        | 11/95 [00:03<00:16,  4.95it/s][A
Training:  14%|█▎        | 13/95 [00:04<00:20,  3.92it/s][A
Training:  18%|█▊        | 17/95 [00:05<00:19,  3.91it/s][A
Training:  20%|██        | 19/95 [00:05<00:16,  4.74it/s][A
Training:  22%|██▏       | 21/95 [00:06<00:19,  3.78it/s][A
Training:  25%|██▌       | 24/95 [00:06<00:13,  5.45it/s][A
Training:  27%|██▋       | 26/95 [00:07<00:18,  3.77it/s][A
Training:  29%|██▉       | 28/95 [00:07<

Epoch: 36/98 - Loss: 2.0300 - Accuracy: 0.9422



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:15,  1.37s/it][A
 33%|███▎      | 4/12 [00:01<00:02,  3.34it/s][A
 50%|█████     | 6/12 [00:02<00:02,  2.63it/s][A
 67%|██████▋   | 8/12 [00:02<00:01,  3.82it/s][A
100%|██████████| 12/12 [00:03<00:00,  3.23it/s][A
Epochs:  37%|███▋      | 36/98 [16:24<28:35, 27.67s/it]

Val Loss: 2.2166 - Val Accuracy: 0.9448



Training:   0%|          | 0/95 [00:00<?, ?it/s][A
Training:   1%|          | 1/95 [00:01<02:25,  1.55s/it][A
Training:   2%|▏         | 2/95 [00:01<01:06,  1.40it/s][A
Training:   5%|▌         | 5/95 [00:02<00:35,  2.55it/s][A
Training:   9%|▉         | 9/95 [00:03<00:27,  3.18it/s][A
Training:  13%|█▎        | 12/95 [00:03<00:18,  4.56it/s][A
Training:  14%|█▎        | 13/95 [00:04<00:25,  3.19it/s][A
Training:  16%|█▌        | 15/95 [00:04<00:19,  4.10it/s][A
Training:  18%|█▊        | 17/95 [00:05<00:23,  3.34it/s][A
Training:  20%|██        | 19/95 [00:05<00:17,  4.43it/s][A
Training:  22%|██▏       | 21/95 [00:06<00:20,  3.56it/s][A
Training:  24%|██▍       | 23/95 [00:06<00:15,  4.59it/s][A
Training:  26%|██▋       | 25/95 [00:07<00:18,  3.84it/s][A
Training:  28%|██▊       | 27/95 [00:07<00:14,  4.80it/s][A
Training:  31%|███       | 29/95 [00:08<00:17,  3.69it/s][A
Training:  32%|███▏      | 30/95 [00:08<00:15,  4.13it/s][A
Training:  35%|███▍      | 33/95 [00

Epoch: 37/98 - Loss: 2.0293 - Accuracy: 0.9459



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:13,  1.24s/it][A
 33%|███▎      | 4/12 [00:01<00:02,  3.81it/s][A
 50%|█████     | 6/12 [00:02<00:02,  2.98it/s][A
 75%|███████▌  | 9/12 [00:03<00:00,  3.26it/s][A
100%|██████████| 12/12 [00:03<00:00,  3.53it/s][A
Epochs:  38%|███▊      | 37/98 [16:52<28:01, 27.56s/it]

Val Loss: 2.2316 - Val Accuracy: 0.9336



Training:   0%|          | 0/95 [00:00<?, ?it/s][A
Training:   1%|          | 1/95 [00:01<02:14,  1.43s/it][A
Training:   3%|▎         | 3/95 [00:01<00:38,  2.39it/s][A
Training:   5%|▌         | 5/95 [00:02<00:39,  2.30it/s][A
Training:   7%|▋         | 7/95 [00:02<00:25,  3.45it/s][A
Training:   9%|▉         | 9/95 [00:03<00:29,  2.89it/s][A
Training:  12%|█▏        | 11/95 [00:03<00:20,  4.10it/s][A
Training:  14%|█▎        | 13/95 [00:04<00:27,  3.01it/s][A
Training:  18%|█▊        | 17/95 [00:05<00:21,  3.60it/s][A
Training:  20%|██        | 19/95 [00:05<00:16,  4.52it/s][A
Training:  21%|██        | 20/95 [00:05<00:15,  4.92it/s][A
Training:  22%|██▏       | 21/95 [00:06<00:21,  3.43it/s][A
Training:  24%|██▍       | 23/95 [00:06<00:16,  4.44it/s][A
Training:  25%|██▌       | 24/95 [00:06<00:14,  4.90it/s][A
Training:  26%|██▋       | 25/95 [00:07<00:21,  3.28it/s][A
Training:  28%|██▊       | 27/95 [00:07<00:15,  4.37it/s][A
Training:  29%|██▉       | 28/95 [00:

Epoch: 38/98 - Loss: 2.0698 - Accuracy: 0.9458



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:15,  1.37s/it][A
 25%|██▌       | 3/12 [00:01<00:03,  2.50it/s][A
 42%|████▏     | 5/12 [00:02<00:02,  2.69it/s][A
 50%|█████     | 6/12 [00:02<00:02,  2.76it/s][A
 75%|███████▌  | 9/12 [00:03<00:00,  3.22it/s][A
100%|██████████| 12/12 [00:03<00:00,  3.18it/s][A
Epochs:  39%|███▉      | 38/98 [17:19<27:24, 27.41s/it]

Val Loss: 2.2780 - Val Accuracy: 0.9335



Training:   0%|          | 0/95 [00:00<?, ?it/s][A
Training:   1%|          | 1/95 [00:01<02:27,  1.57s/it][A
Training:   3%|▎         | 3/95 [00:01<00:43,  2.14it/s][A
Training:   5%|▌         | 5/95 [00:02<00:40,  2.25it/s][A
Training:   7%|▋         | 7/95 [00:02<00:24,  3.54it/s][A
Training:   9%|▉         | 9/95 [00:03<00:32,  2.66it/s][A
Training:  13%|█▎        | 12/95 [00:03<00:18,  4.47it/s][A
Training:  15%|█▍        | 14/95 [00:04<00:24,  3.37it/s][A
Training:  17%|█▋        | 16/95 [00:04<00:17,  4.44it/s][A
Training:  19%|█▉        | 18/95 [00:05<00:21,  3.60it/s][A
Training:  21%|██        | 20/95 [00:05<00:16,  4.67it/s][A
Training:  23%|██▎       | 22/95 [00:06<00:19,  3.66it/s][A
Training:  25%|██▌       | 24/95 [00:06<00:15,  4.70it/s][A
Training:  27%|██▋       | 26/95 [00:07<00:18,  3.65it/s][A
Training:  29%|██▉       | 28/95 [00:07<00:14,  4.68it/s][A
Training:  31%|███       | 29/95 [00:08<00:21,  3.09it/s][A
Training:  32%|███▏      | 30/95 [00:

Epoch: 39/98 - Loss: 2.0946 - Accuracy: 0.9463



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:13,  1.19s/it][A
 33%|███▎      | 4/12 [00:01<00:02,  3.80it/s][A
 50%|█████     | 6/12 [00:02<00:02,  2.82it/s][A
100%|██████████| 12/12 [00:03<00:00,  3.45it/s][A
Epochs:  40%|███▉      | 39/98 [17:46<26:56, 27.39s/it]

Val Loss: 2.2568 - Val Accuracy: 0.9422



Training:   0%|          | 0/95 [00:00<?, ?it/s][A
Training:   1%|          | 1/95 [00:01<02:17,  1.46s/it][A
Training:   3%|▎         | 3/95 [00:01<00:40,  2.26it/s][A
Training:   5%|▌         | 5/95 [00:02<00:40,  2.24it/s][A
Training:   7%|▋         | 7/95 [00:02<00:24,  3.59it/s][A
Training:   9%|▉         | 9/95 [00:03<00:27,  3.13it/s][A
Training:  12%|█▏        | 11/95 [00:03<00:19,  4.40it/s][A
Training:  14%|█▎        | 13/95 [00:04<00:21,  3.80it/s][A
Training:  17%|█▋        | 16/95 [00:04<00:13,  5.76it/s][A
Training:  19%|█▉        | 18/95 [00:05<00:20,  3.76it/s][A
Training:  22%|██▏       | 21/95 [00:06<00:20,  3.67it/s][A
Training:  24%|██▍       | 23/95 [00:06<00:15,  4.59it/s][A
Training:  26%|██▋       | 25/95 [00:07<00:20,  3.49it/s][A
Training:  28%|██▊       | 27/95 [00:07<00:15,  4.43it/s][A
Training:  31%|███       | 29/95 [00:08<00:18,  3.60it/s][A
Training:  33%|███▎      | 31/95 [00:08<00:13,  4.59it/s][A
Training:  34%|███▎      | 32/95 [00:

Epoch: 40/98 - Loss: 2.0779 - Accuracy: 0.9491



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:14,  1.27s/it][A
 25%|██▌       | 3/12 [00:01<00:03,  2.71it/s][A
 42%|████▏     | 5/12 [00:02<00:02,  2.78it/s][A
 67%|██████▋   | 8/12 [00:02<00:00,  5.28it/s][A
100%|██████████| 12/12 [00:03<00:00,  3.65it/s][A
Epochs:  41%|████      | 40/98 [18:13<26:26, 27.35s/it]

Val Loss: 2.3251 - Val Accuracy: 0.9462



Training:   0%|          | 0/95 [00:00<?, ?it/s][A
Training:   1%|          | 1/95 [00:01<02:22,  1.52s/it][A
Training:   3%|▎         | 3/95 [00:01<00:40,  2.26it/s][A
Training:   5%|▌         | 5/95 [00:02<00:35,  2.55it/s][A
Training:   7%|▋         | 7/95 [00:02<00:22,  3.88it/s][A
Training:   8%|▊         | 8/95 [00:02<00:19,  4.39it/s][A
Training:   9%|▉         | 9/95 [00:03<00:30,  2.87it/s][A
Training:  12%|█▏        | 11/95 [00:03<00:20,  4.09it/s][A
Training:  14%|█▎        | 13/95 [00:04<00:24,  3.37it/s][A
Training:  16%|█▌        | 15/95 [00:04<00:19,  4.15it/s][A
Training:  18%|█▊        | 17/95 [00:05<00:23,  3.39it/s][A
Training:  20%|██        | 19/95 [00:05<00:17,  4.31it/s][A
Training:  22%|██▏       | 21/95 [00:06<00:20,  3.65it/s][A
Training:  24%|██▍       | 23/95 [00:06<00:15,  4.60it/s][A
Training:  26%|██▋       | 25/95 [00:07<00:18,  3.74it/s][A
Training:  28%|██▊       | 27/95 [00:07<00:14,  4.75it/s][A
Training:  31%|███       | 29/95 [00:0

Epoch: 41/98 - Loss: 2.0137 - Accuracy: 0.9497



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:14,  1.33s/it][A
 33%|███▎      | 4/12 [00:01<00:02,  3.16it/s][A
 42%|████▏     | 5/12 [00:02<00:02,  2.48it/s][A
 58%|█████▊    | 7/12 [00:02<00:01,  4.00it/s][A
 67%|██████▋   | 8/12 [00:02<00:00,  4.39it/s][A
100%|██████████| 12/12 [00:03<00:00,  3.75it/s][A
Epochs:  42%|████▏     | 41/98 [18:40<25:54, 27.27s/it]

Val Loss: 2.1831 - Val Accuracy: 0.9435



Training:   0%|          | 0/95 [00:00<?, ?it/s][A
Training:   1%|          | 1/95 [00:01<02:19,  1.49s/it][A
Training:   3%|▎         | 3/95 [00:01<00:40,  2.29it/s][A
Training:   5%|▌         | 5/95 [00:02<00:34,  2.57it/s][A
Training:   7%|▋         | 7/95 [00:02<00:22,  3.93it/s][A
Training:   9%|▉         | 9/95 [00:03<00:26,  3.22it/s][A
Training:  11%|█         | 10/95 [00:03<00:22,  3.74it/s][A
Training:  13%|█▎        | 12/95 [00:03<00:16,  5.16it/s][A
Training:  14%|█▎        | 13/95 [00:04<00:25,  3.21it/s][A
Training:  16%|█▌        | 15/95 [00:04<00:18,  4.36it/s][A
Training:  18%|█▊        | 17/95 [00:05<00:21,  3.70it/s][A
Training:  19%|█▉        | 18/95 [00:05<00:20,  3.84it/s][A
Training:  21%|██        | 20/95 [00:05<00:14,  5.21it/s][A
Training:  22%|██▏       | 21/95 [00:06<00:19,  3.74it/s][A
Training:  23%|██▎       | 22/95 [00:06<00:19,  3.70it/s][A
Training:  26%|██▋       | 25/95 [00:07<00:19,  3.62it/s][A
Training:  27%|██▋       | 26/95 [00:

Epoch: 42/98 - Loss: 2.0060 - Accuracy: 0.9486



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:14,  1.32s/it][A
 33%|███▎      | 4/12 [00:01<00:02,  3.39it/s][A
 50%|█████     | 6/12 [00:02<00:02,  2.82it/s][A
 67%|██████▋   | 8/12 [00:02<00:00,  4.20it/s][A
100%|██████████| 12/12 [00:03<00:00,  3.48it/s][A
Epochs:  43%|████▎     | 42/98 [19:07<25:24, 27.23s/it]

Val Loss: 2.2971 - Val Accuracy: 0.9387



Training:   0%|          | 0/95 [00:00<?, ?it/s][A
Training:   1%|          | 1/95 [00:01<01:58,  1.26s/it][A
Training:   2%|▏         | 2/95 [00:01<00:55,  1.67it/s][A
Training:   4%|▍         | 4/95 [00:01<00:24,  3.67it/s][A
Training:   5%|▌         | 5/95 [00:02<00:34,  2.64it/s][A
Training:   6%|▋         | 6/95 [00:02<00:27,  3.26it/s][A
Training:   8%|▊         | 8/95 [00:02<00:19,  4.44it/s][A
Training:   9%|▉         | 9/95 [00:03<00:28,  2.99it/s][A
Training:  13%|█▎        | 12/95 [00:03<00:19,  4.29it/s][A
Training:  14%|█▎        | 13/95 [00:04<00:22,  3.65it/s][A
Training:  15%|█▍        | 14/95 [00:04<00:20,  3.90it/s][A
Training:  17%|█▋        | 16/95 [00:04<00:18,  4.27it/s][A
Training:  18%|█▊        | 17/95 [00:05<00:19,  3.93it/s][A
Training:  19%|█▉        | 18/95 [00:05<00:19,  4.00it/s][A
Training:  21%|██        | 20/95 [00:05<00:16,  4.65it/s][A
Training:  22%|██▏       | 21/95 [00:05<00:17,  4.19it/s][A
Training:  23%|██▎       | 22/95 [00:06

Epoch: 43/98 - Loss: 2.0048 - Accuracy: 0.9480



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:14,  1.29s/it][A
 33%|███▎      | 4/12 [00:01<00:02,  3.64it/s][A
 50%|█████     | 6/12 [00:02<00:02,  2.85it/s][A
 67%|██████▋   | 8/12 [00:02<00:00,  4.16it/s][A
100%|██████████| 12/12 [00:03<00:00,  3.49it/s][A
Epochs:  44%|████▍     | 43/98 [19:34<24:42, 26.95s/it]

Val Loss: 2.3517 - Val Accuracy: 0.9415



Training:   0%|          | 0/95 [00:00<?, ?it/s][A
Training:   1%|          | 1/95 [00:01<02:04,  1.33s/it][A
Training:   3%|▎         | 3/95 [00:01<00:35,  2.62it/s][A
Training:   5%|▌         | 5/95 [00:02<00:32,  2.78it/s][A
Training:   6%|▋         | 6/95 [00:02<00:26,  3.42it/s][A
Training:   8%|▊         | 8/95 [00:02<00:16,  5.29it/s][A
Training:  11%|█         | 10/95 [00:03<00:21,  3.98it/s][A
Training:  13%|█▎        | 12/95 [00:03<00:15,  5.37it/s][A
Training:  15%|█▍        | 14/95 [00:03<00:18,  4.32it/s][A
Training:  17%|█▋        | 16/95 [00:04<00:14,  5.32it/s][A
Training:  18%|█▊        | 17/95 [00:04<00:18,  4.11it/s][A
Training:  19%|█▉        | 18/95 [00:04<00:20,  3.84it/s][A
Training:  21%|██        | 20/95 [00:04<00:14,  5.23it/s][A
Training:  22%|██▏       | 21/95 [00:05<00:15,  4.65it/s][A
Training:  23%|██▎       | 22/95 [00:05<00:21,  3.44it/s][A
Training:  25%|██▌       | 24/95 [00:05<00:14,  4.98it/s][A
Training:  26%|██▋       | 25/95 [00:

Epoch: 44/98 - Loss: 2.1131 - Accuracy: 0.9434



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:15,  1.44s/it][A
 25%|██▌       | 3/12 [00:01<00:03,  2.35it/s][A
 42%|████▏     | 5/12 [00:02<00:02,  2.38it/s][A
 58%|█████▊    | 7/12 [00:02<00:01,  3.80it/s][A
100%|██████████| 12/12 [00:03<00:00,  3.61it/s][A
Epochs:  45%|████▍     | 44/98 [20:00<23:59, 26.65s/it]

Val Loss: 2.5761 - Val Accuracy: 0.8819



Training:   0%|          | 0/95 [00:00<?, ?it/s][A
Training:   1%|          | 1/95 [00:01<02:10,  1.39s/it][A
Training:   2%|▏         | 2/95 [00:01<01:03,  1.48it/s][A
Training:   4%|▍         | 4/95 [00:01<00:26,  3.41it/s][A
Training:   5%|▌         | 5/95 [00:02<00:36,  2.48it/s][A
Training:   6%|▋         | 6/95 [00:02<00:27,  3.22it/s][A
Training:   7%|▋         | 7/95 [00:02<00:21,  4.03it/s][A
Training:   9%|▉         | 9/95 [00:03<00:26,  3.30it/s][A
Training:  12%|█▏        | 11/95 [00:03<00:17,  4.70it/s][A
Training:  14%|█▎        | 13/95 [00:04<00:20,  3.93it/s][A
Training:  15%|█▍        | 14/95 [00:04<00:21,  3.84it/s][A
Training:  18%|█▊        | 17/95 [00:05<00:18,  4.17it/s][A
Training:  19%|█▉        | 18/95 [00:05<00:19,  3.92it/s][A
Training:  22%|██▏       | 21/95 [00:05<00:17,  4.29it/s][A
Training:  23%|██▎       | 22/95 [00:06<00:18,  4.04it/s][A
Training:  26%|██▋       | 25/95 [00:06<00:16,  4.18it/s][A
Training:  27%|██▋       | 26/95 [00:07

Epoch: 45/98 - Loss: 1.9891 - Accuracy: 0.9463



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:17,  1.55s/it][A
 25%|██▌       | 3/12 [00:01<00:03,  2.26it/s][A
 42%|████▏     | 5/12 [00:02<00:02,  2.46it/s][A
 58%|█████▊    | 7/12 [00:02<00:01,  3.81it/s][A
 75%|███████▌  | 9/12 [00:03<00:00,  3.45it/s][A
100%|██████████| 12/12 [00:03<00:00,  3.46it/s][A
Epochs:  46%|████▌     | 45/98 [20:27<23:49, 26.97s/it]

Val Loss: 2.2676 - Val Accuracy: 0.9331



Training:   0%|          | 0/95 [00:00<?, ?it/s][A
Training:   1%|          | 1/95 [00:01<01:56,  1.23s/it][A
Training:   3%|▎         | 3/95 [00:01<00:35,  2.61it/s][A
Training:   5%|▌         | 5/95 [00:02<00:38,  2.36it/s][A
Training:   7%|▋         | 7/95 [00:02<00:23,  3.68it/s][A
Training:   9%|▉         | 9/95 [00:03<00:28,  2.99it/s][A
Training:  13%|█▎        | 12/95 [00:03<00:17,  4.83it/s][A
Training:  15%|█▍        | 14/95 [00:04<00:22,  3.63it/s][A
Training:  17%|█▋        | 16/95 [00:04<00:16,  4.79it/s][A
Training:  19%|█▉        | 18/95 [00:05<00:21,  3.63it/s][A
Training:  21%|██        | 20/95 [00:05<00:15,  4.76it/s][A
Training:  23%|██▎       | 22/95 [00:06<00:20,  3.59it/s][A
Training:  25%|██▌       | 24/95 [00:06<00:15,  4.61it/s][A
Training:  27%|██▋       | 26/95 [00:07<00:18,  3.81it/s][A
Training:  29%|██▉       | 28/95 [00:07<00:13,  4.89it/s][A
Training:  31%|███       | 29/95 [00:07<00:18,  3.59it/s][A
Training:  32%|███▏      | 30/95 [00:

Epoch: 46/98 - Loss: 1.9414 - Accuracy: 0.9450



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:17,  1.55s/it][A
 25%|██▌       | 3/12 [00:01<00:04,  2.18it/s][A
 42%|████▏     | 5/12 [00:02<00:02,  2.50it/s][A
 67%|██████▋   | 8/12 [00:02<00:00,  4.75it/s][A
100%|██████████| 12/12 [00:03<00:00,  3.48it/s][A
Epochs:  47%|████▋     | 46/98 [20:54<23:22, 26.97s/it]

Val Loss: 2.1920 - Val Accuracy: 0.9360



Training:   0%|          | 0/95 [00:00<?, ?it/s][A
Training:   1%|          | 1/95 [00:01<02:04,  1.32s/it][A
Training:   3%|▎         | 3/95 [00:01<00:35,  2.62it/s][A
Training:   5%|▌         | 5/95 [00:02<00:40,  2.22it/s][A
Training:   7%|▋         | 7/95 [00:02<00:25,  3.45it/s][A
Training:   9%|▉         | 9/95 [00:03<00:28,  3.04it/s][A
Training:  12%|█▏        | 11/95 [00:03<00:19,  4.26it/s][A
Training:  14%|█▎        | 13/95 [00:04<00:22,  3.64it/s][A
Training:  16%|█▌        | 15/95 [00:04<00:17,  4.56it/s][A
Training:  18%|█▊        | 17/95 [00:05<00:19,  4.04it/s][A
Training:  20%|██        | 19/95 [00:05<00:15,  4.78it/s][A
Training:  22%|██▏       | 21/95 [00:05<00:18,  4.07it/s][A
Training:  23%|██▎       | 22/95 [00:06<00:17,  4.22it/s][A
Training:  24%|██▍       | 23/95 [00:06<00:15,  4.76it/s][A
Training:  26%|██▋       | 25/95 [00:06<00:16,  4.13it/s][A
Training:  27%|██▋       | 26/95 [00:07<00:16,  4.12it/s][A
Training:  31%|███       | 29/95 [00:

Epoch: 47/98 - Loss: 1.9312 - Accuracy: 0.9485



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:15,  1.38s/it][A
 25%|██▌       | 3/12 [00:01<00:03,  2.48it/s][A
 42%|████▏     | 5/12 [00:02<00:03,  2.32it/s][A
 58%|█████▊    | 7/12 [00:02<00:01,  3.51it/s][A
 75%|███████▌  | 9/12 [00:03<00:00,  3.09it/s][A
100%|██████████| 12/12 [00:03<00:00,  3.35it/s][A
Epochs:  48%|████▊     | 47/98 [21:21<22:54, 26.95s/it]

Val Loss: 2.1456 - Val Accuracy: 0.9435



Training:   0%|          | 0/95 [00:00<?, ?it/s][A
Training:   1%|          | 1/95 [00:01<02:02,  1.31s/it][A
Training:   5%|▌         | 5/95 [00:02<00:36,  2.47it/s][A
Training:   7%|▋         | 7/95 [00:02<00:24,  3.61it/s][A
Training:   9%|▉         | 9/95 [00:03<00:28,  3.05it/s][A
Training:  12%|█▏        | 11/95 [00:03<00:20,  4.07it/s][A
Training:  14%|█▎        | 13/95 [00:04<00:22,  3.59it/s][A
Training:  17%|█▋        | 16/95 [00:04<00:14,  5.41it/s][A
Training:  19%|█▉        | 18/95 [00:04<00:16,  4.65it/s][A
Training:  21%|██        | 20/95 [00:04<00:12,  5.94it/s][A
Training:  23%|██▎       | 22/95 [00:05<00:14,  4.87it/s][A
Training:  25%|██▌       | 24/95 [00:05<00:13,  5.30it/s][A
Training:  26%|██▋       | 25/95 [00:06<00:18,  3.81it/s][A
Training:  28%|██▊       | 27/95 [00:06<00:13,  5.11it/s][A
Training:  29%|██▉       | 28/95 [00:06<00:12,  5.31it/s][A
Training:  31%|███       | 29/95 [00:07<00:18,  3.51it/s][A
Training:  32%|███▏      | 30/95 [00

Epoch: 48/98 - Loss: 2.0215 - Accuracy: 0.9425



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:15,  1.45s/it][A
 17%|█▋        | 2/12 [00:01<00:06,  1.44it/s][A
 42%|████▏     | 5/12 [00:02<00:02,  2.41it/s][A
 50%|█████     | 6/12 [00:02<00:02,  2.81it/s][A
100%|██████████| 12/12 [00:03<00:00,  3.32it/s][A
Epochs:  49%|████▉     | 48/98 [21:48<22:19, 26.80s/it]

Val Loss: 2.2111 - Val Accuracy: 0.9417



Training:   0%|          | 0/95 [00:00<?, ?it/s][A
Training:   1%|          | 1/95 [00:01<02:02,  1.30s/it][A
Training:   2%|▏         | 2/95 [00:01<00:55,  1.67it/s][A
Training:   4%|▍         | 4/95 [00:01<00:25,  3.61it/s][A
Training:   5%|▌         | 5/95 [00:02<00:33,  2.71it/s][A
Training:   6%|▋         | 6/95 [00:02<00:29,  3.06it/s][A
Training:   9%|▉         | 9/95 [00:02<00:21,  3.98it/s][A
Training:  11%|█         | 10/95 [00:03<00:21,  3.89it/s][A
Training:  13%|█▎        | 12/95 [00:03<00:15,  5.47it/s][A
Training:  14%|█▎        | 13/95 [00:03<00:22,  3.70it/s][A
Training:  15%|█▍        | 14/95 [00:04<00:21,  3.82it/s][A
Training:  18%|█▊        | 17/95 [00:04<00:20,  3.86it/s][A
Training:  19%|█▉        | 18/95 [00:05<00:18,  4.19it/s][A
Training:  21%|██        | 20/95 [00:05<00:13,  5.67it/s][A
Training:  22%|██▏       | 21/95 [00:05<00:19,  3.79it/s][A
Training:  23%|██▎       | 22/95 [00:06<00:17,  4.10it/s][A
Training:  24%|██▍       | 23/95 [00:0

Epoch: 49/98 - Loss: 1.9977 - Accuracy: 0.9456



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:14,  1.30s/it][A
 25%|██▌       | 3/12 [00:01<00:03,  2.55it/s][A
 42%|████▏     | 5/12 [00:02<00:02,  2.50it/s][A
 58%|█████▊    | 7/12 [00:02<00:01,  3.79it/s][A
 75%|███████▌  | 9/12 [00:03<00:00,  3.13it/s][A
100%|██████████| 12/12 [00:03<00:00,  3.38it/s][A
Epochs:  50%|█████     | 49/98 [22:14<21:46, 26.65s/it]

Val Loss: 2.6313 - Val Accuracy: 0.9437



Training:   0%|          | 0/95 [00:00<?, ?it/s][A
Training:   1%|          | 1/95 [00:01<02:22,  1.52s/it][A
Training:   3%|▎         | 3/95 [00:01<00:40,  2.27it/s][A
Training:   5%|▌         | 5/95 [00:02<00:38,  2.36it/s][A
Training:   6%|▋         | 6/95 [00:02<00:29,  2.97it/s][A
Training:   8%|▊         | 8/95 [00:02<00:19,  4.57it/s][A
Training:  11%|█         | 10/95 [00:03<00:23,  3.65it/s][A
Training:  13%|█▎        | 12/95 [00:03<00:17,  4.85it/s][A
Training:  14%|█▎        | 13/95 [00:04<00:23,  3.46it/s][A
Training:  16%|█▌        | 15/95 [00:04<00:16,  4.95it/s][A
Training:  18%|█▊        | 17/95 [00:05<00:21,  3.64it/s][A
Training:  19%|█▉        | 18/95 [00:05<00:18,  4.08it/s][A
Training:  20%|██        | 19/95 [00:05<00:16,  4.55it/s][A
Training:  22%|██▏       | 21/95 [00:06<00:19,  3.76it/s][A
Training:  24%|██▍       | 23/95 [00:06<00:14,  4.94it/s][A
Training:  26%|██▋       | 25/95 [00:07<00:18,  3.69it/s][A
Training:  28%|██▊       | 27/95 [00:

Epoch: 50/98 - Loss: 2.0879 - Accuracy: 0.9452



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:14,  1.34s/it][A
 25%|██▌       | 3/12 [00:01<00:03,  2.53it/s][A
 42%|████▏     | 5/12 [00:02<00:03,  2.26it/s][A
 58%|█████▊    | 7/12 [00:02<00:01,  3.54it/s][A
100%|██████████| 12/12 [00:03<00:00,  3.33it/s][A
Epochs:  51%|█████     | 50/98 [22:41<21:23, 26.73s/it]

Val Loss: 2.2049 - Val Accuracy: 0.9372



Training:   0%|          | 0/95 [00:00<?, ?it/s][A
Training:   1%|          | 1/95 [00:01<01:56,  1.24s/it][A
Training:   2%|▏         | 2/95 [00:01<00:54,  1.70it/s][A
Training:   5%|▌         | 5/95 [00:02<00:32,  2.81it/s][A
Training:   7%|▋         | 7/95 [00:02<00:21,  4.16it/s][A
Training:   8%|▊         | 8/95 [00:02<00:18,  4.77it/s][A
Training:   9%|▉         | 9/95 [00:03<00:33,  2.55it/s][A
Training:  14%|█▎        | 13/95 [00:04<00:26,  3.15it/s][A
Training:  18%|█▊        | 17/95 [00:05<00:21,  3.63it/s][A
Training:  20%|██        | 19/95 [00:05<00:16,  4.50it/s][A
Training:  22%|██▏       | 21/95 [00:06<00:18,  3.93it/s][A
Training:  24%|██▍       | 23/95 [00:06<00:14,  4.82it/s][A
Training:  26%|██▋       | 25/95 [00:07<00:17,  3.99it/s][A
Training:  27%|██▋       | 26/95 [00:07<00:15,  4.40it/s][A
Training:  31%|███       | 29/95 [00:07<00:16,  4.11it/s][A
Training:  33%|███▎      | 31/95 [00:08<00:12,  5.25it/s][A
Training:  35%|███▍      | 33/95 [00:0

Epoch: 51/98 - Loss: 1.9290 - Accuracy: 0.9444



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:15,  1.40s/it][A
 17%|█▋        | 2/12 [00:01<00:06,  1.43it/s][A
 33%|███▎      | 4/12 [00:01<00:02,  3.27it/s][A
 42%|████▏     | 5/12 [00:02<00:02,  2.39it/s][A
 50%|█████     | 6/12 [00:02<00:02,  2.96it/s][A
 67%|██████▋   | 8/12 [00:02<00:00,  4.69it/s][A
100%|██████████| 12/12 [00:03<00:00,  3.36it/s][A
Epochs:  52%|█████▏    | 51/98 [23:07<20:51, 26.63s/it]

Val Loss: 2.3360 - Val Accuracy: 0.9176



Training:   0%|          | 0/95 [00:00<?, ?it/s][A
Training:   1%|          | 1/95 [00:01<02:15,  1.44s/it][A
Training:   2%|▏         | 2/95 [00:01<01:01,  1.50it/s][A
Training:   5%|▌         | 5/95 [00:02<00:39,  2.28it/s][A
Training:   7%|▋         | 7/95 [00:02<00:25,  3.45it/s][A
Training:   9%|▉         | 9/95 [00:03<00:27,  3.11it/s][A
Training:  11%|█         | 10/95 [00:03<00:24,  3.53it/s][A
Training:  12%|█▏        | 11/95 [00:03<00:20,  4.14it/s][A
Training:  14%|█▎        | 13/95 [00:04<00:24,  3.31it/s][A
Training:  15%|█▍        | 14/95 [00:04<00:22,  3.59it/s][A
Training:  16%|█▌        | 15/95 [00:04<00:18,  4.23it/s][A
Training:  17%|█▋        | 16/95 [00:04<00:16,  4.93it/s][A
Training:  18%|█▊        | 17/95 [00:05<00:23,  3.25it/s][A
Training:  20%|██        | 19/95 [00:05<00:15,  5.04it/s][A
Training:  22%|██▏       | 21/95 [00:06<00:20,  3.65it/s][A
Training:  24%|██▍       | 23/95 [00:06<00:14,  4.85it/s][A
Training:  26%|██▋       | 25/95 [00:

Epoch: 52/98 - Loss: 1.8678 - Accuracy: 0.9443



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:15,  1.37s/it][A
 17%|█▋        | 2/12 [00:01<00:06,  1.55it/s][A
 33%|███▎      | 4/12 [00:01<00:02,  3.62it/s][A
 50%|█████     | 6/12 [00:02<00:01,  3.01it/s][A
 67%|██████▋   | 8/12 [00:02<00:00,  4.09it/s][A
 75%|███████▌  | 9/12 [00:03<00:01,  2.87it/s][A
100%|██████████| 12/12 [00:03<00:00,  3.28it/s][A
Epochs:  53%|█████▎    | 52/98 [23:34<20:23, 26.59s/it]

Val Loss: 2.1635 - Val Accuracy: 0.9400



Training:   0%|          | 0/95 [00:00<?, ?it/s][A
Training:   1%|          | 1/95 [00:01<02:13,  1.42s/it][A
Training:   3%|▎         | 3/95 [00:01<00:37,  2.43it/s][A
Training:   5%|▌         | 5/95 [00:02<00:36,  2.46it/s][A
Training:   6%|▋         | 6/95 [00:02<00:28,  3.08it/s][A
Training:   7%|▋         | 7/95 [00:02<00:23,  3.79it/s][A
Training:   9%|▉         | 9/95 [00:03<00:28,  3.06it/s][A
Training:  11%|█         | 10/95 [00:03<00:25,  3.40it/s][A
Training:  13%|█▎        | 12/95 [00:03<00:16,  4.98it/s][A
Training:  14%|█▎        | 13/95 [00:04<00:25,  3.22it/s][A
Training:  15%|█▍        | 14/95 [00:04<00:21,  3.78it/s][A
Training:  16%|█▌        | 15/95 [00:04<00:18,  4.42it/s][A
Training:  18%|█▊        | 17/95 [00:05<00:21,  3.64it/s][A
Training:  20%|██        | 19/95 [00:05<00:14,  5.14it/s][A
Training:  22%|██▏       | 21/95 [00:06<00:18,  3.90it/s][A
Training:  25%|██▌       | 24/95 [00:06<00:13,  5.44it/s][A
Training:  26%|██▋       | 25/95 [00:0

Epoch: 53/98 - Loss: 1.9706 - Accuracy: 0.9417



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:15,  1.36s/it][A
 33%|███▎      | 4/12 [00:01<00:02,  3.33it/s][A
 50%|█████     | 6/12 [00:02<00:02,  2.86it/s][A
 67%|██████▋   | 8/12 [00:02<00:00,  4.12it/s][A
100%|██████████| 12/12 [00:03<00:00,  3.38it/s][A
Epochs:  54%|█████▍    | 53/98 [24:00<19:56, 26.59s/it]

Val Loss: 2.2416 - Val Accuracy: 0.9394



Training:   0%|          | 0/95 [00:00<?, ?it/s][A
Training:   1%|          | 1/95 [00:01<01:56,  1.24s/it][A
Training:   2%|▏         | 2/95 [00:01<00:55,  1.69it/s][A
Training:   5%|▌         | 5/95 [00:02<00:31,  2.90it/s][A
Training:   6%|▋         | 6/95 [00:02<00:27,  3.25it/s][A
Training:   8%|▊         | 8/95 [00:02<00:18,  4.74it/s][A
Training:   9%|▉         | 9/95 [00:03<00:27,  3.15it/s][A
Training:  11%|█         | 10/95 [00:03<00:24,  3.48it/s][A
Training:  13%|█▎        | 12/95 [00:03<00:17,  4.68it/s][A
Training:  14%|█▎        | 13/95 [00:04<00:27,  3.03it/s][A
Training:  15%|█▍        | 14/95 [00:04<00:22,  3.65it/s][A
Training:  17%|█▋        | 16/95 [00:04<00:15,  5.22it/s][A
Training:  18%|█▊        | 17/95 [00:05<00:25,  3.09it/s][A
Training:  20%|██        | 19/95 [00:05<00:17,  4.37it/s][A
Training:  22%|██▏       | 21/95 [00:06<00:21,  3.42it/s][A
Training:  24%|██▍       | 23/95 [00:06<00:15,  4.71it/s][A
Training:  26%|██▋       | 25/95 [00:0

Epoch: 54/98 - Loss: 1.9091 - Accuracy: 0.9403



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:15,  1.43s/it][A
 17%|█▋        | 2/12 [00:01<00:07,  1.43it/s][A
 33%|███▎      | 4/12 [00:01<00:02,  3.37it/s][A
 42%|████▏     | 5/12 [00:02<00:02,  2.42it/s][A
 50%|█████     | 6/12 [00:02<00:01,  3.02it/s][A
 67%|██████▋   | 8/12 [00:02<00:00,  4.80it/s][A
 75%|███████▌  | 9/12 [00:03<00:01,  2.82it/s][A
100%|██████████| 12/12 [00:03<00:00,  3.21it/s][A
Epochs:  55%|█████▌    | 54/98 [24:27<19:31, 26.61s/it]

Val Loss: 2.1804 - Val Accuracy: 0.9424



Training:   0%|          | 0/95 [00:00<?, ?it/s][A
Training:   1%|          | 1/95 [00:01<02:22,  1.51s/it][A
Training:   3%|▎         | 3/95 [00:01<00:41,  2.24it/s][A
Training:   5%|▌         | 5/95 [00:02<00:37,  2.40it/s][A
Training:   7%|▋         | 7/95 [00:02<00:24,  3.64it/s][A
Training:   9%|▉         | 9/95 [00:03<00:28,  3.01it/s][A
Training:  11%|█         | 10/95 [00:03<00:24,  3.47it/s][A
Training:  13%|█▎        | 12/95 [00:03<00:16,  4.89it/s][A
Training:  14%|█▎        | 13/95 [00:04<00:26,  3.05it/s][A
Training:  15%|█▍        | 14/95 [00:04<00:22,  3.62it/s][A
Training:  18%|█▊        | 17/95 [00:05<00:21,  3.64it/s][A
Training:  19%|█▉        | 18/95 [00:05<00:18,  4.10it/s][A
Training:  22%|██▏       | 21/95 [00:06<00:20,  3.59it/s][A
Training:  26%|██▋       | 25/95 [00:07<00:19,  3.59it/s][A
Training:  28%|██▊       | 27/95 [00:07<00:15,  4.41it/s][A
Training:  31%|███       | 29/95 [00:08<00:18,  3.51it/s][A
Training:  35%|███▍      | 33/95 [00:

Epoch: 55/98 - Loss: 1.9340 - Accuracy: 0.9432



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:15,  1.40s/it][A
 33%|███▎      | 4/12 [00:01<00:02,  3.35it/s][A
 50%|█████     | 6/12 [00:02<00:02,  2.70it/s][A
 67%|██████▋   | 8/12 [00:02<00:00,  4.03it/s][A
100%|██████████| 12/12 [00:03<00:00,  3.37it/s][A
Epochs:  56%|█████▌    | 55/98 [24:54<19:05, 26.63s/it]

Val Loss: 2.1455 - Val Accuracy: 0.9396



Training:   0%|          | 0/95 [00:00<?, ?it/s][A
Training:   1%|          | 1/95 [00:01<02:18,  1.47s/it][A
Training:   3%|▎         | 3/95 [00:01<00:40,  2.24it/s][A
Training:   5%|▌         | 5/95 [00:02<00:39,  2.29it/s][A
Training:   7%|▋         | 7/95 [00:02<00:25,  3.45it/s][A
Training:   9%|▉         | 9/95 [00:03<00:29,  2.90it/s][A
Training:  12%|█▏        | 11/95 [00:03<00:20,  4.10it/s][A
Training:  13%|█▎        | 12/95 [00:03<00:18,  4.55it/s][A
Training:  14%|█▎        | 13/95 [00:04<00:25,  3.22it/s][A
Training:  15%|█▍        | 14/95 [00:04<00:21,  3.80it/s][A
Training:  16%|█▌        | 15/95 [00:04<00:17,  4.47it/s][A
Training:  18%|█▊        | 17/95 [00:05<00:22,  3.54it/s][A
Training:  19%|█▉        | 18/95 [00:05<00:20,  3.73it/s][A
Training:  20%|██        | 19/95 [00:05<00:17,  4.40it/s][A
Training:  22%|██▏       | 21/95 [00:06<00:21,  3.44it/s][A
Training:  23%|██▎       | 22/95 [00:06<00:18,  4.03it/s][A
Training:  26%|██▋       | 25/95 [00:

Epoch: 56/98 - Loss: 1.8910 - Accuracy: 0.9469



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:14,  1.36s/it][A
 17%|█▋        | 2/12 [00:01<00:06,  1.59it/s][A
 42%|████▏     | 5/12 [00:02<00:02,  2.50it/s][A
 67%|██████▋   | 8/12 [00:02<00:00,  4.41it/s][A
 75%|███████▌  | 9/12 [00:03<00:01,  2.90it/s][A
100%|██████████| 12/12 [00:03<00:00,  3.28it/s][A
Epochs:  57%|█████▋    | 56/98 [25:21<18:40, 26.69s/it]

Val Loss: 2.2875 - Val Accuracy: 0.9336



Training:   0%|          | 0/95 [00:00<?, ?it/s][A
Training:   1%|          | 1/95 [00:01<02:44,  1.75s/it][A
Training:   2%|▏         | 2/95 [00:01<01:14,  1.25it/s][A
Training:   4%|▍         | 4/95 [00:02<00:31,  2.94it/s][A
Training:   5%|▌         | 5/95 [00:02<00:38,  2.34it/s][A
Training:   7%|▋         | 7/95 [00:02<00:22,  3.95it/s][A
Training:   9%|▉         | 9/95 [00:03<00:28,  3.00it/s][A
Training:  12%|█▏        | 11/95 [00:03<00:20,  4.10it/s][A
Training:  14%|█▎        | 13/95 [00:04<00:25,  3.21it/s][A
Training:  16%|█▌        | 15/95 [00:04<00:18,  4.33it/s][A
Training:  18%|█▊        | 17/95 [00:05<00:24,  3.19it/s][A
Training:  20%|██        | 19/95 [00:06<00:18,  4.15it/s][A
Training:  22%|██▏       | 21/95 [00:06<00:19,  3.78it/s][A
Training:  26%|██▋       | 25/95 [00:07<00:18,  3.87it/s][A
Training:  28%|██▊       | 27/95 [00:07<00:14,  4.70it/s][A
Training:  31%|███       | 29/95 [00:08<00:17,  3.82it/s][A
Training:  35%|███▍      | 33/95 [00:0

Epoch: 57/98 - Loss: 1.8826 - Accuracy: 0.9404



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:16,  1.50s/it][A
 33%|███▎      | 4/12 [00:01<00:02,  3.04it/s][A
 50%|█████     | 6/12 [00:02<00:02,  2.60it/s][A
 75%|███████▌  | 9/12 [00:03<00:01,  2.89it/s][A
100%|██████████| 12/12 [00:03<00:00,  3.23it/s][A
Epochs:  58%|█████▊    | 57/98 [25:48<18:26, 26.98s/it]

Val Loss: 2.1789 - Val Accuracy: 0.9393



Training:   0%|          | 0/95 [00:00<?, ?it/s][A
Training:   1%|          | 1/95 [00:01<02:14,  1.44s/it][A
Training:   2%|▏         | 2/95 [00:01<01:00,  1.54it/s][A
Training:   3%|▎         | 3/95 [00:01<00:37,  2.44it/s][A
Training:   5%|▌         | 5/95 [00:02<00:33,  2.70it/s][A
Training:   6%|▋         | 6/95 [00:02<00:26,  3.37it/s][A
Training:   8%|▊         | 8/95 [00:02<00:17,  5.08it/s][A
Training:   9%|▉         | 9/95 [00:03<00:25,  3.34it/s][A
Training:  11%|█         | 10/95 [00:03<00:25,  3.37it/s][A
Training:  13%|█▎        | 12/95 [00:03<00:16,  4.91it/s][A
Training:  14%|█▎        | 13/95 [00:04<00:24,  3.40it/s][A
Training:  15%|█▍        | 14/95 [00:04<00:20,  3.90it/s][A
Training:  17%|█▋        | 16/95 [00:04<00:15,  5.22it/s][A
Training:  18%|█▊        | 17/95 [00:05<00:22,  3.45it/s][A
Training:  19%|█▉        | 18/95 [00:05<00:19,  3.92it/s][A
Training:  21%|██        | 20/95 [00:05<00:15,  4.86it/s][A
Training:  22%|██▏       | 21/95 [00:06

Epoch: 58/98 - Loss: 1.8120 - Accuracy: 0.9461



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:13,  1.24s/it][A
 25%|██▌       | 3/12 [00:01<00:03,  2.48it/s][A
 42%|████▏     | 5/12 [00:02<00:02,  2.70it/s][A
 50%|█████     | 6/12 [00:02<00:01,  3.30it/s][A
 58%|█████▊    | 7/12 [00:02<00:01,  3.64it/s][A
 75%|███████▌  | 9/12 [00:03<00:00,  3.55it/s][A
 83%|████████▎ | 10/12 [00:03<00:00,  3.86it/s][A
100%|██████████| 12/12 [00:03<00:00,  3.28it/s][A
Epochs:  59%|█████▉    | 58/98 [26:15<17:58, 26.96s/it]

Val Loss: 2.1014 - Val Accuracy: 0.9376



Training:   0%|          | 0/95 [00:00<?, ?it/s][A
Training:   1%|          | 1/95 [00:01<02:19,  1.49s/it][A
Training:   3%|▎         | 3/95 [00:01<00:39,  2.32it/s][A
Training:   5%|▌         | 5/95 [00:02<00:35,  2.53it/s][A
Training:   9%|▉         | 9/95 [00:03<00:25,  3.38it/s][A
Training:  12%|█▏        | 11/95 [00:03<00:19,  4.28it/s][A
Training:  14%|█▎        | 13/95 [00:04<00:24,  3.39it/s][A
Training:  17%|█▋        | 16/95 [00:04<00:15,  5.14it/s][A
Training:  19%|█▉        | 18/95 [00:05<00:20,  3.71it/s][A
Training:  21%|██        | 20/95 [00:05<00:15,  4.75it/s][A
Training:  23%|██▎       | 22/95 [00:06<00:19,  3.74it/s][A
Training:  25%|██▌       | 24/95 [00:06<00:14,  4.75it/s][A
Training:  27%|██▋       | 26/95 [00:07<00:18,  3.70it/s][A
Training:  31%|███       | 29/95 [00:08<00:18,  3.50it/s][A
Training:  33%|███▎      | 31/95 [00:08<00:14,  4.45it/s][A
Training:  35%|███▍      | 33/95 [00:09<00:16,  3.75it/s][A
Training:  38%|███▊      | 36/95 [00

Epoch: 59/98 - Loss: 1.9118 - Accuracy: 0.9402



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:16,  1.51s/it][A
 25%|██▌       | 3/12 [00:01<00:03,  2.29it/s][A
 42%|████▏     | 5/12 [00:02<00:02,  2.62it/s][A
 50%|█████     | 6/12 [00:02<00:02,  2.88it/s][A
 75%|███████▌  | 9/12 [00:03<00:00,  3.68it/s][A
100%|██████████| 12/12 [00:03<00:00,  3.30it/s][A
Epochs:  60%|██████    | 59/98 [26:42<17:24, 26.79s/it]

Val Loss: 2.1465 - Val Accuracy: 0.9324



Training:   0%|          | 0/95 [00:00<?, ?it/s][A
Training:   1%|          | 1/95 [00:01<02:17,  1.46s/it][A
Training:   4%|▍         | 4/95 [00:01<00:27,  3.28it/s][A
Training:   6%|▋         | 6/95 [00:02<00:32,  2.75it/s][A
Training:   8%|▊         | 8/95 [00:02<00:23,  3.77it/s][A
Training:   9%|▉         | 9/95 [00:03<00:30,  2.81it/s][A
Training:  11%|█         | 10/95 [00:03<00:25,  3.27it/s][A
Training:  13%|█▎        | 12/95 [00:03<00:17,  4.71it/s][A
Training:  14%|█▎        | 13/95 [00:04<00:24,  3.37it/s][A
Training:  15%|█▍        | 14/95 [00:04<00:24,  3.25it/s][A
Training:  17%|█▋        | 16/95 [00:04<00:16,  4.83it/s][A
Training:  18%|█▊        | 17/95 [00:05<00:21,  3.67it/s][A
Training:  19%|█▉        | 18/95 [00:05<00:22,  3.45it/s][A
Training:  21%|██        | 20/95 [00:05<00:14,  5.07it/s][A
Training:  22%|██▏       | 21/95 [00:06<00:18,  3.94it/s][A
Training:  23%|██▎       | 22/95 [00:06<00:17,  4.18it/s][A
Training:  24%|██▍       | 23/95 [00:

Epoch: 60/98 - Loss: 1.8324 - Accuracy: 0.9509



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:14,  1.36s/it][A
 33%|███▎      | 4/12 [00:01<00:02,  3.39it/s][A
 50%|█████     | 6/12 [00:02<00:02,  2.66it/s][A
 67%|██████▋   | 8/12 [00:02<00:01,  3.94it/s][A
100%|██████████| 12/12 [00:03<00:00,  3.38it/s][A
Epochs:  61%|██████    | 60/98 [27:08<16:52, 26.63s/it]

Val Loss: 2.1412 - Val Accuracy: 0.9400



Training:   0%|          | 0/95 [00:00<?, ?it/s][A
Training:   1%|          | 1/95 [00:01<02:08,  1.37s/it][A
Training:   2%|▏         | 2/95 [00:01<01:01,  1.52it/s][A
Training:   5%|▌         | 5/95 [00:02<00:37,  2.41it/s][A
Training:   8%|▊         | 8/95 [00:02<00:19,  4.42it/s][A
Training:  11%|█         | 10/95 [00:03<00:26,  3.27it/s][A
Training:  13%|█▎        | 12/95 [00:03<00:19,  4.34it/s][A
Training:  15%|█▍        | 14/95 [00:04<00:23,  3.46it/s][A
Training:  17%|█▋        | 16/95 [00:04<00:17,  4.54it/s][A
Training:  19%|█▉        | 18/95 [00:05<00:19,  3.94it/s][A
Training:  22%|██▏       | 21/95 [00:06<00:20,  3.54it/s][A
Training:  24%|██▍       | 23/95 [00:06<00:17,  4.15it/s][A
Training:  26%|██▋       | 25/95 [00:07<00:19,  3.63it/s][A
Training:  28%|██▊       | 27/95 [00:07<00:16,  4.22it/s][A
Training:  31%|███       | 29/95 [00:08<00:17,  3.88it/s][A
Training:  32%|███▏      | 30/95 [00:08<00:16,  4.03it/s][A
Training:  33%|███▎      | 31/95 [00

Epoch: 61/98 - Loss: 1.8678 - Accuracy: 0.9387



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:14,  1.34s/it][A
 33%|███▎      | 4/12 [00:01<00:02,  3.53it/s][A
 50%|█████     | 6/12 [00:02<00:02,  2.74it/s][A
 67%|██████▋   | 8/12 [00:02<00:01,  3.91it/s][A
100%|██████████| 12/12 [00:03<00:00,  3.36it/s][A
Epochs:  62%|██████▏   | 61/98 [27:35<16:35, 26.89s/it]

Val Loss: 2.2183 - Val Accuracy: 0.9400



Training:   0%|          | 0/95 [00:00<?, ?it/s][A
Training:   1%|          | 1/95 [00:01<02:06,  1.35s/it][A
Training:   2%|▏         | 2/95 [00:01<00:58,  1.58it/s][A
Training:   3%|▎         | 3/95 [00:01<00:37,  2.47it/s][A
Training:   5%|▌         | 5/95 [00:02<00:34,  2.61it/s][A
Training:   7%|▋         | 7/95 [00:02<00:22,  3.92it/s][A
Training:   9%|▉         | 9/95 [00:03<00:26,  3.28it/s][A
Training:  12%|█▏        | 11/95 [00:03<00:19,  4.23it/s][A
Training:  14%|█▎        | 13/95 [00:04<00:21,  3.78it/s][A
Training:  16%|█▌        | 15/95 [00:04<00:18,  4.30it/s][A
Training:  18%|█▊        | 17/95 [00:05<00:19,  4.06it/s][A
Training:  20%|██        | 19/95 [00:05<00:18,  4.03it/s][A
Training:  22%|██▏       | 21/95 [00:05<00:17,  4.27it/s][A
Training:  24%|██▍       | 23/95 [00:06<00:19,  3.73it/s][A
Training:  26%|██▋       | 25/95 [00:06<00:15,  4.49it/s][A
Training:  28%|██▊       | 27/95 [00:07<00:18,  3.76it/s][A
Training:  31%|███       | 29/95 [00:0

Epoch: 62/98 - Loss: 1.8176 - Accuracy: 0.9471



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:13,  1.23s/it][A
 33%|███▎      | 4/12 [00:01<00:02,  3.79it/s][A
 50%|█████     | 6/12 [00:02<00:02,  2.84it/s][A
 75%|███████▌  | 9/12 [00:03<00:00,  3.14it/s][A
100%|██████████| 12/12 [00:03<00:00,  3.54it/s][A
Epochs:  63%|██████▎   | 62/98 [28:02<16:09, 26.93s/it]

Val Loss: 2.1461 - Val Accuracy: 0.9360



Training:   0%|          | 0/95 [00:00<?, ?it/s][A
Training:   1%|          | 1/95 [00:01<01:59,  1.27s/it][A
Training:   3%|▎         | 3/95 [00:01<00:35,  2.57it/s][A
Training:   4%|▍         | 4/95 [00:01<00:26,  3.44it/s][A
Training:   5%|▌         | 5/95 [00:02<00:42,  2.14it/s][A
Training:   7%|▋         | 7/95 [00:02<00:24,  3.56it/s][A
Training:   8%|▊         | 8/95 [00:02<00:22,  3.84it/s][A
Training:   9%|▉         | 9/95 [00:03<00:29,  2.95it/s][A
Training:  12%|█▏        | 11/95 [00:03<00:18,  4.59it/s][A
Training:  13%|█▎        | 12/95 [00:03<00:21,  3.85it/s][A
Training:  14%|█▎        | 13/95 [00:04<00:26,  3.05it/s][A
Training:  16%|█▌        | 15/95 [00:04<00:17,  4.55it/s][A
Training:  17%|█▋        | 16/95 [00:04<00:20,  3.78it/s][A
Training:  18%|█▊        | 17/95 [00:05<00:21,  3.68it/s][A
Training:  20%|██        | 19/95 [00:05<00:15,  4.91it/s][A
Training:  21%|██        | 20/95 [00:05<00:20,  3.59it/s][A
Training:  22%|██▏       | 21/95 [00:06

Epoch: 63/98 - Loss: 1.8025 - Accuracy: 0.9450



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:14,  1.29s/it][A
 33%|███▎      | 4/12 [00:01<00:02,  3.63it/s][A
 50%|█████     | 6/12 [00:02<00:01,  3.24it/s][A
 67%|██████▋   | 8/12 [00:02<00:00,  4.68it/s][A
100%|██████████| 12/12 [00:03<00:00,  3.66it/s][A
Epochs:  64%|██████▍   | 63/98 [28:29<15:42, 26.93s/it]

Val Loss: 2.2938 - Val Accuracy: 0.9359



Training:   0%|          | 0/95 [00:00<?, ?it/s][A
Training:   1%|          | 1/95 [00:01<02:25,  1.55s/it][A
Training:   3%|▎         | 3/95 [00:01<00:40,  2.26it/s][A
Training:   5%|▌         | 5/95 [00:02<00:38,  2.33it/s][A
Training:   7%|▋         | 7/95 [00:02<00:23,  3.71it/s][A
Training:   9%|▉         | 9/95 [00:03<00:30,  2.86it/s][A
Training:  13%|█▎        | 12/95 [00:03<00:17,  4.70it/s][A
Training:  15%|█▍        | 14/95 [00:04<00:23,  3.46it/s][A
Training:  18%|█▊        | 17/95 [00:05<00:23,  3.28it/s][A
Training:  20%|██        | 19/95 [00:05<00:18,  4.16it/s][A
Training:  22%|██▏       | 21/95 [00:06<00:20,  3.58it/s][A
Training:  25%|██▌       | 24/95 [00:06<00:13,  5.19it/s][A
Training:  27%|██▋       | 26/95 [00:07<00:16,  4.09it/s][A
Training:  31%|███       | 29/95 [00:08<00:18,  3.53it/s][A
Training:  33%|███▎      | 31/95 [00:08<00:14,  4.46it/s][A
Training:  35%|███▍      | 33/95 [00:09<00:16,  3.73it/s][A
Training:  39%|███▉      | 37/95 [00:

Epoch: 64/98 - Loss: 1.9033 - Accuracy: 0.9411



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:14,  1.34s/it][A
 42%|████▏     | 5/12 [00:02<00:02,  2.52it/s][A
 75%|███████▌  | 9/12 [00:03<00:00,  3.32it/s][A
100%|██████████| 12/12 [00:03<00:00,  3.46it/s][A
Epochs:  65%|██████▌   | 64/98 [28:56<15:14, 26.89s/it]

Val Loss: 2.2134 - Val Accuracy: 0.9394



Training:   0%|          | 0/95 [00:00<?, ?it/s][A
Training:   1%|          | 1/95 [00:01<01:58,  1.26s/it][A
Training:   3%|▎         | 3/95 [00:01<00:36,  2.50it/s][A
Training:   5%|▌         | 5/95 [00:02<00:34,  2.58it/s][A
Training:   7%|▋         | 7/95 [00:02<00:22,  3.86it/s][A
Training:   9%|▉         | 9/95 [00:03<00:29,  2.91it/s][A
Training:  12%|█▏        | 11/95 [00:03<00:21,  3.99it/s][A
Training:  14%|█▎        | 13/95 [00:04<00:25,  3.23it/s][A
Training:  16%|█▌        | 15/95 [00:04<00:18,  4.32it/s][A
Training:  18%|█▊        | 17/95 [00:05<00:21,  3.60it/s][A
Training:  20%|██        | 19/95 [00:05<00:16,  4.61it/s][A
Training:  22%|██▏       | 21/95 [00:06<00:20,  3.60it/s][A
Training:  25%|██▌       | 24/95 [00:06<00:12,  5.47it/s][A
Training:  27%|██▋       | 26/95 [00:07<00:18,  3.77it/s][A
Training:  31%|███       | 29/95 [00:08<00:18,  3.54it/s][A
Training:  35%|███▍      | 33/95 [00:09<00:16,  3.87it/s][A
Training:  37%|███▋      | 35/95 [00:

Epoch: 65/98 - Loss: 1.8439 - Accuracy: 0.9424



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:15,  1.40s/it][A
 33%|███▎      | 4/12 [00:01<00:02,  3.40it/s][A
 50%|█████     | 6/12 [00:02<00:02,  2.83it/s][A
100%|██████████| 12/12 [00:03<00:00,  3.46it/s][A
Epochs:  66%|██████▋   | 65/98 [29:24<14:52, 27.05s/it]

Val Loss: 3.0328 - Val Accuracy: 0.9105



Training:   0%|          | 0/95 [00:00<?, ?it/s][A
Training:   1%|          | 1/95 [00:01<02:13,  1.42s/it][A
Training:   2%|▏         | 2/95 [00:01<01:00,  1.53it/s][A
Training:   4%|▍         | 4/95 [00:01<00:27,  3.35it/s][A
Training:   5%|▌         | 5/95 [00:02<00:37,  2.42it/s][A
Training:   7%|▋         | 7/95 [00:02<00:22,  3.96it/s][A
Training:   9%|▉         | 9/95 [00:03<00:28,  3.01it/s][A
Training:  12%|█▏        | 11/95 [00:03<00:19,  4.23it/s][A
Training:  14%|█▎        | 13/95 [00:04<00:23,  3.56it/s][A
Training:  16%|█▌        | 15/95 [00:04<00:16,  4.72it/s][A
Training:  17%|█▋        | 16/95 [00:04<00:15,  5.22it/s][A
Training:  18%|█▊        | 17/95 [00:05<00:20,  3.73it/s][A
Training:  19%|█▉        | 18/95 [00:05<00:18,  4.10it/s][A
Training:  21%|██        | 20/95 [00:05<00:13,  5.44it/s][A
Training:  22%|██▏       | 21/95 [00:05<00:19,  3.82it/s][A
Training:  23%|██▎       | 22/95 [00:06<00:18,  3.88it/s][A
Training:  25%|██▌       | 24/95 [00:0

Epoch: 66/98 - Loss: 1.8487 - Accuracy: 0.9432



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:14,  1.28s/it][A
 33%|███▎      | 4/12 [00:01<00:02,  3.59it/s][A
 50%|█████     | 6/12 [00:02<00:02,  2.82it/s][A
 75%|███████▌  | 9/12 [00:03<00:00,  3.09it/s][A
100%|██████████| 12/12 [00:03<00:00,  3.52it/s][A
Epochs:  67%|██████▋   | 66/98 [29:50<14:24, 27.02s/it]

Val Loss: 2.1215 - Val Accuracy: 0.9372



Training:   0%|          | 0/95 [00:00<?, ?it/s][A
Training:   1%|          | 1/95 [00:01<01:52,  1.20s/it][A
Training:   2%|▏         | 2/95 [00:01<00:51,  1.81it/s][A
Training:   4%|▍         | 4/95 [00:01<00:22,  4.02it/s][A
Training:   6%|▋         | 6/95 [00:02<00:28,  3.17it/s][A
Training:   9%|▉         | 9/95 [00:03<00:27,  3.13it/s][A
Training:  12%|█▏        | 11/95 [00:03<00:19,  4.27it/s][A
Training:  14%|█▎        | 13/95 [00:04<00:23,  3.52it/s][A
Training:  16%|█▌        | 15/95 [00:04<00:16,  4.71it/s][A
Training:  18%|█▊        | 17/95 [00:05<00:22,  3.54it/s][A
Training:  19%|█▉        | 18/95 [00:05<00:19,  3.90it/s][A
Training:  21%|██        | 20/95 [00:05<00:14,  5.15it/s][A
Training:  22%|██▏       | 21/95 [00:06<00:22,  3.26it/s][A
Training:  24%|██▍       | 23/95 [00:06<00:15,  4.52it/s][A
Training:  26%|██▋       | 25/95 [00:07<00:19,  3.66it/s][A
Training:  28%|██▊       | 27/95 [00:07<00:14,  4.74it/s][A
Training:  31%|███       | 29/95 [00:

Epoch: 67/98 - Loss: 1.8638 - Accuracy: 0.9388



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:15,  1.44s/it][A
 25%|██▌       | 3/12 [00:01<00:03,  2.43it/s][A
 42%|████▏     | 5/12 [00:02<00:02,  2.49it/s][A
 75%|███████▌  | 9/12 [00:03<00:00,  3.43it/s][A
100%|██████████| 12/12 [00:03<00:00,  3.50it/s][A
Epochs:  68%|██████▊   | 67/98 [30:17<13:56, 26.97s/it]

Val Loss: 2.1199 - Val Accuracy: 0.9398



Training:   0%|          | 0/95 [00:00<?, ?it/s][A
Training:   1%|          | 1/95 [00:01<01:52,  1.19s/it][A
Training:   2%|▏         | 2/95 [00:01<00:53,  1.72it/s][A
Training:   4%|▍         | 4/95 [00:01<00:24,  3.77it/s][A
Training:   5%|▌         | 5/95 [00:02<00:34,  2.63it/s][A
Training:   7%|▋         | 7/95 [00:02<00:20,  4.27it/s][A
Training:   8%|▊         | 8/95 [00:02<00:18,  4.74it/s][A
Training:   9%|▉         | 9/95 [00:03<00:28,  3.01it/s][A
Training:  12%|█▏        | 11/95 [00:03<00:18,  4.54it/s][A
Training:  14%|█▎        | 13/95 [00:04<00:23,  3.45it/s][A
Training:  15%|█▍        | 14/95 [00:04<00:20,  3.90it/s][A
Training:  17%|█▋        | 16/95 [00:04<00:14,  5.33it/s][A
Training:  18%|█▊        | 17/95 [00:05<00:25,  3.07it/s][A
Training:  19%|█▉        | 18/95 [00:05<00:21,  3.65it/s][A
Training:  21%|██        | 20/95 [00:05<00:14,  5.21it/s][A
Training:  22%|██▏       | 21/95 [00:06<00:22,  3.30it/s][A
Training:  26%|██▋       | 25/95 [00:06

Epoch: 68/98 - Loss: 1.7584 - Accuracy: 0.9453



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:14,  1.31s/it][A
 33%|███▎      | 4/12 [00:01<00:02,  3.43it/s][A
 50%|█████     | 6/12 [00:02<00:02,  2.92it/s][A
100%|██████████| 12/12 [00:03<00:00,  3.77it/s][A
Epochs:  69%|██████▉   | 68/98 [30:44<13:24, 26.81s/it]

Val Loss: 2.4137 - Val Accuracy: 0.9344



Training:   0%|          | 0/95 [00:00<?, ?it/s][A
Training:   1%|          | 1/95 [00:01<02:13,  1.42s/it][A
Training:   2%|▏         | 2/95 [00:01<01:02,  1.49it/s][A
Training:   4%|▍         | 4/95 [00:01<00:25,  3.54it/s][A
Training:   6%|▋         | 6/95 [00:02<00:31,  2.87it/s][A
Training:   8%|▊         | 8/95 [00:02<00:20,  4.32it/s][A
Training:  11%|█         | 10/95 [00:03<00:22,  3.82it/s][A
Training:  14%|█▎        | 13/95 [00:04<00:22,  3.68it/s][A
Training:  16%|█▌        | 15/95 [00:04<00:17,  4.65it/s][A
Training:  18%|█▊        | 17/95 [00:05<00:22,  3.50it/s][A
Training:  20%|██        | 19/95 [00:05<00:16,  4.60it/s][A
Training:  22%|██▏       | 21/95 [00:06<00:20,  3.62it/s][A
Training:  24%|██▍       | 23/95 [00:06<00:15,  4.74it/s][A
Training:  26%|██▋       | 25/95 [00:06<00:17,  4.00it/s][A
Training:  28%|██▊       | 27/95 [00:07<00:13,  5.21it/s][A
Training:  31%|███       | 29/95 [00:07<00:16,  4.10it/s][A
Training:  33%|███▎      | 31/95 [00:

Epoch: 69/98 - Loss: 1.8085 - Accuracy: 0.9503



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:14,  1.30s/it][A
 33%|███▎      | 4/12 [00:01<00:02,  3.53it/s][A
 50%|█████     | 6/12 [00:02<00:02,  2.74it/s][A
 67%|██████▋   | 8/12 [00:02<00:00,  4.01it/s][A
100%|██████████| 12/12 [00:03<00:00,  3.49it/s][A
Epochs:  70%|███████   | 69/98 [31:10<12:55, 26.76s/it]

Val Loss: 2.5700 - Val Accuracy: 0.9383



Training:   0%|          | 0/95 [00:00<?, ?it/s][A
Training:   1%|          | 1/95 [00:01<02:03,  1.31s/it][A
Training:   3%|▎         | 3/95 [00:01<00:36,  2.54it/s][A
Training:   5%|▌         | 5/95 [00:02<00:35,  2.51it/s][A
Training:   6%|▋         | 6/95 [00:02<00:29,  3.04it/s][A
Training:   9%|▉         | 9/95 [00:03<00:23,  3.63it/s][A
Training:  11%|█         | 10/95 [00:03<00:21,  3.97it/s][A
Training:  13%|█▎        | 12/95 [00:03<00:15,  5.48it/s][A
Training:  14%|█▎        | 13/95 [00:04<00:24,  3.36it/s][A
Training:  17%|█▋        | 16/95 [00:04<00:13,  5.70it/s][A
Training:  19%|█▉        | 18/95 [00:05<00:19,  3.99it/s][A
Training:  21%|██        | 20/95 [00:05<00:15,  4.87it/s][A
Training:  22%|██▏       | 21/95 [00:05<00:19,  3.71it/s][A
Training:  24%|██▍       | 23/95 [00:05<00:14,  4.94it/s][A
Training:  25%|██▌       | 24/95 [00:06<00:15,  4.68it/s][A
Training:  26%|██▋       | 25/95 [00:06<00:18,  3.70it/s][A
Training:  28%|██▊       | 27/95 [00:

Epoch: 70/98 - Loss: 1.9060 - Accuracy: 0.9397



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:16,  1.49s/it][A
 17%|█▋        | 2/12 [00:01<00:06,  1.48it/s][A
 33%|███▎      | 4/12 [00:01<00:02,  3.48it/s][A
 50%|█████     | 6/12 [00:02<00:02,  2.84it/s][A
 75%|███████▌  | 9/12 [00:03<00:00,  3.21it/s][A
100%|██████████| 12/12 [00:03<00:00,  3.18it/s][A
Epochs:  71%|███████▏  | 70/98 [31:37<12:28, 26.73s/it]

Val Loss: 2.2723 - Val Accuracy: 0.9183



Training:   0%|          | 0/95 [00:00<?, ?it/s][A
Training:   1%|          | 1/95 [00:01<02:24,  1.54s/it][A
Training:   3%|▎         | 3/95 [00:01<00:40,  2.25it/s][A
Training:   5%|▌         | 5/95 [00:02<00:34,  2.63it/s][A
Training:   7%|▋         | 7/95 [00:02<00:21,  4.14it/s][A
Training:   9%|▉         | 9/95 [00:03<00:25,  3.35it/s][A
Training:  12%|█▏        | 11/95 [00:03<00:18,  4.51it/s][A
Training:  14%|█▎        | 13/95 [00:04<00:25,  3.22it/s][A
Training:  16%|█▌        | 15/95 [00:04<00:18,  4.33it/s][A
Training:  18%|█▊        | 17/95 [00:05<00:22,  3.45it/s][A
Training:  20%|██        | 19/95 [00:05<00:16,  4.51it/s][A
Training:  22%|██▏       | 21/95 [00:06<00:19,  3.74it/s][A
Training:  24%|██▍       | 23/95 [00:06<00:14,  4.85it/s][A
Training:  26%|██▋       | 25/95 [00:06<00:17,  4.07it/s][A
Training:  28%|██▊       | 27/95 [00:07<00:12,  5.30it/s][A
Training:  31%|███       | 29/95 [00:07<00:16,  3.93it/s][A
Training:  35%|███▍      | 33/95 [00:

Epoch: 71/98 - Loss: 1.9264 - Accuracy: 0.9421



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:15,  1.38s/it][A
 17%|█▋        | 2/12 [00:01<00:06,  1.55it/s][A
 33%|███▎      | 4/12 [00:01<00:02,  3.49it/s][A
 42%|████▏     | 5/12 [00:02<00:02,  2.54it/s][A
 50%|█████     | 6/12 [00:02<00:01,  3.00it/s][A
 67%|██████▋   | 8/12 [00:02<00:00,  4.87it/s][A
 75%|███████▌  | 9/12 [00:03<00:00,  3.32it/s][A
100%|██████████| 12/12 [00:03<00:00,  3.38it/s][A
Epochs:  72%|███████▏  | 71/98 [32:03<11:58, 26.60s/it]

Val Loss: 2.3934 - Val Accuracy: 0.9105



Training:   0%|          | 0/95 [00:00<?, ?it/s][A
Training:   1%|          | 1/95 [00:01<02:15,  1.44s/it][A
Training:   3%|▎         | 3/95 [00:01<00:38,  2.41it/s][A
Training:   5%|▌         | 5/95 [00:02<00:36,  2.47it/s][A
Training:   6%|▋         | 6/95 [00:02<00:29,  3.07it/s][A
Training:   8%|▊         | 8/95 [00:02<00:18,  4.69it/s][A
Training:  11%|█         | 10/95 [00:03<00:22,  3.84it/s][A
Training:  12%|█▏        | 11/95 [00:03<00:19,  4.39it/s][A
Training:  14%|█▎        | 13/95 [00:04<00:24,  3.36it/s][A
Training:  17%|█▋        | 16/95 [00:04<00:14,  5.49it/s][A
Training:  19%|█▉        | 18/95 [00:05<00:20,  3.70it/s][A
Training:  21%|██        | 20/95 [00:05<00:15,  4.74it/s][A
Training:  23%|██▎       | 22/95 [00:06<00:17,  4.17it/s][A
Training:  25%|██▌       | 24/95 [00:06<00:13,  5.20it/s][A
Training:  26%|██▋       | 25/95 [00:06<00:17,  3.96it/s][A
Training:  29%|██▉       | 28/95 [00:06<00:10,  6.23it/s][A
Training:  32%|███▏      | 30/95 [00:

Epoch: 72/98 - Loss: 1.9641 - Accuracy: 0.9299



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:14,  1.27s/it][A
 33%|███▎      | 4/12 [00:01<00:02,  3.61it/s][A
 50%|█████     | 6/12 [00:02<00:02,  2.72it/s][A
 67%|██████▋   | 8/12 [00:02<00:01,  3.89it/s][A
 75%|███████▌  | 9/12 [00:03<00:01,  2.74it/s][A
100%|██████████| 12/12 [00:03<00:00,  3.30it/s][A
Epochs:  73%|███████▎  | 72/98 [32:30<11:30, 26.57s/it]

Val Loss: 2.1862 - Val Accuracy: 0.9424



Training:   0%|          | 0/95 [00:00<?, ?it/s][A
Training:   1%|          | 1/95 [00:01<02:19,  1.48s/it][A
Training:   3%|▎         | 3/95 [00:01<00:39,  2.32it/s][A
Training:   5%|▌         | 5/95 [00:02<00:39,  2.26it/s][A
Training:   7%|▋         | 7/95 [00:02<00:24,  3.55it/s][A
Training:   9%|▉         | 9/95 [00:03<00:29,  2.90it/s][A
Training:  12%|█▏        | 11/95 [00:03<00:20,  4.07it/s][A
Training:  14%|█▎        | 13/95 [00:04<00:23,  3.42it/s][A
Training:  16%|█▌        | 15/95 [00:04<00:17,  4.51it/s][A
Training:  18%|█▊        | 17/95 [00:05<00:19,  4.10it/s][A
Training:  19%|█▉        | 18/95 [00:05<00:16,  4.57it/s][A
Training:  22%|██▏       | 21/95 [00:06<00:18,  4.05it/s][A
Training:  24%|██▍       | 23/95 [00:06<00:13,  5.30it/s][A
Training:  26%|██▋       | 25/95 [00:07<00:20,  3.42it/s][A
Training:  31%|███       | 29/95 [00:08<00:16,  3.92it/s][A
Training:  33%|███▎      | 31/95 [00:08<00:13,  4.85it/s][A
Training:  35%|███▍      | 33/95 [00:

Epoch: 73/98 - Loss: 1.8445 - Accuracy: 0.9394



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:16,  1.47s/it][A
 25%|██▌       | 3/12 [00:01<00:03,  2.37it/s][A
 42%|████▏     | 5/12 [00:02<00:03,  2.11it/s][A
 58%|█████▊    | 7/12 [00:02<00:01,  3.33it/s][A
 75%|███████▌  | 9/12 [00:03<00:00,  3.07it/s][A
100%|██████████| 12/12 [00:03<00:00,  3.24it/s][A
Epochs:  74%|███████▍  | 73/98 [32:57<11:07, 26.71s/it]

Val Loss: 2.3908 - Val Accuracy: 0.9338



Training:   0%|          | 0/95 [00:00<?, ?it/s][A
Training:   1%|          | 1/95 [00:01<02:19,  1.48s/it][A
Training:   3%|▎         | 3/95 [00:01<00:38,  2.36it/s][A
Training:   5%|▌         | 5/95 [00:02<00:39,  2.30it/s][A
Training:   7%|▋         | 7/95 [00:02<00:24,  3.62it/s][A
Training:   9%|▉         | 9/95 [00:03<00:28,  3.00it/s][A
Training:  11%|█         | 10/95 [00:03<00:24,  3.51it/s][A
Training:  13%|█▎        | 12/95 [00:03<00:17,  4.87it/s][A
Training:  15%|█▍        | 14/95 [00:04<00:21,  3.80it/s][A
Training:  17%|█▋        | 16/95 [00:04<00:15,  5.06it/s][A
Training:  18%|█▊        | 17/95 [00:05<00:23,  3.28it/s][A
Training:  20%|██        | 19/95 [00:05<00:16,  4.62it/s][A
Training:  22%|██▏       | 21/95 [00:06<00:19,  3.87it/s][A
Training:  25%|██▌       | 24/95 [00:06<00:12,  5.62it/s][A
Training:  27%|██▋       | 26/95 [00:07<00:15,  4.52it/s][A
Training:  29%|██▉       | 28/95 [00:07<00:12,  5.56it/s][A
Training:  31%|███       | 29/95 [00:

Epoch: 74/98 - Loss: 1.9328 - Accuracy: 0.9372



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:15,  1.37s/it][A
 33%|███▎      | 4/12 [00:01<00:02,  3.42it/s][A
 50%|█████     | 6/12 [00:02<00:02,  2.94it/s][A
 67%|██████▋   | 8/12 [00:02<00:00,  4.36it/s][A
100%|██████████| 12/12 [00:03<00:00,  3.44it/s][A
Epochs:  76%|███████▌  | 74/98 [33:24<10:43, 26.83s/it]

Val Loss: 2.1496 - Val Accuracy: 0.9425



Training:   0%|          | 0/95 [00:00<?, ?it/s][A
Training:   1%|          | 1/95 [00:01<02:25,  1.54s/it][A
Training:   5%|▌         | 5/95 [00:02<00:39,  2.29it/s][A
Training:   6%|▋         | 6/95 [00:02<00:33,  2.66it/s][A
Training:   9%|▉         | 9/95 [00:03<00:29,  2.96it/s][A
Training:  12%|█▏        | 11/95 [00:03<00:21,  3.92it/s][A
Training:  14%|█▎        | 13/95 [00:04<00:24,  3.32it/s][A
Training:  16%|█▌        | 15/95 [00:04<00:18,  4.39it/s][A
Training:  18%|█▊        | 17/95 [00:05<00:21,  3.57it/s][A
Training:  20%|██        | 19/95 [00:05<00:16,  4.74it/s][A
Training:  22%|██▏       | 21/95 [00:06<00:20,  3.53it/s][A
Training:  24%|██▍       | 23/95 [00:06<00:15,  4.56it/s][A
Training:  26%|██▋       | 25/95 [00:07<00:19,  3.59it/s][A
Training:  29%|██▉       | 28/95 [00:07<00:12,  5.42it/s][A
Training:  32%|███▏      | 30/95 [00:08<00:15,  4.16it/s][A
Training:  34%|███▎      | 32/95 [00:08<00:12,  4.95it/s][A
Training:  35%|███▍      | 33/95 [00

Epoch: 75/98 - Loss: 1.8335 - Accuracy: 0.9406



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:13,  1.25s/it][A
 25%|██▌       | 3/12 [00:01<00:03,  2.54it/s][A
 42%|████▏     | 5/12 [00:02<00:02,  2.59it/s][A
 58%|█████▊    | 7/12 [00:02<00:01,  3.47it/s][A
 75%|███████▌  | 9/12 [00:03<00:00,  3.40it/s][A
 83%|████████▎ | 10/12 [00:03<00:00,  3.69it/s][A
100%|██████████| 12/12 [00:03<00:00,  3.23it/s][A
Epochs:  77%|███████▋  | 75/98 [33:51<10:16, 26.79s/it]

Val Loss: 2.2876 - Val Accuracy: 0.9314



Training:   0%|          | 0/95 [00:00<?, ?it/s][A
Training:   1%|          | 1/95 [00:01<02:08,  1.36s/it][A
Training:   3%|▎         | 3/95 [00:01<00:36,  2.50it/s][A
Training:   5%|▌         | 5/95 [00:02<00:34,  2.63it/s][A
Training:   7%|▋         | 7/95 [00:02<00:22,  3.98it/s][A
Training:   9%|▉         | 9/95 [00:03<00:28,  3.02it/s][A
Training:  12%|█▏        | 11/95 [00:03<00:20,  4.16it/s][A
Training:  14%|█▎        | 13/95 [00:04<00:26,  3.11it/s][A
Training:  16%|█▌        | 15/95 [00:04<00:19,  4.16it/s][A
Training:  18%|█▊        | 17/95 [00:05<00:23,  3.37it/s][A
Training:  21%|██        | 20/95 [00:05<00:14,  5.17it/s][A
Training:  23%|██▎       | 22/95 [00:06<00:18,  3.98it/s][A
Training:  26%|██▋       | 25/95 [00:07<00:17,  3.92it/s][A
Training:  29%|██▉       | 28/95 [00:07<00:12,  5.51it/s][A
Training:  32%|███▏      | 30/95 [00:08<00:15,  4.27it/s][A
Training:  35%|███▍      | 33/95 [00:08<00:14,  4.19it/s][A
Training:  37%|███▋      | 35/95 [00:

Epoch: 76/98 - Loss: 1.8211 - Accuracy: 0.9419



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:14,  1.33s/it][A
 25%|██▌       | 3/12 [00:01<00:03,  2.55it/s][A
 42%|████▏     | 5/12 [00:02<00:02,  2.65it/s][A
 67%|██████▋   | 8/12 [00:02<00:00,  5.06it/s][A
100%|██████████| 12/12 [00:03<00:00,  3.58it/s][A
Epochs:  78%|███████▊  | 76/98 [34:17<09:47, 26.71s/it]

Val Loss: 2.1136 - Val Accuracy: 0.9366



Training:   0%|          | 0/95 [00:00<?, ?it/s][A
Training:   1%|          | 1/95 [00:01<02:22,  1.52s/it][A
Training:   3%|▎         | 3/95 [00:01<00:39,  2.32it/s][A
Training:   5%|▌         | 5/95 [00:02<00:39,  2.30it/s][A
Training:   7%|▋         | 7/95 [00:02<00:25,  3.46it/s][A
Training:   9%|▉         | 9/95 [00:03<00:27,  3.11it/s][A
Training:  11%|█         | 10/95 [00:03<00:23,  3.55it/s][A
Training:  13%|█▎        | 12/95 [00:03<00:16,  4.95it/s][A
Training:  14%|█▎        | 13/95 [00:04<00:27,  2.97it/s][A
Training:  16%|█▌        | 15/95 [00:04<00:18,  4.27it/s][A
Training:  18%|█▊        | 17/95 [00:05<00:22,  3.42it/s][A
Training:  20%|██        | 19/95 [00:05<00:16,  4.60it/s][A
Training:  22%|██▏       | 21/95 [00:06<00:19,  3.78it/s][A
Training:  25%|██▌       | 24/95 [00:06<00:12,  5.71it/s][A
Training:  27%|██▋       | 26/95 [00:07<00:17,  4.02it/s][A
Training:  31%|███       | 29/95 [00:08<00:17,  3.80it/s][A
Training:  32%|███▏      | 30/95 [00:

Epoch: 77/98 - Loss: 1.7500 - Accuracy: 0.9439



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:13,  1.18s/it][A
 17%|█▋        | 2/12 [00:01<00:05,  1.67it/s][A
 33%|███▎      | 4/12 [00:01<00:02,  3.87it/s][A
 50%|█████     | 6/12 [00:02<00:01,  3.24it/s][A
 67%|██████▋   | 8/12 [00:02<00:00,  4.88it/s][A
100%|██████████| 12/12 [00:03<00:00,  3.53it/s][A
Epochs:  79%|███████▊  | 77/98 [34:44<09:23, 26.85s/it]

Val Loss: 2.3089 - Val Accuracy: 0.8969



Training:   0%|          | 0/95 [00:00<?, ?it/s][A
Training:   1%|          | 1/95 [00:01<02:05,  1.33s/it][A
Training:   2%|▏         | 2/95 [00:01<01:05,  1.41it/s][A
Training:   5%|▌         | 5/95 [00:02<00:33,  2.68it/s][A
Training:   6%|▋         | 6/95 [00:02<00:30,  2.91it/s][A
Training:   8%|▊         | 8/95 [00:02<00:19,  4.41it/s][A
Training:   9%|▉         | 9/95 [00:03<00:27,  3.08it/s][A
Training:  11%|█         | 10/95 [00:03<00:27,  3.04it/s][A
Training:  13%|█▎        | 12/95 [00:03<00:17,  4.66it/s][A
Training:  14%|█▎        | 13/95 [00:04<00:23,  3.47it/s][A
Training:  15%|█▍        | 14/95 [00:04<00:24,  3.34it/s][A
Training:  17%|█▋        | 16/95 [00:04<00:16,  4.88it/s][A
Training:  18%|█▊        | 17/95 [00:05<00:20,  3.81it/s][A
Training:  19%|█▉        | 18/95 [00:05<00:23,  3.21it/s][A
Training:  21%|██        | 20/95 [00:05<00:15,  4.70it/s][A
Training:  22%|██▏       | 21/95 [00:06<00:18,  3.92it/s][A
Training:  23%|██▎       | 22/95 [00:0

Epoch: 78/98 - Loss: 1.8281 - Accuracy: 0.9371



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:16,  1.49s/it][A
 17%|█▋        | 2/12 [00:01<00:07,  1.43it/s][A
 42%|████▏     | 5/12 [00:02<00:02,  2.74it/s][A
 50%|█████     | 6/12 [00:02<00:01,  3.24it/s][A
 75%|███████▌  | 9/12 [00:03<00:00,  3.47it/s][A
100%|██████████| 12/12 [00:03<00:00,  3.35it/s][A
Epochs:  80%|███████▉  | 78/98 [35:11<08:58, 26.92s/it]

Val Loss: 2.4283 - Val Accuracy: 0.9169



Training:   0%|          | 0/95 [00:00<?, ?it/s][A
Training:   1%|          | 1/95 [00:01<02:24,  1.53s/it][A
Training:   3%|▎         | 3/95 [00:01<00:41,  2.21it/s][A
Training:   5%|▌         | 5/95 [00:02<00:36,  2.46it/s][A
Training:   6%|▋         | 6/95 [00:02<00:29,  3.07it/s][A
Training:   8%|▊         | 8/95 [00:02<00:18,  4.69it/s][A
Training:  11%|█         | 10/95 [00:03<00:27,  3.07it/s][A
Training:  13%|█▎        | 12/95 [00:03<00:19,  4.25it/s][A
Training:  14%|█▎        | 13/95 [00:04<00:25,  3.21it/s][A
Training:  15%|█▍        | 14/95 [00:04<00:25,  3.20it/s][A
Training:  17%|█▋        | 16/95 [00:04<00:17,  4.50it/s][A
Training:  18%|█▊        | 17/95 [00:05<00:21,  3.58it/s][A
Training:  19%|█▉        | 18/95 [00:05<00:21,  3.56it/s][A
Training:  21%|██        | 20/95 [00:05<00:14,  5.06it/s][A
Training:  22%|██▏       | 21/95 [00:06<00:19,  3.70it/s][A
Training:  23%|██▎       | 22/95 [00:06<00:19,  3.82it/s][A
Training:  25%|██▌       | 24/95 [00:

Epoch: 79/98 - Loss: 1.8742 - Accuracy: 0.9385



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:16,  1.53s/it][A
 42%|████▏     | 5/12 [00:02<00:03,  2.17it/s][A
 58%|█████▊    | 7/12 [00:02<00:01,  3.22it/s][A
 75%|███████▌  | 9/12 [00:03<00:01,  2.98it/s][A
100%|██████████| 12/12 [00:03<00:00,  3.19it/s][A
Epochs:  81%|████████  | 79/98 [35:39<08:32, 26.96s/it]

Val Loss: 2.2283 - Val Accuracy: 0.9253



Training:   0%|          | 0/95 [00:00<?, ?it/s][A
Training:   1%|          | 1/95 [00:01<02:08,  1.37s/it][A
Training:   3%|▎         | 3/95 [00:01<00:38,  2.40it/s][A
Training:   5%|▌         | 5/95 [00:02<00:37,  2.43it/s][A
Training:   6%|▋         | 6/95 [00:02<00:29,  3.01it/s][A
Training:   8%|▊         | 8/95 [00:02<00:19,  4.40it/s][A
Training:   9%|▉         | 9/95 [00:03<00:29,  2.96it/s][A
Training:  12%|█▏        | 11/95 [00:03<00:19,  4.24it/s][A
Training:  14%|█▎        | 13/95 [00:04<00:23,  3.52it/s][A
Training:  15%|█▍        | 14/95 [00:04<00:20,  4.05it/s][A
Training:  17%|█▋        | 16/95 [00:04<00:14,  5.35it/s][A
Training:  18%|█▊        | 17/95 [00:05<00:23,  3.32it/s][A
Training:  19%|█▉        | 18/95 [00:05<00:22,  3.37it/s][A
Training:  21%|██        | 20/95 [00:05<00:14,  5.01it/s][A
Training:  22%|██▏       | 21/95 [00:06<00:19,  3.74it/s][A
Training:  23%|██▎       | 22/95 [00:06<00:18,  3.88it/s][A
Training:  26%|██▋       | 25/95 [00:0

Epoch: 80/98 - Loss: 1.7623 - Accuracy: 0.9447



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:15,  1.37s/it][A
 25%|██▌       | 3/12 [00:01<00:03,  2.45it/s][A
 42%|████▏     | 5/12 [00:02<00:02,  2.42it/s][A
 67%|██████▋   | 8/12 [00:02<00:00,  4.42it/s][A
100%|██████████| 12/12 [00:03<00:00,  3.36it/s][A
Epochs:  82%|████████▏ | 80/98 [36:05<08:04, 26.92s/it]

Val Loss: 2.6582 - Val Accuracy: 0.9335



Training:   0%|          | 0/95 [00:00<?, ?it/s][A
Training:   1%|          | 1/95 [00:01<02:01,  1.29s/it][A
Training:   2%|▏         | 2/95 [00:01<00:56,  1.65it/s][A
Training:   3%|▎         | 3/95 [00:01<00:35,  2.59it/s][A
Training:   5%|▌         | 5/95 [00:02<00:35,  2.52it/s][A
Training:   7%|▋         | 7/95 [00:02<00:21,  4.09it/s][A
Training:   9%|▉         | 9/95 [00:03<00:29,  2.96it/s][A
Training:  12%|█▏        | 11/95 [00:03<00:20,  4.04it/s][A
Training:  14%|█▎        | 13/95 [00:04<00:25,  3.24it/s][A
Training:  17%|█▋        | 16/95 [00:04<00:15,  5.10it/s][A
Training:  19%|█▉        | 18/95 [00:05<00:20,  3.84it/s][A
Training:  22%|██▏       | 21/95 [00:06<00:20,  3.53it/s][A
Training:  26%|██▋       | 25/95 [00:07<00:18,  3.79it/s][A
Training:  28%|██▊       | 27/95 [00:07<00:14,  4.65it/s][A
Training:  31%|███       | 29/95 [00:08<00:17,  3.82it/s][A
Training:  33%|███▎      | 31/95 [00:08<00:13,  4.74it/s][A
Training:  35%|███▍      | 33/95 [00:0

Epoch: 81/98 - Loss: 1.7965 - Accuracy: 0.9483



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:15,  1.45s/it][A
 33%|███▎      | 4/12 [00:01<00:02,  3.23it/s][A
 50%|█████     | 6/12 [00:02<00:02,  2.64it/s][A
 67%|██████▋   | 8/12 [00:02<00:01,  3.86it/s][A
 83%|████████▎ | 10/12 [00:03<00:00,  3.16it/s][A
100%|██████████| 12/12 [00:03<00:00,  3.20it/s][A
Epochs:  83%|████████▎ | 81/98 [36:32<07:38, 26.97s/it]

Val Loss: 2.1763 - Val Accuracy: 0.9383



Training:   0%|          | 0/95 [00:00<?, ?it/s][A
Training:   1%|          | 1/95 [00:01<02:04,  1.32s/it][A
Training:   3%|▎         | 3/95 [00:01<00:36,  2.52it/s][A
Training:   5%|▌         | 5/95 [00:02<00:36,  2.43it/s][A
Training:   7%|▋         | 7/95 [00:02<00:23,  3.72it/s][A
Training:   9%|▉         | 9/95 [00:03<00:29,  2.95it/s][A
Training:  13%|█▎        | 12/95 [00:03<00:16,  4.94it/s][A
Training:  15%|█▍        | 14/95 [00:04<00:22,  3.62it/s][A
Training:  18%|█▊        | 17/95 [00:05<00:22,  3.50it/s][A
Training:  20%|██        | 19/95 [00:05<00:17,  4.29it/s][A
Training:  22%|██▏       | 21/95 [00:06<00:20,  3.66it/s][A
Training:  25%|██▌       | 24/95 [00:06<00:13,  5.43it/s][A
Training:  27%|██▋       | 26/95 [00:07<00:17,  4.05it/s][A
Training:  29%|██▉       | 28/95 [00:07<00:13,  5.15it/s][A
Training:  32%|███▏      | 30/95 [00:08<00:16,  3.98it/s][A
Training:  35%|███▍      | 33/95 [00:08<00:16,  3.82it/s][A
Training:  37%|███▋      | 35/95 [00:

Epoch: 82/98 - Loss: 1.7338 - Accuracy: 0.9415



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:19,  1.78s/it][A
 42%|████▏     | 5/12 [00:02<00:03,  2.13it/s][A
 58%|█████▊    | 7/12 [00:02<00:01,  3.17it/s][A
100%|██████████| 12/12 [00:03<00:00,  3.23it/s][A
Epochs:  84%|████████▎ | 82/98 [36:59<07:09, 26.84s/it]

Val Loss: 2.2908 - Val Accuracy: 0.9243



Training:   0%|          | 0/95 [00:00<?, ?it/s][A
Training:   1%|          | 1/95 [00:01<02:08,  1.36s/it][A
Training:   3%|▎         | 3/95 [00:01<00:37,  2.47it/s][A
Training:   5%|▌         | 5/95 [00:02<00:35,  2.54it/s][A
Training:   7%|▋         | 7/95 [00:02<00:26,  3.37it/s][A
Training:   9%|▉         | 9/95 [00:03<00:26,  3.28it/s][A
Training:  12%|█▏        | 11/95 [00:03<00:21,  3.89it/s][A
Training:  14%|█▎        | 13/95 [00:04<00:23,  3.54it/s][A
Training:  16%|█▌        | 15/95 [00:04<00:20,  3.96it/s][A
Training:  18%|█▊        | 17/95 [00:05<00:20,  3.79it/s][A
Training:  19%|█▉        | 18/95 [00:05<00:18,  4.26it/s][A
Training:  20%|██        | 19/95 [00:05<00:19,  3.88it/s][A
Training:  21%|██        | 20/95 [00:05<00:17,  4.38it/s][A
Training:  22%|██▏       | 21/95 [00:06<00:19,  3.72it/s][A
Training:  23%|██▎       | 22/95 [00:06<00:16,  4.39it/s][A
Training:  24%|██▍       | 23/95 [00:06<00:16,  4.26it/s][A
Training:  26%|██▋       | 25/95 [00:

Epoch: 83/98 - Loss: 1.7417 - Accuracy: 0.9447



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:17,  1.59s/it][A
 25%|██▌       | 3/12 [00:01<00:04,  2.21it/s][A
 42%|████▏     | 5/12 [00:02<00:03,  2.24it/s][A
 58%|█████▊    | 7/12 [00:02<00:01,  3.54it/s][A
100%|██████████| 12/12 [00:03<00:00,  3.22it/s][A
Epochs:  85%|████████▍ | 83/98 [37:26<06:44, 26.99s/it]

Val Loss: 2.1803 - Val Accuracy: 0.9411



Training:   0%|          | 0/95 [00:00<?, ?it/s][A
Training:   1%|          | 1/95 [00:01<02:10,  1.38s/it][A
Training:   4%|▍         | 4/95 [00:01<00:26,  3.40it/s][A
Training:   6%|▋         | 6/95 [00:02<00:33,  2.67it/s][A
Training:   8%|▊         | 8/95 [00:02<00:22,  3.87it/s][A
Training:  11%|█         | 10/95 [00:03<00:28,  3.02it/s][A
Training:  12%|█▏        | 11/95 [00:03<00:24,  3.47it/s][A
Training:  14%|█▎        | 13/95 [00:04<00:27,  2.97it/s][A
Training:  16%|█▌        | 15/95 [00:04<00:19,  4.05it/s][A
Training:  18%|█▊        | 17/95 [00:05<00:21,  3.56it/s][A
Training:  20%|██        | 19/95 [00:05<00:15,  4.80it/s][A
Training:  22%|██▏       | 21/95 [00:06<00:19,  3.72it/s][A
Training:  24%|██▍       | 23/95 [00:06<00:15,  4.77it/s][A
Training:  26%|██▋       | 25/95 [00:07<00:17,  3.91it/s][A
Training:  27%|██▋       | 26/95 [00:07<00:15,  4.39it/s][A
Training:  31%|███       | 29/95 [00:08<00:17,  3.77it/s][A
Training:  33%|███▎      | 31/95 [00

Epoch: 84/98 - Loss: 1.7219 - Accuracy: 0.9446



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:13,  1.20s/it][A
 25%|██▌       | 3/12 [00:01<00:03,  2.73it/s][A
 42%|████▏     | 5/12 [00:02<00:02,  2.61it/s][A
 58%|█████▊    | 7/12 [00:02<00:01,  4.06it/s][A
100%|██████████| 12/12 [00:03<00:00,  3.59it/s][A
Epochs:  86%|████████▌ | 84/98 [37:53<06:14, 26.77s/it]

Val Loss: 2.2445 - Val Accuracy: 0.9422



Training:   0%|          | 0/95 [00:00<?, ?it/s][A
Training:   1%|          | 1/95 [00:01<02:10,  1.39s/it][A
Training:   3%|▎         | 3/95 [00:01<00:37,  2.47it/s][A
Training:   5%|▌         | 5/95 [00:02<00:35,  2.55it/s][A
Training:   6%|▋         | 6/95 [00:02<00:28,  3.11it/s][A
Training:   7%|▋         | 7/95 [00:02<00:24,  3.56it/s][A
Training:   8%|▊         | 8/95 [00:02<00:20,  4.35it/s][A
Training:   9%|▉         | 9/95 [00:03<00:25,  3.34it/s][A
Training:  11%|█         | 10/95 [00:03<00:25,  3.27it/s][A
Training:  13%|█▎        | 12/95 [00:03<00:16,  4.92it/s][A
Training:  14%|█▎        | 13/95 [00:04<00:21,  3.89it/s][A
Training:  15%|█▍        | 14/95 [00:04<00:22,  3.68it/s][A
Training:  16%|█▌        | 15/95 [00:04<00:18,  4.42it/s][A
Training:  18%|█▊        | 17/95 [00:04<00:18,  4.17it/s][A
Training:  19%|█▉        | 18/95 [00:05<00:20,  3.80it/s][A
Training:  21%|██        | 20/95 [00:05<00:13,  5.42it/s][A
Training:  22%|██▏       | 21/95 [00:05

Epoch: 85/98 - Loss: 1.7520 - Accuracy: 0.9441



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:13,  1.24s/it][A
 17%|█▋        | 2/12 [00:01<00:06,  1.66it/s][A
 33%|███▎      | 4/12 [00:01<00:02,  3.82it/s][A
 42%|████▏     | 5/12 [00:02<00:02,  2.60it/s][A
 50%|█████     | 6/12 [00:02<00:01,  3.21it/s][A
 67%|██████▋   | 8/12 [00:02<00:00,  5.06it/s][A
 75%|███████▌  | 9/12 [00:03<00:00,  3.12it/s][A
 83%|████████▎ | 10/12 [00:03<00:00,  3.75it/s][A
100%|██████████| 12/12 [00:03<00:00,  3.45it/s][A
Epochs:  87%|████████▋ | 85/98 [38:20<05:50, 26.95s/it]

Val Loss: 2.1902 - Val Accuracy: 0.9370



Training:   0%|          | 0/95 [00:00<?, ?it/s][A
Training:   1%|          | 1/95 [00:01<02:07,  1.36s/it][A
Training:   2%|▏         | 2/95 [00:01<00:58,  1.58it/s][A
Training:   5%|▌         | 5/95 [00:02<00:34,  2.62it/s][A
Training:   6%|▋         | 6/95 [00:02<00:28,  3.17it/s][A
Training:   8%|▊         | 8/95 [00:02<00:17,  4.91it/s][A
Training:  11%|█         | 10/95 [00:03<00:24,  3.40it/s][A
Training:  13%|█▎        | 12/95 [00:03<00:17,  4.70it/s][A
Training:  15%|█▍        | 14/95 [00:04<00:22,  3.53it/s][A
Training:  16%|█▌        | 15/95 [00:04<00:22,  3.60it/s][A
Training:  18%|█▊        | 17/95 [00:05<00:23,  3.31it/s][A
Training:  20%|██        | 19/95 [00:05<00:17,  4.35it/s][A
Training:  22%|██▏       | 21/95 [00:06<00:21,  3.47it/s][A
Training:  24%|██▍       | 23/95 [00:06<00:15,  4.55it/s][A
Training:  26%|██▋       | 25/95 [00:07<00:17,  4.01it/s][A
Training:  28%|██▊       | 27/95 [00:07<00:13,  5.01it/s][A
Training:  31%|███       | 29/95 [00:

Epoch: 86/98 - Loss: 1.7055 - Accuracy: 0.9469



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:13,  1.23s/it][A
 17%|█▋        | 2/12 [00:01<00:05,  1.69it/s][A
 42%|████▏     | 5/12 [00:02<00:02,  2.88it/s][A
100%|██████████| 12/12 [00:03<00:00,  3.62it/s][A
Epochs:  88%|████████▊ | 86/98 [38:47<05:23, 27.00s/it]

Val Loss: 2.0921 - Val Accuracy: 0.9426



Training:   0%|          | 0/95 [00:00<?, ?it/s][A
Training:   1%|          | 1/95 [00:01<02:25,  1.55s/it][A
Training:   4%|▍         | 4/95 [00:01<00:29,  3.05it/s][A
Training:   6%|▋         | 6/95 [00:02<00:34,  2.60it/s][A
Training:   8%|▊         | 8/95 [00:02<00:22,  3.88it/s][A
Training:  11%|█         | 10/95 [00:03<00:29,  2.92it/s][A
Training:  13%|█▎        | 12/95 [00:03<00:21,  3.95it/s][A
Training:  15%|█▍        | 14/95 [00:04<00:26,  3.06it/s][A
Training:  17%|█▋        | 16/95 [00:04<00:19,  4.04it/s][A
Training:  18%|█▊        | 17/95 [00:05<00:26,  2.92it/s][A
Training:  20%|██        | 19/95 [00:05<00:18,  4.08it/s][A
Training:  22%|██▏       | 21/95 [00:06<00:21,  3.47it/s][A
Training:  24%|██▍       | 23/95 [00:06<00:16,  4.48it/s][A
Training:  26%|██▋       | 25/95 [00:07<00:19,  3.61it/s][A
Training:  28%|██▊       | 27/95 [00:07<00:14,  4.80it/s][A
Training:  31%|███       | 29/95 [00:08<00:19,  3.38it/s][A
Training:  33%|███▎      | 31/95 [00

Epoch: 87/98 - Loss: 1.8897 - Accuracy: 0.9429



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:15,  1.42s/it][A
 17%|█▋        | 2/12 [00:01<00:06,  1.47it/s][A
 33%|███▎      | 4/12 [00:01<00:02,  3.46it/s][A
 50%|█████     | 6/12 [00:02<00:01,  3.22it/s][A
 75%|███████▌  | 9/12 [00:02<00:00,  3.89it/s][A
100%|██████████| 12/12 [00:03<00:00,  3.70it/s][A
Epochs:  89%|████████▉ | 87/98 [39:14<04:56, 26.91s/it]

Val Loss: 2.1198 - Val Accuracy: 0.9300



Training:   0%|          | 0/95 [00:00<?, ?it/s][A
Training:   1%|          | 1/95 [00:01<02:20,  1.49s/it][A
Training:   5%|▌         | 5/95 [00:02<00:38,  2.35it/s][A
Training:   7%|▋         | 7/95 [00:02<00:25,  3.42it/s][A
Training:   9%|▉         | 9/95 [00:03<00:27,  3.15it/s][A
Training:  13%|█▎        | 12/95 [00:03<00:16,  4.97it/s][A
Training:  15%|█▍        | 14/95 [00:04<00:21,  3.84it/s][A
Training:  17%|█▋        | 16/95 [00:04<00:16,  4.82it/s][A
Training:  18%|█▊        | 17/95 [00:04<00:20,  3.85it/s][A
Training:  21%|██        | 20/95 [00:05<00:13,  5.66it/s][A
Training:  22%|██▏       | 21/95 [00:05<00:19,  3.75it/s][A
Training:  25%|██▌       | 24/95 [00:06<00:14,  4.91it/s][A
Training:  26%|██▋       | 25/95 [00:06<00:18,  3.86it/s][A
Training:  29%|██▉       | 28/95 [00:07<00:12,  5.22it/s][A
Training:  31%|███       | 29/95 [00:07<00:18,  3.58it/s][A
Training:  32%|███▏      | 30/95 [00:07<00:15,  4.07it/s][A
Training:  34%|███▎      | 32/95 [00

Epoch: 88/98 - Loss: 1.8881 - Accuracy: 0.9379



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:14,  1.35s/it][A
 33%|███▎      | 4/12 [00:01<00:02,  3.47it/s][A
 50%|█████     | 6/12 [00:02<00:02,  2.93it/s][A
 75%|███████▌  | 9/12 [00:03<00:00,  3.42it/s][A
100%|██████████| 12/12 [00:03<00:00,  3.57it/s][A
Epochs:  90%|████████▉ | 88/98 [39:40<04:28, 26.80s/it]

Val Loss: 2.5065 - Val Accuracy: 0.9379



Training:   0%|          | 0/95 [00:00<?, ?it/s][A
Training:   1%|          | 1/95 [00:01<02:23,  1.52s/it][A
Training:   3%|▎         | 3/95 [00:01<00:39,  2.31it/s][A
Training:   5%|▌         | 5/95 [00:02<00:33,  2.69it/s][A
Training:   7%|▋         | 7/95 [00:02<00:20,  4.22it/s][A
Training:   9%|▉         | 9/95 [00:03<00:26,  3.24it/s][A
Training:  13%|█▎        | 12/95 [00:03<00:16,  5.14it/s][A
Training:  15%|█▍        | 14/95 [00:04<00:21,  3.74it/s][A
Training:  17%|█▋        | 16/95 [00:04<00:17,  4.58it/s][A
Training:  18%|█▊        | 17/95 [00:05<00:22,  3.53it/s][A
Training:  21%|██        | 20/95 [00:05<00:13,  5.56it/s][A
Training:  23%|██▎       | 22/95 [00:05<00:17,  4.21it/s][A
Training:  25%|██▌       | 24/95 [00:06<00:13,  5.17it/s][A
Training:  26%|██▋       | 25/95 [00:06<00:19,  3.55it/s][A
Training:  27%|██▋       | 26/95 [00:06<00:18,  3.81it/s][A
Training:  29%|██▉       | 28/95 [00:07<00:12,  5.28it/s][A
Training:  31%|███       | 29/95 [00:

Epoch: 89/98 - Loss: 1.7608 - Accuracy: 0.9460



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:16,  1.46s/it][A
 25%|██▌       | 3/12 [00:01<00:03,  2.37it/s][A
 42%|████▏     | 5/12 [00:02<00:02,  2.39it/s][A
 58%|█████▊    | 7/12 [00:02<00:01,  3.74it/s][A
100%|██████████| 12/12 [00:03<00:00,  3.47it/s][A
Epochs:  91%|█████████ | 89/98 [40:07<04:01, 26.85s/it]

Val Loss: 2.2136 - Val Accuracy: 0.9338



Training:   0%|          | 0/95 [00:00<?, ?it/s][A
Training:   1%|          | 1/95 [00:01<02:27,  1.57s/it][A
Training:   3%|▎         | 3/95 [00:01<00:40,  2.25it/s][A
Training:   5%|▌         | 5/95 [00:02<00:38,  2.34it/s][A
Training:   8%|▊         | 8/95 [00:02<00:19,  4.47it/s][A
Training:  11%|█         | 10/95 [00:03<00:24,  3.42it/s][A
Training:  13%|█▎        | 12/95 [00:03<00:18,  4.60it/s][A
Training:  15%|█▍        | 14/95 [00:04<00:22,  3.66it/s][A
Training:  17%|█▋        | 16/95 [00:04<00:16,  4.84it/s][A
Training:  19%|█▉        | 18/95 [00:05<00:19,  3.88it/s][A
Training:  21%|██        | 20/95 [00:05<00:14,  5.10it/s][A
Training:  23%|██▎       | 22/95 [00:06<00:18,  3.97it/s][A
Training:  25%|██▌       | 24/95 [00:06<00:14,  4.93it/s][A
Training:  26%|██▋       | 25/95 [00:07<00:23,  2.97it/s][A
Training:  28%|██▊       | 27/95 [00:07<00:16,  4.10it/s][A
Training:  31%|███       | 29/95 [00:08<00:17,  3.69it/s][A
Training:  33%|███▎      | 31/95 [00

Epoch: 90/98 - Loss: 1.7795 - Accuracy: 0.9436



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:15,  1.39s/it][A
 25%|██▌       | 3/12 [00:01<00:03,  2.43it/s][A
 42%|████▏     | 5/12 [00:02<00:02,  2.49it/s][A
 58%|█████▊    | 7/12 [00:02<00:01,  3.81it/s][A
 75%|███████▌  | 9/12 [00:03<00:00,  3.65it/s][A
100%|██████████| 12/12 [00:03<00:00,  3.66it/s][A
Epochs:  92%|█████████▏| 90/98 [40:34<03:34, 26.85s/it]

Val Loss: 2.2186 - Val Accuracy: 0.9374



Training:   0%|          | 0/95 [00:00<?, ?it/s][A
Training:   1%|          | 1/95 [00:01<02:24,  1.53s/it][A
Training:   4%|▍         | 4/95 [00:01<00:30,  3.01it/s][A
Training:   6%|▋         | 6/95 [00:02<00:34,  2.59it/s][A
Training:   8%|▊         | 8/95 [00:02<00:22,  3.83it/s][A
Training:  11%|█         | 10/95 [00:03<00:24,  3.51it/s][A
Training:  14%|█▎        | 13/95 [00:03<00:20,  4.01it/s][A
Training:  16%|█▌        | 15/95 [00:04<00:15,  5.18it/s][A
Training:  18%|█▊        | 17/95 [00:04<00:20,  3.90it/s][A
Training:  20%|██        | 19/95 [00:05<00:15,  4.82it/s][A
Training:  22%|██▏       | 21/95 [00:05<00:18,  3.95it/s][A
Training:  24%|██▍       | 23/95 [00:06<00:17,  4.21it/s][A
Training:  25%|██▌       | 24/95 [00:06<00:15,  4.60it/s][A
Training:  26%|██▋       | 25/95 [00:06<00:17,  3.90it/s][A
Training:  28%|██▊       | 27/95 [00:07<00:15,  4.25it/s][A
Training:  31%|███       | 29/95 [00:07<00:15,  4.36it/s][A
Training:  33%|███▎      | 31/95 [00

Epoch: 91/98 - Loss: 1.7322 - Accuracy: 0.9444



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:14,  1.34s/it][A
 25%|██▌       | 3/12 [00:01<00:03,  2.41it/s][A
 33%|███▎      | 4/12 [00:01<00:02,  3.22it/s][A
 42%|████▏     | 5/12 [00:02<00:03,  2.27it/s][A
 58%|█████▊    | 7/12 [00:02<00:01,  3.86it/s][A
 75%|███████▌  | 9/12 [00:03<00:00,  3.33it/s][A
100%|██████████| 12/12 [00:03<00:00,  3.53it/s][A
Epochs:  93%|█████████▎| 91/98 [41:01<03:07, 26.75s/it]

Val Loss: 2.0870 - Val Accuracy: 0.9336



Training:   0%|          | 0/95 [00:00<?, ?it/s][A
Training:   1%|          | 1/95 [00:01<02:12,  1.41s/it][A
Training:   3%|▎         | 3/95 [00:01<00:37,  2.45it/s][A
Training:   5%|▌         | 5/95 [00:02<00:36,  2.46it/s][A
Training:   6%|▋         | 6/95 [00:02<00:29,  3.03it/s][A
Training:   8%|▊         | 8/95 [00:02<00:18,  4.73it/s][A
Training:  11%|█         | 10/95 [00:03<00:24,  3.46it/s][A
Training:  14%|█▎        | 13/95 [00:03<00:19,  4.23it/s][A
Training:  15%|█▍        | 14/95 [00:04<00:19,  4.20it/s][A
Training:  17%|█▋        | 16/95 [00:04<00:14,  5.56it/s][A
Training:  18%|█▊        | 17/95 [00:04<00:17,  4.34it/s][A
Training:  19%|█▉        | 18/95 [00:05<00:18,  4.19it/s][A
Training:  21%|██        | 20/95 [00:05<00:12,  5.95it/s][A
Training:  22%|██▏       | 21/95 [00:05<00:15,  4.81it/s][A
Training:  23%|██▎       | 22/95 [00:05<00:17,  4.22it/s][A
Training:  25%|██▌       | 24/95 [00:05<00:12,  5.78it/s][A
Training:  26%|██▋       | 25/95 [00:

Epoch: 92/98 - Loss: 1.8060 - Accuracy: 0.9422



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:15,  1.44s/it][A
 17%|█▋        | 2/12 [00:01<00:06,  1.49it/s][A
 33%|███▎      | 4/12 [00:01<00:02,  3.32it/s][A
 42%|████▏     | 5/12 [00:02<00:02,  2.36it/s][A
 50%|█████     | 6/12 [00:02<00:02,  2.93it/s][A
 75%|███████▌  | 9/12 [00:03<00:00,  3.38it/s][A
100%|██████████| 12/12 [00:03<00:00,  3.27it/s][A
Epochs:  94%|█████████▍| 92/98 [41:27<02:40, 26.77s/it]

Val Loss: 2.4505 - Val Accuracy: 0.8903



Training:   0%|          | 0/95 [00:00<?, ?it/s][A
Training:   1%|          | 1/95 [00:01<02:13,  1.43s/it][A
Training:   5%|▌         | 5/95 [00:02<00:35,  2.52it/s][A
Training:   6%|▋         | 6/95 [00:02<00:29,  3.05it/s][A
Training:   8%|▊         | 8/95 [00:02<00:19,  4.52it/s][A
Training:  11%|█         | 10/95 [00:03<00:23,  3.55it/s][A
Training:  13%|█▎        | 12/95 [00:03<00:17,  4.82it/s][A
Training:  15%|█▍        | 14/95 [00:04<00:25,  3.17it/s][A
Training:  16%|█▌        | 15/95 [00:04<00:22,  3.63it/s][A
Training:  18%|█▊        | 17/95 [00:05<00:22,  3.50it/s][A
Training:  22%|██▏       | 21/95 [00:05<00:17,  4.21it/s][A
Training:  23%|██▎       | 22/95 [00:06<00:15,  4.62it/s][A
Training:  25%|██▌       | 24/95 [00:06<00:12,  5.75it/s][A
Training:  26%|██▋       | 25/95 [00:06<00:17,  4.10it/s][A
Training:  28%|██▊       | 27/95 [00:06<00:12,  5.27it/s][A
Training:  29%|██▉       | 28/95 [00:07<00:11,  5.60it/s][A
Training:  31%|███       | 29/95 [00

Epoch: 93/98 - Loss: 1.8515 - Accuracy: 0.9387



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:15,  1.45s/it][A
 25%|██▌       | 3/12 [00:01<00:03,  2.40it/s][A
 42%|████▏     | 5/12 [00:02<00:02,  2.43it/s][A
 58%|█████▊    | 7/12 [00:02<00:01,  3.81it/s][A
 75%|███████▌  | 9/12 [00:03<00:00,  3.16it/s][A
100%|██████████| 12/12 [00:03<00:00,  3.32it/s][A
Epochs:  95%|█████████▍| 93/98 [41:55<02:14, 27.00s/it]

Val Loss: 2.1452 - Val Accuracy: 0.9411



Training:   0%|          | 0/95 [00:00<?, ?it/s][A
Training:   1%|          | 1/95 [00:01<01:46,  1.14s/it][A
Training:   3%|▎         | 3/95 [00:01<00:30,  2.98it/s][A
Training:   5%|▌         | 5/95 [00:02<00:35,  2.56it/s][A
Training:   7%|▋         | 7/95 [00:02<00:22,  3.99it/s][A
Training:   9%|▉         | 9/95 [00:03<00:26,  3.25it/s][A
Training:  12%|█▏        | 11/95 [00:03<00:18,  4.58it/s][A
Training:  14%|█▎        | 13/95 [00:04<00:24,  3.39it/s][A
Training:  16%|█▌        | 15/95 [00:04<00:17,  4.60it/s][A
Training:  18%|█▊        | 17/95 [00:04<00:20,  3.80it/s][A
Training:  20%|██        | 19/95 [00:05<00:15,  5.00it/s][A
Training:  22%|██▏       | 21/95 [00:05<00:17,  4.26it/s][A
Training:  25%|██▌       | 24/95 [00:06<00:13,  5.15it/s][A
Training:  26%|██▋       | 25/95 [00:06<00:17,  4.02it/s][A
Training:  28%|██▊       | 27/95 [00:06<00:13,  5.11it/s][A
Training:  29%|██▉       | 28/95 [00:07<00:14,  4.64it/s][A
Training:  31%|███       | 29/95 [00:

Epoch: 94/98 - Loss: 1.8824 - Accuracy: 0.9434



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:13,  1.27s/it][A
 25%|██▌       | 3/12 [00:01<00:03,  2.59it/s][A
 42%|████▏     | 5/12 [00:02<00:02,  2.51it/s][A
 67%|██████▋   | 8/12 [00:02<00:00,  4.60it/s][A
100%|██████████| 12/12 [00:03<00:00,  3.44it/s][A
Epochs:  96%|█████████▌| 94/98 [42:22<01:48, 27.08s/it]

Val Loss: 2.2022 - Val Accuracy: 0.9097



Training:   0%|          | 0/95 [00:00<?, ?it/s][A
Training:   1%|          | 1/95 [00:01<02:16,  1.45s/it][A
Training:   3%|▎         | 3/95 [00:01<00:38,  2.41it/s][A
Training:   5%|▌         | 5/95 [00:02<00:32,  2.81it/s][A
Training:   8%|▊         | 8/95 [00:02<00:16,  5.33it/s][A
Training:  11%|█         | 10/95 [00:03<00:23,  3.67it/s][A
Training:  13%|█▎        | 12/95 [00:03<00:17,  4.76it/s][A
Training:  15%|█▍        | 14/95 [00:04<00:22,  3.56it/s][A
Training:  17%|█▋        | 16/95 [00:04<00:16,  4.69it/s][A
Training:  19%|█▉        | 18/95 [00:05<00:22,  3.36it/s][A
Training:  22%|██▏       | 21/95 [00:05<00:16,  4.49it/s][A
Training:  23%|██▎       | 22/95 [00:06<00:20,  3.64it/s][A
Training:  25%|██▌       | 24/95 [00:06<00:15,  4.71it/s][A
Training:  26%|██▋       | 25/95 [00:06<00:14,  4.69it/s][A
Training:  27%|██▋       | 26/95 [00:06<00:17,  4.00it/s][A
Training:  31%|███       | 29/95 [00:07<00:13,  5.02it/s][A
Training:  32%|███▏      | 30/95 [00

Epoch: 95/98 - Loss: 1.8464 - Accuracy: 0.9420



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:13,  1.24s/it][A
 17%|█▋        | 2/12 [00:01<00:05,  1.73it/s][A
 33%|███▎      | 4/12 [00:01<00:02,  3.89it/s][A
 42%|████▏     | 5/12 [00:02<00:02,  2.62it/s][A
 50%|█████     | 6/12 [00:02<00:02,  3.00it/s][A
 67%|██████▋   | 8/12 [00:02<00:00,  4.69it/s][A
100%|██████████| 12/12 [00:03<00:00,  3.39it/s][A
Epochs:  97%|█████████▋| 95/98 [42:49<01:20, 26.88s/it]

Val Loss: 2.1853 - Val Accuracy: 0.9357



Training:   0%|          | 0/95 [00:00<?, ?it/s][A
Training:   1%|          | 1/95 [00:01<02:03,  1.31s/it][A
Training:   3%|▎         | 3/95 [00:01<00:35,  2.60it/s][A
Training:   5%|▌         | 5/95 [00:02<00:35,  2.54it/s][A
Training:   7%|▋         | 7/95 [00:02<00:21,  4.03it/s][A
Training:   9%|▉         | 9/95 [00:03<00:25,  3.34it/s][A
Training:  12%|█▏        | 11/95 [00:03<00:17,  4.67it/s][A
Training:  14%|█▎        | 13/95 [00:03<00:19,  4.12it/s][A
Training:  17%|█▋        | 16/95 [00:04<00:14,  5.45it/s][A
Training:  18%|█▊        | 17/95 [00:04<00:18,  4.24it/s][A
Training:  20%|██        | 19/95 [00:04<00:13,  5.45it/s][A
Training:  21%|██        | 20/95 [00:05<00:14,  5.09it/s][A
Training:  22%|██▏       | 21/95 [00:05<00:18,  3.99it/s][A
Training:  25%|██▌       | 24/95 [00:05<00:11,  5.97it/s][A
Training:  26%|██▋       | 25/95 [00:06<00:17,  4.02it/s][A
Training:  28%|██▊       | 27/95 [00:06<00:12,  5.46it/s][A
Training:  31%|███       | 29/95 [00:

Epoch: 96/98 - Loss: 1.8258 - Accuracy: 0.9424



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:12,  1.14s/it][A
 25%|██▌       | 3/12 [00:01<00:03,  2.92it/s][A
 42%|████▏     | 5/12 [00:02<00:02,  2.56it/s][A
 67%|██████▋   | 8/12 [00:02<00:00,  4.85it/s][A
100%|██████████| 12/12 [00:03<00:00,  3.66it/s][A
Epochs:  98%|█████████▊| 96/98 [43:15<00:53, 26.70s/it]

Val Loss: 2.4354 - Val Accuracy: 0.9377



Training:   0%|          | 0/95 [00:00<?, ?it/s][A
Training:   1%|          | 1/95 [00:01<02:13,  1.42s/it][A
Training:   2%|▏         | 2/95 [00:01<01:00,  1.53it/s][A
Training:   4%|▍         | 4/95 [00:01<00:26,  3.42it/s][A
Training:   5%|▌         | 5/95 [00:02<00:35,  2.56it/s][A
Training:   6%|▋         | 6/95 [00:02<00:29,  3.03it/s][A
Training:   8%|▊         | 8/95 [00:02<00:17,  4.96it/s][A
Training:   9%|▉         | 9/95 [00:03<00:25,  3.38it/s][A
Training:  11%|█         | 10/95 [00:03<00:22,  3.84it/s][A
Training:  13%|█▎        | 12/95 [00:03<00:14,  5.63it/s][A
Training:  14%|█▎        | 13/95 [00:04<00:24,  3.32it/s][A
Training:  15%|█▍        | 14/95 [00:04<00:21,  3.71it/s][A
Training:  17%|█▋        | 16/95 [00:04<00:14,  5.48it/s][A
Training:  18%|█▊        | 17/95 [00:05<00:21,  3.60it/s][A
Training:  19%|█▉        | 18/95 [00:05<00:21,  3.60it/s][A
Training:  21%|██        | 20/95 [00:05<00:14,  5.19it/s][A
Training:  22%|██▏       | 21/95 [00:05

Epoch: 97/98 - Loss: 1.7562 - Accuracy: 0.9455



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:14,  1.36s/it][A
 17%|█▋        | 2/12 [00:01<00:06,  1.62it/s][A
 33%|███▎      | 4/12 [00:01<00:02,  3.73it/s][A
 50%|█████     | 6/12 [00:02<00:02,  2.97it/s][A
100%|██████████| 12/12 [00:03<00:00,  3.43it/s][A
Epochs:  99%|█████████▉| 97/98 [43:42<00:26, 26.90s/it]

Val Loss: 2.2448 - Val Accuracy: 0.9257



Training:   0%|          | 0/95 [00:00<?, ?it/s][A
Training:   1%|          | 1/95 [00:01<02:29,  1.59s/it][A
Training:   4%|▍         | 4/95 [00:01<00:30,  3.01it/s][A
Training:   6%|▋         | 6/95 [00:02<00:32,  2.76it/s][A
Training:   7%|▋         | 7/95 [00:02<00:26,  3.28it/s][A
Training:   9%|▉         | 9/95 [00:03<00:27,  3.12it/s][A
Training:  12%|█▏        | 11/95 [00:03<00:19,  4.37it/s][A
Training:  14%|█▎        | 13/95 [00:04<00:22,  3.66it/s][A
Training:  15%|█▍        | 14/95 [00:04<00:20,  4.03it/s][A
Training:  16%|█▌        | 15/95 [00:04<00:18,  4.37it/s][A
Training:  18%|█▊        | 17/95 [00:05<00:20,  3.83it/s][A
Training:  19%|█▉        | 18/95 [00:05<00:17,  4.38it/s][A
Training:  20%|██        | 19/95 [00:05<00:16,  4.48it/s][A
Training:  22%|██▏       | 21/95 [00:05<00:17,  4.19it/s][A
Training:  23%|██▎       | 22/95 [00:06<00:15,  4.81it/s][A
Training:  24%|██▍       | 23/95 [00:06<00:14,  5.14it/s][A
Training:  26%|██▋       | 25/95 [00:

Epoch: 98/98 - Loss: 1.8252 - Accuracy: 0.9456



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:15,  1.41s/it][A
 42%|████▏     | 5/12 [00:02<00:02,  2.33it/s][A
100%|██████████| 12/12 [00:03<00:00,  3.39it/s][A
Epochs: 100%|██████████| 98/98 [44:09<00:00, 27.04s/it]


Val Loss: 2.3263 - Val Accuracy: 0.8843


[32m[I 2023-12-15 00:34:01,459][0m Trial 7 finished with value: 0.8843218684196472 and parameters: {'loss_learning_rate': 0.00017237051393809033, 'learning_rate': 0.005231337095494607, 'weight_decay': 0.0010085209986501272, 'epsilon': 1.0952706936186941e-08, 'batch_size': 148, 'epochs': 98}. Best is trial 3 with value: 0.9413145780563354.[0m


Learning rate for Loss: 0.003051727754771083
Learning rate: 1.0981903003814207e-05
Weight decay: 0.0008344988551319097
Epsilon: 4.720113297586265e-09
Batch size: 204
Number of epochs: 71


Epochs:   0%|          | 0/71 [00:00<?, ?it/s]
Training:   0%|          | 0/69 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/69 [00:01<01:54,  1.68s/it][A
Training:   4%|▍         | 3/69 [00:01<00:32,  2.01it/s][A
Training:   7%|▋         | 5/69 [00:02<00:33,  1.88it/s][A
Training:  10%|█         | 7/69 [00:03<00:21,  2.88it/s][A
Training:  13%|█▎        | 9/69 [00:04<00:24,  2.46it/s][A
Training:  16%|█▌        | 11/69 [00:04<00:18,  3.22it/s][A
Training:  19%|█▉        | 13/69 [00:05<00:20,  2.77it/s][A
Training:  22%|██▏       | 15/69 [00:05<00:15,  3.51it/s][A
Training:  25%|██▍       | 17/69 [00:06<00:17,  3.02it/s][A
Training:  28%|██▊       | 19/69 [00:06<00:14,  3.41it/s][A
Training:  30%|███       | 21/69 [00:07<00:17,  2.76it/s][A
Training:  32%|███▏      | 22/69 [00:08<00:14,  3.17it/s][A
Training:  33%|███▎      | 23/69 [00:08<00:13,  3.50it/s][A
Training:  36%|███▌      | 25/69 [00:09<00:16,  2.59it/s][A
Training:  39%|███▉      | 27/69 [00:09<00:11,  3.65

Epoch: 1/71 - Loss: 28.0001 - Accuracy: 0.5743



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:01<00:12,  1.53s/it][A
 22%|██▏       | 2/9 [00:01<00:04,  1.43it/s][A
 44%|████▍     | 4/9 [00:01<00:01,  3.11it/s][A
 56%|█████▌    | 5/9 [00:02<00:01,  2.04it/s][A
 67%|██████▋   | 6/9 [00:02<00:01,  2.54it/s][A
 78%|███████▊  | 7/9 [00:03<00:00,  2.89it/s][A
100%|██████████| 9/9 [00:03<00:00,  2.56it/s][A
Epochs:   0%|          | 0/71 [00:26<?, ?it/s]
[32m[I 2023-12-15 00:34:28,636][0m Trial 8 pruned. [0m


Val Loss: 24.5186 - Val Accuracy: 0.6030
Learning rate for Loss: 0.0031807063540439545
Learning rate: 5.7594623285778144e-05
Weight decay: 0.006299303958659332
Epsilon: 2.4375762402836795e-09
Batch size: 265
Number of epochs: 47


Epochs:   0%|          | 0/47 [00:00<?, ?it/s]
Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:01<01:32,  1.79s/it][A
Training:   4%|▍         | 2/53 [00:01<00:42,  1.20it/s][A
Training:   8%|▊         | 4/53 [00:02<00:18,  2.71it/s][A
Training:   9%|▉         | 5/53 [00:03<00:33,  1.44it/s][A
Training:  11%|█▏        | 6/53 [00:03<00:24,  1.93it/s][A
Training:  13%|█▎        | 7/53 [00:03<00:18,  2.55it/s][A
Training:  15%|█▌        | 8/53 [00:03<00:13,  3.25it/s][A
Training:  17%|█▋        | 9/53 [00:05<00:25,  1.76it/s][A
Training:  21%|██        | 11/53 [00:05<00:14,  2.86it/s][A
Training:  25%|██▍       | 13/53 [00:06<00:20,  1.99it/s][A
Training:  28%|██▊       | 15/53 [00:06<00:12,  2.94it/s][A
Training:  30%|███       | 16/53 [00:07<00:11,  3.29it/s][A
Training:  32%|███▏      | 17/53 [00:08<00:18,  1.92it/s][A
Training:  38%|███▊      | 20/53 [00:08<00:10,  3.03it/s][A
Training:  40%|███▉      | 21/53 [00:09<00:16,  2.00it/

Epoch: 1/47 - Loss: 24.0846 - Accuracy: 0.6069



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:02<00:13,  2.26s/it][A
 43%|████▎     | 3/7 [00:02<00:02,  1.60it/s][A
100%|██████████| 7/7 [00:03<00:00,  1.76it/s][A
Epochs:   0%|          | 0/47 [00:27<?, ?it/s]
[32m[I 2023-12-15 00:34:56,566][0m Trial 9 pruned. [0m


Val Loss: 16.5937 - Val Accuracy: 0.7065
Learning rate for Loss: 0.000993899885376822
Learning rate: 0.0003501871985411181
Weight decay: 0.0001625787648406097
Epsilon: 4.2341545795510904e-08
Batch size: 297
Number of epochs: 36


Epochs:   0%|          | 0/36 [00:00<?, ?it/s]
Training:   0%|          | 0/48 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/48 [00:02<01:50,  2.36s/it][A
Training:   4%|▍         | 2/48 [00:02<00:56,  1.22s/it][A
Training:   8%|▊         | 4/48 [00:02<00:22,  1.99it/s][A
Training:  10%|█         | 5/48 [00:04<00:34,  1.24it/s][A
Training:  12%|█▎        | 6/48 [00:04<00:27,  1.53it/s][A
Training:  17%|█▋        | 8/48 [00:04<00:14,  2.68it/s][A
Training:  19%|█▉        | 9/48 [00:06<00:25,  1.53it/s][A
Training:  21%|██        | 10/48 [00:06<00:19,  1.91it/s][A
Training:  23%|██▎       | 11/48 [00:06<00:15,  2.42it/s][A
Training:  25%|██▌       | 12/48 [00:06<00:12,  2.98it/s][A
Training:  27%|██▋       | 13/48 [00:08<00:22,  1.53it/s][A
Training:  29%|██▉       | 14/48 [00:08<00:17,  1.94it/s][A
Training:  31%|███▏      | 15/48 [00:08<00:13,  2.48it/s][A
Training:  35%|███▌      | 17/48 [00:09<00:15,  1.97it/s][A
Training:  38%|███▊      | 18/48 [00:10<00:14,  2.01it

Epoch: 1/36 - Loss: 14.9258 - Accuracy: 0.7124



  0%|          | 0/6 [00:00<?, ?it/s][A
 17%|█▋        | 1/6 [00:02<00:11,  2.33s/it][A
 33%|███▎      | 2/6 [00:02<00:04,  1.02s/it][A
 67%|██████▋   | 4/6 [00:02<00:00,  2.14it/s][A
100%|██████████| 6/6 [00:04<00:00,  1.47it/s][A
Epochs:   0%|          | 0/36 [00:28<?, ?it/s]
[32m[I 2023-12-15 00:35:25,223][0m Trial 10 pruned. [0m


Val Loss: 9.1559 - Val Accuracy: 0.8392
Learning rate for Loss: 0.0022039026522337533
Learning rate: 0.003855536505422354
Weight decay: 0.003485245048842352
Epsilon: 1.1759787698978145e-08
Batch size: 50
Number of epochs: 43


Epochs:   0%|          | 0/43 [00:00<?, ?it/s]
Training:   0%|          | 0/280 [00:00<?, ?it/s][A
Training:   0%|          | 1/280 [00:00<03:45,  1.24it/s][A
Training:   2%|▏         | 5/280 [00:01<00:51,  5.39it/s][A
Training:   3%|▎         | 9/280 [00:01<00:36,  7.44it/s][A
Training:   4%|▍         | 12/280 [00:01<00:26, 10.11it/s][A
Training:   5%|▌         | 14/280 [00:01<00:30,  8.68it/s][A
Training:   6%|▌         | 17/280 [00:02<00:29,  8.96it/s][A
Training:   8%|▊         | 21/280 [00:02<00:25, 10.16it/s][A
Training:   9%|▊         | 24/280 [00:02<00:20, 12.62it/s][A
Training:   9%|▉         | 26/280 [00:02<00:22, 11.14it/s][A
Training:  10%|█         | 28/280 [00:03<00:20, 12.43it/s][A
Training:  11%|█         | 30/280 [00:03<00:22, 10.92it/s][A
Training:  12%|█▏        | 33/280 [00:03<00:24,  9.88it/s][A
Training:  13%|█▎        | 36/280 [00:03<00:19, 12.73it/s][A
Training:  14%|█▎        | 38/280 [00:03<00:20, 11.59it/s][A
Training:  15%|█▍        | 41/280 [

Epoch: 1/43 - Loss: 5.4590 - Accuracy: 0.8680



  0%|          | 0/35 [00:00<?, ?it/s][A
  3%|▎         | 1/35 [00:00<00:24,  1.38it/s][A
 11%|█▏        | 4/35 [00:00<00:05,  5.50it/s][A
 17%|█▋        | 6/35 [00:01<00:03,  7.88it/s][A
 23%|██▎       | 8/35 [00:01<00:02,  9.56it/s][A
 29%|██▊       | 10/35 [00:01<00:02, 10.38it/s][A
 37%|███▋      | 13/35 [00:01<00:02, 10.98it/s][A
 46%|████▌     | 16/35 [00:01<00:01, 13.04it/s][A
 51%|█████▏    | 18/35 [00:01<00:01, 13.45it/s][A
 57%|█████▋    | 20/35 [00:02<00:01, 13.18it/s][A
 63%|██████▎   | 22/35 [00:02<00:00, 13.83it/s][A
 69%|██████▊   | 24/35 [00:02<00:00, 11.80it/s][A
 77%|███████▋  | 27/35 [00:02<00:00, 14.25it/s][A
 83%|████████▎ | 29/35 [00:02<00:00, 11.26it/s][A
100%|██████████| 35/35 [00:03<00:00, 10.77it/s][A
Epochs:   2%|▏         | 1/43 [00:27<18:57, 27.08s/it]

Val Loss: 3.4410 - Val Accuracy: 0.9290



Training:   0%|          | 0/280 [00:00<?, ?it/s][A
Training:   0%|          | 1/280 [00:00<03:27,  1.35it/s][A
Training:   1%|          | 3/280 [00:00<01:05,  4.23it/s][A
Training:   2%|▏         | 5/280 [00:01<00:49,  5.53it/s][A
Training:   3%|▎         | 8/280 [00:01<00:28,  9.59it/s][A
Training:   4%|▎         | 10/280 [00:01<00:28,  9.39it/s][A
Training:   5%|▍         | 13/280 [00:01<00:25, 10.40it/s][A
Training:   6%|▌         | 16/280 [00:01<00:19, 13.65it/s][A
Training:   6%|▋         | 18/280 [00:01<00:20, 12.60it/s][A
Training:   8%|▊         | 21/280 [00:02<00:22, 11.64it/s][A
Training:   9%|▉         | 25/280 [00:02<00:21, 11.63it/s][A
Training:  10%|█         | 29/280 [00:02<00:21, 11.74it/s][A
Training:  12%|█▏        | 33/280 [00:03<00:21, 11.41it/s][A
Training:  13%|█▎        | 36/280 [00:03<00:17, 13.65it/s][A
Training:  14%|█▎        | 38/280 [00:03<00:21, 11.39it/s][A
Training:  15%|█▍        | 41/280 [00:04<00:23, 10.32it/s][A
Training:  16%|█▌   

Epoch: 2/43 - Loss: 3.2342 - Accuracy: 0.9133



  0%|          | 0/35 [00:00<?, ?it/s][A
  3%|▎         | 1/35 [00:00<00:28,  1.20it/s][A
  9%|▊         | 3/35 [00:00<00:08,  3.76it/s][A
 14%|█▍        | 5/35 [00:01<00:05,  5.86it/s][A
 26%|██▌       | 9/35 [00:01<00:03,  8.05it/s][A
 37%|███▋      | 13/35 [00:01<00:02,  9.60it/s][A
 49%|████▊     | 17/35 [00:02<00:01, 11.79it/s][A
 54%|█████▍    | 19/35 [00:02<00:01, 12.48it/s][A
 60%|██████    | 21/35 [00:02<00:01, 12.23it/s][A
 66%|██████▌   | 23/35 [00:02<00:00, 12.47it/s][A
 74%|███████▍  | 26/35 [00:02<00:00, 15.04it/s][A
 80%|████████  | 28/35 [00:02<00:00, 13.97it/s][A
 86%|████████▌ | 30/35 [00:02<00:00, 14.67it/s][A
 91%|█████████▏| 32/35 [00:03<00:00, 14.03it/s][A
100%|██████████| 35/35 [00:03<00:00, 10.50it/s][A
Epochs:   5%|▍         | 2/43 [00:53<18:03, 26.42s/it]

Val Loss: 2.6154 - Val Accuracy: 0.9271



Training:   0%|          | 0/280 [00:00<?, ?it/s][A
Training:   0%|          | 1/280 [00:00<04:01,  1.16it/s][A
Training:   2%|▏         | 5/280 [00:01<00:55,  4.99it/s][A
Training:   3%|▎         | 9/280 [00:01<00:36,  7.35it/s][A
Training:   4%|▍         | 11/280 [00:01<00:30,  8.84it/s][A
Training:   5%|▍         | 13/280 [00:01<00:29,  8.97it/s][A
Training:   6%|▌         | 16/280 [00:01<00:22, 11.99it/s][A
Training:   6%|▋         | 18/280 [00:02<00:26,  9.96it/s][A
Training:   7%|▋         | 20/280 [00:02<00:22, 11.42it/s][A
Training:   8%|▊         | 22/280 [00:02<00:21, 11.87it/s][A
Training:   9%|▉         | 25/280 [00:02<00:23, 10.84it/s][A
Training:  10%|█         | 29/280 [00:03<00:21, 11.74it/s][A
Training:  12%|█▏        | 33/280 [00:03<00:20, 12.12it/s][A
Training:  13%|█▎        | 36/280 [00:03<00:17, 14.06it/s][A
Training:  14%|█▎        | 38/280 [00:03<00:21, 11.24it/s][A
Training:  15%|█▍        | 41/280 [00:04<00:22, 10.49it/s][A
Training:  16%|█▌  

Epoch: 3/43 - Loss: 2.6478 - Accuracy: 0.9283



  0%|          | 0/35 [00:00<?, ?it/s][A
  3%|▎         | 1/35 [00:00<00:22,  1.53it/s][A
 11%|█▏        | 4/35 [00:00<00:04,  6.22it/s][A
 17%|█▋        | 6/35 [00:00<00:03,  8.54it/s][A
 23%|██▎       | 8/35 [00:01<00:02,  9.73it/s][A
 29%|██▊       | 10/35 [00:01<00:02, 10.81it/s][A
 34%|███▍      | 12/35 [00:01<00:02, 10.65it/s][A
 43%|████▎     | 15/35 [00:01<00:01, 13.69it/s][A
 49%|████▊     | 17/35 [00:01<00:01, 12.76it/s][A
 57%|█████▋    | 20/35 [00:02<00:01, 11.53it/s][A
 66%|██████▌   | 23/35 [00:02<00:00, 14.64it/s][A
 71%|███████▏  | 25/35 [00:02<00:00, 11.64it/s][A
 80%|████████  | 28/35 [00:02<00:00, 10.53it/s][A
100%|██████████| 35/35 [00:03<00:00, 10.84it/s][A
Epochs:   7%|▋         | 3/43 [01:19<17:43, 26.58s/it]

Val Loss: 2.4356 - Val Accuracy: 0.9313



Training:   0%|          | 0/280 [00:00<?, ?it/s][A
Training:   0%|          | 1/280 [00:00<03:21,  1.39it/s][A
Training:   1%|          | 3/280 [00:00<01:04,  4.32it/s][A
Training:   2%|▏         | 5/280 [00:01<00:47,  5.83it/s][A
Training:   2%|▎         | 7/280 [00:01<00:33,  8.11it/s][A
Training:   3%|▎         | 9/280 [00:01<00:31,  8.53it/s][A
Training:   4%|▍         | 11/280 [00:01<00:26, 10.25it/s][A
Training:   5%|▍         | 13/280 [00:01<00:27,  9.79it/s][A
Training:   5%|▌         | 15/280 [00:01<00:23, 11.17it/s][A
Training:   6%|▌         | 17/280 [00:02<00:21, 12.15it/s][A
Training:   7%|▋         | 19/280 [00:02<00:23, 11.02it/s][A
Training:   8%|▊         | 21/280 [00:02<00:23, 11.15it/s][A
Training:   8%|▊         | 23/280 [00:02<00:22, 11.66it/s][A
Training:   9%|▉         | 25/280 [00:02<00:23, 10.85it/s][A
Training:  10%|▉         | 27/280 [00:02<00:21, 11.92it/s][A
Training:  10%|█         | 29/280 [00:03<00:25,  9.85it/s][A
Training:  11%|█     

Epoch: 4/43 - Loss: 2.6766 - Accuracy: 0.9260



  0%|          | 0/35 [00:00<?, ?it/s][A
  3%|▎         | 1/35 [00:00<00:21,  1.60it/s][A
  6%|▌         | 2/35 [00:00<00:11,  3.00it/s][A
 14%|█▍        | 5/35 [00:00<00:04,  7.23it/s][A
 20%|██        | 7/35 [00:01<00:03,  8.93it/s][A
 26%|██▌       | 9/35 [00:01<00:02, 10.03it/s][A
 31%|███▏      | 11/35 [00:01<00:02, 10.09it/s][A
 37%|███▋      | 13/35 [00:01<00:02, 10.05it/s][A
 49%|████▊     | 17/35 [00:01<00:01, 10.68it/s][A
 54%|█████▍    | 19/35 [00:02<00:01, 11.40it/s][A
 60%|██████    | 21/35 [00:02<00:01, 11.39it/s][A
 66%|██████▌   | 23/35 [00:02<00:01, 11.97it/s][A
 71%|███████▏  | 25/35 [00:02<00:00, 11.57it/s][A
 77%|███████▋  | 27/35 [00:02<00:00, 10.90it/s][A
 83%|████████▎ | 29/35 [00:03<00:00, 11.09it/s][A
 91%|█████████▏| 32/35 [00:03<00:00, 14.53it/s][A
100%|██████████| 35/35 [00:03<00:00,  9.77it/s][A
Epochs:   9%|▉         | 4/43 [01:47<17:34, 27.05s/it]

Val Loss: 2.6780 - Val Accuracy: 0.9347



Training:   0%|          | 0/280 [00:00<?, ?it/s][A
Training:   0%|          | 1/280 [00:00<02:29,  1.86it/s][A
Training:   1%|          | 2/280 [00:00<01:30,  3.07it/s][A
Training:   2%|▏         | 5/280 [00:00<00:38,  7.17it/s][A
Training:   2%|▏         | 6/280 [00:01<00:37,  7.22it/s][A
Training:   3%|▎         | 9/280 [00:01<00:23, 11.38it/s][A
Training:   4%|▍         | 11/280 [00:01<00:27,  9.89it/s][A
Training:   5%|▌         | 14/280 [00:01<00:25, 10.55it/s][A
Training:   6%|▌         | 17/280 [00:01<00:19, 13.41it/s][A
Training:   7%|▋         | 19/280 [00:02<00:25, 10.37it/s][A
Training:   8%|▊         | 22/280 [00:02<00:24, 10.36it/s][A
Training:   9%|▉         | 25/280 [00:02<00:19, 12.99it/s][A
Training:  10%|▉         | 27/280 [00:02<00:22, 11.21it/s][A
Training:  11%|█         | 30/280 [00:03<00:23, 10.67it/s][A
Training:  12%|█▏        | 34/280 [00:03<00:21, 11.40it/s][A
Training:  13%|█▎        | 37/280 [00:03<00:17, 13.83it/s][A
Training:  14%|█▍    

Epoch: 5/43 - Loss: 2.6164 - Accuracy: 0.9316



  0%|          | 0/35 [00:00<?, ?it/s][A
  3%|▎         | 1/35 [00:00<00:24,  1.39it/s][A
 14%|█▍        | 5/35 [00:01<00:05,  5.72it/s][A
 26%|██▌       | 9/35 [00:01<00:03,  7.67it/s][A
 37%|███▋      | 13/35 [00:01<00:02,  8.57it/s][A
 49%|████▊     | 17/35 [00:02<00:01,  9.48it/s][A
 60%|██████    | 21/35 [00:02<00:01, 10.67it/s][A
 71%|███████▏  | 25/35 [00:02<00:00, 11.41it/s][A
 83%|████████▎ | 29/35 [00:02<00:00, 12.99it/s][A
100%|██████████| 35/35 [00:03<00:00, 10.56it/s][A
Epochs:  12%|█▏        | 5/43 [02:13<16:54, 26.68s/it]

Val Loss: 2.3202 - Val Accuracy: 0.9336



Training:   0%|          | 0/280 [00:00<?, ?it/s][A
Training:   0%|          | 1/280 [00:00<03:19,  1.40it/s][A
Training:   1%|          | 3/280 [00:00<01:03,  4.33it/s][A
Training:   2%|▏         | 5/280 [00:01<00:49,  5.61it/s][A
Training:   2%|▎         | 7/280 [00:01<00:34,  8.02it/s][A
Training:   3%|▎         | 9/280 [00:01<00:34,  7.80it/s][A
Training:   4%|▍         | 12/280 [00:01<00:24, 10.75it/s][A
Training:   5%|▌         | 14/280 [00:01<00:24, 10.97it/s][A
Training:   6%|▌         | 16/280 [00:01<00:23, 11.35it/s][A
Training:   6%|▋         | 18/280 [00:02<00:22, 11.80it/s][A
Training:   7%|▋         | 20/280 [00:02<00:21, 12.01it/s][A
Training:   8%|▊         | 22/280 [00:02<00:21, 12.13it/s][A
Training:   9%|▊         | 24/280 [00:02<00:21, 12.03it/s][A
Training:   9%|▉         | 26/280 [00:02<00:21, 11.70it/s][A
Training:  10%|█         | 29/280 [00:02<00:19, 12.85it/s][A
Training:  11%|█         | 31/280 [00:03<00:19, 12.70it/s][A
Training:  12%|█▏    

Epoch: 6/43 - Loss: 2.3932 - Accuracy: 0.9286



  0%|          | 0/35 [00:00<?, ?it/s][A
  3%|▎         | 1/35 [00:00<00:25,  1.36it/s][A
 14%|█▍        | 5/35 [00:01<00:05,  5.57it/s][A
 26%|██▌       | 9/35 [00:01<00:03,  7.93it/s][A
 37%|███▋      | 13/35 [00:01<00:02,  9.50it/s][A
 49%|████▊     | 17/35 [00:02<00:01, 10.60it/s][A
 60%|██████    | 21/35 [00:02<00:01, 11.65it/s][A
 71%|███████▏  | 25/35 [00:02<00:00, 12.77it/s][A
 83%|████████▎ | 29/35 [00:02<00:00, 13.05it/s][A
100%|██████████| 35/35 [00:03<00:00, 10.49it/s][A
Epochs:  14%|█▍        | 6/43 [02:40<16:33, 26.85s/it]

Val Loss: 2.5832 - Val Accuracy: 0.9277



Training:   0%|          | 0/280 [00:00<?, ?it/s][A
Training:   0%|          | 1/280 [00:00<02:19,  1.99it/s][A
Training:   1%|▏         | 4/280 [00:00<00:36,  7.51it/s][A
Training:   2%|▏         | 6/280 [00:00<00:28,  9.54it/s][A
Training:   3%|▎         | 8/280 [00:00<00:24, 10.91it/s][A
Training:   4%|▎         | 10/280 [00:01<00:24, 10.91it/s][A
Training:   4%|▍         | 12/280 [00:01<00:21, 12.47it/s][A
Training:   5%|▌         | 14/280 [00:01<00:22, 11.99it/s][A
Training:   6%|▌         | 16/280 [00:01<00:22, 11.49it/s][A
Training:   7%|▋         | 19/280 [00:01<00:19, 13.52it/s][A
Training:   8%|▊         | 21/280 [00:01<00:22, 11.57it/s][A
Training:   8%|▊         | 23/280 [00:02<00:21, 11.80it/s][A
Training:   9%|▉         | 25/280 [00:02<00:21, 12.00it/s][A
Training:  10%|▉         | 27/280 [00:02<00:20, 12.53it/s][A
Training:  10%|█         | 29/280 [00:02<00:21, 11.88it/s][A
Training:  11%|█         | 31/280 [00:02<00:20, 12.26it/s][A
Training:  12%|█▏   

Epoch: 7/43 - Loss: 2.3262 - Accuracy: 0.9318



  0%|          | 0/35 [00:00<?, ?it/s][A
  3%|▎         | 1/35 [00:00<00:22,  1.50it/s][A
 14%|█▍        | 5/35 [00:00<00:05,  5.94it/s][A
 26%|██▌       | 9/35 [00:01<00:03,  8.32it/s][A
 37%|███▋      | 13/35 [00:01<00:02,  9.27it/s][A
 49%|████▊     | 17/35 [00:01<00:01, 10.72it/s][A
 60%|██████    | 21/35 [00:02<00:01, 12.12it/s][A
 71%|███████▏  | 25/35 [00:02<00:00, 12.18it/s][A
 83%|████████▎ | 29/35 [00:02<00:00, 12.14it/s][A
100%|██████████| 35/35 [00:03<00:00, 10.39it/s][A
Epochs:  16%|█▋        | 7/43 [03:07<16:05, 26.81s/it]

Val Loss: 2.3434 - Val Accuracy: 0.9168



Training:   0%|          | 0/280 [00:00<?, ?it/s][A
Training:   0%|          | 1/280 [00:00<02:59,  1.55it/s][A
Training:   1%|          | 3/280 [00:00<00:56,  4.88it/s][A
Training:   2%|▏         | 5/280 [00:00<00:38,  7.20it/s][A
Training:   2%|▎         | 7/280 [00:01<00:31,  8.73it/s][A
Training:   3%|▎         | 9/280 [00:01<00:25, 10.75it/s][A
Training:   4%|▍         | 11/280 [00:01<00:26, 10.13it/s][A
Training:   5%|▌         | 14/280 [00:01<00:26,  9.86it/s][A
Training:   6%|▌         | 16/280 [00:01<00:24, 10.80it/s][A
Training:   6%|▋         | 18/280 [00:02<00:28,  9.31it/s][A
Training:   8%|▊         | 22/280 [00:02<00:25, 10.07it/s][A
Training:   9%|▉         | 26/280 [00:02<00:21, 11.77it/s][A
Training:  11%|█         | 30/280 [00:03<00:20, 12.06it/s][A
Training:  12%|█▏        | 33/280 [00:03<00:17, 14.46it/s][A
Training:  12%|█▎        | 35/280 [00:03<00:23, 10.25it/s][A
Training:  14%|█▎        | 38/280 [00:03<00:23, 10.10it/s][A
Training:  15%|█▍    

Epoch: 8/43 - Loss: 2.3321 - Accuracy: 0.9301



  0%|          | 0/35 [00:00<?, ?it/s][A
  3%|▎         | 1/35 [00:00<00:27,  1.23it/s][A
  6%|▌         | 2/35 [00:00<00:13,  2.45it/s][A
 17%|█▋        | 6/35 [00:01<00:04,  6.30it/s][A
 29%|██▊       | 10/35 [00:01<00:02,  8.94it/s][A
 40%|████      | 14/35 [00:01<00:02, 10.41it/s][A
 51%|█████▏    | 18/35 [00:02<00:01, 12.23it/s][A
 60%|██████    | 21/35 [00:02<00:00, 14.33it/s][A
 66%|██████▌   | 23/35 [00:02<00:00, 13.45it/s][A
 74%|███████▍  | 26/35 [00:02<00:00, 13.44it/s][A
 83%|████████▎ | 29/35 [00:02<00:00, 15.80it/s][A
 89%|████████▊ | 31/35 [00:02<00:00, 14.26it/s][A
 94%|█████████▍| 33/35 [00:03<00:00, 15.02it/s][A
100%|██████████| 35/35 [00:03<00:00, 10.51it/s][A
Epochs:  19%|█▊        | 8/43 [03:34<15:39, 26.86s/it]

Val Loss: 2.7617 - Val Accuracy: 0.9025



Training:   0%|          | 0/280 [00:00<?, ?it/s][A
Training:   0%|          | 1/280 [00:00<03:59,  1.16it/s][A
Training:   2%|▏         | 5/280 [00:01<00:47,  5.77it/s][A
Training:   3%|▎         | 8/280 [00:01<00:32,  8.33it/s][A
Training:   4%|▎         | 10/280 [00:01<00:29,  9.29it/s][A
Training:   4%|▍         | 12/280 [00:01<00:30,  8.78it/s][A
Training:   5%|▌         | 14/280 [00:01<00:25, 10.46it/s][A
Training:   6%|▌         | 16/280 [00:02<00:28,  9.19it/s][A
Training:   7%|▋         | 19/280 [00:02<00:20, 12.59it/s][A
Training:   8%|▊         | 21/280 [00:02<00:20, 12.42it/s][A
Training:   9%|▊         | 24/280 [00:02<00:20, 12.78it/s][A
Training:  10%|▉         | 27/280 [00:02<00:16, 15.15it/s][A
Training:  10%|█         | 29/280 [00:02<00:21, 11.91it/s][A
Training:  11%|█▏        | 32/280 [00:03<00:21, 11.31it/s][A
Training:  12%|█▎        | 35/280 [00:03<00:18, 13.35it/s][A
Training:  13%|█▎        | 37/280 [00:03<00:22, 10.92it/s][A
Training:  14%|█▍  

Epoch: 9/43 - Loss: 2.4234 - Accuracy: 0.9270



  0%|          | 0/35 [00:00<?, ?it/s][A
  3%|▎         | 1/35 [00:00<00:23,  1.45it/s][A
 14%|█▍        | 5/35 [00:00<00:05,  5.95it/s][A
 23%|██▎       | 8/35 [00:01<00:02,  9.58it/s][A
 29%|██▊       | 10/35 [00:01<00:03,  8.33it/s][A
 37%|███▋      | 13/35 [00:01<00:02,  9.43it/s][A
 43%|████▎     | 15/35 [00:01<00:01, 10.77it/s][A
 49%|████▊     | 17/35 [00:01<00:01, 10.93it/s][A
 60%|██████    | 21/35 [00:02<00:01, 12.31it/s][A
 66%|██████▌   | 23/35 [00:02<00:00, 12.74it/s][A
 71%|███████▏  | 25/35 [00:02<00:00, 11.80it/s][A
 77%|███████▋  | 27/35 [00:02<00:00, 12.88it/s][A
 83%|████████▎ | 29/35 [00:02<00:00, 12.11it/s][A
 91%|█████████▏| 32/35 [00:03<00:00, 15.05it/s][A
100%|██████████| 35/35 [00:03<00:00, 10.30it/s][A
Epochs:  21%|██        | 9/43 [04:01<15:11, 26.81s/it]

Val Loss: 2.6426 - Val Accuracy: 0.9289



Training:   0%|          | 0/280 [00:00<?, ?it/s][A
Training:   0%|          | 1/280 [00:00<03:58,  1.17it/s][A
Training:   1%|▏         | 4/280 [00:00<00:54,  5.05it/s][A
Training:   2%|▏         | 6/280 [00:01<00:41,  6.67it/s][A
Training:   3%|▎         | 9/280 [00:01<00:36,  7.42it/s][A
Training:   4%|▍         | 11/280 [00:01<00:29,  8.99it/s][A
Training:   5%|▍         | 13/280 [00:01<00:31,  8.37it/s][A
Training:   6%|▌         | 17/280 [00:02<00:26, 10.06it/s][A
Training:   7%|▋         | 20/280 [00:02<00:20, 12.42it/s][A
Training:   8%|▊         | 22/280 [00:02<00:22, 11.66it/s][A
Training:   9%|▉         | 25/280 [00:02<00:18, 14.09it/s][A
Training:  10%|▉         | 27/280 [00:02<00:19, 13.13it/s][A
Training:  10%|█         | 29/280 [00:02<00:18, 13.64it/s][A
Training:  11%|█         | 31/280 [00:03<00:19, 12.56it/s][A
Training:  12%|█▏        | 33/280 [00:03<00:19, 12.99it/s][A
Training:  12%|█▎        | 35/280 [00:03<00:23, 10.54it/s][A
Training:  14%|█▎   

Epoch: 10/43 - Loss: 2.3589 - Accuracy: 0.9286



  0%|          | 0/35 [00:00<?, ?it/s][A
  3%|▎         | 1/35 [00:00<00:22,  1.48it/s][A
  6%|▌         | 2/35 [00:00<00:11,  2.78it/s][A
 14%|█▍        | 5/35 [00:01<00:04,  6.43it/s][A
 23%|██▎       | 8/35 [00:01<00:02,  9.47it/s][A
 29%|██▊       | 10/35 [00:01<00:02,  9.55it/s][A
 34%|███▍      | 12/35 [00:01<00:02, 11.37it/s][A
 40%|████      | 14/35 [00:01<00:01, 10.90it/s][A
 46%|████▌     | 16/35 [00:01<00:01, 11.23it/s][A
 51%|█████▏    | 18/35 [00:02<00:01, 12.56it/s][A
 57%|█████▋    | 20/35 [00:02<00:01, 11.07it/s][A
 63%|██████▎   | 22/35 [00:02<00:01, 12.77it/s][A
 69%|██████▊   | 24/35 [00:02<00:00, 11.26it/s][A
 80%|████████  | 28/35 [00:02<00:00, 12.94it/s][A
 86%|████████▌ | 30/35 [00:02<00:00, 12.96it/s][A
 91%|█████████▏| 32/35 [00:03<00:00, 13.32it/s][A
100%|██████████| 35/35 [00:03<00:00, 10.06it/s][A
Epochs:  23%|██▎       | 10/43 [04:27<14:44, 26.79s/it]

Val Loss: 2.3056 - Val Accuracy: 0.9371



Training:   0%|          | 0/280 [00:00<?, ?it/s][A
Training:   0%|          | 1/280 [00:00<03:01,  1.54it/s][A
Training:   2%|▏         | 5/280 [00:00<00:45,  6.03it/s][A
Training:   3%|▎         | 8/280 [00:01<00:29,  9.30it/s][A
Training:   4%|▎         | 10/280 [00:01<00:27,  9.66it/s][A
Training:   5%|▍         | 13/280 [00:01<00:23, 11.37it/s][A
Training:   6%|▌         | 17/280 [00:01<00:19, 13.45it/s][A
Training:   7%|▋         | 20/280 [00:01<00:16, 16.20it/s][A
Training:   8%|▊         | 22/280 [00:02<00:18, 13.98it/s][A
Training:   9%|▉         | 25/280 [00:02<00:18, 14.06it/s][A
Training:  10%|▉         | 27/280 [00:02<00:16, 15.01it/s][A
Training:  10%|█         | 29/280 [00:02<00:16, 15.12it/s][A
Training:  11%|█         | 31/280 [00:02<00:18, 13.73it/s][A
Training:  12%|█▏        | 33/280 [00:02<00:18, 13.63it/s][A
Training:  12%|█▎        | 35/280 [00:03<00:21, 11.47it/s][A
Training:  14%|█▎        | 38/280 [00:03<00:19, 12.65it/s][A
Training:  14%|█▍  

Epoch: 11/43 - Loss: 2.2239 - Accuracy: 0.9293



  0%|          | 0/35 [00:00<?, ?it/s][A
  3%|▎         | 1/35 [00:00<00:19,  1.75it/s][A
 11%|█▏        | 4/35 [00:00<00:04,  7.01it/s][A
 17%|█▋        | 6/35 [00:00<00:03,  7.88it/s][A
 26%|██▌       | 9/35 [00:01<00:02, 11.15it/s][A
 31%|███▏      | 11/35 [00:01<00:02, 11.34it/s][A
 37%|███▋      | 13/35 [00:01<00:01, 12.74it/s][A
 43%|████▎     | 15/35 [00:01<00:01, 12.47it/s][A
 51%|█████▏    | 18/35 [00:01<00:01, 11.29it/s][A
 60%|██████    | 21/35 [00:01<00:00, 14.17it/s][A
 66%|██████▌   | 23/35 [00:02<00:00, 12.09it/s][A
 74%|███████▍  | 26/35 [00:02<00:00, 12.47it/s][A
 86%|████████▌ | 30/35 [00:02<00:00, 13.54it/s][A
100%|██████████| 35/35 [00:03<00:00, 11.34it/s][A
Epochs:  26%|██▌       | 11/43 [04:54<14:13, 26.67s/it]

Val Loss: 2.1187 - Val Accuracy: 0.9399



Training:   0%|          | 0/280 [00:00<?, ?it/s][A
Training:   0%|          | 1/280 [00:00<03:21,  1.38it/s][A
Training:   2%|▏         | 5/280 [00:01<00:47,  5.74it/s][A
Training:   3%|▎         | 8/280 [00:01<00:29,  9.18it/s][A
Training:   4%|▎         | 10/280 [00:01<00:32,  8.38it/s][A
Training:   5%|▍         | 13/280 [00:01<00:28,  9.24it/s][A
Training:   6%|▌         | 16/280 [00:01<00:21, 12.20it/s][A
Training:   6%|▋         | 18/280 [00:02<00:24, 10.85it/s][A
Training:   8%|▊         | 21/280 [00:02<00:25, 10.13it/s][A
Training:   9%|▉         | 25/280 [00:02<00:23, 10.63it/s][A
Training:  10%|█         | 28/280 [00:02<00:19, 12.63it/s][A
Training:  11%|█         | 30/280 [00:03<00:21, 11.77it/s][A
Training:  12%|█▏        | 33/280 [00:03<00:23, 10.54it/s][A
Training:  13%|█▎        | 37/280 [00:03<00:22, 10.71it/s][A
Training:  15%|█▍        | 41/280 [00:04<00:22, 10.84it/s][A
Training:  16%|█▌        | 44/280 [00:04<00:18, 12.48it/s][A
Training:  16%|█▋  

Epoch: 12/43 - Loss: 2.2034 - Accuracy: 0.9311



  0%|          | 0/35 [00:00<?, ?it/s][A
  3%|▎         | 1/35 [00:00<00:25,  1.35it/s][A
 14%|█▍        | 5/35 [00:01<00:05,  5.69it/s][A
 26%|██▌       | 9/35 [00:01<00:03,  8.27it/s][A
 37%|███▋      | 13/35 [00:01<00:02, 10.17it/s][A
 49%|████▊     | 17/35 [00:01<00:01, 11.91it/s][A
 60%|██████    | 21/35 [00:02<00:01, 12.63it/s][A
 69%|██████▊   | 24/35 [00:02<00:00, 14.30it/s][A
 74%|███████▍  | 26/35 [00:02<00:00, 14.91it/s][A
 80%|████████  | 28/35 [00:02<00:00, 14.65it/s][A
 89%|████████▊ | 31/35 [00:02<00:00, 16.16it/s][A
100%|██████████| 35/35 [00:02<00:00, 11.91it/s][A
Epochs:  28%|██▊       | 12/43 [05:20<13:44, 26.59s/it]

Val Loss: 2.1816 - Val Accuracy: 0.9399



Training:   0%|          | 0/280 [00:00<?, ?it/s][A
Training:   0%|          | 1/280 [00:00<02:53,  1.61it/s][A
Training:   2%|▏         | 5/280 [00:00<00:46,  5.93it/s][A
Training:   2%|▏         | 6/280 [00:01<00:42,  6.50it/s][A
Training:   3%|▎         | 8/280 [00:01<00:31,  8.61it/s][A
Training:   4%|▎         | 10/280 [00:01<00:36,  7.43it/s][A
Training:   5%|▍         | 13/280 [00:01<00:27,  9.65it/s][A
Training:   5%|▌         | 15/280 [00:01<00:25, 10.58it/s][A
Training:   6%|▌         | 17/280 [00:02<00:27,  9.61it/s][A
Training:   7%|▋         | 20/280 [00:02<00:20, 12.68it/s][A
Training:   8%|▊         | 22/280 [00:02<00:26,  9.79it/s][A
Training:   9%|▉         | 25/280 [00:02<00:20, 12.37it/s][A
Training:  10%|▉         | 27/280 [00:02<00:22, 11.03it/s][A
Training:  10%|█         | 29/280 [00:03<00:20, 12.44it/s][A
Training:  11%|█         | 31/280 [00:03<00:20, 12.43it/s][A
Training:  12%|█▏        | 34/280 [00:03<00:21, 11.68it/s][A
Training:  13%|█▎   

Epoch: 13/43 - Loss: 2.2399 - Accuracy: 0.9303



  0%|          | 0/35 [00:00<?, ?it/s][A
  3%|▎         | 1/35 [00:00<00:24,  1.39it/s][A
 11%|█▏        | 4/35 [00:00<00:05,  5.65it/s][A
 17%|█▋        | 6/35 [00:00<00:03,  8.04it/s][A
 26%|██▌       | 9/35 [00:01<00:03,  8.14it/s][A
 37%|███▋      | 13/35 [00:01<00:02,  9.10it/s][A
 49%|████▊     | 17/35 [00:02<00:01,  9.93it/s][A
 60%|██████    | 21/35 [00:02<00:01, 10.94it/s][A
 71%|███████▏  | 25/35 [00:02<00:00, 11.06it/s][A
 83%|████████▎ | 29/35 [00:03<00:00, 11.09it/s][A
100%|██████████| 35/35 [00:03<00:00, 10.10it/s][A
Epochs:  30%|███       | 13/43 [05:47<13:22, 26.76s/it]

Val Loss: 2.2642 - Val Accuracy: 0.9318



Training:   0%|          | 0/280 [00:00<?, ?it/s][A
Training:   0%|          | 1/280 [00:00<03:10,  1.46it/s][A
Training:   2%|▏         | 5/280 [00:00<00:45,  6.02it/s][A
Training:   3%|▎         | 9/280 [00:01<00:30,  8.84it/s][A
Training:   5%|▍         | 13/280 [00:01<00:24, 10.96it/s][A
Training:   6%|▌         | 17/280 [00:01<00:20, 12.57it/s][A
Training:   8%|▊         | 21/280 [00:02<00:19, 13.16it/s][A
Training:   9%|▉         | 25/280 [00:02<00:18, 13.43it/s][A
Training:  10%|█         | 28/280 [00:02<00:16, 15.37it/s][A
Training:  11%|█         | 30/280 [00:02<00:20, 12.47it/s][A
Training:  12%|█▏        | 33/280 [00:03<00:21, 11.73it/s][A
Training:  13%|█▎        | 36/280 [00:03<00:17, 13.71it/s][A
Training:  14%|█▎        | 38/280 [00:03<00:18, 13.20it/s][A
Training:  14%|█▍        | 40/280 [00:03<00:18, 12.90it/s][A
Training:  15%|█▌        | 42/280 [00:03<00:16, 14.17it/s][A
Training:  16%|█▌        | 44/280 [00:03<00:18, 12.68it/s][A
Training:  16%|█▋  

Epoch: 14/43 - Loss: 2.2814 - Accuracy: 0.9271



  0%|          | 0/35 [00:00<?, ?it/s][A
  3%|▎         | 1/35 [00:00<00:20,  1.63it/s][A
  6%|▌         | 2/35 [00:00<00:10,  3.07it/s][A
 11%|█▏        | 4/35 [00:00<00:04,  6.32it/s][A
 17%|█▋        | 6/35 [00:01<00:03,  7.51it/s][A
 23%|██▎       | 8/35 [00:01<00:03,  8.94it/s][A
 29%|██▊       | 10/35 [00:01<00:02,  9.34it/s][A
 34%|███▍      | 12/35 [00:01<00:02, 10.97it/s][A
 40%|████      | 14/35 [00:01<00:01, 11.51it/s][A
 46%|████▌     | 16/35 [00:01<00:01, 12.78it/s][A
 51%|█████▏    | 18/35 [00:02<00:01, 11.24it/s][A
 57%|█████▋    | 20/35 [00:02<00:01, 12.72it/s][A
 63%|██████▎   | 22/35 [00:02<00:00, 13.42it/s][A
 69%|██████▊   | 24/35 [00:02<00:00, 12.28it/s][A
 74%|███████▍  | 26/35 [00:02<00:00, 13.24it/s][A
 80%|████████  | 28/35 [00:02<00:00, 11.58it/s][A
 89%|████████▊ | 31/35 [00:03<00:00, 11.40it/s][A
100%|██████████| 35/35 [00:03<00:00, 10.27it/s][A
Epochs:  33%|███▎      | 14/43 [06:14<12:54, 26.72s/it]

Val Loss: 2.3249 - Val Accuracy: 0.9008



Training:   0%|          | 0/280 [00:00<?, ?it/s][A
Training:   0%|          | 1/280 [00:00<03:21,  1.39it/s][A
Training:   1%|          | 3/280 [00:00<01:02,  4.44it/s][A
Training:   2%|▏         | 5/280 [00:01<00:48,  5.69it/s][A
Training:   3%|▎         | 8/280 [00:01<00:27,  9.83it/s][A
Training:   4%|▎         | 10/280 [00:01<00:28,  9.61it/s][A
Training:   5%|▍         | 13/280 [00:01<00:26, 10.17it/s][A
Training:   6%|▌         | 16/280 [00:01<00:19, 13.47it/s][A
Training:   6%|▋         | 18/280 [00:02<00:22, 11.46it/s][A
Training:   8%|▊         | 21/280 [00:02<00:21, 11.84it/s][A
Training:   9%|▊         | 24/280 [00:02<00:17, 14.68it/s][A
Training:   9%|▉         | 26/280 [00:02<00:20, 12.21it/s][A
Training:  10%|█         | 29/280 [00:02<00:22, 11.11it/s][A
Training:  12%|█▏        | 33/280 [00:03<00:19, 12.61it/s][A
Training:  13%|█▎        | 37/280 [00:03<00:16, 14.72it/s][A
Training:  15%|█▍        | 41/280 [00:03<00:15, 15.59it/s][A
Training:  15%|█▌   

Epoch: 15/43 - Loss: 2.1861 - Accuracy: 0.9334



  0%|          | 0/35 [00:00<?, ?it/s][A
  3%|▎         | 1/35 [00:00<00:19,  1.75it/s][A
 14%|█▍        | 5/35 [00:00<00:04,  6.82it/s][A
 26%|██▌       | 9/35 [00:01<00:02,  8.90it/s][A
 37%|███▋      | 13/35 [00:01<00:02,  9.66it/s][A
 49%|████▊     | 17/35 [00:01<00:01, 10.35it/s][A
 60%|██████    | 21/35 [00:02<00:01, 11.56it/s][A
 69%|██████▊   | 24/35 [00:02<00:00, 13.89it/s][A
 74%|███████▍  | 26/35 [00:02<00:00, 13.47it/s][A
 80%|████████  | 28/35 [00:02<00:00, 13.20it/s][A
 86%|████████▌ | 30/35 [00:02<00:00, 12.29it/s][A
 91%|█████████▏| 32/35 [00:02<00:00, 13.44it/s][A
100%|██████████| 35/35 [00:03<00:00, 10.99it/s][A
Epochs:  35%|███▍      | 15/43 [06:41<12:26, 26.67s/it]

Val Loss: 2.4475 - Val Accuracy: 0.8613



Training:   0%|          | 0/280 [00:00<?, ?it/s][A
Training:   0%|          | 1/280 [00:00<02:41,  1.72it/s][A
Training:   2%|▏         | 5/280 [00:00<00:39,  7.02it/s][A
Training:   3%|▎         | 9/280 [00:01<00:26, 10.22it/s][A
Training:   4%|▍         | 12/280 [00:01<00:20, 13.05it/s][A
Training:   5%|▌         | 14/280 [00:01<00:24, 10.90it/s][A
Training:   6%|▌         | 17/280 [00:01<00:25, 10.25it/s][A
Training:   8%|▊         | 21/280 [00:02<00:23, 10.87it/s][A
Training:   9%|▉         | 25/280 [00:02<00:23, 10.99it/s][A
Training:  10%|█         | 29/280 [00:02<00:23, 10.79it/s][A
Training:  12%|█▏        | 33/280 [00:03<00:21, 11.28it/s][A
Training:  13%|█▎        | 36/280 [00:03<00:18, 13.18it/s][A
Training:  14%|█▎        | 38/280 [00:03<00:22, 10.67it/s][A
Training:  15%|█▍        | 41/280 [00:03<00:19, 12.55it/s][A
Training:  15%|█▌        | 43/280 [00:03<00:19, 12.40it/s][A
Training:  16%|█▌        | 45/280 [00:04<00:17, 13.21it/s][A
Training:  17%|█▋  

Epoch: 16/43 - Loss: 2.1257 - Accuracy: 0.9332



  0%|          | 0/35 [00:00<?, ?it/s][A
  3%|▎         | 1/35 [00:00<00:23,  1.45it/s][A
 14%|█▍        | 5/35 [00:00<00:04,  6.16it/s][A
 20%|██        | 7/35 [00:01<00:03,  8.01it/s][A
 26%|██▌       | 9/35 [00:01<00:03,  7.75it/s][A
 31%|███▏      | 11/35 [00:01<00:02,  9.16it/s][A
 37%|███▋      | 13/35 [00:01<00:02,  9.50it/s][A
 43%|████▎     | 15/35 [00:01<00:02,  9.93it/s][A
 49%|████▊     | 17/35 [00:02<00:01, 10.25it/s][A
 54%|█████▍    | 19/35 [00:02<00:01, 11.29it/s][A
 60%|██████    | 21/35 [00:02<00:01, 10.68it/s][A
 71%|███████▏  | 25/35 [00:02<00:00, 11.90it/s][A
 77%|███████▋  | 27/35 [00:02<00:00, 12.98it/s][A
 83%|████████▎ | 29/35 [00:02<00:00, 12.44it/s][A
100%|██████████| 35/35 [00:03<00:00, 10.00it/s][A
Epochs:  37%|███▋      | 16/43 [07:07<11:59, 26.66s/it]

Val Loss: 2.6586 - Val Accuracy: 0.9272



Training:   0%|          | 0/280 [00:00<?, ?it/s][A
Training:   0%|          | 1/280 [00:00<03:01,  1.54it/s][A
Training:   1%|▏         | 4/280 [00:00<00:43,  6.32it/s][A
Training:   2%|▏         | 6/280 [00:00<00:34,  7.86it/s][A
Training:   3%|▎         | 9/280 [00:01<00:29,  9.09it/s][A
Training:   4%|▍         | 11/280 [00:01<00:24, 10.93it/s][A
Training:   5%|▍         | 13/280 [00:01<00:27,  9.77it/s][A
Training:   6%|▌         | 16/280 [00:01<00:20, 13.15it/s][A
Training:   6%|▋         | 18/280 [00:01<00:21, 12.39it/s][A
Training:   8%|▊         | 21/280 [00:02<00:21, 12.02it/s][A
Training:   9%|▊         | 24/280 [00:02<00:17, 14.53it/s][A
Training:   9%|▉         | 26/280 [00:02<00:18, 13.38it/s][A
Training:  10%|█         | 29/280 [00:02<00:20, 12.11it/s][A
Training:  11%|█         | 31/280 [00:02<00:18, 13.22it/s][A
Training:  12%|█▏        | 33/280 [00:03<00:18, 13.13it/s][A
Training:  12%|█▎        | 35/280 [00:03<00:19, 12.45it/s][A
Training:  13%|█▎   

Epoch: 17/43 - Loss: 2.1556 - Accuracy: 0.9309



  0%|          | 0/35 [00:00<?, ?it/s][A
  3%|▎         | 1/35 [00:00<00:26,  1.27it/s][A
 14%|█▍        | 5/35 [00:01<00:05,  5.62it/s][A
 26%|██▌       | 9/35 [00:01<00:03,  7.70it/s][A
 37%|███▋      | 13/35 [00:01<00:02,  8.75it/s][A
 49%|████▊     | 17/35 [00:02<00:01, 10.27it/s][A
 60%|██████    | 21/35 [00:02<00:01, 10.66it/s][A
 71%|███████▏  | 25/35 [00:02<00:00, 11.47it/s][A
 83%|████████▎ | 29/35 [00:03<00:00, 11.75it/s][A
100%|██████████| 35/35 [00:03<00:00,  9.85it/s][A
Epochs:  40%|███▉      | 17/43 [07:34<11:35, 26.75s/it]

Val Loss: 2.2673 - Val Accuracy: 0.9417



Training:   0%|          | 0/280 [00:00<?, ?it/s][A
Training:   0%|          | 1/280 [00:00<03:56,  1.18it/s][A
Training:   1%|          | 3/280 [00:00<01:12,  3.82it/s][A
Training:   2%|▏         | 5/280 [00:01<00:44,  6.15it/s][A
Training:   3%|▎         | 9/280 [00:01<00:31,  8.70it/s][A
Training:   4%|▍         | 12/280 [00:01<00:23, 11.62it/s][A
Training:   5%|▌         | 14/280 [00:01<00:25, 10.38it/s][A
Training:   6%|▌         | 17/280 [00:02<00:25, 10.25it/s][A
Training:   7%|▋         | 20/280 [00:02<00:20, 12.70it/s][A
Training:   8%|▊         | 22/280 [00:02<00:23, 10.87it/s][A
Training:   9%|▉         | 25/280 [00:02<00:21, 11.95it/s][A
Training:  10%|█         | 28/280 [00:02<00:17, 14.61it/s][A
Training:  11%|█         | 30/280 [00:03<00:20, 12.25it/s][A
Training:  11%|█▏        | 32/280 [00:03<00:18, 13.33it/s][A
Training:  12%|█▏        | 34/280 [00:03<00:20, 12.03it/s][A
Training:  13%|█▎        | 36/280 [00:03<00:18, 13.36it/s][A
Training:  14%|█▎   

Epoch: 18/43 - Loss: 2.1898 - Accuracy: 0.9319



  0%|          | 0/35 [00:00<?, ?it/s][A
  3%|▎         | 1/35 [00:00<00:26,  1.29it/s][A
 14%|█▍        | 5/35 [00:01<00:05,  5.68it/s][A
 26%|██▌       | 9/35 [00:01<00:03,  8.33it/s][A
 37%|███▋      | 13/35 [00:01<00:02,  9.50it/s][A
 49%|████▊     | 17/35 [00:01<00:01, 11.04it/s][A
 54%|█████▍    | 19/35 [00:02<00:01, 12.13it/s][A
 60%|██████    | 21/35 [00:02<00:01, 11.42it/s][A
 66%|██████▌   | 23/35 [00:02<00:01, 11.49it/s][A
 71%|███████▏  | 25/35 [00:02<00:00, 12.02it/s][A
 77%|███████▋  | 27/35 [00:02<00:00, 11.89it/s][A
 83%|████████▎ | 29/35 [00:02<00:00, 13.05it/s][A
 89%|████████▊ | 31/35 [00:03<00:00, 11.25it/s][A
 94%|█████████▍| 33/35 [00:03<00:00, 12.88it/s][A
100%|██████████| 35/35 [00:03<00:00,  9.77it/s][A
Epochs:  42%|████▏     | 18/43 [08:01<11:08, 26.76s/it]

Val Loss: 2.1235 - Val Accuracy: 0.9428



Training:   0%|          | 0/280 [00:00<?, ?it/s][A
Training:   0%|          | 1/280 [00:00<02:15,  2.05it/s][A
Training:   1%|          | 3/280 [00:00<00:47,  5.85it/s][A
Training:   2%|▏         | 5/280 [00:00<00:30,  8.96it/s][A
Training:   2%|▎         | 7/280 [00:00<00:24, 11.02it/s][A
Training:   3%|▎         | 9/280 [00:01<00:23, 11.65it/s][A
Training:   4%|▍         | 11/280 [00:01<00:23, 11.60it/s][A
Training:   5%|▍         | 13/280 [00:01<00:19, 13.47it/s][A
Training:   5%|▌         | 15/280 [00:01<00:24, 10.87it/s][A
Training:   6%|▌         | 17/280 [00:01<00:21, 12.52it/s][A
Training:   7%|▋         | 19/280 [00:01<00:25, 10.35it/s][A
Training:   8%|▊         | 21/280 [00:02<00:21, 12.15it/s][A
Training:   8%|▊         | 23/280 [00:02<00:23, 10.95it/s][A
Training:   9%|▉         | 25/280 [00:02<00:20, 12.21it/s][A
Training:  10%|▉         | 27/280 [00:02<00:24, 10.33it/s][A
Training:  11%|█         | 30/280 [00:02<00:25,  9.97it/s][A
Training:  12%|█▏    

Epoch: 19/43 - Loss: 2.2107 - Accuracy: 0.9293



  0%|          | 0/35 [00:00<?, ?it/s][A
  3%|▎         | 1/35 [00:00<00:23,  1.44it/s][A
 14%|█▍        | 5/35 [00:00<00:04,  6.11it/s][A
 20%|██        | 7/35 [00:01<00:03,  7.79it/s][A
 26%|██▌       | 9/35 [00:01<00:03,  8.42it/s][A
 37%|███▋      | 13/35 [00:01<00:02,  9.64it/s][A
 46%|████▌     | 16/35 [00:01<00:01, 12.37it/s][A
 51%|█████▏    | 18/35 [00:02<00:01, 11.00it/s][A
 60%|██████    | 21/35 [00:02<00:01, 11.34it/s][A
 66%|██████▌   | 23/35 [00:02<00:00, 12.29it/s][A
 71%|███████▏  | 25/35 [00:02<00:00, 12.60it/s][A
 77%|███████▋  | 27/35 [00:02<00:00, 12.82it/s][A
 83%|████████▎ | 29/35 [00:02<00:00, 12.25it/s][A
100%|██████████| 35/35 [00:03<00:00, 10.21it/s][A
Epochs:  44%|████▍     | 19/43 [08:28<10:40, 26.70s/it]

Val Loss: 2.3675 - Val Accuracy: 0.9382



Training:   0%|          | 0/280 [00:00<?, ?it/s][A
Training:   0%|          | 1/280 [00:00<02:47,  1.66it/s][A
Training:   1%|          | 3/280 [00:00<00:54,  5.05it/s][A
Training:   2%|▏         | 5/280 [00:00<00:34,  7.95it/s][A
Training:   2%|▎         | 7/280 [00:01<00:31,  8.70it/s][A
Training:   3%|▎         | 9/280 [00:01<00:26, 10.12it/s][A
Training:   4%|▍         | 11/280 [00:01<00:23, 11.37it/s][A
Training:   5%|▍         | 13/280 [00:01<00:23, 11.52it/s][A
Training:   5%|▌         | 15/280 [00:01<00:23, 11.48it/s][A
Training:   6%|▌         | 17/280 [00:01<00:21, 12.21it/s][A
Training:   7%|▋         | 19/280 [00:02<00:23, 11.22it/s][A
Training:   8%|▊         | 21/280 [00:02<00:21, 12.30it/s][A
Training:   8%|▊         | 23/280 [00:02<00:24, 10.56it/s][A
Training:   9%|▉         | 25/280 [00:02<00:21, 12.01it/s][A
Training:  10%|▉         | 27/280 [00:02<00:23, 10.81it/s][A
Training:  11%|█         | 30/280 [00:03<00:24, 10.19it/s][A
Training:  12%|█▏    

Epoch: 20/43 - Loss: 2.1091 - Accuracy: 0.9353



  0%|          | 0/35 [00:00<?, ?it/s][A
  3%|▎         | 1/35 [00:00<00:26,  1.26it/s][A
  9%|▊         | 3/35 [00:00<00:07,  4.02it/s][A
 14%|█▍        | 5/35 [00:01<00:04,  6.57it/s][A
 23%|██▎       | 8/35 [00:01<00:02, 10.78it/s][A
 29%|██▊       | 10/35 [00:01<00:02,  8.96it/s][A
 37%|███▋      | 13/35 [00:01<00:02, 10.88it/s][A
 43%|████▎     | 15/35 [00:01<00:01, 10.85it/s][A
 49%|████▊     | 17/35 [00:01<00:01, 11.08it/s][A
 54%|█████▍    | 19/35 [00:02<00:01, 10.73it/s][A
 63%|██████▎   | 22/35 [00:02<00:01, 11.11it/s][A
 71%|███████▏  | 25/35 [00:02<00:00, 13.80it/s][A
 77%|███████▋  | 27/35 [00:02<00:00, 10.87it/s][A
 86%|████████▌ | 30/35 [00:03<00:00, 11.38it/s][A
 91%|█████████▏| 32/35 [00:03<00:00, 12.40it/s][A
100%|██████████| 35/35 [00:03<00:00,  9.73it/s][A
Epochs:  47%|████▋     | 20/43 [08:54<10:15, 26.76s/it]

Val Loss: 2.1029 - Val Accuracy: 0.9265



Training:   0%|          | 0/280 [00:00<?, ?it/s][A
Training:   0%|          | 1/280 [00:00<03:12,  1.45it/s][A
Training:   1%|          | 3/280 [00:00<01:01,  4.53it/s][A
Training:   2%|▏         | 5/280 [00:01<00:43,  6.36it/s][A
Training:   2%|▎         | 7/280 [00:01<00:30,  8.85it/s][A
Training:   3%|▎         | 9/280 [00:01<00:31,  8.53it/s][A
Training:   4%|▍         | 12/280 [00:01<00:22, 11.76it/s][A
Training:   5%|▌         | 14/280 [00:01<00:24, 10.93it/s][A
Training:   6%|▌         | 16/280 [00:01<00:23, 11.38it/s][A
Training:   6%|▋         | 18/280 [00:01<00:20, 12.82it/s][A
Training:   7%|▋         | 20/280 [00:02<00:19, 13.19it/s][A
Training:   8%|▊         | 22/280 [00:02<00:22, 11.60it/s][A
Training:   9%|▊         | 24/280 [00:02<00:20, 12.60it/s][A
Training:   9%|▉         | 26/280 [00:02<00:22, 11.47it/s][A
Training:  10%|█         | 28/280 [00:02<00:20, 12.49it/s][A
Training:  11%|█         | 30/280 [00:02<00:19, 12.94it/s][A
Training:  11%|█▏    

Epoch: 21/43 - Loss: 2.1199 - Accuracy: 0.9337



  0%|          | 0/35 [00:00<?, ?it/s][A
  3%|▎         | 1/35 [00:00<00:20,  1.63it/s][A
  9%|▊         | 3/35 [00:00<00:06,  5.05it/s][A
 14%|█▍        | 5/35 [00:00<00:04,  6.96it/s][A
 26%|██▌       | 9/35 [00:01<00:02,  9.31it/s][A
 34%|███▍      | 12/35 [00:01<00:01, 11.95it/s][A
 40%|████      | 14/35 [00:01<00:02,  9.88it/s][A
 49%|████▊     | 17/35 [00:01<00:01, 11.81it/s][A
 54%|█████▍    | 19/35 [00:01<00:01, 12.33it/s][A
 60%|██████    | 21/35 [00:02<00:01, 12.17it/s][A
 66%|██████▌   | 23/35 [00:02<00:01, 10.74it/s][A
 71%|███████▏  | 25/35 [00:02<00:00, 10.14it/s][A
 77%|███████▋  | 27/35 [00:02<00:00,  9.88it/s][A
 83%|████████▎ | 29/35 [00:02<00:00, 11.28it/s][A
 89%|████████▊ | 31/35 [00:03<00:00, 10.64it/s][A
 94%|█████████▍| 33/35 [00:03<00:00, 11.38it/s][A
100%|██████████| 35/35 [00:03<00:00,  9.80it/s][A
Epochs:  49%|████▉     | 21/43 [09:21<09:49, 26.81s/it]

Val Loss: 2.3424 - Val Accuracy: 0.9324



Training:   0%|          | 0/280 [00:00<?, ?it/s][A
Training:   0%|          | 1/280 [00:00<03:12,  1.45it/s][A
Training:   1%|          | 3/280 [00:00<01:00,  4.55it/s][A
Training:   2%|▏         | 6/280 [00:01<00:35,  7.78it/s][A
Training:   3%|▎         | 9/280 [00:01<00:28,  9.37it/s][A
Training:   4%|▍         | 11/280 [00:01<00:24, 10.79it/s][A
Training:   5%|▍         | 13/280 [00:01<00:22, 12.08it/s][A
Training:   5%|▌         | 15/280 [00:01<00:24, 10.84it/s][A
Training:   6%|▋         | 18/280 [00:01<00:18, 14.47it/s][A
Training:   7%|▋         | 20/280 [00:02<00:20, 12.48it/s][A
Training:   8%|▊         | 23/280 [00:02<00:25, 10.00it/s][A
Training:  10%|▉         | 27/280 [00:02<00:22, 11.39it/s][A
Training:  10%|█         | 29/280 [00:02<00:20, 12.53it/s][A
Training:  11%|█         | 31/280 [00:03<00:22, 11.24it/s][A
Training:  12%|█▎        | 35/280 [00:03<00:22, 10.94it/s][A
Training:  14%|█▎        | 38/280 [00:03<00:18, 13.40it/s][A
Training:  14%|█▍   

Epoch: 22/43 - Loss: 2.0905 - Accuracy: 0.9312



  0%|          | 0/35 [00:00<?, ?it/s][A
  3%|▎         | 1/35 [00:00<00:27,  1.24it/s][A
 11%|█▏        | 4/35 [00:00<00:05,  5.37it/s][A
 17%|█▋        | 6/35 [00:01<00:03,  7.27it/s][A
 26%|██▌       | 9/35 [00:01<00:03,  7.02it/s][A
 37%|███▋      | 13/35 [00:01<00:02,  9.01it/s][A
 46%|████▌     | 16/35 [00:01<00:01, 11.48it/s][A
 51%|█████▏    | 18/35 [00:02<00:01, 12.13it/s][A
 57%|█████▋    | 20/35 [00:02<00:01, 13.36it/s][A
 63%|██████▎   | 22/35 [00:02<00:01, 12.04it/s][A
 69%|██████▊   | 24/35 [00:02<00:00, 12.41it/s][A
 74%|███████▍  | 26/35 [00:02<00:00, 11.60it/s][A
 83%|████████▎ | 29/35 [00:03<00:00, 10.00it/s][A
 94%|█████████▍| 33/35 [00:03<00:00, 11.58it/s][A
100%|██████████| 35/35 [00:03<00:00,  9.76it/s][A
Epochs:  51%|█████     | 22/43 [09:48<09:22, 26.77s/it]

Val Loss: 2.1378 - Val Accuracy: 0.9370



Training:   0%|          | 0/280 [00:00<?, ?it/s][A
Training:   0%|          | 1/280 [00:00<04:22,  1.06it/s][A
Training:   2%|▏         | 5/280 [00:01<00:56,  4.87it/s][A
Training:   3%|▎         | 8/280 [00:01<00:33,  8.11it/s][A
Training:   4%|▎         | 10/280 [00:01<00:36,  7.39it/s][A
Training:   5%|▍         | 13/280 [00:01<00:27,  9.67it/s][A
Training:   5%|▌         | 15/280 [00:02<00:26,  9.99it/s][A
Training:   6%|▋         | 18/280 [00:02<00:27,  9.38it/s][A
Training:   8%|▊         | 21/280 [00:02<00:21, 11.86it/s][A
Training:   8%|▊         | 23/280 [00:02<00:25, 10.20it/s][A
Training:   9%|▉         | 26/280 [00:03<00:26,  9.66it/s][A
Training:  10%|█         | 29/280 [00:03<00:21, 11.92it/s][A
Training:  11%|█         | 31/280 [00:03<00:24, 10.05it/s][A
Training:  12%|█▏        | 34/280 [00:03<00:24,  9.97it/s][A
Training:  14%|█▎        | 38/280 [00:04<00:23, 10.46it/s][A
Training:  15%|█▌        | 42/280 [00:04<00:20, 11.45it/s][A
Training:  16%|█▌  

Epoch: 23/43 - Loss: 2.0251 - Accuracy: 0.9394



  0%|          | 0/35 [00:00<?, ?it/s][A
  3%|▎         | 1/35 [00:00<00:23,  1.48it/s][A
 14%|█▍        | 5/35 [00:01<00:05,  5.46it/s][A
 26%|██▌       | 9/35 [00:01<00:03,  8.38it/s][A
 37%|███▋      | 13/35 [00:01<00:02,  9.27it/s][A
 49%|████▊     | 17/35 [00:02<00:01,  9.19it/s][A
 60%|██████    | 21/35 [00:02<00:01, 10.07it/s][A
 66%|██████▌   | 23/35 [00:02<00:01, 10.72it/s][A
 71%|███████▏  | 25/35 [00:02<00:00, 10.95it/s][A
 83%|████████▎ | 29/35 [00:03<00:00, 11.75it/s][A
100%|██████████| 35/35 [00:03<00:00,  9.91it/s][A
Epochs:  53%|█████▎    | 23/43 [10:15<08:55, 26.76s/it]

Val Loss: 2.4617 - Val Accuracy: 0.9330



Training:   0%|          | 0/280 [00:00<?, ?it/s][A
Training:   0%|          | 1/280 [00:00<03:28,  1.34it/s][A
Training:   1%|          | 3/280 [00:00<01:04,  4.28it/s][A
Training:   2%|▏         | 5/280 [00:01<00:54,  5.08it/s][A
Training:   3%|▎         | 8/280 [00:01<00:31,  8.59it/s][A
Training:   4%|▎         | 10/280 [00:01<00:30,  8.99it/s][A
Training:   5%|▍         | 13/280 [00:01<00:26, 10.19it/s][A
Training:   6%|▌         | 16/280 [00:01<00:20, 12.85it/s][A
Training:   6%|▋         | 18/280 [00:02<00:21, 12.10it/s][A
Training:   8%|▊         | 21/280 [00:02<00:25, 10.25it/s][A
Training:   9%|▊         | 24/280 [00:02<00:19, 13.00it/s][A
Training:   9%|▉         | 26/280 [00:02<00:22, 11.20it/s][A
Training:  10%|█         | 29/280 [00:03<00:22, 11.38it/s][A
Training:  12%|█▏        | 33/280 [00:03<00:22, 11.10it/s][A
Training:  13%|█▎        | 37/280 [00:03<00:20, 11.67it/s][A
Training:  15%|█▍        | 41/280 [00:04<00:20, 11.82it/s][A
Training:  16%|█▌   

Epoch: 24/43 - Loss: 2.0666 - Accuracy: 0.9355



  0%|          | 0/35 [00:00<?, ?it/s][A
  3%|▎         | 1/35 [00:00<00:22,  1.52it/s][A
 11%|█▏        | 4/35 [00:00<00:05,  5.88it/s][A
 17%|█▋        | 6/35 [00:00<00:03,  7.70it/s][A
 23%|██▎       | 8/35 [00:01<00:02,  9.67it/s][A
 29%|██▊       | 10/35 [00:01<00:03,  8.33it/s][A
 37%|███▋      | 13/35 [00:01<00:02,  8.77it/s][A
 49%|████▊     | 17/35 [00:02<00:01, 10.34it/s][A
 54%|█████▍    | 19/35 [00:02<00:01, 11.22it/s][A
 60%|██████    | 21/35 [00:02<00:01, 10.73it/s][A
 69%|██████▊   | 24/35 [00:02<00:00, 13.32it/s][A
 74%|███████▍  | 26/35 [00:02<00:00, 12.11it/s][A
 83%|████████▎ | 29/35 [00:03<00:00, 11.07it/s][A
100%|██████████| 35/35 [00:03<00:00,  9.84it/s][A
Epochs:  56%|█████▌    | 24/43 [10:41<08:28, 26.76s/it]

Val Loss: 2.1089 - Val Accuracy: 0.9376



Training:   0%|          | 0/280 [00:00<?, ?it/s][A
Training:   0%|          | 1/280 [00:00<03:40,  1.27it/s][A
Training:   2%|▏         | 5/280 [00:01<00:48,  5.68it/s][A
Training:   2%|▏         | 6/280 [00:01<00:45,  6.06it/s][A
Training:   3%|▎         | 8/280 [00:01<00:35,  7.60it/s][A
Training:   3%|▎         | 9/280 [00:01<00:36,  7.39it/s][A
Training:   4%|▍         | 12/280 [00:01<00:25, 10.50it/s][A
Training:   5%|▌         | 14/280 [00:01<00:23, 11.36it/s][A
Training:   6%|▌         | 16/280 [00:01<00:21, 12.34it/s][A
Training:   6%|▋         | 18/280 [00:02<00:22, 11.69it/s][A
Training:   8%|▊         | 21/280 [00:02<00:20, 12.35it/s][A
Training:   8%|▊         | 23/280 [00:02<00:21, 11.83it/s][A
Training:   9%|▉         | 25/280 [00:02<00:19, 12.95it/s][A
Training:  10%|▉         | 27/280 [00:02<00:19, 13.02it/s][A
Training:  10%|█         | 29/280 [00:02<00:20, 12.32it/s][A
Training:  11%|█         | 31/280 [00:03<00:18, 13.64it/s][A
Training:  12%|█▏    

Epoch: 25/43 - Loss: 2.0227 - Accuracy: 0.9390



  0%|          | 0/35 [00:00<?, ?it/s][A
  3%|▎         | 1/35 [00:00<00:24,  1.37it/s][A
  6%|▌         | 2/35 [00:00<00:12,  2.62it/s][A
 14%|█▍        | 5/35 [00:00<00:04,  7.27it/s][A
 20%|██        | 7/35 [00:01<00:03,  7.80it/s][A
 26%|██▌       | 9/35 [00:01<00:02,  9.47it/s][A
 31%|███▏      | 11/35 [00:01<00:02,  9.23it/s][A
 37%|███▋      | 13/35 [00:01<00:02, 10.21it/s][A
 43%|████▎     | 15/35 [00:01<00:02,  9.82it/s][A
 49%|████▊     | 17/35 [00:02<00:01, 10.51it/s][A
 54%|█████▍    | 19/35 [00:02<00:01, 11.42it/s][A
 60%|██████    | 21/35 [00:02<00:01, 11.23it/s][A
 66%|██████▌   | 23/35 [00:02<00:01, 11.31it/s][A
 71%|███████▏  | 25/35 [00:02<00:00, 10.27it/s][A
 77%|███████▋  | 27/35 [00:02<00:00, 12.00it/s][A
 83%|████████▎ | 29/35 [00:03<00:00, 10.25it/s][A
100%|██████████| 35/35 [00:03<00:00,  9.54it/s][A
Epochs:  58%|█████▊    | 25/43 [11:08<08:02, 26.81s/it]

Val Loss: 2.2952 - Val Accuracy: 0.9003



Training:   0%|          | 0/280 [00:00<?, ?it/s][A
Training:   0%|          | 1/280 [00:00<02:58,  1.56it/s][A
Training:   1%|          | 3/280 [00:00<00:58,  4.77it/s][A
Training:   2%|▏         | 5/280 [00:00<00:43,  6.28it/s][A
Training:   2%|▎         | 7/280 [00:01<00:32,  8.42it/s][A
Training:   3%|▎         | 9/280 [00:01<00:35,  7.74it/s][A
Training:   4%|▍         | 12/280 [00:01<00:23, 11.25it/s][A
Training:   5%|▌         | 14/280 [00:01<00:24, 10.78it/s][A
Training:   6%|▌         | 17/280 [00:01<00:23, 11.34it/s][A
Training:   7%|▋         | 20/280 [00:02<00:17, 14.46it/s][A
Training:   8%|▊         | 22/280 [00:02<00:21, 11.85it/s][A
Training:   9%|▊         | 24/280 [00:02<00:19, 13.23it/s][A
Training:   9%|▉         | 26/280 [00:02<00:21, 11.72it/s][A
Training:  10%|█         | 28/280 [00:02<00:19, 13.03it/s][A
Training:  11%|█         | 30/280 [00:02<00:20, 12.01it/s][A
Training:  11%|█▏        | 32/280 [00:03<00:18, 13.50it/s][A
Training:  12%|█▏    

Epoch: 26/43 - Loss: 2.0575 - Accuracy: 0.9334



  0%|          | 0/35 [00:00<?, ?it/s][A
  3%|▎         | 1/35 [00:00<00:21,  1.57it/s][A
 14%|█▍        | 5/35 [00:00<00:04,  6.32it/s][A
 26%|██▌       | 9/35 [00:01<00:02,  9.88it/s][A
 37%|███▋      | 13/35 [00:01<00:01, 11.18it/s][A
 49%|████▊     | 17/35 [00:01<00:01, 12.41it/s][A
 60%|██████    | 21/35 [00:02<00:01, 12.62it/s][A
 71%|███████▏  | 25/35 [00:02<00:00, 12.57it/s][A
 83%|████████▎ | 29/35 [00:02<00:00, 12.71it/s][A
100%|██████████| 35/35 [00:03<00:00, 11.38it/s][A
Epochs:  60%|██████    | 26/43 [11:35<07:33, 26.66s/it]

Val Loss: 2.2299 - Val Accuracy: 0.9357



Training:   0%|          | 0/280 [00:00<?, ?it/s][A
Training:   0%|          | 1/280 [00:00<04:03,  1.15it/s][A
Training:   1%|▏         | 4/280 [00:00<00:53,  5.13it/s][A
Training:   2%|▏         | 6/280 [00:01<00:44,  6.18it/s][A
Training:   3%|▎         | 9/280 [00:01<00:33,  8.07it/s][A
Training:   5%|▍         | 13/280 [00:01<00:26,  9.92it/s][A
Training:   6%|▌         | 16/280 [00:01<00:20, 12.79it/s][A
Training:   6%|▋         | 18/280 [00:02<00:24, 10.84it/s][A
Training:   8%|▊         | 21/280 [00:02<00:21, 11.92it/s][A
Training:   9%|▊         | 24/280 [00:02<00:19, 12.85it/s][A
Training:   9%|▉         | 26/280 [00:02<00:19, 13.01it/s][A
Training:  10%|█         | 28/280 [00:02<00:19, 13.16it/s][A
Training:  11%|█         | 30/280 [00:02<00:18, 13.88it/s][A
Training:  11%|█▏        | 32/280 [00:03<00:18, 13.08it/s][A
Training:  12%|█▎        | 35/280 [00:03<00:15, 16.15it/s][A
Training:  13%|█▎        | 37/280 [00:03<00:22, 10.61it/s][A
Training:  14%|█▍   

Epoch: 27/43 - Loss: 2.0093 - Accuracy: 0.9398



  0%|          | 0/35 [00:00<?, ?it/s][A
  3%|▎         | 1/35 [00:00<00:22,  1.48it/s][A
 11%|█▏        | 4/35 [00:00<00:04,  6.35it/s][A
 17%|█▋        | 6/35 [00:01<00:04,  6.62it/s][A
 26%|██▌       | 9/35 [00:01<00:02,  8.72it/s][A
 31%|███▏      | 11/35 [00:01<00:02, 10.05it/s][A
 37%|███▋      | 13/35 [00:01<00:02,  9.50it/s][A
 46%|████▌     | 16/35 [00:01<00:01, 12.76it/s][A
 51%|█████▏    | 18/35 [00:02<00:01, 10.67it/s][A
 60%|██████    | 21/35 [00:02<00:01,  9.57it/s][A
 71%|███████▏  | 25/35 [00:02<00:00, 10.36it/s][A
 80%|████████  | 28/35 [00:02<00:00, 12.93it/s][A
 86%|████████▌ | 30/35 [00:03<00:00, 12.25it/s][A
100%|██████████| 35/35 [00:03<00:00,  9.92it/s][A
Epochs:  63%|██████▎   | 27/43 [12:02<07:07, 26.71s/it]

Val Loss: 2.2108 - Val Accuracy: 0.9071



Training:   0%|          | 0/280 [00:00<?, ?it/s][A
Training:   0%|          | 1/280 [00:00<02:57,  1.57it/s][A
Training:   1%|▏         | 4/280 [00:00<00:48,  5.65it/s][A
Training:   2%|▏         | 5/280 [00:00<00:46,  5.94it/s][A
Training:   3%|▎         | 8/280 [00:01<00:33,  8.18it/s][A
Training:   4%|▎         | 10/280 [00:01<00:28,  9.63it/s][A
Training:   4%|▍         | 12/280 [00:01<00:27,  9.67it/s][A
Training:   5%|▌         | 14/280 [00:01<00:24, 10.76it/s][A
Training:   6%|▌         | 16/280 [00:01<00:24, 10.96it/s][A
Training:   6%|▋         | 18/280 [00:02<00:20, 12.72it/s][A
Training:   7%|▋         | 20/280 [00:02<00:21, 12.35it/s][A
Training:   8%|▊         | 22/280 [00:02<00:19, 13.58it/s][A
Training:   9%|▊         | 24/280 [00:02<00:20, 12.29it/s][A
Training:   9%|▉         | 26/280 [00:02<00:19, 13.06it/s][A
Training:  10%|█         | 28/280 [00:02<00:20, 12.40it/s][A
Training:  11%|█         | 30/280 [00:02<00:19, 13.04it/s][A
Training:  11%|█▏   

Epoch: 28/43 - Loss: 2.0878 - Accuracy: 0.9314



  0%|          | 0/35 [00:00<?, ?it/s][A
  3%|▎         | 1/35 [00:00<00:20,  1.64it/s][A
 14%|█▍        | 5/35 [00:00<00:04,  6.43it/s][A
 20%|██        | 7/35 [00:01<00:03,  8.59it/s][A
 26%|██▌       | 9/35 [00:01<00:03,  8.65it/s][A
 31%|███▏      | 11/35 [00:01<00:02, 10.23it/s][A
 37%|███▋      | 13/35 [00:01<00:01, 11.40it/s][A
 43%|████▎     | 15/35 [00:01<00:01, 11.74it/s][A
 51%|█████▏    | 18/35 [00:01<00:01, 14.55it/s][A
 57%|█████▋    | 20/35 [00:01<00:01, 14.14it/s][A
 63%|██████▎   | 22/35 [00:02<00:00, 13.63it/s][A
 69%|██████▊   | 24/35 [00:02<00:00, 13.69it/s][A
 74%|███████▍  | 26/35 [00:02<00:00, 15.06it/s][A
 80%|████████  | 28/35 [00:02<00:00, 13.36it/s][A
 86%|████████▌ | 30/35 [00:02<00:00, 14.00it/s][A
 91%|█████████▏| 32/35 [00:02<00:00, 13.41it/s][A
100%|██████████| 35/35 [00:03<00:00, 10.83it/s][A
Epochs:  65%|██████▌   | 28/43 [12:28<06:40, 26.68s/it]

Val Loss: 2.2150 - Val Accuracy: 0.9387



Training:   0%|          | 0/280 [00:00<?, ?it/s][A
Training:   0%|          | 1/280 [00:00<03:03,  1.52it/s][A
Training:   1%|▏         | 4/280 [00:00<00:43,  6.36it/s][A
Training:   2%|▏         | 6/280 [00:00<00:31,  8.61it/s][A
Training:   3%|▎         | 8/280 [00:01<00:26, 10.41it/s][A
Training:   4%|▎         | 10/280 [00:01<00:27,  9.94it/s][A
Training:   4%|▍         | 12/280 [00:01<00:24, 10.98it/s][A
Training:   5%|▌         | 14/280 [00:01<00:27,  9.75it/s][A
Training:   6%|▌         | 16/280 [00:01<00:22, 11.50it/s][A
Training:   6%|▋         | 18/280 [00:01<00:25, 10.39it/s][A
Training:   7%|▋         | 20/280 [00:02<00:21, 11.85it/s][A
Training:   8%|▊         | 22/280 [00:02<00:21, 11.91it/s][A
Training:   9%|▊         | 24/280 [00:02<00:20, 12.49it/s][A
Training:   9%|▉         | 26/280 [00:02<00:19, 13.19it/s][A
Training:  10%|█         | 28/280 [00:02<00:18, 13.76it/s][A
Training:  11%|█         | 30/280 [00:02<00:20, 12.31it/s][A
Training:  12%|█▏   

Epoch: 29/43 - Loss: 2.0883 - Accuracy: 0.9338



  0%|          | 0/35 [00:00<?, ?it/s][A
  3%|▎         | 1/35 [00:00<00:27,  1.26it/s][A
 14%|█▍        | 5/35 [00:01<00:05,  5.13it/s][A
 26%|██▌       | 9/35 [00:01<00:03,  7.02it/s][A
 37%|███▋      | 13/35 [00:01<00:02,  8.65it/s][A
 46%|████▌     | 16/35 [00:01<00:01, 11.09it/s][A
 51%|█████▏    | 18/35 [00:02<00:01, 10.00it/s][A
 60%|██████    | 21/35 [00:02<00:01, 10.76it/s][A
 71%|███████▏  | 25/35 [00:02<00:00, 11.93it/s][A
 83%|████████▎ | 29/35 [00:03<00:00, 12.80it/s][A
100%|██████████| 35/35 [00:03<00:00, 10.14it/s][A
Epochs:  67%|██████▋   | 29/43 [12:55<06:12, 26.63s/it]

Val Loss: 2.4734 - Val Accuracy: 0.9128



Training:   0%|          | 0/280 [00:00<?, ?it/s][A
Training:   0%|          | 1/280 [00:00<03:02,  1.53it/s][A
Training:   1%|          | 3/280 [00:00<01:00,  4.61it/s][A
Training:   2%|▏         | 5/280 [00:00<00:40,  6.87it/s][A
Training:   2%|▎         | 7/280 [00:01<00:34,  8.03it/s][A
Training:   3%|▎         | 9/280 [00:01<00:32,  8.26it/s][A
Training:   5%|▍         | 13/280 [00:01<00:26, 10.17it/s][A
Training:   6%|▌         | 16/280 [00:01<00:20, 12.91it/s][A
Training:   6%|▋         | 18/280 [00:02<00:23, 11.09it/s][A
Training:   8%|▊         | 21/280 [00:02<00:22, 11.29it/s][A
Training:   8%|▊         | 23/280 [00:02<00:20, 12.42it/s][A
Training:   9%|▉         | 25/280 [00:02<00:24, 10.62it/s][A
Training:  10%|█         | 28/280 [00:02<00:18, 13.69it/s][A
Training:  11%|█         | 30/280 [00:03<00:21, 11.55it/s][A
Training:  12%|█▏        | 33/280 [00:03<00:19, 12.73it/s][A
Training:  12%|█▎        | 35/280 [00:03<00:19, 12.86it/s][A
Training:  13%|█▎    

Epoch: 30/43 - Loss: 2.0920 - Accuracy: 0.9372



  0%|          | 0/35 [00:00<?, ?it/s][A
  3%|▎         | 1/35 [00:00<00:21,  1.58it/s][A
 11%|█▏        | 4/35 [00:00<00:05,  6.15it/s][A
 17%|█▋        | 6/35 [00:00<00:03,  7.37it/s][A
 26%|██▌       | 9/35 [00:01<00:03,  8.24it/s][A
 37%|███▋      | 13/35 [00:01<00:02,  9.97it/s][A
 49%|████▊     | 17/35 [00:01<00:01, 11.21it/s][A
 60%|██████    | 21/35 [00:02<00:01, 12.13it/s][A
 71%|███████▏  | 25/35 [00:02<00:00, 13.40it/s][A
 83%|████████▎ | 29/35 [00:02<00:00, 13.36it/s][A
100%|██████████| 35/35 [00:03<00:00, 11.23it/s][A
Epochs:  70%|██████▉   | 30/43 [13:22<05:47, 26.70s/it]

Val Loss: 2.2164 - Val Accuracy: 0.9359



Training:   0%|          | 0/280 [00:00<?, ?it/s][A
Training:   0%|          | 1/280 [00:00<02:51,  1.63it/s][A
Training:   2%|▏         | 5/280 [00:00<00:39,  6.94it/s][A
Training:   2%|▎         | 7/280 [00:00<00:30,  8.87it/s][A
Training:   3%|▎         | 9/280 [00:01<00:29,  9.21it/s][A
Training:   4%|▍         | 12/280 [00:01<00:22, 12.14it/s][A
Training:   5%|▌         | 14/280 [00:01<00:25, 10.37it/s][A
Training:   6%|▌         | 17/280 [00:01<00:22, 11.53it/s][A
Training:   7%|▋         | 19/280 [00:01<00:22, 11.43it/s][A
Training:   8%|▊         | 21/280 [00:02<00:20, 12.53it/s][A
Training:   8%|▊         | 23/280 [00:02<00:23, 10.94it/s][A
Training:   9%|▉         | 26/280 [00:02<00:21, 11.72it/s][A
Training:  10%|█         | 28/280 [00:02<00:19, 12.72it/s][A
Training:  11%|█         | 30/280 [00:02<00:20, 12.42it/s][A
Training:  11%|█▏        | 32/280 [00:03<00:19, 12.95it/s][A
Training:  12%|█▏        | 34/280 [00:03<00:19, 12.74it/s][A
Training:  13%|█▎   

Epoch: 31/43 - Loss: 2.0227 - Accuracy: 0.9373



  0%|          | 0/35 [00:00<?, ?it/s][A
  3%|▎         | 1/35 [00:00<00:22,  1.50it/s][A
 14%|█▍        | 5/35 [00:00<00:05,  5.98it/s][A
 26%|██▌       | 9/35 [00:01<00:03,  7.67it/s][A
 37%|███▋      | 13/35 [00:01<00:02,  9.62it/s][A
 49%|████▊     | 17/35 [00:02<00:01,  9.83it/s][A
 60%|██████    | 21/35 [00:02<00:01, 10.69it/s][A
 71%|███████▏  | 25/35 [00:02<00:00, 11.59it/s][A
 83%|████████▎ | 29/35 [00:03<00:00, 11.47it/s][A
100%|██████████| 35/35 [00:03<00:00,  9.88it/s][A
Epochs:  72%|███████▏  | 31/43 [13:48<05:21, 26.75s/it]

Val Loss: 2.1857 - Val Accuracy: 0.9260



Training:   0%|          | 0/280 [00:00<?, ?it/s][A
Training:   0%|          | 1/280 [00:00<03:20,  1.39it/s][A
Training:   1%|▏         | 4/280 [00:00<00:45,  6.03it/s][A
Training:   2%|▏         | 6/280 [00:01<00:37,  7.26it/s][A
Training:   3%|▎         | 8/280 [00:01<00:28,  9.59it/s][A
Training:   4%|▎         | 10/280 [00:01<00:31,  8.55it/s][A
Training:   5%|▍         | 13/280 [00:01<00:30,  8.81it/s][A
Training:   6%|▌         | 17/280 [00:02<00:26,  9.87it/s][A
Training:   8%|▊         | 21/280 [00:02<00:22, 11.61it/s][A
Training:   9%|▊         | 24/280 [00:02<00:18, 13.87it/s][A
Training:   9%|▉         | 26/280 [00:02<00:18, 13.50it/s][A
Training:  10%|█         | 29/280 [00:02<00:19, 12.81it/s][A
Training:  12%|█▏        | 33/280 [00:03<00:17, 13.73it/s][A
Training:  13%|█▎        | 37/280 [00:03<00:16, 15.17it/s][A
Training:  15%|█▍        | 41/280 [00:03<00:14, 16.03it/s][A
Training:  16%|█▌        | 44/280 [00:03<00:13, 18.03it/s][A
Training:  16%|█▋   

Epoch: 32/43 - Loss: 2.0795 - Accuracy: 0.9343



  0%|          | 0/35 [00:00<?, ?it/s][A
  3%|▎         | 1/35 [00:00<00:24,  1.41it/s][A
 14%|█▍        | 5/35 [00:00<00:04,  6.23it/s][A
 20%|██        | 7/35 [00:01<00:03,  8.20it/s][A
 26%|██▌       | 9/35 [00:01<00:02,  8.76it/s][A
 31%|███▏      | 11/35 [00:01<00:02, 10.03it/s][A
 37%|███▋      | 13/35 [00:01<00:02,  8.83it/s][A
 46%|████▌     | 16/35 [00:01<00:01, 12.14it/s][A
 51%|█████▏    | 18/35 [00:02<00:01, 10.13it/s][A
 57%|█████▋    | 20/35 [00:02<00:01, 11.67it/s][A
 63%|██████▎   | 22/35 [00:02<00:01, 10.45it/s][A
 71%|███████▏  | 25/35 [00:02<00:00, 10.11it/s][A
 77%|███████▋  | 27/35 [00:02<00:00, 10.26it/s][A
 86%|████████▌ | 30/35 [00:03<00:00, 13.01it/s][A
 91%|█████████▏| 32/35 [00:03<00:00, 11.61it/s][A
100%|██████████| 35/35 [00:03<00:00,  9.64it/s][A
Epochs:  74%|███████▍  | 32/43 [14:15<04:55, 26.82s/it]

Val Loss: 2.3477 - Val Accuracy: 0.8968



Training:   0%|          | 0/280 [00:00<?, ?it/s][A
Training:   0%|          | 1/280 [00:00<02:28,  1.88it/s][A
Training:   1%|          | 3/280 [00:00<00:51,  5.34it/s][A
Training:   2%|▏         | 6/280 [00:00<00:33,  8.11it/s][A
Training:   3%|▎         | 9/280 [00:01<00:28,  9.48it/s][A
Training:   4%|▍         | 11/280 [00:01<00:23, 11.25it/s][A
Training:   5%|▍         | 13/280 [00:01<00:29,  8.93it/s][A
Training:   6%|▌         | 16/280 [00:01<00:21, 12.06it/s][A
Training:   6%|▋         | 18/280 [00:01<00:24, 10.78it/s][A
Training:   8%|▊         | 21/280 [00:02<00:25, 10.35it/s][A
Training:   9%|▉         | 25/280 [00:02<00:23, 10.86it/s][A
Training:  10%|█         | 29/280 [00:02<00:21, 11.55it/s][A
Training:  12%|█▏        | 33/280 [00:03<00:19, 12.87it/s][A
Training:  13%|█▎        | 37/280 [00:03<00:19, 12.30it/s][A
Training:  15%|█▍        | 41/280 [00:03<00:18, 12.70it/s][A
Training:  16%|█▌        | 45/280 [00:04<00:16, 13.91it/s][A
Training:  18%|█▊   

Epoch: 33/43 - Loss: 2.0380 - Accuracy: 0.9362



  0%|          | 0/35 [00:00<?, ?it/s][A
  3%|▎         | 1/35 [00:00<00:26,  1.28it/s][A
 14%|█▍        | 5/35 [00:01<00:05,  5.66it/s][A
 23%|██▎       | 8/35 [00:01<00:03,  8.64it/s][A
 29%|██▊       | 10/35 [00:01<00:02,  8.96it/s][A
 34%|███▍      | 12/35 [00:01<00:02, 10.71it/s][A
 40%|████      | 14/35 [00:01<00:02,  9.56it/s][A
 49%|████▊     | 17/35 [00:02<00:01,  9.56it/s][A
 60%|██████    | 21/35 [00:02<00:01,  9.96it/s][A
 71%|███████▏  | 25/35 [00:02<00:00, 10.58it/s][A
 83%|████████▎ | 29/35 [00:03<00:00, 11.02it/s][A
100%|██████████| 35/35 [00:03<00:00,  9.79it/s][A
Epochs:  77%|███████▋  | 33/43 [14:42<04:28, 26.82s/it]

Val Loss: 2.1564 - Val Accuracy: 0.9416



Training:   0%|          | 0/280 [00:00<?, ?it/s][A
Training:   0%|          | 1/280 [00:00<03:17,  1.42it/s][A
Training:   2%|▏         | 5/280 [00:01<00:46,  5.95it/s][A
Training:   3%|▎         | 8/280 [00:01<00:29,  9.28it/s][A
Training:   4%|▎         | 10/280 [00:01<00:27,  9.67it/s][A
Training:   4%|▍         | 12/280 [00:01<00:24, 10.92it/s][A
Training:   5%|▌         | 14/280 [00:01<00:24, 11.00it/s][A
Training:   6%|▌         | 16/280 [00:01<00:23, 11.26it/s][A
Training:   6%|▋         | 18/280 [00:01<00:22, 11.75it/s][A
Training:   7%|▋         | 20/280 [00:02<00:21, 11.98it/s][A
Training:   8%|▊         | 23/280 [00:02<00:21, 12.02it/s][A
Training:  10%|▉         | 27/280 [00:02<00:17, 14.17it/s][A
Training:  11%|█         | 31/280 [00:02<00:16, 15.36it/s][A
Training:  12%|█▎        | 35/280 [00:03<00:15, 16.05it/s][A
Training:  14%|█▍        | 39/280 [00:03<00:15, 15.33it/s][A
Training:  15%|█▌        | 43/280 [00:03<00:16, 14.73it/s][A
Training:  16%|█▌  

Epoch: 34/43 - Loss: 1.9995 - Accuracy: 0.9356



  0%|          | 0/35 [00:00<?, ?it/s][A
  3%|▎         | 1/35 [00:00<00:25,  1.34it/s][A
 11%|█▏        | 4/35 [00:00<00:05,  5.68it/s][A
 17%|█▋        | 6/35 [00:01<00:04,  6.32it/s][A
 26%|██▌       | 9/35 [00:01<00:03,  7.53it/s][A
 37%|███▋      | 13/35 [00:01<00:02,  9.69it/s][A
 43%|████▎     | 15/35 [00:01<00:01, 11.02it/s][A
 49%|████▊     | 17/35 [00:02<00:01, 10.61it/s][A
 54%|█████▍    | 19/35 [00:02<00:01, 12.14it/s][A
 60%|██████    | 21/35 [00:02<00:01, 11.78it/s][A
 66%|██████▌   | 23/35 [00:02<00:00, 12.49it/s][A
 71%|███████▏  | 25/35 [00:02<00:00, 11.98it/s][A
 77%|███████▋  | 27/35 [00:02<00:00, 12.55it/s][A
 83%|████████▎ | 29/35 [00:03<00:00, 11.39it/s][A
 89%|████████▊ | 31/35 [00:03<00:00, 12.61it/s][A
100%|██████████| 35/35 [00:03<00:00,  9.95it/s][A
Epochs:  79%|███████▉  | 34/43 [15:09<04:00, 26.74s/it]

Val Loss: 2.2765 - Val Accuracy: 0.9180



Training:   0%|          | 0/280 [00:00<?, ?it/s][A
Training:   0%|          | 1/280 [00:00<03:05,  1.50it/s][A
Training:   2%|▏         | 5/280 [00:00<00:39,  6.95it/s][A
Training:   3%|▎         | 8/280 [00:01<00:25, 10.58it/s][A
Training:   4%|▎         | 10/280 [00:01<00:29,  9.13it/s][A
Training:   5%|▍         | 13/280 [00:01<00:26,  9.94it/s][A
Training:   6%|▌         | 17/280 [00:01<00:23, 11.32it/s][A
Training:   7%|▋         | 20/280 [00:01<00:19, 13.68it/s][A
Training:   8%|▊         | 22/280 [00:02<00:22, 11.45it/s][A
Training:   9%|▉         | 25/280 [00:02<00:24, 10.62it/s][A
Training:  10%|█         | 29/280 [00:02<00:20, 12.15it/s][A
Training:  11%|█▏        | 32/280 [00:02<00:17, 14.57it/s][A
Training:  12%|█▏        | 34/280 [00:03<00:19, 12.72it/s][A
Training:  13%|█▎        | 37/280 [00:03<00:20, 11.74it/s][A
Training:  14%|█▍        | 39/280 [00:03<00:20, 12.05it/s][A
Training:  15%|█▍        | 41/280 [00:03<00:19, 12.39it/s][A
Training:  16%|█▌  

Epoch: 35/43 - Loss: 2.0180 - Accuracy: 0.9363



  0%|          | 0/35 [00:00<?, ?it/s][A
  3%|▎         | 1/35 [00:00<00:20,  1.66it/s][A
  6%|▌         | 2/35 [00:00<00:10,  3.04it/s][A
 14%|█▍        | 5/35 [00:00<00:04,  7.45it/s][A
 20%|██        | 7/35 [00:01<00:02,  9.43it/s][A
 26%|██▌       | 9/35 [00:01<00:02,  9.36it/s][A
 31%|███▏      | 11/35 [00:01<00:02, 10.80it/s][A
 37%|███▋      | 13/35 [00:01<00:02, 10.05it/s][A
 43%|████▎     | 15/35 [00:01<00:01, 10.84it/s][A
 49%|████▊     | 17/35 [00:02<00:01,  9.58it/s][A
 54%|█████▍    | 19/35 [00:02<00:01, 11.35it/s][A
 60%|██████    | 21/35 [00:02<00:01,  8.87it/s][A
 69%|██████▊   | 24/35 [00:02<00:00, 12.23it/s][A
 74%|███████▍  | 26/35 [00:02<00:00,  9.99it/s][A
 83%|████████▎ | 29/35 [00:03<00:00, 11.02it/s][A
 89%|████████▊ | 31/35 [00:03<00:00, 11.53it/s][A
 94%|█████████▍| 33/35 [00:03<00:00, 11.42it/s][A
100%|██████████| 35/35 [00:03<00:00,  9.48it/s][A
Epochs:  81%|████████▏ | 35/43 [15:36<03:35, 26.94s/it]

Val Loss: 2.1421 - Val Accuracy: 0.9439



Training:   0%|          | 0/280 [00:00<?, ?it/s][A
Training:   0%|          | 1/280 [00:00<03:29,  1.33it/s][A
Training:   2%|▏         | 5/280 [00:01<00:49,  5.51it/s][A
Training:   3%|▎         | 8/280 [00:01<00:30,  8.87it/s][A
Training:   4%|▎         | 10/280 [00:01<00:32,  8.39it/s][A
Training:   5%|▍         | 13/280 [00:01<00:30,  8.84it/s][A
Training:   6%|▌         | 16/280 [00:01<00:22, 11.78it/s][A
Training:   6%|▋         | 18/280 [00:02<00:23, 11.01it/s][A
Training:   8%|▊         | 21/280 [00:02<00:25, 10.09it/s][A
Training:   9%|▊         | 24/280 [00:02<00:19, 12.81it/s][A
Training:   9%|▉         | 26/280 [00:02<00:21, 11.81it/s][A
Training:  10%|█         | 29/280 [00:02<00:19, 12.62it/s][A
Training:  11%|█▏        | 32/280 [00:03<00:18, 13.40it/s][A
Training:  12%|█▏        | 34/280 [00:03<00:18, 13.39it/s][A
Training:  13%|█▎        | 36/280 [00:03<00:19, 12.83it/s][A
Training:  14%|█▎        | 38/280 [00:03<00:18, 13.40it/s][A
Training:  14%|█▍  

Epoch: 36/43 - Loss: 2.0114 - Accuracy: 0.9337



  0%|          | 0/35 [00:00<?, ?it/s][A
  3%|▎         | 1/35 [00:00<00:19,  1.75it/s][A
  9%|▊         | 3/35 [00:00<00:06,  5.28it/s][A
 14%|█▍        | 5/35 [00:00<00:04,  7.18it/s][A
 20%|██        | 7/35 [00:01<00:03,  8.57it/s][A
 26%|██▌       | 9/35 [00:01<00:02,  9.25it/s][A
 31%|███▏      | 11/35 [00:01<00:02,  9.78it/s][A
 37%|███▋      | 13/35 [00:01<00:02, 10.70it/s][A
 43%|████▎     | 15/35 [00:01<00:02,  8.97it/s][A
 51%|█████▏    | 18/35 [00:02<00:01, 11.13it/s][A
 57%|█████▋    | 20/35 [00:02<00:01,  9.94it/s][A
 63%|██████▎   | 22/35 [00:02<00:01, 11.46it/s][A
 69%|██████▊   | 24/35 [00:02<00:01, 10.56it/s][A
 74%|███████▍  | 26/35 [00:02<00:00, 12.01it/s][A
 80%|████████  | 28/35 [00:03<00:00, 10.12it/s][A
 86%|████████▌ | 30/35 [00:03<00:00, 11.13it/s][A
 91%|█████████▏| 32/35 [00:03<00:00, 10.26it/s][A
100%|██████████| 35/35 [00:03<00:00,  9.48it/s][A
Epochs:  84%|████████▎ | 36/43 [16:03<03:08, 27.00s/it]

Val Loss: 2.0884 - Val Accuracy: 0.9427



Training:   0%|          | 0/280 [00:00<?, ?it/s][A
Training:   0%|          | 1/280 [00:00<03:20,  1.39it/s][A
Training:   1%|          | 2/280 [00:00<01:40,  2.76it/s][A
Training:   2%|▏         | 5/280 [00:00<00:36,  7.63it/s][A
Training:   2%|▎         | 7/280 [00:01<00:32,  8.42it/s][A
Training:   3%|▎         | 9/280 [00:01<00:26, 10.17it/s][A
Training:   4%|▍         | 11/280 [00:01<00:30,  8.93it/s][A
Training:   5%|▍         | 13/280 [00:01<00:24, 10.82it/s][A
Training:   5%|▌         | 15/280 [00:01<00:26,  9.82it/s][A
Training:   6%|▌         | 17/280 [00:02<00:24, 10.81it/s][A
Training:   7%|▋         | 19/280 [00:02<00:26,  9.86it/s][A
Training:   8%|▊         | 22/280 [00:02<00:27,  9.29it/s][A
Training:   9%|▉         | 26/280 [00:02<00:22, 11.22it/s][A
Training:  11%|█         | 30/280 [00:03<00:20, 12.48it/s][A
Training:  12%|█▏        | 34/280 [00:03<00:17, 13.83it/s][A
Training:  14%|█▎        | 38/280 [00:03<00:16, 14.29it/s][A
Training:  15%|█▍    

Epoch: 37/43 - Loss: 1.9341 - Accuracy: 0.9413



  0%|          | 0/35 [00:00<?, ?it/s][A
  3%|▎         | 1/35 [00:00<00:21,  1.59it/s][A
 11%|█▏        | 4/35 [00:00<00:04,  6.77it/s][A
 17%|█▋        | 6/35 [00:01<00:04,  6.48it/s][A
 26%|██▌       | 9/35 [00:01<00:02,  8.89it/s][A
 31%|███▏      | 11/35 [00:01<00:02,  9.64it/s][A
 37%|███▋      | 13/35 [00:01<00:02, 10.75it/s][A
 43%|████▎     | 15/35 [00:01<00:02,  9.85it/s][A
 51%|█████▏    | 18/35 [00:02<00:01, 10.06it/s][A
 60%|██████    | 21/35 [00:02<00:01, 12.47it/s][A
 66%|██████▌   | 23/35 [00:02<00:00, 12.14it/s][A
 71%|███████▏  | 25/35 [00:02<00:00, 12.42it/s][A
 77%|███████▋  | 27/35 [00:02<00:00, 12.50it/s][A
 83%|████████▎ | 29/35 [00:02<00:00, 12.05it/s][A
 89%|████████▊ | 31/35 [00:03<00:00, 12.53it/s][A
 94%|█████████▍| 33/35 [00:03<00:00, 13.13it/s][A
100%|██████████| 35/35 [00:03<00:00, 10.20it/s][A
Epochs:  86%|████████▌ | 37/43 [16:30<02:41, 26.94s/it]

Val Loss: 2.1652 - Val Accuracy: 0.9445



Training:   0%|          | 0/280 [00:00<?, ?it/s][A
Training:   0%|          | 1/280 [00:00<03:29,  1.33it/s][A
Training:   1%|          | 3/280 [00:00<01:04,  4.28it/s][A
Training:   2%|▏         | 5/280 [00:01<00:44,  6.15it/s][A
Training:   2%|▎         | 7/280 [00:01<00:34,  7.88it/s][A
Training:   3%|▎         | 9/280 [00:01<00:31,  8.73it/s][A
Training:   4%|▍         | 11/280 [00:01<00:31,  8.68it/s][A
Training:   5%|▌         | 14/280 [00:01<00:22, 11.80it/s][A
Training:   6%|▌         | 16/280 [00:02<00:26, 10.06it/s][A
Training:   6%|▋         | 18/280 [00:02<00:22, 11.61it/s][A
Training:   7%|▋         | 20/280 [00:02<00:25, 10.38it/s][A
Training:   8%|▊         | 22/280 [00:02<00:21, 11.86it/s][A
Training:   9%|▊         | 24/280 [00:02<00:21, 11.80it/s][A
Training:   9%|▉         | 26/280 [00:02<00:18, 13.37it/s][A
Training:  10%|█         | 28/280 [00:02<00:21, 11.71it/s][A
Training:  11%|█         | 31/280 [00:03<00:21, 11.61it/s][A
Training:  12%|█▎    

Epoch: 38/43 - Loss: 1.9584 - Accuracy: 0.9395



  0%|          | 0/35 [00:00<?, ?it/s][A
  3%|▎         | 1/35 [00:00<00:26,  1.27it/s][A
 11%|█▏        | 4/35 [00:00<00:05,  5.50it/s][A
 17%|█▋        | 6/35 [00:01<00:04,  6.70it/s][A
 23%|██▎       | 8/35 [00:01<00:03,  8.39it/s][A
 29%|██▊       | 10/35 [00:01<00:02,  8.74it/s][A
 34%|███▍      | 12/35 [00:01<00:02,  9.46it/s][A
 43%|████▎     | 15/35 [00:01<00:01, 12.98it/s][A
 49%|████▊     | 17/35 [00:02<00:01, 10.46it/s][A
 57%|█████▋    | 20/35 [00:02<00:01,  9.83it/s][A
 69%|██████▊   | 24/35 [00:02<00:00, 11.07it/s][A
 80%|████████  | 28/35 [00:03<00:00, 11.47it/s][A
 89%|████████▊ | 31/35 [00:03<00:00, 13.89it/s][A
100%|██████████| 35/35 [00:03<00:00,  9.79it/s][A
Epochs:  88%|████████▊ | 38/43 [16:58<02:15, 27.10s/it]

Val Loss: 2.1799 - Val Accuracy: 0.9439



Training:   0%|          | 0/280 [00:00<?, ?it/s][A
Training:   0%|          | 1/280 [00:00<03:06,  1.49it/s][A
Training:   1%|▏         | 4/280 [00:00<00:44,  6.22it/s][A
Training:   2%|▏         | 6/280 [00:00<00:35,  7.71it/s][A
Training:   3%|▎         | 8/280 [00:01<00:27,  9.91it/s][A
Training:   4%|▎         | 10/280 [00:01<00:30,  8.94it/s][A
Training:   5%|▍         | 13/280 [00:01<00:24, 10.77it/s][A
Training:   6%|▌         | 16/280 [00:01<00:19, 13.26it/s][A
Training:   6%|▋         | 18/280 [00:01<00:21, 12.07it/s][A
Training:   8%|▊         | 21/280 [00:02<00:19, 13.31it/s][A
Training:   8%|▊         | 23/280 [00:02<00:20, 12.25it/s][A
Training:   9%|▉         | 25/280 [00:02<00:19, 13.03it/s][A
Training:  10%|▉         | 27/280 [00:02<00:20, 12.07it/s][A
Training:  10%|█         | 29/280 [00:02<00:18, 13.58it/s][A
Training:  11%|█         | 31/280 [00:02<00:20, 12.41it/s][A
Training:  12%|█▏        | 33/280 [00:03<00:19, 12.95it/s][A
Training:  12%|█▎   

Epoch: 39/43 - Loss: 1.9645 - Accuracy: 0.9356



  0%|          | 0/35 [00:00<?, ?it/s][A
  3%|▎         | 1/35 [00:00<00:26,  1.30it/s][A
 14%|█▍        | 5/35 [00:01<00:05,  5.69it/s][A
 26%|██▌       | 9/35 [00:01<00:03,  7.34it/s][A
 37%|███▋      | 13/35 [00:01<00:02,  8.92it/s][A
 49%|████▊     | 17/35 [00:02<00:01,  9.43it/s][A
 57%|█████▋    | 20/35 [00:02<00:01, 11.70it/s][A
 63%|██████▎   | 22/35 [00:02<00:01,  9.80it/s][A
 71%|███████▏  | 25/35 [00:02<00:01,  9.75it/s][A
 83%|████████▎ | 29/35 [00:03<00:00,  9.92it/s][A
100%|██████████| 35/35 [00:03<00:00,  9.38it/s][A
Epochs:  91%|█████████ | 39/43 [17:24<01:47, 26.98s/it]

Val Loss: 2.0728 - Val Accuracy: 0.9279



Training:   0%|          | 0/280 [00:00<?, ?it/s][A
Training:   0%|          | 1/280 [00:00<02:49,  1.65it/s][A
Training:   1%|          | 3/280 [00:00<01:06,  4.19it/s][A
Training:   2%|▏         | 6/280 [00:01<00:36,  7.50it/s][A
Training:   3%|▎         | 8/280 [00:01<00:29,  9.32it/s][A
Training:   4%|▎         | 10/280 [00:01<00:28,  9.46it/s][A
Training:   4%|▍         | 12/280 [00:01<00:24, 11.00it/s][A
Training:   5%|▌         | 14/280 [00:01<00:24, 10.78it/s][A
Training:   6%|▌         | 16/280 [00:01<00:25, 10.43it/s][A
Training:   6%|▋         | 18/280 [00:02<00:23, 11.25it/s][A
Training:   7%|▋         | 20/280 [00:02<00:23, 10.95it/s][A
Training:   8%|▊         | 22/280 [00:02<00:22, 11.31it/s][A
Training:   9%|▊         | 24/280 [00:02<00:24, 10.61it/s][A
Training:   9%|▉         | 26/280 [00:02<00:22, 11.14it/s][A
Training:  10%|█         | 28/280 [00:03<00:25,  9.82it/s][A
Training:  11%|█         | 31/280 [00:03<00:27,  9.10it/s][A
Training:  12%|█▏   

Epoch: 40/43 - Loss: 1.9527 - Accuracy: 0.9388



  0%|          | 0/35 [00:00<?, ?it/s][A
  3%|▎         | 1/35 [00:00<00:21,  1.59it/s][A
  6%|▌         | 2/35 [00:00<00:11,  2.90it/s][A
 14%|█▍        | 5/35 [00:00<00:04,  7.48it/s][A
 20%|██        | 7/35 [00:01<00:03,  8.65it/s][A
 26%|██▌       | 9/35 [00:01<00:02,  9.96it/s][A
 31%|███▏      | 11/35 [00:01<00:02,  9.65it/s][A
 37%|███▋      | 13/35 [00:01<00:01, 11.46it/s][A
 43%|████▎     | 15/35 [00:01<00:01, 10.28it/s][A
 51%|█████▏    | 18/35 [00:02<00:01,  9.55it/s][A
 63%|██████▎   | 22/35 [00:02<00:01,  9.88it/s][A
 74%|███████▍  | 26/35 [00:02<00:00, 10.63it/s][A
 86%|████████▌ | 30/35 [00:03<00:00, 11.03it/s][A
100%|██████████| 35/35 [00:03<00:00,  9.48it/s][A
Epochs:  93%|█████████▎| 40/43 [17:52<01:21, 27.17s/it]

Val Loss: 2.3579 - Val Accuracy: 0.9427



Training:   0%|          | 0/280 [00:00<?, ?it/s][A
Training:   0%|          | 1/280 [00:00<03:07,  1.49it/s][A
Training:   1%|▏         | 4/280 [00:00<00:45,  6.12it/s][A
Training:   2%|▏         | 6/280 [00:00<00:33,  8.11it/s][A
Training:   3%|▎         | 8/280 [00:01<00:26, 10.43it/s][A
Training:   4%|▎         | 10/280 [00:01<00:25, 10.70it/s][A
Training:   4%|▍         | 12/280 [00:01<00:22, 12.09it/s][A
Training:   5%|▌         | 14/280 [00:01<00:25, 10.31it/s][A
Training:   6%|▌         | 17/280 [00:01<00:23, 11.07it/s][A
Training:   7%|▋         | 19/280 [00:02<00:22, 11.53it/s][A
Training:   8%|▊         | 21/280 [00:02<00:21, 11.87it/s][A
Training:   8%|▊         | 23/280 [00:02<00:19, 13.33it/s][A
Training:   9%|▉         | 25/280 [00:02<00:20, 12.74it/s][A
Training:  10%|▉         | 27/280 [00:02<00:19, 12.98it/s][A
Training:  10%|█         | 29/280 [00:02<00:22, 11.36it/s][A
Training:  11%|█▏        | 32/280 [00:02<00:16, 14.65it/s][A
Training:  12%|█▏   

Epoch: 41/43 - Loss: 1.9880 - Accuracy: 0.9389



  0%|          | 0/35 [00:00<?, ?it/s][A
  3%|▎         | 1/35 [00:00<00:23,  1.45it/s][A
 14%|█▍        | 5/35 [00:01<00:05,  5.74it/s][A
 26%|██▌       | 9/35 [00:01<00:03,  7.62it/s][A
 37%|███▋      | 13/35 [00:01<00:02,  8.93it/s][A
 49%|████▊     | 17/35 [00:02<00:01,  9.36it/s][A
 60%|██████    | 21/35 [00:02<00:01, 10.36it/s][A
 71%|███████▏  | 25/35 [00:02<00:00, 10.57it/s][A
 83%|████████▎ | 29/35 [00:03<00:00, 10.70it/s][A
100%|██████████| 35/35 [00:03<00:00,  9.59it/s][A
Epochs:  95%|█████████▌| 41/43 [18:19<00:54, 27.10s/it]

Val Loss: 2.3068 - Val Accuracy: 0.9277



Training:   0%|          | 0/280 [00:00<?, ?it/s][A
Training:   0%|          | 1/280 [00:00<02:31,  1.84it/s][A
Training:   1%|          | 3/280 [00:00<00:50,  5.48it/s][A
Training:   2%|▏         | 5/280 [00:00<00:37,  7.39it/s][A
Training:   2%|▎         | 7/280 [00:00<00:27, 10.04it/s][A
Training:   3%|▎         | 9/280 [00:01<00:31,  8.64it/s][A
Training:   4%|▍         | 12/280 [00:01<00:23, 11.50it/s][A
Training:   5%|▌         | 14/280 [00:01<00:26, 10.09it/s][A
Training:   6%|▌         | 17/280 [00:01<00:27,  9.55it/s][A
Training:   7%|▋         | 20/280 [00:02<00:21, 12.17it/s][A
Training:   8%|▊         | 22/280 [00:02<00:24, 10.66it/s][A
Training:   9%|▉         | 25/280 [00:02<00:23, 10.79it/s][A
Training:  10%|█         | 28/280 [00:02<00:18, 13.30it/s][A
Training:  11%|█         | 30/280 [00:02<00:21, 11.71it/s][A
Training:  12%|█▏        | 33/280 [00:03<00:22, 11.05it/s][A
Training:  13%|█▎        | 36/280 [00:03<00:17, 13.71it/s][A
Training:  14%|█▎    

Epoch: 42/43 - Loss: 1.9515 - Accuracy: 0.9391



  0%|          | 0/35 [00:00<?, ?it/s][A
  3%|▎         | 1/35 [00:00<00:22,  1.48it/s][A
  6%|▌         | 2/35 [00:00<00:11,  2.96it/s][A
 14%|█▍        | 5/35 [00:00<00:04,  7.32it/s][A
 20%|██        | 7/35 [00:01<00:03,  8.16it/s][A
 26%|██▌       | 9/35 [00:01<00:02,  9.84it/s][A
 31%|███▏      | 11/35 [00:01<00:02,  9.90it/s][A
 37%|███▋      | 13/35 [00:01<00:01, 11.30it/s][A
 43%|████▎     | 15/35 [00:01<00:02,  9.71it/s][A
 51%|█████▏    | 18/35 [00:02<00:01, 10.18it/s][A
 63%|██████▎   | 22/35 [00:02<00:01, 10.61it/s][A
 74%|███████▍  | 26/35 [00:02<00:00, 10.97it/s][A
 86%|████████▌ | 30/35 [00:03<00:00, 11.81it/s][A
100%|██████████| 35/35 [00:03<00:00,  9.79it/s][A
Epochs:  98%|█████████▊| 42/43 [18:45<00:26, 26.91s/it]

Val Loss: 2.3321 - Val Accuracy: 0.9404



Training:   0%|          | 0/280 [00:00<?, ?it/s][A
Training:   0%|          | 1/280 [00:00<03:01,  1.54it/s][A
Training:   1%|          | 2/280 [00:00<01:35,  2.90it/s][A
Training:   1%|▏         | 4/280 [00:00<00:44,  6.18it/s][A
Training:   2%|▏         | 6/280 [00:01<00:40,  6.82it/s][A
Training:   3%|▎         | 9/280 [00:01<00:31,  8.54it/s][A
Training:   4%|▍         | 12/280 [00:01<00:26, 10.05it/s][A
Training:   5%|▌         | 14/280 [00:01<00:24, 10.65it/s][A
Training:   6%|▌         | 16/280 [00:02<00:26, 10.07it/s][A
Training:   7%|▋         | 19/280 [00:02<00:19, 13.10it/s][A
Training:   8%|▊         | 21/280 [00:02<00:20, 12.67it/s][A
Training:   9%|▊         | 24/280 [00:02<00:22, 11.47it/s][A
Training:  10%|▉         | 27/280 [00:02<00:17, 14.46it/s][A
Training:  10%|█         | 29/280 [00:02<00:18, 13.68it/s][A
Training:  11%|█▏        | 32/280 [00:03<00:18, 13.07it/s][A
Training:  12%|█▎        | 35/280 [00:03<00:15, 15.84it/s][A
Training:  13%|█▎    

Epoch: 43/43 - Loss: 1.9680 - Accuracy: 0.9385



  0%|          | 0/35 [00:00<?, ?it/s][A
  3%|▎         | 1/35 [00:00<00:25,  1.33it/s][A
 14%|█▍        | 5/35 [00:01<00:05,  5.56it/s][A
 26%|██▌       | 9/35 [00:01<00:03,  8.08it/s][A
 37%|███▋      | 13/35 [00:01<00:02,  9.42it/s][A
 49%|████▊     | 17/35 [00:01<00:01, 11.45it/s][A
 60%|██████    | 21/35 [00:02<00:01, 11.34it/s][A
 69%|██████▊   | 24/35 [00:02<00:00, 13.36it/s][A
 74%|███████▍  | 26/35 [00:02<00:00, 10.52it/s][A
 83%|████████▎ | 29/35 [00:02<00:00, 11.18it/s][A
 89%|████████▊ | 31/35 [00:03<00:00, 11.32it/s][A
 94%|█████████▍| 33/35 [00:03<00:00, 11.19it/s][A
100%|██████████| 35/35 [00:03<00:00,  9.66it/s][A
Epochs: 100%|██████████| 43/43 [19:12<00:00, 26.80s/it]


Val Loss: 2.1767 - Val Accuracy: 0.9387


[32m[I 2023-12-15 00:54:38,562][0m Trial 11 finished with value: 0.9387301802635193 and parameters: {'loss_learning_rate': 0.0022039026522337533, 'learning_rate': 0.003855536505422354, 'weight_decay': 0.003485245048842352, 'epsilon': 1.1759787698978145e-08, 'batch_size': 50, 'epochs': 43}. Best is trial 3 with value: 0.9413145780563354.[0m


Learning rate for Loss: 0.0011031898945929235
Learning rate: 0.0021582686856352106
Weight decay: 0.009994675561598458
Epsilon: 1.647043315653362e-08
Batch size: 207
Number of epochs: 35


Epochs:   0%|          | 0/35 [00:00<?, ?it/s]
Training:   0%|          | 0/68 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/68 [00:01<02:02,  1.84s/it][A
Training:   6%|▌         | 4/68 [00:01<00:24,  2.60it/s][A
Training:   9%|▉         | 6/68 [00:03<00:31,  1.95it/s][A
Training:  12%|█▏        | 8/68 [00:03<00:20,  2.93it/s][A
Training:  15%|█▍        | 10/68 [00:04<00:26,  2.17it/s][A
Training:  18%|█▊        | 12/68 [00:04<00:18,  3.09it/s][A
Training:  21%|██        | 14/68 [00:06<00:22,  2.45it/s][A
Training:  25%|██▌       | 17/68 [00:07<00:21,  2.38it/s][A
Training:  26%|██▋       | 18/68 [00:07<00:18,  2.68it/s][A
Training:  28%|██▊       | 19/68 [00:07<00:16,  3.06it/s][A
Training:  29%|██▉       | 20/68 [00:07<00:13,  3.52it/s][A
Training:  31%|███       | 21/68 [00:08<00:21,  2.22it/s][A
Training:  32%|███▏      | 22/68 [00:08<00:16,  2.72it/s][A
Training:  35%|███▌      | 24/68 [00:09<00:10,  4.18it/s][A
Training:  37%|███▋      | 25/68 [00:10<00:19,  2.2

Epoch: 1/35 - Loss: 12.4394 - Accuracy: 0.7901



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:01<00:15,  1.97s/it][A
 22%|██▏       | 2/9 [00:02<00:06,  1.13it/s][A
 44%|████▍     | 4/9 [00:02<00:01,  2.72it/s][A
 67%|██████▋   | 6/9 [00:03<00:01,  2.14it/s][A
100%|██████████| 9/9 [00:04<00:00,  2.22it/s][A
Epochs:   0%|          | 0/35 [00:27<?, ?it/s]
[32m[I 2023-12-15 00:55:06,361][0m Trial 12 pruned. [0m


Val Loss: 5.5872 - Val Accuracy: 0.8952
Learning rate for Loss: 0.008226475138360454
Learning rate: 0.00023559479818267292
Weight decay: 0.004438394908214023
Epsilon: 2.681775677119305e-08
Batch size: 52
Number of epochs: 66


Epochs:   0%|          | 0/66 [00:00<?, ?it/s]
Training:   0%|          | 0/269 [00:00<?, ?it/s][A
Training:   0%|          | 1/269 [00:00<03:21,  1.33it/s][A
Training:   1%|          | 3/269 [00:00<01:03,  4.19it/s][A
Training:   2%|▏         | 5/269 [00:01<00:43,  6.12it/s][A
Training:   3%|▎         | 7/269 [00:01<00:32,  8.11it/s][A
Training:   3%|▎         | 9/269 [00:01<00:29,  8.92it/s][A
Training:   4%|▍         | 11/269 [00:01<00:26,  9.58it/s][A
Training:   5%|▍         | 13/269 [00:01<00:23, 10.87it/s][A
Training:   6%|▌         | 15/269 [00:01<00:23, 10.74it/s][A
Training:   6%|▋         | 17/269 [00:02<00:22, 11.25it/s][A
Training:   7%|▋         | 19/269 [00:02<00:21, 11.47it/s][A
Training:   8%|▊         | 21/269 [00:02<00:21, 11.61it/s][A
Training:   9%|▊         | 23/269 [00:02<00:21, 11.21it/s][A
Training:   9%|▉         | 25/269 [00:02<00:19, 12.35it/s][A
Training:  10%|█         | 27/269 [00:02<00:22, 10.67it/s][A
Training:  11%|█         | 29/269 [00

Epoch: 1/66 - Loss: 11.3500 - Accuracy: 0.8048



  0%|          | 0/34 [00:00<?, ?it/s][A
  3%|▎         | 1/34 [00:00<00:21,  1.52it/s][A
 15%|█▍        | 5/34 [00:01<00:05,  5.78it/s][A
 26%|██▋       | 9/34 [00:01<00:03,  8.17it/s][A
 38%|███▊      | 13/34 [00:01<00:02,  8.65it/s][A
 50%|█████     | 17/34 [00:02<00:01,  9.56it/s][A
 62%|██████▏   | 21/34 [00:02<00:01,  9.79it/s][A
 74%|███████▎  | 25/34 [00:02<00:00, 10.80it/s][A
 85%|████████▌ | 29/34 [00:03<00:00, 11.05it/s][A
100%|██████████| 34/34 [00:03<00:00,  9.49it/s][A
Epochs:   0%|          | 0/66 [00:27<?, ?it/s]
[32m[I 2023-12-15 00:55:34,081][0m Trial 13 pruned. [0m


Val Loss: 5.5704 - Val Accuracy: 0.8892
Learning rate for Loss: 0.003020886280706533
Learning rate: 0.001753432040609032
Weight decay: 0.0033486711312313805
Epsilon: 9.047363102566672e-08
Batch size: 243
Number of epochs: 33


Epochs:   0%|          | 0/33 [00:00<?, ?it/s]
Training:   0%|          | 0/58 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/58 [00:01<01:48,  1.91s/it][A
Training:   3%|▎         | 2/58 [00:02<00:56,  1.02s/it][A
Training:   9%|▊         | 5/58 [00:03<00:28,  1.83it/s][A
Training:  10%|█         | 6/58 [00:03<00:28,  1.85it/s][A
Training:  12%|█▏        | 7/58 [00:04<00:22,  2.30it/s][A
Training:  16%|█▌        | 9/58 [00:05<00:22,  2.21it/s][A
Training:  17%|█▋        | 10/58 [00:05<00:23,  2.05it/s][A
Training:  21%|██        | 12/58 [00:05<00:14,  3.07it/s][A
Training:  22%|██▏       | 13/58 [00:06<00:21,  2.09it/s][A
Training:  24%|██▍       | 14/58 [00:07<00:20,  2.18it/s][A
Training:  28%|██▊       | 16/58 [00:07<00:12,  3.30it/s][A
Training:  29%|██▉       | 17/58 [00:08<00:19,  2.13it/s][A
Training:  31%|███       | 18/58 [00:08<00:19,  2.02it/s][A
Training:  34%|███▍      | 20/58 [00:09<00:12,  3.01it/s][A
Training:  36%|███▌      | 21/58 [00:10<00:17,  2.14i

Epoch: 1/33 - Loss: 8.8676 - Accuracy: 0.8119



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:02<00:14,  2.14s/it][A
 38%|███▊      | 3/8 [00:02<00:02,  1.67it/s][A
 62%|██████▎   | 5/8 [00:03<00:01,  1.69it/s][A
100%|██████████| 8/8 [00:03<00:00,  2.20it/s][A
Epochs:   0%|          | 0/33 [00:26<?, ?it/s]
[32m[I 2023-12-15 00:56:01,633][0m Trial 14 pruned. [0m


Val Loss: 4.0631 - Val Accuracy: 0.8834
Learning rate for Loss: 0.0006142753776189039
Learning rate: 0.010169022220306113
Weight decay: 0.003120397839988537
Epsilon: 5.304404641597612e-09
Batch size: 150
Number of epochs: 10


Epochs:   0%|          | 0/10 [00:00<?, ?it/s]
Training:   0%|          | 0/94 [00:00<?, ?it/s][A
Training:   1%|          | 1/94 [00:01<02:10,  1.40s/it][A
Training:   3%|▎         | 3/94 [00:01<00:39,  2.28it/s][A
Training:   5%|▌         | 5/94 [00:02<00:37,  2.37it/s][A
Training:   7%|▋         | 7/94 [00:02<00:24,  3.58it/s][A
Training:   9%|▊         | 8/94 [00:02<00:20,  4.20it/s][A
Training:  10%|▉         | 9/94 [00:03<00:31,  2.68it/s][A
Training:  13%|█▎        | 12/94 [00:03<00:17,  4.72it/s][A
Training:  14%|█▍        | 13/94 [00:04<00:26,  3.05it/s][A
Training:  16%|█▌        | 15/94 [00:04<00:18,  4.25it/s][A
Training:  17%|█▋        | 16/94 [00:04<00:16,  4.69it/s][A
Training:  18%|█▊        | 17/94 [00:05<00:23,  3.31it/s][A
Training:  20%|██        | 19/94 [00:05<00:15,  4.74it/s][A
Training:  21%|██▏       | 20/94 [00:05<00:16,  4.48it/s][A
Training:  22%|██▏       | 21/94 [00:06<00:21,  3.39it/s][A
Training:  26%|██▌       | 24/94 [00:06<00:15,  4.55i

Epoch: 1/10 - Loss: 7.5494 - Accuracy: 0.8299



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:13,  1.26s/it][A
 25%|██▌       | 3/12 [00:01<00:03,  2.64it/s][A
 42%|████▏     | 5/12 [00:02<00:02,  2.46it/s][A
 50%|█████     | 6/12 [00:02<00:02,  2.90it/s][A
 75%|███████▌  | 9/12 [00:03<00:00,  3.23it/s][A
100%|██████████| 12/12 [00:03<00:00,  3.32it/s][A
Epochs:  10%|█         | 1/10 [00:26<03:56, 26.29s/it]

Val Loss: 4.0037 - Val Accuracy: 0.9024



Training:   0%|          | 0/94 [00:00<?, ?it/s][A
Training:   1%|          | 1/94 [00:01<01:58,  1.27s/it][A
Training:   3%|▎         | 3/94 [00:01<00:34,  2.66it/s][A
Training:   5%|▌         | 5/94 [00:02<00:36,  2.45it/s][A
Training:   7%|▋         | 7/94 [00:02<00:22,  3.80it/s][A
Training:  10%|▉         | 9/94 [00:03<00:27,  3.10it/s][A
Training:  12%|█▏        | 11/94 [00:03<00:19,  4.21it/s][A
Training:  14%|█▍        | 13/94 [00:04<00:24,  3.28it/s][A
Training:  15%|█▍        | 14/94 [00:04<00:21,  3.73it/s][A
Training:  17%|█▋        | 16/94 [00:04<00:15,  4.93it/s][A
Training:  18%|█▊        | 17/94 [00:05<00:22,  3.47it/s][A
Training:  20%|██        | 19/94 [00:05<00:15,  4.87it/s][A
Training:  22%|██▏       | 21/94 [00:06<00:21,  3.46it/s][A
Training:  23%|██▎       | 22/94 [00:06<00:18,  3.90it/s][A
Training:  26%|██▌       | 24/94 [00:06<00:13,  5.34it/s][A
Training:  27%|██▋       | 25/94 [00:07<00:22,  3.08it/s][A
Training:  29%|██▊       | 27/94 [00:

Epoch: 2/10 - Loss: 3.3779 - Accuracy: 0.9108



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:15,  1.43s/it][A
 25%|██▌       | 3/12 [00:01<00:03,  2.38it/s][A
 42%|████▏     | 5/12 [00:02<00:02,  2.39it/s][A
 58%|█████▊    | 7/12 [00:02<00:01,  3.80it/s][A
 75%|███████▌  | 9/12 [00:03<00:01,  2.97it/s][A
100%|██████████| 12/12 [00:03<00:00,  3.28it/s][A
Epochs:  10%|█         | 1/10 [00:53<07:59, 53.25s/it]
[32m[I 2023-12-15 00:56:55,419][0m Trial 15 pruned. [0m


Val Loss: 2.7906 - Val Accuracy: 0.9127
Learning rate for Loss: 0.0016277456678043456
Learning rate: 0.00013167619130430164
Weight decay: 0.00828228000323938
Epsilon: 9.138950918927498e-09
Batch size: 296
Number of epochs: 85


Epochs:   0%|          | 0/85 [00:00<?, ?it/s]
Training:   0%|          | 0/48 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/48 [00:02<01:48,  2.31s/it][A
Training:   6%|▋         | 3/48 [00:02<00:29,  1.52it/s][A
Training:   8%|▊         | 4/48 [00:02<00:20,  2.14it/s][A
Training:  10%|█         | 5/48 [00:04<00:39,  1.09it/s][A
Training:  15%|█▍        | 7/48 [00:04<00:21,  1.92it/s][A
Training:  17%|█▋        | 8/48 [00:04<00:17,  2.34it/s][A
Training:  19%|█▉        | 9/48 [00:06<00:27,  1.42it/s][A
Training:  21%|██        | 10/48 [00:06<00:20,  1.82it/s][A
Training:  23%|██▎       | 11/48 [00:06<00:17,  2.16it/s][A
Training:  27%|██▋       | 13/48 [00:08<00:20,  1.72it/s][A
Training:  29%|██▉       | 14/48 [00:08<00:17,  1.98it/s][A
Training:  31%|███▏      | 15/48 [00:08<00:15,  2.16it/s][A
Training:  35%|███▌      | 17/48 [00:10<00:17,  1.80it/s][A
Training:  38%|███▊      | 18/48 [00:10<00:14,  2.03it/s][A
Training:  40%|███▉      | 19/48 [00:10<00:11,  2.42it

Epoch: 1/85 - Loss: 20.3975 - Accuracy: 0.5273



  0%|          | 0/6 [00:00<?, ?it/s][A
 17%|█▋        | 1/6 [00:02<00:11,  2.38s/it][A
 67%|██████▋   | 4/6 [00:02<00:00,  2.08it/s][A
100%|██████████| 6/6 [00:04<00:00,  1.40it/s][A
Epochs:   0%|          | 0/85 [00:27<?, ?it/s]
[32m[I 2023-12-15 00:57:24,013][0m Trial 16 pruned. [0m


Val Loss: 13.6912 - Val Accuracy: 0.7121
Learning rate for Loss: 0.004613233401394835
Learning rate: 0.0010553647684039844
Weight decay: 0.0003623515715932159
Epsilon: 9.453943163239698e-09
Batch size: 203
Number of epochs: 60


Epochs:   0%|          | 0/60 [00:00<?, ?it/s]
Training:   0%|          | 0/69 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/69 [00:01<02:07,  1.88s/it][A
Training:   4%|▍         | 3/69 [00:02<00:36,  1.83it/s][A
Training:   7%|▋         | 5/69 [00:03<00:36,  1.74it/s][A
Training:  10%|█         | 7/69 [00:03<00:22,  2.71it/s][A
Training:  13%|█▎        | 9/69 [00:04<00:29,  2.06it/s][A
Training:  16%|█▌        | 11/69 [00:04<00:20,  2.89it/s][A
Training:  19%|█▉        | 13/69 [00:06<00:23,  2.43it/s][A
Training:  23%|██▎       | 16/69 [00:06<00:13,  3.89it/s][A
Training:  26%|██▌       | 18/69 [00:07<00:19,  2.63it/s][A
Training:  29%|██▉       | 20/69 [00:07<00:14,  3.44it/s][A
Training:  30%|███       | 21/69 [00:08<00:19,  2.52it/s][A
Training:  32%|███▏      | 22/69 [00:08<00:17,  2.73it/s][A
Training:  36%|███▌      | 25/69 [00:09<00:15,  2.76it/s][A
Training:  38%|███▊      | 26/69 [00:10<00:14,  2.90it/s][A
Training:  41%|████      | 28/69 [00:10<00:10,  4.01

Epoch: 1/60 - Loss: 9.7761 - Accuracy: 0.8096



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:01<00:14,  1.76s/it][A
 33%|███▎      | 3/9 [00:01<00:03,  1.97it/s][A
 56%|█████▌    | 5/9 [00:03<00:02,  1.68it/s][A
 78%|███████▊  | 7/9 [00:03<00:00,  2.68it/s][A
100%|██████████| 9/9 [00:04<00:00,  2.24it/s][A
Epochs:   2%|▏         | 1/60 [00:27<27:06, 27.57s/it]

Val Loss: 4.1073 - Val Accuracy: 0.9053



Training:   0%|          | 0/69 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/69 [00:01<01:48,  1.59s/it][A
Training:   3%|▎         | 2/69 [00:01<00:49,  1.36it/s][A
Training:   4%|▍         | 3/69 [00:01<00:29,  2.23it/s][A
Training:   7%|▋         | 5/69 [00:03<00:35,  1.82it/s][A
Training:  10%|█         | 7/69 [00:03<00:20,  3.06it/s][A
Training:  13%|█▎        | 9/69 [00:04<00:28,  2.12it/s][A
Training:  16%|█▌        | 11/69 [00:04<00:19,  3.04it/s][A
Training:  17%|█▋        | 12/69 [00:04<00:16,  3.53it/s][A
Training:  19%|█▉        | 13/69 [00:05<00:22,  2.45it/s][A
Training:  22%|██▏       | 15/69 [00:05<00:14,  3.61it/s][A
Training:  25%|██▍       | 17/69 [00:06<00:19,  2.61it/s][A
Training:  26%|██▌       | 18/69 [00:07<00:16,  3.06it/s][A
Training:  30%|███       | 21/69 [00:08<00:16,  2.97it/s][A
Training:  33%|███▎      | 23/69 [00:08<00:12,  3.82it/s][A
Training:  36%|███▌      | 25/69 [00:09<00:13,  3.20it/s][A
Training:  42%|████▏     | 29/69 [00:1

Epoch: 2/60 - Loss: 3.9063 - Accuracy: 0.9093



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:01<00:13,  1.74s/it][A
 33%|███▎      | 3/9 [00:01<00:03,  1.96it/s][A
 56%|█████▌    | 5/9 [00:02<00:02,  1.94it/s][A
 67%|██████▋   | 6/9 [00:03<00:01,  2.37it/s][A
 78%|███████▊  | 7/9 [00:03<00:00,  2.84it/s][A
100%|██████████| 9/9 [00:03<00:00,  2.33it/s][A
Epochs:   2%|▏         | 1/60 [00:54<53:35, 54.49s/it]
[32m[I 2023-12-15 00:58:19,179][0m Trial 17 pruned. [0m


Val Loss: 4.1332 - Val Accuracy: 0.9120
Learning rate for Loss: 0.0013889548548342947
Learning rate: 0.015408694911041685
Weight decay: 0.003615493045718425
Epsilon: 2.068481048838303e-08
Batch size: 107
Number of epochs: 44


Epochs:   0%|          | 0/44 [00:00<?, ?it/s]
Training:   0%|          | 0/131 [00:00<?, ?it/s][A
Training:   1%|          | 1/131 [00:01<02:15,  1.04s/it][A
Training:   2%|▏         | 2/131 [00:01<01:04,  2.00it/s][A
Training:   2%|▏         | 3/131 [00:01<00:40,  3.14it/s][A
Training:   4%|▍         | 5/131 [00:01<00:37,  3.36it/s][A
Training:   5%|▌         | 7/131 [00:01<00:24,  5.15it/s][A
Training:   7%|▋         | 9/131 [00:02<00:27,  4.44it/s][A
Training:   8%|▊         | 11/131 [00:02<00:19,  6.01it/s][A
Training:  10%|▉         | 13/131 [00:03<00:24,  4.76it/s][A
Training:  12%|█▏        | 16/131 [00:03<00:15,  7.34it/s][A
Training:  14%|█▎        | 18/131 [00:04<00:22,  5.01it/s][A
Training:  16%|█▌        | 21/131 [00:04<00:22,  5.00it/s][A
Training:  17%|█▋        | 22/131 [00:04<00:20,  5.41it/s][A
Training:  19%|█▉        | 25/131 [00:05<00:20,  5.05it/s][A
Training:  21%|██        | 27/131 [00:05<00:16,  6.24it/s][A
Training:  22%|██▏       | 29/131 [00:

Epoch: 1/44 - Loss: 6.7892 - Accuracy: 0.8487



  0%|          | 0/17 [00:00<?, ?it/s][A
  6%|▌         | 1/17 [00:00<00:14,  1.10it/s][A
 12%|█▏        | 2/17 [00:01<00:06,  2.19it/s][A
 18%|█▊        | 3/17 [00:01<00:04,  3.10it/s][A
 29%|██▉       | 5/17 [00:01<00:02,  4.33it/s][A
 35%|███▌      | 6/17 [00:01<00:02,  4.78it/s][A
 41%|████      | 7/17 [00:01<00:02,  4.65it/s][A
 53%|█████▎    | 9/17 [00:02<00:01,  5.41it/s][A
 59%|█████▉    | 10/17 [00:02<00:01,  5.37it/s][A
 65%|██████▍   | 11/17 [00:02<00:01,  5.25it/s][A
 76%|███████▋  | 13/17 [00:02<00:00,  5.48it/s][A
100%|██████████| 17/17 [00:03<00:00,  4.96it/s][A
Epochs:   2%|▏         | 1/44 [00:26<19:07, 26.67s/it]

Val Loss: 3.1922 - Val Accuracy: 0.9097



Training:   0%|          | 0/131 [00:00<?, ?it/s][A
Training:   1%|          | 1/131 [00:01<02:20,  1.08s/it][A
Training:   3%|▎         | 4/131 [00:01<00:33,  3.85it/s][A
Training:   4%|▍         | 5/131 [00:01<00:38,  3.29it/s][A
Training:   5%|▌         | 7/131 [00:01<00:24,  5.03it/s][A
Training:   6%|▌         | 8/131 [00:02<00:24,  4.94it/s][A
Training:   7%|▋         | 9/131 [00:02<00:30,  4.01it/s][A
Training:   8%|▊         | 10/131 [00:02<00:26,  4.60it/s][A
Training:   9%|▉         | 12/131 [00:02<00:19,  6.12it/s][A
Training:  10%|▉         | 13/131 [00:03<00:26,  4.45it/s][A
Training:  11%|█         | 14/131 [00:03<00:23,  4.92it/s][A
Training:  12%|█▏        | 16/131 [00:03<00:17,  6.50it/s][A
Training:  13%|█▎        | 17/131 [00:03<00:23,  4.77it/s][A
Training:  14%|█▎        | 18/131 [00:04<00:21,  5.31it/s][A
Training:  15%|█▌        | 20/131 [00:04<00:19,  5.81it/s][A
Training:  16%|█▌        | 21/131 [00:04<00:19,  5.59it/s][A
Training:  17%|█▋     

Epoch: 2/44 - Loss: 2.8250 - Accuracy: 0.9144



  0%|          | 0/17 [00:00<?, ?it/s][A
  6%|▌         | 1/17 [00:01<00:17,  1.09s/it][A
 12%|█▏        | 2/17 [00:01<00:08,  1.84it/s][A
 29%|██▉       | 5/17 [00:01<00:03,  3.68it/s][A
 35%|███▌      | 6/17 [00:01<00:02,  3.90it/s][A
 53%|█████▎    | 9/17 [00:02<00:01,  4.63it/s][A
 59%|█████▉    | 10/17 [00:02<00:01,  4.70it/s][A
 65%|██████▍   | 11/17 [00:02<00:01,  5.32it/s][A
 76%|███████▋  | 13/17 [00:03<00:00,  4.72it/s][A
100%|██████████| 17/17 [00:03<00:00,  4.60it/s][A
Epochs:   5%|▍         | 2/44 [00:54<18:58, 27.10s/it]

Val Loss: 2.4133 - Val Accuracy: 0.9316



Training:   0%|          | 0/131 [00:00<?, ?it/s][A
Training:   1%|          | 1/131 [00:01<02:11,  1.01s/it][A
Training:   2%|▏         | 2/131 [00:01<01:02,  2.06it/s][A
Training:   4%|▍         | 5/131 [00:01<00:34,  3.70it/s][A
Training:   5%|▍         | 6/131 [00:01<00:28,  4.33it/s][A
Training:   6%|▌         | 8/131 [00:01<00:19,  6.41it/s][A
Training:   8%|▊         | 10/131 [00:02<00:25,  4.66it/s][A
Training:  10%|▉         | 13/131 [00:03<00:25,  4.59it/s][A
Training:  11%|█▏        | 15/131 [00:03<00:20,  5.73it/s][A
Training:  13%|█▎        | 17/131 [00:03<00:23,  4.75it/s][A
Training:  15%|█▍        | 19/131 [00:04<00:18,  6.07it/s][A
Training:  16%|█▌        | 21/131 [00:04<00:22,  4.84it/s][A
Training:  18%|█▊        | 24/131 [00:04<00:15,  7.05it/s][A
Training:  20%|█▉        | 26/131 [00:05<00:19,  5.43it/s][A
Training:  21%|██▏       | 28/131 [00:05<00:16,  6.34it/s][A
Training:  23%|██▎       | 30/131 [00:06<00:17,  5.65it/s][A
Training:  25%|██▌   

Epoch: 3/44 - Loss: 2.7487 - Accuracy: 0.9227



  0%|          | 0/17 [00:00<?, ?it/s][A
  6%|▌         | 1/17 [00:00<00:15,  1.02it/s][A
 18%|█▊        | 3/17 [00:01<00:04,  3.30it/s][A
 29%|██▉       | 5/17 [00:01<00:03,  3.67it/s][A
 47%|████▋     | 8/17 [00:01<00:01,  6.55it/s][A
 59%|█████▉    | 10/17 [00:02<00:01,  5.30it/s][A
 76%|███████▋  | 13/17 [00:02<00:00,  5.11it/s][A
100%|██████████| 17/17 [00:03<00:00,  5.44it/s][A
Epochs:   7%|▋         | 3/44 [01:20<18:13, 26.67s/it]

Val Loss: 2.8867 - Val Accuracy: 0.8884



Training:   0%|          | 0/131 [00:00<?, ?it/s][A
Training:   1%|          | 1/131 [00:01<02:27,  1.14s/it][A
Training:   3%|▎         | 4/131 [00:01<00:32,  3.92it/s][A
Training:   5%|▍         | 6/131 [00:02<00:37,  3.31it/s][A
Training:   6%|▌         | 8/131 [00:02<00:26,  4.72it/s][A
Training:   8%|▊         | 10/131 [00:02<00:30,  3.94it/s][A
Training:   9%|▉         | 12/131 [00:02<00:22,  5.37it/s][A
Training:  11%|█         | 14/131 [00:03<00:25,  4.56it/s][A
Training:  13%|█▎        | 17/131 [00:04<00:23,  4.92it/s][A
Training:  14%|█▎        | 18/131 [00:04<00:21,  5.30it/s][A
Training:  16%|█▌        | 21/131 [00:04<00:21,  5.07it/s][A
Training:  17%|█▋        | 22/131 [00:04<00:20,  5.25it/s][A
Training:  18%|█▊        | 24/131 [00:05<00:15,  6.81it/s][A
Training:  20%|█▉        | 26/131 [00:05<00:20,  5.04it/s][A
Training:  21%|██▏       | 28/131 [00:05<00:15,  6.44it/s][A
Training:  23%|██▎       | 30/131 [00:06<00:19,  5.26it/s][A
Training:  24%|██▍  

Epoch: 4/44 - Loss: 2.7715 - Accuracy: 0.9277



  0%|          | 0/17 [00:00<?, ?it/s][A
  6%|▌         | 1/17 [00:00<00:15,  1.04it/s][A
 18%|█▊        | 3/17 [00:01<00:04,  3.44it/s][A
 29%|██▉       | 5/17 [00:01<00:03,  3.42it/s][A
 41%|████      | 7/17 [00:01<00:02,  4.76it/s][A
 53%|█████▎    | 9/17 [00:02<00:01,  4.24it/s][A
 71%|███████   | 12/17 [00:02<00:00,  5.52it/s][A
 76%|███████▋  | 13/17 [00:03<00:00,  4.80it/s][A
 82%|████████▏ | 14/17 [00:03<00:00,  5.00it/s][A
100%|██████████| 17/17 [00:03<00:00,  4.73it/s][A
Epochs:   9%|▉         | 4/44 [01:47<17:49, 26.74s/it]

Val Loss: 3.5304 - Val Accuracy: 0.7748



Training:   0%|          | 0/131 [00:00<?, ?it/s][A
Training:   1%|          | 1/131 [00:01<02:28,  1.14s/it][A
Training:   2%|▏         | 3/131 [00:01<00:43,  2.96it/s][A
Training:   4%|▍         | 5/131 [00:01<00:36,  3.43it/s][A
Training:   5%|▍         | 6/131 [00:02<00:35,  3.51it/s][A
Training:   6%|▌         | 8/131 [00:02<00:23,  5.23it/s][A
Training:   7%|▋         | 9/131 [00:02<00:26,  4.68it/s][A
Training:   8%|▊         | 10/131 [00:02<00:27,  4.43it/s][A
Training:  10%|▉         | 13/131 [00:03<00:20,  5.66it/s][A
Training:  11%|█         | 14/131 [00:03<00:23,  5.04it/s][A
Training:  13%|█▎        | 17/131 [00:03<00:19,  5.97it/s][A
Training:  14%|█▎        | 18/131 [00:04<00:22,  5.04it/s][A
Training:  16%|█▌        | 21/131 [00:04<00:19,  5.64it/s][A
Training:  17%|█▋        | 22/131 [00:04<00:21,  5.15it/s][A
Training:  18%|█▊        | 24/131 [00:04<00:16,  6.49it/s][A
Training:  19%|█▉        | 25/131 [00:05<00:17,  6.18it/s][A
Training:  20%|█▉     

Epoch: 5/44 - Loss: 2.7988 - Accuracy: 0.9181



  0%|          | 0/17 [00:00<?, ?it/s][A
  6%|▌         | 1/17 [00:01<00:19,  1.21s/it][A
 24%|██▎       | 4/17 [00:01<00:03,  3.76it/s][A
 35%|███▌      | 6/17 [00:01<00:03,  3.48it/s][A
 53%|█████▎    | 9/17 [00:02<00:01,  4.11it/s][A
 71%|███████   | 12/17 [00:02<00:00,  6.29it/s][A
 82%|████████▏ | 14/17 [00:03<00:00,  4.87it/s][A
100%|██████████| 17/17 [00:03<00:00,  4.78it/s][A
Epochs:  11%|█▏        | 5/44 [02:14<17:28, 26.89s/it]

Val Loss: 2.4871 - Val Accuracy: 0.9143



Training:   0%|          | 0/131 [00:00<?, ?it/s][A
Training:   1%|          | 1/131 [00:01<02:11,  1.01s/it][A
Training:   2%|▏         | 2/131 [00:01<01:01,  2.09it/s][A
Training:   3%|▎         | 4/131 [00:01<00:28,  4.52it/s][A
Training:   5%|▍         | 6/131 [00:01<00:28,  4.34it/s][A
Training:   6%|▌         | 8/131 [00:01<00:20,  6.14it/s][A
Training:   8%|▊         | 10/131 [00:02<00:26,  4.57it/s][A
Training:   9%|▉         | 12/131 [00:02<00:19,  6.02it/s][A
Training:  11%|█         | 14/131 [00:03<00:25,  4.55it/s][A
Training:  12%|█▏        | 16/131 [00:03<00:19,  5.79it/s][A
Training:  13%|█▎        | 17/131 [00:04<00:28,  3.97it/s][A
Training:  16%|█▌        | 21/131 [00:04<00:24,  4.57it/s][A
Training:  18%|█▊        | 24/131 [00:04<00:16,  6.44it/s][A
Training:  20%|█▉        | 26/131 [00:05<00:20,  5.22it/s][A
Training:  22%|██▏       | 29/131 [00:06<00:20,  4.97it/s][A
Training:  25%|██▌       | 33/131 [00:06<00:18,  5.19it/s][A
Training:  27%|██▋   

Epoch: 6/44 - Loss: 4.0018 - Accuracy: 0.8998



  0%|          | 0/17 [00:00<?, ?it/s][A
  6%|▌         | 1/17 [00:01<00:18,  1.17s/it][A
 18%|█▊        | 3/17 [00:01<00:04,  2.92it/s][A
 29%|██▉       | 5/17 [00:02<00:04,  2.83it/s][A
 53%|█████▎    | 9/17 [00:02<00:01,  4.07it/s][A
 65%|██████▍   | 11/17 [00:02<00:01,  5.22it/s][A
 76%|███████▋  | 13/17 [00:03<00:00,  4.79it/s][A
100%|██████████| 17/17 [00:03<00:00,  4.67it/s][A
Epochs:  11%|█▏        | 5/44 [02:41<21:00, 32.33s/it]
[32m[I 2023-12-15 01:01:01,409][0m Trial 18 pruned. [0m


Val Loss: 4.3157 - Val Accuracy: 0.9085
Learning rate for Loss: 0.00035492638456620357
Learning rate: 0.00370949749957313
Weight decay: 0.00011715500420087854
Epsilon: 6.7116543092181055e-09
Batch size: 172
Number of epochs: 55


Epochs:   0%|          | 0/55 [00:00<?, ?it/s]
Training:   0%|          | 0/82 [00:00<?, ?it/s][A
Training:   1%|          | 1/82 [00:01<02:28,  1.84s/it][A
Training:   2%|▏         | 2/82 [00:01<01:06,  1.20it/s][A
Training:   5%|▍         | 4/82 [00:02<00:28,  2.75it/s][A
Training:   6%|▌         | 5/82 [00:02<00:39,  1.95it/s][A
Training:   9%|▊         | 7/82 [00:03<00:22,  3.28it/s][A
Training:  11%|█         | 9/82 [00:04<00:30,  2.40it/s][A
Training:  12%|█▏        | 10/82 [00:04<00:24,  2.88it/s][A
Training:  13%|█▎        | 11/82 [00:04<00:20,  3.47it/s][A
Training:  16%|█▌        | 13/82 [00:05<00:24,  2.83it/s][A
Training:  17%|█▋        | 14/82 [00:05<00:20,  3.30it/s][A
Training:  20%|█▉        | 16/82 [00:05<00:13,  4.73it/s][A
Training:  21%|██        | 17/82 [00:06<00:20,  3.21it/s][A
Training:  23%|██▎       | 19/82 [00:06<00:14,  4.40it/s][A
Training:  26%|██▌       | 21/82 [00:07<00:16,  3.67it/s][A
Training:  28%|██▊       | 23/82 [00:07<00:12,  4.89i

Epoch: 1/55 - Loss: 7.8784 - Accuracy: 0.8116



  0%|          | 0/11 [00:00<?, ?it/s][A
  9%|▉         | 1/11 [00:01<00:15,  1.51s/it][A
 36%|███▋      | 4/11 [00:01<00:02,  3.16it/s][A
 55%|█████▍    | 6/11 [00:02<00:01,  2.86it/s][A
 64%|██████▎   | 7/11 [00:02<00:01,  3.36it/s][A
 82%|████████▏ | 9/11 [00:03<00:00,  3.00it/s][A
100%|██████████| 11/11 [00:03<00:00,  3.08it/s][A
Epochs:   0%|          | 0/55 [00:27<?, ?it/s]
[32m[I 2023-12-15 01:01:29,910][0m Trial 19 pruned. [0m


Val Loss: 9.4273 - Val Accuracy: 0.7822

Study statistics: 
  Number of finished trials:  20
  Number of pruned trials:  13
  Number of complete trials:  7


In [20]:
print("Best trial:")
trial = study.best_trial

print("  Value: ", trial.value)

print("  Params: ")
for key, value in trial.params.items():
    print("    {}: {}".format(key, value))

Best trial:
  Value:  0.9413145780563354
  Params: 
    batch_size: 237
    epochs: 37
    epsilon: 3.3362510582155838e-09
    learning_rate: 0.0006513527804929251
    loss_learning_rate: 0.0008525339180252597
    weight_decay: 0.0038208248001045425


In [None]:
# ViT P12-S8 ArcFace Mean

Best trial:
Value:  0.9413145780563354
Params: 
batch_size: 237
epochs: 37
epsilon: 3.3362510582155838e-09
learning_rate: 0.0006513527804929251
loss_learning_rate: 0.0008525339180252597
weight_decay: 0.0038208248001045425