In [1]:
import os
import random
import pandas as pd
import numpy as np
import mxnet as mx
import torch
import torch.nn as nn
import torch.nn.functional as F
import torch.optim as opt
from torch.utils.data import Dataset, DataLoader
from einops import rearrange, repeat
import optuna
from optuna.trial import TrialState
from tqdm import tqdm

In [2]:
def file_to_embed(embeds, file):
    emb = []
    for f in file:
        emb.append(embeds[f][0])
    return torch.stack(emb)

In [3]:
MIN_NUM_PATCHES = 16

In [4]:
device = torch.device("cuda:3" if torch.cuda.is_available() else "cpu")
device

device(type='cuda', index=3)

In [5]:
class AdienceDataset(Dataset):
    def __init__(self, annot_file, img_dir):
        self.img_lbls = pd.read_csv(annot_file, header=None)
        self.img_dir = img_dir
    
    def __len__(self):
        return len(self.img_lbls)
    
    def __getitem__(self, idx):
        img_file = self.img_lbls.iloc[idx, 0]
        img_path = os.path.join(self.img_dir, img_file)
        image = mx.image.imread(img_path)
        if image.shape[1] != 112:
            image = mx.image.resize_short(image, 112)
        image = mx.nd.transpose(image, axes=(2,0,1))
        image = torch.tensor(image.asnumpy()).type(torch.FloatTensor)
        label = self.img_lbls.iloc[idx, 1]

        return image, label, img_file

In [6]:
train_data = AdienceDataset("../train.csv", "../cropped_Adience/")
val_data = AdienceDataset("../val.csv", "../cropped_Adience/")

In [7]:
class CosFace(nn.Module):
    r"""Implement of CosFace (https://arxiv.org/pdf/1801.09414.pdf):
    Args:
        in_features: size of each input sample
        out_features: size of each output sample
        device_id: the ID of GPU where the model will be trained by model parallel.
                       if device_id=None, it will be trained on CPU without model parallel.
        s: norm of input feature
        m: margin
        cos(theta)-m
    """

    def __init__(self, in_features, out_features, device_id, s=64.0, m=0.35):
        super(CosFace, self).__init__()
        self.in_features = in_features
        self.out_features = out_features
        self.device_id = device_id
        self.s = s
        self.m = m
        print("self.device_id", self.device_id)
        self.weight = nn.Parameter(torch.FloatTensor(out_features, in_features))
        nn.init.xavier_uniform_(self.weight)

    def forward(self, input, label):
        # --------------------------- cos(theta) & phi(theta) ---------------------------

        if self.device_id == None:
            cosine = F.linear(F.normalize(input), F.normalize(self.weight))
        else:
            x = input
            sub_weights = torch.chunk(self.weight, len(self.device_id), dim=0)
            temp_x = x.cuda(self.device_id[0])
            weight = sub_weights[0].cuda(self.device_id[0])
            cosine = F.linear(F.normalize(temp_x), F.normalize(weight))
            for i in range(1, len(self.device_id)):
                temp_x = x.cuda(self.device_id[i])
                weight = sub_weights[i].cuda(self.device_id[i])
                cosine = torch.cat((cosine, F.linear(F.normalize(temp_x), F.normalize(weight)).cuda(self.device_id[0])),
                                   dim=1)
        phi = cosine - self.m
        # --------------------------- convert label to one-hot ---------------------------
        one_hot = torch.zeros(cosine.size())
        if self.device_id != None:
            one_hot = one_hot.cuda(self.device_id[0])
        # one_hot = one_hot.cuda() if cosine.is_cuda else one_hot

        one_hot.scatter_(1, label.view(-1, 1).long(), 1)
        # -------------torch.where(out_i = {x_i if condition_i else y_i) -------------
        output = (one_hot * phi) + (
                    (1.0 - one_hot) * cosine)  # you can use torch.where if your torch.__version__ is 0.4
        output *= self.s

        return output

    def __repr__(self):
        return self.__class__.__name__ + '(' \
               + 'in_features = ' + str(self.in_features) \
               + ', out_features = ' + str(self.out_features) \
               + ', s = ' + str(self.s) \
               + ', m = ' + str(self.m) + ')'

In [8]:
class Residual(nn.Module):
    def __init__(self, fn):
        super().__init__()
        self.fn = fn
    def forward(self, x, **kwargs):
        return self.fn(x, **kwargs) + x

In [9]:
class PreNorm(nn.Module):
    def __init__(self, dim, fn):
        super().__init__()
        self.norm = nn.LayerNorm(dim)
        self.fn = fn
    def forward(self, x, **kwargs):
        return self.fn(self.norm(x), **kwargs)

In [10]:
class FeedForward(nn.Module):
    def __init__(self, dim, hidden_dim, dropout = 0.):
        super().__init__()
        self.net = nn.Sequential(
            nn.Linear(dim, hidden_dim),
            nn.GELU(),
            nn.Dropout(dropout),
            nn.Linear(hidden_dim, dim),
            nn.Dropout(dropout)
        )
    def forward(self, x):
        return self.net(x)

In [11]:
class Attention(nn.Module):
    def __init__(self, dim, heads = 8, dim_head = 64, dropout = 0.):
        super().__init__()
        inner_dim = dim_head *  heads
        self.heads = heads
        self.scale = dim ** -0.5

        self.to_qkv = nn.Linear(dim, inner_dim * 3, bias = False)
        self.to_out = nn.Sequential(
            nn.Linear(inner_dim, dim),
            nn.Dropout(dropout)
        )

    def forward(self, x, mask = None):
        b, n, _, h = *x.shape, self.heads
        qkv = self.to_qkv(x).chunk(3, dim = -1)

        q, k, v = map(lambda t: rearrange(t, 'b n (h d) -> b h n d', h = h), qkv)
        dots = torch.einsum('bhid,bhjd->bhij', q, k) * self.scale
        mask_value = -torch.finfo(dots.dtype).max
        #embed()
        if mask is not None:
            mask = F.pad(mask.flatten(1), (1, 0), value = True)
            assert mask.shape[-1] == dots.shape[-1], 'mask has incorrect dimensions'
            mask = mask[:, None, :] * mask[:, :, None]
            dots.masked_fill_(~mask, mask_value)
            del mask

        attn = dots.softmax(dim=-1)

        out = torch.einsum('bhij,bhjd->bhid', attn, v)
        out = rearrange(out, 'b h n d -> b n (h d)')
        out =  self.to_out(out)

        return out

In [12]:
class Transformer(nn.Module):
    def __init__(self, dim, depth, heads, dim_head, mlp_dim, dropout):
        super().__init__()
        self.layers = nn.ModuleList([])
        for _ in range(depth):
            self.layers.append(nn.ModuleList([
                Residual(PreNorm(dim, Attention(dim, heads = heads, dim_head = dim_head, dropout = dropout))),
                Residual(PreNorm(dim, FeedForward(dim, mlp_dim, dropout = dropout)))
            ]))
    def forward(self, x, mask = None):
        for attn, ff in self.layers:
            x = attn(x, mask = mask)
            #embed()
            x = ff(x)
        return x

In [13]:
class ViT_face(nn.Module):
    def __init__(self, *, loss_type, GPU_ID, num_class, image_size, patch_size, dim, depth, heads, mlp_dim, pool = 'mean', channels = 3, dim_head = 64, dropout = 0., emb_dropout = 0.):
        super().__init__()
        assert image_size % patch_size == 0, 'Image dimensions must be divisible by the patch size.'
        num_patches = (image_size // patch_size) ** 2
        patch_dim = channels * patch_size ** 2
        assert num_patches > MIN_NUM_PATCHES, f'your number of patches ({num_patches}) is way too small for attention to be effective (at least 16). Try decreasing your patch size'
        assert pool in {'cls', 'mean'}, 'pool type must be either cls (cls token) or mean (mean pooling)'

        self.patch_size = patch_size

        self.pos_embedding = nn.Parameter(torch.randn(1, num_patches + 1, dim))
        self.patch_to_embedding = nn.Linear(patch_dim, dim)
        self.cls_token = nn.Parameter(torch.randn(1, 1, dim))
        self.dropout = nn.Dropout(emb_dropout)

        self.transformer = Transformer(dim, depth, heads, dim_head, mlp_dim, dropout)

        self.pool = pool
        self.to_latent = nn.Identity()

        self.mlp_head = nn.Sequential(
            nn.LayerNorm(dim),
        )
        self.loss_type = loss_type
        self.GPU_ID = GPU_ID
        if self.loss_type == 'None':
            print("no loss for vit_face")
        else:
            if self.loss_type == 'CosFace':
                self.loss = CosFace(in_features=dim, out_features=num_class, device_id=self.GPU_ID)

    def forward(self, img, label=None, mask=None):
        p = self.patch_size
        
        x = rearrange(img, 'b c (h p1) (w p2) -> b (h w) (p1 p2 c)', p1 = p, p2 = p)
        x = self.patch_to_embedding(x)
        b, n, _ = x.shape

        cls_tokens = repeat(self.cls_token, '() n d -> b n d', b = b)
        x = torch.cat((cls_tokens, x), dim=1)
        x += self.pos_embedding[:, :(n + 1)]
        x = self.dropout(x)
        x = self.transformer(x, mask)

        y = x[:, 0]
        # z = x[:, 1:].mean(dim = 1)

        y = self.to_latent(y)
        emb_y = self.mlp_head(y)
        # z = self.to_latent(z)
        # emb_z = self.mlp_head(z)
        # emb = torch.cat((emb_y, emb_z), dim=1)
        emb = emb_y
        if label is not None:
            x = self.loss(emb, label)
            return x, emb
        else:
            return emb

In [18]:
class ViT_plus(nn.Module):
    def __init__(self):
        super(ViT_plus, self).__init__()
        
        self.fc1 = nn.Linear(in_features=512, out_features=512)
        self.fc2 = nn.Linear(in_features=512, out_features=2)
        
    def forward(self, x):
        x = self.fc1(x)
        x_cosface = x
        x_classification = self.fc2(x)
        
        return x_cosface, x_classification

In [15]:
model = ViT_face(
            image_size=112,
            patch_size=8,
            loss_type='CosFace',
            GPU_ID= [device],
            num_class=93431,
            dim=512,
            depth=20,
            heads=8,
            mlp_dim=2048,
            dropout=0.1,
            emb_dropout=0.1
        ).to(device)
model.load_state_dict(
    torch.load("../Backbone_VIT_Epoch_2_Batch_20000_Time_2021-01-12-16-48_checkpoint.pth", map_location=device)
)

self.device_id [device(type='cuda', index=3)]


<All keys matched successfully>

In [16]:
for param in model.parameters():
    param.requires_grad = False

In [19]:
embeds = {}
model.eval()

with torch.no_grad():
    for img, label, file in train_data:
        img = img.to(device)
        embeds[file] = model(torch.unsqueeze(img, 0))

    for img, label, file in val_data:
        img = img.to(device)
        embeds[file] = model(torch.unsqueeze(img, 0))

In [20]:
best_accu = 0.0
def objective(trial):
    model_xtr = ViT_plus().to(device)
    
    lr = trial.suggest_float("learning_rate", 1e-5, 1e-1, log=True)
    wd = trial.suggest_float('weight_decay', 1e-4, 1e-2, log=True)
    eps = trial.suggest_float("epsilon", 1e-9, 1e-7, log=True)
    optimizer = opt.AdamW(model_xtr.parameters(), lr=lr, eps=eps, weight_decay=wd)
    
    criterion = nn.CrossEntropyLoss()
    
    batch_size = trial.suggest_int('batch_size', 50, 300)
    num_epochs = trial.suggest_int('epochs', 10, 100)
    
    print("Learning rate: "+ str(lr))
    print("Weight decay: "+ str(wd))
    print("Epsilon: "+ str(eps))
    print("Batch size: "+ str(batch_size))
    print("Number of epochs: "+ str(num_epochs))
    
    for epoch in tqdm(range(num_epochs), desc="Epochs"):
        train_loader = DataLoader(train_data, batch_size=batch_size, shuffle=True, num_workers=4)
        val_loader = DataLoader(val_data, batch_size=batch_size, shuffle=False, num_workers=4)
        
        # training loop
        running_loss = []
        running_accu = []
        
        model_xtr.train()
        for img, label, file in tqdm(train_loader, desc="Training", leave=False):
            img, label = img.to(device), label.to(device)

            x = file_to_embed(embeds, file)
            
            optimizer.zero_grad()
            _, output = model_xtr(x)
            
            pred = torch.argmax(output, 1)
            accuracy = torch.eq(pred, label).sum() / len(img)

            loss = criterion(output, label)
            loss.backward()
            optimizer.step()

            running_accu.append(accuracy.cpu().detach().numpy())
            running_loss.append(loss.cpu().detach().numpy())
        print("Epoch: {}/{} - Loss: {:.4f} - Accuracy: {:.4f}".format(epoch+1, num_epochs, np.mean(running_loss), np.mean(running_accu)))
        
        # validation loop
        val_loss = []
        val_accu = []

        model_xtr.eval()
        with torch.no_grad():
            for img, label, file in tqdm(val_loader):
                img, label = img.to(device), label.to(device)
                
                x = file_to_embed(embeds, file)
                
                _, output = model_xtr(x)
                
                pred = torch.argmax(output, 1)
                accuracy = torch.eq(pred, label).sum() / len(img)
                
                loss = criterion(output, label)
                
                val_accu.append(accuracy.cpu().detach().numpy())
                val_loss.append(loss.cpu().detach().numpy())
        val_accu = np.mean(val_accu)
        val_loss = np.mean(val_loss)
        print("Val Loss: {:.4f} - Val Accuracy: {:.4f}".format(val_loss, val_accu))
        
        trial.report(val_accu, epoch)
        if trial.should_prune():
            raise optuna.exceptions.TrialPruned()
    
    global best_accu
    if val_accu > best_accu:
        best_accu = val_accu
        print("Saving best model...")
        torch.save(model_xtr.state_dict(), "../vit_8-8_cls.pt")
            
    return val_accu

In [21]:
study = optuna.create_study(direction='maximize',
                            study_name='vit-8-8-cls-study',
                            storage='sqlite:///study9.db',
                            load_if_exists=True)
study.optimize(objective, n_trials=10)

pruned_trials = study.get_trials(deepcopy=False, states=[TrialState.PRUNED])
complete_trials = study.get_trials(deepcopy=False, states=[TrialState.COMPLETE])

# Display the study statistics
print("\nStudy statistics: ")
print("  Number of finished trials: ", len(study.trials))
print("  Number of pruned trials: ", len(pruned_trials))
print("  Number of complete trials: ", len(complete_trials))

[32m[I 2023-12-11 23:09:36,444][0m A new study created in RDB with name: vit-8-8-cls-study[0m


Learning rate: 0.000287881984666585
Weight decay: 0.009570542308397574
Epsilon: 5.706295335047529e-08
Batch size: 268
Number of epochs: 95


Epochs:   0%|          | 0/95 [00:00<?, ?it/s]
Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:01<01:25,  1.65s/it][A
Training:   9%|▉         | 5/53 [00:02<00:24,  1.95it/s][A
Training:  11%|█▏        | 6/53 [00:03<00:19,  2.37it/s][A
Training:  15%|█▌        | 8/53 [00:03<00:12,  3.63it/s][A
Training:  19%|█▉        | 10/53 [00:04<00:17,  2.52it/s][A
Training:  23%|██▎       | 12/53 [00:04<00:11,  3.56it/s][A
Training:  26%|██▋       | 14/53 [00:05<00:14,  2.69it/s][A
Training:  32%|███▏      | 17/53 [00:06<00:12,  2.83it/s][A
Training:  34%|███▍      | 18/53 [00:06<00:11,  3.00it/s][A
Training:  38%|███▊      | 20/53 [00:06<00:08,  3.99it/s][A
Training:  40%|███▉      | 21/53 [00:07<00:11,  2.77it/s][A
Training:  42%|████▏     | 22/53 [00:08<00:10,  2.99it/s][A
Training:  43%|████▎     | 23/53 [00:08<00:08,  3.53it/s][A
Training:  45%|████▌     | 24/53 [00:08<00:06,  4.19it/s][A
Training:  47%|████▋     | 25/53 [00:09<00:10,  2.6

Epoch: 1/95 - Loss: 0.3468 - Accuracy: 0.8581



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:09,  1.51s/it][A
 57%|█████▋    | 4/7 [00:01<00:00,  3.19it/s][A
100%|██████████| 7/7 [00:02<00:00,  2.40it/s][A
Epochs:   1%|          | 1/95 [00:19<30:44, 19.62s/it]

Val Loss: 0.2321 - Val Accuracy: 0.9054



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:01<01:17,  1.50s/it][A
Training:   6%|▌         | 3/53 [00:01<00:21,  2.29it/s][A
Training:   9%|▉         | 5/53 [00:02<00:24,  1.99it/s][A
Training:  11%|█▏        | 6/53 [00:02<00:19,  2.41it/s][A
Training:  15%|█▌        | 8/53 [00:03<00:12,  3.66it/s][A
Training:  17%|█▋        | 9/53 [00:04<00:19,  2.24it/s][A
Training:  19%|█▉        | 10/53 [00:04<00:15,  2.76it/s][A
Training:  23%|██▎       | 12/53 [00:04<00:10,  4.00it/s][A
Training:  25%|██▍       | 13/53 [00:05<00:16,  2.45it/s][A
Training:  26%|██▋       | 14/53 [00:05<00:14,  2.78it/s][A
Training:  30%|███       | 16/53 [00:05<00:08,  4.14it/s][A
Training:  32%|███▏      | 17/53 [00:06<00:13,  2.66it/s][A
Training:  34%|███▍      | 18/53 [00:06<00:11,  3.04it/s][A
Training:  40%|███▉      | 21/53 [00:07<00:10,  3.15it/s][A
Training:  42%|████▏     | 22/53 [00:07<00:09,  3.21it/s][A
Training:  47%|████▋     | 25/53 [00:0

Epoch: 2/95 - Loss: 0.2136 - Accuracy: 0.9187



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:09,  1.59s/it][A
100%|██████████| 7/7 [00:02<00:00,  2.37it/s][A
Epochs:   2%|▏         | 2/95 [00:39<30:21, 19.58s/it]

Val Loss: 0.2105 - Val Accuracy: 0.9149



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:01<01:25,  1.64s/it][A
Training:   8%|▊         | 4/53 [00:01<00:17,  2.87it/s][A
Training:  11%|█▏        | 6/53 [00:03<00:21,  2.15it/s][A
Training:  15%|█▌        | 8/53 [00:03<00:13,  3.23it/s][A
Training:  19%|█▉        | 10/53 [00:04<00:16,  2.61it/s][A
Training:  23%|██▎       | 12/53 [00:04<00:11,  3.60it/s][A
Training:  26%|██▋       | 14/53 [00:05<00:14,  2.63it/s][A
Training:  32%|███▏      | 17/53 [00:06<00:14,  2.53it/s][A
Training:  38%|███▊      | 20/53 [00:06<00:08,  3.76it/s][A
Training:  42%|████▏     | 22/53 [00:07<00:10,  3.09it/s][A
Training:  47%|████▋     | 25/53 [00:09<00:10,  2.79it/s][A
Training:  55%|█████▍    | 29/53 [00:10<00:08,  3.00it/s][A
Training:  62%|██████▏   | 33/53 [00:11<00:06,  3.10it/s][A
Training:  70%|██████▉   | 37/53 [00:12<00:05,  3.13it/s][A
Training:  77%|███████▋  | 41/53 [00:13<00:03,  3.22it/s][A
Training:  85%|████████▍ | 45/53 [00

Epoch: 3/95 - Loss: 0.1966 - Accuracy: 0.9244



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:09,  1.56s/it][A
 57%|█████▋    | 4/7 [00:01<00:00,  3.10it/s][A
100%|██████████| 7/7 [00:02<00:00,  2.44it/s][A
Epochs:   3%|▎         | 3/95 [00:58<29:54, 19.50s/it]

Val Loss: 0.2057 - Val Accuracy: 0.9134



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:01<01:23,  1.60s/it][A
Training:   8%|▊         | 4/53 [00:01<00:16,  3.01it/s][A
Training:  11%|█▏        | 6/53 [00:02<00:21,  2.15it/s][A
Training:  17%|█▋        | 9/53 [00:04<00:19,  2.31it/s][A
Training:  21%|██        | 11/53 [00:04<00:13,  3.14it/s][A
Training:  25%|██▍       | 13/53 [00:05<00:15,  2.53it/s][A
Training:  28%|██▊       | 15/53 [00:05<00:11,  3.38it/s][A
Training:  32%|███▏      | 17/53 [00:06<00:13,  2.68it/s][A
Training:  38%|███▊      | 20/53 [00:06<00:08,  3.91it/s][A
Training:  40%|███▉      | 21/53 [00:07<00:11,  2.86it/s][A
Training:  42%|████▏     | 22/53 [00:07<00:09,  3.22it/s][A
Training:  45%|████▌     | 24/53 [00:08<00:06,  4.47it/s][A
Training:  47%|████▋     | 25/53 [00:08<00:09,  2.86it/s][A
Training:  49%|████▉     | 26/53 [00:09<00:08,  3.34it/s][A
Training:  55%|█████▍    | 29/53 [00:10<00:07,  3.13it/s][A
Training:  57%|█████▋    | 30/53 [00

Epoch: 4/95 - Loss: 0.1951 - Accuracy: 0.9252



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:08,  1.47s/it][A
 43%|████▎     | 3/7 [00:01<00:01,  2.35it/s][A
100%|██████████| 7/7 [00:02<00:00,  2.59it/s][A
Epochs:   4%|▍         | 4/95 [01:17<29:17, 19.31s/it]

Val Loss: 0.2055 - Val Accuracy: 0.9129



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:01<01:22,  1.58s/it][A
Training:   9%|▉         | 5/53 [00:02<00:24,  1.96it/s][A
Training:  13%|█▎        | 7/53 [00:02<00:15,  2.94it/s][A
Training:  17%|█▋        | 9/53 [00:04<00:17,  2.47it/s][A
Training:  19%|█▉        | 10/53 [00:04<00:15,  2.79it/s][A
Training:  23%|██▎       | 12/53 [00:04<00:10,  4.06it/s][A
Training:  26%|██▋       | 14/53 [00:05<00:14,  2.73it/s][A
Training:  32%|███▏      | 17/53 [00:06<00:13,  2.64it/s][A
Training:  38%|███▊      | 20/53 [00:06<00:08,  3.88it/s][A
Training:  40%|███▉      | 21/53 [00:07<00:12,  2.66it/s][A
Training:  42%|████▏     | 22/53 [00:08<00:10,  3.06it/s][A
Training:  45%|████▌     | 24/53 [00:08<00:06,  4.14it/s][A
Training:  47%|████▋     | 25/53 [00:09<00:10,  2.61it/s][A
Training:  49%|████▉     | 26/53 [00:09<00:08,  3.08it/s][A
Training:  51%|█████     | 27/53 [00:09<00:07,  3.57it/s][A
Training:  55%|█████▍    | 29/53 [00

Epoch: 5/95 - Loss: 0.1911 - Accuracy: 0.9262



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:09,  1.57s/it][A
100%|██████████| 7/7 [00:02<00:00,  2.65it/s][A
Epochs:   5%|▌         | 5/95 [01:36<28:58, 19.32s/it]

Val Loss: 0.2064 - Val Accuracy: 0.9165



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:01<01:19,  1.52s/it][A
Training:   6%|▌         | 3/53 [00:01<00:21,  2.32it/s][A
Training:   9%|▉         | 5/53 [00:02<00:24,  1.94it/s][A
Training:  15%|█▌        | 8/53 [00:02<00:11,  3.79it/s][A
Training:  19%|█▉        | 10/53 [00:04<00:17,  2.53it/s][A
Training:  25%|██▍       | 13/53 [00:05<00:15,  2.51it/s][A
Training:  28%|██▊       | 15/53 [00:05<00:11,  3.33it/s][A
Training:  32%|███▏      | 17/53 [00:06<00:14,  2.57it/s][A
Training:  38%|███▊      | 20/53 [00:06<00:08,  3.88it/s][A
Training:  42%|████▏     | 22/53 [00:08<00:10,  2.88it/s][A
Training:  47%|████▋     | 25/53 [00:09<00:10,  2.70it/s][A
Training:  53%|█████▎    | 28/53 [00:09<00:06,  3.82it/s][A
Training:  57%|█████▋    | 30/53 [00:10<00:07,  3.16it/s][A
Training:  60%|██████    | 32/53 [00:10<00:05,  4.04it/s][A
Training:  64%|██████▍   | 34/53 [00:11<00:05,  3.23it/s][A
Training:  70%|██████▉   | 37/53 [00

Epoch: 6/95 - Loss: 0.1860 - Accuracy: 0.9301



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:08,  1.49s/it][A
100%|██████████| 7/7 [00:02<00:00,  2.57it/s][A
Epochs:   6%|▋         | 6/95 [01:56<28:41, 19.34s/it]

Val Loss: 0.2013 - Val Accuracy: 0.9144



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:01<01:18,  1.51s/it][A
Training:   8%|▊         | 4/53 [00:01<00:16,  2.99it/s][A
Training:  11%|█▏        | 6/53 [00:02<00:21,  2.14it/s][A
Training:  15%|█▌        | 8/53 [00:03<00:14,  3.15it/s][A
Training:  17%|█▋        | 9/53 [00:04<00:20,  2.13it/s][A
Training:  23%|██▎       | 12/53 [00:04<00:11,  3.68it/s][A
Training:  25%|██▍       | 13/53 [00:05<00:17,  2.26it/s][A
Training:  28%|██▊       | 15/53 [00:05<00:11,  3.22it/s][A
Training:  32%|███▏      | 17/53 [00:06<00:13,  2.69it/s][A
Training:  36%|███▌      | 19/53 [00:06<00:09,  3.72it/s][A
Training:  40%|███▉      | 21/53 [00:07<00:11,  2.67it/s][A
Training:  43%|████▎     | 23/53 [00:08<00:08,  3.64it/s][A
Training:  47%|████▋     | 25/53 [00:09<00:09,  2.84it/s][A
Training:  49%|████▉     | 26/53 [00:09<00:08,  3.06it/s][A
Training:  55%|█████▍    | 29/53 [00:10<00:08,  2.92it/s][A
Training:  57%|█████▋    | 30/53 [00:

Epoch: 7/95 - Loss: 0.1855 - Accuracy: 0.9298



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:08,  1.50s/it][A
100%|██████████| 7/7 [00:02<00:00,  2.67it/s][A
Epochs:   7%|▋         | 7/95 [02:15<28:23, 19.35s/it]

Val Loss: 0.2049 - Val Accuracy: 0.9129



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:01<01:21,  1.57s/it][A
Training:   6%|▌         | 3/53 [00:01<00:22,  2.25it/s][A
Training:   9%|▉         | 5/53 [00:02<00:22,  2.09it/s][A
Training:  11%|█▏        | 6/53 [00:02<00:17,  2.62it/s][A
Training:  17%|█▋        | 9/53 [00:04<00:17,  2.57it/s][A
Training:  19%|█▉        | 10/53 [00:04<00:14,  2.91it/s][A
Training:  25%|██▍       | 13/53 [00:05<00:14,  2.73it/s][A
Training:  28%|██▊       | 15/53 [00:05<00:10,  3.67it/s][A
Training:  32%|███▏      | 17/53 [00:06<00:12,  2.77it/s][A
Training:  34%|███▍      | 18/53 [00:06<00:11,  3.16it/s][A
Training:  40%|███▉      | 21/53 [00:07<00:11,  2.86it/s][A
Training:  42%|████▏     | 22/53 [00:08<00:09,  3.16it/s][A
Training:  45%|████▌     | 24/53 [00:08<00:06,  4.27it/s][A
Training:  47%|████▋     | 25/53 [00:09<00:10,  2.59it/s][A
Training:  55%|█████▍    | 29/53 [00:10<00:08,  2.85it/s][A
Training:  60%|██████    | 32/53 [00:

Epoch: 8/95 - Loss: 0.1847 - Accuracy: 0.9292



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:08,  1.50s/it][A
 29%|██▊       | 2/7 [00:01<00:03,  1.39it/s][A
100%|██████████| 7/7 [00:02<00:00,  2.60it/s][A
Epochs:   8%|▊         | 8/95 [02:35<28:08, 19.41s/it]

Val Loss: 0.2050 - Val Accuracy: 0.9139



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:01<01:19,  1.52s/it][A
Training:   6%|▌         | 3/53 [00:01<00:22,  2.24it/s][A
Training:   9%|▉         | 5/53 [00:02<00:23,  2.08it/s][A
Training:  15%|█▌        | 8/53 [00:02<00:11,  3.79it/s][A
Training:  17%|█▋        | 9/53 [00:03<00:18,  2.44it/s][A
Training:  23%|██▎       | 12/53 [00:04<00:10,  3.73it/s][A
Training:  25%|██▍       | 13/53 [00:05<00:15,  2.60it/s][A
Training:  28%|██▊       | 15/53 [00:05<00:10,  3.63it/s][A
Training:  30%|███       | 16/53 [00:05<00:10,  3.53it/s][A
Training:  32%|███▏      | 17/53 [00:06<00:14,  2.53it/s][A
Training:  38%|███▊      | 20/53 [00:06<00:09,  3.63it/s][A
Training:  40%|███▉      | 21/53 [00:07<00:12,  2.65it/s][A
Training:  43%|████▎     | 23/53 [00:07<00:08,  3.75it/s][A
Training:  45%|████▌     | 24/53 [00:08<00:08,  3.38it/s][A
Training:  47%|████▋     | 25/53 [00:08<00:10,  2.56it/s][A
Training:  53%|█████▎    | 28/53 [00:

Epoch: 9/95 - Loss: 0.1854 - Accuracy: 0.9294



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:09,  1.57s/it][A
 57%|█████▋    | 4/7 [00:01<00:01,  2.85it/s][A
100%|██████████| 7/7 [00:02<00:00,  2.41it/s][A
Epochs:   9%|▉         | 9/95 [02:54<27:58, 19.52s/it]

Val Loss: 0.2040 - Val Accuracy: 0.9166



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:01<01:18,  1.51s/it][A
Training:   6%|▌         | 3/53 [00:01<00:21,  2.28it/s][A
Training:   9%|▉         | 5/53 [00:02<00:24,  1.98it/s][A
Training:  15%|█▌        | 8/53 [00:02<00:11,  3.77it/s][A
Training:  19%|█▉        | 10/53 [00:03<00:15,  2.83it/s][A
Training:  25%|██▍       | 13/53 [00:05<00:14,  2.79it/s][A
Training:  30%|███       | 16/53 [00:05<00:09,  4.02it/s][A
Training:  32%|███▏      | 17/53 [00:06<00:13,  2.65it/s][A
Training:  36%|███▌      | 19/53 [00:06<00:09,  3.57it/s][A
Training:  40%|███▉      | 21/53 [00:07<00:11,  2.68it/s][A
Training:  45%|████▌     | 24/53 [00:08<00:07,  3.64it/s][A
Training:  47%|████▋     | 25/53 [00:08<00:10,  2.60it/s][A
Training:  53%|█████▎    | 28/53 [00:09<00:07,  3.44it/s][A
Training:  55%|█████▍    | 29/53 [00:10<00:09,  2.61it/s][A
Training:  60%|██████    | 32/53 [00:10<00:06,  3.50it/s][A
Training:  62%|██████▏   | 33/53 [00

Epoch: 10/95 - Loss: 0.1853 - Accuracy: 0.9301



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:09,  1.54s/it][A
100%|██████████| 7/7 [00:02<00:00,  2.42it/s][A
Epochs:  11%|█         | 10/95 [03:14<27:43, 19.57s/it]

Val Loss: 0.2061 - Val Accuracy: 0.9139



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:01<01:13,  1.41s/it][A
Training:   4%|▍         | 2/53 [00:01<00:33,  1.54it/s][A
Training:   6%|▌         | 3/53 [00:01<00:20,  2.42it/s][A
Training:   9%|▉         | 5/53 [00:02<00:22,  2.10it/s][A
Training:  11%|█▏        | 6/53 [00:02<00:18,  2.61it/s][A
Training:  15%|█▌        | 8/53 [00:03<00:11,  4.01it/s][A
Training:  17%|█▋        | 9/53 [00:03<00:17,  2.53it/s][A
Training:  19%|█▉        | 10/53 [00:03<00:13,  3.10it/s][A
Training:  25%|██▍       | 13/53 [00:05<00:13,  2.95it/s][A
Training:  26%|██▋       | 14/53 [00:05<00:11,  3.29it/s][A
Training:  30%|███       | 16/53 [00:05<00:08,  4.60it/s][A
Training:  32%|███▏      | 17/53 [00:06<00:13,  2.64it/s][A
Training:  34%|███▍      | 18/53 [00:06<00:12,  2.91it/s][A
Training:  40%|███▉      | 21/53 [00:07<00:11,  2.82it/s][A
Training:  42%|████▏     | 22/53 [00:07<00:09,  3.10it/s][A
Training:  45%|████▌     | 24/53 [00:07

Epoch: 11/95 - Loss: 0.1841 - Accuracy: 0.9308



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:08,  1.47s/it][A
 43%|████▎     | 3/7 [00:01<00:01,  2.30it/s][A
100%|██████████| 7/7 [00:02<00:00,  2.54it/s][A
Epochs:  12%|█▏        | 11/95 [03:34<27:22, 19.56s/it]

Val Loss: 0.2098 - Val Accuracy: 0.9144



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:01<01:16,  1.48s/it][A
Training:   9%|▉         | 5/53 [00:02<00:23,  2.08it/s][A
Training:  13%|█▎        | 7/53 [00:02<00:14,  3.13it/s][A
Training:  17%|█▋        | 9/53 [00:04<00:18,  2.36it/s][A
Training:  25%|██▍       | 13/53 [00:05<00:14,  2.82it/s][A
Training:  32%|███▏      | 17/53 [00:06<00:12,  2.98it/s][A
Training:  38%|███▊      | 20/53 [00:06<00:07,  4.13it/s][A
Training:  42%|████▏     | 22/53 [00:07<00:10,  3.08it/s][A
Training:  47%|████▋     | 25/53 [00:09<00:09,  2.81it/s][A
Training:  55%|█████▍    | 29/53 [00:10<00:08,  2.94it/s][A
Training:  62%|██████▏   | 33/53 [00:11<00:06,  3.06it/s][A
Training:  66%|██████▌   | 35/53 [00:11<00:04,  3.64it/s][A
Training:  70%|██████▉   | 37/53 [00:12<00:05,  3.00it/s][A
Training:  74%|███████▎  | 39/53 [00:12<00:03,  3.68it/s][A
Training:  77%|███████▋  | 41/53 [00:13<00:04,  2.96it/s][A
Training:  83%|████████▎ | 44/53 [00

Epoch: 12/95 - Loss: 0.1825 - Accuracy: 0.9316



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:08,  1.45s/it][A
 57%|█████▋    | 4/7 [00:01<00:00,  3.20it/s][A
100%|██████████| 7/7 [00:02<00:00,  2.60it/s][A
Epochs:  13%|█▎        | 12/95 [03:53<26:55, 19.46s/it]

Val Loss: 0.2055 - Val Accuracy: 0.9128



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:01<01:28,  1.70s/it][A
Training:   6%|▌         | 3/53 [00:01<00:24,  2.04it/s][A
Training:   9%|▉         | 5/53 [00:02<00:24,  1.92it/s][A
Training:  17%|█▋        | 9/53 [00:04<00:17,  2.58it/s][A
Training:  21%|██        | 11/53 [00:04<00:12,  3.46it/s][A
Training:  25%|██▍       | 13/53 [00:05<00:14,  2.70it/s][A
Training:  32%|███▏      | 17/53 [00:06<00:11,  3.03it/s][A
Training:  40%|███▉      | 21/53 [00:07<00:10,  3.19it/s][A
Training:  47%|████▋     | 25/53 [00:08<00:08,  3.13it/s][A
Training:  53%|█████▎    | 28/53 [00:09<00:06,  4.15it/s][A
Training:  57%|█████▋    | 30/53 [00:10<00:07,  3.06it/s][A
Training:  62%|██████▏   | 33/53 [00:11<00:06,  3.17it/s][A
Training:  64%|██████▍   | 34/53 [00:11<00:06,  3.11it/s][A
Training:  70%|██████▉   | 37/53 [00:12<00:05,  3.15it/s][A
Training:  72%|███████▏  | 38/53 [00:12<00:05,  2.98it/s][A
Training:  75%|███████▌  | 40/53 [00

Epoch: 13/95 - Loss: 0.1820 - Accuracy: 0.9298



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:09,  1.56s/it][A
100%|██████████| 7/7 [00:02<00:00,  2.61it/s][A
Epochs:  14%|█▎        | 13/95 [04:12<26:36, 19.47s/it]

Val Loss: 0.2052 - Val Accuracy: 0.9134



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:01<01:19,  1.52s/it][A
Training:   4%|▍         | 2/53 [00:01<00:38,  1.31it/s][A
Training:   8%|▊         | 4/53 [00:01<00:15,  3.07it/s][A
Training:   9%|▉         | 5/53 [00:02<00:23,  2.01it/s][A
Training:  11%|█▏        | 6/53 [00:03<00:19,  2.39it/s][A
Training:  15%|█▌        | 8/53 [00:03<00:11,  4.03it/s][A
Training:  17%|█▋        | 9/53 [00:04<00:18,  2.41it/s][A
Training:  19%|█▉        | 10/53 [00:04<00:14,  2.89it/s][A
Training:  25%|██▍       | 13/53 [00:05<00:13,  2.98it/s][A
Training:  26%|██▋       | 14/53 [00:05<00:12,  3.12it/s][A
Training:  30%|███       | 16/53 [00:05<00:08,  4.40it/s][A
Training:  32%|███▏      | 17/53 [00:06<00:13,  2.69it/s][A
Training:  34%|███▍      | 18/53 [00:06<00:11,  3.07it/s][A
Training:  40%|███▉      | 21/53 [00:07<00:10,  3.02it/s][A
Training:  43%|████▎     | 23/53 [00:07<00:07,  4.06it/s][A
Training:  47%|████▋     | 25/53 [00:08

Epoch: 14/95 - Loss: 0.1814 - Accuracy: 0.9320



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:08,  1.47s/it][A
100%|██████████| 7/7 [00:02<00:00,  2.58it/s][A
Epochs:  15%|█▍        | 14/95 [04:32<26:18, 19.49s/it]

Val Loss: 0.2060 - Val Accuracy: 0.9160



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:01<01:20,  1.55s/it][A
Training:   6%|▌         | 3/53 [00:01<00:23,  2.14it/s][A
Training:   9%|▉         | 5/53 [00:02<00:26,  1.82it/s][A
Training:  13%|█▎        | 7/53 [00:03<00:15,  2.90it/s][A
Training:  17%|█▋        | 9/53 [00:04<00:19,  2.28it/s][A
Training:  23%|██▎       | 12/53 [00:04<00:10,  3.82it/s][A
Training:  26%|██▋       | 14/53 [00:05<00:12,  3.09it/s][A
Training:  30%|███       | 16/53 [00:05<00:09,  4.03it/s][A
Training:  34%|███▍      | 18/53 [00:06<00:11,  2.98it/s][A
Training:  38%|███▊      | 20/53 [00:06<00:08,  3.84it/s][A
Training:  40%|███▉      | 21/53 [00:07<00:13,  2.45it/s][A
Training:  45%|████▌     | 24/53 [00:07<00:07,  4.01it/s][A
Training:  49%|████▉     | 26/53 [00:08<00:08,  3.13it/s][A
Training:  55%|█████▍    | 29/53 [00:10<00:08,  2.89it/s][A
Training:  58%|█████▊    | 31/53 [00:10<00:05,  3.71it/s][A
Training:  62%|██████▏   | 33/53 [00:

Epoch: 15/95 - Loss: 0.1825 - Accuracy: 0.9316



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:08,  1.42s/it][A
 43%|████▎     | 3/7 [00:01<00:01,  2.45it/s][A
100%|██████████| 7/7 [00:02<00:00,  2.64it/s][A
Epochs:  16%|█▌        | 15/95 [04:51<25:58, 19.48s/it]

Val Loss: 0.2113 - Val Accuracy: 0.9160



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:01<01:15,  1.45s/it][A
Training:   8%|▊         | 4/53 [00:01<00:15,  3.24it/s][A
Training:  11%|█▏        | 6/53 [00:02<00:19,  2.44it/s][A
Training:  17%|█▋        | 9/53 [00:03<00:17,  2.51it/s][A
Training:  21%|██        | 11/53 [00:03<00:12,  3.40it/s][A
Training:  25%|██▍       | 13/53 [00:05<00:15,  2.65it/s][A
Training:  26%|██▋       | 14/53 [00:05<00:13,  2.90it/s][A
Training:  32%|███▏      | 17/53 [00:06<00:11,  3.03it/s][A
Training:  34%|███▍      | 18/53 [00:06<00:10,  3.38it/s][A
Training:  40%|███▉      | 21/53 [00:07<00:09,  3.36it/s][A
Training:  42%|████▏     | 22/53 [00:07<00:08,  3.58it/s][A
Training:  47%|████▋     | 25/53 [00:08<00:09,  3.04it/s][A
Training:  49%|████▉     | 26/53 [00:08<00:08,  3.36it/s][A
Training:  53%|█████▎    | 28/53 [00:08<00:05,  4.56it/s][A
Training:  55%|█████▍    | 29/53 [00:09<00:08,  2.95it/s][A
Training:  57%|█████▋    | 30/53 [00

Epoch: 16/95 - Loss: 0.1828 - Accuracy: 0.9319



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:09,  1.64s/it][A
100%|██████████| 7/7 [00:02<00:00,  2.57it/s][A
Epochs:  17%|█▋        | 16/95 [05:10<25:29, 19.36s/it]

Val Loss: 0.2098 - Val Accuracy: 0.9149



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:01<01:23,  1.61s/it][A
Training:   6%|▌         | 3/53 [00:01<00:23,  2.13it/s][A
Training:   9%|▉         | 5/53 [00:02<00:25,  1.92it/s][A
Training:  15%|█▌        | 8/53 [00:03<00:12,  3.74it/s][A
Training:  19%|█▉        | 10/53 [00:03<00:14,  2.94it/s][A
Training:  25%|██▍       | 13/53 [00:05<00:15,  2.62it/s][A
Training:  32%|███▏      | 17/53 [00:06<00:12,  2.79it/s][A
Training:  38%|███▊      | 20/53 [00:06<00:08,  3.87it/s][A
Training:  42%|████▏     | 22/53 [00:07<00:09,  3.10it/s][A
Training:  47%|████▋     | 25/53 [00:08<00:09,  3.10it/s][A
Training:  55%|█████▍    | 29/53 [00:10<00:07,  3.10it/s][A
Training:  58%|█████▊    | 31/53 [00:10<00:05,  3.75it/s][A
Training:  62%|██████▏   | 33/53 [00:11<00:06,  3.13it/s][A
Training:  66%|██████▌   | 35/53 [00:11<00:04,  3.92it/s][A
Training:  70%|██████▉   | 37/53 [00:12<00:05,  3.19it/s][A
Training:  74%|███████▎  | 39/53 [00

Epoch: 17/95 - Loss: 0.1792 - Accuracy: 0.9323



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:09,  1.60s/it][A
 57%|█████▋    | 4/7 [00:01<00:01,  2.85it/s][A
100%|██████████| 7/7 [00:02<00:00,  2.41it/s][A
Epochs:  18%|█▊        | 17/95 [05:30<25:12, 19.39s/it]

Val Loss: 0.2080 - Val Accuracy: 0.9149



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:01<01:23,  1.61s/it][A
Training:   6%|▌         | 3/53 [00:01<00:22,  2.18it/s][A
Training:   9%|▉         | 5/53 [00:02<00:25,  1.90it/s][A
Training:  13%|█▎        | 7/53 [00:03<00:14,  3.07it/s][A
Training:  17%|█▋        | 9/53 [00:04<00:18,  2.43it/s][A
Training:  25%|██▍       | 13/53 [00:05<00:13,  2.92it/s][A
Training:  26%|██▋       | 14/53 [00:05<00:11,  3.27it/s][A
Training:  32%|███▏      | 17/53 [00:06<00:12,  2.97it/s][A
Training:  34%|███▍      | 18/53 [00:06<00:10,  3.34it/s][A
Training:  38%|███▊      | 20/53 [00:06<00:07,  4.43it/s][A
Training:  40%|███▉      | 21/53 [00:07<00:12,  2.66it/s][A
Training:  42%|████▏     | 22/53 [00:07<00:10,  3.01it/s][A
Training:  45%|████▌     | 24/53 [00:08<00:06,  4.37it/s][A
Training:  49%|████▉     | 26/53 [00:09<00:09,  2.94it/s][A
Training:  55%|█████▍    | 29/53 [00:09<00:07,  3.25it/s][A
Training:  57%|█████▋    | 30/53 [00:

Epoch: 18/95 - Loss: 0.1821 - Accuracy: 0.9316



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:08,  1.50s/it][A
 43%|████▎     | 3/7 [00:01<00:01,  2.31it/s][A
 57%|█████▋    | 4/7 [00:01<00:00,  3.11it/s][A
100%|██████████| 7/7 [00:02<00:00,  2.47it/s][A
Epochs:  19%|█▉        | 18/95 [05:49<24:50, 19.36s/it]

Val Loss: 0.2090 - Val Accuracy: 0.9123



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:01<01:18,  1.50s/it][A
Training:   6%|▌         | 3/53 [00:01<00:21,  2.33it/s][A
Training:   9%|▉         | 5/53 [00:02<00:22,  2.14it/s][A
Training:  15%|█▌        | 8/53 [00:02<00:11,  4.07it/s][A
Training:  19%|█▉        | 10/53 [00:03<00:15,  2.70it/s][A
Training:  25%|██▍       | 13/53 [00:05<00:14,  2.70it/s][A
Training:  30%|███       | 16/53 [00:05<00:09,  4.00it/s][A
Training:  34%|███▍      | 18/53 [00:06<00:11,  3.03it/s][A
Training:  38%|███▊      | 20/53 [00:06<00:08,  3.94it/s][A
Training:  42%|████▏     | 22/53 [00:07<00:10,  2.86it/s][A
Training:  45%|████▌     | 24/53 [00:07<00:07,  3.75it/s][A
Training:  49%|████▉     | 26/53 [00:08<00:09,  2.94it/s][A
Training:  53%|█████▎    | 28/53 [00:09<00:07,  3.56it/s][A
Training:  55%|█████▍    | 29/53 [00:10<00:09,  2.54it/s][A
Training:  58%|█████▊    | 31/53 [00:10<00:06,  3.56it/s][A
Training:  60%|██████    | 32/53 [00

Epoch: 19/95 - Loss: 0.1824 - Accuracy: 0.9328



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:09,  1.60s/it][A
 43%|████▎     | 3/7 [00:01<00:01,  2.20it/s][A
100%|██████████| 7/7 [00:02<00:00,  2.41it/s][A
Epochs:  20%|██        | 19/95 [06:08<24:25, 19.28s/it]

Val Loss: 0.2072 - Val Accuracy: 0.9160



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:01<01:16,  1.47s/it][A
Training:   9%|▉         | 5/53 [00:02<00:22,  2.14it/s][A
Training:  17%|█▋        | 9/53 [00:03<00:16,  2.67it/s][A
Training:  21%|██        | 11/53 [00:03<00:11,  3.51it/s][A
Training:  25%|██▍       | 13/53 [00:05<00:14,  2.79it/s][A
Training:  32%|███▏      | 17/53 [00:06<00:11,  3.16it/s][A
Training:  36%|███▌      | 19/53 [00:06<00:08,  3.90it/s][A
Training:  40%|███▉      | 21/53 [00:07<00:10,  3.19it/s][A
Training:  42%|████▏     | 22/53 [00:07<00:09,  3.31it/s][A
Training:  45%|████▌     | 24/53 [00:07<00:06,  4.34it/s][A
Training:  47%|████▋     | 25/53 [00:08<00:09,  2.84it/s][A
Training:  49%|████▉     | 26/53 [00:08<00:09,  2.96it/s][A
Training:  53%|█████▎    | 28/53 [00:08<00:05,  4.20it/s][A
Training:  55%|█████▍    | 29/53 [00:09<00:08,  2.71it/s][A
Training:  57%|█████▋    | 30/53 [00:10<00:07,  2.91it/s][A
Training:  62%|██████▏   | 33/53 [0

Epoch: 20/95 - Loss: 0.1835 - Accuracy: 0.9309



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:08,  1.44s/it][A
 29%|██▊       | 2/7 [00:01<00:03,  1.48it/s][A
 57%|█████▋    | 4/7 [00:01<00:00,  3.30it/s][A
 71%|███████▏  | 5/7 [00:02<00:00,  2.12it/s][A
100%|██████████| 7/7 [00:02<00:00,  2.43it/s][A
Epochs:  21%|██        | 20/95 [06:28<24:04, 19.25s/it]

Val Loss: 0.2095 - Val Accuracy: 0.9113



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:01<01:21,  1.56s/it][A
Training:   8%|▊         | 4/53 [00:01<00:16,  3.04it/s][A
Training:  11%|█▏        | 6/53 [00:02<00:19,  2.36it/s][A
Training:  17%|█▋        | 9/53 [00:03<00:17,  2.56it/s][A
Training:  19%|█▉        | 10/53 [00:03<00:14,  2.93it/s][A
Training:  23%|██▎       | 12/53 [00:04<00:10,  4.07it/s][A
Training:  25%|██▍       | 13/53 [00:05<00:15,  2.62it/s][A
Training:  26%|██▋       | 14/53 [00:05<00:14,  2.72it/s][A
Training:  30%|███       | 16/53 [00:05<00:09,  4.07it/s][A
Training:  32%|███▏      | 17/53 [00:06<00:12,  2.96it/s][A
Training:  34%|███▍      | 18/53 [00:06<00:11,  3.15it/s][A
Training:  38%|███▊      | 20/53 [00:06<00:07,  4.61it/s][A
Training:  40%|███▉      | 21/53 [00:07<00:11,  2.78it/s][A
Training:  42%|████▏     | 22/53 [00:07<00:10,  3.09it/s][A
Training:  45%|████▌     | 24/53 [00:07<00:06,  4.48it/s][A
Training:  47%|████▋     | 25/53 [00

Epoch: 21/95 - Loss: 0.1794 - Accuracy: 0.9323



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:08,  1.44s/it][A
100%|██████████| 7/7 [00:02<00:00,  2.64it/s][A
Epochs:  22%|██▏       | 21/95 [06:47<23:44, 19.25s/it]

Val Loss: 0.2070 - Val Accuracy: 0.9144



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:01<01:25,  1.64s/it][A
Training:   8%|▊         | 4/53 [00:01<00:17,  2.88it/s][A
Training:  11%|█▏        | 6/53 [00:02<00:20,  2.25it/s][A
Training:  15%|█▌        | 8/53 [00:03<00:13,  3.35it/s][A
Training:  19%|█▉        | 10/53 [00:04<00:16,  2.68it/s][A
Training:  25%|██▍       | 13/53 [00:05<00:14,  2.68it/s][A
Training:  28%|██▊       | 15/53 [00:05<00:10,  3.49it/s][A
Training:  30%|███       | 16/53 [00:05<00:09,  3.88it/s][A
Training:  32%|███▏      | 17/53 [00:06<00:14,  2.54it/s][A
Training:  38%|███▊      | 20/53 [00:06<00:08,  4.09it/s][A
Training:  40%|███▉      | 21/53 [00:07<00:11,  2.74it/s][A
Training:  42%|████▏     | 22/53 [00:07<00:09,  3.14it/s][A
Training:  45%|████▌     | 24/53 [00:07<00:06,  4.30it/s][A
Training:  47%|████▋     | 25/53 [00:08<00:10,  2.79it/s][A
Training:  49%|████▉     | 26/53 [00:08<00:09,  2.96it/s][A
Training:  53%|█████▎    | 28/53 [00

Epoch: 22/95 - Loss: 0.1814 - Accuracy: 0.9308



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:09,  1.53s/it][A
 43%|████▎     | 3/7 [00:01<00:01,  2.24it/s][A
100%|██████████| 7/7 [00:02<00:00,  2.63it/s][A
Epochs:  23%|██▎       | 22/95 [07:06<23:25, 19.26s/it]

Val Loss: 0.2088 - Val Accuracy: 0.9155



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:01<01:15,  1.46s/it][A
Training:   4%|▍         | 2/53 [00:01<00:36,  1.38it/s][A
Training:   9%|▉         | 5/53 [00:02<00:22,  2.10it/s][A
Training:  11%|█▏        | 6/53 [00:02<00:18,  2.56it/s][A
Training:  15%|█▌        | 8/53 [00:03<00:11,  4.01it/s][A
Training:  17%|█▋        | 9/53 [00:04<00:18,  2.35it/s][A
Training:  23%|██▎       | 12/53 [00:04<00:09,  4.32it/s][A
Training:  26%|██▋       | 14/53 [00:05<00:12,  3.02it/s][A
Training:  30%|███       | 16/53 [00:05<00:08,  4.12it/s][A
Training:  34%|███▍      | 18/53 [00:06<00:12,  2.87it/s][A
Training:  40%|███▉      | 21/53 [00:07<00:10,  2.92it/s][A
Training:  43%|████▎     | 23/53 [00:07<00:07,  3.79it/s][A
Training:  47%|████▋     | 25/53 [00:08<00:09,  2.85it/s][A
Training:  55%|█████▍    | 29/53 [00:10<00:08,  2.92it/s][A
Training:  62%|██████▏   | 33/53 [00:11<00:06,  3.05it/s][A
Training:  68%|██████▊   | 36/53 [00:1

Epoch: 23/95 - Loss: 0.1800 - Accuracy: 0.9328



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:09,  1.57s/it][A
100%|██████████| 7/7 [00:02<00:00,  2.55it/s][A
Epochs:  24%|██▍       | 23/95 [07:26<23:10, 19.31s/it]

Val Loss: 0.2086 - Val Accuracy: 0.9144



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:01<01:11,  1.38s/it][A
Training:   4%|▍         | 2/53 [00:01<00:32,  1.58it/s][A
Training:   9%|▉         | 5/53 [00:02<00:22,  2.13it/s][A
Training:  11%|█▏        | 6/53 [00:02<00:17,  2.62it/s][A
Training:  15%|█▌        | 8/53 [00:02<00:10,  4.12it/s][A
Training:  19%|█▉        | 10/53 [00:04<00:15,  2.70it/s][A
Training:  25%|██▍       | 13/53 [00:05<00:13,  2.93it/s][A
Training:  26%|██▋       | 14/53 [00:05<00:12,  3.18it/s][A
Training:  32%|███▏      | 17/53 [00:06<00:11,  3.07it/s][A
Training:  34%|███▍      | 18/53 [00:06<00:11,  3.11it/s][A
Training:  38%|███▊      | 20/53 [00:06<00:07,  4.25it/s][A
Training:  40%|███▉      | 21/53 [00:07<00:10,  2.94it/s][A
Training:  42%|████▏     | 22/53 [00:07<00:09,  3.14it/s][A
Training:  47%|████▋     | 25/53 [00:08<00:08,  3.19it/s][A
Training:  49%|████▉     | 26/53 [00:08<00:08,  3.27it/s][A
Training:  53%|█████▎    | 28/53 [00:

Epoch: 24/95 - Loss: 0.1781 - Accuracy: 0.9327



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:08,  1.49s/it][A
100%|██████████| 7/7 [00:02<00:00,  2.58it/s][A
Epochs:  25%|██▌       | 24/95 [07:45<22:54, 19.36s/it]

Val Loss: 0.2122 - Val Accuracy: 0.9144



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:01<01:18,  1.51s/it][A
Training:   6%|▌         | 3/53 [00:01<00:21,  2.33it/s][A
Training:   9%|▉         | 5/53 [00:02<00:23,  2.01it/s][A
Training:  13%|█▎        | 7/53 [00:02<00:14,  3.24it/s][A
Training:  17%|█▋        | 9/53 [00:03<00:17,  2.46it/s][A
Training:  23%|██▎       | 12/53 [00:04<00:09,  4.16it/s][A
Training:  26%|██▋       | 14/53 [00:05<00:12,  3.04it/s][A
Training:  32%|███▏      | 17/53 [00:06<00:12,  2.91it/s][A
Training:  36%|███▌      | 19/53 [00:06<00:09,  3.77it/s][A
Training:  40%|███▉      | 21/53 [00:07<00:11,  2.79it/s][A
Training:  45%|████▌     | 24/53 [00:07<00:06,  4.21it/s][A
Training:  49%|████▉     | 26/53 [00:08<00:08,  3.33it/s][A
Training:  53%|█████▎    | 28/53 [00:08<00:05,  4.29it/s][A
Training:  57%|█████▋    | 30/53 [00:09<00:07,  3.03it/s][A
Training:  62%|██████▏   | 33/53 [00:11<00:07,  2.82it/s][A
Training:  66%|██████▌   | 35/53 [00:

Epoch: 25/95 - Loss: 0.1822 - Accuracy: 0.9321



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:07,  1.28s/it][A
 29%|██▊       | 2/7 [00:01<00:02,  1.67it/s][A
100%|██████████| 7/7 [00:02<00:00,  2.70it/s][A
Epochs:  26%|██▋       | 25/95 [08:04<22:30, 19.29s/it]

Val Loss: 0.2081 - Val Accuracy: 0.9139



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:01<01:15,  1.46s/it][A
Training:   6%|▌         | 3/53 [00:01<00:21,  2.37it/s][A
Training:   9%|▉         | 5/53 [00:02<00:22,  2.11it/s][A
Training:  11%|█▏        | 6/53 [00:02<00:18,  2.56it/s][A
Training:  15%|█▌        | 8/53 [00:02<00:11,  4.09it/s][A
Training:  19%|█▉        | 10/53 [00:04<00:15,  2.72it/s][A
Training:  23%|██▎       | 12/53 [00:04<00:10,  3.87it/s][A
Training:  26%|██▋       | 14/53 [00:05<00:13,  2.88it/s][A
Training:  32%|███▏      | 17/53 [00:06<00:13,  2.76it/s][A
Training:  40%|███▉      | 21/53 [00:07<00:10,  2.98it/s][A
Training:  45%|████▌     | 24/53 [00:07<00:06,  4.16it/s][A
Training:  49%|████▉     | 26/53 [00:08<00:08,  3.19it/s][A
Training:  55%|█████▍    | 29/53 [00:09<00:07,  3.10it/s][A
Training:  57%|█████▋    | 30/53 [00:09<00:06,  3.41it/s][A
Training:  60%|██████    | 32/53 [00:10<00:04,  4.34it/s][A
Training:  62%|██████▏   | 33/53 [00:

Epoch: 26/95 - Loss: 0.1795 - Accuracy: 0.9317



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:08,  1.44s/it][A
 57%|█████▋    | 4/7 [00:01<00:00,  3.31it/s][A
100%|██████████| 7/7 [00:02<00:00,  2.64it/s][A
Epochs:  27%|██▋       | 26/95 [08:23<22:09, 19.27s/it]

Val Loss: 0.2082 - Val Accuracy: 0.9134



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:01<01:20,  1.54s/it][A
Training:   9%|▉         | 5/53 [00:02<00:22,  2.14it/s][A
Training:  15%|█▌        | 8/53 [00:02<00:11,  3.75it/s][A
Training:  19%|█▉        | 10/53 [00:04<00:16,  2.67it/s][A
Training:  23%|██▎       | 12/53 [00:04<00:11,  3.58it/s][A
Training:  26%|██▋       | 14/53 [00:05<00:13,  2.79it/s][A
Training:  32%|███▏      | 17/53 [00:06<00:13,  2.75it/s][A
Training:  38%|███▊      | 20/53 [00:06<00:08,  4.07it/s][A
Training:  42%|████▏     | 22/53 [00:07<00:09,  3.16it/s][A
Training:  43%|████▎     | 23/53 [00:07<00:08,  3.51it/s][A
Training:  47%|████▋     | 25/53 [00:08<00:10,  2.76it/s][A
Training:  51%|█████     | 27/53 [00:08<00:07,  3.39it/s][A
Training:  55%|█████▍    | 29/53 [00:09<00:07,  3.06it/s][A
Training:  58%|█████▊    | 31/53 [00:10<00:05,  3.77it/s][A
Training:  62%|██████▏   | 33/53 [00:10<00:06,  3.08it/s][A
Training:  66%|██████▌   | 35/53 [0

Epoch: 27/95 - Loss: 0.1797 - Accuracy: 0.9324



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:09,  1.58s/it][A
100%|██████████| 7/7 [00:02<00:00,  2.62it/s][A
Epochs:  28%|██▊       | 27/95 [08:42<21:45, 19.19s/it]

Val Loss: 0.2065 - Val Accuracy: 0.9139



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:01<01:25,  1.64s/it][A
Training:   8%|▊         | 4/53 [00:01<00:16,  2.89it/s][A
Training:  11%|█▏        | 6/53 [00:02<00:20,  2.32it/s][A
Training:  17%|█▋        | 9/53 [00:03<00:17,  2.47it/s][A
Training:  23%|██▎       | 12/53 [00:04<00:10,  3.92it/s][A
Training:  26%|██▋       | 14/53 [00:05<00:13,  2.87it/s][A
Training:  32%|███▏      | 17/53 [00:06<00:13,  2.71it/s][A
Training:  38%|███▊      | 20/53 [00:06<00:08,  3.90it/s][A
Training:  42%|████▏     | 22/53 [00:07<00:09,  3.13it/s][A
Training:  45%|████▌     | 24/53 [00:07<00:07,  3.96it/s][A
Training:  49%|████▉     | 26/53 [00:08<00:09,  2.86it/s][A
Training:  51%|█████     | 27/53 [00:09<00:08,  3.20it/s][A
Training:  55%|█████▍    | 29/53 [00:10<00:09,  2.61it/s][A
Training:  62%|██████▏   | 33/53 [00:11<00:06,  3.08it/s][A
Training:  66%|██████▌   | 35/53 [00:11<00:04,  3.66it/s][A
Training:  70%|██████▉   | 37/53 [00

Epoch: 28/95 - Loss: 0.1804 - Accuracy: 0.9333



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:09,  1.59s/it][A
 29%|██▊       | 2/7 [00:01<00:03,  1.38it/s][A
 57%|█████▋    | 4/7 [00:01<00:00,  3.28it/s][A
100%|██████████| 7/7 [00:02<00:00,  2.47it/s][A
Epochs:  29%|██▉       | 28/95 [09:02<21:35, 19.34s/it]

Val Loss: 0.2076 - Val Accuracy: 0.9155



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:01<01:21,  1.57s/it][A
Training:   8%|▊         | 4/53 [00:01<00:16,  2.98it/s][A
Training:  11%|█▏        | 6/53 [00:02<00:20,  2.35it/s][A
Training:  17%|█▋        | 9/53 [00:03<00:17,  2.50it/s][A
Training:  23%|██▎       | 12/53 [00:04<00:10,  3.97it/s][A
Training:  26%|██▋       | 14/53 [00:05<00:13,  2.80it/s][A
Training:  30%|███       | 16/53 [00:05<00:10,  3.67it/s][A
Training:  34%|███▍      | 18/53 [00:06<00:12,  2.77it/s][A
Training:  40%|███▉      | 21/53 [00:07<00:11,  2.67it/s][A
Training:  47%|████▋     | 25/53 [00:08<00:09,  2.95it/s][A
Training:  55%|█████▍    | 29/53 [00:09<00:07,  3.23it/s][A
Training:  62%|██████▏   | 33/53 [00:11<00:05,  3.38it/s][A
Training:  66%|██████▌   | 35/53 [00:11<00:04,  4.02it/s][A
Training:  70%|██████▉   | 37/53 [00:12<00:04,  3.31it/s][A
Training:  75%|███████▌  | 40/53 [00:12<00:02,  4.60it/s][A
Training:  79%|███████▉  | 42/53 [00

Epoch: 29/95 - Loss: 0.1800 - Accuracy: 0.9333



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:08,  1.47s/it][A
 57%|█████▋    | 4/7 [00:01<00:00,  3.25it/s][A
100%|██████████| 7/7 [00:02<00:00,  2.78it/s][A
Epochs:  31%|███       | 29/95 [09:20<20:53, 19.00s/it]

Val Loss: 0.2053 - Val Accuracy: 0.9160



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:01<01:13,  1.41s/it][A
Training:   9%|▉         | 5/53 [00:02<00:20,  2.29it/s][A
Training:  15%|█▌        | 8/53 [00:02<00:11,  4.03it/s][A
Training:  19%|█▉        | 10/53 [00:03<00:13,  3.15it/s][A
Training:  23%|██▎       | 12/53 [00:03<00:09,  4.24it/s][A
Training:  26%|██▋       | 14/53 [00:04<00:12,  3.04it/s][A
Training:  30%|███       | 16/53 [00:04<00:09,  3.98it/s][A
Training:  34%|███▍      | 18/53 [00:05<00:11,  3.08it/s][A
Training:  40%|███▉      | 21/53 [00:06<00:10,  3.06it/s][A
Training:  42%|████▏     | 22/53 [00:07<00:09,  3.33it/s][A
Training:  47%|████▋     | 25/53 [00:07<00:07,  3.56it/s][A
Training:  49%|████▉     | 26/53 [00:08<00:07,  3.57it/s][A
Training:  53%|█████▎    | 28/53 [00:08<00:05,  4.82it/s][A
Training:  55%|█████▍    | 29/53 [00:08<00:07,  3.18it/s][A
Training:  57%|█████▋    | 30/53 [00:09<00:06,  3.37it/s][A
Training:  62%|██████▏   | 33/53 [0

Epoch: 30/95 - Loss: 0.1797 - Accuracy: 0.9341



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:08,  1.44s/it][A
100%|██████████| 7/7 [00:02<00:00,  2.74it/s][A
Epochs:  32%|███▏      | 30/95 [09:38<20:04, 18.53s/it]

Val Loss: 0.2099 - Val Accuracy: 0.9150



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:01<01:05,  1.26s/it][A
Training:   8%|▊         | 4/53 [00:01<00:13,  3.71it/s][A
Training:  11%|█▏        | 6/53 [00:02<00:18,  2.59it/s][A
Training:  17%|█▋        | 9/53 [00:03<00:16,  2.66it/s][A
Training:  25%|██▍       | 13/53 [00:04<00:13,  3.00it/s][A
Training:  28%|██▊       | 15/53 [00:04<00:09,  3.81it/s][A
Training:  32%|███▏      | 17/53 [00:05<00:12,  2.85it/s][A
Training:  36%|███▌      | 19/53 [00:06<00:09,  3.68it/s][A
Training:  40%|███▉      | 21/53 [00:07<00:10,  2.93it/s][A
Training:  43%|████▎     | 23/53 [00:07<00:07,  3.87it/s][A
Training:  47%|████▋     | 25/53 [00:08<00:09,  2.99it/s][A
Training:  53%|█████▎    | 28/53 [00:08<00:05,  4.52it/s][A
Training:  57%|█████▋    | 30/53 [00:09<00:06,  3.31it/s][A
Training:  62%|██████▏   | 33/53 [00:10<00:06,  3.20it/s][A
Training:  70%|██████▉   | 37/53 [00:11<00:04,  3.49it/s][A
Training:  74%|███████▎  | 39/53 [00

Epoch: 31/95 - Loss: 0.1810 - Accuracy: 0.9322



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:09,  1.56s/it][A
 57%|█████▋    | 4/7 [00:01<00:00,  3.08it/s][A
100%|██████████| 7/7 [00:02<00:00,  2.50it/s][A
Epochs:  33%|███▎      | 31/95 [09:56<19:39, 18.44s/it]

Val Loss: 0.2090 - Val Accuracy: 0.9187



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:01<01:11,  1.37s/it][A
Training:   9%|▉         | 5/53 [00:02<00:20,  2.39it/s][A
Training:  15%|█▌        | 8/53 [00:02<00:10,  4.21it/s][A
Training:  19%|█▉        | 10/53 [00:03<00:14,  2.91it/s][A
Training:  25%|██▍       | 13/53 [00:04<00:13,  3.03it/s][A
Training:  30%|███       | 16/53 [00:04<00:08,  4.42it/s][A
Training:  34%|███▍      | 18/53 [00:05<00:10,  3.26it/s][A
Training:  40%|███▉      | 21/53 [00:06<00:10,  3.07it/s][A
Training:  42%|████▏     | 22/53 [00:07<00:09,  3.33it/s][A
Training:  47%|████▋     | 25/53 [00:07<00:08,  3.26it/s][A
Training:  49%|████▉     | 26/53 [00:08<00:07,  3.61it/s][A
Training:  55%|█████▍    | 29/53 [00:09<00:07,  3.19it/s][A
Training:  60%|██████    | 32/53 [00:09<00:04,  4.63it/s][A
Training:  64%|██████▍   | 34/53 [00:10<00:05,  3.55it/s][A
Training:  70%|██████▉   | 37/53 [00:11<00:04,  3.25it/s][A
Training:  72%|███████▏  | 38/53 [0

Epoch: 32/95 - Loss: 0.1821 - Accuracy: 0.9305



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:08,  1.48s/it][A
100%|██████████| 7/7 [00:02<00:00,  2.59it/s][A
Epochs:  34%|███▎      | 32/95 [10:14<19:10, 18.25s/it]

Val Loss: 0.2088 - Val Accuracy: 0.9107



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:01<01:16,  1.47s/it][A
Training:   8%|▊         | 4/53 [00:01<00:15,  3.24it/s][A
Training:  11%|█▏        | 6/53 [00:02<00:17,  2.67it/s][A
Training:  17%|█▋        | 9/53 [00:03<00:15,  2.78it/s][A
Training:  19%|█▉        | 10/53 [00:03<00:13,  3.20it/s][A
Training:  25%|██▍       | 13/53 [00:04<00:12,  3.13it/s][A
Training:  28%|██▊       | 15/53 [00:04<00:09,  4.14it/s][A
Training:  32%|███▏      | 17/53 [00:05<00:11,  3.23it/s][A
Training:  34%|███▍      | 18/53 [00:05<00:09,  3.55it/s][A
Training:  40%|███▉      | 21/53 [00:07<00:10,  2.98it/s][A
Training:  43%|████▎     | 23/53 [00:07<00:07,  3.91it/s][A
Training:  47%|████▋     | 25/53 [00:08<00:09,  3.02it/s][A
Training:  55%|█████▍    | 29/53 [00:09<00:07,  3.26it/s][A
Training:  58%|█████▊    | 31/53 [00:09<00:05,  4.08it/s][A
Training:  62%|██████▏   | 33/53 [00:10<00:06,  3.22it/s][A
Training:  68%|██████▊   | 36/53 [00

Epoch: 33/95 - Loss: 0.1811 - Accuracy: 0.9325



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:08,  1.44s/it][A
100%|██████████| 7/7 [00:02<00:00,  2.74it/s][A
Epochs:  35%|███▍      | 33/95 [10:32<18:45, 18.15s/it]

Val Loss: 0.2104 - Val Accuracy: 0.9128



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:01<01:16,  1.47s/it][A
Training:   6%|▌         | 3/53 [00:01<00:21,  2.34it/s][A
Training:   9%|▉         | 5/53 [00:02<00:22,  2.15it/s][A
Training:  17%|█▋        | 9/53 [00:03<00:14,  3.05it/s][A
Training:  21%|██        | 11/53 [00:03<00:10,  3.99it/s][A
Training:  25%|██▍       | 13/53 [00:04<00:13,  3.06it/s][A
Training:  30%|███       | 16/53 [00:04<00:07,  4.68it/s][A
Training:  34%|███▍      | 18/53 [00:05<00:09,  3.56it/s][A
Training:  40%|███▉      | 21/53 [00:06<00:09,  3.28it/s][A
Training:  42%|████▏     | 22/53 [00:06<00:08,  3.56it/s][A
Training:  45%|████▌     | 24/53 [00:07<00:06,  4.69it/s][A
Training:  49%|████▉     | 26/53 [00:08<00:08,  3.28it/s][A
Training:  55%|█████▍    | 29/53 [00:08<00:07,  3.25it/s][A
Training:  57%|█████▋    | 30/53 [00:09<00:06,  3.59it/s][A
Training:  62%|██████▏   | 33/53 [00:10<00:05,  3.41it/s][A
Training:  64%|██████▍   | 34/53 [00

Epoch: 34/95 - Loss: 0.1790 - Accuracy: 0.9329



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:08,  1.43s/it][A
100%|██████████| 7/7 [00:02<00:00,  2.68it/s][A
Epochs:  36%|███▌      | 34/95 [10:49<18:14, 17.94s/it]

Val Loss: 0.2069 - Val Accuracy: 0.9182



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:01<01:17,  1.48s/it][A
Training:   6%|▌         | 3/53 [00:01<00:21,  2.28it/s][A
Training:   9%|▉         | 5/53 [00:02<00:22,  2.11it/s][A
Training:  17%|█▋        | 9/53 [00:03<00:15,  2.91it/s][A
Training:  23%|██▎       | 12/53 [00:03<00:09,  4.42it/s][A
Training:  26%|██▋       | 14/53 [00:04<00:11,  3.27it/s][A
Training:  32%|███▏      | 17/53 [00:05<00:11,  3.16it/s][A
Training:  38%|███▊      | 20/53 [00:05<00:07,  4.53it/s][A
Training:  42%|████▏     | 22/53 [00:06<00:09,  3.39it/s][A
Training:  47%|████▋     | 25/53 [00:08<00:08,  3.13it/s][A
Training:  51%|█████     | 27/53 [00:08<00:06,  3.93it/s][A
Training:  55%|█████▍    | 29/53 [00:09<00:07,  3.28it/s][A
Training:  58%|█████▊    | 31/53 [00:09<00:05,  4.18it/s][A
Training:  62%|██████▏   | 33/53 [00:10<00:06,  3.16it/s][A
Training:  66%|██████▌   | 35/53 [00:10<00:04,  4.08it/s][A
Training:  70%|██████▉   | 37/53 [00

Epoch: 35/95 - Loss: 0.1813 - Accuracy: 0.9322



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:09,  1.55s/it][A
 57%|█████▋    | 4/7 [00:01<00:00,  3.09it/s][A
100%|██████████| 7/7 [00:02<00:00,  2.55it/s][A
Epochs:  37%|███▋      | 35/95 [11:07<17:52, 17.87s/it]

Val Loss: 0.2107 - Val Accuracy: 0.9139



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:01<01:14,  1.44s/it][A
Training:   9%|▉         | 5/53 [00:02<00:22,  2.09it/s][A
Training:  15%|█▌        | 8/53 [00:02<00:12,  3.73it/s][A
Training:  19%|█▉        | 10/53 [00:03<00:14,  2.94it/s][A
Training:  25%|██▍       | 13/53 [00:04<00:13,  2.98it/s][A
Training:  30%|███       | 16/53 [00:04<00:08,  4.39it/s][A
Training:  34%|███▍      | 18/53 [00:06<00:11,  3.14it/s][A
Training:  40%|███▉      | 21/53 [00:06<00:09,  3.22it/s][A
Training:  47%|████▋     | 25/53 [00:08<00:08,  3.40it/s][A
Training:  51%|█████     | 27/53 [00:08<00:06,  4.15it/s][A
Training:  55%|█████▍    | 29/53 [00:09<00:07,  3.37it/s][A
Training:  57%|█████▋    | 30/53 [00:09<00:06,  3.63it/s][A
Training:  62%|██████▏   | 33/53 [00:10<00:05,  3.43it/s][A
Training:  64%|██████▍   | 34/53 [00:10<00:05,  3.69it/s][A
Training:  68%|██████▊   | 36/53 [00:10<00:03,  4.80it/s][A
Training:  70%|██████▉   | 37/53 [0

Epoch: 36/95 - Loss: 0.1802 - Accuracy: 0.9323



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:08,  1.46s/it][A
100%|██████████| 7/7 [00:02<00:00,  2.63it/s][A
Epochs:  38%|███▊      | 36/95 [11:24<17:28, 17.77s/it]

Val Loss: 0.2068 - Val Accuracy: 0.9128



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:01<01:19,  1.53s/it][A
Training:   6%|▌         | 3/53 [00:01<00:21,  2.30it/s][A
Training:   9%|▉         | 5/53 [00:02<00:22,  2.12it/s][A
Training:  15%|█▌        | 8/53 [00:02<00:10,  4.10it/s][A
Training:  19%|█▉        | 10/53 [00:03<00:14,  2.89it/s][A
Training:  25%|██▍       | 13/53 [00:04<00:12,  3.08it/s][A
Training:  26%|██▋       | 14/53 [00:04<00:11,  3.28it/s][A
Training:  32%|███▏      | 17/53 [00:05<00:10,  3.41it/s][A
Training:  34%|███▍      | 18/53 [00:05<00:09,  3.69it/s][A
Training:  40%|███▉      | 21/53 [00:06<00:09,  3.46it/s][A
Training:  42%|████▏     | 22/53 [00:06<00:08,  3.83it/s][A
Training:  43%|████▎     | 23/53 [00:07<00:07,  4.11it/s][A
Training:  47%|████▋     | 25/53 [00:07<00:08,  3.42it/s][A
Training:  51%|█████     | 27/53 [00:08<00:06,  4.27it/s][A
Training:  55%|█████▍    | 29/53 [00:09<00:07,  3.40it/s][A
Training:  58%|█████▊    | 31/53 [00

Epoch: 37/95 - Loss: 0.1779 - Accuracy: 0.9340



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:08,  1.40s/it][A
 43%|████▎     | 3/7 [00:01<00:01,  2.49it/s][A
 71%|███████▏  | 5/7 [00:02<00:00,  2.43it/s][A
100%|██████████| 7/7 [00:02<00:00,  2.67it/s][A
Epochs:  39%|███▉      | 37/95 [11:42<17:05, 17.67s/it]

Val Loss: 0.2072 - Val Accuracy: 0.9134



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:01<01:12,  1.40s/it][A
Training:   8%|▊         | 4/53 [00:01<00:14,  3.28it/s][A
Training:  11%|█▏        | 6/53 [00:02<00:18,  2.51it/s][A
Training:  15%|█▌        | 8/53 [00:02<00:12,  3.71it/s][A
Training:  19%|█▉        | 10/53 [00:03<00:15,  2.69it/s][A
Training:  25%|██▍       | 13/53 [00:05<00:15,  2.62it/s][A
Training:  30%|███       | 16/53 [00:05<00:09,  4.00it/s][A
Training:  34%|███▍      | 18/53 [00:06<00:10,  3.31it/s][A
Training:  40%|███▉      | 21/53 [00:07<00:10,  3.19it/s][A
Training:  47%|████▋     | 25/53 [00:08<00:08,  3.33it/s][A
Training:  53%|█████▎    | 28/53 [00:08<00:05,  4.51it/s][A
Training:  57%|█████▋    | 30/53 [00:09<00:06,  3.68it/s][A
Training:  62%|██████▏   | 33/53 [00:10<00:05,  3.49it/s][A
Training:  70%|██████▉   | 37/53 [00:11<00:04,  3.51it/s][A
Training:  75%|███████▌  | 40/53 [00:11<00:02,  4.70it/s][A
Training:  79%|███████▉  | 42/53 [00

Epoch: 38/95 - Loss: 0.1793 - Accuracy: 0.9338



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:08,  1.45s/it][A
 43%|████▎     | 3/7 [00:01<00:01,  2.41it/s][A
100%|██████████| 7/7 [00:02<00:00,  2.73it/s][A
Epochs:  40%|████      | 38/95 [11:59<16:38, 17.52s/it]

Val Loss: 0.2048 - Val Accuracy: 0.9150



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:01<01:14,  1.43s/it][A
Training:   8%|▊         | 4/53 [00:01<00:14,  3.32it/s][A
Training:  11%|█▏        | 6/53 [00:02<00:19,  2.37it/s][A
Training:  17%|█▋        | 9/53 [00:03<00:17,  2.46it/s][A
Training:  21%|██        | 11/53 [00:04<00:12,  3.35it/s][A
Training:  25%|██▍       | 13/53 [00:05<00:15,  2.51it/s][A
Training:  30%|███       | 16/53 [00:05<00:09,  3.94it/s][A
Training:  34%|███▍      | 18/53 [00:06<00:12,  2.82it/s][A
Training:  38%|███▊      | 20/53 [00:06<00:09,  3.55it/s][A
Training:  42%|████▏     | 22/53 [00:07<00:10,  2.88it/s][A
Training:  45%|████▌     | 24/53 [00:07<00:07,  3.64it/s][A
Training:  47%|████▋     | 25/53 [00:09<00:11,  2.46it/s][A
Training:  53%|█████▎    | 28/53 [00:09<00:06,  3.98it/s][A
Training:  57%|█████▋    | 30/53 [00:10<00:07,  3.08it/s][A
Training:  62%|██████▏   | 33/53 [00:11<00:06,  3.17it/s][A
Training:  70%|██████▉   | 37/53 [00

Epoch: 39/95 - Loss: 0.1814 - Accuracy: 0.9323



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:08,  1.47s/it][A
100%|██████████| 7/7 [00:02<00:00,  2.68it/s][A
Epochs:  41%|████      | 39/95 [12:17<16:30, 17.68s/it]

Val Loss: 0.2082 - Val Accuracy: 0.9155



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:01<01:12,  1.40s/it][A
Training:   8%|▊         | 4/53 [00:01<00:14,  3.39it/s][A
Training:  11%|█▏        | 6/53 [00:02<00:19,  2.45it/s][A
Training:  13%|█▎        | 7/53 [00:02<00:15,  2.95it/s][A
Training:  17%|█▋        | 9/53 [00:03<00:17,  2.45it/s][A
Training:  21%|██        | 11/53 [00:03<00:12,  3.39it/s][A
Training:  25%|██▍       | 13/53 [00:04<00:14,  2.72it/s][A
Training:  28%|██▊       | 15/53 [00:05<00:10,  3.58it/s][A
Training:  32%|███▏      | 17/53 [00:06<00:12,  2.92it/s][A
Training:  36%|███▌      | 19/53 [00:06<00:08,  3.80it/s][A
Training:  40%|███▉      | 21/53 [00:07<00:11,  2.81it/s][A
Training:  43%|████▎     | 23/53 [00:07<00:08,  3.57it/s][A
Training:  47%|████▋     | 25/53 [00:08<00:10,  2.79it/s][A
Training:  51%|█████     | 27/53 [00:08<00:06,  3.76it/s][A
Training:  55%|█████▍    | 29/53 [00:09<00:08,  2.83it/s][A
Training:  62%|██████▏   | 33/53 [00:

Epoch: 40/95 - Loss: 0.1780 - Accuracy: 0.9341



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:08,  1.42s/it][A
 57%|█████▋    | 4/7 [00:01<00:00,  3.36it/s][A
100%|██████████| 7/7 [00:02<00:00,  2.76it/s][A
Epochs:  42%|████▏     | 40/95 [12:35<16:19, 17.82s/it]

Val Loss: 0.2081 - Val Accuracy: 0.9129



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:01<01:16,  1.47s/it][A
Training:   6%|▌         | 3/53 [00:01<00:21,  2.34it/s][A
Training:   9%|▉         | 5/53 [00:02<00:23,  2.02it/s][A
Training:  15%|█▌        | 8/53 [00:02<00:11,  3.89it/s][A
Training:  19%|█▉        | 10/53 [00:03<00:14,  2.93it/s][A
Training:  25%|██▍       | 13/53 [00:05<00:14,  2.72it/s][A
Training:  28%|██▊       | 15/53 [00:05<00:10,  3.59it/s][A
Training:  32%|███▏      | 17/53 [00:06<00:12,  2.89it/s][A
Training:  36%|███▌      | 19/53 [00:06<00:08,  3.82it/s][A
Training:  40%|███▉      | 21/53 [00:07<00:10,  2.92it/s][A
Training:  43%|████▎     | 23/53 [00:07<00:07,  3.89it/s][A
Training:  47%|████▋     | 25/53 [00:08<00:09,  3.09it/s][A
Training:  53%|█████▎    | 28/53 [00:08<00:05,  4.68it/s][A
Training:  57%|█████▋    | 30/53 [00:09<00:06,  3.43it/s][A
Training:  62%|██████▏   | 33/53 [00:10<00:06,  3.20it/s][A
Training:  66%|██████▌   | 35/53 [00

Epoch: 41/95 - Loss: 0.1786 - Accuracy: 0.9330



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:07,  1.32s/it][A
 29%|██▊       | 2/7 [00:01<00:03,  1.63it/s][A
100%|██████████| 7/7 [00:02<00:00,  2.71it/s][A
Epochs:  43%|████▎     | 41/95 [12:53<16:00, 17.78s/it]

Val Loss: 0.2092 - Val Accuracy: 0.9123



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:01<01:10,  1.35s/it][A
Training:   4%|▍         | 2/53 [00:01<00:32,  1.55it/s][A
Training:   8%|▊         | 4/53 [00:01<00:13,  3.60it/s][A
Training:  11%|█▏        | 6/53 [00:02<00:18,  2.53it/s][A
Training:  15%|█▌        | 8/53 [00:02<00:11,  3.89it/s][A
Training:  19%|█▉        | 10/53 [00:03<00:15,  2.85it/s][A
Training:  23%|██▎       | 12/53 [00:03<00:10,  3.95it/s][A
Training:  26%|██▋       | 14/53 [00:05<00:13,  2.86it/s][A
Training:  32%|███▏      | 17/53 [00:06<00:12,  2.83it/s][A
Training:  34%|███▍      | 18/53 [00:06<00:11,  3.16it/s][A
Training:  40%|███▉      | 21/53 [00:07<00:10,  3.08it/s][A
Training:  43%|████▎     | 23/53 [00:07<00:07,  4.02it/s][A
Training:  47%|████▋     | 25/53 [00:08<00:09,  3.03it/s][A
Training:  51%|█████     | 27/53 [00:08<00:06,  3.98it/s][A
Training:  55%|█████▍    | 29/53 [00:09<00:08,  2.94it/s][A
Training:  62%|██████▏   | 33/53 [00:

Epoch: 42/95 - Loss: 0.1776 - Accuracy: 0.9340



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:08,  1.38s/it][A
 57%|█████▋    | 4/7 [00:01<00:00,  3.44it/s][A
100%|██████████| 7/7 [00:02<00:00,  2.75it/s][A
Epochs:  44%|████▍     | 42/95 [13:11<15:45, 17.83s/it]

Val Loss: 0.2067 - Val Accuracy: 0.9144



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:01<01:14,  1.43s/it][A
Training:   6%|▌         | 3/53 [00:01<00:20,  2.41it/s][A
Training:   9%|▉         | 5/53 [00:02<00:21,  2.23it/s][A
Training:  15%|█▌        | 8/53 [00:02<00:11,  4.06it/s][A
Training:  19%|█▉        | 10/53 [00:03<00:14,  2.90it/s][A
Training:  25%|██▍       | 13/53 [00:04<00:13,  2.88it/s][A
Training:  28%|██▊       | 15/53 [00:04<00:10,  3.73it/s][A
Training:  32%|███▏      | 17/53 [00:06<00:12,  2.95it/s][A
Training:  34%|███▍      | 18/53 [00:06<00:10,  3.29it/s][A
Training:  36%|███▌      | 19/53 [00:06<00:09,  3.77it/s][A
Training:  40%|███▉      | 21/53 [00:07<00:10,  2.95it/s][A
Training:  43%|████▎     | 23/53 [00:07<00:07,  3.91it/s][A
Training:  47%|████▋     | 25/53 [00:08<00:08,  3.16it/s][A
Training:  49%|████▉     | 26/53 [00:08<00:07,  3.40it/s][A
Training:  51%|█████     | 27/53 [00:08<00:06,  3.82it/s][A
Training:  55%|█████▍    | 29/53 [00

Epoch: 43/95 - Loss: 0.1770 - Accuracy: 0.9339



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:07,  1.29s/it][A
 29%|██▊       | 2/7 [00:01<00:03,  1.63it/s][A
 57%|█████▋    | 4/7 [00:01<00:00,  3.81it/s][A
100%|██████████| 7/7 [00:02<00:00,  2.74it/s][A
Epochs:  45%|████▌     | 43/95 [13:29<15:29, 17.88s/it]

Val Loss: 0.2101 - Val Accuracy: 0.9133



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:01<01:14,  1.44s/it][A
Training:   8%|▊         | 4/53 [00:01<00:14,  3.31it/s][A
Training:  11%|█▏        | 6/53 [00:02<00:19,  2.46it/s][A
Training:  15%|█▌        | 8/53 [00:02<00:12,  3.68it/s][A
Training:  19%|█▉        | 10/53 [00:03<00:16,  2.67it/s][A
Training:  25%|██▍       | 13/53 [00:05<00:15,  2.60it/s][A
Training:  32%|███▏      | 17/53 [00:06<00:12,  2.86it/s][A
Training:  36%|███▌      | 19/53 [00:06<00:09,  3.59it/s][A
Training:  40%|███▉      | 21/53 [00:07<00:10,  2.98it/s][A
Training:  47%|████▋     | 25/53 [00:08<00:08,  3.25it/s][A
Training:  53%|█████▎    | 28/53 [00:08<00:05,  4.48it/s][A
Training:  57%|█████▋    | 30/53 [00:09<00:06,  3.36it/s][A
Training:  62%|██████▏   | 33/53 [00:10<00:06,  3.15it/s][A
Training:  70%|██████▉   | 37/53 [00:11<00:04,  3.27it/s][A
Training:  74%|███████▎  | 39/53 [00:12<00:03,  3.99it/s][A
Training:  77%|███████▋  | 41/53 [00

Epoch: 44/95 - Loss: 0.1805 - Accuracy: 0.9330



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:08,  1.42s/it][A
100%|██████████| 7/7 [00:02<00:00,  2.75it/s][A
Epochs:  46%|████▋     | 44/95 [13:47<15:12, 17.89s/it]

Val Loss: 0.2102 - Val Accuracy: 0.9112



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:01<01:18,  1.51s/it][A
Training:   6%|▌         | 3/53 [00:01<00:21,  2.29it/s][A
Training:   9%|▉         | 5/53 [00:02<00:23,  2.06it/s][A
Training:  17%|█▋        | 9/53 [00:03<00:16,  2.65it/s][A
Training:  25%|██▍       | 13/53 [00:05<00:13,  3.00it/s][A
Training:  32%|███▏      | 17/53 [00:06<00:11,  3.11it/s][A
Training:  38%|███▊      | 20/53 [00:06<00:07,  4.24it/s][A
Training:  42%|████▏     | 22/53 [00:07<00:08,  3.48it/s][A
Training:  47%|████▋     | 25/53 [00:08<00:08,  3.20it/s][A
Training:  53%|█████▎    | 28/53 [00:08<00:05,  4.43it/s][A
Training:  57%|█████▋    | 30/53 [00:09<00:06,  3.50it/s][A
Training:  62%|██████▏   | 33/53 [00:10<00:06,  3.21it/s][A
Training:  66%|██████▌   | 35/53 [00:10<00:04,  4.01it/s][A
Training:  70%|██████▉   | 37/53 [00:11<00:05,  3.15it/s][A
Training:  75%|███████▌  | 40/53 [00:11<00:02,  4.55it/s][A
Training:  79%|███████▉  | 42/53 [00

Epoch: 45/95 - Loss: 0.1767 - Accuracy: 0.9324



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:07,  1.32s/it][A
100%|██████████| 7/7 [00:02<00:00,  2.88it/s][A
Epochs:  47%|████▋     | 45/95 [14:04<14:52, 17.85s/it]

Val Loss: 0.2095 - Val Accuracy: 0.9144



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:01<01:13,  1.42s/it][A
Training:   8%|▊         | 4/53 [00:01<00:15,  3.23it/s][A
Training:  11%|█▏        | 6/53 [00:02<00:18,  2.50it/s][A
Training:  17%|█▋        | 9/53 [00:03<00:17,  2.53it/s][A
Training:  23%|██▎       | 12/53 [00:03<00:10,  4.01it/s][A
Training:  26%|██▋       | 14/53 [00:04<00:12,  3.01it/s][A
Training:  30%|███       | 16/53 [00:05<00:09,  3.95it/s][A
Training:  34%|███▍      | 18/53 [00:06<00:11,  3.00it/s][A
Training:  40%|███▉      | 21/53 [00:07<00:10,  3.00it/s][A
Training:  45%|████▌     | 24/53 [00:07<00:06,  4.36it/s][A
Training:  49%|████▉     | 26/53 [00:08<00:08,  3.23it/s][A
Training:  55%|█████▍    | 29/53 [00:09<00:07,  3.11it/s][A
Training:  62%|██████▏   | 33/53 [00:10<00:05,  3.43it/s][A
Training:  64%|██████▍   | 34/53 [00:10<00:05,  3.60it/s][A
Training:  70%|██████▉   | 37/53 [00:11<00:04,  3.46it/s][A
Training:  72%|███████▏  | 38/53 [00

Epoch: 46/95 - Loss: 0.1782 - Accuracy: 0.9342



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:08,  1.37s/it][A
100%|██████████| 7/7 [00:02<00:00,  2.85it/s][A
Epochs:  48%|████▊     | 46/95 [14:22<14:32, 17.80s/it]

Val Loss: 0.2090 - Val Accuracy: 0.9133



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:01<01:17,  1.49s/it][A
Training:   8%|▊         | 4/53 [00:01<00:15,  3.09it/s][A
Training:  11%|█▏        | 6/53 [00:02<00:18,  2.53it/s][A
Training:  17%|█▋        | 9/53 [00:03<00:16,  2.59it/s][A
Training:  23%|██▎       | 12/53 [00:03<00:09,  4.12it/s][A
Training:  26%|██▋       | 14/53 [00:05<00:13,  2.95it/s][A
Training:  30%|███       | 16/53 [00:05<00:09,  3.86it/s][A
Training:  34%|███▍      | 18/53 [00:06<00:11,  3.02it/s][A
Training:  40%|███▉      | 21/53 [00:07<00:11,  2.90it/s][A
Training:  45%|████▌     | 24/53 [00:07<00:06,  4.24it/s][A
Training:  49%|████▉     | 26/53 [00:08<00:08,  3.35it/s][A
Training:  55%|█████▍    | 29/53 [00:09<00:07,  3.04it/s][A
Training:  62%|██████▏   | 33/53 [00:10<00:06,  3.31it/s][A
Training:  66%|██████▌   | 35/53 [00:10<00:04,  4.04it/s][A
Training:  70%|██████▉   | 37/53 [00:11<00:05,  3.16it/s][A
Training:  72%|███████▏  | 38/53 [00

Epoch: 47/95 - Loss: 0.1763 - Accuracy: 0.9339



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:07,  1.30s/it][A
 43%|████▎     | 3/7 [00:01<00:01,  2.68it/s][A
100%|██████████| 7/7 [00:02<00:00,  2.96it/s][A
Epochs:  49%|████▉     | 47/95 [14:40<14:14, 17.80s/it]

Val Loss: 0.2070 - Val Accuracy: 0.9134



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:01<01:19,  1.53s/it][A
Training:   8%|▊         | 4/53 [00:01<00:15,  3.11it/s][A
Training:  11%|█▏        | 6/53 [00:02<00:19,  2.42it/s][A
Training:  17%|█▋        | 9/53 [00:03<00:17,  2.55it/s][A
Training:  25%|██▍       | 13/53 [00:04<00:13,  2.99it/s][A
Training:  28%|██▊       | 15/53 [00:05<00:10,  3.79it/s][A
Training:  32%|███▏      | 17/53 [00:06<00:11,  3.05it/s][A
Training:  34%|███▍      | 18/53 [00:06<00:10,  3.41it/s][A
Training:  40%|███▉      | 21/53 [00:07<00:09,  3.29it/s][A
Training:  43%|████▎     | 23/53 [00:07<00:07,  4.26it/s][A
Training:  47%|████▋     | 25/53 [00:08<00:09,  3.11it/s][A
Training:  55%|█████▍    | 29/53 [00:09<00:07,  3.33it/s][A
Training:  60%|██████    | 32/53 [00:09<00:04,  4.67it/s][A
Training:  64%|██████▍   | 34/53 [00:10<00:05,  3.54it/s][A
Training:  70%|██████▉   | 37/53 [00:11<00:04,  3.25it/s][A
Training:  75%|███████▌  | 40/53 [00

Epoch: 48/95 - Loss: 0.1768 - Accuracy: 0.9335



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:08,  1.37s/it][A
 57%|█████▋    | 4/7 [00:01<00:00,  3.33it/s][A
100%|██████████| 7/7 [00:02<00:00,  2.90it/s][A
Epochs:  51%|█████     | 48/95 [14:58<13:56, 17.80s/it]

Val Loss: 0.2087 - Val Accuracy: 0.9123



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:01<01:19,  1.52s/it][A
Training:   8%|▊         | 4/53 [00:01<00:15,  3.13it/s][A
Training:  11%|█▏        | 6/53 [00:02<00:20,  2.27it/s][A
Training:  17%|█▋        | 9/53 [00:03<00:17,  2.47it/s][A
Training:  23%|██▎       | 12/53 [00:04<00:10,  3.91it/s][A
Training:  26%|██▋       | 14/53 [00:05<00:13,  2.99it/s][A
Training:  32%|███▏      | 17/53 [00:06<00:12,  2.79it/s][A
Training:  38%|███▊      | 20/53 [00:06<00:08,  4.05it/s][A
Training:  42%|████▏     | 22/53 [00:07<00:09,  3.19it/s][A
Training:  47%|████▋     | 25/53 [00:08<00:09,  3.01it/s][A
Training:  53%|█████▎    | 28/53 [00:08<00:05,  4.19it/s][A
Training:  57%|█████▋    | 30/53 [00:09<00:06,  3.32it/s][A
Training:  60%|██████    | 32/53 [00:09<00:04,  4.21it/s][A
Training:  64%|██████▍   | 34/53 [00:10<00:06,  3.03it/s][A
Training:  70%|██████▉   | 37/53 [00:12<00:05,  2.91it/s][A
Training:  77%|███████▋  | 41/53 [00

Epoch: 49/95 - Loss: 0.1759 - Accuracy: 0.9333



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:08,  1.38s/it][A
 57%|█████▋    | 4/7 [00:01<00:00,  3.46it/s][A
100%|██████████| 7/7 [00:02<00:00,  2.86it/s][A
Epochs:  52%|█████▏    | 49/95 [15:16<13:43, 17.90s/it]

Val Loss: 0.2044 - Val Accuracy: 0.9134



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:01<01:12,  1.40s/it][A
Training:   6%|▌         | 3/53 [00:01<00:20,  2.46it/s][A
Training:   9%|▉         | 5/53 [00:02<00:22,  2.17it/s][A
Training:  11%|█▏        | 6/53 [00:02<00:17,  2.72it/s][A
Training:  17%|█▋        | 9/53 [00:03<00:15,  2.85it/s][A
Training:  21%|██        | 11/53 [00:03<00:10,  3.94it/s][A
Training:  25%|██▍       | 13/53 [00:04<00:13,  2.88it/s][A
Training:  30%|███       | 16/53 [00:05<00:08,  4.41it/s][A
Training:  34%|███▍      | 18/53 [00:06<00:10,  3.31it/s][A
Training:  40%|███▉      | 21/53 [00:07<00:10,  3.09it/s][A
Training:  43%|████▎     | 23/53 [00:07<00:07,  3.96it/s][A
Training:  47%|████▋     | 25/53 [00:08<00:09,  3.06it/s][A
Training:  51%|█████     | 27/53 [00:08<00:06,  3.99it/s][A
Training:  55%|█████▍    | 29/53 [00:09<00:07,  3.30it/s][A
Training:  57%|█████▋    | 30/53 [00:09<00:06,  3.42it/s][A
Training:  60%|██████    | 32/53 [00:

Epoch: 50/95 - Loss: 0.1766 - Accuracy: 0.9345



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:09,  1.52s/it][A
100%|██████████| 7/7 [00:02<00:00,  2.81it/s][A
Epochs:  53%|█████▎    | 50/95 [15:34<13:25, 17.89s/it]

Val Loss: 0.2088 - Val Accuracy: 0.9128



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:01<01:11,  1.37s/it][A
Training:   4%|▍         | 2/53 [00:01<00:31,  1.60it/s][A
Training:   9%|▉         | 5/53 [00:02<00:20,  2.33it/s][A
Training:  11%|█▏        | 6/53 [00:02<00:16,  2.81it/s][A
Training:  15%|█▌        | 8/53 [00:02<00:10,  4.22it/s][A
Training:  17%|█▋        | 9/53 [00:03<00:16,  2.63it/s][A
Training:  19%|█▉        | 10/53 [00:03<00:14,  2.96it/s][A
Training:  25%|██▍       | 13/53 [00:04<00:13,  3.00it/s][A
Training:  26%|██▋       | 14/53 [00:04<00:11,  3.43it/s][A
Training:  30%|███       | 16/53 [00:05<00:07,  4.78it/s][A
Training:  32%|███▏      | 17/53 [00:05<00:11,  3.04it/s][A
Training:  36%|███▌      | 19/53 [00:06<00:07,  4.37it/s][A
Training:  40%|███▉      | 21/53 [00:07<00:10,  3.08it/s][A
Training:  42%|████▏     | 22/53 [00:07<00:08,  3.49it/s][A
Training:  45%|████▌     | 24/53 [00:07<00:05,  4.93it/s][A
Training:  49%|████▉     | 26/53 [00:0

Epoch: 51/95 - Loss: 0.1778 - Accuracy: 0.9324



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:08,  1.37s/it][A
 43%|████▎     | 3/7 [00:01<00:01,  2.47it/s][A
100%|██████████| 7/7 [00:02<00:00,  2.84it/s][A
Epochs:  54%|█████▎    | 51/95 [15:52<13:07, 17.89s/it]

Val Loss: 0.2090 - Val Accuracy: 0.9133



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:01<01:08,  1.33s/it][A
Training:   8%|▊         | 4/53 [00:01<00:13,  3.52it/s][A
Training:  11%|█▏        | 6/53 [00:02<00:18,  2.55it/s][A
Training:  15%|█▌        | 8/53 [00:02<00:11,  3.81it/s][A
Training:  19%|█▉        | 10/53 [00:03<00:15,  2.79it/s][A
Training:  23%|██▎       | 12/53 [00:03<00:10,  3.85it/s][A
Training:  26%|██▋       | 14/53 [00:04<00:13,  2.92it/s][A
Training:  30%|███       | 16/53 [00:04<00:09,  3.96it/s][A
Training:  34%|███▍      | 18/53 [00:05<00:11,  3.06it/s][A
Training:  38%|███▊      | 20/53 [00:06<00:08,  4.11it/s][A
Training:  42%|████▏     | 22/53 [00:07<00:10,  3.05it/s][A
Training:  47%|████▋     | 25/53 [00:08<00:09,  3.01it/s][A
Training:  51%|█████     | 27/53 [00:08<00:06,  3.83it/s][A
Training:  55%|█████▍    | 29/53 [00:09<00:07,  3.00it/s][A
Training:  58%|█████▊    | 31/53 [00:09<00:05,  3.83it/s][A
Training:  62%|██████▏   | 33/53 [00

Epoch: 52/95 - Loss: 0.1796 - Accuracy: 0.9329



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:08,  1.39s/it][A
100%|██████████| 7/7 [00:02<00:00,  2.80it/s][A
Epochs:  55%|█████▍    | 52/95 [16:10<12:50, 17.91s/it]

Val Loss: 0.2066 - Val Accuracy: 0.9171



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:01<01:09,  1.33s/it][A
Training:   8%|▊         | 4/53 [00:01<00:14,  3.48it/s][A
Training:  11%|█▏        | 6/53 [00:02<00:18,  2.51it/s][A
Training:  17%|█▋        | 9/53 [00:03<00:17,  2.58it/s][A
Training:  21%|██        | 11/53 [00:03<00:11,  3.51it/s][A
Training:  25%|██▍       | 13/53 [00:04<00:13,  2.88it/s][A
Training:  28%|██▊       | 15/53 [00:04<00:09,  3.85it/s][A
Training:  32%|███▏      | 17/53 [00:05<00:11,  3.05it/s][A
Training:  34%|███▍      | 18/53 [00:05<00:10,  3.41it/s][A
Training:  38%|███▊      | 20/53 [00:06<00:07,  4.68it/s][A
Training:  42%|████▏     | 22/53 [00:07<00:09,  3.37it/s][A
Training:  47%|████▋     | 25/53 [00:08<00:08,  3.16it/s][A
Training:  49%|████▉     | 26/53 [00:08<00:07,  3.49it/s][A
Training:  53%|█████▎    | 28/53 [00:08<00:05,  4.70it/s][A
Training:  57%|█████▋    | 30/53 [00:09<00:06,  3.33it/s][A
Training:  60%|██████    | 32/53 [00

Epoch: 53/95 - Loss: 0.1789 - Accuracy: 0.9330



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:08,  1.41s/it][A
 57%|█████▋    | 4/7 [00:01<00:00,  3.40it/s][A
100%|██████████| 7/7 [00:02<00:00,  2.78it/s][A
Epochs:  56%|█████▌    | 53/95 [16:28<12:32, 17.92s/it]

Val Loss: 0.2079 - Val Accuracy: 0.9160



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:01<01:08,  1.31s/it][A
Training:   6%|▌         | 3/53 [00:01<00:20,  2.42it/s][A
Training:   9%|▉         | 5/53 [00:02<00:20,  2.34it/s][A
Training:  11%|█▏        | 6/53 [00:02<00:16,  2.93it/s][A
Training:  13%|█▎        | 7/53 [00:02<00:14,  3.15it/s][A
Training:  17%|█▋        | 9/53 [00:03<00:16,  2.71it/s][A
Training:  21%|██        | 11/53 [00:03<00:11,  3.50it/s][A
Training:  25%|██▍       | 13/53 [00:04<00:12,  3.23it/s][A
Training:  28%|██▊       | 15/53 [00:05<00:10,  3.68it/s][A
Training:  32%|███▏      | 17/53 [00:05<00:10,  3.34it/s][A
Training:  34%|███▍      | 18/53 [00:05<00:09,  3.72it/s][A
Training:  36%|███▌      | 19/53 [00:06<00:08,  3.85it/s][A
Training:  40%|███▉      | 21/53 [00:06<00:09,  3.45it/s][A
Training:  42%|████▏     | 22/53 [00:06<00:07,  3.97it/s][A
Training:  43%|████▎     | 23/53 [00:07<00:07,  4.01it/s][A
Training:  47%|████▋     | 25/53 [00:0

Epoch: 54/95 - Loss: 0.1766 - Accuracy: 0.9328



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:08,  1.34s/it][A
100%|██████████| 7/7 [00:02<00:00,  2.85it/s][A
Epochs:  57%|█████▋    | 54/95 [16:45<12:14, 17.91s/it]

Val Loss: 0.2077 - Val Accuracy: 0.9117



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:01<01:06,  1.28s/it][A
Training:   8%|▊         | 4/53 [00:01<00:13,  3.63it/s][A
Training:  11%|█▏        | 6/53 [00:02<00:18,  2.61it/s][A
Training:  15%|█▌        | 8/53 [00:02<00:11,  3.90it/s][A
Training:  19%|█▉        | 10/53 [00:03<00:15,  2.73it/s][A
Training:  25%|██▍       | 13/53 [00:04<00:14,  2.84it/s][A
Training:  30%|███       | 16/53 [00:04<00:08,  4.30it/s][A
Training:  34%|███▍      | 18/53 [00:05<00:11,  3.10it/s][A
Training:  40%|███▉      | 21/53 [00:06<00:10,  3.07it/s][A
Training:  43%|████▎     | 23/53 [00:07<00:07,  3.88it/s][A
Training:  47%|████▋     | 25/53 [00:08<00:09,  2.97it/s][A
Training:  53%|█████▎    | 28/53 [00:08<00:05,  4.35it/s][A
Training:  57%|█████▋    | 30/53 [00:09<00:06,  3.34it/s][A
Training:  62%|██████▏   | 33/53 [00:10<00:06,  3.13it/s][A
Training:  66%|██████▌   | 35/53 [00:10<00:04,  3.94it/s][A
Training:  70%|██████▉   | 37/53 [00

Epoch: 55/95 - Loss: 0.1797 - Accuracy: 0.9339



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:08,  1.35s/it][A
100%|██████████| 7/7 [00:02<00:00,  2.88it/s][A
Epochs:  58%|█████▊    | 55/95 [17:03<11:53, 17.85s/it]

Val Loss: 0.2096 - Val Accuracy: 0.9139



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:01<01:06,  1.27s/it][A
Training:   6%|▌         | 3/53 [00:01<00:18,  2.68it/s][A
Training:   9%|▉         | 5/53 [00:02<00:19,  2.45it/s][A
Training:  13%|█▎        | 7/53 [00:02<00:11,  3.85it/s][A
Training:  17%|█▋        | 9/53 [00:03<00:16,  2.68it/s][A
Training:  25%|██▍       | 13/53 [00:04<00:12,  3.14it/s][A
Training:  26%|██▋       | 14/53 [00:04<00:11,  3.51it/s][A
Training:  30%|███       | 16/53 [00:04<00:07,  4.67it/s][A
Training:  34%|███▍      | 18/53 [00:05<00:10,  3.32it/s][A
Training:  36%|███▌      | 19/53 [00:05<00:09,  3.65it/s][A
Training:  40%|███▉      | 21/53 [00:06<00:10,  3.11it/s][A
Training:  42%|████▏     | 22/53 [00:06<00:08,  3.49it/s][A
Training:  47%|████▋     | 25/53 [00:07<00:08,  3.26it/s][A
Training:  49%|████▉     | 26/53 [00:08<00:07,  3.55it/s][A
Training:  55%|█████▍    | 29/53 [00:09<00:07,  3.35it/s][A
Training:  57%|█████▋    | 30/53 [00:

Epoch: 56/95 - Loss: 0.1764 - Accuracy: 0.9332



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:08,  1.40s/it][A
100%|██████████| 7/7 [00:02<00:00,  2.75it/s][A
Epochs:  59%|█████▉    | 56/95 [17:21<11:35, 17.83s/it]

Val Loss: 0.2100 - Val Accuracy: 0.9171



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:01<01:09,  1.34s/it][A
Training:   4%|▍         | 2/53 [00:01<00:31,  1.61it/s][A
Training:   9%|▉         | 5/53 [00:02<00:18,  2.58it/s][A
Training:  11%|█▏        | 6/53 [00:02<00:15,  3.06it/s][A
Training:  17%|█▋        | 9/53 [00:03<00:14,  3.11it/s][A
Training:  19%|█▉        | 10/53 [00:03<00:12,  3.53it/s][A
Training:  25%|██▍       | 13/53 [00:04<00:12,  3.24it/s][A
Training:  28%|██▊       | 15/53 [00:04<00:08,  4.26it/s][A
Training:  32%|███▏      | 17/53 [00:05<00:11,  3.03it/s][A
Training:  40%|███▉      | 21/53 [00:06<00:09,  3.23it/s][A
Training:  47%|████▋     | 25/53 [00:08<00:08,  3.25it/s][A
Training:  51%|█████     | 27/53 [00:08<00:06,  3.98it/s][A
Training:  55%|█████▍    | 29/53 [00:09<00:07,  3.09it/s][A
Training:  60%|██████    | 32/53 [00:09<00:04,  4.43it/s][A
Training:  64%|██████▍   | 34/53 [00:10<00:05,  3.26it/s][A
Training:  70%|██████▉   | 37/53 [00:

Epoch: 57/95 - Loss: 0.1782 - Accuracy: 0.9328



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:08,  1.43s/it][A
100%|██████████| 7/7 [00:02<00:00,  2.74it/s][A
Epochs:  60%|██████    | 57/95 [17:39<11:20, 17.91s/it]

Val Loss: 0.2060 - Val Accuracy: 0.9129



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:01<01:11,  1.37s/it][A
Training:   6%|▌         | 3/53 [00:01<00:19,  2.55it/s][A
Training:   9%|▉         | 5/53 [00:02<00:20,  2.34it/s][A
Training:  13%|█▎        | 7/53 [00:02<00:12,  3.67it/s][A
Training:  17%|█▋        | 9/53 [00:03<00:15,  2.80it/s][A
Training:  21%|██        | 11/53 [00:03<00:10,  3.84it/s][A
Training:  25%|██▍       | 13/53 [00:04<00:13,  3.01it/s][A
Training:  28%|██▊       | 15/53 [00:04<00:09,  3.91it/s][A
Training:  32%|███▏      | 17/53 [00:05<00:11,  3.14it/s][A
Training:  34%|███▍      | 18/53 [00:05<00:09,  3.56it/s][A
Training:  40%|███▉      | 21/53 [00:06<00:10,  3.14it/s][A
Training:  43%|████▎     | 23/53 [00:07<00:07,  4.10it/s][A
Training:  47%|████▋     | 25/53 [00:08<00:08,  3.17it/s][A
Training:  51%|█████     | 27/53 [00:08<00:06,  4.11it/s][A
Training:  55%|█████▍    | 29/53 [00:09<00:07,  3.14it/s][A
Training:  57%|█████▋    | 30/53 [00:

Epoch: 58/95 - Loss: 0.1785 - Accuracy: 0.9326



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:07,  1.31s/it][A
 43%|████▎     | 3/7 [00:01<00:01,  2.54it/s][A
100%|██████████| 7/7 [00:02<00:00,  2.82it/s][A
Epochs:  61%|██████    | 58/95 [17:57<11:02, 17.90s/it]

Val Loss: 0.2073 - Val Accuracy: 0.9139



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:01<01:17,  1.50s/it][A
Training:   6%|▌         | 3/53 [00:01<00:21,  2.34it/s][A
Training:   9%|▉         | 5/53 [00:02<00:21,  2.24it/s][A
Training:  17%|█▋        | 9/53 [00:03<00:14,  3.04it/s][A
Training:  25%|██▍       | 13/53 [00:04<00:12,  3.17it/s][A
Training:  28%|██▊       | 15/53 [00:04<00:09,  3.96it/s][A
Training:  32%|███▏      | 17/53 [00:05<00:11,  3.16it/s][A
Training:  40%|███▉      | 21/53 [00:07<00:09,  3.25it/s][A
Training:  43%|████▎     | 23/53 [00:07<00:07,  4.04it/s][A
Training:  47%|████▋     | 25/53 [00:08<00:08,  3.24it/s][A
Training:  51%|█████     | 27/53 [00:08<00:06,  4.13it/s][A
Training:  55%|█████▍    | 29/53 [00:09<00:07,  3.17it/s][A
Training:  60%|██████    | 32/53 [00:09<00:04,  4.60it/s][A
Training:  64%|██████▍   | 34/53 [00:10<00:05,  3.35it/s][A
Training:  70%|██████▉   | 37/53 [00:11<00:05,  3.07it/s][A
Training:  77%|███████▋  | 41/53 [00

Epoch: 59/95 - Loss: 0.1763 - Accuracy: 0.9344



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:08,  1.50s/it][A
100%|██████████| 7/7 [00:02<00:00,  2.75it/s][A
Epochs:  62%|██████▏   | 59/95 [18:15<10:44, 17.90s/it]

Val Loss: 0.2083 - Val Accuracy: 0.9134



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:01<01:11,  1.38s/it][A
Training:   8%|▊         | 4/53 [00:01<00:14,  3.41it/s][A
Training:  11%|█▏        | 6/53 [00:02<00:16,  2.77it/s][A
Training:  17%|█▋        | 9/53 [00:03<00:15,  2.86it/s][A
Training:  19%|█▉        | 10/53 [00:03<00:13,  3.30it/s][A
Training:  25%|██▍       | 13/53 [00:04<00:13,  3.02it/s][A
Training:  32%|███▏      | 17/53 [00:05<00:10,  3.29it/s][A
Training:  40%|███▉      | 21/53 [00:06<00:09,  3.29it/s][A
Training:  45%|████▌     | 24/53 [00:07<00:06,  4.36it/s][A
Training:  47%|████▋     | 25/53 [00:08<00:09,  3.03it/s][A
Training:  55%|█████▍    | 29/53 [00:09<00:07,  3.12it/s][A
Training:  62%|██████▏   | 33/53 [00:10<00:06,  3.26it/s][A
Training:  68%|██████▊   | 36/53 [00:10<00:04,  4.23it/s][A
Training:  70%|██████▉   | 37/53 [00:11<00:05,  2.97it/s][A
Training:  77%|███████▋  | 41/53 [00:12<00:03,  3.15it/s][A
Training:  85%|████████▍ | 45/53 [00

Epoch: 60/95 - Loss: 0.1782 - Accuracy: 0.9329



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:08,  1.42s/it][A
 57%|█████▋    | 4/7 [00:01<00:00,  3.31it/s][A
100%|██████████| 7/7 [00:02<00:00,  2.76it/s][A
Epochs:  63%|██████▎   | 60/95 [18:33<10:28, 17.95s/it]

Val Loss: 0.2055 - Val Accuracy: 0.9150



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:01<01:19,  1.52s/it][A
Training:   9%|▉         | 5/53 [00:02<00:20,  2.40it/s][A
Training:  17%|█▋        | 9/53 [00:03<00:14,  3.03it/s][A
Training:  25%|██▍       | 13/53 [00:04<00:12,  3.23it/s][A
Training:  32%|███▏      | 17/53 [00:05<00:10,  3.37it/s][A
Training:  40%|███▉      | 21/53 [00:06<00:09,  3.39it/s][A
Training:  45%|████▌     | 24/53 [00:06<00:06,  4.48it/s][A
Training:  49%|████▉     | 26/53 [00:08<00:07,  3.47it/s][A
Training:  55%|█████▍    | 29/53 [00:09<00:07,  3.22it/s][A
Training:  62%|██████▏   | 33/53 [00:10<00:06,  3.25it/s][A
Training:  70%|██████▉   | 37/53 [00:11<00:04,  3.29it/s][A
Training:  74%|███████▎  | 39/53 [00:11<00:03,  3.92it/s][A
Training:  77%|███████▋  | 41/53 [00:12<00:03,  3.21it/s][A
Training:  85%|████████▍ | 45/53 [00:13<00:02,  3.36it/s][A
Training:  92%|█████████▏| 49/53 [00:14<00:01,  3.49it/s][A
Training: 100%|██████████| 53/53 [0

Epoch: 61/95 - Loss: 0.1767 - Accuracy: 0.9347



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:08,  1.46s/it][A
100%|██████████| 7/7 [00:02<00:00,  2.69it/s][A
Epochs:  64%|██████▍   | 61/95 [18:51<10:07, 17.88s/it]

Val Loss: 0.2090 - Val Accuracy: 0.9139



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:01<01:13,  1.41s/it][A
Training:   8%|▊         | 4/53 [00:01<00:15,  3.25it/s][A
Training:  11%|█▏        | 6/53 [00:02<00:17,  2.72it/s][A
Training:  17%|█▋        | 9/53 [00:03<00:15,  2.80it/s][A
Training:  23%|██▎       | 12/53 [00:03<00:09,  4.37it/s][A
Training:  26%|██▋       | 14/53 [00:04<00:12,  3.23it/s][A
Training:  30%|███       | 16/53 [00:04<00:08,  4.21it/s][A
Training:  34%|███▍      | 18/53 [00:05<00:10,  3.21it/s][A
Training:  38%|███▊      | 20/53 [00:05<00:07,  4.17it/s][A
Training:  42%|████▏     | 22/53 [00:06<00:09,  3.23it/s][A
Training:  47%|████▋     | 25/53 [00:07<00:09,  3.05it/s][A
Training:  49%|████▉     | 26/53 [00:08<00:08,  3.35it/s][A
Training:  53%|█████▎    | 28/53 [00:08<00:05,  4.44it/s][A
Training:  55%|█████▍    | 29/53 [00:08<00:07,  3.00it/s][A
Training:  57%|█████▋    | 30/53 [00:09<00:07,  3.25it/s][A
Training:  62%|██████▏   | 33/53 [00

Epoch: 62/95 - Loss: 0.1807 - Accuracy: 0.9323



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:08,  1.39s/it][A
 43%|████▎     | 3/7 [00:01<00:01,  2.49it/s][A
100%|██████████| 7/7 [00:02<00:00,  2.68it/s][A
Epochs:  65%|██████▌   | 62/95 [19:08<09:49, 17.87s/it]

Val Loss: 0.2127 - Val Accuracy: 0.9075



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:01<01:11,  1.38s/it][A
Training:   8%|▊         | 4/53 [00:01<00:14,  3.44it/s][A
Training:  11%|█▏        | 6/53 [00:02<00:17,  2.65it/s][A
Training:  17%|█▋        | 9/53 [00:03<00:15,  2.91it/s][A
Training:  23%|██▎       | 12/53 [00:03<00:08,  4.57it/s][A
Training:  26%|██▋       | 14/53 [00:04<00:10,  3.56it/s][A
Training:  32%|███▏      | 17/53 [00:05<00:11,  3.06it/s][A
Training:  38%|███▊      | 20/53 [00:05<00:07,  4.36it/s][A
Training:  42%|████▏     | 22/53 [00:06<00:09,  3.35it/s][A
Training:  47%|████▋     | 25/53 [00:07<00:09,  3.09it/s][A
Training:  53%|█████▎    | 28/53 [00:07<00:05,  4.34it/s][A
Training:  57%|█████▋    | 30/53 [00:08<00:06,  3.38it/s][A
Training:  62%|██████▏   | 33/53 [00:10<00:06,  3.14it/s][A
Training:  68%|██████▊   | 36/53 [00:10<00:04,  4.16it/s][A
Training:  70%|██████▉   | 37/53 [00:11<00:05,  3.06it/s][A
Training:  75%|███████▌  | 40/53 [00

Epoch: 63/95 - Loss: 0.1807 - Accuracy: 0.9320



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:08,  1.43s/it][A
 57%|█████▋    | 4/7 [00:01<00:00,  3.15it/s][A
100%|██████████| 7/7 [00:02<00:00,  2.67it/s][A
Epochs:  66%|██████▋   | 63/95 [19:26<09:31, 17.85s/it]

Val Loss: 0.2145 - Val Accuracy: 0.9086



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:01<01:06,  1.27s/it][A
Training:   6%|▌         | 3/53 [00:01<00:18,  2.67it/s][A
Training:   9%|▉         | 5/53 [00:02<00:21,  2.27it/s][A
Training:  17%|█▋        | 9/53 [00:03<00:14,  2.98it/s][A
Training:  25%|██▍       | 13/53 [00:04<00:11,  3.38it/s][A
Training:  28%|██▊       | 15/53 [00:04<00:09,  4.21it/s][A
Training:  32%|███▏      | 17/53 [00:05<00:11,  3.17it/s][A
Training:  40%|███▉      | 21/53 [00:06<00:09,  3.32it/s][A
Training:  45%|████▌     | 24/53 [00:06<00:06,  4.56it/s][A
Training:  49%|████▉     | 26/53 [00:07<00:07,  3.45it/s][A
Training:  55%|█████▍    | 29/53 [00:09<00:07,  3.15it/s][A
Training:  60%|██████    | 32/53 [00:09<00:04,  4.37it/s][A
Training:  64%|██████▍   | 34/53 [00:10<00:05,  3.30it/s][A
Training:  70%|██████▉   | 37/53 [00:11<00:05,  3.06it/s][A
Training:  77%|███████▋  | 41/53 [00:12<00:03,  3.23it/s][A
Training:  83%|████████▎ | 44/53 [00

Epoch: 64/95 - Loss: 0.1780 - Accuracy: 0.9331



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:08,  1.46s/it][A
100%|██████████| 7/7 [00:02<00:00,  2.64it/s][A
Epochs:  67%|██████▋   | 64/95 [19:44<09:11, 17.81s/it]

Val Loss: 0.2076 - Val Accuracy: 0.9160



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:01<01:09,  1.34s/it][A
Training:   9%|▉         | 5/53 [00:02<00:20,  2.34it/s][A
Training:  15%|█▌        | 8/53 [00:02<00:10,  4.15it/s][A
Training:  19%|█▉        | 10/53 [00:03<00:13,  3.16it/s][A
Training:  25%|██▍       | 13/53 [00:04<00:12,  3.19it/s][A
Training:  32%|███▏      | 17/53 [00:05<00:10,  3.44it/s][A
Training:  36%|███▌      | 19/53 [00:05<00:08,  4.15it/s][A
Training:  40%|███▉      | 21/53 [00:06<00:09,  3.21it/s][A
Training:  43%|████▎     | 23/53 [00:06<00:07,  4.04it/s][A
Training:  47%|████▋     | 25/53 [00:07<00:09,  3.10it/s][A
Training:  51%|█████     | 27/53 [00:07<00:06,  4.02it/s][A
Training:  55%|█████▍    | 29/53 [00:09<00:07,  3.04it/s][A
Training:  62%|██████▏   | 33/53 [00:10<00:06,  3.12it/s][A
Training:  66%|██████▌   | 35/53 [00:10<00:04,  3.91it/s][A
Training:  70%|██████▉   | 37/53 [00:11<00:05,  3.12it/s][A
Training:  75%|███████▌  | 40/53 [0

Epoch: 65/95 - Loss: 0.1799 - Accuracy: 0.9344



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:08,  1.38s/it][A
 57%|█████▋    | 4/7 [00:01<00:00,  3.32it/s][A
100%|██████████| 7/7 [00:02<00:00,  2.73it/s][A
Epochs:  68%|██████▊   | 65/95 [20:02<08:53, 17.78s/it]

Val Loss: 0.2088 - Val Accuracy: 0.9149



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:01<01:14,  1.43s/it][A
Training:   8%|▊         | 4/53 [00:01<00:15,  3.22it/s][A
Training:  11%|█▏        | 6/53 [00:02<00:18,  2.59it/s][A
Training:  17%|█▋        | 9/53 [00:03<00:16,  2.70it/s][A
Training:  25%|██▍       | 13/53 [00:04<00:12,  3.26it/s][A
Training:  30%|███       | 16/53 [00:04<00:08,  4.62it/s][A
Training:  34%|███▍      | 18/53 [00:05<00:10,  3.47it/s][A
Training:  40%|███▉      | 21/53 [00:06<00:09,  3.21it/s][A
Training:  43%|████▎     | 23/53 [00:06<00:07,  3.94it/s][A
Training:  47%|████▋     | 25/53 [00:08<00:09,  3.04it/s][A
Training:  51%|█████     | 27/53 [00:08<00:06,  3.90it/s][A
Training:  55%|█████▍    | 29/53 [00:09<00:07,  3.08it/s][A
Training:  58%|█████▊    | 31/53 [00:09<00:05,  3.89it/s][A
Training:  62%|██████▏   | 33/53 [00:10<00:06,  3.19it/s][A
Training:  66%|██████▌   | 35/53 [00:10<00:04,  3.90it/s][A
Training:  70%|██████▉   | 37/53 [00

Epoch: 66/95 - Loss: 0.1774 - Accuracy: 0.9360



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:08,  1.49s/it][A
100%|██████████| 7/7 [00:02<00:00,  2.72it/s][A
Epochs:  69%|██████▉   | 66/95 [20:19<08:36, 17.80s/it]

Val Loss: 0.2073 - Val Accuracy: 0.9165



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:01<01:14,  1.43s/it][A
Training:   6%|▌         | 3/53 [00:01<00:20,  2.44it/s][A
Training:   9%|▉         | 5/53 [00:02<00:21,  2.23it/s][A
Training:  15%|█▌        | 8/53 [00:02<00:10,  4.32it/s][A
Training:  19%|█▉        | 10/53 [00:03<00:14,  3.05it/s][A
Training:  25%|██▍       | 13/53 [00:04<00:12,  3.14it/s][A
Training:  32%|███▏      | 17/53 [00:05<00:10,  3.42it/s][A
Training:  34%|███▍      | 18/53 [00:05<00:09,  3.75it/s][A
Training:  40%|███▉      | 21/53 [00:06<00:09,  3.33it/s][A
Training:  43%|████▎     | 23/53 [00:06<00:07,  4.22it/s][A
Training:  47%|████▋     | 25/53 [00:07<00:08,  3.25it/s][A
Training:  49%|████▉     | 26/53 [00:08<00:07,  3.54it/s][A
Training:  55%|█████▍    | 29/53 [00:09<00:07,  3.21it/s][A
Training:  58%|█████▊    | 31/53 [00:09<00:05,  4.07it/s][A
Training:  62%|██████▏   | 33/53 [00:10<00:06,  3.19it/s][A
Training:  66%|██████▌   | 35/53 [00

Epoch: 67/95 - Loss: 0.1782 - Accuracy: 0.9345



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:08,  1.43s/it][A
 57%|█████▋    | 4/7 [00:01<00:00,  3.33it/s][A
100%|██████████| 7/7 [00:02<00:00,  2.71it/s][A
Epochs:  71%|███████   | 67/95 [20:37<08:18, 17.79s/it]

Val Loss: 0.2090 - Val Accuracy: 0.9160



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:01<01:12,  1.40s/it][A
Training:   8%|▊         | 4/53 [00:01<00:14,  3.29it/s][A
Training:  11%|█▏        | 6/53 [00:02<00:17,  2.63it/s][A
Training:  17%|█▋        | 9/53 [00:03<00:15,  2.87it/s][A
Training:  21%|██        | 11/53 [00:03<00:10,  3.84it/s][A
Training:  25%|██▍       | 13/53 [00:04<00:13,  3.04it/s][A
Training:  30%|███       | 16/53 [00:04<00:08,  4.57it/s][A
Training:  34%|███▍      | 18/53 [00:05<00:09,  3.56it/s][A
Training:  40%|███▉      | 21/53 [00:06<00:09,  3.33it/s][A
Training:  42%|████▏     | 22/53 [00:06<00:08,  3.49it/s][A
Training:  45%|████▌     | 24/53 [00:06<00:06,  4.58it/s][A
Training:  47%|████▋     | 25/53 [00:07<00:09,  3.08it/s][A
Training:  49%|████▉     | 26/53 [00:07<00:08,  3.23it/s][A
Training:  53%|█████▎    | 28/53 [00:08<00:05,  4.61it/s][A
Training:  55%|█████▍    | 29/53 [00:08<00:08,  2.99it/s][A
Training:  57%|█████▋    | 30/53 [00

Epoch: 68/95 - Loss: 0.1765 - Accuracy: 0.9331



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:08,  1.42s/it][A
 57%|█████▋    | 4/7 [00:01<00:00,  3.34it/s][A
100%|██████████| 7/7 [00:02<00:00,  2.72it/s][A
Epochs:  72%|███████▏  | 68/95 [20:55<07:59, 17.76s/it]

Val Loss: 0.2070 - Val Accuracy: 0.9144



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:01<01:11,  1.37s/it][A
Training:   4%|▍         | 2/53 [00:01<00:32,  1.59it/s][A
Training:   9%|▉         | 5/53 [00:02<00:19,  2.51it/s][A
Training:  11%|█▏        | 6/53 [00:02<00:16,  2.93it/s][A
Training:  17%|█▋        | 9/53 [00:03<00:13,  3.28it/s][A
Training:  19%|█▉        | 10/53 [00:03<00:12,  3.55it/s][A
Training:  25%|██▍       | 13/53 [00:04<00:11,  3.36it/s][A
Training:  26%|██▋       | 14/53 [00:04<00:11,  3.43it/s][A
Training:  32%|███▏      | 17/53 [00:05<00:10,  3.57it/s][A
Training:  34%|███▍      | 18/53 [00:05<00:09,  3.61it/s][A
Training:  40%|███▉      | 21/53 [00:06<00:08,  3.72it/s][A
Training:  42%|████▏     | 22/53 [00:06<00:08,  3.61it/s][A
Training:  47%|████▋     | 25/53 [00:07<00:08,  3.49it/s][A
Training:  49%|████▉     | 26/53 [00:08<00:07,  3.60it/s][A
Training:  53%|█████▎    | 28/53 [00:08<00:05,  4.85it/s][A
Training:  55%|█████▍    | 29/53 [00:

Epoch: 69/95 - Loss: 0.1783 - Accuracy: 0.9331



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:08,  1.44s/it][A
 29%|██▊       | 2/7 [00:01<00:03,  1.51it/s][A
100%|██████████| 7/7 [00:02<00:00,  2.69it/s][A
Epochs:  73%|███████▎  | 69/95 [21:13<07:42, 17.78s/it]

Val Loss: 0.2105 - Val Accuracy: 0.9149



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:01<01:13,  1.41s/it][A
Training:   8%|▊         | 4/53 [00:01<00:15,  3.27it/s][A
Training:  11%|█▏        | 6/53 [00:02<00:17,  2.69it/s][A
Training:  15%|█▌        | 8/53 [00:02<00:11,  3.93it/s][A
Training:  19%|█▉        | 10/53 [00:03<00:14,  3.04it/s][A
Training:  25%|██▍       | 13/53 [00:04<00:13,  3.03it/s][A
Training:  26%|██▋       | 14/53 [00:04<00:11,  3.36it/s][A
Training:  32%|███▏      | 17/53 [00:05<00:11,  3.21it/s][A
Training:  34%|███▍      | 18/53 [00:05<00:09,  3.60it/s][A
Training:  40%|███▉      | 21/53 [00:06<00:09,  3.43it/s][A
Training:  45%|████▌     | 24/53 [00:06<00:05,  5.09it/s][A
Training:  49%|████▉     | 26/53 [00:07<00:07,  3.38it/s][A
Training:  55%|█████▍    | 29/53 [00:08<00:07,  3.26it/s][A
Training:  57%|█████▋    | 30/53 [00:09<00:06,  3.60it/s][A
Training:  62%|██████▏   | 33/53 [00:10<00:06,  3.33it/s][A
Training:  64%|██████▍   | 34/53 [00

Epoch: 70/95 - Loss: 0.1758 - Accuracy: 0.9346



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:08,  1.45s/it][A
 57%|█████▋    | 4/7 [00:01<00:00,  3.27it/s][A
100%|██████████| 7/7 [00:02<00:00,  2.67it/s][A
Epochs:  74%|███████▎  | 70/95 [21:30<07:23, 17.74s/it]

Val Loss: 0.2069 - Val Accuracy: 0.9165



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:01<01:14,  1.43s/it][A
Training:   4%|▍         | 2/53 [00:01<00:33,  1.51it/s][A
Training:   9%|▉         | 5/53 [00:02<00:19,  2.44it/s][A
Training:  15%|█▌        | 8/53 [00:02<00:09,  4.51it/s][A
Training:  19%|█▉        | 10/53 [00:03<00:14,  3.03it/s][A
Training:  25%|██▍       | 13/53 [00:04<00:13,  2.93it/s][A
Training:  28%|██▊       | 15/53 [00:04<00:09,  3.82it/s][A
Training:  32%|███▏      | 17/53 [00:05<00:12,  2.94it/s][A
Training:  40%|███▉      | 21/53 [00:06<00:09,  3.41it/s][A
Training:  45%|████▌     | 24/53 [00:07<00:06,  4.72it/s][A
Training:  49%|████▉     | 26/53 [00:08<00:07,  3.59it/s][A
Training:  53%|█████▎    | 28/53 [00:08<00:05,  4.50it/s][A
Training:  57%|█████▋    | 30/53 [00:09<00:06,  3.37it/s][A
Training:  62%|██████▏   | 33/53 [00:10<00:06,  3.16it/s][A
Training:  66%|██████▌   | 35/53 [00:10<00:04,  3.86it/s][A
Training:  70%|██████▉   | 37/53 [00

Epoch: 71/95 - Loss: 0.1786 - Accuracy: 0.9330



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:08,  1.41s/it][A
100%|██████████| 7/7 [00:02<00:00,  2.73it/s][A
Epochs:  75%|███████▍  | 71/95 [21:48<07:05, 17.72s/it]

Val Loss: 0.2094 - Val Accuracy: 0.9144



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:01<01:13,  1.42s/it][A
Training:   8%|▊         | 4/53 [00:01<00:15,  3.18it/s][A
Training:  11%|█▏        | 6/53 [00:02<00:17,  2.69it/s][A
Training:  15%|█▌        | 8/53 [00:02<00:11,  3.78it/s][A
Training:  17%|█▋        | 9/53 [00:03<00:17,  2.45it/s][A
Training:  21%|██        | 11/53 [00:03<00:11,  3.64it/s][A
Training:  25%|██▍       | 13/53 [00:04<00:13,  2.93it/s][A
Training:  30%|███       | 16/53 [00:04<00:07,  4.76it/s][A
Training:  34%|███▍      | 18/53 [00:05<00:10,  3.33it/s][A
Training:  38%|███▊      | 20/53 [00:05<00:07,  4.23it/s][A
Training:  42%|████▏     | 22/53 [00:06<00:08,  3.46it/s][A
Training:  43%|████▎     | 23/53 [00:06<00:08,  3.66it/s][A
Training:  47%|████▋     | 25/53 [00:07<00:09,  3.05it/s][A
Training:  51%|█████     | 27/53 [00:08<00:06,  4.02it/s][A
Training:  55%|█████▍    | 29/53 [00:08<00:07,  3.11it/s][A
Training:  58%|█████▊    | 31/53 [00:

Epoch: 72/95 - Loss: 0.1762 - Accuracy: 0.9332



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:08,  1.46s/it][A
100%|██████████| 7/7 [00:02<00:00,  2.72it/s][A
Epochs:  76%|███████▌  | 72/95 [22:06<06:46, 17.67s/it]

Val Loss: 0.2096 - Val Accuracy: 0.9133



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:01<01:16,  1.47s/it][A
Training:   8%|▊         | 4/53 [00:01<00:14,  3.27it/s][A
Training:  11%|█▏        | 6/53 [00:02<00:18,  2.59it/s][A
Training:  15%|█▌        | 8/53 [00:02<00:11,  3.80it/s][A
Training:  19%|█▉        | 10/53 [00:03<00:15,  2.75it/s][A
Training:  25%|██▍       | 13/53 [00:04<00:14,  2.79it/s][A
Training:  28%|██▊       | 15/53 [00:04<00:10,  3.72it/s][A
Training:  32%|███▏      | 17/53 [00:05<00:11,  3.07it/s][A
Training:  36%|███▌      | 19/53 [00:06<00:08,  3.87it/s][A
Training:  40%|███▉      | 21/53 [00:07<00:10,  3.06it/s][A
Training:  43%|████▎     | 23/53 [00:07<00:07,  4.04it/s][A
Training:  47%|████▋     | 25/53 [00:08<00:08,  3.23it/s][A
Training:  53%|█████▎    | 28/53 [00:08<00:05,  4.91it/s][A
Training:  57%|█████▋    | 30/53 [00:09<00:06,  3.54it/s][A
Training:  62%|██████▏   | 33/53 [00:10<00:06,  3.18it/s][A
Training:  68%|██████▊   | 36/53 [00

Epoch: 73/95 - Loss: 0.1769 - Accuracy: 0.9341



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:08,  1.43s/it][A
100%|██████████| 7/7 [00:02<00:00,  2.76it/s][A
Epochs:  77%|███████▋  | 73/95 [22:23<06:29, 17.68s/it]

Val Loss: 0.2062 - Val Accuracy: 0.9149



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:01<01:12,  1.40s/it][A
Training:   6%|▌         | 3/53 [00:01<00:20,  2.50it/s][A
Training:   9%|▉         | 5/53 [00:02<00:21,  2.23it/s][A
Training:  13%|█▎        | 7/53 [00:02<00:13,  3.52it/s][A
Training:  17%|█▋        | 9/53 [00:03<00:17,  2.57it/s][A
Training:  23%|██▎       | 12/53 [00:03<00:09,  4.30it/s][A
Training:  26%|██▋       | 14/53 [00:04<00:12,  3.07it/s][A
Training:  32%|███▏      | 17/53 [00:06<00:12,  2.87it/s][A
Training:  38%|███▊      | 20/53 [00:06<00:07,  4.20it/s][A
Training:  42%|████▏     | 22/53 [00:07<00:09,  3.24it/s][A
Training:  43%|████▎     | 23/53 [00:07<00:08,  3.61it/s][A
Training:  47%|████▋     | 25/53 [00:08<00:09,  3.02it/s][A
Training:  51%|█████     | 27/53 [00:08<00:06,  4.01it/s][A
Training:  55%|█████▍    | 29/53 [00:09<00:07,  3.12it/s][A
Training:  58%|█████▊    | 31/53 [00:09<00:05,  3.98it/s][A
Training:  62%|██████▏   | 33/53 [00:

Epoch: 74/95 - Loss: 0.1786 - Accuracy: 0.9319



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:08,  1.40s/it][A
 43%|████▎     | 3/7 [00:01<00:01,  2.45it/s][A
100%|██████████| 7/7 [00:02<00:00,  2.80it/s][A
Epochs:  78%|███████▊  | 74/95 [22:41<06:12, 17.76s/it]

Val Loss: 0.2049 - Val Accuracy: 0.9134



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:01<01:15,  1.46s/it][A
Training:   6%|▌         | 3/53 [00:01<00:20,  2.40it/s][A
Training:   9%|▉         | 5/53 [00:02<00:23,  2.08it/s][A
Training:  15%|█▌        | 8/53 [00:02<00:11,  4.04it/s][A
Training:  19%|█▉        | 10/53 [00:03<00:14,  2.92it/s][A
Training:  25%|██▍       | 13/53 [00:04<00:14,  2.84it/s][A
Training:  28%|██▊       | 15/53 [00:05<00:10,  3.70it/s][A
Training:  32%|███▏      | 17/53 [00:05<00:11,  3.06it/s][A
Training:  34%|███▍      | 18/53 [00:06<00:10,  3.46it/s][A
Training:  40%|███▉      | 21/53 [00:07<00:09,  3.25it/s][A
Training:  42%|████▏     | 22/53 [00:07<00:08,  3.64it/s][A
Training:  45%|████▌     | 24/53 [00:07<00:05,  4.87it/s][A
Training:  49%|████▉     | 26/53 [00:08<00:07,  3.47it/s][A
Training:  55%|█████▍    | 29/53 [00:09<00:07,  3.34it/s][A
Training:  58%|█████▊    | 31/53 [00:09<00:05,  4.34it/s][A
Training:  62%|██████▏   | 33/53 [00

Epoch: 75/95 - Loss: 0.1792 - Accuracy: 0.9336



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:08,  1.43s/it][A
100%|██████████| 7/7 [00:02<00:00,  2.79it/s][A
Epochs:  79%|███████▉  | 75/95 [22:59<05:54, 17.73s/it]

Val Loss: 0.2103 - Val Accuracy: 0.9133



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:01<01:14,  1.43s/it][A
Training:   6%|▌         | 3/53 [00:01<00:20,  2.44it/s][A
Training:   9%|▉         | 5/53 [00:02<00:20,  2.32it/s][A
Training:  13%|█▎        | 7/53 [00:02<00:12,  3.58it/s][A
Training:  17%|█▋        | 9/53 [00:03<00:16,  2.68it/s][A
Training:  21%|██        | 11/53 [00:03<00:11,  3.77it/s][A
Training:  25%|██▍       | 13/53 [00:04<00:13,  2.93it/s][A
Training:  28%|██▊       | 15/53 [00:04<00:10,  3.76it/s][A
Training:  32%|███▏      | 17/53 [00:05<00:11,  3.06it/s][A
Training:  34%|███▍      | 18/53 [00:06<00:10,  3.49it/s][A
Training:  38%|███▊      | 20/53 [00:06<00:07,  4.66it/s][A
Training:  40%|███▉      | 21/53 [00:07<00:10,  2.95it/s][A
Training:  45%|████▌     | 24/53 [00:07<00:06,  4.52it/s][A
Training:  47%|████▋     | 25/53 [00:08<00:09,  2.95it/s][A
Training:  53%|█████▎    | 28/53 [00:08<00:05,  4.31it/s][A
Training:  55%|█████▍    | 29/53 [00:

Epoch: 76/95 - Loss: 0.1755 - Accuracy: 0.9341



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:08,  1.44s/it][A
100%|██████████| 7/7 [00:02<00:00,  2.84it/s][A
Epochs:  80%|████████  | 76/95 [23:17<05:37, 17.75s/it]

Val Loss: 0.2094 - Val Accuracy: 0.9134



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:01<01:14,  1.43s/it][A
Training:   9%|▉         | 5/53 [00:02<00:21,  2.23it/s][A
Training:  17%|█▋        | 9/53 [00:03<00:15,  2.85it/s][A
Training:  21%|██        | 11/53 [00:03<00:11,  3.71it/s][A
Training:  25%|██▍       | 13/53 [00:04<00:13,  3.02it/s][A
Training:  28%|██▊       | 15/53 [00:04<00:09,  3.94it/s][A
Training:  32%|███▏      | 17/53 [00:05<00:12,  2.97it/s][A
Training:  38%|███▊      | 20/53 [00:06<00:07,  4.43it/s][A
Training:  42%|████▏     | 22/53 [00:07<00:09,  3.18it/s][A
Training:  45%|████▌     | 24/53 [00:07<00:07,  4.09it/s][A
Training:  49%|████▉     | 26/53 [00:08<00:08,  3.16it/s][A
Training:  53%|█████▎    | 28/53 [00:08<00:06,  4.15it/s][A
Training:  57%|█████▋    | 30/53 [00:09<00:06,  3.33it/s][A
Training:  62%|██████▏   | 33/53 [00:10<00:06,  3.13it/s][A
Training:  70%|██████▉   | 37/53 [00:11<00:04,  3.22it/s][A
Training:  75%|███████▌  | 40/53 [0

Epoch: 77/95 - Loss: 0.1768 - Accuracy: 0.9342



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:08,  1.45s/it][A
 57%|█████▋    | 4/7 [00:01<00:00,  3.25it/s][A
100%|██████████| 7/7 [00:02<00:00,  2.78it/s][A
Epochs:  81%|████████  | 77/95 [23:34<05:19, 17.73s/it]

Val Loss: 0.2098 - Val Accuracy: 0.9149



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:01<01:18,  1.52s/it][A
Training:   9%|▉         | 5/53 [00:02<00:22,  2.17it/s][A
Training:  17%|█▋        | 9/53 [00:03<00:16,  2.71it/s][A
Training:  23%|██▎       | 12/53 [00:03<00:10,  4.04it/s][A
Training:  26%|██▋       | 14/53 [00:05<00:12,  3.06it/s][A
Training:  32%|███▏      | 17/53 [00:06<00:12,  2.97it/s][A
Training:  34%|███▍      | 18/53 [00:06<00:10,  3.29it/s][A
Training:  38%|███▊      | 20/53 [00:06<00:07,  4.34it/s][A
Training:  42%|████▏     | 22/53 [00:07<00:09,  3.18it/s][A
Training:  47%|████▋     | 25/53 [00:08<00:08,  3.12it/s][A
Training:  49%|████▉     | 26/53 [00:08<00:08,  3.34it/s][A
Training:  53%|█████▎    | 28/53 [00:08<00:05,  4.46it/s][A
Training:  55%|█████▍    | 29/53 [00:09<00:07,  3.09it/s][A
Training:  57%|█████▋    | 30/53 [00:09<00:06,  3.50it/s][A
Training:  62%|██████▏   | 33/53 [00:10<00:05,  3.41it/s][A
Training:  64%|██████▍   | 34/53 [0

Epoch: 78/95 - Loss: 0.1789 - Accuracy: 0.9336



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:08,  1.37s/it][A
 71%|███████▏  | 5/7 [00:02<00:00,  2.47it/s][A
100%|██████████| 7/7 [00:02<00:00,  2.77it/s][A
Epochs:  82%|████████▏ | 78/95 [23:52<05:02, 17.81s/it]

Val Loss: 0.2087 - Val Accuracy: 0.9139



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:01<01:10,  1.37s/it][A
Training:   6%|▌         | 3/53 [00:01<00:20,  2.48it/s][A
Training:   9%|▉         | 5/53 [00:02<00:21,  2.19it/s][A
Training:  11%|█▏        | 6/53 [00:02<00:17,  2.61it/s][A
Training:  17%|█▋        | 9/53 [00:03<00:15,  2.93it/s][A
Training:  19%|█▉        | 10/53 [00:03<00:13,  3.08it/s][A
Training:  25%|██▍       | 13/53 [00:04<00:12,  3.26it/s][A
Training:  26%|██▋       | 14/53 [00:04<00:11,  3.41it/s][A
Training:  32%|███▏      | 17/53 [00:05<00:10,  3.28it/s][A
Training:  34%|███▍      | 18/53 [00:06<00:09,  3.53it/s][A
Training:  40%|███▉      | 21/53 [00:07<00:09,  3.38it/s][A
Training:  42%|████▏     | 22/53 [00:07<00:08,  3.74it/s][A
Training:  47%|████▋     | 25/53 [00:08<00:07,  3.57it/s][A
Training:  49%|████▉     | 26/53 [00:08<00:06,  3.99it/s][A
Training:  53%|█████▎    | 28/53 [00:08<00:04,  5.08it/s][A
Training:  55%|█████▍    | 29/53 [00:

Epoch: 79/95 - Loss: 0.1793 - Accuracy: 0.9329



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:08,  1.42s/it][A
100%|██████████| 7/7 [00:02<00:00,  2.75it/s][A
Epochs:  83%|████████▎ | 79/95 [24:10<04:44, 17.76s/it]

Val Loss: 0.2083 - Val Accuracy: 0.9123



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:01<01:13,  1.41s/it][A
Training:   9%|▉         | 5/53 [00:02<00:23,  2.09it/s][A
Training:  13%|█▎        | 7/53 [00:02<00:14,  3.14it/s][A
Training:  17%|█▋        | 9/53 [00:03<00:16,  2.60it/s][A
Training:  23%|██▎       | 12/53 [00:03<00:09,  4.19it/s][A
Training:  26%|██▋       | 14/53 [00:05<00:12,  3.01it/s][A
Training:  30%|███       | 16/53 [00:05<00:09,  3.96it/s][A
Training:  34%|███▍      | 18/53 [00:06<00:11,  3.06it/s][A
Training:  40%|███▉      | 21/53 [00:07<00:11,  2.88it/s][A
Training:  47%|████▋     | 25/53 [00:08<00:08,  3.26it/s][A
Training:  53%|█████▎    | 28/53 [00:08<00:05,  4.46it/s][A
Training:  57%|█████▋    | 30/53 [00:09<00:06,  3.37it/s][A
Training:  62%|██████▏   | 33/53 [00:10<00:05,  3.35it/s][A
Training:  70%|██████▉   | 37/53 [00:11<00:04,  3.42it/s][A
Training:  77%|███████▋  | 41/53 [00:12<00:03,  3.40it/s][A
Training:  81%|████████  | 43/53 [00

Epoch: 80/95 - Loss: 0.1773 - Accuracy: 0.9341



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:07,  1.32s/it][A
 43%|████▎     | 3/7 [00:01<00:01,  2.60it/s][A
100%|██████████| 7/7 [00:02<00:00,  2.76it/s][A
Epochs:  84%|████████▍ | 80/95 [24:28<04:26, 17.79s/it]

Val Loss: 0.2092 - Val Accuracy: 0.9123



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:01<01:16,  1.47s/it][A
Training:   8%|▊         | 4/53 [00:01<00:15,  3.22it/s][A
Training:  11%|█▏        | 6/53 [00:02<00:19,  2.42it/s][A
Training:  15%|█▌        | 8/53 [00:02<00:12,  3.58it/s][A
Training:  19%|█▉        | 10/53 [00:03<00:14,  2.87it/s][A
Training:  23%|██▎       | 12/53 [00:03<00:10,  3.87it/s][A
Training:  25%|██▍       | 13/53 [00:04<00:15,  2.56it/s][A
Training:  26%|██▋       | 14/53 [00:04<00:12,  3.04it/s][A
Training:  30%|███       | 16/53 [00:05<00:08,  4.19it/s][A
Training:  32%|███▏      | 17/53 [00:06<00:13,  2.67it/s][A
Training:  36%|███▌      | 19/53 [00:06<00:08,  3.97it/s][A
Training:  40%|███▉      | 21/53 [00:07<00:11,  2.90it/s][A
Training:  42%|████▏     | 22/53 [00:07<00:09,  3.24it/s][A
Training:  45%|████▌     | 24/53 [00:07<00:06,  4.64it/s][A
Training:  49%|████▉     | 26/53 [00:08<00:08,  3.25it/s][A
Training:  53%|█████▎    | 28/53 [00

Epoch: 81/95 - Loss: 0.1762 - Accuracy: 0.9347



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:08,  1.36s/it][A
100%|██████████| 7/7 [00:02<00:00,  2.82it/s][A
Epochs:  85%|████████▌ | 81/95 [24:46<04:08, 17.78s/it]

Val Loss: 0.2060 - Val Accuracy: 0.9149



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:01<01:08,  1.31s/it][A
Training:   4%|▍         | 2/53 [00:01<00:31,  1.64it/s][A
Training:   9%|▉         | 5/53 [00:02<00:19,  2.42it/s][A
Training:  11%|█▏        | 6/53 [00:02<00:16,  2.93it/s][A
Training:  15%|█▌        | 8/53 [00:02<00:09,  4.55it/s][A
Training:  19%|█▉        | 10/53 [00:03<00:14,  3.07it/s][A
Training:  25%|██▍       | 13/53 [00:04<00:12,  3.08it/s][A
Training:  26%|██▋       | 14/53 [00:04<00:11,  3.27it/s][A
Training:  32%|███▏      | 17/53 [00:05<00:11,  3.17it/s][A
Training:  34%|███▍      | 18/53 [00:06<00:10,  3.37it/s][A
Training:  38%|███▊      | 20/53 [00:06<00:07,  4.53it/s][A
Training:  40%|███▉      | 21/53 [00:06<00:10,  3.03it/s][A
Training:  43%|████▎     | 23/53 [00:07<00:07,  4.11it/s][A
Training:  47%|████▋     | 25/53 [00:08<00:08,  3.17it/s][A
Training:  51%|█████     | 27/53 [00:08<00:06,  3.87it/s][A
Training:  55%|█████▍    | 29/53 [00:

Epoch: 82/95 - Loss: 0.1796 - Accuracy: 0.9336



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:07,  1.32s/it][A
 29%|██▊       | 2/7 [00:01<00:03,  1.51it/s][A
 71%|███████▏  | 5/7 [00:02<00:00,  2.50it/s][A
100%|██████████| 7/7 [00:02<00:00,  2.68it/s][A
Epochs:  86%|████████▋ | 82/95 [25:03<03:50, 17.74s/it]

Val Loss: 0.2093 - Val Accuracy: 0.9139



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:01<01:14,  1.43s/it][A
Training:   9%|▉         | 5/53 [00:02<00:22,  2.16it/s][A
Training:  17%|█▋        | 9/53 [00:03<00:15,  2.76it/s][A
Training:  23%|██▎       | 12/53 [00:03<00:10,  3.94it/s][A
Training:  25%|██▍       | 13/53 [00:04<00:15,  2.66it/s][A
Training:  30%|███       | 16/53 [00:05<00:08,  4.13it/s][A
Training:  34%|███▍      | 18/53 [00:06<00:11,  3.15it/s][A
Training:  38%|███▊      | 20/53 [00:06<00:08,  4.04it/s][A
Training:  42%|████▏     | 22/53 [00:07<00:09,  3.12it/s][A
Training:  45%|████▌     | 24/53 [00:07<00:07,  4.12it/s][A
Training:  49%|████▉     | 26/53 [00:08<00:08,  3.05it/s][A
Training:  55%|█████▍    | 29/53 [00:09<00:07,  3.05it/s][A
Training:  62%|██████▏   | 33/53 [00:10<00:06,  3.19it/s][A
Training:  66%|██████▌   | 35/53 [00:10<00:04,  3.96it/s][A
Training:  70%|██████▉   | 37/53 [00:11<00:04,  3.27it/s][A
Training:  77%|███████▋  | 41/53 [0

Epoch: 83/95 - Loss: 0.1772 - Accuracy: 0.9336



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:08,  1.41s/it][A
 43%|████▎     | 3/7 [00:01<00:01,  2.49it/s][A
100%|██████████| 7/7 [00:02<00:00,  2.75it/s][A
Epochs:  87%|████████▋ | 83/95 [25:21<03:32, 17.72s/it]

Val Loss: 0.2063 - Val Accuracy: 0.9144



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:01<01:15,  1.45s/it][A
Training:   6%|▌         | 3/53 [00:01<00:21,  2.37it/s][A
Training:   9%|▉         | 5/53 [00:02<00:22,  2.11it/s][A
Training:  15%|█▌        | 8/53 [00:02<00:11,  4.06it/s][A
Training:  19%|█▉        | 10/53 [00:03<00:15,  2.79it/s][A
Training:  25%|██▍       | 13/53 [00:05<00:14,  2.74it/s][A
Training:  32%|███▏      | 17/53 [00:06<00:12,  2.98it/s][A
Training:  38%|███▊      | 20/53 [00:06<00:07,  4.18it/s][A
Training:  42%|████▏     | 22/53 [00:07<00:09,  3.24it/s][A
Training:  47%|████▋     | 25/53 [00:08<00:09,  3.00it/s][A
Training:  51%|█████     | 27/53 [00:08<00:06,  3.76it/s][A
Training:  55%|█████▍    | 29/53 [00:09<00:07,  3.17it/s][A
Training:  62%|██████▏   | 33/53 [00:10<00:06,  3.30it/s][A
Training:  66%|██████▌   | 35/53 [00:10<00:04,  4.07it/s][A
Training:  70%|██████▉   | 37/53 [00:11<00:04,  3.38it/s][A
Training:  75%|███████▌  | 40/53 [00

Epoch: 84/95 - Loss: 0.1795 - Accuracy: 0.9342



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:08,  1.42s/it][A
100%|██████████| 7/7 [00:02<00:00,  2.86it/s][A
Epochs:  88%|████████▊ | 84/95 [25:39<03:14, 17.72s/it]

Val Loss: 0.2060 - Val Accuracy: 0.9128



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:01<01:13,  1.41s/it][A
Training:   6%|▌         | 3/53 [00:01<00:20,  2.38it/s][A
Training:   9%|▉         | 5/53 [00:02<00:22,  2.17it/s][A
Training:  15%|█▌        | 8/53 [00:02<00:10,  4.14it/s][A
Training:  19%|█▉        | 10/53 [00:03<00:13,  3.09it/s][A
Training:  23%|██▎       | 12/53 [00:03<00:10,  3.94it/s][A
Training:  25%|██▍       | 13/53 [00:04<00:14,  2.72it/s][A
Training:  28%|██▊       | 15/53 [00:04<00:09,  3.87it/s][A
Training:  32%|███▏      | 17/53 [00:05<00:12,  2.97it/s][A
Training:  36%|███▌      | 19/53 [00:06<00:08,  3.86it/s][A
Training:  38%|███▊      | 20/53 [00:06<00:08,  4.02it/s][A
Training:  40%|███▉      | 21/53 [00:06<00:10,  2.91it/s][A
Training:  43%|████▎     | 23/53 [00:07<00:07,  3.84it/s][A
Training:  45%|████▌     | 24/53 [00:07<00:07,  3.97it/s][A
Training:  47%|████▋     | 25/53 [00:08<00:09,  2.91it/s][A
Training:  49%|████▉     | 26/53 [00

Epoch: 85/95 - Loss: 0.1751 - Accuracy: 0.9355



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:08,  1.44s/it][A
 57%|█████▋    | 4/7 [00:01<00:00,  3.29it/s][A
100%|██████████| 7/7 [00:02<00:00,  2.78it/s][A
Epochs:  89%|████████▉ | 85/95 [25:56<02:56, 17.68s/it]

Val Loss: 0.2063 - Val Accuracy: 0.9144



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:01<01:14,  1.42s/it][A
Training:   9%|▉         | 5/53 [00:02<00:21,  2.21it/s][A
Training:  15%|█▌        | 8/53 [00:02<00:11,  3.83it/s][A
Training:  19%|█▉        | 10/53 [00:03<00:14,  2.89it/s][A
Training:  23%|██▎       | 12/53 [00:03<00:10,  3.88it/s][A
Training:  26%|██▋       | 14/53 [00:04<00:12,  3.10it/s][A
Training:  28%|██▊       | 15/53 [00:05<00:11,  3.40it/s][A
Training:  32%|███▏      | 17/53 [00:06<00:13,  2.73it/s][A
Training:  36%|███▌      | 19/53 [00:06<00:09,  3.50it/s][A
Training:  40%|███▉      | 21/53 [00:07<00:11,  2.90it/s][A
Training:  43%|████▎     | 23/53 [00:07<00:08,  3.67it/s][A
Training:  47%|████▋     | 25/53 [00:08<00:09,  2.97it/s][A
Training:  51%|█████     | 27/53 [00:08<00:06,  3.73it/s][A
Training:  55%|█████▍    | 29/53 [00:09<00:07,  3.08it/s][A
Training:  58%|█████▊    | 31/53 [00:09<00:05,  3.88it/s][A
Training:  62%|██████▏   | 33/53 [0

Epoch: 86/95 - Loss: 0.1755 - Accuracy: 0.9349



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:08,  1.39s/it][A
 57%|█████▋    | 4/7 [00:01<00:00,  3.44it/s][A
100%|██████████| 7/7 [00:02<00:00,  2.82it/s][A
Epochs:  91%|█████████ | 86/95 [26:14<02:39, 17.69s/it]

Val Loss: 0.2077 - Val Accuracy: 0.9149



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:01<01:19,  1.52s/it][A
Training:   9%|▉         | 5/53 [00:02<00:23,  2.03it/s][A
Training:  13%|█▎        | 7/53 [00:02<00:15,  3.06it/s][A
Training:  17%|█▋        | 9/53 [00:03<00:16,  2.59it/s][A
Training:  25%|██▍       | 13/53 [00:04<00:13,  3.04it/s][A
Training:  28%|██▊       | 15/53 [00:05<00:09,  3.88it/s][A
Training:  32%|███▏      | 17/53 [00:06<00:12,  2.97it/s][A
Training:  36%|███▌      | 19/53 [00:06<00:08,  3.90it/s][A
Training:  40%|███▉      | 21/53 [00:07<00:10,  3.06it/s][A
Training:  43%|████▎     | 23/53 [00:07<00:07,  3.99it/s][A
Training:  47%|████▋     | 25/53 [00:08<00:09,  3.07it/s][A
Training:  51%|█████     | 27/53 [00:08<00:06,  3.92it/s][A
Training:  55%|█████▍    | 29/53 [00:09<00:07,  3.13it/s][A
Training:  58%|█████▊    | 31/53 [00:09<00:05,  3.99it/s][A
Training:  62%|██████▏   | 33/53 [00:10<00:06,  3.14it/s][A
Training:  66%|██████▌   | 35/53 [00

Epoch: 87/95 - Loss: 0.1757 - Accuracy: 0.9348



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:08,  1.41s/it][A
 57%|█████▋    | 4/7 [00:01<00:00,  3.39it/s][A
100%|██████████| 7/7 [00:02<00:00,  2.81it/s][A
Epochs:  92%|█████████▏| 87/95 [26:32<02:21, 17.69s/it]

Val Loss: 0.2062 - Val Accuracy: 0.9144



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:01<01:20,  1.56s/it][A
Training:   6%|▌         | 3/53 [00:01<00:22,  2.21it/s][A
Training:   9%|▉         | 5/53 [00:02<00:23,  2.08it/s][A
Training:  13%|█▎        | 7/53 [00:02<00:13,  3.34it/s][A
Training:  17%|█▋        | 9/53 [00:03<00:16,  2.63it/s][A
Training:  21%|██        | 11/53 [00:03<00:11,  3.76it/s][A
Training:  25%|██▍       | 13/53 [00:04<00:13,  2.86it/s][A
Training:  32%|███▏      | 17/53 [00:06<00:11,  3.11it/s][A
Training:  38%|███▊      | 20/53 [00:06<00:07,  4.45it/s][A
Training:  42%|████▏     | 22/53 [00:07<00:09,  3.35it/s][A
Training:  47%|████▋     | 25/53 [00:08<00:09,  3.08it/s][A
Training:  51%|█████     | 27/53 [00:08<00:06,  3.89it/s][A
Training:  55%|█████▍    | 29/53 [00:09<00:07,  3.01it/s][A
Training:  60%|██████    | 32/53 [00:09<00:04,  4.41it/s][A
Training:  64%|██████▍   | 34/53 [00:10<00:05,  3.19it/s][A
Training:  70%|██████▉   | 37/53 [00:

Epoch: 88/95 - Loss: 0.1772 - Accuracy: 0.9332



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:08,  1.40s/it][A
 43%|████▎     | 3/7 [00:01<00:01,  2.46it/s][A
100%|██████████| 7/7 [00:02<00:00,  2.83it/s][A
Epochs:  93%|█████████▎| 88/95 [26:49<02:03, 17.71s/it]

Val Loss: 0.2063 - Val Accuracy: 0.9129



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:01<01:13,  1.40s/it][A
Training:   6%|▌         | 3/53 [00:01<00:20,  2.39it/s][A
Training:   9%|▉         | 5/53 [00:02<00:22,  2.14it/s][A
Training:  11%|█▏        | 6/53 [00:02<00:17,  2.69it/s][A
Training:  17%|█▋        | 9/53 [00:03<00:15,  2.77it/s][A
Training:  23%|██▎       | 12/53 [00:03<00:09,  4.51it/s][A
Training:  26%|██▋       | 14/53 [00:04<00:12,  3.11it/s][A
Training:  32%|███▏      | 17/53 [00:05<00:11,  3.11it/s][A
Training:  34%|███▍      | 18/53 [00:06<00:10,  3.22it/s][A
Training:  40%|███▉      | 21/53 [00:07<00:10,  3.18it/s][A
Training:  42%|████▏     | 22/53 [00:07<00:09,  3.36it/s][A
Training:  47%|████▋     | 25/53 [00:08<00:08,  3.22it/s][A
Training:  49%|████▉     | 26/53 [00:08<00:07,  3.59it/s][A
Training:  55%|█████▍    | 29/53 [00:09<00:07,  3.27it/s][A
Training:  57%|█████▋    | 30/53 [00:09<00:06,  3.48it/s][A
Training:  60%|██████    | 32/53 [00:

Epoch: 89/95 - Loss: 0.1753 - Accuracy: 0.9363



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:08,  1.38s/it][A
100%|██████████| 7/7 [00:02<00:00,  2.89it/s][A
Epochs:  94%|█████████▎| 89/95 [27:07<01:46, 17.69s/it]

Val Loss: 0.2100 - Val Accuracy: 0.9176



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:01<01:17,  1.48s/it][A
Training:   6%|▌         | 3/53 [00:01<00:21,  2.30it/s][A
Training:   9%|▉         | 5/53 [00:02<00:21,  2.20it/s][A
Training:  11%|█▏        | 6/53 [00:02<00:16,  2.77it/s][A
Training:  13%|█▎        | 7/53 [00:02<00:13,  3.29it/s][A
Training:  17%|█▋        | 9/53 [00:03<00:15,  2.81it/s][A
Training:  19%|█▉        | 10/53 [00:03<00:13,  3.23it/s][A
Training:  21%|██        | 11/53 [00:04<00:11,  3.52it/s][A
Training:  25%|██▍       | 13/53 [00:04<00:13,  2.99it/s][A
Training:  28%|██▊       | 15/53 [00:05<00:10,  3.79it/s][A
Training:  32%|███▏      | 17/53 [00:06<00:12,  2.95it/s][A
Training:  36%|███▌      | 19/53 [00:06<00:08,  3.83it/s][A
Training:  40%|███▉      | 21/53 [00:07<00:10,  3.07it/s][A
Training:  43%|████▎     | 23/53 [00:07<00:07,  3.92it/s][A
Training:  47%|████▋     | 25/53 [00:08<00:09,  2.94it/s][A
Training:  53%|█████▎    | 28/53 [00:0

Epoch: 90/95 - Loss: 0.1781 - Accuracy: 0.9338



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:07,  1.31s/it][A
 29%|██▊       | 2/7 [00:01<00:03,  1.65it/s][A
 71%|███████▏  | 5/7 [00:02<00:00,  2.59it/s][A
100%|██████████| 7/7 [00:02<00:00,  2.79it/s][A
Epochs:  95%|█████████▍| 90/95 [27:25<01:28, 17.73s/it]

Val Loss: 0.2059 - Val Accuracy: 0.9155



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:01<01:17,  1.50s/it][A
Training:   8%|▊         | 4/53 [00:01<00:15,  3.17it/s][A
Training:  11%|█▏        | 6/53 [00:02<00:19,  2.42it/s][A
Training:  15%|█▌        | 8/53 [00:02<00:12,  3.65it/s][A
Training:  19%|█▉        | 10/53 [00:03<00:15,  2.80it/s][A
Training:  23%|██▎       | 12/53 [00:03<00:10,  3.88it/s][A
Training:  26%|██▋       | 14/53 [00:05<00:13,  2.84it/s][A
Training:  32%|███▏      | 17/53 [00:06<00:12,  2.92it/s][A
Training:  34%|███▍      | 18/53 [00:06<00:10,  3.20it/s][A
Training:  40%|███▉      | 21/53 [00:07<00:10,  3.15it/s][A
Training:  42%|████▏     | 22/53 [00:07<00:08,  3.51it/s][A
Training:  47%|████▋     | 25/53 [00:08<00:08,  3.25it/s][A
Training:  49%|████▉     | 26/53 [00:08<00:07,  3.65it/s][A
Training:  55%|█████▍    | 29/53 [00:09<00:07,  3.25it/s][A
Training:  58%|█████▊    | 31/53 [00:09<00:05,  4.19it/s][A
Training:  62%|██████▏   | 33/53 [00

Epoch: 91/95 - Loss: 0.1747 - Accuracy: 0.9347



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:07,  1.25s/it][A
 43%|████▎     | 3/7 [00:01<00:01,  2.71it/s][A
100%|██████████| 7/7 [00:02<00:00,  2.90it/s][A
Epochs:  96%|█████████▌| 91/95 [27:43<01:10, 17.73s/it]

Val Loss: 0.2077 - Val Accuracy: 0.9128



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:01<01:13,  1.42s/it][A
Training:   4%|▍         | 2/53 [00:01<00:33,  1.53it/s][A
Training:   8%|▊         | 4/53 [00:01<00:13,  3.64it/s][A
Training:  11%|█▏        | 6/53 [00:02<00:18,  2.59it/s][A
Training:  17%|█▋        | 9/53 [00:03<00:16,  2.74it/s][A
Training:  21%|██        | 11/53 [00:03<00:11,  3.76it/s][A
Training:  25%|██▍       | 13/53 [00:04<00:13,  2.96it/s][A
Training:  26%|██▋       | 14/53 [00:04<00:11,  3.30it/s][A
Training:  32%|███▏      | 17/53 [00:05<00:11,  3.17it/s][A
Training:  34%|███▍      | 18/53 [00:06<00:10,  3.49it/s][A
Training:  40%|███▉      | 21/53 [00:07<00:09,  3.34it/s][A
Training:  42%|████▏     | 22/53 [00:07<00:08,  3.57it/s][A
Training:  47%|████▋     | 25/53 [00:08<00:08,  3.33it/s][A
Training:  49%|████▉     | 26/53 [00:08<00:07,  3.54it/s][A
Training:  53%|█████▎    | 28/53 [00:08<00:05,  4.73it/s][A
Training:  55%|█████▍    | 29/53 [00:

Epoch: 92/95 - Loss: 0.1758 - Accuracy: 0.9343



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:07,  1.20s/it][A
 29%|██▊       | 2/7 [00:01<00:02,  1.73it/s][A
 71%|███████▏  | 5/7 [00:02<00:00,  2.68it/s][A
100%|██████████| 7/7 [00:02<00:00,  2.91it/s][A
Epochs:  97%|█████████▋| 92/95 [28:01<00:53, 17.78s/it]

Val Loss: 0.2093 - Val Accuracy: 0.9134



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:01<01:13,  1.42s/it][A
Training:   9%|▉         | 5/53 [00:02<00:21,  2.25it/s][A
Training:  17%|█▋        | 9/53 [00:03<00:15,  2.79it/s][A
Training:  23%|██▎       | 12/53 [00:03<00:09,  4.18it/s][A
Training:  26%|██▋       | 14/53 [00:04<00:12,  3.05it/s][A
Training:  32%|███▏      | 17/53 [00:06<00:12,  2.91it/s][A
Training:  40%|███▉      | 21/53 [00:07<00:10,  3.13it/s][A
Training:  45%|████▌     | 24/53 [00:07<00:06,  4.28it/s][A
Training:  49%|████▉     | 26/53 [00:08<00:08,  3.28it/s][A
Training:  55%|█████▍    | 29/53 [00:09<00:07,  3.08it/s][A
Training:  60%|██████    | 32/53 [00:09<00:04,  4.25it/s][A
Training:  64%|██████▍   | 34/53 [00:10<00:05,  3.25it/s][A
Training:  70%|██████▉   | 37/53 [00:11<00:05,  3.03it/s][A
Training:  75%|███████▌  | 40/53 [00:11<00:03,  4.18it/s][A
Training:  79%|███████▉  | 42/53 [00:12<00:03,  3.35it/s][A
Training:  83%|████████▎ | 44/53 [0

Epoch: 93/95 - Loss: 0.1755 - Accuracy: 0.9342



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:07,  1.19s/it][A
100%|██████████| 7/7 [00:02<00:00,  3.15it/s][A
Epochs:  98%|█████████▊| 93/95 [28:18<00:35, 17.71s/it]

Val Loss: 0.2098 - Val Accuracy: 0.9096



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:01<01:12,  1.39s/it][A
Training:   4%|▍         | 2/53 [00:01<00:32,  1.57it/s][A
Training:   8%|▊         | 4/53 [00:01<00:13,  3.64it/s][A
Training:  11%|█▏        | 6/53 [00:02<00:18,  2.55it/s][A
Training:  15%|█▌        | 8/53 [00:02<00:11,  3.91it/s][A
Training:  19%|█▉        | 10/53 [00:03<00:15,  2.82it/s][A
Training:  25%|██▍       | 13/53 [00:04<00:13,  2.96it/s][A
Training:  26%|██▋       | 14/53 [00:05<00:12,  3.10it/s][A
Training:  30%|███       | 16/53 [00:05<00:08,  4.29it/s][A
Training:  32%|███▏      | 17/53 [00:05<00:11,  3.14it/s][A
Training:  34%|███▍      | 18/53 [00:06<00:11,  3.03it/s][A
Training:  40%|███▉      | 21/53 [00:06<00:09,  3.46it/s][A
Training:  42%|████▏     | 22/53 [00:07<00:09,  3.29it/s][A
Training:  47%|████▋     | 25/53 [00:08<00:08,  3.44it/s][A
Training:  49%|████▉     | 26/53 [00:08<00:08,  3.28it/s][A
Training:  55%|█████▍    | 29/53 [00:

Epoch: 94/95 - Loss: 0.1759 - Accuracy: 0.9341



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:07,  1.22s/it][A
100%|██████████| 7/7 [00:02<00:00,  3.09it/s][A
Epochs:  99%|█████████▉| 94/95 [28:36<00:17, 17.66s/it]

Val Loss: 0.2097 - Val Accuracy: 0.9134



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:01<01:13,  1.41s/it][A
Training:   8%|▊         | 4/53 [00:01<00:14,  3.33it/s][A
Training:  11%|█▏        | 6/53 [00:02<00:18,  2.50it/s][A
Training:  17%|█▋        | 9/53 [00:03<00:17,  2.58it/s][A
Training:  21%|██        | 11/53 [00:03<00:11,  3.53it/s][A
Training:  25%|██▍       | 13/53 [00:04<00:13,  2.87it/s][A
Training:  30%|███       | 16/53 [00:04<00:08,  4.39it/s][A
Training:  34%|███▍      | 18/53 [00:06<00:10,  3.24it/s][A
Training:  38%|███▊      | 20/53 [00:06<00:07,  4.22it/s][A
Training:  42%|████▏     | 22/53 [00:07<00:09,  3.12it/s][A
Training:  47%|████▋     | 25/53 [00:08<00:09,  3.05it/s][A
Training:  53%|█████▎    | 28/53 [00:08<00:05,  4.42it/s][A
Training:  57%|█████▋    | 30/53 [00:09<00:06,  3.30it/s][A
Training:  62%|██████▏   | 33/53 [00:10<00:06,  3.05it/s][A
Training:  70%|██████▉   | 37/53 [00:11<00:04,  3.26it/s][A
Training:  74%|███████▎  | 39/53 [00

Epoch: 95/95 - Loss: 0.1782 - Accuracy: 0.9330



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:07,  1.29s/it][A
 57%|█████▋    | 4/7 [00:01<00:00,  3.69it/s][A
100%|██████████| 7/7 [00:02<00:00,  3.13it/s][A
Epochs: 100%|██████████| 95/95 [28:53<00:00, 18.25s/it]
[32m[I 2023-12-11 23:38:30,347][0m Trial 0 finished with value: 0.9175874590873718 and parameters: {'learning_rate': 0.000287881984666585, 'weight_decay': 0.009570542308397574, 'epsilon': 5.706295335047529e-08, 'batch_size': 268, 'epochs': 95}. Best is trial 0 with value: 0.9175874590873718.[0m


Val Loss: 0.2059 - Val Accuracy: 0.9176
Saving best model...
Learning rate: 0.05684972267027994
Weight decay: 0.003481723709485491
Epsilon: 1.1793575954143915e-09
Batch size: 76
Number of epochs: 45


Epochs:   0%|          | 0/45 [00:00<?, ?it/s]
Training:   0%|          | 0/184 [00:00<?, ?it/s][A
Training:   1%|          | 1/184 [00:00<01:39,  1.83it/s][A
Training:   3%|▎         | 5/184 [00:00<00:26,  6.84it/s][A
Training:   4%|▍         | 7/184 [00:00<00:20,  8.81it/s][A
Training:   5%|▍         | 9/184 [00:01<00:19,  8.86it/s][A
Training:   7%|▋         | 12/184 [00:01<00:14, 11.91it/s][A
Training:   8%|▊         | 14/184 [00:01<00:16, 10.41it/s][A
Training:   9%|▊         | 16/184 [00:01<00:13, 12.03it/s][A
Training:  10%|▉         | 18/184 [00:01<00:15, 10.73it/s][A
Training:  11%|█         | 20/184 [00:02<00:13, 12.09it/s][A
Training:  12%|█▏        | 22/184 [00:02<00:15, 10.78it/s][A
Training:  13%|█▎        | 24/184 [00:02<00:12, 12.42it/s][A
Training:  14%|█▍        | 26/184 [00:02<00:14, 10.97it/s][A
Training:  16%|█▌        | 29/184 [00:02<00:12, 12.04it/s][A
Training:  17%|█▋        | 31/184 [00:02<00:12, 12.13it/s][A
Training:  18%|█▊        | 33/184 [0

Epoch: 1/45 - Loss: 7.0919 - Accuracy: 0.8341



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:10,  2.15it/s][A
 22%|██▏       | 5/23 [00:00<00:02,  8.10it/s][A
 39%|███▉      | 9/23 [00:00<00:01, 10.78it/s][A
 57%|█████▋    | 13/23 [00:01<00:00, 12.80it/s][A
 74%|███████▍  | 17/23 [00:01<00:00, 13.42it/s][A
 83%|████████▎ | 19/23 [00:01<00:00, 13.68it/s][A
 91%|█████████▏| 21/23 [00:01<00:00, 13.21it/s][A
100%|██████████| 23/23 [00:02<00:00, 11.39it/s][A
Epochs:   2%|▏         | 1/45 [00:17<13:04, 17.83s/it]

Val Loss: 3.6613 - Val Accuracy: 0.8813



Training:   0%|          | 0/184 [00:00<?, ?it/s][A
Training:   1%|          | 1/184 [00:00<01:41,  1.81it/s][A
Training:   3%|▎         | 5/184 [00:00<00:27,  6.58it/s][A
Training:   5%|▍         | 9/184 [00:01<00:20,  8.45it/s][A
Training:   7%|▋         | 13/184 [00:01<00:17,  9.91it/s][A
Training:   9%|▊         | 16/184 [00:01<00:13, 12.04it/s][A
Training:  10%|▉         | 18/184 [00:01<00:14, 11.30it/s][A
Training:  11%|█▏        | 21/184 [00:02<00:15, 10.66it/s][A
Training:  14%|█▎        | 25/184 [00:02<00:14, 10.96it/s][A
Training:  16%|█▌        | 29/184 [00:02<00:13, 11.40it/s][A
Training:  18%|█▊        | 33/184 [00:03<00:12, 11.76it/s][A
Training:  20%|██        | 37/184 [00:03<00:12, 11.61it/s][A
Training:  22%|██▏       | 41/184 [00:03<00:11, 12.16it/s][A
Training:  24%|██▍       | 44/184 [00:04<00:10, 13.70it/s][A
Training:  25%|██▌       | 46/184 [00:04<00:10, 13.40it/s][A
Training:  26%|██▌       | 48/184 [00:04<00:10, 13.27it/s][A
Training:  27%|██▋ 

Epoch: 2/45 - Loss: 7.7008 - Accuracy: 0.8548



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:10,  2.02it/s][A
 22%|██▏       | 5/23 [00:00<00:02,  6.97it/s][A
 39%|███▉      | 9/23 [00:01<00:01, 10.06it/s][A
 57%|█████▋    | 13/23 [00:01<00:00, 11.67it/s][A
 74%|███████▍  | 17/23 [00:01<00:00, 13.01it/s][A
100%|██████████| 23/23 [00:02<00:00, 11.44it/s][A
Epochs:   4%|▍         | 2/45 [00:35<12:45, 17.81s/it]

Val Loss: 15.2200 - Val Accuracy: 0.8894



Training:   0%|          | 0/184 [00:00<?, ?it/s][A
Training:   1%|          | 1/184 [00:00<01:45,  1.73it/s][A
Training:   3%|▎         | 5/184 [00:00<00:28,  6.22it/s][A
Training:   5%|▍         | 9/184 [00:01<00:21,  7.99it/s][A
Training:   7%|▋         | 13/184 [00:01<00:17,  9.69it/s][A
Training:   9%|▉         | 17/184 [00:01<00:15, 10.68it/s][A
Training:  11%|█▏        | 21/184 [00:02<00:14, 10.96it/s][A
Training:  14%|█▎        | 25/184 [00:02<00:14, 11.22it/s][A
Training:  16%|█▌        | 29/184 [00:02<00:13, 11.25it/s][A
Training:  18%|█▊        | 33/184 [00:03<00:13, 11.13it/s][A
Training:  20%|██        | 37/184 [00:03<00:12, 11.80it/s][A
Training:  21%|██        | 39/184 [00:03<00:11, 12.71it/s][A
Training:  22%|██▏       | 41/184 [00:03<00:12, 11.72it/s][A
Training:  23%|██▎       | 43/184 [00:04<00:11, 12.62it/s][A
Training:  24%|██▍       | 45/184 [00:04<00:11, 12.15it/s][A
Training:  26%|██▌       | 47/184 [00:04<00:10, 12.87it/s][A
Training:  27%|██▋ 

Epoch: 3/45 - Loss: 17.2441 - Accuracy: 0.8598



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:11,  1.92it/s][A
 22%|██▏       | 5/23 [00:00<00:02,  7.13it/s][A
 39%|███▉      | 9/23 [00:01<00:01,  9.75it/s][A
 57%|█████▋    | 13/23 [00:01<00:00, 11.16it/s][A
 74%|███████▍  | 17/23 [00:01<00:00, 12.43it/s][A
100%|██████████| 23/23 [00:01<00:00, 11.65it/s][A
Epochs:   7%|▋         | 3/45 [00:53<12:26, 17.77s/it]

Val Loss: 16.2061 - Val Accuracy: 0.8482



Training:   0%|          | 0/184 [00:00<?, ?it/s][A
Training:   1%|          | 1/184 [00:00<01:27,  2.08it/s][A
Training:   3%|▎         | 5/184 [00:00<00:28,  6.39it/s][A
Training:   5%|▍         | 9/184 [00:01<00:19,  8.91it/s][A
Training:   7%|▋         | 12/184 [00:01<00:14, 12.02it/s][A
Training:   8%|▊         | 14/184 [00:01<00:16, 10.12it/s][A
Training:   9%|▉         | 17/184 [00:01<00:16, 10.12it/s][A
Training:  11%|█▏        | 21/184 [00:02<00:14, 10.91it/s][A
Training:  14%|█▎        | 25/184 [00:02<00:14, 11.29it/s][A
Training:  16%|█▌        | 29/184 [00:02<00:12, 11.94it/s][A
Training:  18%|█▊        | 33/184 [00:03<00:12, 11.68it/s][A
Training:  20%|██        | 37/184 [00:03<00:12, 11.37it/s][A
Training:  22%|██▏       | 41/184 [00:03<00:12, 11.39it/s][A
Training:  24%|██▍       | 45/184 [00:04<00:16,  8.23it/s][A
Training:  27%|██▋       | 49/184 [00:05<00:15,  8.94it/s][A
Training:  29%|██▉       | 53/184 [00:05<00:13,  9.53it/s][A
Training:  31%|███ 

Epoch: 4/45 - Loss: 22.2228 - Accuracy: 0.8711



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:11,  1.88it/s][A
 22%|██▏       | 5/23 [00:00<00:02,  7.75it/s][A
 39%|███▉      | 9/23 [00:01<00:01, 10.64it/s][A
 52%|█████▏    | 12/23 [00:01<00:00, 13.44it/s][A
 61%|██████    | 14/23 [00:01<00:00, 11.83it/s][A
 74%|███████▍  | 17/23 [00:01<00:00, 11.26it/s][A
 87%|████████▋ | 20/23 [00:01<00:00, 14.00it/s][A
100%|██████████| 23/23 [00:02<00:00, 11.27it/s][A
Epochs:   9%|▉         | 4/45 [01:11<12:11, 17.83s/it]

Val Loss: 29.4987 - Val Accuracy: 0.8630



Training:   0%|          | 0/184 [00:00<?, ?it/s][A
Training:   1%|          | 1/184 [00:00<01:31,  2.00it/s][A
Training:   3%|▎         | 5/184 [00:00<00:25,  7.14it/s][A
Training:   5%|▍         | 9/184 [00:01<00:19,  9.21it/s][A
Training:   7%|▋         | 13/184 [00:01<00:15, 10.76it/s][A
Training:   9%|▉         | 17/184 [00:01<00:14, 11.23it/s][A
Training:  11%|█▏        | 21/184 [00:02<00:15, 10.85it/s][A
Training:  14%|█▎        | 25/184 [00:02<00:14, 11.33it/s][A
Training:  16%|█▌        | 29/184 [00:02<00:13, 11.70it/s][A
Training:  18%|█▊        | 33/184 [00:03<00:13, 11.57it/s][A
Training:  20%|██        | 37/184 [00:03<00:15,  9.47it/s][A
Training:  22%|██▏       | 41/184 [00:04<00:14,  9.68it/s][A
Training:  24%|██▍       | 45/184 [00:04<00:13, 10.41it/s][A
Training:  27%|██▋       | 49/184 [00:04<00:12, 11.14it/s][A
Training:  29%|██▉       | 53/184 [00:05<00:12, 10.85it/s][A
Training:  31%|███       | 57/184 [00:05<00:11, 11.25it/s][A
Training:  33%|███▎

Epoch: 5/45 - Loss: 23.9896 - Accuracy: 0.8763



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:09,  2.23it/s][A
 22%|██▏       | 5/23 [00:00<00:02,  8.59it/s][A
 39%|███▉      | 9/23 [00:01<00:01, 10.00it/s][A
 57%|█████▋    | 13/23 [00:01<00:00, 10.77it/s][A
 74%|███████▍  | 17/23 [00:01<00:00, 11.53it/s][A
100%|██████████| 23/23 [00:02<00:00, 11.07it/s][A
Epochs:  11%|█         | 5/45 [01:29<11:55, 17.89s/it]

Val Loss: 25.9528 - Val Accuracy: 0.8579



Training:   0%|          | 0/184 [00:00<?, ?it/s][A
Training:   1%|          | 1/184 [00:00<01:35,  1.92it/s][A
Training:   3%|▎         | 5/184 [00:00<00:24,  7.27it/s][A
Training:   5%|▍         | 9/184 [00:01<00:16, 10.39it/s][A
Training:   6%|▌         | 11/184 [00:01<00:14, 11.68it/s][A
Training:   7%|▋         | 13/184 [00:01<00:14, 11.48it/s][A
Training:   8%|▊         | 15/184 [00:01<00:14, 11.57it/s][A
Training:   9%|▉         | 17/184 [00:01<00:14, 11.93it/s][A
Training:  10%|█         | 19/184 [00:01<00:14, 11.20it/s][A
Training:  11%|█▏        | 21/184 [00:02<00:13, 12.04it/s][A
Training:  12%|█▎        | 23/184 [00:02<00:13, 11.74it/s][A
Training:  14%|█▎        | 25/184 [00:02<00:12, 12.43it/s][A
Training:  15%|█▍        | 27/184 [00:02<00:14, 10.88it/s][A
Training:  16%|█▌        | 29/184 [00:02<00:12, 12.47it/s][A
Training:  17%|█▋        | 31/184 [00:02<00:13, 11.31it/s][A
Training:  18%|█▊        | 33/184 [00:03<00:12, 12.03it/s][A
Training:  19%|█▉  

Epoch: 6/45 - Loss: 25.5363 - Accuracy: 0.8821



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:10,  2.06it/s][A
 22%|██▏       | 5/23 [00:00<00:02,  8.28it/s][A
 39%|███▉      | 9/23 [00:00<00:01, 10.80it/s][A
 48%|████▊     | 11/23 [00:01<00:00, 12.30it/s][A
 57%|█████▋    | 13/23 [00:01<00:00, 11.57it/s][A
 65%|██████▌   | 15/23 [00:01<00:00, 12.86it/s][A
 74%|███████▍  | 17/23 [00:01<00:00, 11.80it/s][A
 87%|████████▋ | 20/23 [00:01<00:00, 15.34it/s][A
100%|██████████| 23/23 [00:02<00:00, 10.91it/s][A
Epochs:  13%|█▎        | 6/45 [01:47<11:38, 17.90s/it]

Val Loss: 26.6659 - Val Accuracy: 0.8526



Training:   0%|          | 0/184 [00:00<?, ?it/s][A
Training:   1%|          | 1/184 [00:00<01:32,  1.97it/s][A
Training:   3%|▎         | 5/184 [00:00<00:25,  7.01it/s][A
Training:   5%|▍         | 9/184 [00:01<00:17,  9.78it/s][A
Training:   7%|▋         | 13/184 [00:01<00:15, 11.34it/s][A
Training:   9%|▉         | 17/184 [00:01<00:15, 11.09it/s][A
Training:  11%|█▏        | 21/184 [00:02<00:14, 11.10it/s][A
Training:  14%|█▎        | 25/184 [00:02<00:14, 11.36it/s][A
Training:  16%|█▌        | 29/184 [00:03<00:18,  8.27it/s][A
Training:  18%|█▊        | 33/184 [00:03<00:15,  9.66it/s][A
Training:  20%|██        | 37/184 [00:03<00:14, 10.26it/s][A
Training:  22%|██▏       | 41/184 [00:04<00:13, 10.58it/s][A
Training:  24%|██▍       | 44/184 [00:04<00:11, 12.58it/s][A
Training:  25%|██▌       | 46/184 [00:04<00:12, 11.17it/s][A
Training:  27%|██▋       | 49/184 [00:04<00:12, 10.53it/s][A
Training:  29%|██▉       | 53/184 [00:05<00:11, 10.99it/s][A
Training:  31%|███ 

Epoch: 7/45 - Loss: 28.3440 - Accuracy: 0.8804



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:10,  2.05it/s][A
 22%|██▏       | 5/23 [00:00<00:02,  8.12it/s][A
 35%|███▍      | 8/23 [00:00<00:01, 12.31it/s][A
 43%|████▎     | 10/23 [00:01<00:01, 10.87it/s][A
 57%|█████▋    | 13/23 [00:01<00:00, 11.58it/s][A
 65%|██████▌   | 15/23 [00:01<00:00, 12.85it/s][A
 74%|███████▍  | 17/23 [00:01<00:00, 10.86it/s][A
 83%|████████▎ | 19/23 [00:01<00:00, 12.27it/s][A
 91%|█████████▏| 21/23 [00:02<00:00, 10.97it/s][A
100%|██████████| 23/23 [00:02<00:00,  9.84it/s][A
Epochs:  16%|█▌        | 7/45 [02:05<11:25, 18.03s/it]

Val Loss: 18.8500 - Val Accuracy: 0.8923



Training:   0%|          | 0/184 [00:00<?, ?it/s][A
Training:   1%|          | 1/184 [00:00<01:29,  2.05it/s][A
Training:   3%|▎         | 5/184 [00:00<00:23,  7.61it/s][A
Training:   5%|▍         | 9/184 [00:01<00:17, 10.01it/s][A
Training:   7%|▋         | 13/184 [00:01<00:15, 11.33it/s][A
Training:   9%|▉         | 17/184 [00:01<00:14, 11.36it/s][A
Training:  11%|█▏        | 21/184 [00:02<00:17,  9.28it/s][A
Training:  13%|█▎        | 24/184 [00:02<00:14, 11.43it/s][A
Training:  14%|█▍        | 26/184 [00:02<00:15, 10.11it/s][A
Training:  16%|█▌        | 29/184 [00:02<00:15, 10.32it/s][A
Training:  17%|█▋        | 32/184 [00:03<00:11, 12.68it/s][A
Training:  18%|█▊        | 34/184 [00:03<00:13, 11.06it/s][A
Training:  20%|██        | 37/184 [00:03<00:13, 10.95it/s][A
Training:  22%|██▏       | 41/184 [00:03<00:12, 11.09it/s][A
Training:  24%|██▍       | 45/184 [00:04<00:11, 11.61it/s][A
Training:  27%|██▋       | 49/184 [00:04<00:11, 11.78it/s][A
Training:  29%|██▉ 

Epoch: 8/45 - Loss: 25.1419 - Accuracy: 0.8815



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:11,  1.93it/s][A
 22%|██▏       | 5/23 [00:00<00:02,  7.68it/s][A
 39%|███▉      | 9/23 [00:01<00:01,  9.92it/s][A
 57%|█████▋    | 13/23 [00:01<00:00, 11.28it/s][A
 70%|██████▉   | 16/23 [00:01<00:00,  9.53it/s][A
 78%|███████▊  | 18/23 [00:02<00:00,  8.53it/s][A
 91%|█████████▏| 21/23 [00:02<00:00, 10.23it/s][A
100%|██████████| 23/23 [00:02<00:00,  9.14it/s][A
Epochs:  18%|█▊        | 8/45 [02:23<11:08, 18.06s/it]

Val Loss: 25.7114 - Val Accuracy: 0.8773



Training:   0%|          | 0/184 [00:00<?, ?it/s][A
Training:   1%|          | 1/184 [00:00<01:30,  2.03it/s][A
Training:   3%|▎         | 5/184 [00:00<00:23,  7.58it/s][A
Training:   5%|▍         | 9/184 [00:01<00:18,  9.52it/s][A
Training:   7%|▋         | 13/184 [00:01<00:16, 10.66it/s][A
Training:   9%|▉         | 17/184 [00:01<00:15, 10.75it/s][A
Training:  11%|█▏        | 21/184 [00:02<00:18,  8.94it/s][A
Training:  14%|█▎        | 25/184 [00:02<00:16,  9.82it/s][A
Training:  16%|█▌        | 29/184 [00:03<00:15,  9.87it/s][A
Training:  18%|█▊        | 33/184 [00:03<00:14, 10.49it/s][A
Training:  20%|██        | 37/184 [00:03<00:13, 11.29it/s][A
Training:  22%|██▏       | 41/184 [00:04<00:12, 11.28it/s][A
Training:  24%|██▍       | 45/184 [00:04<00:11, 11.67it/s][A
Training:  27%|██▋       | 49/184 [00:04<00:11, 11.93it/s][A
Training:  29%|██▉       | 53/184 [00:05<00:10, 11.97it/s][A
Training:  31%|███       | 57/184 [00:05<00:10, 11.79it/s][A
Training:  33%|███▎

Epoch: 9/45 - Loss: 26.5178 - Accuracy: 0.8842



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:11,  1.90it/s][A
 22%|██▏       | 5/23 [00:00<00:02,  7.22it/s][A
 39%|███▉      | 9/23 [00:01<00:01,  9.55it/s][A
 57%|█████▋    | 13/23 [00:01<00:01,  8.41it/s][A
 74%|███████▍  | 17/23 [00:02<00:00,  9.46it/s][A
100%|██████████| 23/23 [00:02<00:00,  9.59it/s][A
Epochs:  20%|██        | 9/45 [02:41<10:50, 18.08s/it]

Val Loss: 18.0842 - Val Accuracy: 0.8877



Training:   0%|          | 0/184 [00:00<?, ?it/s][A
Training:   1%|          | 1/184 [00:00<01:48,  1.68it/s][A
Training:   3%|▎         | 5/184 [00:00<00:26,  6.77it/s][A
Training:   5%|▍         | 9/184 [00:01<00:19,  9.14it/s][A
Training:   7%|▋         | 13/184 [00:01<00:22,  7.75it/s][A
Training:   9%|▉         | 17/184 [00:02<00:18,  8.88it/s][A
Training:  11%|█▏        | 21/184 [00:02<00:16,  9.77it/s][A
Training:  14%|█▎        | 25/184 [00:02<00:15, 10.32it/s][A
Training:  16%|█▌        | 29/184 [00:03<00:15, 10.30it/s][A
Training:  18%|█▊        | 33/184 [00:03<00:14, 10.76it/s][A
Training:  20%|██        | 37/184 [00:03<00:12, 11.47it/s][A
Training:  22%|██▏       | 41/184 [00:04<00:12, 11.61it/s][A
Training:  24%|██▍       | 45/184 [00:04<00:11, 11.70it/s][A
Training:  27%|██▋       | 49/184 [00:04<00:11, 11.85it/s][A
Training:  29%|██▉       | 53/184 [00:05<00:10, 12.09it/s][A
Training:  31%|███       | 57/184 [00:05<00:10, 12.12it/s][A
Training:  33%|███▎

Epoch: 10/45 - Loss: 26.1150 - Accuracy: 0.8862



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:12,  1.78it/s][A
 22%|██▏       | 5/23 [00:00<00:02,  6.77it/s][A
 30%|███       | 7/23 [00:01<00:02,  7.42it/s][A
 39%|███▉      | 9/23 [00:01<00:02,  6.50it/s][A
 57%|█████▋    | 13/23 [00:01<00:01,  8.36it/s][A
 74%|███████▍  | 17/23 [00:02<00:00,  9.77it/s][A
100%|██████████| 23/23 [00:02<00:00,  9.05it/s][A
Epochs:  22%|██▏       | 10/45 [02:59<10:34, 18.14s/it]

Val Loss: 35.7654 - Val Accuracy: 0.8807



Training:   0%|          | 0/184 [00:00<?, ?it/s][A
Training:   1%|          | 1/184 [00:00<01:32,  1.98it/s][A
Training:   3%|▎         | 5/184 [00:01<00:32,  5.43it/s][A
Training:   5%|▍         | 9/184 [00:01<00:21,  8.33it/s][A
Training:   7%|▋         | 13/184 [00:01<00:17,  9.92it/s][A
Training:   8%|▊         | 15/184 [00:01<00:15, 11.01it/s][A
Training:   9%|▉         | 17/184 [00:01<00:15, 10.62it/s][A
Training:  10%|█         | 19/184 [00:02<00:14, 11.72it/s][A
Training:  11%|█▏        | 21/184 [00:02<00:15, 10.58it/s][A
Training:  12%|█▎        | 23/184 [00:02<00:14, 11.44it/s][A
Training:  14%|█▎        | 25/184 [00:02<00:14, 11.07it/s][A
Training:  15%|█▍        | 27/184 [00:02<00:13, 11.45it/s][A
Training:  16%|█▌        | 29/184 [00:02<00:13, 11.28it/s][A
Training:  17%|█▋        | 31/184 [00:03<00:12, 11.93it/s][A
Training:  18%|█▊        | 33/184 [00:03<00:13, 11.31it/s][A
Training:  19%|█▉        | 35/184 [00:03<00:11, 12.81it/s][A
Training:  20%|██  

Epoch: 11/45 - Loss: 24.3544 - Accuracy: 0.8874



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:16,  1.33it/s][A
 22%|██▏       | 5/23 [00:01<00:03,  5.71it/s][A
 39%|███▉      | 9/23 [00:01<00:01,  8.18it/s][A
 57%|█████▋    | 13/23 [00:01<00:01,  9.63it/s][A
 65%|██████▌   | 15/23 [00:01<00:00, 10.16it/s][A
 74%|███████▍  | 17/23 [00:02<00:00, 10.37it/s][A
 83%|████████▎ | 19/23 [00:02<00:00, 11.09it/s][A
 91%|█████████▏| 21/23 [00:02<00:00, 12.02it/s][A
100%|██████████| 23/23 [00:02<00:00,  9.07it/s][A
Epochs:  24%|██▍       | 11/45 [03:18<10:18, 18.19s/it]

Val Loss: 22.6316 - Val Accuracy: 0.8652



Training:   0%|          | 0/184 [00:00<?, ?it/s][A
Training:   1%|          | 1/184 [00:00<01:31,  2.00it/s][A
Training:   3%|▎         | 5/184 [00:01<00:34,  5.21it/s][A
Training:   5%|▍         | 9/184 [00:01<00:21,  8.13it/s][A
Training:   7%|▋         | 13/184 [00:01<00:18,  9.23it/s][A
Training:   9%|▉         | 17/184 [00:01<00:15, 10.46it/s][A
Training:  11%|█         | 20/184 [00:02<00:12, 12.76it/s][A
Training:  12%|█▏        | 22/184 [00:02<00:14, 10.92it/s][A
Training:  14%|█▎        | 25/184 [00:02<00:15, 10.03it/s][A
Training:  15%|█▌        | 28/184 [00:02<00:12, 12.34it/s][A
Training:  16%|█▋        | 30/184 [00:03<00:13, 11.15it/s][A
Training:  17%|█▋        | 32/184 [00:03<00:12, 12.29it/s][A
Training:  18%|█▊        | 34/184 [00:03<00:13, 11.40it/s][A
Training:  20%|█▉        | 36/184 [00:03<00:12, 12.32it/s][A
Training:  21%|██        | 38/184 [00:03<00:12, 11.71it/s][A
Training:  22%|██▏       | 40/184 [00:03<00:11, 12.00it/s][A
Training:  23%|██▎ 

Epoch: 12/45 - Loss: 26.7395 - Accuracy: 0.8856



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:10,  2.09it/s][A
 22%|██▏       | 5/23 [00:00<00:02,  7.49it/s][A
 30%|███       | 7/23 [00:00<00:01,  9.63it/s][A
 39%|███▉      | 9/23 [00:01<00:01,  9.68it/s][A
 48%|████▊     | 11/23 [00:01<00:01, 10.97it/s][A
 57%|█████▋    | 13/23 [00:01<00:00, 10.31it/s][A
 65%|██████▌   | 15/23 [00:01<00:00, 11.58it/s][A
 74%|███████▍  | 17/23 [00:01<00:00, 11.19it/s][A
 87%|████████▋ | 20/23 [00:01<00:00, 14.80it/s][A
100%|██████████| 23/23 [00:02<00:00, 10.37it/s][A
Epochs:  27%|██▋       | 12/45 [03:36<09:59, 18.18s/it]

Val Loss: 28.8082 - Val Accuracy: 0.8847



Training:   0%|          | 0/184 [00:00<?, ?it/s][A
Training:   1%|          | 1/184 [00:00<01:32,  1.97it/s][A
Training:   3%|▎         | 5/184 [00:00<00:25,  7.14it/s][A
Training:   5%|▍         | 9/184 [00:01<00:18,  9.56it/s][A
Training:   7%|▋         | 13/184 [00:01<00:14, 11.44it/s][A
Training:   9%|▉         | 17/184 [00:01<00:15, 10.90it/s][A
Training:  11%|█▏        | 21/184 [00:02<00:14, 11.33it/s][A
Training:  14%|█▎        | 25/184 [00:02<00:13, 11.77it/s][A
Training:  16%|█▌        | 29/184 [00:02<00:13, 11.64it/s][A
Training:  18%|█▊        | 33/184 [00:03<00:12, 11.74it/s][A
Training:  20%|██        | 37/184 [00:03<00:12, 11.91it/s][A
Training:  22%|██▏       | 41/184 [00:03<00:11, 11.92it/s][A
Training:  24%|██▍       | 45/184 [00:04<00:11, 11.82it/s][A
Training:  27%|██▋       | 49/184 [00:04<00:11, 12.04it/s][A
Training:  29%|██▉       | 53/184 [00:04<00:10, 12.09it/s][A
Training:  31%|███       | 57/184 [00:05<00:10, 12.13it/s][A
Training:  33%|███▎

Epoch: 13/45 - Loss: 25.5806 - Accuracy: 0.8896



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:12,  1.80it/s][A
 22%|██▏       | 5/23 [00:00<00:02,  6.40it/s][A
 39%|███▉      | 9/23 [00:01<00:01,  8.38it/s][A
 57%|█████▋    | 13/23 [00:01<00:00, 10.39it/s][A
 74%|███████▍  | 17/23 [00:01<00:00, 11.27it/s][A
100%|██████████| 23/23 [00:02<00:00, 10.25it/s][A
Epochs:  29%|██▉       | 13/45 [03:54<09:36, 18.03s/it]

Val Loss: 27.1341 - Val Accuracy: 0.9083



Training:   0%|          | 0/184 [00:00<?, ?it/s][A
Training:   1%|          | 1/184 [00:00<01:34,  1.93it/s][A
Training:   2%|▏         | 4/184 [00:00<00:22,  8.00it/s][A
Training:   3%|▎         | 6/184 [00:00<00:24,  7.24it/s][A
Training:   5%|▍         | 9/184 [00:01<00:20,  8.36it/s][A
Training:   7%|▋         | 13/184 [00:01<00:16, 10.24it/s][A
Training:   9%|▉         | 17/184 [00:01<00:14, 11.70it/s][A
Training:  11%|█▏        | 21/184 [00:02<00:13, 12.24it/s][A
Training:  13%|█▎        | 24/184 [00:02<00:10, 14.60it/s][A
Training:  14%|█▍        | 26/184 [00:02<00:12, 13.10it/s][A
Training:  15%|█▌        | 28/184 [00:02<00:11, 14.14it/s][A
Training:  16%|█▋        | 30/184 [00:02<00:12, 12.12it/s][A
Training:  17%|█▋        | 32/184 [00:02<00:11, 13.51it/s][A
Training:  18%|█▊        | 34/184 [00:03<00:13, 11.53it/s][A
Training:  20%|█▉        | 36/184 [00:03<00:11, 12.44it/s][A
Training:  21%|██        | 38/184 [00:03<00:12, 11.42it/s][A
Training:  22%|██▏  

Epoch: 14/45 - Loss: 25.4275 - Accuracy: 0.8847



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:11,  1.96it/s][A
 22%|██▏       | 5/23 [00:00<00:02,  6.53it/s][A
 39%|███▉      | 9/23 [00:01<00:01,  8.28it/s][A
 57%|█████▋    | 13/23 [00:01<00:01,  9.99it/s][A
 74%|███████▍  | 17/23 [00:01<00:00, 11.45it/s][A
100%|██████████| 23/23 [00:02<00:00, 10.72it/s][A
Epochs:  31%|███       | 14/45 [04:11<09:15, 17.91s/it]

Val Loss: 32.3796 - Val Accuracy: 0.8538



Training:   0%|          | 0/184 [00:00<?, ?it/s][A
Training:   1%|          | 1/184 [00:00<01:29,  2.05it/s][A
Training:   2%|▏         | 3/184 [00:00<00:32,  5.62it/s][A
Training:   3%|▎         | 5/184 [00:00<00:22,  7.81it/s][A
Training:   4%|▍         | 7/184 [00:00<00:17, 10.00it/s][A
Training:   5%|▍         | 9/184 [00:01<00:17,  9.83it/s][A
Training:   6%|▌         | 11/184 [00:01<00:15, 11.29it/s][A
Training:   7%|▋         | 13/184 [00:01<00:15, 11.03it/s][A
Training:   8%|▊         | 15/184 [00:01<00:13, 12.40it/s][A
Training:   9%|▉         | 17/184 [00:01<00:14, 11.60it/s][A
Training:  10%|█         | 19/184 [00:01<00:13, 12.47it/s][A
Training:  11%|█▏        | 21/184 [00:02<00:12, 13.38it/s][A
Training:  12%|█▎        | 23/184 [00:02<00:12, 13.20it/s][A
Training:  14%|█▎        | 25/184 [00:02<00:11, 13.29it/s][A
Training:  15%|█▍        | 27/184 [00:02<00:11, 13.92it/s][A
Training:  16%|█▌        | 29/184 [00:02<00:12, 12.86it/s][A
Training:  17%|█▋    

Epoch: 15/45 - Loss: 28.7131 - Accuracy: 0.8850



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:10,  2.02it/s][A
 13%|█▎        | 3/23 [00:00<00:03,  6.01it/s][A
 22%|██▏       | 5/23 [00:00<00:02,  6.68it/s][A
 39%|███▉      | 9/23 [00:01<00:01,  8.77it/s][A
 57%|█████▋    | 13/23 [00:01<00:01,  9.89it/s][A
 74%|███████▍  | 17/23 [00:01<00:00, 10.87it/s][A
100%|██████████| 23/23 [00:02<00:00,  9.90it/s][A
Epochs:  33%|███▎      | 15/45 [04:29<08:54, 17.83s/it]

Val Loss: 22.9367 - Val Accuracy: 0.8755



Training:   0%|          | 0/184 [00:00<?, ?it/s][A
Training:   1%|          | 1/184 [00:00<01:25,  2.14it/s][A
Training:   3%|▎         | 5/184 [00:00<00:24,  7.42it/s][A
Training:   5%|▍         | 9/184 [00:01<00:18,  9.37it/s][A
Training:   7%|▋         | 12/184 [00:01<00:14, 11.99it/s][A
Training:   8%|▊         | 14/184 [00:01<00:16, 10.45it/s][A
Training:   9%|▉         | 17/184 [00:01<00:16, 10.27it/s][A
Training:  11%|█▏        | 21/184 [00:02<00:14, 11.41it/s][A
Training:  13%|█▎        | 24/184 [00:02<00:11, 13.72it/s][A
Training:  14%|█▍        | 26/184 [00:02<00:12, 12.25it/s][A
Training:  15%|█▌        | 28/184 [00:02<00:11, 13.01it/s][A
Training:  16%|█▋        | 30/184 [00:02<00:12, 12.65it/s][A
Training:  17%|█▋        | 32/184 [00:02<00:11, 13.19it/s][A
Training:  18%|█▊        | 34/184 [00:03<00:11, 13.20it/s][A
Training:  20%|█▉        | 36/184 [00:03<00:10, 13.85it/s][A
Training:  21%|██        | 38/184 [00:03<00:11, 12.87it/s][A
Training:  22%|██▏ 

Epoch: 16/45 - Loss: 25.6591 - Accuracy: 0.8896



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:12,  1.73it/s][A
 22%|██▏       | 5/23 [00:00<00:02,  6.75it/s][A
 39%|███▉      | 9/23 [00:01<00:01,  8.66it/s][A
 57%|█████▋    | 13/23 [00:01<00:01, 10.00it/s][A
 74%|███████▍  | 17/23 [00:01<00:00, 10.55it/s][A
100%|██████████| 23/23 [00:02<00:00, 10.18it/s][A
Epochs:  36%|███▌      | 16/45 [04:47<08:36, 17.80s/it]

Val Loss: 36.6154 - Val Accuracy: 0.8522



Training:   0%|          | 0/184 [00:00<?, ?it/s][A
Training:   1%|          | 1/184 [00:00<01:37,  1.89it/s][A
Training:   3%|▎         | 5/184 [00:00<00:25,  6.90it/s][A
Training:   5%|▍         | 9/184 [00:01<00:19,  9.18it/s][A
Training:   7%|▋         | 13/184 [00:01<00:17,  9.96it/s][A
Training:   9%|▉         | 17/184 [00:01<00:15, 10.81it/s][A
Training:  11%|█▏        | 21/184 [00:02<00:14, 11.20it/s][A
Training:  14%|█▎        | 25/184 [00:02<00:13, 11.50it/s][A
Training:  16%|█▌        | 29/184 [00:02<00:12, 12.31it/s][A
Training:  18%|█▊        | 33/184 [00:03<00:11, 12.69it/s][A
Training:  20%|██        | 37/184 [00:03<00:11, 12.60it/s][A
Training:  22%|██▏       | 41/184 [00:03<00:11, 12.80it/s][A
Training:  24%|██▍       | 45/184 [00:03<00:10, 13.36it/s][A
Training:  27%|██▋       | 49/184 [00:04<00:09, 13.94it/s][A
Training:  29%|██▉       | 53/184 [00:04<00:09, 13.39it/s][A
Training:  31%|███       | 57/184 [00:04<00:09, 13.13it/s][A
Training:  33%|███▎

Epoch: 17/45 - Loss: 24.4848 - Accuracy: 0.8901



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:13,  1.67it/s][A
 22%|██▏       | 5/23 [00:00<00:02,  6.52it/s][A
 39%|███▉      | 9/23 [00:01<00:01,  8.72it/s][A
 52%|█████▏    | 12/23 [00:01<00:00, 11.39it/s][A
 61%|██████    | 14/23 [00:01<00:00,  9.94it/s][A
 74%|███████▍  | 17/23 [00:01<00:00,  9.68it/s][A
100%|██████████| 23/23 [00:02<00:00,  9.75it/s][A
Epochs:  38%|███▊      | 17/45 [05:04<08:14, 17.66s/it]

Val Loss: 34.3228 - Val Accuracy: 0.8802



Training:   0%|          | 0/184 [00:00<?, ?it/s][A
Training:   1%|          | 1/184 [00:00<01:44,  1.74it/s][A
Training:   3%|▎         | 5/184 [00:00<00:26,  6.75it/s][A
Training:   5%|▍         | 9/184 [00:01<00:19,  8.78it/s][A
Training:   7%|▋         | 12/184 [00:01<00:14, 11.89it/s][A
Training:   8%|▊         | 14/184 [00:01<00:16, 10.12it/s][A
Training:   9%|▉         | 17/184 [00:01<00:16, 10.08it/s][A
Training:  11%|█▏        | 21/184 [00:02<00:15, 10.73it/s][A
Training:  14%|█▎        | 25/184 [00:02<00:13, 12.04it/s][A
Training:  16%|█▌        | 29/184 [00:02<00:12, 12.81it/s][A
Training:  17%|█▋        | 32/184 [00:02<00:10, 14.21it/s][A
Training:  18%|█▊        | 34/184 [00:03<00:11, 12.71it/s][A
Training:  20%|█▉        | 36/184 [00:03<00:10, 13.61it/s][A
Training:  21%|██        | 38/184 [00:03<00:12, 11.42it/s][A
Training:  22%|██▏       | 41/184 [00:03<00:12, 11.55it/s][A
Training:  24%|██▍       | 44/184 [00:03<00:10, 13.47it/s][A
Training:  25%|██▌ 

Epoch: 18/45 - Loss: 23.9903 - Accuracy: 0.8879



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:11,  1.93it/s][A
 22%|██▏       | 5/23 [00:00<00:02,  7.21it/s][A
 26%|██▌       | 6/23 [00:00<00:02,  7.62it/s][A
 39%|███▉      | 9/23 [00:01<00:01,  9.27it/s][A
 48%|████▊     | 11/23 [00:01<00:01, 11.06it/s][A
 57%|█████▋    | 13/23 [00:01<00:01,  9.36it/s][A
 74%|███████▍  | 17/23 [00:01<00:00, 10.73it/s][A
 83%|████████▎ | 19/23 [00:01<00:00, 11.99it/s][A
100%|██████████| 23/23 [00:02<00:00,  9.84it/s][A
Epochs:  40%|████      | 18/45 [05:22<07:58, 17.71s/it]

Val Loss: 37.0221 - Val Accuracy: 0.8738



Training:   0%|          | 0/184 [00:00<?, ?it/s][A
Training:   1%|          | 1/184 [00:00<01:44,  1.75it/s][A
Training:   3%|▎         | 5/184 [00:00<00:27,  6.45it/s][A
Training:   5%|▍         | 9/184 [00:01<00:20,  8.57it/s][A
Training:   7%|▋         | 13/184 [00:01<00:17,  9.54it/s][A
Training:   9%|▉         | 17/184 [00:01<00:15, 10.52it/s][A
Training:  11%|█▏        | 21/184 [00:02<00:14, 10.90it/s][A
Training:  14%|█▎        | 25/184 [00:02<00:14, 11.28it/s][A
Training:  16%|█▌        | 29/184 [00:02<00:12, 11.97it/s][A
Training:  18%|█▊        | 33/184 [00:03<00:12, 11.92it/s][A
Training:  20%|██        | 37/184 [00:03<00:12, 12.17it/s][A
Training:  22%|██▏       | 41/184 [00:03<00:11, 12.41it/s][A
Training:  24%|██▍       | 45/184 [00:04<00:11, 11.74it/s][A
Training:  27%|██▋       | 49/184 [00:04<00:11, 11.75it/s][A
Training:  29%|██▉       | 53/184 [00:04<00:11, 11.75it/s][A
Training:  31%|███       | 57/184 [00:05<00:10, 12.64it/s][A
Training:  33%|███▎

Epoch: 19/45 - Loss: 25.7284 - Accuracy: 0.8891



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:11,  1.92it/s][A
 22%|██▏       | 5/23 [00:00<00:02,  6.92it/s][A
 30%|███       | 7/23 [00:00<00:01,  9.14it/s][A
 39%|███▉      | 9/23 [00:01<00:01,  7.92it/s][A
 57%|█████▋    | 13/23 [00:01<00:01,  9.08it/s][A
 74%|███████▍  | 17/23 [00:01<00:00, 10.03it/s][A
100%|██████████| 23/23 [00:02<00:00,  9.70it/s][A
Epochs:  42%|████▏     | 19/45 [05:40<07:43, 17.84s/it]

Val Loss: 26.9419 - Val Accuracy: 0.8911



Training:   0%|          | 0/184 [00:00<?, ?it/s][A
Training:   1%|          | 1/184 [00:00<01:42,  1.79it/s][A
Training:   2%|▏         | 4/184 [00:00<00:23,  7.51it/s][A
Training:   3%|▎         | 6/184 [00:00<00:24,  7.40it/s][A
Training:   5%|▍         | 9/184 [00:01<00:20,  8.43it/s][A
Training:   7%|▋         | 13/184 [00:01<00:16, 10.48it/s][A
Training:   8%|▊         | 15/184 [00:01<00:14, 11.40it/s][A
Training:   9%|▉         | 17/184 [00:01<00:15, 10.99it/s][A
Training:  10%|█         | 19/184 [00:01<00:13, 12.08it/s][A
Training:  11%|█▏        | 21/184 [00:02<00:16, 10.17it/s][A
Training:  13%|█▎        | 24/184 [00:02<00:12, 13.24it/s][A
Training:  14%|█▍        | 26/184 [00:02<00:14, 10.74it/s][A
Training:  16%|█▌        | 29/184 [00:02<00:13, 11.09it/s][A
Training:  17%|█▋        | 31/184 [00:03<00:12, 12.30it/s][A
Training:  18%|█▊        | 33/184 [00:03<00:15, 10.04it/s][A
Training:  20%|██        | 37/184 [00:03<00:13, 10.62it/s][A
Training:  22%|██▏  

Epoch: 20/45 - Loss: 28.4752 - Accuracy: 0.8889



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:13,  1.66it/s][A
 22%|██▏       | 5/23 [00:00<00:02,  6.49it/s][A
 39%|███▉      | 9/23 [00:01<00:01,  8.51it/s][A
 57%|█████▋    | 13/23 [00:01<00:01,  9.45it/s][A
 74%|███████▍  | 17/23 [00:01<00:00, 10.11it/s][A
100%|██████████| 23/23 [00:02<00:00,  9.74it/s][A
Epochs:  44%|████▍     | 20/45 [05:58<07:28, 17.92s/it]

Val Loss: 27.8668 - Val Accuracy: 0.8773



Training:   0%|          | 0/184 [00:00<?, ?it/s][A
Training:   1%|          | 1/184 [00:00<01:45,  1.74it/s][A
Training:   3%|▎         | 5/184 [00:00<00:29,  6.13it/s][A
Training:   5%|▍         | 9/184 [00:01<00:21,  8.17it/s][A
Training:   7%|▋         | 13/184 [00:01<00:17,  9.59it/s][A
Training:   9%|▉         | 17/184 [00:01<00:16, 10.21it/s][A
Training:  11%|█▏        | 21/184 [00:02<00:15, 10.74it/s][A
Training:  14%|█▎        | 25/184 [00:02<00:14, 11.15it/s][A
Training:  16%|█▌        | 29/184 [00:02<00:13, 11.85it/s][A
Training:  18%|█▊        | 33/184 [00:03<00:12, 12.40it/s][A
Training:  20%|██        | 37/184 [00:03<00:12, 12.10it/s][A
Training:  22%|██▏       | 41/184 [00:03<00:11, 12.23it/s][A
Training:  24%|██▍       | 45/184 [00:04<00:11, 12.06it/s][A
Training:  27%|██▋       | 49/184 [00:04<00:11, 11.98it/s][A
Training:  29%|██▉       | 53/184 [00:04<00:11, 11.79it/s][A
Training:  31%|███       | 57/184 [00:05<00:10, 12.24it/s][A
Training:  33%|███▎

Epoch: 21/45 - Loss: 27.8068 - Accuracy: 0.8881



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:13,  1.67it/s][A
 22%|██▏       | 5/23 [00:00<00:02,  6.30it/s][A
 39%|███▉      | 9/23 [00:01<00:01,  8.63it/s][A
 57%|█████▋    | 13/23 [00:01<00:01,  9.66it/s][A
 74%|███████▍  | 17/23 [00:01<00:00, 10.60it/s][A
100%|██████████| 23/23 [00:02<00:00,  9.91it/s][A
Epochs:  47%|████▋     | 21/45 [06:16<07:09, 17.90s/it]

Val Loss: 30.3285 - Val Accuracy: 0.8854



Training:   0%|          | 0/184 [00:00<?, ?it/s][A
Training:   1%|          | 1/184 [00:00<01:55,  1.58it/s][A
Training:   3%|▎         | 5/184 [00:00<00:29,  6.09it/s][A
Training:   5%|▍         | 9/184 [00:01<00:21,  8.24it/s][A
Training:   7%|▋         | 13/184 [00:01<00:17,  9.53it/s][A
Training:   9%|▉         | 17/184 [00:01<00:15, 10.77it/s][A
Training:  11%|█▏        | 21/184 [00:02<00:14, 11.21it/s][A
Training:  14%|█▎        | 25/184 [00:02<00:13, 11.63it/s][A
Training:  16%|█▌        | 29/184 [00:02<00:13, 11.77it/s][A
Training:  18%|█▊        | 33/184 [00:03<00:12, 12.58it/s][A
Training:  20%|██        | 37/184 [00:03<00:11, 13.10it/s][A
Training:  22%|██▏       | 41/184 [00:03<00:11, 13.00it/s][A
Training:  24%|██▍       | 45/184 [00:04<00:10, 12.92it/s][A
Training:  27%|██▋       | 49/184 [00:04<00:11, 12.11it/s][A
Training:  29%|██▉       | 53/184 [00:04<00:10, 12.60it/s][A
Training:  31%|███       | 57/184 [00:05<00:10, 12.53it/s][A
Training:  33%|███▎

Epoch: 22/45 - Loss: 30.1810 - Accuracy: 0.8847



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:11,  1.92it/s][A
 22%|██▏       | 5/23 [00:00<00:02,  6.43it/s][A
 39%|███▉      | 9/23 [00:01<00:01,  8.64it/s][A
 57%|█████▋    | 13/23 [00:01<00:01,  9.95it/s][A
 74%|███████▍  | 17/23 [00:01<00:00, 10.77it/s][A
100%|██████████| 23/23 [00:02<00:00,  9.92it/s][A
Epochs:  49%|████▉     | 22/45 [06:34<06:51, 17.88s/it]

Val Loss: 27.0697 - Val Accuracy: 0.8785



Training:   0%|          | 0/184 [00:00<?, ?it/s][A
Training:   1%|          | 1/184 [00:00<01:50,  1.66it/s][A
Training:   3%|▎         | 5/184 [00:00<00:27,  6.40it/s][A
Training:   5%|▍         | 9/184 [00:01<00:20,  8.52it/s][A
Training:   7%|▋         | 13/184 [00:01<00:17,  9.60it/s][A
Training:   9%|▉         | 17/184 [00:01<00:16, 10.16it/s][A
Training:  11%|█▏        | 21/184 [00:02<00:16,  9.99it/s][A
Training:  14%|█▎        | 25/184 [00:02<00:14, 11.08it/s][A
Training:  16%|█▌        | 29/184 [00:03<00:13, 11.30it/s][A
Training:  18%|█▊        | 33/184 [00:03<00:12, 11.72it/s][A
Training:  20%|██        | 37/184 [00:03<00:12, 11.99it/s][A
Training:  22%|██▏       | 41/184 [00:03<00:11, 12.67it/s][A
Training:  24%|██▍       | 45/184 [00:04<00:11, 12.62it/s][A
Training:  27%|██▋       | 49/184 [00:04<00:11, 12.26it/s][A
Training:  29%|██▉       | 53/184 [00:04<00:10, 12.20it/s][A
Training:  31%|███       | 57/184 [00:05<00:10, 12.23it/s][A
Training:  33%|███▎

Epoch: 23/45 - Loss: 25.9460 - Accuracy: 0.8903



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:13,  1.62it/s][A
 22%|██▏       | 5/23 [00:00<00:02,  6.26it/s][A
 39%|███▉      | 9/23 [00:01<00:01,  8.56it/s][A
 57%|█████▋    | 13/23 [00:01<00:00, 10.21it/s][A
 74%|███████▍  | 17/23 [00:01<00:00, 10.86it/s][A
100%|██████████| 23/23 [00:02<00:00,  9.95it/s][A
Epochs:  51%|█████     | 23/45 [06:52<06:33, 17.91s/it]

Val Loss: 26.8201 - Val Accuracy: 0.8608



Training:   0%|          | 0/184 [00:00<?, ?it/s][A
Training:   1%|          | 1/184 [00:00<01:54,  1.61it/s][A
Training:   3%|▎         | 5/184 [00:00<00:29,  6.04it/s][A
Training:   5%|▍         | 9/184 [00:01<00:21,  8.08it/s][A
Training:   7%|▋         | 13/184 [00:01<00:18,  9.06it/s][A
Training:   9%|▉         | 17/184 [00:02<00:17,  9.52it/s][A
Training:  11%|█▏        | 21/184 [00:02<00:16,  9.91it/s][A
Training:  14%|█▎        | 25/184 [00:02<00:15, 10.27it/s][A
Training:  16%|█▌        | 29/184 [00:03<00:14, 10.88it/s][A
Training:  18%|█▊        | 33/184 [00:03<00:13, 11.35it/s][A
Training:  20%|██        | 37/184 [00:03<00:12, 11.44it/s][A
Training:  22%|██▏       | 41/184 [00:04<00:12, 11.42it/s][A
Training:  24%|██▍       | 45/184 [00:04<00:12, 11.51it/s][A
Training:  27%|██▋       | 49/184 [00:04<00:11, 11.59it/s][A
Training:  29%|██▉       | 53/184 [00:05<00:11, 11.60it/s][A
Training:  31%|███       | 57/184 [00:05<00:10, 11.97it/s][A
Training:  33%|███▎

Epoch: 24/45 - Loss: 25.3583 - Accuracy: 0.8890



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:13,  1.64it/s][A
 22%|██▏       | 5/23 [00:00<00:02,  6.49it/s][A
 39%|███▉      | 9/23 [00:01<00:01,  7.97it/s][A
 57%|█████▋    | 13/23 [00:01<00:01,  9.18it/s][A
 74%|███████▍  | 17/23 [00:01<00:00, 10.47it/s][A
100%|██████████| 23/23 [00:02<00:00,  9.61it/s][A
Epochs:  53%|█████▎    | 24/45 [07:10<06:19, 18.05s/it]

Val Loss: 33.6982 - Val Accuracy: 0.8676



Training:   0%|          | 0/184 [00:00<?, ?it/s][A
Training:   1%|          | 1/184 [00:00<01:50,  1.65it/s][A
Training:   3%|▎         | 5/184 [00:00<00:29,  6.17it/s][A
Training:   5%|▍         | 9/184 [00:01<00:22,  7.91it/s][A
Training:   7%|▋         | 13/184 [00:01<00:19,  8.84it/s][A
Training:   9%|▉         | 17/184 [00:02<00:17,  9.77it/s][A
Training:  11%|█▏        | 21/184 [00:02<00:15, 10.67it/s][A
Training:  14%|█▎        | 25/184 [00:02<00:14, 10.88it/s][A
Training:  16%|█▌        | 29/184 [00:03<00:13, 11.69it/s][A
Training:  18%|█▊        | 33/184 [00:03<00:12, 12.16it/s][A
Training:  20%|██        | 37/184 [00:03<00:12, 11.83it/s][A
Training:  22%|██▏       | 41/184 [00:03<00:11, 11.99it/s][A
Training:  24%|██▍       | 45/184 [00:04<00:11, 12.20it/s][A
Training:  27%|██▋       | 49/184 [00:04<00:11, 12.07it/s][A
Training:  29%|██▉       | 53/184 [00:04<00:10, 11.93it/s][A
Training:  31%|███       | 57/184 [00:05<00:10, 11.92it/s][A
Training:  33%|███▎

Epoch: 25/45 - Loss: 27.7858 - Accuracy: 0.8862



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:12,  1.79it/s][A
 17%|█▋        | 4/23 [00:00<00:02,  7.39it/s][A
 26%|██▌       | 6/23 [00:00<00:02,  8.11it/s][A
 39%|███▉      | 9/23 [00:01<00:01,  8.91it/s][A
 52%|█████▏    | 12/23 [00:01<00:00, 11.88it/s][A
 61%|██████    | 14/23 [00:01<00:00, 10.39it/s][A
 70%|██████▉   | 16/23 [00:01<00:00, 11.95it/s][A
 78%|███████▊  | 18/23 [00:01<00:00, 11.22it/s][A
 87%|████████▋ | 20/23 [00:01<00:00, 12.71it/s][A
100%|██████████| 23/23 [00:02<00:00,  9.96it/s][A
Epochs:  56%|█████▌    | 25/45 [07:28<06:00, 18.04s/it]

Val Loss: 27.9177 - Val Accuracy: 0.8940



Training:   0%|          | 0/184 [00:00<?, ?it/s][A
Training:   1%|          | 1/184 [00:00<01:45,  1.73it/s][A
Training:   3%|▎         | 5/184 [00:00<00:29,  6.09it/s][A
Training:   5%|▍         | 9/184 [00:01<00:20,  8.45it/s][A
Training:   7%|▋         | 13/184 [00:01<00:17,  9.88it/s][A
Training:   9%|▊         | 16/184 [00:01<00:13, 12.44it/s][A
Training:  10%|▉         | 18/184 [00:01<00:14, 11.15it/s][A
Training:  11%|█▏        | 21/184 [00:02<00:15, 10.60it/s][A
Training:  13%|█▎        | 24/184 [00:02<00:12, 12.52it/s][A
Training:  14%|█▍        | 26/184 [00:02<00:13, 11.83it/s][A
Training:  15%|█▌        | 28/184 [00:02<00:12, 12.08it/s][A
Training:  16%|█▋        | 30/184 [00:02<00:12, 11.90it/s][A
Training:  17%|█▋        | 32/184 [00:03<00:11, 12.81it/s][A
Training:  18%|█▊        | 34/184 [00:03<00:12, 12.10it/s][A
Training:  20%|█▉        | 36/184 [00:03<00:11, 12.78it/s][A
Training:  21%|██        | 38/184 [00:03<00:12, 12.13it/s][A
Training:  22%|██▏ 

Epoch: 26/45 - Loss: 29.7365 - Accuracy: 0.8863



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:12,  1.72it/s][A
 22%|██▏       | 5/23 [00:00<00:02,  6.72it/s][A
 39%|███▉      | 9/23 [00:01<00:01,  9.04it/s][A
 48%|████▊     | 11/23 [00:01<00:01, 10.32it/s][A
 57%|█████▋    | 13/23 [00:01<00:01,  9.53it/s][A
 70%|██████▉   | 16/23 [00:01<00:00, 12.61it/s][A
 78%|███████▊  | 18/23 [00:01<00:00, 10.88it/s][A
100%|██████████| 23/23 [00:02<00:00,  9.73it/s][A
Epochs:  58%|█████▊    | 26/45 [07:46<05:44, 18.11s/it]

Val Loss: 32.1866 - Val Accuracy: 0.8813



Training:   0%|          | 0/184 [00:00<?, ?it/s][A
Training:   1%|          | 1/184 [00:00<01:43,  1.77it/s][A
Training:   2%|▏         | 4/184 [00:00<00:24,  7.42it/s][A
Training:   3%|▎         | 6/184 [00:00<00:25,  7.11it/s][A
Training:   5%|▍         | 9/184 [00:01<00:20,  8.68it/s][A
Training:   6%|▌         | 11/184 [00:01<00:16, 10.54it/s][A
Training:   7%|▋         | 13/184 [00:01<00:17,  9.64it/s][A
Training:   9%|▊         | 16/184 [00:01<00:13, 12.36it/s][A
Training:  10%|▉         | 18/184 [00:01<00:16, 10.36it/s][A
Training:  11%|█▏        | 21/184 [00:02<00:15, 10.29it/s][A
Training:  12%|█▎        | 23/184 [00:02<00:13, 11.67it/s][A
Training:  14%|█▎        | 25/184 [00:02<00:15, 10.48it/s][A
Training:  15%|█▌        | 28/184 [00:02<00:12, 12.89it/s][A
Training:  16%|█▋        | 30/184 [00:02<00:13, 11.72it/s][A
Training:  18%|█▊        | 33/184 [00:03<00:13, 11.47it/s][A
Training:  20%|█▉        | 36/184 [00:03<00:10, 14.48it/s][A
Training:  21%|██   

Epoch: 27/45 - Loss: 29.6186 - Accuracy: 0.8898



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:12,  1.82it/s][A
 22%|██▏       | 5/23 [00:00<00:02,  6.52it/s][A
 39%|███▉      | 9/23 [00:01<00:01,  8.93it/s][A
 57%|█████▋    | 13/23 [00:01<00:01,  9.94it/s][A
 74%|███████▍  | 17/23 [00:01<00:00, 10.36it/s][A
100%|██████████| 23/23 [00:02<00:00,  9.61it/s][A
Epochs:  60%|██████    | 27/45 [08:04<05:25, 18.06s/it]

Val Loss: 25.4896 - Val Accuracy: 0.8687



Training:   0%|          | 0/184 [00:00<?, ?it/s][A
Training:   1%|          | 1/184 [00:00<01:38,  1.85it/s][A
Training:   3%|▎         | 5/184 [00:00<00:27,  6.43it/s][A
Training:   5%|▍         | 9/184 [00:01<00:21,  7.97it/s][A
Training:   7%|▋         | 13/184 [00:01<00:17,  9.84it/s][A
Training:   9%|▉         | 17/184 [00:01<00:15, 10.78it/s][A
Training:  11%|█▏        | 21/184 [00:02<00:15, 10.75it/s][A
Training:  14%|█▎        | 25/184 [00:02<00:14, 10.81it/s][A
Training:  15%|█▌        | 28/184 [00:02<00:12, 12.98it/s][A
Training:  16%|█▋        | 30/184 [00:02<00:13, 11.77it/s][A
Training:  18%|█▊        | 33/184 [00:03<00:13, 11.53it/s][A
Training:  20%|██        | 37/184 [00:03<00:12, 12.01it/s][A
Training:  22%|██▏       | 41/184 [00:03<00:12, 11.91it/s][A
Training:  24%|██▍       | 45/184 [00:04<00:12, 11.24it/s][A
Training:  27%|██▋       | 49/184 [00:04<00:11, 11.46it/s][A
Training:  29%|██▉       | 53/184 [00:04<00:11, 11.63it/s][A
Training:  31%|███ 

Epoch: 28/45 - Loss: 27.5749 - Accuracy: 0.8889



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:12,  1.75it/s][A
 22%|██▏       | 5/23 [00:00<00:02,  6.76it/s][A
 39%|███▉      | 9/23 [00:01<00:01,  8.72it/s][A
 57%|█████▋    | 13/23 [00:01<00:00, 10.09it/s][A
 74%|███████▍  | 17/23 [00:01<00:00, 10.80it/s][A
100%|██████████| 23/23 [00:02<00:00,  9.97it/s][A
Epochs:  62%|██████▏   | 28/45 [08:22<05:06, 18.01s/it]

Val Loss: 25.4759 - Val Accuracy: 0.8728



Training:   0%|          | 0/184 [00:00<?, ?it/s][A
Training:   1%|          | 1/184 [00:00<01:44,  1.74it/s][A
Training:   3%|▎         | 5/184 [00:00<00:27,  6.46it/s][A
Training:   5%|▍         | 9/184 [00:01<00:20,  8.63it/s][A
Training:   7%|▋         | 13/184 [00:01<00:17, 10.04it/s][A
Training:   9%|▉         | 17/184 [00:01<00:15, 10.62it/s][A
Training:  11%|█▏        | 21/184 [00:02<00:15, 10.65it/s][A
Training:  13%|█▎        | 24/184 [00:02<00:12, 12.94it/s][A
Training:  14%|█▍        | 26/184 [00:02<00:15, 10.48it/s][A
Training:  16%|█▌        | 29/184 [00:03<00:15, 10.22it/s][A
Training:  18%|█▊        | 33/184 [00:03<00:13, 10.96it/s][A
Training:  20%|██        | 37/184 [00:03<00:12, 12.08it/s][A
Training:  22%|██▏       | 41/184 [00:03<00:11, 12.24it/s][A
Training:  24%|██▍       | 45/184 [00:04<00:11, 12.06it/s][A
Training:  27%|██▋       | 49/184 [00:04<00:11, 12.06it/s][A
Training:  29%|██▉       | 53/184 [00:04<00:10, 12.30it/s][A
Training:  31%|███ 

Epoch: 29/45 - Loss: 25.1128 - Accuracy: 0.8918



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:11,  1.87it/s][A
 22%|██▏       | 5/23 [00:00<00:02,  6.63it/s][A
 39%|███▉      | 9/23 [00:01<00:01,  8.75it/s][A
 57%|█████▋    | 13/23 [00:01<00:01,  9.43it/s][A
 74%|███████▍  | 17/23 [00:01<00:00, 10.23it/s][A
 83%|████████▎ | 19/23 [00:02<00:00, 11.39it/s][A
100%|██████████| 23/23 [00:02<00:00,  9.57it/s][A
Epochs:  64%|██████▍   | 29/45 [08:40<04:48, 18.01s/it]

Val Loss: 25.1993 - Val Accuracy: 0.8693



Training:   0%|          | 0/184 [00:00<?, ?it/s][A
Training:   1%|          | 1/184 [00:00<01:46,  1.72it/s][A
Training:   3%|▎         | 5/184 [00:00<00:27,  6.51it/s][A
Training:   5%|▍         | 9/184 [00:01<00:19,  8.79it/s][A
Training:   7%|▋         | 13/184 [00:01<00:17,  9.56it/s][A
Training:   9%|▊         | 16/184 [00:01<00:13, 12.14it/s][A
Training:  10%|▉         | 18/184 [00:01<00:16, 10.30it/s][A
Training:  11%|█▏        | 21/184 [00:02<00:14, 10.92it/s][A
Training:  12%|█▎        | 23/184 [00:02<00:14, 11.47it/s][A
Training:  14%|█▎        | 25/184 [00:02<00:13, 11.87it/s][A
Training:  15%|█▍        | 27/184 [00:02<00:13, 11.69it/s][A
Training:  16%|█▌        | 29/184 [00:02<00:12, 12.79it/s][A
Training:  17%|█▋        | 31/184 [00:03<00:13, 11.31it/s][A
Training:  18%|█▊        | 33/184 [00:03<00:12, 12.19it/s][A
Training:  19%|█▉        | 35/184 [00:03<00:13, 11.43it/s][A
Training:  20%|██        | 37/184 [00:03<00:12, 12.20it/s][A
Training:  21%|██  

Epoch: 30/45 - Loss: 27.8275 - Accuracy: 0.8862



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:12,  1.77it/s][A
 22%|██▏       | 5/23 [00:00<00:02,  6.41it/s][A
 39%|███▉      | 9/23 [00:01<00:01,  8.20it/s][A
 57%|█████▋    | 13/23 [00:01<00:01,  9.76it/s][A
 74%|███████▍  | 17/23 [00:01<00:00, 10.64it/s][A
100%|██████████| 23/23 [00:02<00:00,  9.82it/s][A
Epochs:  67%|██████▋   | 30/45 [08:58<04:30, 18.06s/it]

Val Loss: 30.3037 - Val Accuracy: 0.8929



Training:   0%|          | 0/184 [00:00<?, ?it/s][A
Training:   1%|          | 1/184 [00:00<01:42,  1.78it/s][A
Training:   3%|▎         | 5/184 [00:00<00:27,  6.58it/s][A
Training:   4%|▍         | 8/184 [00:00<00:16, 10.48it/s][A
Training:   5%|▌         | 10/184 [00:01<00:19,  9.06it/s][A
Training:   7%|▋         | 13/184 [00:01<00:19,  8.89it/s][A
Training:   9%|▉         | 17/184 [00:01<00:16, 10.00it/s][A
Training:  11%|█▏        | 21/184 [00:02<00:15, 10.84it/s][A
Training:  14%|█▎        | 25/184 [00:02<00:13, 11.53it/s][A
Training:  15%|█▌        | 28/184 [00:02<00:11, 13.80it/s][A
Training:  16%|█▋        | 30/184 [00:02<00:12, 12.35it/s][A
Training:  17%|█▋        | 32/184 [00:03<00:11, 13.12it/s][A
Training:  18%|█▊        | 34/184 [00:03<00:12, 11.86it/s][A
Training:  20%|██        | 37/184 [00:03<00:12, 12.13it/s][A
Training:  21%|██        | 39/184 [00:03<00:11, 12.77it/s][A
Training:  22%|██▏       | 41/184 [00:03<00:10, 13.18it/s][A
Training:  23%|██▎ 

Epoch: 31/45 - Loss: 23.9709 - Accuracy: 0.8933



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:12,  1.81it/s][A
 22%|██▏       | 5/23 [00:00<00:02,  6.76it/s][A
 39%|███▉      | 9/23 [00:01<00:01,  8.90it/s][A
 57%|█████▋    | 13/23 [00:01<00:01,  9.53it/s][A
 74%|███████▍  | 17/23 [00:01<00:00, 10.08it/s][A
100%|██████████| 23/23 [00:02<00:00,  9.85it/s][A
Epochs:  69%|██████▉   | 31/45 [09:16<04:12, 18.01s/it]

Val Loss: 27.4606 - Val Accuracy: 0.8665



Training:   0%|          | 0/184 [00:00<?, ?it/s][A
Training:   1%|          | 1/184 [00:00<01:36,  1.90it/s][A
Training:   2%|▏         | 4/184 [00:00<00:24,  7.45it/s][A
Training:   3%|▎         | 6/184 [00:00<00:25,  7.11it/s][A
Training:   5%|▍         | 9/184 [00:01<00:20,  8.69it/s][A
Training:   7%|▋         | 12/184 [00:01<00:15, 11.18it/s][A
Training:   8%|▊         | 14/184 [00:01<00:17,  9.91it/s][A
Training:   9%|▉         | 17/184 [00:01<00:16, 10.25it/s][A
Training:  10%|█         | 19/184 [00:02<00:14, 11.76it/s][A
Training:  11%|█▏        | 21/184 [00:02<00:16,  9.73it/s][A
Training:  14%|█▎        | 25/184 [00:02<00:14, 10.80it/s][A
Training:  16%|█▌        | 29/184 [00:02<00:14, 10.97it/s][A
Training:  17%|█▋        | 32/184 [00:03<00:11, 13.24it/s][A
Training:  18%|█▊        | 34/184 [00:03<00:13, 11.05it/s][A
Training:  20%|██        | 37/184 [00:03<00:13, 11.25it/s][A
Training:  22%|██▏       | 41/184 [00:03<00:12, 11.82it/s][A
Training:  24%|██▍  

Epoch: 32/45 - Loss: 25.6957 - Accuracy: 0.8887



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:12,  1.70it/s][A
 22%|██▏       | 5/23 [00:00<00:02,  6.41it/s][A
 39%|███▉      | 9/23 [00:01<00:01,  8.50it/s][A
 57%|█████▋    | 13/23 [00:01<00:01,  9.94it/s][A
 70%|██████▉   | 16/23 [00:01<00:00, 12.28it/s][A
 78%|███████▊  | 18/23 [00:01<00:00, 11.09it/s][A
100%|██████████| 23/23 [00:02<00:00,  9.71it/s][A
Epochs:  71%|███████   | 32/45 [09:34<03:54, 18.03s/it]

Val Loss: 25.9884 - Val Accuracy: 0.8705



Training:   0%|          | 0/184 [00:00<?, ?it/s][A
Training:   1%|          | 1/184 [00:00<01:40,  1.83it/s][A
Training:   2%|▏         | 4/184 [00:00<00:23,  7.57it/s][A
Training:   3%|▎         | 6/184 [00:00<00:21,  8.14it/s][A
Training:   4%|▍         | 8/184 [00:01<00:17,  9.94it/s][A
Training:   5%|▌         | 10/184 [00:01<00:18,  9.25it/s][A
Training:   7%|▋         | 12/184 [00:01<00:15, 11.04it/s][A
Training:   8%|▊         | 14/184 [00:01<00:16, 10.22it/s][A
Training:   9%|▉         | 17/184 [00:01<00:16, 10.07it/s][A
Training:  11%|█         | 20/184 [00:02<00:12, 13.17it/s][A
Training:  12%|█▏        | 22/184 [00:02<00:13, 11.61it/s][A
Training:  13%|█▎        | 24/184 [00:02<00:12, 12.75it/s][A
Training:  14%|█▍        | 26/184 [00:02<00:14, 11.26it/s][A
Training:  15%|█▌        | 28/184 [00:02<00:12, 12.86it/s][A
Training:  16%|█▋        | 30/184 [00:02<00:13, 11.58it/s][A
Training:  17%|█▋        | 32/184 [00:03<00:11, 12.74it/s][A
Training:  18%|█▊   

Epoch: 33/45 - Loss: 26.3735 - Accuracy: 0.8874



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:13,  1.60it/s][A
 22%|██▏       | 5/23 [00:00<00:02,  6.54it/s][A
 39%|███▉      | 9/23 [00:01<00:01,  8.88it/s][A
 57%|█████▋    | 13/23 [00:01<00:01,  9.88it/s][A
 74%|███████▍  | 17/23 [00:01<00:00, 10.59it/s][A
100%|██████████| 23/23 [00:02<00:00,  9.80it/s][A
Epochs:  73%|███████▎  | 33/45 [09:52<03:36, 18.04s/it]

Val Loss: 37.4745 - Val Accuracy: 0.8698



Training:   0%|          | 0/184 [00:00<?, ?it/s][A
Training:   1%|          | 1/184 [00:00<01:49,  1.67it/s][A
Training:   3%|▎         | 5/184 [00:00<00:28,  6.30it/s][A
Training:   5%|▍         | 9/184 [00:01<00:21,  8.25it/s][A
Training:   7%|▋         | 13/184 [00:01<00:17,  9.63it/s][A
Training:   9%|▉         | 17/184 [00:01<00:15, 10.78it/s][A
Training:  11%|█▏        | 21/184 [00:02<00:14, 10.92it/s][A
Training:  14%|█▎        | 25/184 [00:02<00:13, 11.57it/s][A
Training:  16%|█▌        | 29/184 [00:02<00:13, 11.33it/s][A
Training:  18%|█▊        | 33/184 [00:03<00:13, 11.09it/s][A
Training:  20%|██        | 37/184 [00:03<00:13, 11.15it/s][A
Training:  22%|██▏       | 41/184 [00:03<00:12, 11.76it/s][A
Training:  24%|██▍       | 45/184 [00:04<00:11, 12.18it/s][A
Training:  27%|██▋       | 49/184 [00:04<00:10, 12.38it/s][A
Training:  28%|██▊       | 51/184 [00:04<00:10, 13.01it/s][A
Training:  29%|██▉       | 53/184 [00:04<00:10, 12.21it/s][A
Training:  30%|██▉ 

Epoch: 34/45 - Loss: 30.6600 - Accuracy: 0.8879



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:11,  1.83it/s][A
 22%|██▏       | 5/23 [00:00<00:02,  6.77it/s][A
 39%|███▉      | 9/23 [00:01<00:01,  8.92it/s][A
 57%|█████▋    | 13/23 [00:01<00:00, 10.38it/s][A
 65%|██████▌   | 15/23 [00:01<00:00, 11.49it/s][A
 74%|███████▍  | 17/23 [00:01<00:00, 10.88it/s][A
 83%|████████▎ | 19/23 [00:01<00:00, 12.00it/s][A
100%|██████████| 23/23 [00:02<00:00,  9.88it/s][A
Epochs:  76%|███████▌  | 34/45 [10:10<03:18, 18.01s/it]

Val Loss: 33.8798 - Val Accuracy: 0.8778



Training:   0%|          | 0/184 [00:00<?, ?it/s][A
Training:   1%|          | 1/184 [00:00<01:46,  1.71it/s][A
Training:   3%|▎         | 5/184 [00:00<00:29,  6.09it/s][A
Training:   5%|▍         | 9/184 [00:01<00:21,  8.28it/s][A
Training:   7%|▋         | 13/184 [00:01<00:17,  9.80it/s][A
Training:   9%|▉         | 17/184 [00:01<00:15, 10.53it/s][A
Training:  11%|█▏        | 21/184 [00:02<00:15, 10.84it/s][A
Training:  14%|█▎        | 25/184 [00:02<00:14, 11.04it/s][A
Training:  16%|█▌        | 29/184 [00:02<00:13, 11.48it/s][A
Training:  18%|█▊        | 33/184 [00:03<00:12, 11.81it/s][A
Training:  20%|██        | 37/184 [00:03<00:12, 12.18it/s][A
Training:  22%|██▏       | 41/184 [00:03<00:11, 12.33it/s][A
Training:  24%|██▍       | 45/184 [00:04<00:11, 12.62it/s][A
Training:  27%|██▋       | 49/184 [00:04<00:10, 13.25it/s][A
Training:  28%|██▊       | 52/184 [00:04<00:08, 15.17it/s][A
Training:  29%|██▉       | 54/184 [00:04<00:09, 13.45it/s][A
Training:  30%|███ 

Epoch: 35/45 - Loss: 27.3378 - Accuracy: 0.8862



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:12,  1.79it/s][A
 22%|██▏       | 5/23 [00:00<00:02,  6.62it/s][A
 39%|███▉      | 9/23 [00:01<00:01,  9.14it/s][A
 48%|████▊     | 11/23 [00:01<00:01, 10.69it/s][A
 57%|█████▋    | 13/23 [00:01<00:01,  9.17it/s][A
 74%|███████▍  | 17/23 [00:01<00:00, 10.62it/s][A
100%|██████████| 23/23 [00:02<00:00,  9.85it/s][A
Epochs:  78%|███████▊  | 35/45 [10:28<03:00, 18.04s/it]

Val Loss: 22.8491 - Val Accuracy: 0.8900



Training:   0%|          | 0/184 [00:00<?, ?it/s][A
Training:   1%|          | 1/184 [00:00<01:47,  1.70it/s][A
Training:   2%|▏         | 4/184 [00:00<00:24,  7.21it/s][A
Training:   3%|▎         | 6/184 [00:00<00:23,  7.57it/s][A
Training:   5%|▍         | 9/184 [00:01<00:21,  8.17it/s][A
Training:   7%|▋         | 13/184 [00:01<00:18,  9.38it/s][A
Training:   9%|▉         | 17/184 [00:01<00:16, 10.35it/s][A
Training:  11%|█▏        | 21/184 [00:02<00:14, 10.92it/s][A
Training:  14%|█▎        | 25/184 [00:02<00:13, 11.66it/s][A
Training:  16%|█▌        | 29/184 [00:02<00:13, 11.55it/s][A
Training:  18%|█▊        | 33/184 [00:03<00:13, 10.87it/s][A
Training:  20%|██        | 37/184 [00:03<00:13, 10.83it/s][A
Training:  22%|██▏       | 41/184 [00:04<00:12, 11.47it/s][A
Training:  24%|██▍       | 45/184 [00:04<00:11, 12.15it/s][A
Training:  27%|██▋       | 49/184 [00:04<00:10, 12.37it/s][A
Training:  29%|██▉       | 53/184 [00:04<00:09, 13.38it/s][A
Training:  31%|███  

Epoch: 36/45 - Loss: 26.3527 - Accuracy: 0.8882



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:12,  1.72it/s][A
 22%|██▏       | 5/23 [00:00<00:02,  6.34it/s][A
 39%|███▉      | 9/23 [00:01<00:01,  8.16it/s][A
 57%|█████▋    | 13/23 [00:01<00:01,  9.71it/s][A
 74%|███████▍  | 17/23 [00:01<00:00, 10.76it/s][A
100%|██████████| 23/23 [00:02<00:00, 10.05it/s][A
Epochs:  80%|████████  | 36/45 [10:46<02:41, 17.99s/it]

Val Loss: 25.7577 - Val Accuracy: 0.8785



Training:   0%|          | 0/184 [00:00<?, ?it/s][A
Training:   1%|          | 1/184 [00:00<01:42,  1.78it/s][A
Training:   3%|▎         | 5/184 [00:00<00:27,  6.58it/s][A
Training:   5%|▍         | 9/184 [00:01<00:21,  8.17it/s][A
Training:   7%|▋         | 13/184 [00:01<00:18,  9.23it/s][A
Training:   9%|▉         | 17/184 [00:01<00:16, 10.18it/s][A
Training:  11%|█▏        | 21/184 [00:02<00:15, 10.25it/s][A
Training:  14%|█▎        | 25/184 [00:02<00:14, 10.67it/s][A
Training:  16%|█▌        | 29/184 [00:02<00:13, 11.46it/s][A
Training:  18%|█▊        | 33/184 [00:03<00:12, 11.70it/s][A
Training:  20%|██        | 37/184 [00:03<00:13, 11.14it/s][A
Training:  22%|██▏       | 41/184 [00:04<00:12, 11.25it/s][A
Training:  24%|██▍       | 45/184 [00:04<00:12, 10.81it/s][A
Training:  27%|██▋       | 49/184 [00:04<00:11, 11.39it/s][A
Training:  29%|██▉       | 53/184 [00:05<00:11, 11.60it/s][A
Training:  31%|███       | 57/184 [00:05<00:10, 11.64it/s][A
Training:  33%|███▎

Epoch: 37/45 - Loss: 30.6630 - Accuracy: 0.8873



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:11,  1.90it/s][A
 22%|██▏       | 5/23 [00:00<00:02,  6.85it/s][A
 26%|██▌       | 6/23 [00:00<00:02,  7.27it/s][A
 39%|███▉      | 9/23 [00:01<00:01,  8.56it/s][A
 57%|█████▋    | 13/23 [00:01<00:01,  9.98it/s][A
 74%|███████▍  | 17/23 [00:01<00:00, 11.03it/s][A
 87%|████████▋ | 20/23 [00:01<00:00, 13.56it/s][A
100%|██████████| 23/23 [00:02<00:00,  9.85it/s][A
Epochs:  82%|████████▏ | 37/45 [11:04<02:23, 17.98s/it]

Val Loss: 34.1414 - Val Accuracy: 0.8561



Training:   0%|          | 0/184 [00:00<?, ?it/s][A
Training:   1%|          | 1/184 [00:00<01:47,  1.71it/s][A
Training:   2%|▏         | 3/184 [00:00<00:34,  5.26it/s][A
Training:   3%|▎         | 5/184 [00:00<00:26,  6.87it/s][A
Training:   4%|▍         | 7/184 [00:01<00:18,  9.38it/s][A
Training:   5%|▍         | 9/184 [00:01<00:19,  9.06it/s][A
Training:   6%|▌         | 11/184 [00:01<00:17,  9.85it/s][A
Training:   7%|▋         | 13/184 [00:01<00:16, 10.22it/s][A
Training:   8%|▊         | 15/184 [00:01<00:15, 10.73it/s][A
Training:   9%|▉         | 17/184 [00:01<00:15, 11.00it/s][A
Training:  10%|█         | 19/184 [00:02<00:14, 11.56it/s][A
Training:  11%|█▏        | 21/184 [00:02<00:14, 11.49it/s][A
Training:  12%|█▎        | 23/184 [00:02<00:15, 10.72it/s][A
Training:  14%|█▎        | 25/184 [00:02<00:13, 11.81it/s][A
Training:  15%|█▍        | 27/184 [00:02<00:13, 11.42it/s][A
Training:  16%|█▌        | 29/184 [00:02<00:12, 12.39it/s][A
Training:  17%|█▋    

Epoch: 38/45 - Loss: 30.7382 - Accuracy: 0.8859



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:14,  1.54it/s][A
 22%|██▏       | 5/23 [00:00<00:02,  6.11it/s][A
 39%|███▉      | 9/23 [00:01<00:01,  8.64it/s][A
 57%|█████▋    | 13/23 [00:01<00:01,  9.76it/s][A
 74%|███████▍  | 17/23 [00:01<00:00, 10.11it/s][A
100%|██████████| 23/23 [00:02<00:00,  9.84it/s][A
Epochs:  84%|████████▍ | 38/45 [11:23<02:06, 18.06s/it]

Val Loss: 28.7342 - Val Accuracy: 0.8734



Training:   0%|          | 0/184 [00:00<?, ?it/s][A
Training:   1%|          | 1/184 [00:00<01:48,  1.69it/s][A
Training:   3%|▎         | 5/184 [00:00<00:29,  6.09it/s][A
Training:   5%|▍         | 9/184 [00:01<00:21,  8.33it/s][A
Training:   7%|▋         | 12/184 [00:01<00:15, 11.18it/s][A
Training:   8%|▊         | 14/184 [00:01<00:17,  9.85it/s][A
Training:   9%|▉         | 17/184 [00:01<00:16, 10.03it/s][A
Training:  10%|█         | 19/184 [00:02<00:15, 10.59it/s][A
Training:  11%|█▏        | 21/184 [00:02<00:15, 10.64it/s][A
Training:  12%|█▎        | 23/184 [00:02<00:14, 11.08it/s][A
Training:  14%|█▎        | 25/184 [00:02<00:14, 11.06it/s][A
Training:  15%|█▍        | 27/184 [00:02<00:13, 11.71it/s][A
Training:  16%|█▌        | 29/184 [00:02<00:12, 12.03it/s][A
Training:  17%|█▋        | 31/184 [00:03<00:13, 11.23it/s][A
Training:  18%|█▊        | 33/184 [00:03<00:13, 11.57it/s][A
Training:  19%|█▉        | 35/184 [00:03<00:13, 11.21it/s][A
Training:  20%|██  

Epoch: 39/45 - Loss: 28.0410 - Accuracy: 0.8891



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:12,  1.73it/s][A
 22%|██▏       | 5/23 [00:00<00:02,  6.30it/s][A
 39%|███▉      | 9/23 [00:01<00:01,  8.67it/s][A
 57%|█████▋    | 13/23 [00:01<00:01,  9.60it/s][A
 74%|███████▍  | 17/23 [00:01<00:00, 10.29it/s][A
100%|██████████| 23/23 [00:02<00:00,  9.80it/s][A
Epochs:  87%|████████▋ | 39/45 [11:41<01:49, 18.22s/it]

Val Loss: 31.5409 - Val Accuracy: 0.8625



Training:   0%|          | 0/184 [00:00<?, ?it/s][A
Training:   1%|          | 1/184 [00:00<01:53,  1.61it/s][A
Training:   3%|▎         | 5/184 [00:00<00:28,  6.30it/s][A
Training:   5%|▍         | 9/184 [00:01<00:20,  8.35it/s][A
Training:   7%|▋         | 13/184 [00:01<00:19,  8.78it/s][A
Training:   9%|▉         | 17/184 [00:02<00:17,  9.55it/s][A
Training:  11%|█▏        | 21/184 [00:02<00:16, 10.05it/s][A
Training:  14%|█▎        | 25/184 [00:02<00:15, 10.15it/s][A
Training:  16%|█▌        | 29/184 [00:03<00:14, 10.89it/s][A
Training:  18%|█▊        | 33/184 [00:03<00:13, 11.22it/s][A
Training:  20%|██        | 37/184 [00:03<00:13, 11.17it/s][A
Training:  22%|██▏       | 41/184 [00:04<00:11, 12.08it/s][A
Training:  23%|██▎       | 43/184 [00:04<00:10, 12.90it/s][A
Training:  24%|██▍       | 45/184 [00:04<00:11, 12.01it/s][A
Training:  26%|██▌       | 47/184 [00:04<00:11, 12.27it/s][A
Training:  27%|██▋       | 49/184 [00:04<00:11, 11.63it/s][A
Training:  28%|██▊ 

Epoch: 40/45 - Loss: 24.0890 - Accuracy: 0.8917



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:12,  1.72it/s][A
 22%|██▏       | 5/23 [00:00<00:02,  6.27it/s][A
 39%|███▉      | 9/23 [00:01<00:01,  8.64it/s][A
 57%|█████▋    | 13/23 [00:01<00:01,  9.10it/s][A
 74%|███████▍  | 17/23 [00:01<00:00,  9.99it/s][A
100%|██████████| 23/23 [00:02<00:00,  9.50it/s][A
Epochs:  89%|████████▉ | 40/45 [12:00<01:31, 18.30s/it]

Val Loss: 35.1701 - Val Accuracy: 0.8555



Training:   0%|          | 0/184 [00:00<?, ?it/s][A
Training:   1%|          | 1/184 [00:00<01:52,  1.62it/s][A
Training:   3%|▎         | 5/184 [00:00<00:29,  6.12it/s][A
Training:   5%|▍         | 9/184 [00:01<00:21,  8.25it/s][A
Training:   7%|▋         | 13/184 [00:01<00:17,  9.50it/s][A
Training:   9%|▉         | 17/184 [00:01<00:16, 10.31it/s][A
Training:  11%|█▏        | 21/184 [00:02<00:16, 10.12it/s][A
Training:  14%|█▎        | 25/184 [00:02<00:15, 10.46it/s][A
Training:  16%|█▌        | 29/184 [00:03<00:14, 10.97it/s][A
Training:  18%|█▊        | 33/184 [00:03<00:13, 11.50it/s][A
Training:  20%|██        | 37/184 [00:03<00:11, 12.28it/s][A
Training:  22%|██▏       | 41/184 [00:03<00:11, 12.54it/s][A
Training:  24%|██▍       | 45/184 [00:04<00:11, 12.52it/s][A
Training:  27%|██▋       | 49/184 [00:04<00:11, 12.11it/s][A
Training:  29%|██▉       | 53/184 [00:05<00:11, 11.66it/s][A
Training:  31%|███       | 57/184 [00:05<00:10, 11.75it/s][A
Training:  33%|███▎

Epoch: 41/45 - Loss: 25.2286 - Accuracy: 0.8904



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:14,  1.51it/s][A
 22%|██▏       | 5/23 [00:00<00:02,  6.12it/s][A
 39%|███▉      | 9/23 [00:01<00:01,  8.47it/s][A
 57%|█████▋    | 13/23 [00:01<00:01,  9.68it/s][A
 74%|███████▍  | 17/23 [00:01<00:00, 10.76it/s][A
100%|██████████| 23/23 [00:02<00:00,  9.87it/s][A
Epochs:  91%|█████████ | 41/45 [12:18<01:12, 18.19s/it]

Val Loss: 24.5972 - Val Accuracy: 0.8669



Training:   0%|          | 0/184 [00:00<?, ?it/s][A
Training:   1%|          | 1/184 [00:00<01:50,  1.65it/s][A
Training:   3%|▎         | 5/184 [00:00<00:26,  6.69it/s][A
Training:   5%|▍         | 9/184 [00:01<00:19,  8.89it/s][A
Training:   6%|▌         | 11/184 [00:01<00:16, 10.36it/s][A
Training:   7%|▋         | 13/184 [00:01<00:16, 10.57it/s][A
Training:   8%|▊         | 15/184 [00:01<00:14, 11.91it/s][A
Training:   9%|▉         | 17/184 [00:01<00:15, 10.66it/s][A
Training:  11%|█         | 20/184 [00:01<00:11, 14.16it/s][A
Training:  12%|█▏        | 22/184 [00:02<00:14, 11.56it/s][A
Training:  13%|█▎        | 24/184 [00:02<00:12, 12.40it/s][A
Training:  14%|█▍        | 26/184 [00:02<00:14, 10.68it/s][A
Training:  15%|█▌        | 28/184 [00:02<00:12, 12.26it/s][A
Training:  16%|█▋        | 30/184 [00:02<00:13, 11.12it/s][A
Training:  17%|█▋        | 32/184 [00:03<00:11, 12.79it/s][A
Training:  18%|█▊        | 34/184 [00:03<00:14, 10.60it/s][A
Training:  20%|██  

Epoch: 42/45 - Loss: 25.8794 - Accuracy: 0.8845



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:13,  1.65it/s][A
 22%|██▏       | 5/23 [00:00<00:02,  6.55it/s][A
 39%|███▉      | 9/23 [00:01<00:01,  8.73it/s][A
 57%|█████▋    | 13/23 [00:01<00:00, 10.23it/s][A
 74%|███████▍  | 17/23 [00:01<00:00, 10.46it/s][A
100%|██████████| 23/23 [00:02<00:00,  9.81it/s][A
Epochs:  93%|█████████▎| 42/45 [12:36<00:54, 18.16s/it]

Val Loss: 27.9819 - Val Accuracy: 0.8711



Training:   0%|          | 0/184 [00:00<?, ?it/s][A
Training:   1%|          | 1/184 [00:00<01:47,  1.71it/s][A
Training:   3%|▎         | 5/184 [00:00<00:30,  5.96it/s][A
Training:   5%|▍         | 9/184 [00:01<00:21,  8.13it/s][A
Training:   7%|▋         | 13/184 [00:01<00:18,  9.22it/s][A
Training:   9%|▉         | 17/184 [00:02<00:16,  9.91it/s][A
Training:  11%|█▏        | 21/184 [00:02<00:15, 10.40it/s][A
Training:  14%|█▎        | 25/184 [00:02<00:14, 10.90it/s][A
Training:  16%|█▌        | 29/184 [00:03<00:13, 11.34it/s][A
Training:  18%|█▊        | 33/184 [00:03<00:13, 11.36it/s][A
Training:  20%|██        | 37/184 [00:03<00:13, 11.25it/s][A
Training:  22%|██▏       | 41/184 [00:04<00:12, 11.66it/s][A
Training:  24%|██▍       | 45/184 [00:04<00:11, 11.93it/s][A
Training:  27%|██▋       | 49/184 [00:04<00:10, 12.51it/s][A
Training:  29%|██▉       | 53/184 [00:04<00:10, 12.54it/s][A
Training:  31%|███       | 57/184 [00:05<00:09, 12.73it/s][A
Training:  32%|███▏

Epoch: 43/45 - Loss: 26.0104 - Accuracy: 0.8885



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:11,  1.91it/s][A
 22%|██▏       | 5/23 [00:00<00:02,  7.09it/s][A
 39%|███▉      | 9/23 [00:01<00:01,  9.00it/s][A
 52%|█████▏    | 12/23 [00:01<00:00, 12.14it/s][A
 61%|██████    | 14/23 [00:01<00:00,  9.51it/s][A
 74%|███████▍  | 17/23 [00:01<00:00, 10.28it/s][A
 83%|████████▎ | 19/23 [00:01<00:00, 11.37it/s][A
 91%|█████████▏| 21/23 [00:02<00:00, 11.09it/s][A
100%|██████████| 23/23 [00:02<00:00,  9.89it/s][A
Epochs:  96%|█████████▌| 43/45 [12:54<00:36, 18.21s/it]

Val Loss: 36.1253 - Val Accuracy: 0.8751



Training:   0%|          | 0/184 [00:00<?, ?it/s][A
Training:   1%|          | 1/184 [00:00<01:53,  1.62it/s][A
Training:   3%|▎         | 5/184 [00:00<00:27,  6.57it/s][A
Training:   5%|▍         | 9/184 [00:01<00:20,  8.64it/s][A
Training:   7%|▋         | 13/184 [00:01<00:17,  9.82it/s][A
Training:   9%|▉         | 17/184 [00:01<00:16,  9.94it/s][A
Training:  11%|█▏        | 21/184 [00:02<00:15, 10.35it/s][A
Training:  14%|█▎        | 25/184 [00:02<00:14, 11.03it/s][A
Training:  16%|█▌        | 29/184 [00:02<00:13, 11.79it/s][A
Training:  18%|█▊        | 33/184 [00:03<00:13, 11.59it/s][A
Training:  20%|██        | 37/184 [00:03<00:13, 11.19it/s][A
Training:  22%|██▏       | 41/184 [00:04<00:12, 11.09it/s][A
Training:  24%|██▍       | 45/184 [00:04<00:11, 11.74it/s][A
Training:  27%|██▋       | 49/184 [00:04<00:11, 12.02it/s][A
Training:  29%|██▉       | 53/184 [00:05<00:11, 11.87it/s][A
Training:  31%|███       | 57/184 [00:05<00:10, 11.85it/s][A
Training:  33%|███▎

Epoch: 44/45 - Loss: 26.9246 - Accuracy: 0.8895



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:12,  1.80it/s][A
 22%|██▏       | 5/23 [00:00<00:02,  6.64it/s][A
 39%|███▉      | 9/23 [00:01<00:01,  8.34it/s][A
 57%|█████▋    | 13/23 [00:01<00:01,  9.23it/s][A
 74%|███████▍  | 17/23 [00:01<00:00, 10.15it/s][A
100%|██████████| 23/23 [00:02<00:00,  9.88it/s][A
Epochs:  98%|█████████▊| 44/45 [13:12<00:18, 18.19s/it]

Val Loss: 24.1326 - Val Accuracy: 0.8819



Training:   0%|          | 0/184 [00:00<?, ?it/s][A
Training:   1%|          | 1/184 [00:00<01:37,  1.87it/s][A
Training:   3%|▎         | 5/184 [00:00<00:27,  6.51it/s][A
Training:   5%|▍         | 9/184 [00:01<00:19,  8.95it/s][A
Training:   7%|▋         | 12/184 [00:01<00:14, 12.05it/s][A
Training:   8%|▊         | 14/184 [00:01<00:17,  9.72it/s][A
Training:   9%|▉         | 17/184 [00:01<00:16, 10.07it/s][A
Training:  11%|█         | 20/184 [00:02<00:12, 12.74it/s][A
Training:  12%|█▏        | 22/184 [00:02<00:16, 10.09it/s][A
Training:  14%|█▎        | 25/184 [00:02<00:14, 11.20it/s][A
Training:  15%|█▍        | 27/184 [00:02<00:13, 11.80it/s][A
Training:  16%|█▌        | 29/184 [00:02<00:13, 11.54it/s][A
Training:  17%|█▋        | 31/184 [00:03<00:12, 12.12it/s][A
Training:  18%|█▊        | 33/184 [00:03<00:13, 10.83it/s][A
Training:  19%|█▉        | 35/184 [00:03<00:12, 12.31it/s][A
Training:  20%|██        | 37/184 [00:03<00:13, 11.28it/s][A
Training:  21%|██  

Epoch: 45/45 - Loss: 25.6260 - Accuracy: 0.8908



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:12,  1.83it/s][A
 13%|█▎        | 3/23 [00:00<00:03,  5.48it/s][A
 22%|██▏       | 5/23 [00:00<00:02,  6.53it/s][A
 39%|███▉      | 9/23 [00:01<00:01,  8.55it/s][A
 57%|█████▋    | 13/23 [00:01<00:01,  9.75it/s][A
 74%|███████▍  | 17/23 [00:01<00:00, 10.57it/s][A
100%|██████████| 23/23 [00:02<00:00,  9.61it/s][A
Epochs: 100%|██████████| 45/45 [13:30<00:00, 18.02s/it]


Val Loss: 27.6988 - Val Accuracy: 0.8756


[32m[I 2023-12-11 23:52:01,619][0m Trial 1 finished with value: 0.8755995035171509 and parameters: {'learning_rate': 0.05684972267027994, 'weight_decay': 0.003481723709485491, 'epsilon': 1.1793575954143915e-09, 'batch_size': 76, 'epochs': 45}. Best is trial 0 with value: 0.9175874590873718.[0m


Learning rate: 7.580753858884148e-05
Weight decay: 0.0012623191952287505
Epsilon: 1.085471414745964e-09
Batch size: 154
Number of epochs: 93


Epochs:   0%|          | 0/93 [00:00<?, ?it/s]
Training:   0%|          | 0/91 [00:00<?, ?it/s][A
Training:   1%|          | 1/91 [00:00<01:18,  1.15it/s][A
Training:   2%|▏         | 2/91 [00:01<00:39,  2.25it/s][A
Training:   5%|▌         | 5/91 [00:01<00:20,  4.20it/s][A
Training:   7%|▋         | 6/91 [00:01<00:19,  4.43it/s][A
Training:  10%|▉         | 9/91 [00:02<00:16,  4.95it/s][A
Training:  11%|█         | 10/91 [00:02<00:17,  4.72it/s][A
Training:  14%|█▍        | 13/91 [00:02<00:14,  5.47it/s][A
Training:  15%|█▌        | 14/91 [00:03<00:14,  5.42it/s][A
Training:  19%|█▊        | 17/91 [00:03<00:13,  5.47it/s][A
Training:  20%|█▉        | 18/91 [00:03<00:13,  5.40it/s][A
Training:  23%|██▎       | 21/91 [00:04<00:11,  6.04it/s][A
Training:  24%|██▍       | 22/91 [00:04<00:12,  5.51it/s][A
Training:  27%|██▋       | 25/91 [00:04<00:11,  5.88it/s][A
Training:  29%|██▊       | 26/91 [00:05<00:11,  5.73it/s][A
Training:  32%|███▏      | 29/91 [00:05<00:10,  5.81

Epoch: 1/93 - Loss: 0.4473 - Accuracy: 0.8338



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:00<00:10,  1.08it/s][A
 42%|████▏     | 5/12 [00:01<00:01,  3.64it/s][A
100%|██████████| 12/12 [00:02<00:00,  5.10it/s][A
Epochs:   1%|          | 1/93 [00:18<28:00, 18.26s/it]

Val Loss: 0.3158 - Val Accuracy: 0.8895



Training:   0%|          | 0/91 [00:00<?, ?it/s][A
Training:   1%|          | 1/91 [00:01<01:30,  1.00s/it][A
Training:   5%|▌         | 5/91 [00:01<00:26,  3.21it/s][A
Training:   9%|▉         | 8/91 [00:01<00:14,  5.59it/s][A
Training:  11%|█         | 10/91 [00:02<00:17,  4.54it/s][A
Training:  14%|█▍        | 13/91 [00:03<00:17,  4.40it/s][A
Training:  18%|█▊        | 16/91 [00:03<00:11,  6.38it/s][A
Training:  20%|█▉        | 18/91 [00:03<00:13,  5.58it/s][A
Training:  23%|██▎       | 21/91 [00:04<00:13,  5.23it/s][A
Training:  26%|██▋       | 24/91 [00:04<00:09,  7.12it/s][A
Training:  29%|██▊       | 26/91 [00:05<00:11,  5.66it/s][A
Training:  32%|███▏      | 29/91 [00:05<00:11,  5.32it/s][A
Training:  36%|███▋      | 33/91 [00:06<00:10,  5.69it/s][A
Training:  41%|████      | 37/91 [00:07<00:09,  5.83it/s][A
Training:  45%|████▌     | 41/91 [00:07<00:08,  5.72it/s][A
Training:  49%|████▉     | 45/91 [00:08<00:08,  5.59it/s][A
Training:  54%|█████▍    | 49/91 [0

Epoch: 2/93 - Loss: 0.2722 - Accuracy: 0.9046



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:00<00:09,  1.12it/s][A
 42%|████▏     | 5/12 [00:01<00:01,  3.62it/s][A
100%|██████████| 12/12 [00:02<00:00,  5.27it/s][A
Epochs:   2%|▏         | 2/93 [00:36<27:29, 18.13s/it]

Val Loss: 0.2466 - Val Accuracy: 0.9004



Training:   0%|          | 0/91 [00:00<?, ?it/s][A
Training:   1%|          | 1/91 [00:01<01:29,  1.00it/s][A
Training:   4%|▍         | 4/91 [00:01<00:19,  4.52it/s][A
Training:   7%|▋         | 6/91 [00:01<00:21,  3.93it/s][A
Training:  10%|▉         | 9/91 [00:02<00:18,  4.37it/s][A
Training:  12%|█▏        | 11/91 [00:02<00:14,  5.48it/s][A
Training:  14%|█▍        | 13/91 [00:03<00:16,  4.67it/s][A
Training:  16%|█▋        | 15/91 [00:03<00:12,  6.09it/s][A
Training:  19%|█▊        | 17/91 [00:03<00:15,  4.76it/s][A
Training:  22%|██▏       | 20/91 [00:03<00:10,  7.04it/s][A
Training:  24%|██▍       | 22/91 [00:04<00:12,  5.38it/s][A
Training:  27%|██▋       | 25/91 [00:05<00:12,  5.08it/s][A
Training:  32%|███▏      | 29/91 [00:05<00:11,  5.52it/s][A
Training:  35%|███▌      | 32/91 [00:05<00:08,  7.21it/s][A
Training:  37%|███▋      | 34/91 [00:06<00:09,  6.20it/s][A
Training:  40%|███▉      | 36/91 [00:06<00:07,  7.30it/s][A
Training:  42%|████▏     | 38/91 [00

Epoch: 3/93 - Loss: 0.2276 - Accuracy: 0.9171



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:00<00:10,  1.06it/s][A
 33%|███▎      | 4/12 [00:01<00:01,  4.81it/s][A
 50%|█████     | 6/12 [00:01<00:01,  3.81it/s][A
100%|██████████| 12/12 [00:02<00:00,  4.93it/s][A
Epochs:   3%|▎         | 3/93 [00:54<27:20, 18.23s/it]

Val Loss: 0.2243 - Val Accuracy: 0.9112



Training:   0%|          | 0/91 [00:00<?, ?it/s][A
Training:   1%|          | 1/91 [00:01<01:35,  1.06s/it][A
Training:   5%|▌         | 5/91 [00:01<00:25,  3.43it/s][A
Training:   9%|▉         | 8/91 [00:01<00:14,  5.88it/s][A
Training:  11%|█         | 10/91 [00:02<00:17,  4.75it/s][A
Training:  14%|█▍        | 13/91 [00:03<00:16,  4.83it/s][A
Training:  15%|█▌        | 14/91 [00:03<00:14,  5.23it/s][A
Training:  19%|█▊        | 17/91 [00:03<00:13,  5.56it/s][A
Training:  21%|██        | 19/91 [00:03<00:10,  6.96it/s][A
Training:  23%|██▎       | 21/91 [00:04<00:13,  5.27it/s][A
Training:  26%|██▋       | 24/91 [00:04<00:08,  7.59it/s][A
Training:  29%|██▊       | 26/91 [00:05<00:12,  5.40it/s][A
Training:  32%|███▏      | 29/91 [00:05<00:11,  5.28it/s][A
Training:  36%|███▋      | 33/91 [00:06<00:10,  5.47it/s][A
Training:  41%|████      | 37/91 [00:07<00:09,  5.57it/s][A
Training:  45%|████▌     | 41/91 [00:07<00:08,  5.56it/s][A
Training:  49%|████▉     | 45/91 [0

Epoch: 4/93 - Loss: 0.2095 - Accuracy: 0.9241



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:00<00:10,  1.06it/s][A
 42%|████▏     | 5/12 [00:01<00:02,  3.40it/s][A
100%|██████████| 12/12 [00:02<00:00,  5.00it/s][A
Epochs:   4%|▍         | 4/93 [01:12<27:03, 18.24s/it]

Val Loss: 0.2166 - Val Accuracy: 0.9161



Training:   0%|          | 0/91 [00:00<?, ?it/s][A
Training:   1%|          | 1/91 [00:00<01:20,  1.12it/s][A
Training:   4%|▍         | 4/91 [00:01<00:17,  5.04it/s][A
Training:   7%|▋         | 6/91 [00:01<00:21,  3.97it/s][A
Training:  10%|▉         | 9/91 [00:02<00:18,  4.38it/s][A
Training:  11%|█         | 10/91 [00:02<00:16,  4.81it/s][A
Training:  14%|█▍        | 13/91 [00:02<00:15,  4.97it/s][A
Training:  16%|█▋        | 15/91 [00:03<00:12,  6.33it/s][A
Training:  19%|█▊        | 17/91 [00:03<00:13,  5.63it/s][A
Training:  20%|█▉        | 18/91 [00:03<00:13,  5.58it/s][A
Training:  23%|██▎       | 21/91 [00:04<00:12,  5.58it/s][A
Training:  24%|██▍       | 22/91 [00:04<00:12,  5.41it/s][A
Training:  27%|██▋       | 25/91 [00:04<00:11,  5.98it/s][A
Training:  29%|██▊       | 26/91 [00:05<00:11,  5.63it/s][A
Training:  32%|███▏      | 29/91 [00:05<00:09,  6.21it/s][A
Training:  33%|███▎      | 30/91 [00:05<00:10,  5.92it/s][A
Training:  36%|███▋      | 33/91 [00

Epoch: 5/93 - Loss: 0.2000 - Accuracy: 0.9254



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:11,  1.00s/it][A
 42%|████▏     | 5/12 [00:01<00:01,  3.53it/s][A
100%|██████████| 12/12 [00:02<00:00,  4.98it/s][A
Epochs:   5%|▌         | 5/93 [01:30<26:34, 18.12s/it]

Val Loss: 0.2105 - Val Accuracy: 0.9150



Training:   0%|          | 0/91 [00:00<?, ?it/s][A
Training:   1%|          | 1/91 [00:00<01:21,  1.10it/s][A
Training:   4%|▍         | 4/91 [00:01<00:17,  4.94it/s][A
Training:   7%|▋         | 6/91 [00:01<00:20,  4.07it/s][A
Training:  10%|▉         | 9/91 [00:02<00:19,  4.28it/s][A
Training:  12%|█▏        | 11/91 [00:02<00:14,  5.59it/s][A
Training:  14%|█▍        | 13/91 [00:02<00:16,  4.66it/s][A
Training:  18%|█▊        | 16/91 [00:03<00:10,  6.97it/s][A
Training:  20%|█▉        | 18/91 [00:03<00:12,  5.62it/s][A
Training:  23%|██▎       | 21/91 [00:04<00:13,  5.38it/s][A
Training:  27%|██▋       | 25/91 [00:04<00:11,  5.67it/s][A
Training:  32%|███▏      | 29/91 [00:05<00:10,  5.68it/s][A
Training:  36%|███▋      | 33/91 [00:06<00:09,  6.20it/s][A
Training:  40%|███▉      | 36/91 [00:06<00:07,  7.81it/s][A
Training:  42%|████▏     | 38/91 [00:06<00:08,  5.96it/s][A
Training:  45%|████▌     | 41/91 [00:07<00:08,  5.64it/s][A
Training:  47%|████▋     | 43/91 [00

Epoch: 6/93 - Loss: 0.1936 - Accuracy: 0.9284



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:00<00:09,  1.11it/s][A
 42%|████▏     | 5/12 [00:01<00:01,  3.68it/s][A
 50%|█████     | 6/12 [00:01<00:01,  4.31it/s][A
100%|██████████| 12/12 [00:02<00:00,  5.16it/s][A
Epochs:   6%|▋         | 6/93 [01:48<26:09, 18.04s/it]

Val Loss: 0.2100 - Val Accuracy: 0.9150



Training:   0%|          | 0/91 [00:00<?, ?it/s][A
Training:   1%|          | 1/91 [00:00<01:28,  1.02it/s][A
Training:   4%|▍         | 4/91 [00:01<00:18,  4.66it/s][A
Training:   7%|▋         | 6/91 [00:01<00:22,  3.83it/s][A
Training:  10%|▉         | 9/91 [00:02<00:19,  4.29it/s][A
Training:  13%|█▎        | 12/91 [00:02<00:12,  6.45it/s][A
Training:  15%|█▌        | 14/91 [00:03<00:15,  5.07it/s][A
Training:  19%|█▊        | 17/91 [00:03<00:14,  5.07it/s][A
Training:  21%|██        | 19/91 [00:03<00:11,  6.26it/s][A
Training:  23%|██▎       | 21/91 [00:04<00:13,  5.02it/s][A
Training:  27%|██▋       | 25/91 [00:04<00:11,  5.67it/s][A
Training:  31%|███       | 28/91 [00:05<00:08,  7.53it/s][A
Training:  33%|███▎      | 30/91 [00:05<00:10,  5.91it/s][A
Training:  35%|███▌      | 32/91 [00:05<00:08,  7.00it/s][A
Training:  37%|███▋      | 34/91 [00:06<00:09,  5.79it/s][A
Training:  38%|███▊      | 35/91 [00:06<00:09,  6.03it/s][A
Training:  41%|████      | 37/91 [00

Epoch: 7/93 - Loss: 0.1900 - Accuracy: 0.9274



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:00<00:09,  1.17it/s][A
 33%|███▎      | 4/12 [00:01<00:01,  4.92it/s][A
 50%|█████     | 6/12 [00:01<00:01,  4.13it/s][A
 75%|███████▌  | 9/12 [00:02<00:00,  4.78it/s][A
100%|██████████| 12/12 [00:02<00:00,  5.22it/s][A
Epochs:   8%|▊         | 7/93 [02:06<25:53, 18.06s/it]

Val Loss: 0.2085 - Val Accuracy: 0.9161



Training:   0%|          | 0/91 [00:00<?, ?it/s][A
Training:   1%|          | 1/91 [00:00<01:20,  1.12it/s][A
Training:   3%|▎         | 3/91 [00:00<00:23,  3.72it/s][A
Training:   5%|▌         | 5/91 [00:01<00:25,  3.43it/s][A
Training:   7%|▋         | 6/91 [00:01<00:20,  4.15it/s][A
Training:  10%|▉         | 9/91 [00:02<00:17,  4.62it/s][A
Training:  11%|█         | 10/91 [00:02<00:15,  5.09it/s][A
Training:  14%|█▍        | 13/91 [00:02<00:14,  5.30it/s][A
Training:  18%|█▊        | 16/91 [00:03<00:09,  7.57it/s][A
Training:  20%|█▉        | 18/91 [00:03<00:12,  5.88it/s][A
Training:  23%|██▎       | 21/91 [00:04<00:12,  5.76it/s][A
Training:  26%|██▋       | 24/91 [00:04<00:08,  7.96it/s][A
Training:  29%|██▊       | 26/91 [00:04<00:11,  5.84it/s][A
Training:  32%|███▏      | 29/91 [00:05<00:10,  5.65it/s][A
Training:  33%|███▎      | 30/91 [00:05<00:10,  5.90it/s][A
Training:  35%|███▌      | 32/91 [00:05<00:08,  7.14it/s][A
Training:  37%|███▋      | 34/91 [00:

Epoch: 8/93 - Loss: 0.1872 - Accuracy: 0.9294



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:00<00:10,  1.06it/s][A
 33%|███▎      | 4/12 [00:01<00:01,  4.85it/s][A
 50%|█████     | 6/12 [00:01<00:01,  4.02it/s][A
100%|██████████| 12/12 [00:02<00:00,  5.04it/s][A
Epochs:   9%|▊         | 8/93 [02:24<25:32, 18.03s/it]

Val Loss: 0.2091 - Val Accuracy: 0.9101



Training:   0%|          | 0/91 [00:00<?, ?it/s][A
Training:   1%|          | 1/91 [00:00<01:18,  1.14it/s][A
Training:   3%|▎         | 3/91 [00:00<00:23,  3.69it/s][A
Training:   5%|▌         | 5/91 [00:01<00:23,  3.65it/s][A
Training:  10%|▉         | 9/91 [00:02<00:18,  4.47it/s][A
Training:  14%|█▍        | 13/91 [00:02<00:15,  5.10it/s][A
Training:  19%|█▊        | 17/91 [00:03<00:13,  5.35it/s][A
Training:  23%|██▎       | 21/91 [00:04<00:12,  5.60it/s][A
Training:  26%|██▋       | 24/91 [00:04<00:09,  7.16it/s][A
Training:  29%|██▊       | 26/91 [00:04<00:11,  5.90it/s][A
Training:  32%|███▏      | 29/91 [00:05<00:11,  5.31it/s][A
Training:  36%|███▋      | 33/91 [00:06<00:10,  5.69it/s][A
Training:  41%|████      | 37/91 [00:06<00:08,  6.01it/s][A
Training:  45%|████▌     | 41/91 [00:07<00:07,  6.37it/s][A
Training:  46%|████▌     | 42/91 [00:07<00:08,  6.12it/s][A
Training:  49%|████▉     | 45/91 [00:08<00:07,  6.29it/s][A
Training:  51%|█████     | 46/91 [00

Epoch: 9/93 - Loss: 0.1853 - Accuracy: 0.9293



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:00<00:10,  1.05it/s][A
 33%|███▎      | 4/12 [00:01<00:01,  4.52it/s][A
 50%|█████     | 6/12 [00:01<00:01,  4.27it/s][A
 67%|██████▋   | 8/12 [00:01<00:00,  5.80it/s][A
100%|██████████| 12/12 [00:02<00:00,  5.10it/s][A
Epochs:  10%|▉         | 9/93 [02:42<25:11, 17.99s/it]

Val Loss: 0.2092 - Val Accuracy: 0.9095



Training:   0%|          | 0/91 [00:00<?, ?it/s][A
Training:   1%|          | 1/91 [00:00<01:23,  1.07it/s][A
Training:   2%|▏         | 2/91 [00:01<00:39,  2.25it/s][A
Training:   5%|▌         | 5/91 [00:01<00:22,  3.81it/s][A
Training:   8%|▊         | 7/91 [00:01<00:15,  5.59it/s][A
Training:  10%|▉         | 9/91 [00:02<00:18,  4.49it/s][A
Training:  13%|█▎        | 12/91 [00:02<00:11,  6.94it/s][A
Training:  15%|█▌        | 14/91 [00:03<00:14,  5.31it/s][A
Training:  18%|█▊        | 16/91 [00:03<00:11,  6.43it/s][A
Training:  20%|█▉        | 18/91 [00:03<00:14,  5.21it/s][A
Training:  22%|██▏       | 20/91 [00:03<00:10,  6.49it/s][A
Training:  24%|██▍       | 22/91 [00:04<00:12,  5.70it/s][A
Training:  26%|██▋       | 24/91 [00:04<00:09,  6.96it/s][A
Training:  29%|██▊       | 26/91 [00:05<00:11,  5.55it/s][A
Training:  31%|███       | 28/91 [00:05<00:09,  6.47it/s][A
Training:  32%|███▏      | 29/91 [00:05<00:11,  5.25it/s][A
Training:  33%|███▎      | 30/91 [00:

Epoch: 10/93 - Loss: 0.1836 - Accuracy: 0.9306



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:10,  1.00it/s][A
 42%|████▏     | 5/12 [00:01<00:02,  3.38it/s][A
 67%|██████▋   | 8/12 [00:01<00:00,  5.79it/s][A
100%|██████████| 12/12 [00:02<00:00,  4.86it/s][A
Epochs:  11%|█         | 10/93 [03:01<25:02, 18.11s/it]

Val Loss: 0.2092 - Val Accuracy: 0.9123



Training:   0%|          | 0/91 [00:00<?, ?it/s][A
Training:   1%|          | 1/91 [00:00<01:21,  1.11it/s][A
Training:   5%|▌         | 5/91 [00:01<00:23,  3.64it/s][A
Training:  10%|▉         | 9/91 [00:02<00:18,  4.52it/s][A
Training:  14%|█▍        | 13/91 [00:02<00:15,  5.13it/s][A
Training:  18%|█▊        | 16/91 [00:03<00:10,  6.83it/s][A
Training:  20%|█▉        | 18/91 [00:03<00:13,  5.43it/s][A
Training:  23%|██▎       | 21/91 [00:04<00:12,  5.53it/s][A
Training:  24%|██▍       | 22/91 [00:04<00:11,  5.86it/s][A
Training:  27%|██▋       | 25/91 [00:04<00:11,  5.94it/s][A
Training:  29%|██▊       | 26/91 [00:04<00:11,  5.79it/s][A
Training:  32%|███▏      | 29/91 [00:05<00:10,  5.77it/s][A
Training:  33%|███▎      | 30/91 [00:05<00:10,  6.07it/s][A
Training:  36%|███▋      | 33/91 [00:06<00:09,  6.12it/s][A
Training:  37%|███▋      | 34/91 [00:06<00:09,  6.07it/s][A
Training:  41%|████      | 37/91 [00:06<00:08,  6.24it/s][A
Training:  42%|████▏     | 38/91 [0

Epoch: 11/93 - Loss: 0.1826 - Accuracy: 0.9310



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:00<00:09,  1.12it/s][A
 25%|██▌       | 3/12 [00:01<00:02,  3.58it/s][A
 42%|████▏     | 5/12 [00:01<00:01,  3.78it/s][A
 50%|█████     | 6/12 [00:01<00:01,  4.52it/s][A
 67%|██████▋   | 8/12 [00:01<00:00,  6.67it/s][A
100%|██████████| 12/12 [00:02<00:00,  4.89it/s][A
Epochs:  12%|█▏        | 11/93 [03:19<24:41, 18.07s/it]

Val Loss: 0.2078 - Val Accuracy: 0.9117



Training:   0%|          | 0/91 [00:00<?, ?it/s][A
Training:   1%|          | 1/91 [00:00<01:22,  1.09it/s][A
Training:   5%|▌         | 5/91 [00:01<00:22,  3.74it/s][A
Training:   9%|▉         | 8/91 [00:01<00:13,  6.08it/s][A
Training:  11%|█         | 10/91 [00:02<00:16,  4.83it/s][A
Training:  13%|█▎        | 12/91 [00:02<00:12,  6.15it/s][A
Training:  15%|█▌        | 14/91 [00:02<00:14,  5.13it/s][A
Training:  18%|█▊        | 16/91 [00:03<00:12,  6.08it/s][A
Training:  19%|█▊        | 17/91 [00:03<00:16,  4.48it/s][A
Training:  22%|██▏       | 20/91 [00:03<00:10,  6.53it/s][A
Training:  23%|██▎       | 21/91 [00:04<00:14,  4.83it/s][A
Training:  26%|██▋       | 24/91 [00:04<00:09,  7.29it/s][A
Training:  29%|██▊       | 26/91 [00:04<00:11,  5.64it/s][A
Training:  32%|███▏      | 29/91 [00:05<00:11,  5.35it/s][A
Training:  35%|███▌      | 32/91 [00:05<00:07,  7.43it/s][A
Training:  37%|███▋      | 34/91 [00:06<00:09,  5.71it/s][A
Training:  41%|████      | 37/91 [0

Epoch: 12/93 - Loss: 0.1822 - Accuracy: 0.9313



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:00<00:10,  1.01it/s][A
 42%|████▏     | 5/12 [00:01<00:02,  3.36it/s][A
100%|██████████| 12/12 [00:02<00:00,  4.97it/s][A
Epochs:  13%|█▎        | 12/93 [03:37<24:25, 18.09s/it]

Val Loss: 0.2067 - Val Accuracy: 0.9133



Training:   0%|          | 0/91 [00:00<?, ?it/s][A
Training:   1%|          | 1/91 [00:00<01:22,  1.08it/s][A
Training:   5%|▌         | 5/91 [00:01<00:23,  3.63it/s][A
Training:   8%|▊         | 7/91 [00:01<00:15,  5.26it/s][A
Training:  10%|▉         | 9/91 [00:02<00:18,  4.54it/s][A
Training:  12%|█▏        | 11/91 [00:02<00:13,  6.02it/s][A
Training:  14%|█▍        | 13/91 [00:02<00:15,  5.14it/s][A
Training:  16%|█▋        | 15/91 [00:02<00:11,  6.66it/s][A
Training:  19%|█▊        | 17/91 [00:03<00:14,  5.00it/s][A
Training:  22%|██▏       | 20/91 [00:03<00:09,  7.11it/s][A
Training:  24%|██▍       | 22/91 [00:04<00:12,  5.62it/s][A
Training:  27%|██▋       | 25/91 [00:04<00:11,  5.53it/s][A
Training:  31%|███       | 28/91 [00:04<00:08,  7.61it/s][A
Training:  33%|███▎      | 30/91 [00:05<00:10,  5.70it/s][A
Training:  36%|███▋      | 33/91 [00:06<00:11,  5.19it/s][A
Training:  41%|████      | 37/91 [00:06<00:09,  5.63it/s][A
Training:  45%|████▌     | 41/91 [00

Epoch: 13/93 - Loss: 0.1813 - Accuracy: 0.9318



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:00<00:10,  1.03it/s][A
 42%|████▏     | 5/12 [00:01<00:01,  3.53it/s][A
100%|██████████| 12/12 [00:02<00:00,  5.15it/s][A
Epochs:  14%|█▍        | 13/93 [03:55<24:03, 18.04s/it]

Val Loss: 0.2083 - Val Accuracy: 0.9106



Training:   0%|          | 0/91 [00:00<?, ?it/s][A
Training:   1%|          | 1/91 [00:00<01:25,  1.05it/s][A
Training:   4%|▍         | 4/91 [00:01<00:18,  4.62it/s][A
Training:   7%|▋         | 6/91 [00:01<00:22,  3.76it/s][A
Training:  10%|▉         | 9/91 [00:02<00:20,  4.09it/s][A
Training:  13%|█▎        | 12/91 [00:02<00:12,  6.22it/s][A
Training:  15%|█▌        | 14/91 [00:03<00:15,  4.94it/s][A
Training:  19%|█▊        | 17/91 [00:03<00:15,  4.91it/s][A
Training:  23%|██▎       | 21/91 [00:04<00:12,  5.40it/s][A
Training:  27%|██▋       | 25/91 [00:04<00:11,  5.86it/s][A
Training:  31%|███       | 28/91 [00:05<00:08,  7.56it/s][A
Training:  33%|███▎      | 30/91 [00:05<00:10,  5.97it/s][A
Training:  35%|███▌      | 32/91 [00:05<00:08,  7.01it/s][A
Training:  37%|███▋      | 34/91 [00:06<00:10,  5.67it/s][A
Training:  40%|███▉      | 36/91 [00:06<00:07,  6.88it/s][A
Training:  42%|████▏     | 38/91 [00:07<00:09,  5.62it/s][A
Training:  43%|████▎     | 39/91 [00

Epoch: 14/93 - Loss: 0.1797 - Accuracy: 0.9323



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:00<00:10,  1.06it/s][A
 42%|████▏     | 5/12 [00:01<00:02,  3.49it/s][A
 67%|██████▋   | 8/12 [00:01<00:00,  5.72it/s][A
100%|██████████| 12/12 [00:02<00:00,  4.99it/s][A
Epochs:  15%|█▌        | 14/93 [04:13<23:50, 18.11s/it]

Val Loss: 0.2097 - Val Accuracy: 0.9128



Training:   0%|          | 0/91 [00:00<?, ?it/s][A
Training:   1%|          | 1/91 [00:00<01:26,  1.05it/s][A
Training:   4%|▍         | 4/91 [00:01<00:19,  4.46it/s][A
Training:   7%|▋         | 6/91 [00:01<00:21,  4.04it/s][A
Training:   9%|▉         | 8/91 [00:01<00:14,  5.65it/s][A
Training:  11%|█         | 10/91 [00:02<00:16,  4.84it/s][A
Training:  13%|█▎        | 12/91 [00:02<00:12,  6.16it/s][A
Training:  15%|█▌        | 14/91 [00:03<00:15,  5.05it/s][A
Training:  18%|█▊        | 16/91 [00:03<00:12,  5.90it/s][A
Training:  19%|█▊        | 17/91 [00:03<00:15,  4.77it/s][A
Training:  21%|██        | 19/91 [00:03<00:11,  6.43it/s][A
Training:  23%|██▎       | 21/91 [00:04<00:14,  5.00it/s][A
Training:  25%|██▌       | 23/91 [00:04<00:10,  6.57it/s][A
Training:  27%|██▋       | 25/91 [00:04<00:12,  5.43it/s][A
Training:  29%|██▊       | 26/91 [00:05<00:11,  5.60it/s][A
Training:  31%|███       | 28/91 [00:05<00:10,  5.80it/s][A
Training:  32%|███▏      | 29/91 [00

Epoch: 15/93 - Loss: 0.1798 - Accuracy: 0.9326



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:00<00:09,  1.15it/s][A
 25%|██▌       | 3/12 [00:00<00:02,  3.72it/s][A
 42%|████▏     | 5/12 [00:01<00:02,  3.49it/s][A
 75%|███████▌  | 9/12 [00:02<00:00,  4.77it/s][A
100%|██████████| 12/12 [00:02<00:00,  4.94it/s][A
Epochs:  16%|█▌        | 15/93 [04:31<23:35, 18.15s/it]

Val Loss: 0.2080 - Val Accuracy: 0.9117



Training:   0%|          | 0/91 [00:00<?, ?it/s][A
Training:   1%|          | 1/91 [00:00<01:23,  1.08it/s][A
Training:   4%|▍         | 4/91 [00:01<00:18,  4.80it/s][A
Training:   7%|▋         | 6/91 [00:01<00:21,  3.89it/s][A
Training:  10%|▉         | 9/91 [00:02<00:19,  4.28it/s][A
Training:  14%|█▍        | 13/91 [00:02<00:15,  4.96it/s][A
Training:  19%|█▊        | 17/91 [00:03<00:14,  5.27it/s][A
Training:  23%|██▎       | 21/91 [00:04<00:12,  5.62it/s][A
Training:  27%|██▋       | 25/91 [00:04<00:11,  5.99it/s][A
Training:  30%|██▉       | 27/91 [00:05<00:09,  6.88it/s][A
Training:  32%|███▏      | 29/91 [00:05<00:10,  5.73it/s][A
Training:  35%|███▌      | 32/91 [00:05<00:07,  7.66it/s][A
Training:  37%|███▋      | 34/91 [00:06<00:09,  5.78it/s][A
Training:  41%|████      | 37/91 [00:06<00:09,  5.52it/s][A
Training:  44%|████▍     | 40/91 [00:06<00:06,  7.44it/s][A
Training:  46%|████▌     | 42/91 [00:07<00:08,  5.77it/s][A
Training:  49%|████▉     | 45/91 [00

Epoch: 16/93 - Loss: 0.1795 - Accuracy: 0.9325



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:00<00:10,  1.02it/s][A
 42%|████▏     | 5/12 [00:01<00:01,  3.55it/s][A
100%|██████████| 12/12 [00:02<00:00,  5.08it/s][A
Epochs:  17%|█▋        | 16/93 [04:49<23:16, 18.14s/it]

Val Loss: 0.2105 - Val Accuracy: 0.9117



Training:   0%|          | 0/91 [00:00<?, ?it/s][A
Training:   1%|          | 1/91 [00:00<01:20,  1.11it/s][A
Training:   3%|▎         | 3/91 [00:01<00:24,  3.54it/s][A
Training:   5%|▌         | 5/91 [00:01<00:21,  3.94it/s][A
Training:   7%|▋         | 6/91 [00:01<00:18,  4.64it/s][A
Training:   8%|▊         | 7/91 [00:01<00:16,  5.21it/s][A
Training:  10%|▉         | 9/91 [00:02<00:17,  4.79it/s][A
Training:  11%|█         | 10/91 [00:02<00:15,  5.14it/s][A
Training:  14%|█▍        | 13/91 [00:02<00:14,  5.26it/s][A
Training:  16%|█▋        | 15/91 [00:03<00:11,  6.67it/s][A
Training:  19%|█▊        | 17/91 [00:03<00:14,  5.26it/s][A
Training:  21%|██        | 19/91 [00:03<00:10,  6.69it/s][A
Training:  23%|██▎       | 21/91 [00:04<00:12,  5.70it/s][A
Training:  25%|██▌       | 23/91 [00:04<00:10,  6.70it/s][A
Training:  27%|██▋       | 25/91 [00:04<00:11,  5.88it/s][A
Training:  30%|██▉       | 27/91 [00:04<00:08,  7.15it/s][A
Training:  32%|███▏      | 29/91 [00:0

Epoch: 17/93 - Loss: 0.1789 - Accuracy: 0.9334



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:00<00:10,  1.04it/s][A
 42%|████▏     | 5/12 [00:01<00:02,  3.48it/s][A
 67%|██████▋   | 8/12 [00:01<00:00,  5.97it/s][A
100%|██████████| 12/12 [00:02<00:00,  5.05it/s][A
Epochs:  18%|█▊        | 17/93 [05:07<22:56, 18.11s/it]

Val Loss: 0.2104 - Val Accuracy: 0.9106



Training:   0%|          | 0/91 [00:00<?, ?it/s][A
Training:   1%|          | 1/91 [00:00<01:25,  1.05it/s][A
Training:   4%|▍         | 4/91 [00:01<00:18,  4.80it/s][A
Training:   7%|▋         | 6/91 [00:01<00:21,  3.95it/s][A
Training:  10%|▉         | 9/91 [00:02<00:19,  4.22it/s][A
Training:  14%|█▍        | 13/91 [00:03<00:15,  4.89it/s][A
Training:  19%|█▊        | 17/91 [00:03<00:14,  5.25it/s][A
Training:  20%|█▉        | 18/91 [00:03<00:13,  5.58it/s][A
Training:  23%|██▎       | 21/91 [00:04<00:13,  5.35it/s][A
Training:  27%|██▋       | 25/91 [00:04<00:11,  5.87it/s][A
Training:  29%|██▊       | 26/91 [00:05<00:10,  6.13it/s][A
Training:  32%|███▏      | 29/91 [00:05<00:10,  5.82it/s][A
Training:  33%|███▎      | 30/91 [00:05<00:09,  6.14it/s][A
Training:  36%|███▋      | 33/91 [00:06<00:10,  5.70it/s][A
Training:  38%|███▊      | 35/91 [00:06<00:08,  6.91it/s][A
Training:  41%|████      | 37/91 [00:06<00:09,  5.74it/s][A
Training:  45%|████▌     | 41/91 [00

Epoch: 18/93 - Loss: 0.1790 - Accuracy: 0.9321



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:00<00:10,  1.09it/s][A
 33%|███▎      | 4/12 [00:01<00:01,  4.94it/s][A
 50%|█████     | 6/12 [00:01<00:01,  4.24it/s][A
 67%|██████▋   | 8/12 [00:01<00:00,  5.97it/s][A
100%|██████████| 12/12 [00:02<00:00,  5.04it/s][A
Epochs:  19%|█▉        | 18/93 [05:25<22:35, 18.08s/it]

Val Loss: 0.2097 - Val Accuracy: 0.9128



Training:   0%|          | 0/91 [00:00<?, ?it/s][A
Training:   1%|          | 1/91 [00:00<01:19,  1.13it/s][A
Training:   3%|▎         | 3/91 [00:01<00:24,  3.62it/s][A
Training:   5%|▌         | 5/91 [00:01<00:23,  3.59it/s][A
Training:   8%|▊         | 7/91 [00:01<00:15,  5.25it/s][A
Training:  10%|▉         | 9/91 [00:02<00:17,  4.81it/s][A
Training:  11%|█         | 10/91 [00:02<00:15,  5.07it/s][A
Training:  14%|█▍        | 13/91 [00:02<00:15,  5.17it/s][A
Training:  15%|█▌        | 14/91 [00:03<00:14,  5.34it/s][A
Training:  19%|█▊        | 17/91 [00:03<00:13,  5.43it/s][A
Training:  20%|█▉        | 18/91 [00:03<00:13,  5.56it/s][A
Training:  23%|██▎       | 21/91 [00:04<00:12,  5.83it/s][A
Training:  24%|██▍       | 22/91 [00:04<00:11,  6.03it/s][A
Training:  27%|██▋       | 25/91 [00:05<00:11,  5.53it/s][A
Training:  32%|███▏      | 29/91 [00:05<00:11,  5.44it/s][A
Training:  36%|███▋      | 33/91 [00:06<00:09,  5.87it/s][A
Training:  41%|████      | 37/91 [00:

Epoch: 19/93 - Loss: 0.1780 - Accuracy: 0.9332



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:00<00:09,  1.11it/s][A
 25%|██▌       | 3/12 [00:01<00:02,  3.66it/s][A
 42%|████▏     | 5/12 [00:01<00:01,  3.51it/s][A
 58%|█████▊    | 7/12 [00:01<00:00,  5.36it/s][A
100%|██████████| 12/12 [00:02<00:00,  5.04it/s][A
Epochs:  20%|██        | 19/93 [05:43<22:19, 18.10s/it]

Val Loss: 0.2098 - Val Accuracy: 0.9117



Training:   0%|          | 0/91 [00:00<?, ?it/s][A
Training:   1%|          | 1/91 [00:00<01:28,  1.02it/s][A
Training:   5%|▌         | 5/91 [00:01<00:24,  3.44it/s][A
Training:   8%|▊         | 7/91 [00:01<00:17,  4.90it/s][A
Training:  10%|▉         | 9/91 [00:02<00:18,  4.43it/s][A
Training:  12%|█▏        | 11/91 [00:02<00:13,  5.80it/s][A
Training:  14%|█▍        | 13/91 [00:02<00:15,  4.89it/s][A
Training:  16%|█▋        | 15/91 [00:03<00:11,  6.40it/s][A
Training:  19%|█▊        | 17/91 [00:03<00:14,  5.06it/s][A
Training:  23%|██▎       | 21/91 [00:04<00:12,  5.56it/s][A
Training:  27%|██▋       | 25/91 [00:04<00:11,  5.83it/s][A
Training:  30%|██▉       | 27/91 [00:05<00:09,  6.80it/s][A
Training:  32%|███▏      | 29/91 [00:05<00:11,  5.47it/s][A
Training:  33%|███▎      | 30/91 [00:05<00:10,  5.81it/s][A
Training:  36%|███▋      | 33/91 [00:06<00:10,  5.58it/s][A
Training:  37%|███▋      | 34/91 [00:06<00:09,  5.84it/s][A
Training:  41%|████      | 37/91 [00

Epoch: 20/93 - Loss: 0.1778 - Accuracy: 0.9333



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:00<00:09,  1.11it/s][A
 33%|███▎      | 4/12 [00:01<00:01,  5.05it/s][A
 50%|█████     | 6/12 [00:01<00:01,  4.23it/s][A
100%|██████████| 12/12 [00:02<00:00,  5.22it/s][A
Epochs:  22%|██▏       | 20/93 [06:01<21:59, 18.08s/it]

Val Loss: 0.2090 - Val Accuracy: 0.9085



Training:   0%|          | 0/91 [00:00<?, ?it/s][A
Training:   1%|          | 1/91 [00:00<01:21,  1.10it/s][A
Training:   5%|▌         | 5/91 [00:01<00:24,  3.47it/s][A
Training:  10%|▉         | 9/91 [00:02<00:18,  4.38it/s][A
Training:  14%|█▍        | 13/91 [00:03<00:15,  4.88it/s][A
Training:  19%|█▊        | 17/91 [00:03<00:13,  5.29it/s][A
Training:  22%|██▏       | 20/91 [00:03<00:10,  6.95it/s][A
Training:  24%|██▍       | 22/91 [00:04<00:12,  5.64it/s][A
Training:  27%|██▋       | 25/91 [00:04<00:11,  5.55it/s][A
Training:  30%|██▉       | 27/91 [00:05<00:09,  6.67it/s][A
Training:  32%|███▏      | 29/91 [00:05<00:11,  5.41it/s][A
Training:  36%|███▋      | 33/91 [00:06<00:10,  5.57it/s][A
Training:  37%|███▋      | 34/91 [00:06<00:09,  5.90it/s][A
Training:  41%|████      | 37/91 [00:07<00:09,  5.63it/s][A
Training:  45%|████▌     | 41/91 [00:07<00:08,  5.81it/s][A
Training:  49%|████▉     | 45/91 [00:08<00:07,  5.87it/s][A
Training:  54%|█████▍    | 49/91 [0

Epoch: 21/93 - Loss: 0.1776 - Accuracy: 0.9328



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:00<00:09,  1.10it/s][A
 42%|████▏     | 5/12 [00:01<00:01,  3.50it/s][A
100%|██████████| 12/12 [00:02<00:00,  4.98it/s][A
Epochs:  23%|██▎       | 21/93 [06:20<21:44, 18.12s/it]

Val Loss: 0.2107 - Val Accuracy: 0.9101



Training:   0%|          | 0/91 [00:00<?, ?it/s][A
Training:   1%|          | 1/91 [00:00<01:27,  1.02it/s][A
Training:   4%|▍         | 4/91 [00:01<00:18,  4.69it/s][A
Training:   7%|▋         | 6/91 [00:01<00:22,  3.82it/s][A
Training:  10%|▉         | 9/91 [00:02<00:19,  4.28it/s][A
Training:  14%|█▍        | 13/91 [00:03<00:16,  4.84it/s][A
Training:  19%|█▊        | 17/91 [00:03<00:14,  5.22it/s][A
Training:  22%|██▏       | 20/91 [00:03<00:10,  6.96it/s][A
Training:  24%|██▍       | 22/91 [00:04<00:12,  5.65it/s][A
Training:  27%|██▋       | 25/91 [00:05<00:12,  5.41it/s][A
Training:  32%|███▏      | 29/91 [00:05<00:10,  5.68it/s][A
Training:  36%|███▋      | 33/91 [00:06<00:09,  5.85it/s][A
Training:  41%|████      | 37/91 [00:06<00:08,  6.24it/s][A
Training:  44%|████▍     | 40/91 [00:07<00:06,  7.66it/s][A
Training:  46%|████▌     | 42/91 [00:07<00:08,  5.86it/s][A
Training:  49%|████▉     | 45/91 [00:08<00:08,  5.68it/s][A
Training:  51%|█████     | 46/91 [00

Epoch: 22/93 - Loss: 0.1780 - Accuracy: 0.9332



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:00<00:09,  1.11it/s][A
 42%|████▏     | 5/12 [00:01<00:01,  3.58it/s][A
 67%|██████▋   | 8/12 [00:01<00:00,  6.17it/s][A
100%|██████████| 12/12 [00:02<00:00,  5.06it/s][A
Epochs:  24%|██▎       | 22/93 [06:38<21:23, 18.08s/it]

Val Loss: 0.2110 - Val Accuracy: 0.9123



Training:   0%|          | 0/91 [00:00<?, ?it/s][A
Training:   1%|          | 1/91 [00:00<01:14,  1.22it/s][A
Training:   2%|▏         | 2/91 [00:00<00:36,  2.43it/s][A
Training:   5%|▌         | 5/91 [00:01<00:21,  4.00it/s][A
Training:   9%|▉         | 8/91 [00:01<00:13,  6.24it/s][A
Training:  10%|▉         | 9/91 [00:02<00:17,  4.57it/s][A
Training:  13%|█▎        | 12/91 [00:02<00:12,  6.43it/s][A
Training:  14%|█▍        | 13/91 [00:02<00:15,  4.88it/s][A
Training:  18%|█▊        | 16/91 [00:03<00:11,  6.56it/s][A
Training:  19%|█▊        | 17/91 [00:03<00:15,  4.92it/s][A
Training:  22%|██▏       | 20/91 [00:03<00:10,  6.70it/s][A
Training:  23%|██▎       | 21/91 [00:04<00:13,  5.25it/s][A
Training:  26%|██▋       | 24/91 [00:04<00:09,  7.19it/s][A
Training:  27%|██▋       | 25/91 [00:04<00:12,  5.26it/s][A
Training:  30%|██▉       | 27/91 [00:04<00:09,  6.79it/s][A
Training:  32%|███▏      | 29/91 [00:05<00:12,  5.16it/s][A
Training:  34%|███▍      | 31/91 [00:

Epoch: 23/93 - Loss: 0.1770 - Accuracy: 0.9337



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:00<00:10,  1.05it/s][A
 42%|████▏     | 5/12 [00:01<00:02,  3.42it/s][A
100%|██████████| 12/12 [00:02<00:00,  4.91it/s][A
Epochs:  25%|██▍       | 23/93 [06:56<21:04, 18.06s/it]

Val Loss: 0.2115 - Val Accuracy: 0.9106



Training:   0%|          | 0/91 [00:00<?, ?it/s][A
Training:   1%|          | 1/91 [00:01<01:32,  1.03s/it][A
Training:   5%|▌         | 5/91 [00:01<00:24,  3.49it/s][A
Training:  10%|▉         | 9/91 [00:02<00:18,  4.54it/s][A
Training:  14%|█▍        | 13/91 [00:02<00:15,  5.17it/s][A
Training:  16%|█▋        | 15/91 [00:03<00:12,  6.22it/s][A
Training:  19%|█▊        | 17/91 [00:03<00:13,  5.29it/s][A
Training:  22%|██▏       | 20/91 [00:03<00:09,  7.16it/s][A
Training:  24%|██▍       | 22/91 [00:04<00:12,  5.58it/s][A
Training:  27%|██▋       | 25/91 [00:05<00:12,  5.08it/s][A
Training:  32%|███▏      | 29/91 [00:05<00:11,  5.31it/s][A
Training:  36%|███▋      | 33/91 [00:06<00:10,  5.60it/s][A
Training:  41%|████      | 37/91 [00:06<00:08,  6.01it/s][A
Training:  45%|████▌     | 41/91 [00:07<00:08,  6.10it/s][A
Training:  49%|████▉     | 45/91 [00:08<00:07,  6.16it/s][A
Training:  54%|█████▍    | 49/91 [00:08<00:06,  6.11it/s][A
Training:  58%|█████▊    | 53/91 [0

Epoch: 24/93 - Loss: 0.1771 - Accuracy: 0.9338



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:00<00:09,  1.11it/s][A
 42%|████▏     | 5/12 [00:01<00:01,  3.52it/s][A
100%|██████████| 12/12 [00:02<00:00,  5.20it/s][A
Epochs:  26%|██▌       | 24/93 [07:14<20:43, 18.02s/it]

Val Loss: 0.2168 - Val Accuracy: 0.9117



Training:   0%|          | 0/91 [00:00<?, ?it/s][A
Training:   1%|          | 1/91 [00:00<01:27,  1.03it/s][A
Training:   5%|▌         | 5/91 [00:01<00:24,  3.56it/s][A
Training:   8%|▊         | 7/91 [00:01<00:16,  5.04it/s][A
Training:  10%|▉         | 9/91 [00:02<00:18,  4.46it/s][A
Training:  12%|█▏        | 11/91 [00:02<00:13,  6.01it/s][A
Training:  14%|█▍        | 13/91 [00:03<00:16,  4.65it/s][A
Training:  18%|█▊        | 16/91 [00:03<00:10,  6.98it/s][A
Training:  20%|█▉        | 18/91 [00:03<00:13,  5.27it/s][A
Training:  23%|██▎       | 21/91 [00:04<00:13,  5.18it/s][A
Training:  26%|██▋       | 24/91 [00:04<00:09,  7.03it/s][A
Training:  29%|██▊       | 26/91 [00:05<00:11,  5.75it/s][A
Training:  32%|███▏      | 29/91 [00:05<00:11,  5.40it/s][A
Training:  35%|███▌      | 32/91 [00:05<00:08,  7.27it/s][A
Training:  37%|███▋      | 34/91 [00:06<00:10,  5.60it/s][A
Training:  41%|████      | 37/91 [00:07<00:10,  5.35it/s][A
Training:  45%|████▌     | 41/91 [00

Epoch: 25/93 - Loss: 0.1777 - Accuracy: 0.9341



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:00<00:10,  1.02it/s][A
 42%|████▏     | 5/12 [00:01<00:01,  3.57it/s][A
100%|██████████| 12/12 [00:02<00:00,  5.01it/s][A
Epochs:  27%|██▋       | 25/93 [07:32<20:26, 18.03s/it]

Val Loss: 0.2128 - Val Accuracy: 0.9123



Training:   0%|          | 0/91 [00:00<?, ?it/s][A
Training:   1%|          | 1/91 [00:00<01:28,  1.01it/s][A
Training:   5%|▌         | 5/91 [00:01<00:24,  3.54it/s][A
Training:   9%|▉         | 8/91 [00:01<00:13,  6.09it/s][A
Training:  11%|█         | 10/91 [00:02<00:17,  4.65it/s][A
Training:  14%|█▍        | 13/91 [00:03<00:16,  4.66it/s][A
Training:  19%|█▊        | 17/91 [00:03<00:14,  5.19it/s][A
Training:  23%|██▎       | 21/91 [00:04<00:12,  5.62it/s][A
Training:  27%|██▋       | 25/91 [00:05<00:11,  5.64it/s][A
Training:  31%|███       | 28/91 [00:05<00:08,  7.13it/s][A
Training:  33%|███▎      | 30/91 [00:05<00:10,  5.81it/s][A
Training:  36%|███▋      | 33/91 [00:06<00:10,  5.58it/s][A
Training:  41%|████      | 37/91 [00:06<00:09,  5.96it/s][A
Training:  42%|████▏     | 38/91 [00:07<00:08,  6.04it/s][A
Training:  44%|████▍     | 40/91 [00:07<00:07,  7.24it/s][A
Training:  46%|████▌     | 42/91 [00:07<00:08,  5.94it/s][A
Training:  47%|████▋     | 43/91 [0

Epoch: 26/93 - Loss: 0.1771 - Accuracy: 0.9333



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:00<00:10,  1.06it/s][A
 42%|████▏     | 5/12 [00:01<00:02,  3.50it/s][A
 75%|███████▌  | 9/12 [00:02<00:00,  4.63it/s][A
100%|██████████| 12/12 [00:02<00:00,  4.79it/s][A
Epochs:  28%|██▊       | 26/93 [07:50<20:11, 18.08s/it]

Val Loss: 0.2114 - Val Accuracy: 0.9095



Training:   0%|          | 0/91 [00:00<?, ?it/s][A
Training:   1%|          | 1/91 [00:00<01:23,  1.08it/s][A
Training:   4%|▍         | 4/91 [00:01<00:18,  4.82it/s][A
Training:   7%|▋         | 6/91 [00:01<00:20,  4.11it/s][A
Training:  10%|▉         | 9/91 [00:02<00:18,  4.52it/s][A
Training:  12%|█▏        | 11/91 [00:02<00:13,  5.95it/s][A
Training:  14%|█▍        | 13/91 [00:02<00:15,  4.91it/s][A
Training:  15%|█▌        | 14/91 [00:03<00:15,  5.02it/s][A
Training:  19%|█▊        | 17/91 [00:03<00:13,  5.40it/s][A
Training:  20%|█▉        | 18/91 [00:03<00:12,  5.69it/s][A
Training:  23%|██▎       | 21/91 [00:04<00:12,  5.83it/s][A
Training:  24%|██▍       | 22/91 [00:04<00:11,  5.88it/s][A
Training:  27%|██▋       | 25/91 [00:04<00:10,  6.13it/s][A
Training:  29%|██▊       | 26/91 [00:05<00:11,  5.65it/s][A
Training:  32%|███▏      | 29/91 [00:05<00:10,  5.84it/s][A
Training:  33%|███▎      | 30/91 [00:05<00:10,  5.82it/s][A
Training:  36%|███▋      | 33/91 [00

Epoch: 27/93 - Loss: 0.1771 - Accuracy: 0.9332



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:00<00:10,  1.07it/s][A
 42%|████▏     | 5/12 [00:01<00:02,  3.45it/s][A
100%|██████████| 12/12 [00:02<00:00,  5.04it/s][A
Epochs:  29%|██▉       | 27/93 [08:08<20:00, 18.18s/it]

Val Loss: 0.2127 - Val Accuracy: 0.9101



Training:   0%|          | 0/91 [00:00<?, ?it/s][A
Training:   1%|          | 1/91 [00:00<01:23,  1.08it/s][A
Training:   4%|▍         | 4/91 [00:01<00:17,  4.90it/s][A
Training:   7%|▋         | 6/91 [00:01<00:22,  3.72it/s][A
Training:  10%|▉         | 9/91 [00:02<00:18,  4.45it/s][A
Training:  12%|█▏        | 11/91 [00:02<00:13,  5.77it/s][A
Training:  14%|█▍        | 13/91 [00:02<00:16,  4.78it/s][A
Training:  15%|█▌        | 14/91 [00:03<00:14,  5.24it/s][A
Training:  19%|█▊        | 17/91 [00:03<00:13,  5.48it/s][A
Training:  20%|█▉        | 18/91 [00:03<00:12,  5.76it/s][A
Training:  23%|██▎       | 21/91 [00:04<00:13,  5.18it/s][A
Training:  26%|██▋       | 24/91 [00:04<00:08,  7.49it/s][A
Training:  29%|██▊       | 26/91 [00:05<00:11,  5.62it/s][A
Training:  32%|███▏      | 29/91 [00:05<00:11,  5.24it/s][A
Training:  36%|███▋      | 33/91 [00:06<00:10,  5.76it/s][A
Training:  38%|███▊      | 35/91 [00:06<00:08,  6.84it/s][A
Training:  41%|████      | 37/91 [00

Epoch: 28/93 - Loss: 0.1768 - Accuracy: 0.9341



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:00<00:10,  1.02it/s][A
 42%|████▏     | 5/12 [00:01<00:02,  3.31it/s][A
100%|██████████| 12/12 [00:02<00:00,  4.90it/s][A
Epochs:  30%|███       | 28/93 [08:26<19:40, 18.17s/it]

Val Loss: 0.2138 - Val Accuracy: 0.9096



Training:   0%|          | 0/91 [00:00<?, ?it/s][A
Training:   1%|          | 1/91 [00:01<01:30,  1.01s/it][A
Training:   3%|▎         | 3/91 [00:01<00:27,  3.21it/s][A
Training:   5%|▌         | 5/91 [00:01<00:25,  3.43it/s][A
Training:  10%|▉         | 9/91 [00:02<00:18,  4.54it/s][A
Training:  13%|█▎        | 12/91 [00:02<00:11,  6.75it/s][A
Training:  15%|█▌        | 14/91 [00:03<00:15,  4.97it/s][A
Training:  18%|█▊        | 16/91 [00:03<00:12,  6.22it/s][A
Training:  20%|█▉        | 18/91 [00:03<00:13,  5.34it/s][A
Training:  21%|██        | 19/91 [00:03<00:12,  5.77it/s][A
Training:  23%|██▎       | 21/91 [00:04<00:14,  4.86it/s][A
Training:  25%|██▌       | 23/91 [00:04<00:11,  5.94it/s][A
Training:  27%|██▋       | 25/91 [00:05<00:12,  5.10it/s][A
Training:  30%|██▉       | 27/91 [00:05<00:10,  6.02it/s][A
Training:  32%|███▏      | 29/91 [00:05<00:11,  5.37it/s][A
Training:  34%|███▍      | 31/91 [00:05<00:09,  6.27it/s][A
Training:  36%|███▋      | 33/91 [00

Epoch: 29/93 - Loss: 0.1768 - Accuracy: 0.9340



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:00<00:10,  1.08it/s][A
 33%|███▎      | 4/12 [00:01<00:01,  4.86it/s][A
 50%|█████     | 6/12 [00:01<00:01,  4.19it/s][A
 67%|██████▋   | 8/12 [00:01<00:00,  5.97it/s][A
 83%|████████▎ | 10/12 [00:02<00:00,  4.88it/s][A
100%|██████████| 12/12 [00:02<00:00,  4.92it/s][A
Epochs:  31%|███       | 29/93 [08:45<19:26, 18.22s/it]

Val Loss: 0.2139 - Val Accuracy: 0.9112



Training:   0%|          | 0/91 [00:00<?, ?it/s][A
Training:   1%|          | 1/91 [00:00<01:22,  1.09it/s][A
Training:   3%|▎         | 3/91 [00:01<00:24,  3.58it/s][A
Training:   5%|▌         | 5/91 [00:01<00:25,  3.41it/s][A
Training:  10%|▉         | 9/91 [00:02<00:18,  4.52it/s][A
Training:  12%|█▏        | 11/91 [00:02<00:13,  5.87it/s][A
Training:  14%|█▍        | 13/91 [00:03<00:16,  4.83it/s][A
Training:  15%|█▌        | 14/91 [00:03<00:14,  5.27it/s][A
Training:  19%|█▊        | 17/91 [00:03<00:13,  5.43it/s][A
Training:  21%|██        | 19/91 [00:03<00:10,  6.75it/s][A
Training:  23%|██▎       | 21/91 [00:04<00:12,  5.53it/s][A
Training:  24%|██▍       | 22/91 [00:04<00:11,  5.88it/s][A
Training:  27%|██▋       | 25/91 [00:04<00:11,  5.62it/s][A
Training:  30%|██▉       | 27/91 [00:05<00:09,  6.97it/s][A
Training:  32%|███▏      | 29/91 [00:05<00:11,  5.54it/s][A
Training:  35%|███▌      | 32/91 [00:05<00:07,  7.96it/s][A
Training:  37%|███▋      | 34/91 [00

Epoch: 30/93 - Loss: 0.1766 - Accuracy: 0.9336



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:00<00:09,  1.10it/s][A
 42%|████▏     | 5/12 [00:01<00:02,  3.48it/s][A
100%|██████████| 12/12 [00:02<00:00,  4.95it/s][A
Epochs:  32%|███▏      | 30/93 [09:03<19:06, 18.20s/it]

Val Loss: 0.2150 - Val Accuracy: 0.9085



Training:   0%|          | 0/91 [00:00<?, ?it/s][A
Training:   1%|          | 1/91 [00:00<01:20,  1.12it/s][A
Training:   4%|▍         | 4/91 [00:01<00:17,  5.02it/s][A
Training:   7%|▋         | 6/91 [00:01<00:21,  3.96it/s][A
Training:  10%|▉         | 9/91 [00:02<00:18,  4.34it/s][A
Training:  12%|█▏        | 11/91 [00:02<00:14,  5.61it/s][A
Training:  14%|█▍        | 13/91 [00:02<00:16,  4.84it/s][A
Training:  18%|█▊        | 16/91 [00:03<00:10,  7.20it/s][A
Training:  20%|█▉        | 18/91 [00:03<00:12,  5.70it/s][A
Training:  23%|██▎       | 21/91 [00:04<00:13,  5.34it/s][A
Training:  24%|██▍       | 22/91 [00:04<00:12,  5.57it/s][A
Training:  27%|██▋       | 25/91 [00:04<00:11,  5.62it/s][A
Training:  29%|██▊       | 26/91 [00:04<00:10,  6.02it/s][A
Training:  32%|███▏      | 29/91 [00:05<00:11,  5.60it/s][A
Training:  35%|███▌      | 32/91 [00:05<00:07,  7.90it/s][A
Training:  37%|███▋      | 34/91 [00:06<00:10,  5.64it/s][A
Training:  41%|████      | 37/91 [00

Epoch: 31/93 - Loss: 0.1764 - Accuracy: 0.9351



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:00<00:10,  1.09it/s][A
 42%|████▏     | 5/12 [00:01<00:01,  3.66it/s][A
 58%|█████▊    | 7/12 [00:01<00:01,  4.97it/s][A
 75%|███████▌  | 9/12 [00:02<00:00,  4.53it/s][A
100%|██████████| 12/12 [00:02<00:00,  4.92it/s][A
Epochs:  33%|███▎      | 31/93 [09:21<18:48, 18.20s/it]

Val Loss: 0.2161 - Val Accuracy: 0.9096



Training:   0%|          | 0/91 [00:00<?, ?it/s][A
Training:   1%|          | 1/91 [00:00<01:22,  1.09it/s][A
Training:   5%|▌         | 5/91 [00:01<00:23,  3.62it/s][A
Training:   8%|▊         | 7/91 [00:01<00:16,  5.14it/s][A
Training:  10%|▉         | 9/91 [00:02<00:18,  4.53it/s][A
Training:  12%|█▏        | 11/91 [00:02<00:13,  6.06it/s][A
Training:  14%|█▍        | 13/91 [00:02<00:15,  5.08it/s][A
Training:  16%|█▋        | 15/91 [00:03<00:11,  6.44it/s][A
Training:  19%|█▊        | 17/91 [00:03<00:13,  5.30it/s][A
Training:  20%|█▉        | 18/91 [00:03<00:12,  5.77it/s][A
Training:  23%|██▎       | 21/91 [00:04<00:13,  5.33it/s][A
Training:  27%|██▋       | 25/91 [00:04<00:12,  5.40it/s][A
Training:  32%|███▏      | 29/91 [00:05<00:10,  5.82it/s][A
Training:  36%|███▋      | 33/91 [00:06<00:09,  5.87it/s][A
Training:  41%|████      | 37/91 [00:06<00:09,  5.85it/s][A
Training:  45%|████▌     | 41/91 [00:07<00:08,  6.04it/s][A
Training:  48%|████▊     | 44/91 [00

Epoch: 32/93 - Loss: 0.1764 - Accuracy: 0.9341



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:11,  1.03s/it][A
 33%|███▎      | 4/12 [00:01<00:01,  4.49it/s][A
 50%|█████     | 6/12 [00:01<00:01,  4.19it/s][A
 67%|██████▋   | 8/12 [00:01<00:00,  5.77it/s][A
100%|██████████| 12/12 [00:02<00:00,  4.89it/s][A
Epochs:  34%|███▍      | 32/93 [09:39<18:30, 18.20s/it]

Val Loss: 0.2135 - Val Accuracy: 0.9079



Training:   0%|          | 0/91 [00:00<?, ?it/s][A
Training:   1%|          | 1/91 [00:00<01:26,  1.05it/s][A
Training:   4%|▍         | 4/91 [00:01<00:18,  4.77it/s][A
Training:   7%|▋         | 6/91 [00:01<00:21,  3.95it/s][A
Training:  10%|▉         | 9/91 [00:02<00:18,  4.45it/s][A
Training:  14%|█▍        | 13/91 [00:02<00:15,  5.15it/s][A
Training:  19%|█▊        | 17/91 [00:03<00:13,  5.50it/s][A
Training:  23%|██▎       | 21/91 [00:04<00:12,  5.74it/s][A
Training:  26%|██▋       | 24/91 [00:04<00:09,  7.19it/s][A
Training:  29%|██▊       | 26/91 [00:05<00:11,  5.61it/s][A
Training:  32%|███▏      | 29/91 [00:05<00:10,  5.91it/s][A
Training:  33%|███▎      | 30/91 [00:05<00:10,  5.75it/s][A
Training:  36%|███▋      | 33/91 [00:06<00:09,  6.23it/s][A
Training:  37%|███▋      | 34/91 [00:06<00:09,  5.73it/s][A
Training:  41%|████      | 37/91 [00:06<00:08,  6.28it/s][A
Training:  42%|████▏     | 38/91 [00:07<00:09,  5.61it/s][A
Training:  45%|████▌     | 41/91 [00

Epoch: 33/93 - Loss: 0.1766 - Accuracy: 0.9341



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:00<00:09,  1.13it/s][A
 17%|█▋        | 2/12 [00:01<00:04,  2.28it/s][A
 42%|████▏     | 5/12 [00:01<00:01,  4.08it/s][A
 50%|█████     | 6/12 [00:01<00:01,  4.72it/s][A
 75%|███████▌  | 9/12 [00:02<00:00,  4.99it/s][A
100%|██████████| 12/12 [00:02<00:00,  4.90it/s][A
Epochs:  35%|███▌      | 33/93 [09:57<18:09, 18.16s/it]

Val Loss: 0.2115 - Val Accuracy: 0.9101



Training:   0%|          | 0/91 [00:00<?, ?it/s][A
Training:   1%|          | 1/91 [00:00<01:24,  1.07it/s][A
Training:   5%|▌         | 5/91 [00:01<00:24,  3.51it/s][A
Training:   8%|▊         | 7/91 [00:01<00:16,  5.09it/s][A
Training:  10%|▉         | 9/91 [00:02<00:19,  4.22it/s][A
Training:  13%|█▎        | 12/91 [00:02<00:12,  6.57it/s][A
Training:  15%|█▌        | 14/91 [00:02<00:14,  5.48it/s][A
Training:  18%|█▊        | 16/91 [00:03<00:11,  6.80it/s][A
Training:  20%|█▉        | 18/91 [00:03<00:12,  5.67it/s][A
Training:  21%|██        | 19/91 [00:03<00:13,  5.52it/s][A
Training:  23%|██▎       | 21/91 [00:04<00:14,  4.91it/s][A
Training:  25%|██▌       | 23/91 [00:04<00:11,  5.90it/s][A
Training:  27%|██▋       | 25/91 [00:04<00:12,  5.28it/s][A
Training:  30%|██▉       | 27/91 [00:05<00:09,  6.47it/s][A
Training:  32%|███▏      | 29/91 [00:05<00:11,  5.42it/s][A
Training:  34%|███▍      | 31/91 [00:05<00:08,  6.95it/s][A
Training:  36%|███▋      | 33/91 [00

Epoch: 34/93 - Loss: 0.1764 - Accuracy: 0.9335



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:11,  1.01s/it][A
 42%|████▏     | 5/12 [00:01<00:02,  3.35it/s][A
100%|██████████| 12/12 [00:02<00:00,  4.79it/s][A
Epochs:  37%|███▋      | 34/93 [10:16<17:53, 18.19s/it]

Val Loss: 0.2134 - Val Accuracy: 0.9117



Training:   0%|          | 0/91 [00:00<?, ?it/s][A
Training:   1%|          | 1/91 [00:01<01:30,  1.01s/it][A
Training:   5%|▌         | 5/91 [00:01<00:25,  3.42it/s][A
Training:   8%|▊         | 7/91 [00:01<00:16,  4.98it/s][A
Training:  10%|▉         | 9/91 [00:02<00:18,  4.36it/s][A
Training:  12%|█▏        | 11/91 [00:02<00:13,  5.77it/s][A
Training:  14%|█▍        | 13/91 [00:02<00:15,  5.18it/s][A
Training:  16%|█▋        | 15/91 [00:03<00:11,  6.66it/s][A
Training:  19%|█▊        | 17/91 [00:03<00:14,  4.94it/s][A
Training:  23%|██▎       | 21/91 [00:04<00:13,  5.06it/s][A
Training:  27%|██▋       | 25/91 [00:05<00:12,  5.37it/s][A
Training:  32%|███▏      | 29/91 [00:05<00:10,  5.74it/s][A
Training:  35%|███▌      | 32/91 [00:05<00:08,  7.29it/s][A
Training:  37%|███▋      | 34/91 [00:06<00:10,  5.46it/s][A
Training:  41%|████      | 37/91 [00:07<00:10,  5.36it/s][A
Training:  45%|████▌     | 41/91 [00:07<00:09,  5.52it/s][A
Training:  49%|████▉     | 45/91 [00

Epoch: 35/93 - Loss: 0.1768 - Accuracy: 0.9342



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:00<00:10,  1.08it/s][A
 42%|████▏     | 5/12 [00:01<00:01,  3.57it/s][A
100%|██████████| 12/12 [00:02<00:00,  5.07it/s][A
Epochs:  38%|███▊      | 35/93 [10:34<17:36, 18.22s/it]

Val Loss: 0.2114 - Val Accuracy: 0.9117



Training:   0%|          | 0/91 [00:00<?, ?it/s][A
Training:   1%|          | 1/91 [00:00<01:18,  1.15it/s][A
Training:   2%|▏         | 2/91 [00:00<00:38,  2.31it/s][A
Training:   5%|▌         | 5/91 [00:01<00:22,  3.83it/s][A
Training:   9%|▉         | 8/91 [00:01<00:12,  6.73it/s][A
Training:  11%|█         | 10/91 [00:02<00:15,  5.33it/s][A
Training:  13%|█▎        | 12/91 [00:02<00:11,  6.70it/s][A
Training:  15%|█▌        | 14/91 [00:02<00:13,  5.70it/s][A
Training:  18%|█▊        | 16/91 [00:03<00:11,  6.34it/s][A
Training:  19%|█▊        | 17/91 [00:03<00:14,  5.00it/s][A
Training:  21%|██        | 19/91 [00:03<00:10,  6.59it/s][A
Training:  23%|██▎       | 21/91 [00:04<00:14,  4.98it/s][A
Training:  26%|██▋       | 24/91 [00:04<00:09,  6.89it/s][A
Training:  29%|██▊       | 26/91 [00:04<00:11,  5.80it/s][A
Training:  31%|███       | 28/91 [00:04<00:08,  7.23it/s][A
Training:  33%|███▎      | 30/91 [00:05<00:10,  5.83it/s][A
Training:  35%|███▌      | 32/91 [00

Epoch: 36/93 - Loss: 0.1762 - Accuracy: 0.9336



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:00<00:10,  1.10it/s][A
 42%|████▏     | 5/12 [00:01<00:01,  3.51it/s][A
100%|██████████| 12/12 [00:02<00:00,  5.10it/s][A
Epochs:  39%|███▊      | 36/93 [10:52<17:13, 18.13s/it]

Val Loss: 0.2144 - Val Accuracy: 0.9123



Training:   0%|          | 0/91 [00:00<?, ?it/s][A
Training:   1%|          | 1/91 [00:00<01:23,  1.07it/s][A
Training:   4%|▍         | 4/91 [00:01<00:18,  4.67it/s][A
Training:   7%|▋         | 6/91 [00:01<00:20,  4.05it/s][A
Training:  10%|▉         | 9/91 [00:02<00:19,  4.19it/s][A
Training:  13%|█▎        | 12/91 [00:02<00:12,  6.45it/s][A
Training:  15%|█▌        | 14/91 [00:02<00:13,  5.70it/s][A
Training:  19%|█▊        | 17/91 [00:03<00:14,  5.07it/s][A
Training:  23%|██▎       | 21/91 [00:04<00:12,  5.39it/s][A
Training:  27%|██▋       | 25/91 [00:04<00:11,  5.75it/s][A
Training:  32%|███▏      | 29/91 [00:05<00:10,  6.12it/s][A
Training:  36%|███▋      | 33/91 [00:06<00:10,  5.66it/s][A
Training:  40%|███▉      | 36/91 [00:06<00:07,  7.17it/s][A
Training:  42%|████▏     | 38/91 [00:06<00:09,  5.85it/s][A
Training:  45%|████▌     | 41/91 [00:07<00:09,  5.51it/s][A
Training:  48%|████▊     | 44/91 [00:07<00:06,  7.28it/s][A
Training:  51%|█████     | 46/91 [00

Epoch: 37/93 - Loss: 0.1762 - Accuracy: 0.9336



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:00<00:10,  1.07it/s][A
 42%|████▏     | 5/12 [00:01<00:01,  3.62it/s][A
100%|██████████| 12/12 [00:02<00:00,  4.97it/s][A
Epochs:  40%|███▉      | 37/93 [11:10<16:57, 18.17s/it]

Val Loss: 0.2143 - Val Accuracy: 0.9112



Training:   0%|          | 0/91 [00:00<?, ?it/s][A
Training:   1%|          | 1/91 [00:00<01:19,  1.14it/s][A
Training:   2%|▏         | 2/91 [00:00<00:38,  2.34it/s][A
Training:   5%|▌         | 5/91 [00:01<00:22,  3.90it/s][A
Training:   7%|▋         | 6/91 [00:01<00:19,  4.43it/s][A
Training:  10%|▉         | 9/91 [00:02<00:16,  4.86it/s][A
Training:  12%|█▏        | 11/91 [00:02<00:12,  6.38it/s][A
Training:  14%|█▍        | 13/91 [00:02<00:14,  5.31it/s][A
Training:  15%|█▌        | 14/91 [00:03<00:13,  5.63it/s][A
Training:  19%|█▊        | 17/91 [00:03<00:13,  5.52it/s][A
Training:  20%|█▉        | 18/91 [00:03<00:12,  5.83it/s][A
Training:  23%|██▎       | 21/91 [00:04<00:12,  5.61it/s][A
Training:  25%|██▌       | 23/91 [00:04<00:09,  7.06it/s][A
Training:  27%|██▋       | 25/91 [00:04<00:12,  5.47it/s][A
Training:  31%|███       | 28/91 [00:05<00:07,  7.95it/s][A
Training:  33%|███▎      | 30/91 [00:05<00:10,  5.86it/s][A
Training:  36%|███▋      | 33/91 [00:

Epoch: 38/93 - Loss: 0.1758 - Accuracy: 0.9340



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:00<00:09,  1.10it/s][A
 42%|████▏     | 5/12 [00:01<00:01,  3.57it/s][A
100%|██████████| 12/12 [00:02<00:00,  5.06it/s][A
Epochs:  41%|████      | 38/93 [11:28<16:34, 18.09s/it]

Val Loss: 0.2160 - Val Accuracy: 0.9117



Training:   0%|          | 0/91 [00:00<?, ?it/s][A
Training:   1%|          | 1/91 [00:00<01:27,  1.02it/s][A
Training:   4%|▍         | 4/91 [00:01<00:18,  4.68it/s][A
Training:   7%|▋         | 6/91 [00:01<00:21,  3.90it/s][A
Training:  10%|▉         | 9/91 [00:02<00:18,  4.33it/s][A
Training:  13%|█▎        | 12/91 [00:02<00:12,  6.49it/s][A
Training:  15%|█▌        | 14/91 [00:03<00:14,  5.28it/s][A
Training:  19%|█▊        | 17/91 [00:03<00:14,  5.25it/s][A
Training:  20%|█▉        | 18/91 [00:03<00:12,  5.63it/s][A
Training:  23%|██▎       | 21/91 [00:04<00:12,  5.41it/s][A
Training:  25%|██▌       | 23/91 [00:04<00:10,  6.34it/s][A
Training:  27%|██▋       | 25/91 [00:04<00:12,  5.31it/s][A
Training:  30%|██▉       | 27/91 [00:05<00:09,  6.47it/s][A
Training:  32%|███▏      | 29/91 [00:05<00:10,  5.87it/s][A
Training:  34%|███▍      | 31/91 [00:05<00:09,  6.60it/s][A
Training:  36%|███▋      | 33/91 [00:06<00:09,  5.87it/s][A
Training:  37%|███▋      | 34/91 [00

Epoch: 39/93 - Loss: 0.1760 - Accuracy: 0.9338



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:11,  1.00s/it][A
 42%|████▏     | 5/12 [00:01<00:02,  3.50it/s][A
100%|██████████| 12/12 [00:02<00:00,  4.99it/s][A
Epochs:  42%|████▏     | 39/93 [11:46<16:16, 18.08s/it]

Val Loss: 0.2121 - Val Accuracy: 0.9123



Training:   0%|          | 0/91 [00:00<?, ?it/s][A
Training:   1%|          | 1/91 [00:00<01:20,  1.11it/s][A
Training:   4%|▍         | 4/91 [00:01<00:17,  5.00it/s][A
Training:   7%|▋         | 6/91 [00:01<00:20,  4.07it/s][A
Training:  10%|▉         | 9/91 [00:02<00:18,  4.34it/s][A
Training:  13%|█▎        | 12/91 [00:02<00:12,  6.50it/s][A
Training:  15%|█▌        | 14/91 [00:02<00:14,  5.25it/s][A
Training:  19%|█▊        | 17/91 [00:03<00:15,  4.93it/s][A
Training:  23%|██▎       | 21/91 [00:04<00:13,  5.15it/s][A
Training:  27%|██▋       | 25/91 [00:05<00:11,  5.51it/s][A
Training:  32%|███▏      | 29/91 [00:05<00:10,  5.72it/s][A
Training:  36%|███▋      | 33/91 [00:06<00:09,  5.87it/s][A
Training:  40%|███▉      | 36/91 [00:06<00:07,  7.42it/s][A
Training:  42%|████▏     | 38/91 [00:07<00:09,  5.74it/s][A
Training:  45%|████▌     | 41/91 [00:07<00:08,  5.69it/s][A
Training:  46%|████▌     | 42/91 [00:07<00:08,  5.84it/s][A
Training:  49%|████▉     | 45/91 [00

Epoch: 40/93 - Loss: 0.1765 - Accuracy: 0.9348



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:00<00:10,  1.05it/s][A
 42%|████▏     | 5/12 [00:01<00:02,  3.38it/s][A
 67%|██████▋   | 8/12 [00:01<00:00,  5.82it/s][A
100%|██████████| 12/12 [00:02<00:00,  4.82it/s][A
Epochs:  43%|████▎     | 40/93 [12:04<16:00, 18.13s/it]

Val Loss: 0.2134 - Val Accuracy: 0.9079



Training:   0%|          | 0/91 [00:00<?, ?it/s][A
Training:   1%|          | 1/91 [00:00<01:20,  1.12it/s][A
Training:   4%|▍         | 4/91 [00:01<00:17,  5.01it/s][A
Training:   7%|▋         | 6/91 [00:01<00:21,  3.90it/s][A
Training:  10%|▉         | 9/91 [00:02<00:18,  4.42it/s][A
Training:  13%|█▎        | 12/91 [00:02<00:11,  6.61it/s][A
Training:  15%|█▌        | 14/91 [00:02<00:15,  5.12it/s][A
Training:  19%|█▊        | 17/91 [00:03<00:13,  5.34it/s][A
Training:  20%|█▉        | 18/91 [00:03<00:12,  5.64it/s][A
Training:  22%|██▏       | 20/91 [00:03<00:10,  7.00it/s][A
Training:  24%|██▍       | 22/91 [00:04<00:12,  5.37it/s][A
Training:  27%|██▋       | 25/91 [00:04<00:11,  5.72it/s][A
Training:  29%|██▊       | 26/91 [00:04<00:11,  5.84it/s][A
Training:  32%|███▏      | 29/91 [00:05<00:10,  6.01it/s][A
Training:  33%|███▎      | 30/91 [00:05<00:09,  6.42it/s][A
Training:  34%|███▍      | 31/91 [00:05<00:08,  6.74it/s][A
Training:  36%|███▋      | 33/91 [00

Epoch: 41/93 - Loss: 0.1763 - Accuracy: 0.9341



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:00<00:09,  1.16it/s][A
 42%|████▏     | 5/12 [00:01<00:01,  3.74it/s][A
100%|██████████| 12/12 [00:02<00:00,  5.22it/s][A
Epochs:  44%|████▍     | 41/93 [12:22<15:42, 18.13s/it]

Val Loss: 0.2124 - Val Accuracy: 0.9085



Training:   0%|          | 0/91 [00:00<?, ?it/s][A
Training:   1%|          | 1/91 [00:00<01:23,  1.07it/s][A
Training:   3%|▎         | 3/91 [00:01<00:25,  3.50it/s][A
Training:   5%|▌         | 5/91 [00:01<00:23,  3.69it/s][A
Training:   8%|▊         | 7/91 [00:01<00:16,  5.09it/s][A
Training:  10%|▉         | 9/91 [00:02<00:17,  4.75it/s][A
Training:  13%|█▎        | 12/91 [00:02<00:10,  7.41it/s][A
Training:  15%|█▌        | 14/91 [00:02<00:13,  5.80it/s][A
Training:  16%|█▋        | 15/91 [00:03<00:12,  5.85it/s][A
Training:  19%|█▊        | 17/91 [00:03<00:14,  5.19it/s][A
Training:  21%|██        | 19/91 [00:03<00:11,  6.30it/s][A
Training:  23%|██▎       | 21/91 [00:04<00:13,  5.30it/s][A
Training:  25%|██▌       | 23/91 [00:04<00:10,  6.38it/s][A
Training:  27%|██▋       | 25/91 [00:04<00:11,  5.73it/s][A
Training:  30%|██▉       | 27/91 [00:04<00:09,  6.59it/s][A
Training:  32%|███▏      | 29/91 [00:05<00:10,  5.71it/s][A
Training:  34%|███▍      | 31/91 [00:

Epoch: 42/93 - Loss: 0.1762 - Accuracy: 0.9344



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:00<00:09,  1.18it/s][A
 33%|███▎      | 4/12 [00:00<00:01,  5.29it/s][A
 50%|█████     | 6/12 [00:01<00:01,  4.12it/s][A
100%|██████████| 12/12 [00:02<00:00,  5.25it/s][A
Epochs:  45%|████▌     | 42/93 [12:40<15:21, 18.07s/it]

Val Loss: 0.2126 - Val Accuracy: 0.9095



Training:   0%|          | 0/91 [00:00<?, ?it/s][A
Training:   1%|          | 1/91 [00:00<01:29,  1.01it/s][A
Training:   5%|▌         | 5/91 [00:01<00:24,  3.49it/s][A
Training:   9%|▉         | 8/91 [00:01<00:13,  6.01it/s][A
Training:  11%|█         | 10/91 [00:02<00:16,  5.03it/s][A
Training:  14%|█▍        | 13/91 [00:03<00:16,  4.59it/s][A
Training:  18%|█▊        | 16/91 [00:03<00:11,  6.60it/s][A
Training:  20%|█▉        | 18/91 [00:03<00:13,  5.21it/s][A
Training:  23%|██▎       | 21/91 [00:04<00:14,  4.93it/s][A
Training:  27%|██▋       | 25/91 [00:04<00:11,  5.61it/s][A
Training:  32%|███▏      | 29/91 [00:05<00:10,  5.73it/s][A
Training:  36%|███▋      | 33/91 [00:06<00:09,  5.86it/s][A
Training:  41%|████      | 37/91 [00:06<00:08,  6.02it/s][A
Training:  45%|████▌     | 41/91 [00:07<00:08,  5.94it/s][A
Training:  49%|████▉     | 45/91 [00:08<00:07,  5.95it/s][A
Training:  53%|█████▎    | 48/91 [00:08<00:05,  7.35it/s][A
Training:  55%|█████▍    | 50/91 [0

Epoch: 43/93 - Loss: 0.1761 - Accuracy: 0.9339



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:00<00:09,  1.12it/s][A
 25%|██▌       | 3/12 [00:01<00:02,  3.65it/s][A
 42%|████▏     | 5/12 [00:01<00:01,  3.72it/s][A
 58%|█████▊    | 7/12 [00:01<00:00,  5.65it/s][A
 75%|███████▌  | 9/12 [00:02<00:00,  4.76it/s][A
100%|██████████| 12/12 [00:02<00:00,  5.10it/s][A
Epochs:  46%|████▌     | 43/93 [12:58<15:01, 18.02s/it]

Val Loss: 0.2135 - Val Accuracy: 0.9095



Training:   0%|          | 0/91 [00:00<?, ?it/s][A
Training:   1%|          | 1/91 [00:00<01:29,  1.01it/s][A
Training:   5%|▌         | 5/91 [00:01<00:24,  3.45it/s][A
Training:  10%|▉         | 9/91 [00:02<00:17,  4.75it/s][A
Training:  14%|█▍        | 13/91 [00:02<00:15,  5.19it/s][A
Training:  19%|█▊        | 17/91 [00:03<00:13,  5.46it/s][A
Training:  22%|██▏       | 20/91 [00:03<00:10,  6.98it/s][A
Training:  24%|██▍       | 22/91 [00:04<00:11,  5.85it/s][A
Training:  27%|██▋       | 25/91 [00:04<00:11,  5.51it/s][A
Training:  30%|██▉       | 27/91 [00:05<00:09,  6.58it/s][A
Training:  32%|███▏      | 29/91 [00:05<00:11,  5.50it/s][A
Training:  34%|███▍      | 31/91 [00:05<00:08,  6.78it/s][A
Training:  36%|███▋      | 33/91 [00:06<00:10,  5.39it/s][A
Training:  37%|███▋      | 34/91 [00:06<00:10,  5.50it/s][A
Training:  41%|████      | 37/91 [00:06<00:09,  5.48it/s][A
Training:  42%|████▏     | 38/91 [00:07<00:09,  5.83it/s][A
Training:  45%|████▌     | 41/91 [0

Epoch: 44/93 - Loss: 0.1758 - Accuracy: 0.9347



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:10,  1.00it/s][A
 42%|████▏     | 5/12 [00:01<00:01,  3.71it/s][A
100%|██████████| 12/12 [00:02<00:00,  5.20it/s][A
Epochs:  47%|████▋     | 44/93 [13:16<14:41, 17.99s/it]

Val Loss: 0.2136 - Val Accuracy: 0.9085



Training:   0%|          | 0/91 [00:00<?, ?it/s][A
Training:   1%|          | 1/91 [00:01<01:35,  1.06s/it][A
Training:   4%|▍         | 4/91 [00:01<00:20,  4.28it/s][A
Training:   7%|▋         | 6/91 [00:01<00:21,  3.91it/s][A
Training:  10%|▉         | 9/91 [00:02<00:18,  4.54it/s][A
Training:  13%|█▎        | 12/91 [00:02<00:11,  6.74it/s][A
Training:  15%|█▌        | 14/91 [00:03<00:14,  5.25it/s][A
Training:  19%|█▊        | 17/91 [00:03<00:14,  4.97it/s][A
Training:  23%|██▎       | 21/91 [00:04<00:12,  5.66it/s][A
Training:  27%|██▋       | 25/91 [00:04<00:11,  5.84it/s][A
Training:  31%|███       | 28/91 [00:05<00:08,  7.41it/s][A
Training:  33%|███▎      | 30/91 [00:05<00:10,  6.10it/s][A
Training:  35%|███▌      | 32/91 [00:05<00:08,  7.25it/s][A
Training:  37%|███▋      | 34/91 [00:06<00:09,  5.80it/s][A
Training:  38%|███▊      | 35/91 [00:06<00:09,  6.05it/s][A
Training:  41%|████      | 37/91 [00:06<00:10,  5.22it/s][A
Training:  43%|████▎     | 39/91 [00

Epoch: 45/93 - Loss: 0.1759 - Accuracy: 0.9344



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:00<00:10,  1.06it/s][A
 42%|████▏     | 5/12 [00:01<00:01,  3.66it/s][A
100%|██████████| 12/12 [00:02<00:00,  5.23it/s][A
Epochs:  48%|████▊     | 45/93 [13:34<14:24, 18.02s/it]

Val Loss: 0.2125 - Val Accuracy: 0.9106



Training:   0%|          | 0/91 [00:00<?, ?it/s][A
Training:   1%|          | 1/91 [00:00<01:28,  1.02it/s][A
Training:   5%|▌         | 5/91 [00:01<00:24,  3.52it/s][A
Training:  10%|▉         | 9/91 [00:02<00:17,  4.63it/s][A
Training:  14%|█▍        | 13/91 [00:02<00:15,  5.08it/s][A
Training:  19%|█▊        | 17/91 [00:03<00:13,  5.48it/s][A
Training:  23%|██▎       | 21/91 [00:04<00:12,  5.71it/s][A
Training:  27%|██▋       | 25/91 [00:04<00:11,  5.71it/s][A
Training:  32%|███▏      | 29/91 [00:05<00:10,  5.90it/s][A
Training:  35%|███▌      | 32/91 [00:05<00:08,  7.31it/s][A
Training:  37%|███▋      | 34/91 [00:06<00:09,  6.00it/s][A
Training:  41%|████      | 37/91 [00:06<00:09,  5.65it/s][A
Training:  43%|████▎     | 39/91 [00:07<00:07,  6.67it/s][A
Training:  45%|████▌     | 41/91 [00:07<00:09,  5.46it/s][A
Training:  49%|████▉     | 45/91 [00:08<00:08,  5.65it/s][A
Training:  54%|█████▍    | 49/91 [00:08<00:07,  5.80it/s][A
Training:  58%|█████▊    | 53/91 [0

Epoch: 46/93 - Loss: 0.1759 - Accuracy: 0.9345



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:00<00:10,  1.01it/s][A
 33%|███▎      | 4/12 [00:01<00:01,  4.59it/s][A
 50%|█████     | 6/12 [00:01<00:01,  4.28it/s][A
100%|██████████| 12/12 [00:02<00:00,  5.25it/s][A
Epochs:  49%|████▉     | 46/93 [13:52<14:04, 17.96s/it]

Val Loss: 0.2139 - Val Accuracy: 0.9095



Training:   0%|          | 0/91 [00:00<?, ?it/s][A
Training:   1%|          | 1/91 [00:00<01:27,  1.02it/s][A
Training:   3%|▎         | 3/91 [00:01<00:25,  3.43it/s][A
Training:   5%|▌         | 5/91 [00:01<00:23,  3.70it/s][A
Training:  10%|▉         | 9/91 [00:02<00:16,  4.87it/s][A
Training:  14%|█▍        | 13/91 [00:02<00:14,  5.32it/s][A
Training:  18%|█▊        | 16/91 [00:03<00:10,  7.24it/s][A
Training:  20%|█▉        | 18/91 [00:03<00:13,  5.48it/s][A
Training:  23%|██▎       | 21/91 [00:04<00:13,  5.26it/s][A
Training:  27%|██▋       | 25/91 [00:05<00:12,  5.25it/s][A
Training:  31%|███       | 28/91 [00:05<00:09,  6.94it/s][A
Training:  33%|███▎      | 30/91 [00:05<00:10,  5.73it/s][A
Training:  36%|███▋      | 33/91 [00:06<00:10,  5.42it/s][A
Training:  41%|████      | 37/91 [00:06<00:09,  5.63it/s][A
Training:  45%|████▌     | 41/91 [00:07<00:08,  5.64it/s][A
Training:  49%|████▉     | 45/91 [00:08<00:07,  5.76it/s][A
Training:  54%|█████▍    | 49/91 [00

Epoch: 47/93 - Loss: 0.1756 - Accuracy: 0.9341



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:00<00:09,  1.10it/s][A
 42%|████▏     | 5/12 [00:01<00:01,  3.65it/s][A
100%|██████████| 12/12 [00:02<00:00,  5.34it/s][A
Epochs:  51%|█████     | 47/93 [14:10<13:46, 17.97s/it]

Val Loss: 0.2143 - Val Accuracy: 0.9079



Training:   0%|          | 0/91 [00:00<?, ?it/s][A
Training:   1%|          | 1/91 [00:00<01:19,  1.13it/s][A
Training:   3%|▎         | 3/91 [00:00<00:23,  3.73it/s][A
Training:   5%|▌         | 5/91 [00:01<00:21,  4.04it/s][A
Training:   8%|▊         | 7/91 [00:01<00:14,  5.97it/s][A
Training:  10%|▉         | 9/91 [00:02<00:18,  4.53it/s][A
Training:  13%|█▎        | 12/91 [00:02<00:11,  6.80it/s][A
Training:  15%|█▌        | 14/91 [00:02<00:14,  5.17it/s][A
Training:  19%|█▊        | 17/91 [00:03<00:14,  5.16it/s][A
Training:  22%|██▏       | 20/91 [00:03<00:09,  7.29it/s][A
Training:  24%|██▍       | 22/91 [00:04<00:12,  5.44it/s][A
Training:  27%|██▋       | 25/91 [00:04<00:12,  5.44it/s][A
Training:  30%|██▉       | 27/91 [00:04<00:09,  6.58it/s][A
Training:  32%|███▏      | 29/91 [00:05<00:11,  5.49it/s][A
Training:  33%|███▎      | 30/91 [00:05<00:11,  5.49it/s][A
Training:  36%|███▋      | 33/91 [00:06<00:10,  5.59it/s][A
Training:  37%|███▋      | 34/91 [00:

Epoch: 48/93 - Loss: 0.1756 - Accuracy: 0.9347



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:00<00:09,  1.11it/s][A
 42%|████▏     | 5/12 [00:01<00:01,  3.74it/s][A
 58%|█████▊    | 7/12 [00:01<00:00,  5.21it/s][A
 75%|███████▌  | 9/12 [00:02<00:00,  4.88it/s][A
100%|██████████| 12/12 [00:02<00:00,  5.14it/s][A
Epochs:  52%|█████▏    | 48/93 [14:28<13:28, 17.97s/it]

Val Loss: 0.2139 - Val Accuracy: 0.9095



Training:   0%|          | 0/91 [00:00<?, ?it/s][A
Training:   1%|          | 1/91 [00:00<01:19,  1.13it/s][A
Training:   5%|▌         | 5/91 [00:01<00:21,  3.96it/s][A
Training:   8%|▊         | 7/91 [00:01<00:14,  5.64it/s][A
Training:  10%|▉         | 9/91 [00:02<00:16,  4.91it/s][A
Training:  11%|█         | 10/91 [00:02<00:15,  5.33it/s][A
Training:  14%|█▍        | 13/91 [00:02<00:14,  5.54it/s][A
Training:  15%|█▌        | 14/91 [00:02<00:13,  5.66it/s][A
Training:  19%|█▊        | 17/91 [00:03<00:12,  6.02it/s][A
Training:  20%|█▉        | 18/91 [00:03<00:12,  5.69it/s][A
Training:  23%|██▎       | 21/91 [00:03<00:10,  6.38it/s][A
Training:  24%|██▍       | 22/91 [00:04<00:11,  5.90it/s][A
Training:  27%|██▋       | 25/91 [00:04<00:10,  6.26it/s][A
Training:  29%|██▊       | 26/91 [00:04<00:10,  6.25it/s][A
Training:  32%|███▏      | 29/91 [00:05<00:10,  6.04it/s][A
Training:  33%|███▎      | 30/91 [00:05<00:09,  6.15it/s][A
Training:  36%|███▋      | 33/91 [00

Epoch: 49/93 - Loss: 0.1755 - Accuracy: 0.9351



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:00<00:09,  1.12it/s][A
 42%|████▏     | 5/12 [00:01<00:02,  3.49it/s][A
100%|██████████| 12/12 [00:02<00:00,  5.24it/s][A
Epochs:  53%|█████▎    | 49/93 [14:46<13:09, 17.95s/it]

Val Loss: 0.2147 - Val Accuracy: 0.9112



Training:   0%|          | 0/91 [00:00<?, ?it/s][A
Training:   1%|          | 1/91 [00:00<01:15,  1.19it/s][A
Training:   3%|▎         | 3/91 [00:00<00:22,  3.84it/s][A
Training:   5%|▌         | 5/91 [00:01<00:21,  3.95it/s][A
Training:   7%|▋         | 6/91 [00:01<00:20,  4.16it/s][A
Training:  10%|▉         | 9/91 [00:02<00:16,  5.05it/s][A
Training:  11%|█         | 10/91 [00:02<00:15,  5.12it/s][A
Training:  14%|█▍        | 13/91 [00:02<00:12,  6.01it/s][A
Training:  15%|█▌        | 14/91 [00:03<00:14,  5.23it/s][A
Training:  19%|█▊        | 17/91 [00:03<00:11,  6.53it/s][A
Training:  20%|█▉        | 18/91 [00:03<00:13,  5.37it/s][A
Training:  23%|██▎       | 21/91 [00:03<00:10,  6.93it/s][A
Training:  24%|██▍       | 22/91 [00:04<00:13,  5.16it/s][A
Training:  27%|██▋       | 25/91 [00:04<00:08,  7.43it/s][A
Training:  29%|██▊       | 26/91 [00:05<00:12,  5.01it/s][A
Training:  32%|███▏      | 29/91 [00:05<00:08,  7.33it/s][A
Training:  34%|███▍      | 31/91 [00:

Epoch: 50/93 - Loss: 0.1760 - Accuracy: 0.9343



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:00<00:09,  1.13it/s][A
 25%|██▌       | 3/12 [00:00<00:02,  3.73it/s][A
 42%|████▏     | 5/12 [00:01<00:01,  3.62it/s][A
100%|██████████| 12/12 [00:02<00:00,  5.17it/s][A
Epochs:  54%|█████▍    | 50/93 [15:04<12:56, 18.05s/it]

Val Loss: 0.2143 - Val Accuracy: 0.9112



Training:   0%|          | 0/91 [00:00<?, ?it/s][A
Training:   1%|          | 1/91 [00:00<01:10,  1.29it/s][A
Training:   3%|▎         | 3/91 [00:00<00:21,  4.18it/s][A
Training:   5%|▌         | 5/91 [00:01<00:22,  3.76it/s][A
Training:   8%|▊         | 7/91 [00:01<00:14,  5.69it/s][A
Training:  10%|▉         | 9/91 [00:02<00:17,  4.65it/s][A
Training:  13%|█▎        | 12/91 [00:02<00:10,  7.36it/s][A
Training:  15%|█▌        | 14/91 [00:02<00:13,  5.56it/s][A
Training:  19%|█▊        | 17/91 [00:03<00:13,  5.29it/s][A
Training:  21%|██        | 19/91 [00:03<00:10,  6.57it/s][A
Training:  23%|██▎       | 21/91 [00:04<00:12,  5.41it/s][A
Training:  26%|██▋       | 24/91 [00:04<00:08,  7.75it/s][A
Training:  29%|██▊       | 26/91 [00:04<00:11,  5.47it/s][A
Training:  32%|███▏      | 29/91 [00:05<00:11,  5.18it/s][A
Training:  35%|███▌      | 32/91 [00:05<00:08,  7.16it/s][A
Training:  37%|███▋      | 34/91 [00:06<00:10,  5.59it/s][A
Training:  41%|████      | 37/91 [00:

Epoch: 51/93 - Loss: 0.1756 - Accuracy: 0.9339



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:00<00:09,  1.14it/s][A
 33%|███▎      | 4/12 [00:00<00:01,  5.09it/s][A
 50%|█████     | 6/12 [00:01<00:01,  4.14it/s][A
 75%|███████▌  | 9/12 [00:02<00:00,  4.79it/s][A
100%|██████████| 12/12 [00:02<00:00,  5.23it/s][A
Epochs:  55%|█████▍    | 51/93 [15:22<12:37, 18.03s/it]

Val Loss: 0.2132 - Val Accuracy: 0.9085



Training:   0%|          | 0/91 [00:00<?, ?it/s][A
Training:   1%|          | 1/91 [00:00<01:11,  1.26it/s][A
Training:   3%|▎         | 3/91 [00:00<00:21,  4.11it/s][A
Training:   5%|▌         | 5/91 [00:01<00:21,  3.93it/s][A
Training:   8%|▊         | 7/91 [00:01<00:14,  5.76it/s][A
Training:  10%|▉         | 9/91 [00:02<00:16,  5.01it/s][A
Training:  12%|█▏        | 11/91 [00:02<00:13,  5.79it/s][A
Training:  14%|█▍        | 13/91 [00:02<00:13,  5.67it/s][A
Training:  15%|█▌        | 14/91 [00:02<00:12,  5.97it/s][A
Training:  19%|█▊        | 17/91 [00:03<00:11,  6.20it/s][A
Training:  20%|█▉        | 18/91 [00:03<00:12,  5.90it/s][A
Training:  21%|██        | 19/91 [00:03<00:11,  6.15it/s][A
Training:  23%|██▎       | 21/91 [00:03<00:11,  6.15it/s][A
Training:  24%|██▍       | 22/91 [00:04<00:11,  5.75it/s][A
Training:  25%|██▌       | 23/91 [00:04<00:10,  6.28it/s][A
Training:  27%|██▋       | 25/91 [00:04<00:11,  5.82it/s][A
Training:  29%|██▊       | 26/91 [00:

Epoch: 52/93 - Loss: 0.1761 - Accuracy: 0.9338



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:00<00:09,  1.18it/s][A
 42%|████▏     | 5/12 [00:01<00:01,  3.73it/s][A
100%|██████████| 12/12 [00:02<00:00,  5.24it/s][A
Epochs:  56%|█████▌    | 52/93 [15:40<12:17, 18.00s/it]

Val Loss: 0.2130 - Val Accuracy: 0.9112



Training:   0%|          | 0/91 [00:00<?, ?it/s][A
Training:   1%|          | 1/91 [00:00<01:21,  1.11it/s][A
Training:   5%|▌         | 5/91 [00:01<00:23,  3.67it/s][A
Training:   9%|▉         | 8/91 [00:01<00:13,  6.30it/s][A
Training:  11%|█         | 10/91 [00:02<00:16,  4.95it/s][A
Training:  14%|█▍        | 13/91 [00:02<00:15,  4.95it/s][A
Training:  18%|█▊        | 16/91 [00:02<00:10,  7.06it/s][A
Training:  20%|█▉        | 18/91 [00:03<00:12,  5.66it/s][A
Training:  23%|██▎       | 21/91 [00:04<00:13,  5.35it/s][A
Training:  27%|██▋       | 25/91 [00:04<00:11,  5.57it/s][A
Training:  32%|███▏      | 29/91 [00:05<00:10,  5.81it/s][A
Training:  35%|███▌      | 32/91 [00:05<00:08,  7.35it/s][A
Training:  37%|███▋      | 34/91 [00:06<00:09,  5.91it/s][A
Training:  41%|████      | 37/91 [00:06<00:10,  5.24it/s][A
Training:  45%|████▌     | 41/91 [00:07<00:09,  5.49it/s][A
Training:  49%|████▉     | 45/91 [00:08<00:08,  5.61it/s][A
Training:  53%|█████▎    | 48/91 [0

Epoch: 53/93 - Loss: 0.1762 - Accuracy: 0.9337



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:00<00:09,  1.20it/s][A
 42%|████▏     | 5/12 [00:01<00:01,  3.82it/s][A
100%|██████████| 12/12 [00:02<00:00,  5.55it/s][A
Epochs:  57%|█████▋    | 53/93 [15:58<11:59, 18.00s/it]

Val Loss: 0.2132 - Val Accuracy: 0.9101



Training:   0%|          | 0/91 [00:00<?, ?it/s][A
Training:   1%|          | 1/91 [00:00<01:17,  1.15it/s][A
Training:   4%|▍         | 4/91 [00:00<00:16,  5.19it/s][A
Training:   7%|▋         | 6/91 [00:01<00:19,  4.28it/s][A
Training:  10%|▉         | 9/91 [00:02<00:16,  4.83it/s][A
Training:  13%|█▎        | 12/91 [00:02<00:11,  7.15it/s][A
Training:  15%|█▌        | 14/91 [00:02<00:14,  5.46it/s][A
Training:  19%|█▊        | 17/91 [00:03<00:14,  5.14it/s][A
Training:  23%|██▎       | 21/91 [00:04<00:13,  5.33it/s][A
Training:  24%|██▍       | 22/91 [00:04<00:12,  5.59it/s][A
Training:  27%|██▋       | 25/91 [00:04<00:11,  5.55it/s][A
Training:  29%|██▊       | 26/91 [00:04<00:11,  5.63it/s][A
Training:  32%|███▏      | 29/91 [00:05<00:11,  5.44it/s][A
Training:  33%|███▎      | 30/91 [00:05<00:10,  5.61it/s][A
Training:  36%|███▋      | 33/91 [00:06<00:10,  5.58it/s][A
Training:  37%|███▋      | 34/91 [00:06<00:10,  5.56it/s][A
Training:  41%|████      | 37/91 [00

Epoch: 54/93 - Loss: 0.1757 - Accuracy: 0.9335



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:00<00:08,  1.31it/s][A
 33%|███▎      | 4/12 [00:00<00:01,  5.79it/s][A
 50%|█████     | 6/12 [00:01<00:01,  4.27it/s][A
100%|██████████| 12/12 [00:02<00:00,  5.54it/s][A
Epochs:  58%|█████▊    | 54/93 [16:16<11:41, 18.00s/it]

Val Loss: 0.2135 - Val Accuracy: 0.9090



Training:   0%|          | 0/91 [00:00<?, ?it/s][A
Training:   1%|          | 1/91 [00:00<01:19,  1.13it/s][A
Training:   5%|▌         | 5/91 [00:01<00:22,  3.81it/s][A
Training:  10%|▉         | 9/91 [00:02<00:16,  4.91it/s][A
Training:  13%|█▎        | 12/91 [00:02<00:11,  7.03it/s][A
Training:  15%|█▌        | 14/91 [00:02<00:14,  5.29it/s][A
Training:  19%|█▊        | 17/91 [00:03<00:15,  4.77it/s][A
Training:  23%|██▎       | 21/91 [00:04<00:13,  5.27it/s][A
Training:  27%|██▋       | 25/91 [00:04<00:11,  5.64it/s][A
Training:  32%|███▏      | 29/91 [00:05<00:10,  5.78it/s][A
Training:  36%|███▋      | 33/91 [00:06<00:09,  5.80it/s][A
Training:  40%|███▉      | 36/91 [00:06<00:07,  7.32it/s][A
Training:  42%|████▏     | 38/91 [00:06<00:08,  6.19it/s][A
Training:  45%|████▌     | 41/91 [00:07<00:09,  5.49it/s][A
Training:  49%|████▉     | 45/91 [00:08<00:08,  5.69it/s][A
Training:  54%|█████▍    | 49/91 [00:08<00:07,  5.94it/s][A
Training:  58%|█████▊    | 53/91 [0

Epoch: 55/93 - Loss: 0.1755 - Accuracy: 0.9349



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:00<00:08,  1.22it/s][A
 42%|████▏     | 5/12 [00:01<00:01,  4.10it/s][A
100%|██████████| 12/12 [00:02<00:00,  5.50it/s][A
Epochs:  59%|█████▉    | 55/93 [16:34<11:22, 17.97s/it]

Val Loss: 0.2130 - Val Accuracy: 0.9106



Training:   0%|          | 0/91 [00:00<?, ?it/s][A
Training:   1%|          | 1/91 [00:00<01:19,  1.14it/s][A
Training:   5%|▌         | 5/91 [00:01<00:20,  4.12it/s][A
Training:  10%|▉         | 9/91 [00:01<00:14,  5.55it/s][A
Training:  13%|█▎        | 12/91 [00:02<00:10,  7.85it/s][A
Training:  15%|█▌        | 14/91 [00:02<00:13,  5.55it/s][A
Training:  19%|█▊        | 17/91 [00:03<00:14,  5.28it/s][A
Training:  23%|██▎       | 21/91 [00:03<00:12,  5.64it/s][A
Training:  27%|██▋       | 25/91 [00:04<00:11,  5.89it/s][A
Training:  32%|███▏      | 29/91 [00:05<00:10,  5.89it/s][A
Training:  36%|███▋      | 33/91 [00:05<00:09,  5.93it/s][A
Training:  41%|████      | 37/91 [00:06<00:09,  6.00it/s][A
Training:  44%|████▍     | 40/91 [00:06<00:06,  7.49it/s][A
Training:  46%|████▌     | 42/91 [00:07<00:07,  6.15it/s][A
Training:  49%|████▉     | 45/91 [00:07<00:08,  5.69it/s][A
Training:  52%|█████▏    | 47/91 [00:08<00:06,  6.45it/s][A
Training:  54%|█████▍    | 49/91 [0

Epoch: 56/93 - Loss: 0.1754 - Accuracy: 0.9343



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:00<00:08,  1.26it/s][A
 42%|████▏     | 5/12 [00:01<00:01,  4.40it/s][A
 75%|███████▌  | 9/12 [00:01<00:00,  5.94it/s][A
100%|██████████| 12/12 [00:01<00:00,  6.16it/s][A
Epochs:  60%|██████    | 56/93 [16:51<10:56, 17.73s/it]

Val Loss: 0.2192 - Val Accuracy: 0.9128



Training:   0%|          | 0/91 [00:00<?, ?it/s][A
Training:   1%|          | 1/91 [00:00<01:17,  1.16it/s][A
Training:   5%|▌         | 5/91 [00:01<00:21,  3.97it/s][A
Training:   7%|▋         | 6/91 [00:01<00:18,  4.56it/s][A
Training:  10%|▉         | 9/91 [00:02<00:15,  5.19it/s][A
Training:  12%|█▏        | 11/91 [00:02<00:11,  6.71it/s][A
Training:  14%|█▍        | 13/91 [00:02<00:13,  5.81it/s][A
Training:  16%|█▋        | 15/91 [00:02<00:10,  7.26it/s][A
Training:  19%|█▊        | 17/91 [00:03<00:13,  5.38it/s][A
Training:  22%|██▏       | 20/91 [00:03<00:08,  7.94it/s][A
Training:  24%|██▍       | 22/91 [00:04<00:12,  5.53it/s][A
Training:  27%|██▋       | 25/91 [00:04<00:12,  5.32it/s][A
Training:  30%|██▉       | 27/91 [00:04<00:10,  6.40it/s][A
Training:  32%|███▏      | 29/91 [00:05<00:11,  5.27it/s][A
Training:  36%|███▋      | 33/91 [00:06<00:10,  5.60it/s][A
Training:  38%|███▊      | 35/91 [00:06<00:08,  6.69it/s][A
Training:  41%|████      | 37/91 [00

Epoch: 57/93 - Loss: 0.1756 - Accuracy: 0.9348



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:00<00:09,  1.21it/s][A
 33%|███▎      | 4/12 [00:00<00:01,  5.14it/s][A
 50%|█████     | 6/12 [00:01<00:01,  4.61it/s][A
100%|██████████| 12/12 [00:02<00:00,  5.90it/s][A
Epochs:  61%|██████▏   | 57/93 [17:09<10:35, 17.65s/it]

Val Loss: 0.2142 - Val Accuracy: 0.9107



Training:   0%|          | 0/91 [00:00<?, ?it/s][A
Training:   1%|          | 1/91 [00:00<01:20,  1.12it/s][A
Training:   5%|▌         | 5/91 [00:01<00:21,  3.99it/s][A
Training:  10%|▉         | 9/91 [00:02<00:15,  5.19it/s][A
Training:  14%|█▍        | 13/91 [00:02<00:12,  6.05it/s][A
Training:  18%|█▊        | 16/91 [00:02<00:09,  8.07it/s][A
Training:  20%|█▉        | 18/91 [00:03<00:11,  6.23it/s][A
Training:  22%|██▏       | 20/91 [00:03<00:09,  7.48it/s][A
Training:  24%|██▍       | 22/91 [00:03<00:11,  5.76it/s][A
Training:  27%|██▋       | 25/91 [00:04<00:12,  5.45it/s][A
Training:  30%|██▉       | 27/91 [00:04<00:09,  6.57it/s][A
Training:  32%|███▏      | 29/91 [00:05<00:10,  5.71it/s][A
Training:  33%|███▎      | 30/91 [00:05<00:10,  6.00it/s][A
Training:  35%|███▌      | 32/91 [00:05<00:07,  7.69it/s][A
Training:  37%|███▋      | 34/91 [00:05<00:09,  5.77it/s][A
Training:  40%|███▉      | 36/91 [00:05<00:07,  7.32it/s][A
Training:  42%|████▏     | 38/91 [0

Epoch: 58/93 - Loss: 0.1758 - Accuracy: 0.9348



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:00<00:09,  1.19it/s][A
 33%|███▎      | 4/12 [00:00<00:01,  5.27it/s][A
 50%|█████     | 6/12 [00:01<00:01,  4.32it/s][A
100%|██████████| 12/12 [00:02<00:00,  5.65it/s][A
Epochs:  62%|██████▏   | 58/93 [17:26<10:15, 17.58s/it]

Val Loss: 0.2143 - Val Accuracy: 0.9090



Training:   0%|          | 0/91 [00:00<?, ?it/s][A
Training:   1%|          | 1/91 [00:00<01:18,  1.14it/s][A
Training:   5%|▌         | 5/91 [00:01<00:22,  3.79it/s][A
Training:  10%|▉         | 9/91 [00:02<00:16,  5.03it/s][A
Training:  14%|█▍        | 13/91 [00:02<00:13,  5.83it/s][A
Training:  19%|█▊        | 17/91 [00:03<00:11,  6.38it/s][A
Training:  21%|██        | 19/91 [00:03<00:09,  7.41it/s][A
Training:  23%|██▎       | 21/91 [00:03<00:11,  6.11it/s][A
Training:  27%|██▋       | 25/91 [00:04<00:11,  5.98it/s][A
Training:  31%|███       | 28/91 [00:04<00:08,  7.73it/s][A
Training:  33%|███▎      | 30/91 [00:05<00:09,  6.12it/s][A
Training:  35%|███▌      | 32/91 [00:05<00:08,  7.23it/s][A
Training:  37%|███▋      | 34/91 [00:05<00:09,  6.05it/s][A
Training:  40%|███▉      | 36/91 [00:05<00:07,  7.18it/s][A
Training:  42%|████▏     | 38/91 [00:06<00:09,  5.54it/s][A
Training:  44%|████▍     | 40/91 [00:06<00:07,  6.76it/s][A
Training:  46%|████▌     | 42/91 [0

Epoch: 59/93 - Loss: 0.1756 - Accuracy: 0.9348



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:00<00:09,  1.13it/s][A
 25%|██▌       | 3/12 [00:01<00:02,  3.66it/s][A
 42%|████▏     | 5/12 [00:01<00:01,  3.92it/s][A
 50%|█████     | 6/12 [00:01<00:01,  4.53it/s][A
100%|██████████| 12/12 [00:02<00:00,  5.45it/s][A
Epochs:  63%|██████▎   | 59/93 [17:44<09:56, 17.54s/it]

Val Loss: 0.2132 - Val Accuracy: 0.9106



Training:   0%|          | 0/91 [00:00<?, ?it/s][A
Training:   1%|          | 1/91 [00:00<01:16,  1.18it/s][A
Training:   5%|▌         | 5/91 [00:01<00:20,  4.18it/s][A
Training:  10%|▉         | 9/91 [00:01<00:15,  5.19it/s][A
Training:  14%|█▍        | 13/91 [00:02<00:13,  5.83it/s][A
Training:  18%|█▊        | 16/91 [00:02<00:09,  7.72it/s][A
Training:  20%|█▉        | 18/91 [00:03<00:11,  6.37it/s][A
Training:  23%|██▎       | 21/91 [00:03<00:11,  6.01it/s][A
Training:  27%|██▋       | 25/91 [00:04<00:10,  6.35it/s][A
Training:  30%|██▉       | 27/91 [00:04<00:08,  7.42it/s][A
Training:  32%|███▏      | 29/91 [00:04<00:10,  6.06it/s][A
Training:  33%|███▎      | 30/91 [00:05<00:10,  6.09it/s][A
Training:  36%|███▋      | 33/91 [00:05<00:09,  5.80it/s][A
Training:  37%|███▋      | 34/91 [00:05<00:09,  6.05it/s][A
Training:  41%|████      | 37/91 [00:06<00:09,  5.67it/s][A
Training:  44%|████▍     | 40/91 [00:06<00:06,  7.95it/s][A
Training:  46%|████▌     | 42/91 [0

Epoch: 60/93 - Loss: 0.1759 - Accuracy: 0.9334



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:00<00:10,  1.02it/s][A
 33%|███▎      | 4/12 [00:01<00:01,  4.51it/s][A
 50%|█████     | 6/12 [00:01<00:01,  4.37it/s][A
 75%|███████▌  | 9/12 [00:02<00:00,  4.80it/s][A
100%|██████████| 12/12 [00:02<00:00,  5.17it/s][A
Epochs:  65%|██████▍   | 60/93 [18:01<09:37, 17.49s/it]

Val Loss: 0.2168 - Val Accuracy: 0.9123



Training:   0%|          | 0/91 [00:00<?, ?it/s][A
Training:   1%|          | 1/91 [00:00<01:11,  1.26it/s][A
Training:   5%|▌         | 5/91 [00:01<00:20,  4.16it/s][A
Training:   9%|▉         | 8/91 [00:01<00:11,  6.97it/s][A
Training:  11%|█         | 10/91 [00:01<00:14,  5.71it/s][A
Training:  14%|█▍        | 13/91 [00:02<00:13,  5.59it/s][A
Training:  15%|█▌        | 14/91 [00:02<00:13,  5.64it/s][A
Training:  19%|█▊        | 17/91 [00:03<00:11,  6.19it/s][A
Training:  20%|█▉        | 18/91 [00:03<00:12,  6.05it/s][A
Training:  23%|██▎       | 21/91 [00:03<00:11,  6.14it/s][A
Training:  24%|██▍       | 22/91 [00:03<00:11,  5.96it/s][A
Training:  27%|██▋       | 25/91 [00:04<00:10,  6.51it/s][A
Training:  29%|██▊       | 26/91 [00:04<00:10,  6.02it/s][A
Training:  32%|███▏      | 29/91 [00:04<00:08,  7.10it/s][A
Training:  33%|███▎      | 30/91 [00:05<00:10,  5.57it/s][A
Training:  36%|███▋      | 33/91 [00:05<00:08,  6.98it/s][A
Training:  37%|███▋      | 34/91 [0

Epoch: 61/93 - Loss: 0.1753 - Accuracy: 0.9354



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:00<00:09,  1.17it/s][A
 33%|███▎      | 4/12 [00:00<00:01,  5.06it/s][A
 50%|█████     | 6/12 [00:01<00:01,  4.04it/s][A
 67%|██████▋   | 8/12 [00:01<00:00,  5.65it/s][A
100%|██████████| 12/12 [00:02<00:00,  5.20it/s][A
Epochs:  66%|██████▌   | 61/93 [18:18<09:19, 17.47s/it]

Val Loss: 0.2155 - Val Accuracy: 0.9123



Training:   0%|          | 0/91 [00:00<?, ?it/s][A
Training:   1%|          | 1/91 [00:00<01:18,  1.14it/s][A
Training:   5%|▌         | 5/91 [00:01<00:22,  3.80it/s][A
Training:  10%|▉         | 9/91 [00:02<00:15,  5.21it/s][A
Training:  14%|█▍        | 13/91 [00:02<00:13,  5.90it/s][A
Training:  19%|█▊        | 17/91 [00:03<00:11,  6.30it/s][A
Training:  23%|██▎       | 21/91 [00:03<00:10,  6.49it/s][A
Training:  26%|██▋       | 24/91 [00:03<00:08,  8.21it/s][A
Training:  29%|██▊       | 26/91 [00:04<00:09,  6.59it/s][A
Training:  31%|███       | 28/91 [00:04<00:08,  7.75it/s][A
Training:  33%|███▎      | 30/91 [00:05<00:09,  6.26it/s][A
Training:  35%|███▌      | 32/91 [00:05<00:07,  7.54it/s][A
Training:  37%|███▋      | 34/91 [00:05<00:09,  6.09it/s][A
Training:  41%|████      | 37/91 [00:06<00:09,  5.63it/s][A
Training:  44%|████▍     | 40/91 [00:06<00:06,  7.67it/s][A
Training:  46%|████▌     | 42/91 [00:06<00:08,  5.79it/s][A
Training:  49%|████▉     | 45/91 [0

Epoch: 62/93 - Loss: 0.1755 - Accuracy: 0.9348



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:00<00:10,  1.09it/s][A
 42%|████▏     | 5/12 [00:01<00:01,  3.56it/s][A
100%|██████████| 12/12 [00:02<00:00,  5.21it/s][A
Epochs:  67%|██████▋   | 62/93 [18:36<08:59, 17.41s/it]

Val Loss: 0.2127 - Val Accuracy: 0.9079



Training:   0%|          | 0/91 [00:00<?, ?it/s][A
Training:   1%|          | 1/91 [00:00<01:22,  1.09it/s][A
Training:   5%|▌         | 5/91 [00:01<00:22,  3.89it/s][A
Training:  10%|▉         | 9/91 [00:02<00:16,  4.84it/s][A
Training:  13%|█▎        | 12/91 [00:02<00:11,  6.92it/s][A
Training:  15%|█▌        | 14/91 [00:02<00:12,  5.97it/s][A
Training:  19%|█▊        | 17/91 [00:03<00:12,  5.93it/s][A
Training:  22%|██▏       | 20/91 [00:03<00:08,  7.91it/s][A
Training:  24%|██▍       | 22/91 [00:03<00:10,  6.35it/s][A
Training:  27%|██▋       | 25/91 [00:04<00:10,  6.39it/s][A
Training:  29%|██▊       | 26/91 [00:04<00:10,  6.12it/s][A
Training:  32%|███▏      | 29/91 [00:04<00:09,  6.66it/s][A
Training:  33%|███▎      | 30/91 [00:05<00:10,  6.08it/s][A
Training:  36%|███▋      | 33/91 [00:05<00:08,  6.54it/s][A
Training:  37%|███▋      | 34/91 [00:05<00:08,  6.63it/s][A
Training:  41%|████      | 37/91 [00:06<00:08,  6.67it/s][A
Training:  42%|████▏     | 38/91 [0

Epoch: 63/93 - Loss: 0.1754 - Accuracy: 0.9352



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:00<00:09,  1.12it/s][A
 42%|████▏     | 5/12 [00:01<00:01,  3.71it/s][A
 67%|██████▋   | 8/12 [00:01<00:00,  6.16it/s][A
100%|██████████| 12/12 [00:02<00:00,  5.13it/s][A
Epochs:  68%|██████▊   | 63/93 [18:53<08:41, 17.39s/it]

Val Loss: 0.2120 - Val Accuracy: 0.9079



Training:   0%|          | 0/91 [00:00<?, ?it/s][A
Training:   1%|          | 1/91 [00:00<01:17,  1.16it/s][A
Training:   5%|▌         | 5/91 [00:01<00:21,  3.97it/s][A
Training:   9%|▉         | 8/91 [00:01<00:12,  6.65it/s][A
Training:  11%|█         | 10/91 [00:02<00:14,  5.51it/s][A
Training:  13%|█▎        | 12/91 [00:02<00:11,  6.91it/s][A
Training:  15%|█▌        | 14/91 [00:02<00:14,  5.42it/s][A
Training:  19%|█▊        | 17/91 [00:03<00:13,  5.62it/s][A
Training:  21%|██        | 19/91 [00:03<00:10,  6.80it/s][A
Training:  23%|██▎       | 21/91 [00:03<00:11,  5.90it/s][A
Training:  26%|██▋       | 24/91 [00:03<00:08,  7.87it/s][A
Training:  29%|██▊       | 26/91 [00:04<00:09,  7.18it/s][A
Training:  30%|██▉       | 27/91 [00:04<00:08,  7.23it/s][A
Training:  32%|███▏      | 29/91 [00:05<00:11,  5.60it/s][A
Training:  34%|███▍      | 31/91 [00:05<00:08,  7.06it/s][A
Training:  36%|███▋      | 33/91 [00:05<00:11,  5.25it/s][A
Training:  41%|████      | 37/91 [0

Epoch: 64/93 - Loss: 0.1754 - Accuracy: 0.9340



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:00<00:09,  1.15it/s][A
 33%|███▎      | 4/12 [00:00<00:01,  5.13it/s][A
 50%|█████     | 6/12 [00:01<00:01,  4.34it/s][A
 67%|██████▋   | 8/12 [00:01<00:00,  6.08it/s][A
100%|██████████| 12/12 [00:02<00:00,  5.16it/s][A
Epochs:  69%|██████▉   | 64/93 [19:10<08:23, 17.38s/it]

Val Loss: 0.2117 - Val Accuracy: 0.9079



Training:   0%|          | 0/91 [00:00<?, ?it/s][A
Training:   1%|          | 1/91 [00:00<01:17,  1.16it/s][A
Training:   4%|▍         | 4/91 [00:00<00:16,  5.20it/s][A
Training:   7%|▋         | 6/91 [00:01<00:20,  4.07it/s][A
Training:  10%|▉         | 9/91 [00:02<00:17,  4.60it/s][A
Training:  14%|█▍        | 13/91 [00:02<00:14,  5.26it/s][A
Training:  19%|█▊        | 17/91 [00:03<00:13,  5.51it/s][A
Training:  23%|██▎       | 21/91 [00:04<00:11,  5.92it/s][A
Training:  27%|██▋       | 25/91 [00:04<00:10,  6.46it/s][A
Training:  32%|███▏      | 29/91 [00:05<00:09,  6.72it/s][A
Training:  34%|███▍      | 31/91 [00:05<00:07,  7.59it/s][A
Training:  36%|███▋      | 33/91 [00:05<00:09,  6.07it/s][A
Training:  38%|███▊      | 35/91 [00:05<00:07,  7.24it/s][A
Training:  41%|████      | 37/91 [00:06<00:08,  6.04it/s][A
Training:  42%|████▏     | 38/91 [00:06<00:08,  6.39it/s][A
Training:  45%|████▌     | 41/91 [00:07<00:08,  6.14it/s][A
Training:  48%|████▊     | 44/91 [00

Epoch: 65/93 - Loss: 0.1753 - Accuracy: 0.9354



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:00<00:09,  1.14it/s][A
 33%|███▎      | 4/12 [00:01<00:01,  4.49it/s][A
 42%|████▏     | 5/12 [00:01<00:02,  3.29it/s][A
 67%|██████▋   | 8/12 [00:01<00:00,  5.61it/s][A
100%|██████████| 12/12 [00:02<00:00,  5.07it/s][A
Epochs:  70%|██████▉   | 65/93 [19:28<08:07, 17.41s/it]

Val Loss: 0.2144 - Val Accuracy: 0.9112



Training:   0%|          | 0/91 [00:00<?, ?it/s][A
Training:   1%|          | 1/91 [00:00<01:25,  1.06it/s][A
Training:   3%|▎         | 3/91 [00:01<00:25,  3.41it/s][A
Training:   5%|▌         | 5/91 [00:01<00:24,  3.55it/s][A
Training:  10%|▉         | 9/91 [00:02<00:16,  4.90it/s][A
Training:  14%|█▍        | 13/91 [00:02<00:13,  5.96it/s][A
Training:  19%|█▊        | 17/91 [00:03<00:12,  6.03it/s][A
Training:  23%|██▎       | 21/91 [00:04<00:11,  6.06it/s][A
Training:  27%|██▋       | 25/91 [00:04<00:10,  6.40it/s][A
Training:  32%|███▏      | 29/91 [00:05<00:09,  6.76it/s][A
Training:  36%|███▋      | 33/91 [00:05<00:08,  6.63it/s][A
Training:  41%|████      | 37/91 [00:06<00:08,  6.47it/s][A
Training:  43%|████▎     | 39/91 [00:06<00:07,  7.31it/s][A
Training:  45%|████▌     | 41/91 [00:07<00:08,  6.19it/s][A
Training:  49%|████▉     | 45/91 [00:07<00:07,  6.19it/s][A
Training:  54%|█████▍    | 49/91 [00:08<00:06,  6.18it/s][A
Training:  58%|█████▊    | 53/91 [00

Epoch: 66/93 - Loss: 0.1753 - Accuracy: 0.9351



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:00<00:09,  1.17it/s][A
 17%|█▋        | 2/12 [00:00<00:04,  2.33it/s][A
 42%|████▏     | 5/12 [00:01<00:01,  3.98it/s][A
 58%|█████▊    | 7/12 [00:01<00:00,  5.88it/s][A
100%|██████████| 12/12 [00:02<00:00,  5.19it/s][A
Epochs:  71%|███████   | 66/93 [19:45<07:49, 17.40s/it]

Val Loss: 0.2118 - Val Accuracy: 0.9068



Training:   0%|          | 0/91 [00:00<?, ?it/s][A
Training:   1%|          | 1/91 [00:00<01:22,  1.09it/s][A
Training:   5%|▌         | 5/91 [00:01<00:22,  3.86it/s][A
Training:   8%|▊         | 7/91 [00:01<00:15,  5.52it/s][A
Training:  10%|▉         | 9/91 [00:02<00:17,  4.71it/s][A
Training:  12%|█▏        | 11/91 [00:02<00:12,  6.16it/s][A
Training:  14%|█▍        | 13/91 [00:02<00:13,  5.62it/s][A
Training:  15%|█▌        | 14/91 [00:02<00:12,  5.99it/s][A
Training:  19%|█▊        | 17/91 [00:03<00:11,  6.41it/s][A
Training:  20%|█▉        | 18/91 [00:03<00:11,  6.17it/s][A
Training:  23%|██▎       | 21/91 [00:03<00:11,  6.29it/s][A
Training:  24%|██▍       | 22/91 [00:04<00:11,  5.76it/s][A
Training:  27%|██▋       | 25/91 [00:04<00:11,  5.86it/s][A
Training:  29%|██▊       | 26/91 [00:04<00:10,  6.06it/s][A
Training:  32%|███▏      | 29/91 [00:05<00:09,  6.41it/s][A
Training:  34%|███▍      | 31/91 [00:05<00:07,  7.54it/s][A
Training:  36%|███▋      | 33/91 [00

Epoch: 67/93 - Loss: 0.1760 - Accuracy: 0.9339



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:00<00:10,  1.03it/s][A
 42%|████▏     | 5/12 [00:01<00:01,  3.61it/s][A
100%|██████████| 12/12 [00:02<00:00,  5.06it/s][A
Epochs:  72%|███████▏  | 67/93 [20:02<07:31, 17.38s/it]

Val Loss: 0.2130 - Val Accuracy: 0.9095



Training:   0%|          | 0/91 [00:00<?, ?it/s][A
Training:   1%|          | 1/91 [00:01<01:36,  1.08s/it][A
Training:   5%|▌         | 5/91 [00:01<00:26,  3.30it/s][A
Training:  10%|▉         | 9/91 [00:02<00:18,  4.48it/s][A
Training:  14%|█▍        | 13/91 [00:02<00:15,  5.20it/s][A
Training:  19%|█▊        | 17/91 [00:03<00:12,  5.87it/s][A
Training:  23%|██▎       | 21/91 [00:04<00:11,  6.15it/s][A
Training:  26%|██▋       | 24/91 [00:04<00:08,  7.85it/s][A
Training:  29%|██▊       | 26/91 [00:04<00:10,  6.22it/s][A
Training:  32%|███▏      | 29/91 [00:05<00:10,  5.79it/s][A
Training:  34%|███▍      | 31/91 [00:05<00:08,  6.81it/s][A
Training:  36%|███▋      | 33/91 [00:05<00:09,  6.11it/s][A
Training:  37%|███▋      | 34/91 [00:06<00:09,  6.33it/s][A
Training:  41%|████      | 37/91 [00:06<00:07,  6.92it/s][A
Training:  42%|████▏     | 38/91 [00:06<00:07,  6.96it/s][A
Training:  45%|████▌     | 41/91 [00:07<00:07,  6.80it/s][A
Training:  46%|████▌     | 42/91 [0

Epoch: 68/93 - Loss: 0.1760 - Accuracy: 0.9331



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:00<00:10,  1.04it/s][A
 42%|████▏     | 5/12 [00:01<00:02,  3.46it/s][A
 67%|██████▋   | 8/12 [00:01<00:00,  5.75it/s][A
100%|██████████| 12/12 [00:02<00:00,  5.11it/s][A
Epochs:  73%|███████▎  | 68/93 [20:20<07:14, 17.39s/it]

Val Loss: 0.2114 - Val Accuracy: 0.9123



Training:   0%|          | 0/91 [00:00<?, ?it/s][A
Training:   1%|          | 1/91 [00:01<01:31,  1.01s/it][A
Training:   5%|▌         | 5/91 [00:01<00:24,  3.49it/s][A
Training:  10%|▉         | 9/91 [00:02<00:17,  4.60it/s][A
Training:  14%|█▍        | 13/91 [00:02<00:15,  5.09it/s][A
Training:  16%|█▋        | 15/91 [00:03<00:12,  6.17it/s][A
Training:  19%|█▊        | 17/91 [00:03<00:13,  5.50it/s][A
Training:  20%|█▉        | 18/91 [00:03<00:12,  5.80it/s][A
Training:  23%|██▎       | 21/91 [00:04<00:11,  6.36it/s][A
Training:  24%|██▍       | 22/91 [00:04<00:10,  6.62it/s][A
Training:  27%|██▋       | 25/91 [00:04<00:11,  5.68it/s][A
Training:  31%|███       | 28/91 [00:04<00:07,  7.99it/s][A
Training:  33%|███▎      | 30/91 [00:05<00:09,  6.14it/s][A
Training:  35%|███▌      | 32/91 [00:05<00:08,  7.12it/s][A
Training:  37%|███▋      | 34/91 [00:06<00:09,  5.94it/s][A
Training:  40%|███▉      | 36/91 [00:06<00:07,  7.22it/s][A
Training:  42%|████▏     | 38/91 [0

Epoch: 69/93 - Loss: 0.1757 - Accuracy: 0.9357



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:00<00:10,  1.03it/s][A
 33%|███▎      | 4/12 [00:01<00:01,  4.70it/s][A
 50%|█████     | 6/12 [00:01<00:01,  3.92it/s][A
 75%|███████▌  | 9/12 [00:02<00:00,  4.58it/s][A
100%|██████████| 12/12 [00:02<00:00,  4.98it/s][A
Epochs:  74%|███████▍  | 69/93 [20:37<06:56, 17.35s/it]

Val Loss: 0.2147 - Val Accuracy: 0.9123



Training:   0%|          | 0/91 [00:00<?, ?it/s][A
Training:   1%|          | 1/91 [00:00<01:20,  1.11it/s][A
Training:   4%|▍         | 4/91 [00:01<00:17,  5.04it/s][A
Training:   7%|▋         | 6/91 [00:01<00:20,  4.12it/s][A
Training:  10%|▉         | 9/91 [00:02<00:18,  4.38it/s][A
Training:  13%|█▎        | 12/91 [00:02<00:11,  6.68it/s][A
Training:  15%|█▌        | 14/91 [00:03<00:15,  5.00it/s][A
Training:  19%|█▊        | 17/91 [00:03<00:14,  5.04it/s][A
Training:  23%|██▎       | 21/91 [00:04<00:12,  5.48it/s][A
Training:  27%|██▋       | 25/91 [00:04<00:10,  6.05it/s][A
Training:  31%|███       | 28/91 [00:04<00:08,  7.73it/s][A
Training:  33%|███▎      | 30/91 [00:05<00:09,  6.33it/s][A
Training:  36%|███▋      | 33/91 [00:05<00:09,  6.10it/s][A
Training:  40%|███▉      | 36/91 [00:06<00:06,  7.96it/s][A
Training:  42%|████▏     | 38/91 [00:06<00:08,  6.03it/s][A
Training:  45%|████▌     | 41/91 [00:07<00:08,  5.62it/s][A
Training:  49%|████▉     | 45/91 [00

Epoch: 70/93 - Loss: 0.1755 - Accuracy: 0.9340



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:00<00:10,  1.05it/s][A
 42%|████▏     | 5/12 [00:01<00:01,  3.53it/s][A
100%|██████████| 12/12 [00:02<00:00,  5.19it/s][A
Epochs:  75%|███████▌  | 70/93 [20:54<06:37, 17.29s/it]

Val Loss: 0.2135 - Val Accuracy: 0.9096



Training:   0%|          | 0/91 [00:00<?, ?it/s][A
Training:   1%|          | 1/91 [00:00<01:23,  1.07it/s][A
Training:   4%|▍         | 4/91 [00:01<00:18,  4.83it/s][A
Training:   7%|▋         | 6/91 [00:01<00:20,  4.07it/s][A
Training:  10%|▉         | 9/91 [00:02<00:18,  4.33it/s][A
Training:  14%|█▍        | 13/91 [00:03<00:16,  4.85it/s][A
Training:  18%|█▊        | 16/91 [00:03<00:11,  6.74it/s][A
Training:  20%|█▉        | 18/91 [00:03<00:13,  5.24it/s][A
Training:  23%|██▎       | 21/91 [00:04<00:13,  5.10it/s][A
Training:  27%|██▋       | 25/91 [00:05<00:12,  5.46it/s][A
Training:  32%|███▏      | 29/91 [00:05<00:10,  5.74it/s][A
Training:  36%|███▋      | 33/91 [00:06<00:09,  6.16it/s][A
Training:  41%|████      | 37/91 [00:06<00:08,  6.26it/s][A
Training:  45%|████▌     | 41/91 [00:07<00:08,  6.23it/s][A
Training:  49%|████▉     | 45/91 [00:08<00:07,  6.34it/s][A
Training:  54%|█████▍    | 49/91 [00:08<00:06,  6.75it/s][A
Training:  58%|█████▊    | 53/91 [00

Epoch: 71/93 - Loss: 0.1755 - Accuracy: 0.9344



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:00<00:09,  1.17it/s][A
 25%|██▌       | 3/12 [00:00<00:02,  3.79it/s][A
 42%|████▏     | 5/12 [00:01<00:01,  3.78it/s][A
 58%|█████▊    | 7/12 [00:01<00:00,  5.73it/s][A
100%|██████████| 12/12 [00:02<00:00,  5.15it/s][A
Epochs:  76%|███████▋  | 71/93 [21:12<06:19, 17.26s/it]

Val Loss: 0.2161 - Val Accuracy: 0.9112



Training:   0%|          | 0/91 [00:00<?, ?it/s][A
Training:   1%|          | 1/91 [00:00<01:21,  1.11it/s][A
Training:   5%|▌         | 5/91 [00:01<00:23,  3.66it/s][A
Training:   9%|▉         | 8/91 [00:01<00:13,  6.09it/s][A
Training:  11%|█         | 10/91 [00:02<00:16,  4.86it/s][A
Training:  14%|█▍        | 13/91 [00:02<00:15,  4.88it/s][A
Training:  19%|█▊        | 17/91 [00:03<00:14,  5.18it/s][A
Training:  22%|██▏       | 20/91 [00:03<00:10,  6.96it/s][A
Training:  24%|██▍       | 22/91 [00:04<00:12,  5.50it/s][A
Training:  27%|██▋       | 25/91 [00:04<00:12,  5.28it/s][A
Training:  31%|███       | 28/91 [00:05<00:08,  7.16it/s][A
Training:  33%|███▎      | 30/91 [00:05<00:10,  5.81it/s][A
Training:  36%|███▋      | 33/91 [00:06<00:10,  5.49it/s][A
Training:  41%|████      | 37/91 [00:06<00:09,  5.78it/s][A
Training:  45%|████▌     | 41/91 [00:07<00:08,  6.03it/s][A
Training:  49%|████▉     | 45/91 [00:08<00:07,  6.06it/s][A
Training:  54%|█████▍    | 49/91 [0

Epoch: 72/93 - Loss: 0.1755 - Accuracy: 0.9346



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:00<00:09,  1.19it/s][A
 25%|██▌       | 3/12 [00:00<00:02,  3.76it/s][A
 42%|████▏     | 5/12 [00:01<00:01,  3.78it/s][A
 58%|█████▊    | 7/12 [00:01<00:00,  5.36it/s][A
 75%|███████▌  | 9/12 [00:02<00:00,  4.86it/s][A
100%|██████████| 12/12 [00:02<00:00,  5.13it/s][A
Epochs:  77%|███████▋  | 72/93 [21:29<06:02, 17.27s/it]

Val Loss: 0.2129 - Val Accuracy: 0.9123



Training:   0%|          | 0/91 [00:00<?, ?it/s][A
Training:   1%|          | 1/91 [00:00<01:21,  1.11it/s][A
Training:   5%|▌         | 5/91 [00:01<00:24,  3.54it/s][A
Training:  10%|▉         | 9/91 [00:02<00:18,  4.51it/s][A
Training:  12%|█▏        | 11/91 [00:02<00:13,  5.74it/s][A
Training:  14%|█▍        | 13/91 [00:02<00:15,  4.94it/s][A
Training:  19%|█▊        | 17/91 [00:03<00:13,  5.43it/s][A
Training:  23%|██▎       | 21/91 [00:04<00:12,  5.46it/s][A
Training:  26%|██▋       | 24/91 [00:04<00:09,  7.18it/s][A
Training:  29%|██▊       | 26/91 [00:05<00:11,  5.80it/s][A
Training:  32%|███▏      | 29/91 [00:05<00:11,  5.59it/s][A
Training:  36%|███▋      | 33/91 [00:06<00:10,  5.72it/s][A
Training:  41%|████      | 37/91 [00:06<00:09,  5.69it/s][A
Training:  45%|████▌     | 41/91 [00:07<00:08,  6.14it/s][A
Training:  49%|████▉     | 45/91 [00:08<00:07,  6.09it/s][A
Training:  54%|█████▍    | 49/91 [00:08<00:07,  5.94it/s][A
Training:  58%|█████▊    | 53/91 [0

Epoch: 73/93 - Loss: 0.1752 - Accuracy: 0.9341



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:00<00:09,  1.14it/s][A
 17%|█▋        | 2/12 [00:00<00:04,  2.35it/s][A
 42%|████▏     | 5/12 [00:01<00:01,  3.97it/s][A
 67%|██████▋   | 8/12 [00:01<00:00,  6.92it/s][A
100%|██████████| 12/12 [00:02<00:00,  5.20it/s][A
Epochs:  78%|███████▊  | 73/93 [21:46<05:44, 17.23s/it]

Val Loss: 0.2158 - Val Accuracy: 0.9123



Training:   0%|          | 0/91 [00:00<?, ?it/s][A
Training:   1%|          | 1/91 [00:00<01:26,  1.03it/s][A
Training:   5%|▌         | 5/91 [00:01<00:23,  3.59it/s][A
Training:  10%|▉         | 9/91 [00:02<00:17,  4.71it/s][A
Training:  12%|█▏        | 11/91 [00:02<00:13,  5.91it/s][A
Training:  14%|█▍        | 13/91 [00:02<00:15,  5.08it/s][A
Training:  15%|█▌        | 14/91 [00:03<00:14,  5.44it/s][A
Training:  18%|█▊        | 16/91 [00:03<00:11,  6.54it/s][A
Training:  19%|█▊        | 17/91 [00:03<00:14,  5.07it/s][A
Training:  20%|█▉        | 18/91 [00:03<00:13,  5.52it/s][A
Training:  22%|██▏       | 20/91 [00:03<00:10,  6.73it/s][A
Training:  23%|██▎       | 21/91 [00:04<00:14,  4.83it/s][A
Training:  25%|██▌       | 23/91 [00:04<00:10,  6.40it/s][A
Training:  27%|██▋       | 25/91 [00:04<00:12,  5.21it/s][A
Training:  30%|██▉       | 27/91 [00:05<00:10,  6.26it/s][A
Training:  32%|███▏      | 29/91 [00:05<00:11,  5.25it/s][A
Training:  34%|███▍      | 31/91 [0

Epoch: 74/93 - Loss: 0.1753 - Accuracy: 0.9345



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:00<00:10,  1.04it/s][A
 42%|████▏     | 5/12 [00:01<00:01,  3.58it/s][A
 67%|██████▋   | 8/12 [00:01<00:00,  6.16it/s][A
100%|██████████| 12/12 [00:02<00:00,  4.90it/s][A
Epochs:  80%|███████▉  | 74/93 [22:04<05:29, 17.36s/it]

Val Loss: 0.2139 - Val Accuracy: 0.9096



Training:   0%|          | 0/91 [00:00<?, ?it/s][A
Training:   1%|          | 1/91 [00:00<01:25,  1.05it/s][A
Training:   3%|▎         | 3/91 [00:01<00:25,  3.52it/s][A
Training:   5%|▌         | 5/91 [00:01<00:23,  3.62it/s][A
Training:   9%|▉         | 8/91 [00:01<00:12,  6.55it/s][A
Training:  11%|█         | 10/91 [00:02<00:15,  5.10it/s][A
Training:  14%|█▍        | 13/91 [00:02<00:16,  4.71it/s][A
Training:  19%|█▊        | 17/91 [00:03<00:13,  5.33it/s][A
Training:  22%|██▏       | 20/91 [00:03<00:09,  7.15it/s][A
Training:  24%|██▍       | 22/91 [00:04<00:12,  5.64it/s][A
Training:  27%|██▋       | 25/91 [00:04<00:12,  5.21it/s][A
Training:  32%|███▏      | 29/91 [00:05<00:10,  5.70it/s][A
Training:  36%|███▋      | 33/91 [00:06<00:09,  5.99it/s][A
Training:  40%|███▉      | 36/91 [00:06<00:07,  7.61it/s][A
Training:  42%|████▏     | 38/91 [00:06<00:08,  6.07it/s][A
Training:  45%|████▌     | 41/91 [00:07<00:08,  5.57it/s][A
Training:  48%|████▊     | 44/91 [00

Epoch: 75/93 - Loss: 0.1754 - Accuracy: 0.9345



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:00<00:09,  1.13it/s][A
 42%|████▏     | 5/12 [00:01<00:01,  3.60it/s][A
100%|██████████| 12/12 [00:02<00:00,  5.20it/s][A
Epochs:  81%|████████  | 75/93 [22:21<05:12, 17.36s/it]

Val Loss: 0.2152 - Val Accuracy: 0.9112



Training:   0%|          | 0/91 [00:00<?, ?it/s][A
Training:   1%|          | 1/91 [00:00<01:28,  1.01it/s][A
Training:   5%|▌         | 5/91 [00:01<00:24,  3.48it/s][A
Training:  10%|▉         | 9/91 [00:02<00:18,  4.54it/s][A
Training:  13%|█▎        | 12/91 [00:02<00:12,  6.51it/s][A
Training:  15%|█▌        | 14/91 [00:03<00:14,  5.32it/s][A
Training:  19%|█▊        | 17/91 [00:03<00:14,  5.08it/s][A
Training:  23%|██▎       | 21/91 [00:04<00:12,  5.43it/s][A
Training:  27%|██▋       | 25/91 [00:04<00:11,  5.62it/s][A
Training:  32%|███▏      | 29/91 [00:05<00:11,  5.53it/s][A
Training:  36%|███▋      | 33/91 [00:06<00:10,  5.55it/s][A
Training:  40%|███▉      | 36/91 [00:06<00:07,  6.94it/s][A
Training:  42%|████▏     | 38/91 [00:07<00:09,  5.67it/s][A
Training:  45%|████▌     | 41/91 [00:07<00:09,  5.19it/s][A
Training:  49%|████▉     | 45/91 [00:08<00:08,  5.61it/s][A
Training:  54%|█████▍    | 49/91 [00:09<00:06,  6.15it/s][A
Training:  58%|█████▊    | 53/91 [0

Epoch: 76/93 - Loss: 0.1754 - Accuracy: 0.9342



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:00<00:09,  1.13it/s][A
 33%|███▎      | 4/12 [00:01<00:01,  4.90it/s][A
 50%|█████     | 6/12 [00:01<00:01,  4.32it/s][A
100%|██████████| 12/12 [00:02<00:00,  5.11it/s][A
Epochs:  82%|████████▏ | 76/93 [22:38<04:55, 17.40s/it]

Val Loss: 0.2113 - Val Accuracy: 0.9090



Training:   0%|          | 0/91 [00:00<?, ?it/s][A
Training:   1%|          | 1/91 [00:00<01:27,  1.03it/s][A
Training:   4%|▍         | 4/91 [00:01<00:18,  4.64it/s][A
Training:   7%|▋         | 6/91 [00:01<00:20,  4.13it/s][A
Training:  10%|▉         | 9/91 [00:02<00:18,  4.43it/s][A
Training:  14%|█▍        | 13/91 [00:02<00:15,  5.10it/s][A
Training:  18%|█▊        | 16/91 [00:03<00:10,  7.00it/s][A
Training:  20%|█▉        | 18/91 [00:03<00:12,  5.64it/s][A
Training:  23%|██▎       | 21/91 [00:04<00:13,  5.20it/s][A
Training:  27%|██▋       | 25/91 [00:04<00:12,  5.37it/s][A
Training:  31%|███       | 28/91 [00:05<00:08,  7.10it/s][A
Training:  33%|███▎      | 30/91 [00:05<00:10,  5.83it/s][A
Training:  36%|███▋      | 33/91 [00:06<00:10,  5.56it/s][A
Training:  41%|████      | 37/91 [00:06<00:09,  5.74it/s][A
Training:  45%|████▌     | 41/91 [00:07<00:08,  5.81it/s][A
Training:  49%|████▉     | 45/91 [00:08<00:07,  5.94it/s][A
Training:  54%|█████▍    | 49/91 [00

Epoch: 77/93 - Loss: 0.1757 - Accuracy: 0.9346



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:00<00:08,  1.28it/s][A
 25%|██▌       | 3/12 [00:00<00:02,  4.16it/s][A
 42%|████▏     | 5/12 [00:01<00:01,  3.82it/s][A
100%|██████████| 12/12 [00:02<00:00,  5.45it/s][A
Epochs:  83%|████████▎ | 77/93 [22:56<04:38, 17.41s/it]

Val Loss: 0.2135 - Val Accuracy: 0.9123



Training:   0%|          | 0/91 [00:00<?, ?it/s][A
Training:   1%|          | 1/91 [00:00<01:17,  1.16it/s][A
Training:   3%|▎         | 3/91 [00:00<00:23,  3.79it/s][A
Training:   5%|▌         | 5/91 [00:01<00:24,  3.52it/s][A
Training:   7%|▋         | 6/91 [00:01<00:20,  4.22it/s][A
Training:  10%|▉         | 9/91 [00:02<00:16,  4.83it/s][A
Training:  11%|█         | 10/91 [00:02<00:16,  4.96it/s][A
Training:  14%|█▍        | 13/91 [00:02<00:14,  5.27it/s][A
Training:  15%|█▌        | 14/91 [00:03<00:14,  5.46it/s][A
Training:  19%|█▊        | 17/91 [00:03<00:12,  5.88it/s][A
Training:  20%|█▉        | 18/91 [00:03<00:13,  5.39it/s][A
Training:  23%|██▎       | 21/91 [00:04<00:11,  6.22it/s][A
Training:  24%|██▍       | 22/91 [00:04<00:11,  5.80it/s][A
Training:  27%|██▋       | 25/91 [00:04<00:10,  6.23it/s][A
Training:  29%|██▊       | 26/91 [00:05<00:11,  5.77it/s][A
Training:  32%|███▏      | 29/91 [00:05<00:09,  6.36it/s][A
Training:  33%|███▎      | 30/91 [00:

Epoch: 78/93 - Loss: 0.1756 - Accuracy: 0.9338



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:00<00:08,  1.25it/s][A
 42%|████▏     | 5/12 [00:01<00:01,  3.97it/s][A
100%|██████████| 12/12 [00:02<00:00,  5.64it/s][A
Epochs:  84%|████████▍ | 78/93 [23:13<04:21, 17.41s/it]

Val Loss: 0.2146 - Val Accuracy: 0.9101



Training:   0%|          | 0/91 [00:00<?, ?it/s][A
Training:   1%|          | 1/91 [00:00<01:25,  1.05it/s][A
Training:   3%|▎         | 3/91 [00:01<00:26,  3.35it/s][A
Training:   5%|▌         | 5/91 [00:01<00:22,  3.84it/s][A
Training:   7%|▋         | 6/91 [00:01<00:18,  4.57it/s][A
Training:   8%|▊         | 7/91 [00:01<00:16,  5.12it/s][A
Training:  10%|▉         | 9/91 [00:02<00:16,  5.06it/s][A
Training:  12%|█▏        | 11/91 [00:02<00:13,  5.96it/s][A
Training:  14%|█▍        | 13/91 [00:02<00:15,  5.20it/s][A
Training:  16%|█▋        | 15/91 [00:03<00:11,  6.49it/s][A
Training:  19%|█▊        | 17/91 [00:03<00:14,  5.10it/s][A
Training:  23%|██▎       | 21/91 [00:04<00:12,  5.56it/s][A
Training:  25%|██▌       | 23/91 [00:04<00:10,  6.72it/s][A
Training:  27%|██▋       | 25/91 [00:04<00:12,  5.43it/s][A
Training:  31%|███       | 28/91 [00:05<00:08,  7.66it/s][A
Training:  33%|███▎      | 30/91 [00:05<00:10,  5.56it/s][A
Training:  36%|███▋      | 33/91 [00:0

Epoch: 79/93 - Loss: 0.1753 - Accuracy: 0.9344



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:00<00:10,  1.10it/s][A
 42%|████▏     | 5/12 [00:01<00:01,  3.61it/s][A
100%|██████████| 12/12 [00:02<00:00,  5.42it/s][A
Epochs:  85%|████████▍ | 79/93 [23:31<04:04, 17.45s/it]

Val Loss: 0.2131 - Val Accuracy: 0.9074



Training:   0%|          | 0/91 [00:00<?, ?it/s][A
Training:   1%|          | 1/91 [00:00<01:22,  1.10it/s][A
Training:   4%|▍         | 4/91 [00:01<00:18,  4.83it/s][A
Training:   7%|▋         | 6/91 [00:01<00:21,  4.03it/s][A
Training:  10%|▉         | 9/91 [00:02<00:18,  4.33it/s][A
Training:  14%|█▍        | 13/91 [00:02<00:15,  4.99it/s][A
Training:  19%|█▊        | 17/91 [00:03<00:14,  5.23it/s][A
Training:  23%|██▎       | 21/91 [00:04<00:12,  5.68it/s][A
Training:  27%|██▋       | 25/91 [00:04<00:11,  5.88it/s][A
Training:  31%|███       | 28/91 [00:05<00:08,  7.49it/s][A
Training:  33%|███▎      | 30/91 [00:05<00:10,  5.93it/s][A
Training:  36%|███▋      | 33/91 [00:06<00:10,  5.60it/s][A
Training:  41%|████      | 37/91 [00:06<00:09,  5.62it/s][A
Training:  44%|████▍     | 40/91 [00:07<00:07,  7.23it/s][A
Training:  46%|████▌     | 42/91 [00:07<00:08,  6.01it/s][A
Training:  49%|████▉     | 45/91 [00:08<00:08,  5.34it/s][A
Training:  53%|█████▎    | 48/91 [00

Epoch: 80/93 - Loss: 0.1753 - Accuracy: 0.9345



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:00<00:09,  1.14it/s][A
 25%|██▌       | 3/12 [00:01<00:02,  3.67it/s][A
 42%|████▏     | 5/12 [00:01<00:01,  3.88it/s][A
 50%|█████     | 6/12 [00:01<00:01,  4.47it/s][A
100%|██████████| 12/12 [00:02<00:00,  5.40it/s][A
Epochs:  86%|████████▌ | 80/93 [23:48<03:47, 17.47s/it]

Val Loss: 0.2113 - Val Accuracy: 0.9112



Training:   0%|          | 0/91 [00:00<?, ?it/s][A
Training:   1%|          | 1/91 [00:00<01:11,  1.25it/s][A
Training:   3%|▎         | 3/91 [00:00<00:21,  4.06it/s][A
Training:   5%|▌         | 5/91 [00:01<00:23,  3.59it/s][A
Training:   7%|▋         | 6/91 [00:01<00:20,  4.12it/s][A
Training:  10%|▉         | 9/91 [00:02<00:17,  4.78it/s][A
Training:  11%|█         | 10/91 [00:02<00:16,  5.00it/s][A
Training:  14%|█▍        | 13/91 [00:02<00:14,  5.40it/s][A
Training:  16%|█▋        | 15/91 [00:03<00:11,  6.65it/s][A
Training:  19%|█▊        | 17/91 [00:03<00:14,  5.28it/s][A
Training:  22%|██▏       | 20/91 [00:03<00:09,  7.74it/s][A
Training:  24%|██▍       | 22/91 [00:04<00:12,  5.73it/s][A
Training:  26%|██▋       | 24/91 [00:04<00:09,  6.82it/s][A
Training:  29%|██▊       | 26/91 [00:04<00:11,  5.60it/s][A
Training:  31%|███       | 28/91 [00:05<00:09,  6.96it/s][A
Training:  33%|███▎      | 30/91 [00:05<00:11,  5.50it/s][A
Training:  35%|███▌      | 32/91 [00:

Epoch: 81/93 - Loss: 0.1754 - Accuracy: 0.9345



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:00<00:09,  1.21it/s][A
 42%|████▏     | 5/12 [00:01<00:01,  3.91it/s][A
 58%|█████▊    | 7/12 [00:01<00:00,  5.45it/s][A
 75%|███████▌  | 9/12 [00:02<00:00,  4.95it/s][A
100%|██████████| 12/12 [00:02<00:00,  5.21it/s][A
Epochs:  87%|████████▋ | 81/93 [24:06<03:30, 17.56s/it]

Val Loss: 0.2138 - Val Accuracy: 0.9101



Training:   0%|          | 0/91 [00:00<?, ?it/s][A
Training:   1%|          | 1/91 [00:00<01:17,  1.17it/s][A
Training:   5%|▌         | 5/91 [00:01<00:21,  3.92it/s][A
Training:  10%|▉         | 9/91 [00:02<00:16,  4.92it/s][A
Training:  13%|█▎        | 12/91 [00:02<00:11,  7.06it/s][A
Training:  15%|█▌        | 14/91 [00:02<00:14,  5.31it/s][A
Training:  19%|█▊        | 17/91 [00:03<00:14,  5.21it/s][A
Training:  22%|██▏       | 20/91 [00:03<00:09,  7.15it/s][A
Training:  24%|██▍       | 22/91 [00:04<00:12,  5.33it/s][A
Training:  27%|██▋       | 25/91 [00:04<00:12,  5.19it/s][A
Training:  32%|███▏      | 29/91 [00:05<00:11,  5.59it/s][A
Training:  36%|███▋      | 33/91 [00:06<00:10,  5.72it/s][A
Training:  38%|███▊      | 35/91 [00:06<00:08,  6.53it/s][A
Training:  41%|████      | 37/91 [00:06<00:09,  5.55it/s][A
Training:  44%|████▍     | 40/91 [00:06<00:06,  7.51it/s][A
Training:  46%|████▌     | 42/91 [00:07<00:08,  5.63it/s][A
Training:  49%|████▉     | 45/91 [0

Epoch: 82/93 - Loss: 0.1750 - Accuracy: 0.9348



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:00<00:08,  1.23it/s][A
 42%|████▏     | 5/12 [00:01<00:01,  3.96it/s][A
100%|██████████| 12/12 [00:02<00:00,  5.53it/s][A
Epochs:  88%|████████▊ | 82/93 [24:24<03:13, 17.58s/it]

Val Loss: 0.2116 - Val Accuracy: 0.9068



Training:   0%|          | 0/91 [00:00<?, ?it/s][A
Training:   1%|          | 1/91 [00:00<01:29,  1.01it/s][A
Training:   5%|▌         | 5/91 [00:01<00:22,  3.82it/s][A
Training:  10%|▉         | 9/91 [00:02<00:17,  4.77it/s][A
Training:  14%|█▍        | 13/91 [00:02<00:15,  5.17it/s][A
Training:  19%|█▊        | 17/91 [00:03<00:13,  5.43it/s][A
Training:  22%|██▏       | 20/91 [00:03<00:10,  7.03it/s][A
Training:  24%|██▍       | 22/91 [00:04<00:12,  5.69it/s][A
Training:  27%|██▋       | 25/91 [00:04<00:12,  5.40it/s][A
Training:  32%|███▏      | 29/91 [00:05<00:10,  5.72it/s][A
Training:  36%|███▋      | 33/91 [00:06<00:09,  5.91it/s][A
Training:  38%|███▊      | 35/91 [00:06<00:08,  6.73it/s][A
Training:  41%|████      | 37/91 [00:06<00:09,  5.80it/s][A
Training:  43%|████▎     | 39/91 [00:06<00:07,  6.73it/s][A
Training:  45%|████▌     | 41/91 [00:07<00:09,  5.48it/s][A
Training:  48%|████▊     | 44/91 [00:07<00:06,  7.71it/s][A
Training:  51%|█████     | 46/91 [0

Epoch: 83/93 - Loss: 0.1750 - Accuracy: 0.9345



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:00<00:09,  1.15it/s][A
 42%|████▏     | 5/12 [00:01<00:01,  3.92it/s][A
100%|██████████| 12/12 [00:02<00:00,  5.56it/s][A
Epochs:  89%|████████▉ | 83/93 [24:41<02:55, 17.59s/it]

Val Loss: 0.2171 - Val Accuracy: 0.9123



Training:   0%|          | 0/91 [00:00<?, ?it/s][A
Training:   1%|          | 1/91 [00:00<01:19,  1.13it/s][A
Training:   5%|▌         | 5/91 [00:01<00:21,  3.93it/s][A
Training:   8%|▊         | 7/91 [00:01<00:15,  5.55it/s][A
Training:  10%|▉         | 9/91 [00:02<00:16,  5.03it/s][A
Training:  13%|█▎        | 12/91 [00:02<00:10,  7.60it/s][A
Training:  15%|█▌        | 14/91 [00:02<00:13,  5.52it/s][A
Training:  19%|█▊        | 17/91 [00:03<00:13,  5.43it/s][A
Training:  20%|█▉        | 18/91 [00:03<00:13,  5.45it/s][A
Training:  23%|██▎       | 21/91 [00:04<00:12,  5.70it/s][A
Training:  24%|██▍       | 22/91 [00:04<00:12,  5.68it/s][A
Training:  27%|██▋       | 25/91 [00:04<00:11,  5.86it/s][A
Training:  29%|██▊       | 26/91 [00:04<00:11,  5.87it/s][A
Training:  32%|███▏      | 29/91 [00:05<00:10,  5.98it/s][A
Training:  33%|███▎      | 30/91 [00:05<00:09,  6.19it/s][A
Training:  36%|███▋      | 33/91 [00:06<00:09,  5.94it/s][A
Training:  37%|███▋      | 34/91 [00

Epoch: 84/93 - Loss: 0.1755 - Accuracy: 0.9350



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:00<00:10,  1.08it/s][A
 33%|███▎      | 4/12 [00:01<00:01,  4.91it/s][A
 50%|█████     | 6/12 [00:01<00:01,  4.52it/s][A
 67%|██████▋   | 8/12 [00:01<00:00,  6.10it/s][A
100%|██████████| 12/12 [00:02<00:00,  5.52it/s][A
Epochs:  90%|█████████ | 84/93 [24:59<02:37, 17.49s/it]

Val Loss: 0.2146 - Val Accuracy: 0.9112



Training:   0%|          | 0/91 [00:00<?, ?it/s][A
Training:   1%|          | 1/91 [00:00<01:16,  1.18it/s][A
Training:   2%|▏         | 2/91 [00:00<00:36,  2.42it/s][A
Training:   5%|▌         | 5/91 [00:01<00:21,  3.97it/s][A
Training:   7%|▋         | 6/91 [00:01<00:18,  4.67it/s][A
Training:  10%|▉         | 9/91 [00:02<00:16,  5.07it/s][A
Training:  11%|█         | 10/91 [00:02<00:14,  5.55it/s][A
Training:  14%|█▍        | 13/91 [00:02<00:13,  5.87it/s][A
Training:  16%|█▋        | 15/91 [00:02<00:10,  7.38it/s][A
Training:  19%|█▊        | 17/91 [00:03<00:12,  5.83it/s][A
Training:  20%|█▉        | 18/91 [00:03<00:11,  6.16it/s][A
Training:  23%|██▎       | 21/91 [00:03<00:11,  6.11it/s][A
Training:  24%|██▍       | 22/91 [00:04<00:11,  5.90it/s][A
Training:  27%|██▋       | 25/91 [00:04<00:11,  5.77it/s][A
Training:  29%|██▊       | 26/91 [00:04<00:10,  6.06it/s][A
Training:  32%|███▏      | 29/91 [00:05<00:10,  5.88it/s][A
Training:  33%|███▎      | 30/91 [00:

Epoch: 85/93 - Loss: 0.1753 - Accuracy: 0.9342



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:00<00:09,  1.12it/s][A
 42%|████▏     | 5/12 [00:01<00:01,  3.68it/s][A
100%|██████████| 12/12 [00:02<00:00,  5.28it/s][A
Epochs:  91%|█████████▏| 85/93 [25:16<02:20, 17.54s/it]

Val Loss: 0.2162 - Val Accuracy: 0.9112



Training:   0%|          | 0/91 [00:00<?, ?it/s][A
Training:   1%|          | 1/91 [00:00<01:18,  1.15it/s][A
Training:   4%|▍         | 4/91 [00:00<00:17,  5.08it/s][A
Training:   7%|▋         | 6/91 [00:01<00:20,  4.14it/s][A
Training:  10%|▉         | 9/91 [00:02<00:18,  4.35it/s][A
Training:  14%|█▍        | 13/91 [00:02<00:14,  5.32it/s][A
Training:  19%|█▊        | 17/91 [00:03<00:12,  5.89it/s][A
Training:  23%|██▎       | 21/91 [00:04<00:12,  5.82it/s][A
Training:  26%|██▋       | 24/91 [00:04<00:08,  7.53it/s][A
Training:  29%|██▊       | 26/91 [00:04<00:11,  5.77it/s][A
Training:  32%|███▏      | 29/91 [00:05<00:11,  5.53it/s][A
Training:  35%|███▌      | 32/91 [00:05<00:07,  7.38it/s][A
Training:  37%|███▋      | 34/91 [00:06<00:09,  5.90it/s][A
Training:  40%|███▉      | 36/91 [00:06<00:07,  6.95it/s][A
Training:  42%|████▏     | 38/91 [00:06<00:09,  5.88it/s][A
Training:  45%|████▌     | 41/91 [00:07<00:09,  5.51it/s][A
Training:  49%|████▉     | 45/91 [00

Epoch: 86/93 - Loss: 0.1750 - Accuracy: 0.9341



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:00<00:07,  1.42it/s][A
 42%|████▏     | 5/12 [00:01<00:01,  4.84it/s][A
 67%|██████▋   | 8/12 [00:01<00:00,  8.00it/s][A
100%|██████████| 12/12 [00:01<00:00,  6.68it/s][A
Epochs:  92%|█████████▏| 86/93 [25:32<01:59, 17.06s/it]

Val Loss: 0.2169 - Val Accuracy: 0.9117



Training:   0%|          | 0/91 [00:00<?, ?it/s][A
Training:   1%|          | 1/91 [00:00<00:54,  1.66it/s][A
Training:   5%|▌         | 5/91 [00:01<00:15,  5.58it/s][A
Training:  10%|▉         | 9/91 [00:01<00:12,  6.55it/s][A
Training:  14%|█▍        | 13/91 [00:01<00:10,  7.43it/s][A
Training:  19%|█▊        | 17/91 [00:02<00:09,  8.02it/s][A
Training:  23%|██▎       | 21/91 [00:02<00:08,  8.63it/s][A
Training:  27%|██▋       | 25/91 [00:03<00:07,  8.54it/s][A
Training:  30%|██▉       | 27/91 [00:03<00:06,  9.56it/s][A
Training:  32%|███▏      | 29/91 [00:03<00:07,  8.11it/s][A
Training:  35%|███▌      | 32/91 [00:03<00:05, 10.38it/s][A
Training:  37%|███▋      | 34/91 [00:04<00:06,  8.36it/s][A
Training:  40%|███▉      | 36/91 [00:04<00:05,  9.58it/s][A
Training:  42%|████▏     | 38/91 [00:04<00:06,  7.62it/s][A
Training:  44%|████▍     | 40/91 [00:04<00:05,  9.10it/s][A
Training:  46%|████▌     | 42/91 [00:05<00:06,  7.65it/s][A
Training:  48%|████▊     | 44/91 [0

Epoch: 87/93 - Loss: 0.1751 - Accuracy: 0.9340



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:00<00:07,  1.38it/s][A
 42%|████▏     | 5/12 [00:01<00:01,  4.77it/s][A
100%|██████████| 12/12 [00:01<00:00,  6.84it/s][A
Epochs:  94%|█████████▎| 87/93 [25:45<01:35, 15.88s/it]

Val Loss: 0.2134 - Val Accuracy: 0.9106



Training:   0%|          | 0/91 [00:00<?, ?it/s][A
Training:   1%|          | 1/91 [00:00<00:58,  1.53it/s][A
Training:   5%|▌         | 5/91 [00:01<00:15,  5.38it/s][A
Training:  10%|▉         | 9/91 [00:01<00:12,  6.69it/s][A
Training:  14%|█▍        | 13/91 [00:02<00:10,  7.39it/s][A
Training:  19%|█▊        | 17/91 [00:02<00:09,  7.86it/s][A
Training:  23%|██▎       | 21/91 [00:02<00:08,  8.26it/s][A
Training:  27%|██▋       | 25/91 [00:03<00:07,  8.65it/s][A
Training:  32%|███▏      | 29/91 [00:03<00:07,  8.33it/s][A
Training:  36%|███▋      | 33/91 [00:04<00:07,  7.97it/s][A
Training:  41%|████      | 37/91 [00:04<00:06,  7.94it/s][A
Training:  45%|████▌     | 41/91 [00:05<00:06,  8.00it/s][A
Training:  49%|████▉     | 45/91 [00:05<00:05,  7.99it/s][A
Training:  54%|█████▍    | 49/91 [00:06<00:05,  7.95it/s][A
Training:  58%|█████▊    | 53/91 [00:06<00:04,  7.97it/s][A
Training:  63%|██████▎   | 57/91 [00:07<00:04,  7.98it/s][A
Training:  67%|██████▋   | 61/91 [0

Epoch: 88/93 - Loss: 0.1754 - Accuracy: 0.9350



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:00<00:07,  1.38it/s][A
 42%|████▏     | 5/12 [00:01<00:01,  4.81it/s][A
100%|██████████| 12/12 [00:01<00:00,  6.77it/s][A
Epochs:  95%|█████████▍| 88/93 [25:59<01:15, 15.09s/it]

Val Loss: 0.2143 - Val Accuracy: 0.9096



Training:   0%|          | 0/91 [00:00<?, ?it/s][A
Training:   1%|          | 1/91 [00:00<01:02,  1.44it/s][A
Training:   5%|▌         | 5/91 [00:01<00:17,  5.04it/s][A
Training:  10%|▉         | 9/91 [00:01<00:12,  6.73it/s][A
Training:  14%|█▍        | 13/91 [00:02<00:10,  7.40it/s][A
Training:  19%|█▊        | 17/91 [00:02<00:09,  7.89it/s][A
Training:  23%|██▎       | 21/91 [00:02<00:08,  7.96it/s][A
Training:  27%|██▋       | 25/91 [00:03<00:07,  8.39it/s][A
Training:  32%|███▏      | 29/91 [00:03<00:07,  8.72it/s][A
Training:  36%|███▋      | 33/91 [00:04<00:06,  8.66it/s][A
Training:  41%|████      | 37/91 [00:04<00:06,  8.32it/s][A
Training:  45%|████▌     | 41/91 [00:05<00:06,  8.19it/s][A
Training:  49%|████▉     | 45/91 [00:05<00:05,  8.10it/s][A
Training:  54%|█████▍    | 49/91 [00:06<00:05,  8.12it/s][A
Training:  58%|█████▊    | 53/91 [00:06<00:04,  8.05it/s][A
Training:  63%|██████▎   | 57/91 [00:07<00:04,  8.01it/s][A
Training:  67%|██████▋   | 61/91 [0

Epoch: 89/93 - Loss: 0.1752 - Accuracy: 0.9341



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:00<00:07,  1.44it/s][A
 42%|████▏     | 5/12 [00:01<00:01,  4.71it/s][A
100%|██████████| 12/12 [00:01<00:00,  6.76it/s][A
Epochs:  96%|█████████▌| 89/93 [26:12<00:58, 14.52s/it]

Val Loss: 0.2116 - Val Accuracy: 0.9096



Training:   0%|          | 0/91 [00:00<?, ?it/s][A
Training:   1%|          | 1/91 [00:00<01:10,  1.27it/s][A
Training:   5%|▌         | 5/91 [00:01<00:18,  4.66it/s][A
Training:  10%|▉         | 9/91 [00:01<00:13,  5.90it/s][A
Training:  14%|█▍        | 13/91 [00:02<00:11,  6.99it/s][A
Training:  19%|█▊        | 17/91 [00:02<00:10,  7.40it/s][A
Training:  23%|██▎       | 21/91 [00:03<00:09,  7.52it/s][A
Training:  27%|██▋       | 25/91 [00:03<00:08,  7.88it/s][A
Training:  32%|███▏      | 29/91 [00:04<00:07,  8.26it/s][A
Training:  36%|███▋      | 33/91 [00:04<00:06,  8.42it/s][A
Training:  41%|████      | 37/91 [00:05<00:06,  8.43it/s][A
Training:  45%|████▌     | 41/91 [00:05<00:05,  8.34it/s][A
Training:  49%|████▉     | 45/91 [00:06<00:05,  8.34it/s][A
Training:  54%|█████▍    | 49/91 [00:06<00:05,  8.38it/s][A
Training:  58%|█████▊    | 53/91 [00:06<00:04,  8.29it/s][A
Training:  63%|██████▎   | 57/91 [00:07<00:04,  8.38it/s][A
Training:  67%|██████▋   | 61/91 [0

Epoch: 90/93 - Loss: 0.1756 - Accuracy: 0.9350



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:00<00:07,  1.42it/s][A
 42%|████▏     | 5/12 [00:01<00:01,  4.68it/s][A
100%|██████████| 12/12 [00:01<00:00,  6.78it/s][A
Epochs:  97%|█████████▋| 90/93 [26:25<00:42, 14.14s/it]

Val Loss: 0.2143 - Val Accuracy: 0.9079



Training:   0%|          | 0/91 [00:00<?, ?it/s][A
Training:   1%|          | 1/91 [00:00<01:04,  1.39it/s][A
Training:   5%|▌         | 5/91 [00:01<00:18,  4.77it/s][A
Training:  10%|▉         | 9/91 [00:01<00:13,  6.08it/s][A
Training:  14%|█▍        | 13/91 [00:02<00:10,  7.17it/s][A
Training:  19%|█▊        | 17/91 [00:02<00:09,  7.67it/s][A
Training:  23%|██▎       | 21/91 [00:03<00:08,  8.09it/s][A
Training:  27%|██▋       | 25/91 [00:03<00:08,  8.14it/s][A
Training:  32%|███▏      | 29/91 [00:03<00:07,  8.37it/s][A
Training:  36%|███▋      | 33/91 [00:04<00:06,  8.58it/s][A
Training:  41%|████      | 37/91 [00:04<00:06,  8.44it/s][A
Training:  44%|████▍     | 40/91 [00:05<00:04, 10.29it/s][A
Training:  46%|████▌     | 42/91 [00:05<00:05,  8.30it/s][A
Training:  49%|████▉     | 45/91 [00:05<00:06,  7.60it/s][A
Training:  53%|█████▎    | 48/91 [00:06<00:04,  9.67it/s][A
Training:  55%|█████▍    | 50/91 [00:06<00:05,  7.92it/s][A
Training:  58%|█████▊    | 53/91 [0

Epoch: 91/93 - Loss: 0.1754 - Accuracy: 0.9348



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:00<00:07,  1.39it/s][A
 42%|████▏     | 5/12 [00:01<00:01,  4.67it/s][A
100%|██████████| 12/12 [00:01<00:00,  6.67it/s][A
Epochs:  98%|█████████▊| 91/93 [26:38<00:27, 13.88s/it]

Val Loss: 0.2126 - Val Accuracy: 0.9074



Training:   0%|          | 0/91 [00:00<?, ?it/s][A
Training:   1%|          | 1/91 [00:00<01:04,  1.40it/s][A
Training:   5%|▌         | 5/91 [00:01<00:17,  4.82it/s][A
Training:  10%|▉         | 9/91 [00:01<00:13,  6.13it/s][A
Training:  14%|█▍        | 13/91 [00:02<00:10,  7.17it/s][A
Training:  19%|█▊        | 17/91 [00:02<00:09,  7.74it/s][A
Training:  23%|██▎       | 21/91 [00:03<00:08,  8.06it/s][A
Training:  27%|██▋       | 25/91 [00:03<00:07,  8.26it/s][A
Training:  32%|███▏      | 29/91 [00:03<00:07,  8.42it/s][A
Training:  36%|███▋      | 33/91 [00:04<00:06,  8.44it/s][A
Training:  41%|████      | 37/91 [00:04<00:06,  8.44it/s][A
Training:  45%|████▌     | 41/91 [00:05<00:05,  8.48it/s][A
Training:  49%|████▉     | 45/91 [00:05<00:05,  8.35it/s][A
Training:  54%|█████▍    | 49/91 [00:06<00:05,  8.16it/s][A
Training:  58%|█████▊    | 53/91 [00:06<00:04,  8.22it/s][A
Training:  63%|██████▎   | 57/91 [00:07<00:04,  8.09it/s][A
Training:  67%|██████▋   | 61/91 [0

Epoch: 92/93 - Loss: 0.1755 - Accuracy: 0.9343



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:00<00:07,  1.49it/s][A
 33%|███▎      | 4/12 [00:00<00:01,  6.36it/s][A
 50%|█████     | 6/12 [00:01<00:01,  5.48it/s][A
100%|██████████| 12/12 [00:01<00:00,  6.89it/s][A
Epochs:  99%|█████████▉| 92/93 [26:52<00:13, 13.68s/it]

Val Loss: 0.2129 - Val Accuracy: 0.9112



Training:   0%|          | 0/91 [00:00<?, ?it/s][A
Training:   1%|          | 1/91 [00:00<01:07,  1.33it/s][A
Training:   5%|▌         | 5/91 [00:01<00:18,  4.53it/s][A
Training:  10%|▉         | 9/91 [00:01<00:13,  5.90it/s][A
Training:  14%|█▍        | 13/91 [00:02<00:11,  6.89it/s][A
Training:  19%|█▊        | 17/91 [00:02<00:09,  7.60it/s][A
Training:  23%|██▎       | 21/91 [00:03<00:08,  8.07it/s][A
Training:  27%|██▋       | 25/91 [00:03<00:08,  8.21it/s][A
Training:  32%|███▏      | 29/91 [00:04<00:07,  8.34it/s][A
Training:  36%|███▋      | 33/91 [00:04<00:06,  8.69it/s][A
Training:  41%|████      | 37/91 [00:04<00:06,  8.64it/s][A
Training:  45%|████▌     | 41/91 [00:05<00:05,  8.51it/s][A
Training:  49%|████▉     | 45/91 [00:05<00:05,  8.44it/s][A
Training:  54%|█████▍    | 49/91 [00:06<00:05,  8.21it/s][A
Training:  58%|█████▊    | 53/91 [00:06<00:04,  8.31it/s][A
Training:  63%|██████▎   | 57/91 [00:07<00:04,  8.37it/s][A
Training:  65%|██████▍   | 59/91 [0

Epoch: 93/93 - Loss: 0.1754 - Accuracy: 0.9351



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:00<00:07,  1.41it/s][A
 42%|████▏     | 5/12 [00:01<00:01,  4.71it/s][A
100%|██████████| 12/12 [00:01<00:00,  6.76it/s][A
Epochs: 100%|██████████| 93/93 [27:05<00:00, 17.48s/it]
[32m[I 2023-12-12 00:19:07,321][0m Trial 2 finished with value: 0.9100988507270813 and parameters: {'learning_rate': 7.580753858884148e-05, 'weight_decay': 0.0012623191952287505, 'epsilon': 1.085471414745964e-09, 'batch_size': 154, 'epochs': 93}. Best is trial 0 with value: 0.9175874590873718.[0m


Val Loss: 0.2137 - Val Accuracy: 0.9101
Learning rate: 0.002230137964712427
Weight decay: 0.002429072096567442
Epsilon: 2.1026581349206555e-09
Batch size: 213
Number of epochs: 41


Epochs:   0%|          | 0/41 [00:00<?, ?it/s]
Training:   0%|          | 0/66 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/66 [00:00<01:00,  1.08it/s][A
Training:   8%|▊         | 5/66 [00:01<00:17,  3.56it/s][A
Training:  14%|█▎        | 9/66 [00:02<00:12,  4.72it/s][A
Training:  20%|█▉        | 13/66 [00:02<00:09,  5.30it/s][A
Training:  26%|██▌       | 17/66 [00:03<00:08,  5.54it/s][A
Training:  32%|███▏      | 21/66 [00:04<00:07,  5.93it/s][A
Training:  38%|███▊      | 25/66 [00:04<00:06,  6.04it/s][A
Training:  44%|████▍     | 29/66 [00:05<00:06,  6.00it/s][A
Training:  50%|█████     | 33/66 [00:06<00:05,  6.02it/s][A
Training:  55%|█████▍    | 36/66 [00:06<00:04,  7.48it/s][A
Training:  58%|█████▊    | 38/66 [00:06<00:04,  6.05it/s][A
Training:  62%|██████▏   | 41/66 [00:07<00:04,  5.58it/s][A
Training:  67%|██████▋   | 44/66 [00:07<00:03,  7.07it/s][A
Training:  70%|██████▉   | 46/66 [00:08<00:03,  5.92it/s][A
Training:  73%|███████▎  | 48/66 [00:08<00:02,  6.

Epoch: 1/41 - Loss: 0.2656 - Accuracy: 0.8893



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:00<00:07,  1.08it/s][A
 56%|█████▌    | 5/9 [00:01<00:01,  3.60it/s][A
100%|██████████| 9/9 [00:01<00:00,  5.17it/s][A
Epochs:   2%|▏         | 1/41 [00:13<08:50, 13.26s/it]

Val Loss: 0.2347 - Val Accuracy: 0.9002



Training:   0%|          | 0/66 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/66 [00:00<00:59,  1.09it/s][A
Training:   8%|▊         | 5/66 [00:01<00:17,  3.58it/s][A
Training:  14%|█▎        | 9/66 [00:02<00:11,  4.76it/s][A
Training:  20%|█▉        | 13/66 [00:02<00:09,  5.48it/s][A
Training:  26%|██▌       | 17/66 [00:03<00:08,  5.64it/s][A
Training:  32%|███▏      | 21/66 [00:04<00:07,  5.92it/s][A
Training:  38%|███▊      | 25/66 [00:04<00:06,  6.18it/s][A
Training:  42%|████▏     | 28/66 [00:04<00:04,  7.63it/s][A
Training:  45%|████▌     | 30/66 [00:05<00:06,  5.97it/s][A
Training:  50%|█████     | 33/66 [00:05<00:05,  5.76it/s][A
Training:  52%|█████▏    | 34/66 [00:06<00:05,  6.01it/s][A
Training:  56%|█████▌    | 37/66 [00:06<00:04,  5.80it/s][A
Training:  58%|█████▊    | 38/66 [00:06<00:04,  6.13it/s][A
Training:  62%|██████▏   | 41/66 [00:07<00:04,  5.85it/s][A
Training:  65%|██████▌   | 43/66 [00:07<00:03,  6.89it/s][A
Training:  68%|██████▊   | 45/66 [0

Epoch: 2/41 - Loss: 0.2105 - Accuracy: 0.9207



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:00<00:07,  1.09it/s][A
 56%|█████▌    | 5/9 [00:01<00:01,  3.63it/s][A
100%|██████████| 9/9 [00:01<00:00,  5.18it/s][A
Epochs:   5%|▍         | 2/41 [00:26<08:36, 13.25s/it]

Val Loss: 0.2315 - Val Accuracy: 0.9022



Training:   0%|          | 0/66 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/66 [00:00<01:01,  1.05it/s][A
Training:   8%|▊         | 5/66 [00:01<00:17,  3.50it/s][A
Training:  14%|█▎        | 9/66 [00:02<00:12,  4.64it/s][A
Training:  20%|█▉        | 13/66 [00:02<00:10,  5.24it/s][A
Training:  26%|██▌       | 17/66 [00:03<00:09,  5.44it/s][A
Training:  32%|███▏      | 21/66 [00:04<00:07,  5.85it/s][A
Training:  38%|███▊      | 25/66 [00:04<00:06,  5.97it/s][A
Training:  44%|████▍     | 29/66 [00:05<00:06,  5.78it/s][A
Training:  50%|█████     | 33/66 [00:06<00:05,  5.74it/s][A
Training:  56%|█████▌    | 37/66 [00:06<00:04,  5.86it/s][A
Training:  62%|██████▏   | 41/66 [00:07<00:04,  5.79it/s][A
Training:  68%|██████▊   | 45/66 [00:08<00:03,  5.84it/s][A
Training:  74%|███████▍  | 49/66 [00:09<00:02,  5.78it/s][A
Training:  80%|████████  | 53/66 [00:09<00:02,  5.90it/s][A
Training:  86%|████████▋ | 57/66 [00:10<00:01,  5.83it/s][A
Training:  92%|█████████▏| 61/66 [0

Epoch: 3/41 - Loss: 0.2073 - Accuracy: 0.9205



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:00<00:07,  1.07it/s][A
 56%|█████▌    | 5/9 [00:01<00:01,  3.55it/s][A
100%|██████████| 9/9 [00:01<00:00,  5.09it/s][A
Epochs:   7%|▋         | 3/41 [00:39<08:26, 13.34s/it]

Val Loss: 0.2312 - Val Accuracy: 0.8980



Training:   0%|          | 0/66 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/66 [00:00<00:58,  1.11it/s][A
Training:   8%|▊         | 5/66 [00:01<00:16,  3.66it/s][A
Training:  14%|█▎        | 9/66 [00:02<00:11,  4.87it/s][A
Training:  20%|█▉        | 13/66 [00:02<00:09,  5.44it/s][A
Training:  26%|██▌       | 17/66 [00:03<00:08,  5.61it/s][A
Training:  32%|███▏      | 21/66 [00:04<00:07,  5.91it/s][A
Training:  38%|███▊      | 25/66 [00:04<00:06,  6.09it/s][A
Training:  44%|████▍     | 29/66 [00:05<00:06,  5.94it/s][A
Training:  50%|█████     | 33/66 [00:06<00:05,  5.98it/s][A
Training:  53%|█████▎    | 35/66 [00:06<00:04,  6.86it/s][A
Training:  56%|█████▌    | 37/66 [00:06<00:05,  5.78it/s][A
Training:  58%|█████▊    | 38/66 [00:06<00:04,  5.95it/s][A
Training:  62%|██████▏   | 41/66 [00:07<00:04,  5.81it/s][A
Training:  64%|██████▎   | 42/66 [00:07<00:04,  5.81it/s][A
Training:  68%|██████▊   | 45/66 [00:08<00:03,  5.81it/s][A
Training:  70%|██████▉   | 46/66 [0

Epoch: 4/41 - Loss: 0.2050 - Accuracy: 0.9207



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:00<00:07,  1.08it/s][A
 56%|█████▌    | 5/9 [00:01<00:01,  3.64it/s][A
100%|██████████| 9/9 [00:01<00:00,  5.20it/s][A
Epochs:  10%|▉         | 4/41 [00:53<08:12, 13.30s/it]

Val Loss: 0.2326 - Val Accuracy: 0.8959



Training:   0%|          | 0/66 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/66 [00:00<01:02,  1.04it/s][A
Training:   8%|▊         | 5/66 [00:01<00:17,  3.48it/s][A
Training:  14%|█▎        | 9/66 [00:02<00:12,  4.65it/s][A
Training:  20%|█▉        | 13/66 [00:02<00:10,  5.12it/s][A
Training:  26%|██▌       | 17/66 [00:03<00:08,  5.46it/s][A
Training:  32%|███▏      | 21/66 [00:04<00:07,  5.82it/s][A
Training:  38%|███▊      | 25/66 [00:04<00:06,  6.00it/s][A
Training:  44%|████▍     | 29/66 [00:05<00:06,  5.79it/s][A
Training:  50%|█████     | 33/66 [00:06<00:05,  5.77it/s][A
Training:  56%|█████▌    | 37/66 [00:06<00:04,  5.90it/s][A
Training:  62%|██████▏   | 41/66 [00:07<00:04,  5.92it/s][A
Training:  65%|██████▌   | 43/66 [00:07<00:03,  6.72it/s][A
Training:  68%|██████▊   | 45/66 [00:08<00:03,  5.66it/s][A
Training:  73%|███████▎  | 48/66 [00:08<00:02,  7.51it/s][A
Training:  76%|███████▌  | 50/66 [00:08<00:02,  5.78it/s][A
Training:  80%|████████  | 53/66 [0

Epoch: 5/41 - Loss: 0.2014 - Accuracy: 0.9239



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:00<00:07,  1.10it/s][A
 56%|█████▌    | 5/9 [00:01<00:01,  3.58it/s][A
100%|██████████| 9/9 [00:01<00:00,  5.17it/s][A
Epochs:  12%|█▏        | 5/41 [01:06<08:00, 13.35s/it]

Val Loss: 0.2350 - Val Accuracy: 0.8985



Training:   0%|          | 0/66 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/66 [00:00<01:03,  1.02it/s][A
Training:   8%|▊         | 5/66 [00:01<00:17,  3.53it/s][A
Training:  14%|█▎        | 9/66 [00:02<00:12,  4.68it/s][A
Training:  20%|█▉        | 13/66 [00:02<00:10,  5.20it/s][A
Training:  26%|██▌       | 17/66 [00:03<00:08,  5.54it/s][A
Training:  32%|███▏      | 21/66 [00:04<00:07,  5.90it/s][A
Training:  38%|███▊      | 25/66 [00:04<00:06,  5.89it/s][A
Training:  44%|████▍     | 29/66 [00:05<00:06,  5.84it/s][A
Training:  50%|█████     | 33/66 [00:06<00:05,  5.84it/s][A
Training:  56%|█████▌    | 37/66 [00:06<00:04,  5.82it/s][A
Training:  62%|██████▏   | 41/66 [00:07<00:04,  5.81it/s][A
Training:  68%|██████▊   | 45/66 [00:08<00:03,  5.90it/s][A
Training:  74%|███████▍  | 49/66 [00:08<00:02,  5.87it/s][A
Training:  80%|████████  | 53/66 [00:09<00:02,  5.89it/s][A
Training:  86%|████████▋ | 57/66 [00:10<00:01,  6.00it/s][A
Training:  92%|█████████▏| 61/66 [0

Epoch: 6/41 - Loss: 0.2008 - Accuracy: 0.9256



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:00<00:07,  1.11it/s][A
 56%|█████▌    | 5/9 [00:01<00:01,  3.67it/s][A
100%|██████████| 9/9 [00:01<00:00,  5.21it/s][A
Epochs:  15%|█▍        | 6/41 [01:19<07:47, 13.35s/it]

Val Loss: 0.2221 - Val Accuracy: 0.9059



Training:   0%|          | 0/66 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/66 [00:00<00:58,  1.10it/s][A
Training:   6%|▌         | 4/66 [00:01<00:12,  4.97it/s][A
Training:   9%|▉         | 6/66 [00:01<00:14,  4.22it/s][A
Training:  12%|█▏        | 8/66 [00:01<00:09,  5.98it/s][A
Training:  15%|█▌        | 10/66 [00:02<00:10,  5.11it/s][A
Training:  18%|█▊        | 12/66 [00:02<00:08,  6.44it/s][A
Training:  21%|██        | 14/66 [00:02<00:09,  5.30it/s][A
Training:  23%|██▎       | 15/66 [00:02<00:08,  5.68it/s][A
Training:  26%|██▌       | 17/66 [00:03<00:10,  4.80it/s][A
Training:  30%|███       | 20/66 [00:03<00:06,  7.45it/s][A
Training:  33%|███▎      | 22/66 [00:04<00:07,  5.77it/s][A
Training:  38%|███▊      | 25/66 [00:04<00:07,  5.38it/s][A
Training:  44%|████▍     | 29/66 [00:05<00:06,  5.50it/s][A
Training:  50%|█████     | 33/66 [00:06<00:05,  5.59it/s][A
Training:  56%|█████▌    | 37/66 [00:06<00:05,  5.66it/s][A
Training:  62%|██████▏   | 41/66 [00

Epoch: 7/41 - Loss: 0.1991 - Accuracy: 0.9250



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:00<00:07,  1.11it/s][A
100%|██████████| 9/9 [00:01<00:00,  5.18it/s][A
Epochs:  17%|█▋        | 7/41 [01:33<07:34, 13.36s/it]

Val Loss: 0.2357 - Val Accuracy: 0.8974



Training:   0%|          | 0/66 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/66 [00:00<00:58,  1.11it/s][A
Training:   8%|▊         | 5/66 [00:01<00:17,  3.57it/s][A
Training:  14%|█▎        | 9/66 [00:02<00:11,  4.83it/s][A
Training:  20%|█▉        | 13/66 [00:02<00:10,  5.26it/s][A
Training:  26%|██▌       | 17/66 [00:03<00:08,  5.60it/s][A
Training:  30%|███       | 20/66 [00:03<00:06,  7.30it/s][A
Training:  33%|███▎      | 22/66 [00:04<00:07,  5.95it/s][A
Training:  38%|███▊      | 25/66 [00:04<00:07,  5.64it/s][A
Training:  44%|████▍     | 29/66 [00:05<00:06,  5.72it/s][A
Training:  50%|█████     | 33/66 [00:06<00:05,  5.75it/s][A
Training:  56%|█████▌    | 37/66 [00:06<00:04,  5.81it/s][A
Training:  62%|██████▏   | 41/66 [00:07<00:04,  5.95it/s][A
Training:  67%|██████▋   | 44/66 [00:07<00:02,  7.39it/s][A
Training:  70%|██████▉   | 46/66 [00:08<00:03,  5.81it/s][A
Training:  74%|███████▍  | 49/66 [00:08<00:03,  5.58it/s][A
Training:  77%|███████▋  | 51/66 [0

Epoch: 8/41 - Loss: 0.1955 - Accuracy: 0.9273



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:00<00:07,  1.13it/s][A
 56%|█████▌    | 5/9 [00:01<00:01,  3.85it/s][A
100%|██████████| 9/9 [00:01<00:00,  5.24it/s][A
Epochs:  20%|█▉        | 8/41 [01:46<07:19, 13.32s/it]

Val Loss: 0.2243 - Val Accuracy: 0.9091



Training:   0%|          | 0/66 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/66 [00:00<00:59,  1.10it/s][A
Training:   8%|▊         | 5/66 [00:01<00:16,  3.65it/s][A
Training:  14%|█▎        | 9/66 [00:02<00:12,  4.71it/s][A
Training:  20%|█▉        | 13/66 [00:02<00:09,  5.38it/s][A
Training:  24%|██▍       | 16/66 [00:02<00:06,  7.28it/s][A
Training:  27%|██▋       | 18/66 [00:03<00:08,  5.73it/s][A
Training:  32%|███▏      | 21/66 [00:04<00:08,  5.58it/s][A
Training:  35%|███▍      | 23/66 [00:04<00:06,  6.74it/s][A
Training:  38%|███▊      | 25/66 [00:04<00:07,  5.57it/s][A
Training:  42%|████▏     | 28/66 [00:04<00:04,  7.72it/s][A
Training:  45%|████▌     | 30/66 [00:05<00:06,  5.64it/s][A
Training:  50%|█████     | 33/66 [00:06<00:06,  5.37it/s][A
Training:  53%|█████▎    | 35/66 [00:06<00:04,  6.54it/s][A
Training:  56%|█████▌    | 37/66 [00:06<00:05,  5.22it/s][A
Training:  61%|██████    | 40/66 [00:06<00:03,  7.19it/s][A
Training:  64%|██████▎   | 42/66 [0

Epoch: 9/41 - Loss: 0.1992 - Accuracy: 0.9232



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:00<00:07,  1.13it/s][A
 56%|█████▌    | 5/9 [00:01<00:01,  3.67it/s][A
100%|██████████| 9/9 [00:01<00:00,  5.27it/s][A
Epochs:  22%|██▏       | 9/41 [01:59<07:06, 13.32s/it]

Val Loss: 0.2286 - Val Accuracy: 0.9046



Training:   0%|          | 0/66 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/66 [00:00<00:58,  1.11it/s][A
Training:   8%|▊         | 5/66 [00:01<00:16,  3.67it/s][A
Training:  14%|█▎        | 9/66 [00:02<00:12,  4.73it/s][A
Training:  20%|█▉        | 13/66 [00:02<00:10,  5.20it/s][A
Training:  26%|██▌       | 17/66 [00:03<00:08,  5.49it/s][A
Training:  32%|███▏      | 21/66 [00:04<00:07,  5.77it/s][A
Training:  38%|███▊      | 25/66 [00:04<00:06,  5.95it/s][A
Training:  44%|████▍     | 29/66 [00:05<00:06,  6.05it/s][A
Training:  50%|█████     | 33/66 [00:06<00:05,  6.01it/s][A
Training:  56%|█████▌    | 37/66 [00:06<00:04,  5.98it/s][A
Training:  62%|██████▏   | 41/66 [00:07<00:04,  6.01it/s][A
Training:  68%|██████▊   | 45/66 [00:08<00:03,  6.09it/s][A
Training:  74%|███████▍  | 49/66 [00:08<00:02,  6.11it/s][A
Training:  79%|███████▉  | 52/66 [00:08<00:01,  7.30it/s][A
Training:  80%|████████  | 53/66 [00:09<00:02,  5.51it/s][A
Training:  85%|████████▍ | 56/66 [0

Epoch: 10/41 - Loss: 0.1953 - Accuracy: 0.9260



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:00<00:07,  1.08it/s][A
 56%|█████▌    | 5/9 [00:01<00:01,  3.57it/s][A
100%|██████████| 9/9 [00:01<00:00,  5.08it/s][A
Epochs:  24%|██▍       | 10/41 [02:13<06:53, 13.33s/it]

Val Loss: 0.2389 - Val Accuracy: 0.9039



Training:   0%|          | 0/66 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/66 [00:00<00:58,  1.11it/s][A
Training:   8%|▊         | 5/66 [00:01<00:16,  3.61it/s][A
Training:  14%|█▎        | 9/66 [00:02<00:12,  4.71it/s][A
Training:  20%|█▉        | 13/66 [00:02<00:10,  5.27it/s][A
Training:  26%|██▌       | 17/66 [00:03<00:08,  5.54it/s][A
Training:  32%|███▏      | 21/66 [00:04<00:07,  5.87it/s][A
Training:  38%|███▊      | 25/66 [00:04<00:06,  5.98it/s][A
Training:  44%|████▍     | 29/66 [00:05<00:06,  6.08it/s][A
Training:  47%|████▋     | 31/66 [00:05<00:05,  6.98it/s][A
Training:  50%|█████     | 33/66 [00:06<00:05,  5.74it/s][A
Training:  53%|█████▎    | 35/66 [00:06<00:04,  6.84it/s][A
Training:  56%|█████▌    | 37/66 [00:06<00:05,  5.44it/s][A
Training:  61%|██████    | 40/66 [00:06<00:03,  7.51it/s][A
Training:  64%|██████▎   | 42/66 [00:07<00:04,  5.63it/s][A
Training:  68%|██████▊   | 45/66 [00:08<00:04,  5.24it/s][A
Training:  74%|███████▍  | 49/66 [0

Epoch: 11/41 - Loss: 0.1960 - Accuracy: 0.9263



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:00<00:07,  1.08it/s][A
 56%|█████▌    | 5/9 [00:01<00:01,  3.55it/s][A
100%|██████████| 9/9 [00:01<00:00,  5.08it/s][A
Epochs:  27%|██▋       | 11/41 [02:26<06:40, 13.34s/it]

Val Loss: 0.2306 - Val Accuracy: 0.9001



Training:   0%|          | 0/66 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/66 [00:00<01:00,  1.08it/s][A
Training:   8%|▊         | 5/66 [00:01<00:17,  3.55it/s][A
Training:  14%|█▎        | 9/66 [00:02<00:11,  4.77it/s][A
Training:  20%|█▉        | 13/66 [00:02<00:10,  5.28it/s][A
Training:  26%|██▌       | 17/66 [00:03<00:08,  5.62it/s][A
Training:  32%|███▏      | 21/66 [00:04<00:07,  5.91it/s][A
Training:  38%|███▊      | 25/66 [00:04<00:06,  5.97it/s][A
Training:  44%|████▍     | 29/66 [00:05<00:06,  5.93it/s][A
Training:  50%|█████     | 33/66 [00:06<00:05,  5.96it/s][A
Training:  56%|█████▌    | 37/66 [00:06<00:04,  6.00it/s][A
Training:  61%|██████    | 40/66 [00:06<00:03,  7.43it/s][A
Training:  64%|██████▎   | 42/66 [00:07<00:04,  5.84it/s][A
Training:  68%|██████▊   | 45/66 [00:08<00:03,  5.72it/s][A
Training:  70%|██████▉   | 46/66 [00:08<00:03,  5.95it/s][A
Training:  74%|███████▍  | 49/66 [00:08<00:02,  5.74it/s][A
Training:  76%|███████▌  | 50/66 [0

Epoch: 12/41 - Loss: 0.1956 - Accuracy: 0.9265



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:00<00:07,  1.12it/s][A
 56%|█████▌    | 5/9 [00:01<00:01,  3.65it/s][A
100%|██████████| 9/9 [00:01<00:00,  5.18it/s][A
Epochs:  29%|██▉       | 12/41 [02:39<06:25, 13.31s/it]

Val Loss: 0.2513 - Val Accuracy: 0.9050



Training:   0%|          | 0/66 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/66 [00:00<00:59,  1.08it/s][A
Training:   8%|▊         | 5/66 [00:01<00:16,  3.66it/s][A
Training:  14%|█▎        | 9/66 [00:02<00:11,  4.88it/s][A
Training:  20%|█▉        | 13/66 [00:02<00:09,  5.42it/s][A
Training:  26%|██▌       | 17/66 [00:03<00:08,  5.70it/s][A
Training:  32%|███▏      | 21/66 [00:04<00:07,  5.97it/s][A
Training:  38%|███▊      | 25/66 [00:04<00:06,  6.13it/s][A
Training:  42%|████▏     | 28/66 [00:04<00:04,  7.73it/s][A
Training:  45%|████▌     | 30/66 [00:05<00:05,  6.14it/s][A
Training:  50%|█████     | 33/66 [00:06<00:05,  5.52it/s][A
Training:  56%|█████▌    | 37/66 [00:06<00:05,  5.65it/s][A
Training:  62%|██████▏   | 41/66 [00:07<00:04,  5.83it/s][A
Training:  67%|██████▋   | 44/66 [00:07<00:02,  7.40it/s][A
Training:  70%|██████▉   | 46/66 [00:08<00:03,  5.92it/s][A
Training:  74%|███████▍  | 49/66 [00:08<00:03,  5.39it/s][A
Training:  79%|███████▉  | 52/66 [0

Epoch: 13/41 - Loss: 0.1958 - Accuracy: 0.9266



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:00<00:07,  1.13it/s][A
 56%|█████▌    | 5/9 [00:01<00:01,  3.64it/s][A
100%|██████████| 9/9 [00:01<00:00,  5.16it/s][A
Epochs:  32%|███▏      | 13/41 [02:53<06:12, 13.30s/it]

Val Loss: 0.2470 - Val Accuracy: 0.9039



Training:   0%|          | 0/66 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/66 [00:00<00:58,  1.10it/s][A
Training:   8%|▊         | 5/66 [00:01<00:16,  3.64it/s][A
Training:  14%|█▎        | 9/66 [00:02<00:12,  4.64it/s][A
Training:  20%|█▉        | 13/66 [00:02<00:10,  5.21it/s][A
Training:  26%|██▌       | 17/66 [00:03<00:08,  5.51it/s][A
Training:  32%|███▏      | 21/66 [00:04<00:07,  5.87it/s][A
Training:  38%|███▊      | 25/66 [00:04<00:06,  5.88it/s][A
Training:  44%|████▍     | 29/66 [00:05<00:06,  5.73it/s][A
Training:  50%|█████     | 33/66 [00:06<00:05,  5.74it/s][A
Training:  56%|█████▌    | 37/66 [00:06<00:05,  5.65it/s][A
Training:  62%|██████▏   | 41/66 [00:07<00:04,  5.75it/s][A
Training:  68%|██████▊   | 45/66 [00:08<00:03,  5.83it/s][A
Training:  74%|███████▍  | 49/66 [00:08<00:02,  5.83it/s][A
Training:  80%|████████  | 53/66 [00:09<00:02,  5.82it/s][A
Training:  86%|████████▋ | 57/66 [00:10<00:01,  5.85it/s][A
Training:  92%|█████████▏| 61/66 [0

Epoch: 14/41 - Loss: 0.1961 - Accuracy: 0.9257



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:00<00:07,  1.11it/s][A
100%|██████████| 9/9 [00:01<00:00,  5.14it/s][A
Epochs:  34%|███▍      | 14/41 [03:06<06:00, 13.34s/it]

Val Loss: 0.2284 - Val Accuracy: 0.9023



Training:   0%|          | 0/66 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/66 [00:00<01:03,  1.02it/s][A
Training:   8%|▊         | 5/66 [00:01<00:17,  3.56it/s][A
Training:  11%|█         | 7/66 [00:01<00:11,  5.10it/s][A
Training:  14%|█▎        | 9/66 [00:02<00:12,  4.70it/s][A
Training:  17%|█▋        | 11/66 [00:02<00:08,  6.15it/s][A
Training:  20%|█▉        | 13/66 [00:02<00:10,  4.99it/s][A
Training:  23%|██▎       | 15/66 [00:03<00:07,  6.43it/s][A
Training:  26%|██▌       | 17/66 [00:03<00:09,  5.23it/s][A
Training:  30%|███       | 20/66 [00:03<00:05,  7.68it/s][A
Training:  33%|███▎      | 22/66 [00:04<00:07,  5.80it/s][A
Training:  38%|███▊      | 25/66 [00:04<00:07,  5.48it/s][A
Training:  41%|████      | 27/66 [00:04<00:05,  6.64it/s][A
Training:  44%|████▍     | 29/66 [00:05<00:06,  5.36it/s][A
Training:  45%|████▌     | 30/66 [00:05<00:06,  5.76it/s][A
Training:  50%|█████     | 33/66 [00:06<00:05,  5.57it/s][A
Training:  52%|█████▏    | 34/66 [00

Epoch: 15/41 - Loss: 0.1923 - Accuracy: 0.9284



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:00<00:07,  1.13it/s][A
 56%|█████▌    | 5/9 [00:01<00:01,  3.70it/s][A
100%|██████████| 9/9 [00:01<00:00,  5.34it/s][A
Epochs:  37%|███▋      | 15/41 [03:19<05:46, 13.34s/it]

Val Loss: 0.2187 - Val Accuracy: 0.9091



Training:   0%|          | 0/66 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/66 [00:00<00:57,  1.12it/s][A
Training:   8%|▊         | 5/66 [00:01<00:16,  3.73it/s][A
Training:   9%|▉         | 6/66 [00:01<00:13,  4.30it/s][A
Training:  14%|█▎        | 9/66 [00:02<00:11,  4.90it/s][A
Training:  18%|█▊        | 12/66 [00:02<00:07,  7.41it/s][A
Training:  21%|██        | 14/66 [00:02<00:09,  5.48it/s][A
Training:  26%|██▌       | 17/66 [00:03<00:09,  5.35it/s][A
Training:  27%|██▋       | 18/66 [00:03<00:08,  5.74it/s][A
Training:  32%|███▏      | 21/66 [00:04<00:07,  5.72it/s][A
Training:  36%|███▋      | 24/66 [00:04<00:05,  8.05it/s][A
Training:  39%|███▉      | 26/66 [00:04<00:06,  5.81it/s][A
Training:  44%|████▍     | 29/66 [00:05<00:06,  5.42it/s][A
Training:  50%|█████     | 33/66 [00:06<00:05,  5.61it/s][A
Training:  56%|█████▌    | 37/66 [00:06<00:05,  5.76it/s][A
Training:  62%|██████▏   | 41/66 [00:07<00:04,  5.91it/s][A
Training:  68%|██████▊   | 45/66 [00

Epoch: 16/41 - Loss: 0.1993 - Accuracy: 0.9260



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:00<00:07,  1.08it/s][A
 56%|█████▌    | 5/9 [00:01<00:01,  3.61it/s][A
100%|██████████| 9/9 [00:01<00:00,  5.11it/s][A
Epochs:  39%|███▉      | 16/41 [03:33<05:32, 13.32s/it]

Val Loss: 0.2283 - Val Accuracy: 0.9001



Training:   0%|          | 0/66 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/66 [00:00<00:57,  1.13it/s][A
Training:   8%|▊         | 5/66 [00:01<00:17,  3.59it/s][A
Training:  14%|█▎        | 9/66 [00:02<00:11,  4.81it/s][A
Training:  20%|█▉        | 13/66 [00:02<00:09,  5.37it/s][A
Training:  26%|██▌       | 17/66 [00:03<00:08,  5.59it/s][A
Training:  32%|███▏      | 21/66 [00:04<00:07,  5.82it/s][A
Training:  38%|███▊      | 25/66 [00:04<00:06,  5.99it/s][A
Training:  44%|████▍     | 29/66 [00:05<00:06,  5.94it/s][A
Training:  50%|█████     | 33/66 [00:06<00:05,  5.92it/s][A
Training:  56%|█████▌    | 37/66 [00:06<00:04,  5.92it/s][A
Training:  62%|██████▏   | 41/66 [00:07<00:04,  5.97it/s][A
Training:  68%|██████▊   | 45/66 [00:08<00:03,  5.86it/s][A
Training:  74%|███████▍  | 49/66 [00:08<00:02,  5.90it/s][A
Training:  80%|████████  | 53/66 [00:09<00:02,  5.92it/s][A
Training:  86%|████████▋ | 57/66 [00:10<00:01,  5.90it/s][A
Training:  92%|█████████▏| 61/66 [0

Epoch: 17/41 - Loss: 0.1957 - Accuracy: 0.9252



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:00<00:07,  1.09it/s][A
 56%|█████▌    | 5/9 [00:01<00:01,  3.69it/s][A
100%|██████████| 9/9 [00:01<00:00,  5.25it/s][A
Epochs:  41%|████▏     | 17/41 [03:46<05:19, 13.30s/it]

Val Loss: 0.2244 - Val Accuracy: 0.9172



Training:   0%|          | 0/66 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/66 [00:00<00:57,  1.13it/s][A
Training:   8%|▊         | 5/66 [00:01<00:17,  3.58it/s][A
Training:  14%|█▎        | 9/66 [00:02<00:12,  4.70it/s][A
Training:  20%|█▉        | 13/66 [00:02<00:10,  5.30it/s][A
Training:  26%|██▌       | 17/66 [00:03<00:08,  5.46it/s][A
Training:  32%|███▏      | 21/66 [00:04<00:07,  5.79it/s][A
Training:  38%|███▊      | 25/66 [00:04<00:06,  6.00it/s][A
Training:  44%|████▍     | 29/66 [00:05<00:06,  5.94it/s][A
Training:  50%|█████     | 33/66 [00:06<00:05,  5.90it/s][A
Training:  56%|█████▌    | 37/66 [00:06<00:04,  5.96it/s][A
Training:  62%|██████▏   | 41/66 [00:07<00:04,  5.96it/s][A
Training:  68%|██████▊   | 45/66 [00:08<00:03,  5.75it/s][A
Training:  74%|███████▍  | 49/66 [00:08<00:02,  5.78it/s][A
Training:  80%|████████  | 53/66 [00:09<00:02,  5.86it/s][A
Training:  86%|████████▋ | 57/66 [00:10<00:01,  5.74it/s][A
Training:  92%|█████████▏| 61/66 [0

Epoch: 18/41 - Loss: 0.1926 - Accuracy: 0.9292



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:00<00:07,  1.10it/s][A
 56%|█████▌    | 5/9 [00:01<00:01,  3.67it/s][A
100%|██████████| 9/9 [00:01<00:00,  5.22it/s][A
Epochs:  44%|████▍     | 18/41 [03:59<05:06, 13.32s/it]

Val Loss: 0.2384 - Val Accuracy: 0.9008



Training:   0%|          | 0/66 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/66 [00:00<00:59,  1.09it/s][A
Training:   8%|▊         | 5/66 [00:01<00:17,  3.51it/s][A
Training:  14%|█▎        | 9/66 [00:02<00:12,  4.73it/s][A
Training:  20%|█▉        | 13/66 [00:02<00:09,  5.40it/s][A
Training:  26%|██▌       | 17/66 [00:03<00:08,  5.53it/s][A
Training:  32%|███▏      | 21/66 [00:04<00:07,  5.80it/s][A
Training:  38%|███▊      | 25/66 [00:04<00:06,  6.04it/s][A
Training:  44%|████▍     | 29/66 [00:05<00:06,  6.13it/s][A
Training:  50%|█████     | 33/66 [00:06<00:05,  6.12it/s][A
Training:  55%|█████▍    | 36/66 [00:06<00:03,  7.64it/s][A
Training:  58%|█████▊    | 38/66 [00:06<00:04,  5.96it/s][A
Training:  62%|██████▏   | 41/66 [00:07<00:04,  5.46it/s][A
Training:  68%|██████▊   | 45/66 [00:08<00:03,  5.55it/s][A
Training:  74%|███████▍  | 49/66 [00:08<00:03,  5.66it/s][A
Training:  80%|████████  | 53/66 [00:09<00:02,  5.78it/s][A
Training:  86%|████████▋ | 57/66 [0

Epoch: 19/41 - Loss: 0.1955 - Accuracy: 0.9254



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:00<00:07,  1.05it/s][A
 56%|█████▌    | 5/9 [00:01<00:01,  3.63it/s][A
100%|██████████| 9/9 [00:01<00:00,  5.21it/s][A
Epochs:  46%|████▋     | 19/41 [04:13<04:52, 13.31s/it]

Val Loss: 0.2443 - Val Accuracy: 0.9032



Training:   0%|          | 0/66 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/66 [00:00<00:59,  1.09it/s][A
Training:   8%|▊         | 5/66 [00:01<00:17,  3.55it/s][A
Training:  14%|█▎        | 9/66 [00:02<00:12,  4.63it/s][A
Training:  20%|█▉        | 13/66 [00:02<00:10,  5.23it/s][A
Training:  26%|██▌       | 17/66 [00:03<00:08,  5.49it/s][A
Training:  32%|███▏      | 21/66 [00:04<00:07,  5.80it/s][A
Training:  38%|███▊      | 25/66 [00:04<00:06,  5.96it/s][A
Training:  44%|████▍     | 29/66 [00:05<00:06,  5.95it/s][A
Training:  50%|█████     | 33/66 [00:06<00:05,  5.88it/s][A
Training:  56%|█████▌    | 37/66 [00:06<00:04,  6.03it/s][A
Training:  62%|██████▏   | 41/66 [00:07<00:04,  6.00it/s][A
Training:  65%|██████▌   | 43/66 [00:07<00:03,  6.85it/s][A
Training:  68%|██████▊   | 45/66 [00:08<00:03,  5.66it/s][A
Training:  71%|███████   | 47/66 [00:08<00:02,  6.70it/s][A
Training:  74%|███████▍  | 49/66 [00:08<00:03,  5.56it/s][A
Training:  76%|███████▌  | 50/66 [0

Epoch: 20/41 - Loss: 0.1916 - Accuracy: 0.9262



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:00<00:07,  1.06it/s][A
 56%|█████▌    | 5/9 [00:01<00:01,  3.57it/s][A
100%|██████████| 9/9 [00:01<00:00,  5.07it/s][A
Epochs:  49%|████▉     | 20/41 [04:26<04:40, 13.34s/it]

Val Loss: 0.2356 - Val Accuracy: 0.9043



Training:   0%|          | 0/66 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/66 [00:00<01:00,  1.08it/s][A
Training:   8%|▊         | 5/66 [00:01<00:17,  3.50it/s][A
Training:  14%|█▎        | 9/66 [00:02<00:12,  4.68it/s][A
Training:  20%|█▉        | 13/66 [00:02<00:10,  5.25it/s][A
Training:  26%|██▌       | 17/66 [00:03<00:08,  5.52it/s][A
Training:  32%|███▏      | 21/66 [00:04<00:07,  5.84it/s][A
Training:  38%|███▊      | 25/66 [00:04<00:06,  6.13it/s][A
Training:  41%|████      | 27/66 [00:04<00:05,  7.05it/s][A
Training:  44%|████▍     | 29/66 [00:05<00:06,  5.72it/s][A
Training:  45%|████▌     | 30/66 [00:05<00:06,  5.94it/s][A
Training:  50%|█████     | 33/66 [00:06<00:05,  5.80it/s][A
Training:  52%|█████▏    | 34/66 [00:06<00:05,  5.76it/s][A
Training:  56%|█████▌    | 37/66 [00:06<00:04,  6.00it/s][A
Training:  58%|█████▊    | 38/66 [00:06<00:04,  5.89it/s][A
Training:  62%|██████▏   | 41/66 [00:07<00:04,  5.81it/s][A
Training:  64%|██████▎   | 42/66 [0

Epoch: 21/41 - Loss: 0.1927 - Accuracy: 0.9273



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:00<00:07,  1.04it/s][A
 56%|█████▌    | 5/9 [00:01<00:01,  3.47it/s][A
100%|██████████| 9/9 [00:01<00:00,  4.98it/s][A
Epochs:  51%|█████     | 21/41 [04:39<04:27, 13.36s/it]

Val Loss: 0.2378 - Val Accuracy: 0.9001



Training:   0%|          | 0/66 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/66 [00:00<01:00,  1.07it/s][A
Training:   8%|▊         | 5/66 [00:01<00:17,  3.48it/s][A
Training:  14%|█▎        | 9/66 [00:02<00:12,  4.63it/s][A
Training:  20%|█▉        | 13/66 [00:02<00:10,  5.17it/s][A
Training:  26%|██▌       | 17/66 [00:03<00:09,  5.37it/s][A
Training:  32%|███▏      | 21/66 [00:04<00:07,  5.74it/s][A
Training:  38%|███▊      | 25/66 [00:04<00:06,  5.90it/s][A
Training:  44%|████▍     | 29/66 [00:05<00:06,  5.94it/s][A
Training:  50%|█████     | 33/66 [00:06<00:05,  5.97it/s][A
Training:  56%|█████▌    | 37/66 [00:06<00:04,  5.96it/s][A
Training:  62%|██████▏   | 41/66 [00:07<00:04,  5.93it/s][A
Training:  68%|██████▊   | 45/66 [00:08<00:03,  6.00it/s][A
Training:  74%|███████▍  | 49/66 [00:08<00:02,  5.92it/s][A
Training:  80%|████████  | 53/66 [00:09<00:02,  5.97it/s][A
Training:  86%|████████▋ | 57/66 [00:10<00:01,  5.99it/s][A
Training:  89%|████████▉ | 59/66 [0

Epoch: 22/41 - Loss: 0.1970 - Accuracy: 0.9274



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:00<00:07,  1.05it/s][A
 56%|█████▌    | 5/9 [00:01<00:01,  3.51it/s][A
100%|██████████| 9/9 [00:01<00:00,  4.98it/s][A
Epochs:  54%|█████▎    | 22/41 [04:53<04:14, 13.37s/it]

Val Loss: 0.2235 - Val Accuracy: 0.9141



Training:   0%|          | 0/66 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/66 [00:00<01:00,  1.07it/s][A
Training:   8%|▊         | 5/66 [00:01<00:17,  3.50it/s][A
Training:  14%|█▎        | 9/66 [00:02<00:11,  4.77it/s][A
Training:  20%|█▉        | 13/66 [00:02<00:10,  5.28it/s][A
Training:  26%|██▌       | 17/66 [00:03<00:08,  5.54it/s][A
Training:  32%|███▏      | 21/66 [00:04<00:07,  5.81it/s][A
Training:  38%|███▊      | 25/66 [00:04<00:06,  5.95it/s][A
Training:  44%|████▍     | 29/66 [00:05<00:06,  6.08it/s][A
Training:  50%|█████     | 33/66 [00:06<00:05,  6.01it/s][A
Training:  56%|█████▌    | 37/66 [00:06<00:04,  6.03it/s][A
Training:  62%|██████▏   | 41/66 [00:07<00:04,  5.86it/s][A
Training:  68%|██████▊   | 45/66 [00:08<00:03,  5.86it/s][A
Training:  74%|███████▍  | 49/66 [00:08<00:02,  5.82it/s][A
Training:  80%|████████  | 53/66 [00:09<00:02,  5.75it/s][A
Training:  86%|████████▋ | 57/66 [00:10<00:01,  5.83it/s][A
Training:  92%|█████████▏| 61/66 [0

Epoch: 23/41 - Loss: 0.1945 - Accuracy: 0.9267



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:00<00:07,  1.06it/s][A
100%|██████████| 9/9 [00:01<00:00,  5.23it/s][A
Epochs:  56%|█████▌    | 23/41 [05:06<04:00, 13.35s/it]

Val Loss: 0.2198 - Val Accuracy: 0.9073



Training:   0%|          | 0/66 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/66 [00:00<01:04,  1.02it/s][A
Training:   8%|▊         | 5/66 [00:01<00:18,  3.35it/s][A
Training:  14%|█▎        | 9/66 [00:02<00:12,  4.67it/s][A
Training:  20%|█▉        | 13/66 [00:02<00:10,  5.25it/s][A
Training:  26%|██▌       | 17/66 [00:03<00:08,  5.49it/s][A
Training:  32%|███▏      | 21/66 [00:04<00:07,  5.76it/s][A
Training:  38%|███▊      | 25/66 [00:04<00:06,  6.03it/s][A
Training:  44%|████▍     | 29/66 [00:05<00:06,  6.02it/s][A
Training:  45%|████▌     | 30/66 [00:05<00:05,  6.24it/s][A
Training:  50%|█████     | 33/66 [00:06<00:05,  6.07it/s][A
Training:  52%|█████▏    | 34/66 [00:06<00:05,  6.24it/s][A
Training:  56%|█████▌    | 37/66 [00:06<00:04,  5.93it/s][A
Training:  58%|█████▊    | 38/66 [00:06<00:04,  6.06it/s][A
Training:  62%|██████▏   | 41/66 [00:07<00:04,  5.72it/s][A
Training:  65%|██████▌   | 43/66 [00:07<00:03,  6.98it/s][A
Training:  68%|██████▊   | 45/66 [0

Epoch: 24/41 - Loss: 0.1913 - Accuracy: 0.9296



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:00<00:07,  1.10it/s][A
 56%|█████▌    | 5/9 [00:01<00:01,  3.60it/s][A
100%|██████████| 9/9 [00:01<00:00,  5.15it/s][A
Epochs:  59%|█████▊    | 24/41 [05:20<03:47, 13.38s/it]

Val Loss: 0.2294 - Val Accuracy: 0.9087



Training:   0%|          | 0/66 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/66 [00:00<01:01,  1.05it/s][A
Training:   8%|▊         | 5/66 [00:01<00:16,  3.67it/s][A
Training:  14%|█▎        | 9/66 [00:02<00:11,  4.84it/s][A
Training:  20%|█▉        | 13/66 [00:02<00:10,  5.28it/s][A
Training:  26%|██▌       | 17/66 [00:03<00:08,  5.56it/s][A
Training:  32%|███▏      | 21/66 [00:04<00:07,  5.91it/s][A
Training:  38%|███▊      | 25/66 [00:04<00:06,  5.89it/s][A
Training:  44%|████▍     | 29/66 [00:05<00:06,  5.89it/s][A
Training:  50%|█████     | 33/66 [00:06<00:05,  6.00it/s][A
Training:  56%|█████▌    | 37/66 [00:06<00:04,  6.05it/s][A
Training:  62%|██████▏   | 41/66 [00:07<00:04,  5.97it/s][A
Training:  68%|██████▊   | 45/66 [00:08<00:03,  5.95it/s][A
Training:  74%|███████▍  | 49/66 [00:08<00:02,  5.96it/s][A
Training:  80%|████████  | 53/66 [00:09<00:02,  5.90it/s][A
Training:  86%|████████▋ | 57/66 [00:10<00:01,  5.93it/s][A
Training:  92%|█████████▏| 61/66 [0

Epoch: 25/41 - Loss: 0.1924 - Accuracy: 0.9288



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:00<00:07,  1.10it/s][A
 56%|█████▌    | 5/9 [00:01<00:01,  3.58it/s][A
100%|██████████| 9/9 [00:01<00:00,  5.15it/s][A
Epochs:  61%|██████    | 25/41 [05:33<03:33, 13.34s/it]

Val Loss: 0.2312 - Val Accuracy: 0.8998



Training:   0%|          | 0/66 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/66 [00:00<00:58,  1.11it/s][A
Training:   6%|▌         | 4/66 [00:01<00:12,  4.97it/s][A
Training:   9%|▉         | 6/66 [00:01<00:14,  4.09it/s][A
Training:  14%|█▎        | 9/66 [00:02<00:12,  4.48it/s][A
Training:  17%|█▋        | 11/66 [00:02<00:09,  5.70it/s][A
Training:  20%|█▉        | 13/66 [00:02<00:10,  5.02it/s][A
Training:  23%|██▎       | 15/66 [00:02<00:08,  6.32it/s][A
Training:  26%|██▌       | 17/66 [00:03<00:09,  5.32it/s][A
Training:  29%|██▉       | 19/66 [00:03<00:07,  6.51it/s][A
Training:  32%|███▏      | 21/66 [00:04<00:08,  5.61it/s][A
Training:  35%|███▍      | 23/66 [00:04<00:06,  6.81it/s][A
Training:  38%|███▊      | 25/66 [00:04<00:07,  5.76it/s][A
Training:  41%|████      | 27/66 [00:04<00:05,  6.78it/s][A
Training:  44%|████▍     | 29/66 [00:05<00:06,  5.47it/s][A
Training:  47%|████▋     | 31/66 [00:05<00:05,  6.63it/s][A
Training:  50%|█████     | 33/66 [00

Epoch: 26/41 - Loss: 0.1947 - Accuracy: 0.9289



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:00<00:07,  1.12it/s][A
 56%|█████▌    | 5/9 [00:01<00:01,  3.70it/s][A
100%|██████████| 9/9 [00:01<00:00,  5.27it/s][A
Epochs:  63%|██████▎   | 26/41 [05:46<03:19, 13.33s/it]

Val Loss: 0.2258 - Val Accuracy: 0.9028



Training:   0%|          | 0/66 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/66 [00:00<00:59,  1.08it/s][A
Training:   8%|▊         | 5/66 [00:01<00:17,  3.58it/s][A
Training:  14%|█▎        | 9/66 [00:02<00:12,  4.67it/s][A
Training:  20%|█▉        | 13/66 [00:02<00:10,  5.29it/s][A
Training:  26%|██▌       | 17/66 [00:03<00:08,  5.65it/s][A
Training:  32%|███▏      | 21/66 [00:04<00:07,  5.96it/s][A
Training:  38%|███▊      | 25/66 [00:04<00:06,  6.13it/s][A
Training:  44%|████▍     | 29/66 [00:05<00:06,  6.10it/s][A
Training:  50%|█████     | 33/66 [00:06<00:05,  5.97it/s][A
Training:  56%|█████▌    | 37/66 [00:06<00:04,  5.95it/s][A
Training:  62%|██████▏   | 41/66 [00:07<00:04,  5.87it/s][A
Training:  68%|██████▊   | 45/66 [00:08<00:03,  5.90it/s][A
Training:  74%|███████▍  | 49/66 [00:08<00:02,  5.84it/s][A
Training:  79%|███████▉  | 52/66 [00:08<00:01,  7.27it/s][A
Training:  82%|████████▏ | 54/66 [00:09<00:02,  5.70it/s][A
Training:  86%|████████▋ | 57/66 [0

Epoch: 27/41 - Loss: 0.1903 - Accuracy: 0.9294



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:00<00:07,  1.13it/s][A
 56%|█████▌    | 5/9 [00:01<00:01,  3.75it/s][A
100%|██████████| 9/9 [00:01<00:00,  5.27it/s][A
Epochs:  66%|██████▌   | 27/41 [05:59<03:06, 13.32s/it]

Val Loss: 0.2351 - Val Accuracy: 0.8991



Training:   0%|          | 0/66 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/66 [00:00<00:59,  1.09it/s][A
Training:   8%|▊         | 5/66 [00:01<00:17,  3.59it/s][A
Training:  14%|█▎        | 9/66 [00:02<00:12,  4.60it/s][A
Training:  20%|█▉        | 13/66 [00:02<00:09,  5.32it/s][A
Training:  26%|██▌       | 17/66 [00:03<00:08,  5.60it/s][A
Training:  32%|███▏      | 21/66 [00:04<00:07,  5.82it/s][A
Training:  38%|███▊      | 25/66 [00:04<00:06,  5.98it/s][A
Training:  44%|████▍     | 29/66 [00:05<00:06,  5.95it/s][A
Training:  50%|█████     | 33/66 [00:06<00:05,  5.97it/s][A
Training:  56%|█████▌    | 37/66 [00:06<00:04,  5.94it/s][A
Training:  62%|██████▏   | 41/66 [00:07<00:04,  5.91it/s][A
Training:  68%|██████▊   | 45/66 [00:08<00:03,  5.88it/s][A
Training:  74%|███████▍  | 49/66 [00:08<00:02,  5.84it/s][A
Training:  80%|████████  | 53/66 [00:09<00:02,  5.81it/s][A
Training:  86%|████████▋ | 57/66 [00:10<00:01,  5.76it/s][A
Training:  92%|█████████▏| 61/66 [0

Epoch: 28/41 - Loss: 0.1919 - Accuracy: 0.9268



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:00<00:07,  1.07it/s][A
 56%|█████▌    | 5/9 [00:01<00:01,  3.57it/s][A
100%|██████████| 9/9 [00:01<00:00,  5.07it/s][A
Epochs:  68%|██████▊   | 28/41 [06:13<02:53, 13.35s/it]

Val Loss: 0.2537 - Val Accuracy: 0.8961



Training:   0%|          | 0/66 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/66 [00:00<00:59,  1.10it/s][A
Training:   8%|▊         | 5/66 [00:01<00:17,  3.54it/s][A
Training:  14%|█▎        | 9/66 [00:02<00:12,  4.69it/s][A
Training:  18%|█▊        | 12/66 [00:02<00:07,  6.76it/s][A
Training:  21%|██        | 14/66 [00:02<00:09,  5.41it/s][A
Training:  26%|██▌       | 17/66 [00:03<00:09,  5.24it/s][A
Training:  32%|███▏      | 21/66 [00:04<00:07,  5.74it/s][A
Training:  38%|███▊      | 25/66 [00:04<00:06,  6.03it/s][A
Training:  42%|████▏     | 28/66 [00:04<00:04,  7.66it/s][A
Training:  45%|████▌     | 30/66 [00:05<00:05,  6.00it/s][A
Training:  50%|█████     | 33/66 [00:06<00:06,  5.39it/s][A
Training:  56%|█████▌    | 37/66 [00:06<00:05,  5.57it/s][A
Training:  62%|██████▏   | 41/66 [00:07<00:04,  5.66it/s][A
Training:  68%|██████▊   | 45/66 [00:08<00:03,  5.78it/s][A
Training:  74%|███████▍  | 49/66 [00:08<00:02,  5.77it/s][A
Training:  80%|████████  | 53/66 [0

Epoch: 29/41 - Loss: 0.1922 - Accuracy: 0.9274



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:00<00:07,  1.11it/s][A
 56%|█████▌    | 5/9 [00:01<00:01,  3.54it/s][A
100%|██████████| 9/9 [00:01<00:00,  5.12it/s][A
Epochs:  71%|███████   | 29/41 [06:26<02:40, 13.37s/it]

Val Loss: 0.2358 - Val Accuracy: 0.8970



Training:   0%|          | 0/66 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/66 [00:00<00:56,  1.16it/s][A
Training:   8%|▊         | 5/66 [00:01<00:15,  3.83it/s][A
Training:  11%|█         | 7/66 [00:01<00:10,  5.41it/s][A
Training:  14%|█▎        | 9/66 [00:02<00:11,  4.83it/s][A
Training:  17%|█▋        | 11/66 [00:02<00:08,  6.18it/s][A
Training:  20%|█▉        | 13/66 [00:02<00:10,  5.23it/s][A
Training:  23%|██▎       | 15/66 [00:02<00:08,  6.37it/s][A
Training:  26%|██▌       | 17/66 [00:03<00:09,  5.22it/s][A
Training:  29%|██▉       | 19/66 [00:03<00:06,  6.73it/s][A
Training:  32%|███▏      | 21/66 [00:04<00:08,  5.56it/s][A
Training:  36%|███▋      | 24/66 [00:04<00:05,  7.97it/s][A
Training:  39%|███▉      | 26/66 [00:04<00:06,  6.09it/s][A
Training:  42%|████▏     | 28/66 [00:04<00:05,  7.29it/s][A
Training:  45%|████▌     | 30/66 [00:05<00:06,  5.75it/s][A
Training:  47%|████▋     | 31/66 [00:05<00:05,  5.97it/s][A
Training:  50%|█████     | 33/66 [00

Epoch: 30/41 - Loss: 0.1915 - Accuracy: 0.9287



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:00<00:07,  1.10it/s][A
 56%|█████▌    | 5/9 [00:01<00:01,  3.60it/s][A
100%|██████████| 9/9 [00:01<00:00,  5.18it/s][A
Epochs:  73%|███████▎  | 30/41 [06:40<02:26, 13.35s/it]

Val Loss: 0.2285 - Val Accuracy: 0.9049



Training:   0%|          | 0/66 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/66 [00:00<01:00,  1.08it/s][A
Training:   8%|▊         | 5/66 [00:01<00:17,  3.54it/s][A
Training:  14%|█▎        | 9/66 [00:02<00:12,  4.73it/s][A
Training:  20%|█▉        | 13/66 [00:02<00:09,  5.40it/s][A
Training:  26%|██▌       | 17/66 [00:03<00:08,  5.69it/s][A
Training:  32%|███▏      | 21/66 [00:04<00:07,  6.06it/s][A
Training:  38%|███▊      | 25/66 [00:04<00:06,  6.20it/s][A
Training:  41%|████      | 27/66 [00:04<00:05,  7.13it/s][A
Training:  44%|████▍     | 29/66 [00:05<00:06,  5.95it/s][A
Training:  45%|████▌     | 30/66 [00:05<00:05,  6.22it/s][A
Training:  50%|█████     | 33/66 [00:05<00:05,  5.92it/s][A
Training:  52%|█████▏    | 34/66 [00:06<00:05,  6.14it/s][A
Training:  56%|█████▌    | 37/66 [00:06<00:05,  5.73it/s][A
Training:  58%|█████▊    | 38/66 [00:06<00:04,  6.01it/s][A
Training:  62%|██████▏   | 41/66 [00:07<00:04,  5.80it/s][A
Training:  64%|██████▎   | 42/66 [0

Epoch: 31/41 - Loss: 0.1912 - Accuracy: 0.9271



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:00<00:07,  1.10it/s][A
 56%|█████▌    | 5/9 [00:01<00:01,  3.56it/s][A
100%|██████████| 9/9 [00:01<00:00,  5.11it/s][A
Epochs:  76%|███████▌  | 31/41 [06:53<02:13, 13.32s/it]

Val Loss: 0.2444 - Val Accuracy: 0.9066



Training:   0%|          | 0/66 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/66 [00:00<01:01,  1.06it/s][A
Training:   8%|▊         | 5/66 [00:01<00:16,  3.60it/s][A
Training:  14%|█▎        | 9/66 [00:02<00:12,  4.62it/s][A
Training:  20%|█▉        | 13/66 [00:02<00:09,  5.34it/s][A
Training:  26%|██▌       | 17/66 [00:03<00:08,  5.58it/s][A
Training:  32%|███▏      | 21/66 [00:04<00:07,  5.82it/s][A
Training:  38%|███▊      | 25/66 [00:04<00:06,  5.87it/s][A
Training:  44%|████▍     | 29/66 [00:05<00:06,  5.78it/s][A
Training:  50%|█████     | 33/66 [00:06<00:05,  5.84it/s][A
Training:  56%|█████▌    | 37/66 [00:06<00:05,  5.79it/s][A
Training:  61%|██████    | 40/66 [00:07<00:03,  7.23it/s][A
Training:  64%|██████▎   | 42/66 [00:07<00:04,  5.77it/s][A
Training:  68%|██████▊   | 45/66 [00:08<00:03,  5.48it/s][A
Training:  73%|███████▎  | 48/66 [00:08<00:02,  7.13it/s][A
Training:  76%|███████▌  | 50/66 [00:09<00:02,  5.59it/s][A
Training:  80%|████████  | 53/66 [0

Epoch: 32/41 - Loss: 0.1931 - Accuracy: 0.9277



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:00<00:07,  1.09it/s][A
 56%|█████▌    | 5/9 [00:01<00:01,  3.57it/s][A
100%|██████████| 9/9 [00:01<00:00,  5.16it/s][A
Epochs:  78%|███████▊  | 32/41 [07:06<02:00, 13.39s/it]

Val Loss: 0.2338 - Val Accuracy: 0.9071



Training:   0%|          | 0/66 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/66 [00:00<01:01,  1.06it/s][A
Training:   8%|▊         | 5/66 [00:01<00:17,  3.54it/s][A
Training:  11%|█         | 7/66 [00:01<00:11,  5.04it/s][A
Training:  14%|█▎        | 9/66 [00:02<00:12,  4.54it/s][A
Training:  18%|█▊        | 12/66 [00:02<00:07,  7.05it/s][A
Training:  21%|██        | 14/66 [00:02<00:09,  5.36it/s][A
Training:  26%|██▌       | 17/66 [00:03<00:09,  5.22it/s][A
Training:  30%|███       | 20/66 [00:03<00:06,  7.30it/s][A
Training:  33%|███▎      | 22/66 [00:04<00:07,  5.74it/s][A
Training:  38%|███▊      | 25/66 [00:04<00:07,  5.52it/s][A
Training:  42%|████▏     | 28/66 [00:04<00:05,  7.43it/s][A
Training:  45%|████▌     | 30/66 [00:05<00:06,  5.71it/s][A
Training:  50%|█████     | 33/66 [00:06<00:06,  5.29it/s][A
Training:  55%|█████▍    | 36/66 [00:06<00:04,  7.18it/s][A
Training:  58%|█████▊    | 38/66 [00:06<00:05,  5.44it/s][A
Training:  62%|██████▏   | 41/66 [00

Epoch: 33/41 - Loss: 0.1934 - Accuracy: 0.9290



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:00<00:07,  1.11it/s][A
 56%|█████▌    | 5/9 [00:01<00:01,  3.50it/s][A
100%|██████████| 9/9 [00:01<00:00,  5.10it/s][A
Epochs:  80%|████████  | 33/41 [07:20<01:47, 13.42s/it]

Val Loss: 0.2279 - Val Accuracy: 0.9016



Training:   0%|          | 0/66 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/66 [00:00<00:58,  1.10it/s][A
Training:   8%|▊         | 5/66 [00:01<00:17,  3.54it/s][A
Training:  14%|█▎        | 9/66 [00:02<00:12,  4.68it/s][A
Training:  20%|█▉        | 13/66 [00:02<00:10,  5.27it/s][A
Training:  26%|██▌       | 17/66 [00:03<00:08,  5.57it/s][A
Training:  32%|███▏      | 21/66 [00:04<00:07,  5.87it/s][A
Training:  38%|███▊      | 25/66 [00:04<00:06,  5.93it/s][A
Training:  44%|████▍     | 29/66 [00:05<00:06,  5.89it/s][A
Training:  50%|█████     | 33/66 [00:06<00:05,  5.83it/s][A
Training:  56%|█████▌    | 37/66 [00:06<00:05,  5.79it/s][A
Training:  62%|██████▏   | 41/66 [00:07<00:04,  5.94it/s][A
Training:  68%|██████▊   | 45/66 [00:08<00:03,  5.90it/s][A
Training:  73%|███████▎  | 48/66 [00:08<00:02,  7.29it/s][A
Training:  76%|███████▌  | 50/66 [00:08<00:02,  6.05it/s][A
Training:  79%|███████▉  | 52/66 [00:09<00:01,  7.02it/s][A
Training:  82%|████████▏ | 54/66 [0

Epoch: 34/41 - Loss: 0.1896 - Accuracy: 0.9274



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:00<00:07,  1.07it/s][A
100%|██████████| 9/9 [00:01<00:00,  5.18it/s][A
Epochs:  83%|████████▎ | 34/41 [07:33<01:33, 13.41s/it]

Val Loss: 0.2394 - Val Accuracy: 0.9037



Training:   0%|          | 0/66 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/66 [00:00<00:57,  1.13it/s][A
Training:   6%|▌         | 4/66 [00:01<00:12,  4.96it/s][A
Training:   9%|▉         | 6/66 [00:01<00:14,  4.24it/s][A
Training:  14%|█▎        | 9/66 [00:02<00:12,  4.67it/s][A
Training:  18%|█▊        | 12/66 [00:02<00:07,  7.07it/s][A
Training:  21%|██        | 14/66 [00:02<00:09,  5.37it/s][A
Training:  26%|██▌       | 17/66 [00:03<00:09,  5.14it/s][A
Training:  32%|███▏      | 21/66 [00:04<00:08,  5.58it/s][A
Training:  38%|███▊      | 25/66 [00:04<00:06,  5.86it/s][A
Training:  42%|████▏     | 28/66 [00:04<00:04,  7.61it/s][A
Training:  45%|████▌     | 30/66 [00:05<00:06,  5.76it/s][A
Training:  50%|█████     | 33/66 [00:06<00:06,  5.46it/s][A
Training:  56%|█████▌    | 37/66 [00:06<00:05,  5.57it/s][A
Training:  62%|██████▏   | 41/66 [00:07<00:04,  5.69it/s][A
Training:  68%|██████▊   | 45/66 [00:08<00:03,  5.70it/s][A
Training:  74%|███████▍  | 49/66 [00

Epoch: 35/41 - Loss: 0.1913 - Accuracy: 0.9289



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:00<00:07,  1.11it/s][A
 56%|█████▌    | 5/9 [00:01<00:01,  3.59it/s][A
100%|██████████| 9/9 [00:01<00:00,  5.14it/s][A
Epochs:  85%|████████▌ | 35/41 [07:47<01:20, 13.39s/it]

Val Loss: 0.2240 - Val Accuracy: 0.9080



Training:   0%|          | 0/66 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/66 [00:00<00:58,  1.12it/s][A
Training:   8%|▊         | 5/66 [00:01<00:17,  3.57it/s][A
Training:  14%|█▎        | 9/66 [00:02<00:11,  4.80it/s][A
Training:  20%|█▉        | 13/66 [00:02<00:09,  5.41it/s][A
Training:  26%|██▌       | 17/66 [00:03<00:08,  5.52it/s][A
Training:  32%|███▏      | 21/66 [00:04<00:07,  5.87it/s][A
Training:  38%|███▊      | 25/66 [00:04<00:06,  6.10it/s][A
Training:  42%|████▏     | 28/66 [00:04<00:04,  7.64it/s][A
Training:  45%|████▌     | 30/66 [00:05<00:06,  5.77it/s][A
Training:  50%|█████     | 33/66 [00:06<00:06,  5.50it/s][A
Training:  53%|█████▎    | 35/66 [00:06<00:04,  6.56it/s][A
Training:  56%|█████▌    | 37/66 [00:06<00:05,  5.33it/s][A
Training:  59%|█████▉    | 39/66 [00:06<00:04,  6.50it/s][A
Training:  62%|██████▏   | 41/66 [00:07<00:04,  5.34it/s][A
Training:  65%|██████▌   | 43/66 [00:07<00:03,  6.60it/s][A
Training:  68%|██████▊   | 45/66 [0

Epoch: 36/41 - Loss: 0.1930 - Accuracy: 0.9266



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:00<00:07,  1.10it/s][A
 56%|█████▌    | 5/9 [00:01<00:01,  3.66it/s][A
100%|██████████| 9/9 [00:01<00:00,  5.21it/s][A
Epochs:  88%|████████▊ | 36/41 [08:00<01:06, 13.38s/it]

Val Loss: 0.2381 - Val Accuracy: 0.9033



Training:   0%|          | 0/66 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/66 [00:00<00:58,  1.10it/s][A
Training:   8%|▊         | 5/66 [00:01<00:17,  3.58it/s][A
Training:  14%|█▎        | 9/66 [00:02<00:12,  4.74it/s][A
Training:  18%|█▊        | 12/66 [00:02<00:08,  6.71it/s][A
Training:  21%|██        | 14/66 [00:02<00:09,  5.48it/s][A
Training:  26%|██▌       | 17/66 [00:03<00:09,  5.24it/s][A
Training:  30%|███       | 20/66 [00:03<00:06,  7.12it/s][A
Training:  33%|███▎      | 22/66 [00:04<00:07,  5.89it/s][A
Training:  38%|███▊      | 25/66 [00:04<00:07,  5.35it/s][A
Training:  44%|████▍     | 29/66 [00:05<00:06,  5.54it/s][A
Training:  50%|█████     | 33/66 [00:06<00:05,  5.65it/s][A
Training:  56%|█████▌    | 37/66 [00:06<00:05,  5.79it/s][A
Training:  61%|██████    | 40/66 [00:06<00:03,  7.34it/s][A
Training:  64%|██████▎   | 42/66 [00:07<00:04,  5.90it/s][A
Training:  67%|██████▋   | 44/66 [00:07<00:03,  6.95it/s][A
Training:  70%|██████▉   | 46/66 [0

Epoch: 37/41 - Loss: 0.1915 - Accuracy: 0.9267



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:00<00:07,  1.07it/s][A
 56%|█████▌    | 5/9 [00:01<00:01,  3.56it/s][A
100%|██████████| 9/9 [00:01<00:00,  5.12it/s][A
Epochs:  90%|█████████ | 37/41 [08:13<00:53, 13.38s/it]

Val Loss: 0.2235 - Val Accuracy: 0.9092



Training:   0%|          | 0/66 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/66 [00:00<00:59,  1.09it/s][A
Training:   8%|▊         | 5/66 [00:01<00:17,  3.55it/s][A
Training:  14%|█▎        | 9/66 [00:02<00:11,  4.77it/s][A
Training:  20%|█▉        | 13/66 [00:02<00:09,  5.30it/s][A
Training:  26%|██▌       | 17/66 [00:03<00:08,  5.67it/s][A
Training:  32%|███▏      | 21/66 [00:04<00:07,  5.85it/s][A
Training:  38%|███▊      | 25/66 [00:04<00:06,  5.96it/s][A
Training:  44%|████▍     | 29/66 [00:05<00:06,  5.92it/s][A
Training:  50%|█████     | 33/66 [00:06<00:05,  5.98it/s][A
Training:  56%|█████▌    | 37/66 [00:06<00:04,  5.95it/s][A
Training:  62%|██████▏   | 41/66 [00:07<00:04,  5.92it/s][A
Training:  68%|██████▊   | 45/66 [00:08<00:03,  5.94it/s][A
Training:  74%|███████▍  | 49/66 [00:08<00:02,  5.87it/s][A
Training:  80%|████████  | 53/66 [00:09<00:02,  5.92it/s][A
Training:  86%|████████▋ | 57/66 [00:10<00:01,  5.85it/s][A
Training:  92%|█████████▏| 61/66 [0

Epoch: 38/41 - Loss: 0.1904 - Accuracy: 0.9291



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:00<00:07,  1.10it/s][A
 56%|█████▌    | 5/9 [00:01<00:01,  3.59it/s][A
100%|██████████| 9/9 [00:01<00:00,  5.15it/s][A
Epochs:  93%|█████████▎| 38/41 [08:27<00:40, 13.37s/it]

Val Loss: 0.2332 - Val Accuracy: 0.9032



Training:   0%|          | 0/66 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/66 [00:00<01:02,  1.03it/s][A
Training:   8%|▊         | 5/66 [00:01<00:17,  3.54it/s][A
Training:  14%|█▎        | 9/66 [00:02<00:12,  4.67it/s][A
Training:  20%|█▉        | 13/66 [00:02<00:10,  5.28it/s][A
Training:  26%|██▌       | 17/66 [00:03<00:08,  5.61it/s][A
Training:  32%|███▏      | 21/66 [00:04<00:07,  5.96it/s][A
Training:  38%|███▊      | 25/66 [00:04<00:06,  5.88it/s][A
Training:  44%|████▍     | 29/66 [00:05<00:06,  5.85it/s][A
Training:  50%|█████     | 33/66 [00:06<00:05,  5.91it/s][A
Training:  56%|█████▌    | 37/66 [00:06<00:04,  5.97it/s][A
Training:  62%|██████▏   | 41/66 [00:07<00:04,  5.97it/s][A
Training:  68%|██████▊   | 45/66 [00:08<00:03,  5.93it/s][A
Training:  74%|███████▍  | 49/66 [00:08<00:02,  6.02it/s][A
Training:  80%|████████  | 53/66 [00:09<00:02,  5.89it/s][A
Training:  86%|████████▋ | 57/66 [00:10<00:01,  5.89it/s][A
Training:  92%|█████████▏| 61/66 [0

Epoch: 39/41 - Loss: 0.1915 - Accuracy: 0.9278



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:00<00:07,  1.10it/s][A
 56%|█████▌    | 5/9 [00:01<00:01,  3.57it/s][A
100%|██████████| 9/9 [00:01<00:00,  5.14it/s][A
Epochs:  95%|█████████▌| 39/41 [08:40<00:26, 13.37s/it]

Val Loss: 0.2324 - Val Accuracy: 0.8996



Training:   0%|          | 0/66 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/66 [00:00<01:00,  1.07it/s][A
Training:   8%|▊         | 5/66 [00:01<00:17,  3.56it/s][A
Training:  14%|█▎        | 9/66 [00:02<00:12,  4.74it/s][A
Training:  20%|█▉        | 13/66 [00:02<00:10,  5.11it/s][A
Training:  26%|██▌       | 17/66 [00:03<00:09,  5.39it/s][A
Training:  32%|███▏      | 21/66 [00:04<00:07,  5.64it/s][A
Training:  38%|███▊      | 25/66 [00:04<00:07,  5.75it/s][A
Training:  44%|████▍     | 29/66 [00:05<00:06,  5.83it/s][A
Training:  50%|█████     | 33/66 [00:06<00:05,  5.91it/s][A
Training:  56%|█████▌    | 37/66 [00:06<00:04,  5.89it/s][A
Training:  62%|██████▏   | 41/66 [00:07<00:04,  5.89it/s][A
Training:  68%|██████▊   | 45/66 [00:08<00:03,  5.97it/s][A
Training:  74%|███████▍  | 49/66 [00:08<00:02,  5.93it/s][A
Training:  80%|████████  | 53/66 [00:09<00:02,  5.93it/s][A
Training:  86%|████████▋ | 57/66 [00:10<00:01,  5.94it/s][A
Training:  91%|█████████ | 60/66 [0

Epoch: 40/41 - Loss: 0.1903 - Accuracy: 0.9284



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:00<00:07,  1.09it/s][A
 56%|█████▌    | 5/9 [00:01<00:01,  3.60it/s][A
100%|██████████| 9/9 [00:01<00:00,  5.10it/s][A
Epochs:  98%|█████████▊| 40/41 [08:53<00:13, 13.39s/it]

Val Loss: 0.2370 - Val Accuracy: 0.9006



Training:   0%|          | 0/66 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/66 [00:00<01:01,  1.06it/s][A
Training:   8%|▊         | 5/66 [00:01<00:16,  3.60it/s][A
Training:  14%|█▎        | 9/66 [00:02<00:12,  4.72it/s][A
Training:  20%|█▉        | 13/66 [00:02<00:10,  5.20it/s][A
Training:  23%|██▎       | 15/66 [00:02<00:08,  6.30it/s][A
Training:  26%|██▌       | 17/66 [00:03<00:09,  5.43it/s][A
Training:  27%|██▋       | 18/66 [00:03<00:08,  5.77it/s][A
Training:  32%|███▏      | 21/66 [00:04<00:07,  5.77it/s][A
Training:  33%|███▎      | 22/66 [00:04<00:07,  6.17it/s][A
Training:  38%|███▊      | 25/66 [00:04<00:07,  5.61it/s][A
Training:  39%|███▉      | 26/66 [00:04<00:06,  5.78it/s][A
Training:  44%|████▍     | 29/66 [00:05<00:06,  5.82it/s][A
Training:  45%|████▌     | 30/66 [00:05<00:06,  5.79it/s][A
Training:  50%|█████     | 33/66 [00:06<00:05,  5.96it/s][A
Training:  52%|█████▏    | 34/66 [00:06<00:05,  5.81it/s][A
Training:  56%|█████▌    | 37/66 [0

Epoch: 41/41 - Loss: 0.1945 - Accuracy: 0.9289



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:00<00:07,  1.14it/s][A
 56%|█████▌    | 5/9 [00:01<00:01,  3.55it/s][A
100%|██████████| 9/9 [00:01<00:00,  5.05it/s][A
Epochs: 100%|██████████| 41/41 [09:07<00:00, 13.35s/it]
[32m[I 2023-12-12 00:28:15,009][0m Trial 3 finished with value: 0.9096657633781433 and parameters: {'learning_rate': 0.002230137964712427, 'weight_decay': 0.002429072096567442, 'epsilon': 2.1026581349206555e-09, 'batch_size': 213, 'epochs': 41}. Best is trial 0 with value: 0.9175874590873718.[0m


Val Loss: 0.2287 - Val Accuracy: 0.9097
Learning rate: 0.09923013627376329
Weight decay: 0.002591295182102534
Epsilon: 1.45661760180232e-09
Batch size: 245
Number of epochs: 16


Epochs:   0%|          | 0/16 [00:00<?, ?it/s]
Training:   0%|          | 0/58 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/58 [00:01<00:56,  1.00it/s][A
Training:   9%|▊         | 5/58 [00:01<00:15,  3.33it/s][A
Training:  16%|█▌        | 9/58 [00:02<00:11,  4.10it/s][A
Training:  22%|██▏       | 13/58 [00:03<00:09,  4.62it/s][A
Training:  29%|██▉       | 17/58 [00:03<00:08,  4.95it/s][A
Training:  36%|███▌      | 21/58 [00:04<00:07,  4.97it/s][A
Training:  43%|████▎     | 25/58 [00:05<00:06,  5.00it/s][A
Training:  50%|█████     | 29/58 [00:06<00:05,  5.04it/s][A
Training:  57%|█████▋    | 33/58 [00:07<00:04,  5.09it/s][A
Training:  64%|██████▍   | 37/58 [00:07<00:04,  5.12it/s][A
Training:  71%|███████   | 41/58 [00:08<00:03,  5.10it/s][A
Training:  78%|███████▊  | 45/58 [00:09<00:02,  5.17it/s][A
Training:  84%|████████▍ | 49/58 [00:10<00:01,  5.13it/s][A
Training:  90%|████████▉ | 52/58 [00:10<00:00,  6.43it/s][A
Training:  93%|█████████▎| 54/58 [00:11<00:00,  5.

Epoch: 1/16 - Loss: 36.2680 - Accuracy: 0.8232



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:07,  1.01s/it][A
100%|██████████| 8/8 [00:01<00:00,  4.23it/s][A
Epochs:   6%|▋         | 1/16 [00:13<03:24, 13.63s/it]

Val Loss: 20.6988 - Val Accuracy: 0.8067



Training:   0%|          | 0/58 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/58 [00:00<00:56,  1.01it/s][A
Training:   9%|▊         | 5/58 [00:01<00:16,  3.19it/s][A
Training:  16%|█▌        | 9/58 [00:02<00:11,  4.09it/s][A
Training:  22%|██▏       | 13/58 [00:03<00:09,  4.71it/s][A
Training:  29%|██▉       | 17/58 [00:04<00:08,  4.80it/s][A
Training:  36%|███▌      | 21/58 [00:04<00:07,  4.88it/s][A
Training:  43%|████▎     | 25/58 [00:05<00:06,  5.01it/s][A
Training:  50%|█████     | 29/58 [00:06<00:05,  5.03it/s][A
Training:  57%|█████▋    | 33/58 [00:07<00:04,  5.11it/s][A
Training:  64%|██████▍   | 37/58 [00:07<00:04,  5.07it/s][A
Training:  69%|██████▉   | 40/58 [00:08<00:02,  6.39it/s][A
Training:  72%|███████▏  | 42/58 [00:08<00:03,  5.02it/s][A
Training:  78%|███████▊  | 45/58 [00:09<00:02,  4.61it/s][A
Training:  84%|████████▍ | 49/58 [00:10<00:01,  4.74it/s][A
Training:  91%|█████████▏| 53/58 [00:11<00:01,  4.88it/s][A
Training:  98%|█████████▊| 57/58 [0

Epoch: 2/16 - Loss: 5.4844 - Accuracy: 0.8696



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:07,  1.02s/it][A
100%|██████████| 8/8 [00:01<00:00,  4.25it/s][A
Epochs:  12%|█▎        | 2/16 [00:27<03:11, 13.71s/it]

Val Loss: 3.9509 - Val Accuracy: 0.8842



Training:   0%|          | 0/58 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/58 [00:00<00:53,  1.07it/s][A
Training:   9%|▊         | 5/58 [00:01<00:15,  3.38it/s][A
Training:  14%|█▍        | 8/58 [00:01<00:08,  5.77it/s][A
Training:  17%|█▋        | 10/58 [00:02<00:10,  4.55it/s][A
Training:  22%|██▏       | 13/58 [00:03<00:10,  4.28it/s][A
Training:  29%|██▉       | 17/58 [00:03<00:08,  4.62it/s][A
Training:  36%|███▌      | 21/58 [00:04<00:07,  4.83it/s][A
Training:  43%|████▎     | 25/58 [00:05<00:06,  4.98it/s][A
Training:  50%|█████     | 29/58 [00:06<00:05,  5.03it/s][A
Training:  57%|█████▋    | 33/58 [00:07<00:04,  5.00it/s][A
Training:  64%|██████▍   | 37/58 [00:07<00:04,  4.96it/s][A
Training:  71%|███████   | 41/58 [00:08<00:03,  5.00it/s][A
Training:  78%|███████▊  | 45/58 [00:09<00:02,  5.01it/s][A
Training:  84%|████████▍ | 49/58 [00:10<00:01,  5.02it/s][A
Training:  91%|█████████▏| 53/58 [00:11<00:00,  5.07it/s][A
Training:  98%|█████████▊| 57/58 [0

Epoch: 3/16 - Loss: 3.9560 - Accuracy: 0.8794



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:07,  1.01s/it][A
100%|██████████| 8/8 [00:01<00:00,  4.29it/s][A
Epochs:  19%|█▉        | 3/16 [00:41<02:57, 13.69s/it]

Val Loss: 24.9796 - Val Accuracy: 0.3106



Training:   0%|          | 0/58 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/58 [00:01<00:57,  1.00s/it][A
Training:   9%|▊         | 5/58 [00:01<00:16,  3.26it/s][A
Training:  16%|█▌        | 9/58 [00:02<00:11,  4.20it/s][A
Training:  22%|██▏       | 13/58 [00:03<00:09,  4.51it/s][A
Training:  29%|██▉       | 17/58 [00:04<00:08,  4.67it/s][A
Training:  36%|███▌      | 21/58 [00:04<00:07,  4.76it/s][A
Training:  43%|████▎     | 25/58 [00:05<00:06,  4.91it/s][A
Training:  50%|█████     | 29/58 [00:06<00:05,  5.03it/s][A
Training:  57%|█████▋    | 33/58 [00:07<00:04,  5.04it/s][A
Training:  64%|██████▍   | 37/58 [00:07<00:04,  5.04it/s][A
Training:  71%|███████   | 41/58 [00:08<00:03,  5.07it/s][A
Training:  78%|███████▊  | 45/58 [00:09<00:02,  5.00it/s][A
Training:  84%|████████▍ | 49/58 [00:10<00:01,  5.05it/s][A
Training:  91%|█████████▏| 53/58 [00:11<00:00,  5.02it/s][A
Training:  98%|█████████▊| 57/58 [00:11<00:00,  5.32it/s][A
                                   

Epoch: 4/16 - Loss: 25.1891 - Accuracy: 0.8626



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:07,  1.00s/it][A
100%|██████████| 8/8 [00:01<00:00,  4.52it/s][A
Epochs:  25%|██▌       | 4/16 [00:54<02:44, 13.70s/it]

Val Loss: 33.9265 - Val Accuracy: 0.6483



Training:   0%|          | 0/58 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/58 [00:01<00:58,  1.02s/it][A
Training:   9%|▊         | 5/58 [00:01<00:16,  3.25it/s][A
Training:  16%|█▌        | 9/58 [00:02<00:11,  4.22it/s][A
Training:  22%|██▏       | 13/58 [00:03<00:09,  4.68it/s][A
Training:  29%|██▉       | 17/58 [00:03<00:08,  4.89it/s][A
Training:  34%|███▍      | 20/58 [00:04<00:06,  6.23it/s][A
Training:  36%|███▌      | 21/58 [00:04<00:07,  4.65it/s][A
Training:  41%|████▏     | 24/58 [00:04<00:05,  6.25it/s][A
Training:  45%|████▍     | 26/58 [00:05<00:06,  4.98it/s][A
Training:  48%|████▊     | 28/58 [00:05<00:05,  5.88it/s][A
Training:  50%|█████     | 29/58 [00:06<00:06,  4.21it/s][A
Training:  55%|█████▌    | 32/58 [00:06<00:04,  6.02it/s][A
Training:  57%|█████▋    | 33/58 [00:07<00:05,  4.19it/s][A
Training:  62%|██████▏   | 36/58 [00:07<00:03,  6.05it/s][A
Training:  66%|██████▌   | 38/58 [00:07<00:04,  4.74it/s][A
Training:  69%|██████▉   | 40/58 [0

Epoch: 5/16 - Loss: 14.1747 - Accuracy: 0.8774



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:07,  1.01s/it][A
100%|██████████| 8/8 [00:01<00:00,  4.47it/s][A
Epochs:  31%|███▏      | 5/16 [01:08<02:30, 13.69s/it]

Val Loss: 9.7987 - Val Accuracy: 0.8599



Training:   0%|          | 0/58 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/58 [00:01<00:57,  1.02s/it][A
Training:   9%|▊         | 5/58 [00:01<00:16,  3.27it/s][A
Training:  16%|█▌        | 9/58 [00:02<00:11,  4.15it/s][A
Training:  22%|██▏       | 13/58 [00:03<00:09,  4.58it/s][A
Training:  29%|██▉       | 17/58 [00:04<00:08,  4.77it/s][A
Training:  36%|███▌      | 21/58 [00:04<00:07,  4.87it/s][A
Training:  43%|████▎     | 25/58 [00:05<00:06,  4.95it/s][A
Training:  50%|█████     | 29/58 [00:06<00:05,  4.99it/s][A
Training:  57%|█████▋    | 33/58 [00:07<00:04,  5.01it/s][A
Training:  64%|██████▍   | 37/58 [00:07<00:04,  5.08it/s][A
Training:  71%|███████   | 41/58 [00:08<00:03,  5.04it/s][A
Training:  78%|███████▊  | 45/58 [00:09<00:02,  5.08it/s][A
Training:  84%|████████▍ | 49/58 [00:10<00:01,  5.11it/s][A
Training:  91%|█████████▏| 53/58 [00:11<00:00,  5.07it/s][A
Training:  98%|█████████▊| 57/58 [00:11<00:00,  5.44it/s][A
                                   

Epoch: 6/16 - Loss: 5.4803 - Accuracy: 0.8885



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:00<00:06,  1.05it/s][A
100%|██████████| 8/8 [00:01<00:00,  4.60it/s][A
Epochs:  38%|███▊      | 6/16 [01:22<02:16, 13.66s/it]

Val Loss: 7.6330 - Val Accuracy: 0.8549



Training:   0%|          | 0/58 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/58 [00:00<00:54,  1.04it/s][A
Training:   7%|▋         | 4/58 [00:01<00:11,  4.73it/s][A
Training:  10%|█         | 6/58 [00:01<00:13,  3.92it/s][A
Training:  16%|█▌        | 9/58 [00:02<00:12,  4.04it/s][A
Training:  22%|██▏       | 13/58 [00:03<00:09,  4.53it/s][A
Training:  29%|██▉       | 17/58 [00:03<00:08,  4.71it/s][A
Training:  36%|███▌      | 21/58 [00:04<00:07,  4.88it/s][A
Training:  43%|████▎     | 25/58 [00:05<00:06,  4.99it/s][A
Training:  50%|█████     | 29/58 [00:06<00:05,  5.06it/s][A
Training:  57%|█████▋    | 33/58 [00:07<00:04,  5.15it/s][A
Training:  60%|██████    | 35/58 [00:07<00:03,  5.88it/s][A
Training:  64%|██████▍   | 37/58 [00:07<00:04,  5.00it/s][A
Training:  66%|██████▌   | 38/58 [00:07<00:03,  5.19it/s][A
Training:  71%|███████   | 41/58 [00:08<00:03,  4.93it/s][A
Training:  72%|███████▏  | 42/58 [00:08<00:03,  5.23it/s][A
Training:  78%|███████▊  | 45/58 [00

Epoch: 7/16 - Loss: 4.5895 - Accuracy: 0.8909



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:00<00:06,  1.06it/s][A
100%|██████████| 8/8 [00:01<00:00,  4.52it/s][A
Epochs:  44%|████▍     | 7/16 [01:35<02:02, 13.59s/it]

Val Loss: 6.9126 - Val Accuracy: 0.8662



Training:   0%|          | 0/58 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/58 [00:00<00:54,  1.05it/s][A
Training:   9%|▊         | 5/58 [00:01<00:15,  3.33it/s][A
Training:  16%|█▌        | 9/58 [00:02<00:11,  4.10it/s][A
Training:  22%|██▏       | 13/58 [00:03<00:10,  4.45it/s][A
Training:  29%|██▉       | 17/58 [00:04<00:08,  4.77it/s][A
Training:  36%|███▌      | 21/58 [00:04<00:07,  4.92it/s][A
Training:  43%|████▎     | 25/58 [00:05<00:06,  4.94it/s][A
Training:  50%|█████     | 29/58 [00:06<00:05,  4.99it/s][A
Training:  57%|█████▋    | 33/58 [00:07<00:04,  5.07it/s][A
Training:  64%|██████▍   | 37/58 [00:07<00:04,  5.07it/s][A
Training:  71%|███████   | 41/58 [00:08<00:03,  5.14it/s][A
Training:  78%|███████▊  | 45/58 [00:09<00:02,  5.15it/s][A
Training:  84%|████████▍ | 49/58 [00:10<00:01,  5.15it/s][A
Training:  91%|█████████▏| 53/58 [00:11<00:00,  5.16it/s][A
Training:  98%|█████████▊| 57/58 [00:11<00:00,  5.47it/s][A
                                   

Epoch: 8/16 - Loss: 4.5076 - Accuracy: 0.8902



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:00<00:06,  1.10it/s][A
 50%|█████     | 4/8 [00:01<00:00,  4.92it/s][A
100%|██████████| 8/8 [00:01<00:00,  4.63it/s][A
Epochs:  50%|█████     | 8/16 [01:48<01:48, 13.56s/it]

Val Loss: 15.1862 - Val Accuracy: 0.8209



Training:   0%|          | 0/58 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/58 [00:00<00:53,  1.06it/s][A
Training:   9%|▊         | 5/58 [00:01<00:16,  3.25it/s][A
Training:  16%|█▌        | 9/58 [00:02<00:12,  4.03it/s][A
Training:  22%|██▏       | 13/58 [00:03<00:10,  4.50it/s][A
Training:  29%|██▉       | 17/58 [00:04<00:08,  4.74it/s][A
Training:  36%|███▌      | 21/58 [00:04<00:07,  4.86it/s][A
Training:  43%|████▎     | 25/58 [00:05<00:06,  4.93it/s][A
Training:  50%|█████     | 29/58 [00:06<00:05,  4.98it/s][A
Training:  57%|█████▋    | 33/58 [00:07<00:04,  5.13it/s][A
Training:  64%|██████▍   | 37/58 [00:07<00:04,  5.13it/s][A
Training:  71%|███████   | 41/58 [00:08<00:03,  5.13it/s][A
Training:  78%|███████▊  | 45/58 [00:09<00:02,  5.18it/s][A
Training:  84%|████████▍ | 49/58 [00:10<00:01,  5.13it/s][A
Training:  86%|████████▌ | 50/58 [00:10<00:01,  5.38it/s][A
Training:  91%|█████████▏| 53/58 [00:11<00:01,  5.00it/s][A
Training:  93%|█████████▎| 54/58 [0

Epoch: 9/16 - Loss: 14.6051 - Accuracy: 0.8847



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:00<00:06,  1.07it/s][A
100%|██████████| 8/8 [00:01<00:00,  4.59it/s][A
Epochs:  56%|█████▋    | 9/16 [02:02<01:34, 13.56s/it]

Val Loss: 25.7508 - Val Accuracy: 0.8157



Training:   0%|          | 0/58 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/58 [00:00<00:53,  1.06it/s][A
Training:   9%|▊         | 5/58 [00:01<00:16,  3.30it/s][A
Training:  16%|█▌        | 9/58 [00:02<00:12,  4.00it/s][A
Training:  22%|██▏       | 13/58 [00:03<00:10,  4.42it/s][A
Training:  29%|██▉       | 17/58 [00:04<00:08,  4.72it/s][A
Training:  36%|███▌      | 21/58 [00:04<00:07,  4.90it/s][A
Training:  43%|████▎     | 25/58 [00:05<00:06,  4.99it/s][A
Training:  47%|████▋     | 27/58 [00:05<00:05,  5.82it/s][A
Training:  50%|█████     | 29/58 [00:06<00:06,  4.81it/s][A
Training:  53%|█████▎    | 31/58 [00:06<00:04,  5.85it/s][A
Training:  57%|█████▋    | 33/58 [00:07<00:05,  4.58it/s][A
Training:  60%|██████    | 35/58 [00:07<00:04,  5.74it/s][A
Training:  64%|██████▍   | 37/58 [00:07<00:04,  4.57it/s][A
Training:  67%|██████▋   | 39/58 [00:08<00:03,  5.76it/s][A
Training:  71%|███████   | 41/58 [00:08<00:03,  4.49it/s][A
Training:  76%|███████▌  | 44/58 [0

Epoch: 10/16 - Loss: 19.0323 - Accuracy: 0.8781



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:06,  1.01it/s][A
100%|██████████| 8/8 [00:01<00:00,  4.49it/s][A
Epochs:  62%|██████▎   | 10/16 [02:16<01:21, 13.60s/it]

Val Loss: 43.8742 - Val Accuracy: 0.6966



Training:   0%|          | 0/58 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/58 [00:00<00:56,  1.01it/s][A
Training:   9%|▊         | 5/58 [00:01<00:16,  3.19it/s][A
Training:  16%|█▌        | 9/58 [00:02<00:12,  3.93it/s][A
Training:  22%|██▏       | 13/58 [00:03<00:10,  4.38it/s][A
Training:  29%|██▉       | 17/58 [00:04<00:08,  4.69it/s][A
Training:  36%|███▌      | 21/58 [00:04<00:07,  4.81it/s][A
Training:  43%|████▎     | 25/58 [00:05<00:06,  4.85it/s][A
Training:  50%|█████     | 29/58 [00:06<00:05,  4.98it/s][A
Training:  57%|█████▋    | 33/58 [00:07<00:04,  5.01it/s][A
Training:  64%|██████▍   | 37/58 [00:08<00:04,  5.02it/s][A
Training:  71%|███████   | 41/58 [00:08<00:03,  5.05it/s][A
Training:  78%|███████▊  | 45/58 [00:09<00:02,  5.09it/s][A
Training:  84%|████████▍ | 49/58 [00:10<00:01,  5.13it/s][A
Training:  91%|█████████▏| 53/58 [00:11<00:00,  5.12it/s][A
Training:  98%|█████████▊| 57/58 [00:11<00:00,  5.42it/s][A
                                   

Epoch: 11/16 - Loss: 24.1674 - Accuracy: 0.8789



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:07,  1.00s/it][A
100%|██████████| 8/8 [00:01<00:00,  4.45it/s][A
Epochs:  69%|██████▉   | 11/16 [02:29<01:08, 13.64s/it]

Val Loss: 18.0565 - Val Accuracy: 0.8399



Training:   0%|          | 0/58 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/58 [00:00<00:55,  1.02it/s][A
Training:   9%|▊         | 5/58 [00:01<00:16,  3.27it/s][A
Training:  14%|█▍        | 8/58 [00:01<00:08,  5.63it/s][A
Training:  17%|█▋        | 10/58 [00:02<00:11,  4.32it/s][A
Training:  22%|██▏       | 13/58 [00:03<00:10,  4.25it/s][A
Training:  26%|██▌       | 15/58 [00:03<00:08,  5.36it/s][A
Training:  29%|██▉       | 17/58 [00:04<00:09,  4.42it/s][A
Training:  31%|███       | 18/58 [00:04<00:08,  4.75it/s][A
Training:  36%|███▌      | 21/58 [00:04<00:08,  4.62it/s][A
Training:  38%|███▊      | 22/58 [00:04<00:07,  5.02it/s][A
Training:  43%|████▎     | 25/58 [00:05<00:07,  4.69it/s][A
Training:  45%|████▍     | 26/58 [00:05<00:06,  5.12it/s][A
Training:  50%|█████     | 29/58 [00:06<00:06,  4.69it/s][A
Training:  52%|█████▏    | 30/58 [00:06<00:05,  5.04it/s][A
Training:  57%|█████▋    | 33/58 [00:07<00:05,  4.86it/s][A
Training:  59%|█████▊    | 34/58 [0

Epoch: 12/16 - Loss: 14.9812 - Accuracy: 0.8861



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:00<00:06,  1.08it/s][A
100%|██████████| 8/8 [00:01<00:00,  4.65it/s][A
Epochs:  75%|███████▌  | 12/16 [02:43<00:54, 13.65s/it]

Val Loss: 21.0892 - Val Accuracy: 0.8520



Training:   0%|          | 0/58 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/58 [00:01<01:02,  1.09s/it][A
Training:   9%|▊         | 5/58 [00:01<00:16,  3.12it/s][A
Training:  16%|█▌        | 9/58 [00:02<00:12,  3.98it/s][A
Training:  22%|██▏       | 13/58 [00:03<00:10,  4.46it/s][A
Training:  29%|██▉       | 17/58 [00:04<00:08,  4.71it/s][A
Training:  36%|███▌      | 21/58 [00:04<00:07,  4.84it/s][A
Training:  41%|████▏     | 24/58 [00:05<00:05,  6.27it/s][A
Training:  45%|████▍     | 26/58 [00:05<00:06,  4.92it/s][A
Training:  50%|█████     | 29/58 [00:06<00:06,  4.64it/s][A
Training:  57%|█████▋    | 33/58 [00:07<00:05,  4.87it/s][A
Training:  62%|██████▏   | 36/58 [00:07<00:03,  6.33it/s][A
Training:  66%|██████▌   | 38/58 [00:08<00:04,  4.83it/s][A
Training:  71%|███████   | 41/58 [00:08<00:03,  4.62it/s][A
Training:  78%|███████▊  | 45/58 [00:09<00:02,  4.75it/s][A
Training:  84%|████████▍ | 49/58 [00:10<00:01,  4.79it/s][A
Training:  91%|█████████▏| 53/58 [0

Epoch: 13/16 - Loss: 13.6785 - Accuracy: 0.8871



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:00<00:06,  1.09it/s][A
100%|██████████| 8/8 [00:01<00:00,  4.58it/s][A
Epochs:  81%|████████▏ | 13/16 [02:57<00:40, 13.66s/it]

Val Loss: 23.3486 - Val Accuracy: 0.8167



Training:   0%|          | 0/58 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/58 [00:00<00:53,  1.06it/s][A
Training:   7%|▋         | 4/58 [00:01<00:11,  4.77it/s][A
Training:  10%|█         | 6/58 [00:01<00:14,  3.58it/s][A
Training:  16%|█▌        | 9/58 [00:02<00:12,  3.85it/s][A
Training:  21%|██        | 12/58 [00:02<00:07,  5.92it/s][A
Training:  24%|██▍       | 14/58 [00:03<00:09,  4.41it/s][A
Training:  29%|██▉       | 17/58 [00:04<00:09,  4.33it/s][A
Training:  36%|███▌      | 21/58 [00:04<00:07,  4.70it/s][A
Training:  38%|███▊      | 22/58 [00:04<00:07,  5.01it/s][A
Training:  43%|████▎     | 25/58 [00:05<00:06,  4.80it/s][A
Training:  47%|████▋     | 27/58 [00:05<00:05,  5.89it/s][A
Training:  50%|█████     | 29/58 [00:06<00:06,  4.73it/s][A
Training:  52%|█████▏    | 30/58 [00:06<00:05,  5.11it/s][A
Training:  57%|█████▋    | 33/58 [00:07<00:05,  4.78it/s][A
Training:  59%|█████▊    | 34/58 [00:07<00:04,  5.13it/s][A
Training:  64%|██████▍   | 37/58 [00

Epoch: 14/16 - Loss: 22.5012 - Accuracy: 0.8856



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:00<00:06,  1.11it/s][A
100%|██████████| 8/8 [00:01<00:00,  4.55it/s][A
Epochs:  88%|████████▊ | 14/16 [03:10<00:27, 13.62s/it]

Val Loss: 29.5763 - Val Accuracy: 0.8236



Training:   0%|          | 0/58 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/58 [00:01<00:59,  1.05s/it][A
Training:   9%|▊         | 5/58 [00:01<00:16,  3.17it/s][A
Training:  16%|█▌        | 9/58 [00:02<00:12,  3.94it/s][A
Training:  22%|██▏       | 13/58 [00:03<00:10,  4.36it/s][A
Training:  29%|██▉       | 17/58 [00:04<00:08,  4.61it/s][A
Training:  36%|███▌      | 21/58 [00:05<00:07,  4.73it/s][A
Training:  41%|████▏     | 24/58 [00:05<00:05,  6.16it/s][A
Training:  45%|████▍     | 26/58 [00:05<00:06,  4.83it/s][A
Training:  50%|█████     | 29/58 [00:06<00:06,  4.69it/s][A
Training:  53%|█████▎    | 31/58 [00:06<00:04,  5.63it/s][A
Training:  57%|█████▋    | 33/58 [00:07<00:05,  4.70it/s][A
Training:  59%|█████▊    | 34/58 [00:07<00:04,  5.07it/s][A
Training:  64%|██████▍   | 37/58 [00:08<00:04,  4.84it/s][A
Training:  66%|██████▌   | 38/58 [00:08<00:03,  5.17it/s][A
Training:  71%|███████   | 41/58 [00:08<00:03,  5.00it/s][A
Training:  72%|███████▏  | 42/58 [0

Epoch: 15/16 - Loss: 14.4597 - Accuracy: 0.8863



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:00<00:06,  1.06it/s][A
 62%|██████▎   | 5/8 [00:01<00:00,  3.40it/s][A
100%|██████████| 8/8 [00:01<00:00,  4.35it/s][A
Epochs:  94%|█████████▍| 15/16 [03:24<00:13, 13.62s/it]

Val Loss: 13.1163 - Val Accuracy: 0.8817



Training:   0%|          | 0/58 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/58 [00:00<00:56,  1.01it/s][A
Training:   7%|▋         | 4/58 [00:01<00:11,  4.67it/s][A
Training:  10%|█         | 6/58 [00:01<00:14,  3.60it/s][A
Training:  16%|█▌        | 9/58 [00:02<00:12,  3.90it/s][A
Training:  19%|█▉        | 11/58 [00:02<00:09,  5.19it/s][A
Training:  22%|██▏       | 13/58 [00:03<00:10,  4.24it/s][A
Training:  26%|██▌       | 15/58 [00:03<00:07,  5.58it/s][A
Training:  29%|██▉       | 17/58 [00:04<00:09,  4.45it/s][A
Training:  36%|███▌      | 21/58 [00:04<00:07,  4.65it/s][A
Training:  43%|████▎     | 25/58 [00:05<00:06,  4.81it/s][A
Training:  50%|█████     | 29/58 [00:06<00:05,  5.00it/s][A
Training:  57%|█████▋    | 33/58 [00:07<00:05,  4.99it/s][A
Training:  64%|██████▍   | 37/58 [00:07<00:04,  5.08it/s][A
Training:  71%|███████   | 41/58 [00:08<00:03,  5.11it/s][A
Training:  78%|███████▊  | 45/58 [00:09<00:02,  5.22it/s][A
Training:  84%|████████▍ | 49/58 [00

Epoch: 16/16 - Loss: 11.4949 - Accuracy: 0.8926



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:00<00:06,  1.01it/s][A
100%|██████████| 8/8 [00:01<00:00,  4.36it/s][A
Epochs: 100%|██████████| 16/16 [03:38<00:00, 13.63s/it]
[32m[I 2023-12-12 00:31:53,344][0m Trial 4 finished with value: 0.875595211982727 and parameters: {'learning_rate': 0.09923013627376329, 'weight_decay': 0.002591295182102534, 'epsilon': 1.45661760180232e-09, 'batch_size': 245, 'epochs': 16}. Best is trial 0 with value: 0.9175874590873718.[0m


Val Loss: 15.5291 - Val Accuracy: 0.8756
Learning rate: 6.27996009958689e-05
Weight decay: 0.005170597799208986
Epsilon: 6.850290470052475e-08
Batch size: 147
Number of epochs: 27


Epochs:   0%|          | 0/27 [00:00<?, ?it/s]
Training:   0%|          | 0/96 [00:00<?, ?it/s][A
Training:   1%|          | 1/96 [00:00<01:05,  1.45it/s][A
Training:   5%|▌         | 5/96 [00:01<00:18,  4.91it/s][A
Training:   9%|▉         | 9/96 [00:01<00:13,  6.28it/s][A
Training:  14%|█▎        | 13/96 [00:02<00:11,  7.27it/s][A
Training:  18%|█▊        | 17/96 [00:02<00:10,  7.57it/s][A
Training:  22%|██▏       | 21/96 [00:03<00:09,  7.98it/s][A
Training:  26%|██▌       | 25/96 [00:03<00:08,  8.29it/s][A
Training:  30%|███       | 29/96 [00:03<00:08,  8.27it/s][A
Training:  34%|███▍      | 33/96 [00:04<00:07,  8.38it/s][A
Training:  39%|███▊      | 37/96 [00:04<00:07,  8.36it/s][A
Training:  43%|████▎     | 41/96 [00:05<00:06,  8.42it/s][A
Training:  47%|████▋     | 45/96 [00:05<00:06,  8.39it/s][A
Training:  51%|█████     | 49/96 [00:06<00:05,  8.50it/s][A
Training:  55%|█████▌    | 53/96 [00:06<00:04,  8.75it/s][A
Training:  58%|█████▊    | 56/96 [00:06<00:03, 10.

Epoch: 1/27 - Loss: 0.4670 - Accuracy: 0.8163



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:00<00:08,  1.37it/s][A
 42%|████▏     | 5/12 [00:01<00:01,  4.46it/s][A
100%|██████████| 12/12 [00:01<00:00,  6.62it/s][A
Epochs:   0%|          | 0/27 [00:13<?, ?it/s]
[32m[I 2023-12-12 00:32:06,776][0m Trial 5 pruned. [0m


Val Loss: 0.3355 - Val Accuracy: 0.8861
Learning rate: 2.910784677931652e-05
Weight decay: 0.0007525866272266529
Epsilon: 8.61445374185814e-09
Batch size: 300
Number of epochs: 28


Epochs:   0%|          | 0/28 [00:00<?, ?it/s]
Training:   0%|          | 0/47 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/47 [00:01<00:55,  1.21s/it][A
Training:  11%|█         | 5/47 [00:02<00:15,  2.63it/s][A
Training:  19%|█▉        | 9/47 [00:03<00:11,  3.37it/s][A
Training:  28%|██▊       | 13/47 [00:04<00:09,  3.71it/s][A
Training:  36%|███▌      | 17/47 [00:04<00:07,  3.87it/s][A
Training:  45%|████▍     | 21/47 [00:05<00:06,  3.97it/s][A
Training:  53%|█████▎    | 25/47 [00:06<00:05,  4.05it/s][A
Training:  62%|██████▏   | 29/47 [00:07<00:04,  4.02it/s][A
Training:  70%|███████   | 33/47 [00:08<00:03,  4.13it/s][A
Training:  79%|███████▊  | 37/47 [00:09<00:02,  4.24it/s][A
Training:  87%|████████▋ | 41/47 [00:10<00:01,  4.29it/s][A
Training:  96%|█████████▌| 45/47 [00:11<00:00,  4.53it/s][A
                                                         [A

Epoch: 1/28 - Loss: 0.5995 - Accuracy: 0.7092



  0%|          | 0/6 [00:00<?, ?it/s][A
 17%|█▋        | 1/6 [00:01<00:06,  1.23s/it][A
100%|██████████| 6/6 [00:02<00:00,  2.83it/s][A
Epochs:   0%|          | 0/28 [00:13<?, ?it/s]
[32m[I 2023-12-12 00:32:20,672][0m Trial 6 pruned. [0m


Val Loss: 0.5264 - Val Accuracy: 0.8041
Learning rate: 0.011031309402311463
Weight decay: 0.0008333695361572575
Epsilon: 1.2763557896199372e-09
Batch size: 213
Number of epochs: 69


Epochs:   0%|          | 0/69 [00:00<?, ?it/s]
Training:   0%|          | 0/66 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/66 [00:00<01:00,  1.07it/s][A
Training:   8%|▊         | 5/66 [00:01<00:17,  3.55it/s][A
Training:  14%|█▎        | 9/66 [00:02<00:12,  4.58it/s][A
Training:  20%|█▉        | 13/66 [00:02<00:10,  5.14it/s][A
Training:  26%|██▌       | 17/66 [00:03<00:09,  5.41it/s][A
Training:  32%|███▏      | 21/66 [00:04<00:08,  5.61it/s][A
Training:  38%|███▊      | 25/66 [00:04<00:07,  5.81it/s][A
Training:  42%|████▏     | 28/66 [00:05<00:05,  7.28it/s][A
Training:  45%|████▌     | 30/66 [00:05<00:06,  5.87it/s][A
Training:  50%|█████     | 33/66 [00:06<00:06,  5.38it/s][A
Training:  56%|█████▌    | 37/66 [00:06<00:05,  5.55it/s][A
Training:  62%|██████▏   | 41/66 [00:07<00:04,  5.74it/s][A
Training:  67%|██████▋   | 44/66 [00:07<00:03,  7.29it/s][A
Training:  70%|██████▉   | 46/66 [00:08<00:03,  6.19it/s][A
Training:  73%|███████▎  | 48/66 [00:08<00:02,  7.

Epoch: 1/69 - Loss: 0.3827 - Accuracy: 0.8608



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:00<00:06,  1.14it/s][A
 56%|█████▌    | 5/9 [00:01<00:01,  3.79it/s][A
100%|██████████| 9/9 [00:01<00:00,  5.37it/s][A
Epochs:   1%|▏         | 1/69 [00:13<14:58, 13.22s/it]

Val Loss: 0.2338 - Val Accuracy: 0.8970



Training:   0%|          | 0/66 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/66 [00:00<00:58,  1.11it/s][A
Training:   8%|▊         | 5/66 [00:01<00:16,  3.75it/s][A
Training:  14%|█▎        | 9/66 [00:02<00:12,  4.72it/s][A
Training:  20%|█▉        | 13/66 [00:02<00:10,  5.27it/s][A
Training:  23%|██▎       | 15/66 [00:02<00:08,  6.16it/s][A
Training:  26%|██▌       | 17/66 [00:03<00:09,  5.23it/s][A
Training:  29%|██▉       | 19/66 [00:03<00:07,  6.49it/s][A
Training:  32%|███▏      | 21/66 [00:04<00:08,  5.21it/s][A
Training:  38%|███▊      | 25/66 [00:04<00:07,  5.48it/s][A
Training:  42%|████▏     | 28/66 [00:05<00:05,  7.40it/s][A
Training:  45%|████▌     | 30/66 [00:05<00:06,  5.77it/s][A
Training:  50%|█████     | 33/66 [00:06<00:06,  5.30it/s][A
Training:  53%|█████▎    | 35/66 [00:06<00:04,  6.37it/s][A
Training:  56%|█████▌    | 37/66 [00:06<00:05,  5.31it/s][A
Training:  59%|█████▉    | 39/66 [00:07<00:04,  6.54it/s][A
Training:  62%|██████▏   | 41/66 [0

Epoch: 2/69 - Loss: 0.2386 - Accuracy: 0.9112



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:00<00:07,  1.12it/s][A
 56%|█████▌    | 5/9 [00:01<00:01,  3.67it/s][A
100%|██████████| 9/9 [00:01<00:00,  5.17it/s][A
Epochs:   1%|▏         | 1/69 [00:26<29:55, 26.40s/it]
[32m[I 2023-12-12 00:32:47,346][0m Trial 7 pruned. [0m


Val Loss: 0.2515 - Val Accuracy: 0.8986
Learning rate: 0.043656523668272246
Weight decay: 0.0006295528525199638
Epsilon: 3.684563053602628e-09
Batch size: 135
Number of epochs: 57


Epochs:   0%|          | 0/57 [00:00<?, ?it/s]
Training:   0%|          | 0/104 [00:00<?, ?it/s][A
Training:   1%|          | 1/104 [00:00<01:05,  1.57it/s][A
Training:   5%|▍         | 5/104 [00:01<00:17,  5.52it/s][A
Training:   9%|▊         | 9/104 [00:01<00:13,  7.01it/s][A
Training:  12%|█▎        | 13/104 [00:01<00:11,  7.94it/s][A
Training:  16%|█▋        | 17/104 [00:02<00:10,  8.15it/s][A
Training:  20%|██        | 21/104 [00:02<00:09,  8.58it/s][A
Training:  24%|██▍       | 25/104 [00:03<00:09,  8.71it/s][A
Training:  28%|██▊       | 29/104 [00:03<00:08,  8.79it/s][A
Training:  32%|███▏      | 33/104 [00:04<00:08,  8.78it/s][A
Training:  36%|███▌      | 37/104 [00:04<00:07,  8.73it/s][A
Training:  39%|███▉      | 41/104 [00:05<00:07,  8.68it/s][A
Training:  43%|████▎     | 45/104 [00:05<00:06,  8.97it/s][A
Training:  47%|████▋     | 49/104 [00:05<00:06,  8.97it/s][A
Training:  51%|█████     | 53/104 [00:06<00:05,  9.01it/s][A
Training:  55%|█████▍    | 57/104 [

Epoch: 1/57 - Loss: 4.4709 - Accuracy: 0.8357



  0%|          | 0/13 [00:00<?, ?it/s][A
  8%|▊         | 1/13 [00:00<00:07,  1.54it/s][A
 38%|███▊      | 5/13 [00:01<00:01,  5.34it/s][A
 69%|██████▉   | 9/13 [00:01<00:00,  6.87it/s][A
100%|██████████| 13/13 [00:01<00:00,  6.90it/s][A
Epochs:   0%|          | 0/57 [00:13<?, ?it/s]
[32m[I 2023-12-12 00:33:00,922][0m Trial 8 pruned. [0m


Val Loss: 2.1253 - Val Accuracy: 0.7708
Learning rate: 2.698916375584444e-05
Weight decay: 0.0009560780903533698
Epsilon: 1.0158503990349767e-09
Batch size: 187
Number of epochs: 21


Epochs:   0%|          | 0/21 [00:00<?, ?it/s]
Training:   0%|          | 0/75 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/75 [00:00<01:00,  1.23it/s][A
Training:   7%|▋         | 5/75 [00:01<00:17,  3.98it/s][A
Training:  12%|█▏        | 9/75 [00:02<00:13,  5.07it/s][A
Training:  17%|█▋        | 13/75 [00:02<00:10,  5.64it/s][A
Training:  23%|██▎       | 17/75 [00:03<00:09,  5.99it/s][A
Training:  28%|██▊       | 21/75 [00:03<00:08,  6.38it/s][A
Training:  33%|███▎      | 25/75 [00:04<00:07,  6.45it/s][A
Training:  39%|███▊      | 29/75 [00:04<00:06,  6.71it/s][A
Training:  43%|████▎     | 32/75 [00:05<00:05,  8.11it/s][A
Training:  45%|████▌     | 34/75 [00:05<00:05,  6.89it/s][A
Training:  48%|████▊     | 36/75 [00:05<00:04,  7.94it/s][A
Training:  51%|█████     | 38/75 [00:06<00:05,  6.32it/s][A
Training:  55%|█████▍    | 41/75 [00:06<00:05,  5.87it/s][A
Training:  59%|█████▊    | 44/75 [00:06<00:03,  7.84it/s][A
Training:  61%|██████▏   | 46/75 [00:07<00:04,  6.

Epoch: 1/21 - Loss: 0.5904 - Accuracy: 0.7069



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:00<00:06,  1.30it/s][A
 50%|█████     | 5/10 [00:01<00:01,  4.09it/s][A
100%|██████████| 10/10 [00:01<00:00,  5.10it/s][A
Epochs:   0%|          | 0/21 [00:13<?, ?it/s]
[32m[I 2023-12-12 00:33:14,581][0m Trial 9 pruned. [0m


Val Loss: 0.4967 - Val Accuracy: 0.8293

Study statistics: 
  Number of finished trials:  10
  Number of pruned trials:  5
  Number of complete trials:  5


In [22]:
print("Best trial:")
trial = study.best_trial

print("  Value: ", trial.value)

print("  Params: ")
for key, value in trial.params.items():
    print("    {}: {}".format(key, value))

Best trial:
  Value:  0.9175874590873718
  Params: 
    batch_size: 268
    epochs: 95
    epsilon: 5.706295335047529e-08
    learning_rate: 0.000287881984666585
    weight_decay: 0.009570542308397574


In [None]:
# ViT 8-8 CrossEntropyLoss

Best trial:
Value:  0.9175874590873718
Params: 
batch_size: 268
epochs: 95
epsilon: 5.706295335047529e-08
learning_rate: 0.000287881984666585
weight_decay: 0.009570542308397574