In [1]:
import os
import random
import pandas as pd
import numpy as np
import mxnet as mx
import torch
import torch.nn as nn
import torch.nn.functional as F
import torch.optim as opt
from torch.utils.data import Dataset, DataLoader
from pytorch_metric_learning import losses
from einops import rearrange, repeat
import optuna
from optuna.trial import TrialState
from tqdm import tqdm

In [2]:
def file_to_embed(embeds, file):
    emb = []
    for f in file:
        emb.append(embeds[f][0])
    return torch.stack(emb)

In [3]:
MIN_NUM_PATCHES = 16

In [4]:
device = torch.device("cuda:2" if torch.cuda.is_available() else "cpu")
device

device(type='cuda', index=2)

In [5]:
class AdienceDataset(Dataset):
    def __init__(self, annot_file, img_dir):
        self.img_lbls = pd.read_csv(annot_file, header=None)
        self.img_dir = img_dir
    
    def __len__(self):
        return len(self.img_lbls)
    
    def __getitem__(self, idx):
        img_file = self.img_lbls.iloc[idx, 0]
        img_path = os.path.join(self.img_dir, img_file)
        image = mx.image.imread(img_path)
        if image.shape[1] != 112:
            image = mx.image.resize_short(image, 112)
        image = mx.nd.transpose(image, axes=(2,0,1))
        image = torch.tensor(image.asnumpy()).type(torch.FloatTensor)
        label = self.img_lbls.iloc[idx, 1]

        return image, label, img_file

In [6]:
train_data = AdienceDataset("../train.csv", "../cropped_Adience/")
val_data = AdienceDataset("../val.csv", "../cropped_Adience/")

In [7]:
class CosFace(nn.Module):
    r"""Implement of CosFace (https://arxiv.org/pdf/1801.09414.pdf):
    Args:
        in_features: size of each input sample
        out_features: size of each output sample
        device_id: the ID of GPU where the model will be trained by model parallel.
                       if device_id=None, it will be trained on CPU without model parallel.
        s: norm of input feature
        m: margin
        cos(theta)-m
    """

    def __init__(self, in_features, out_features, device_id, s=64.0, m=0.35):
        super(CosFace, self).__init__()
        self.in_features = in_features
        self.out_features = out_features
        self.device_id = device_id
        self.s = s
        self.m = m
        print("self.device_id", self.device_id)
        self.weight = nn.Parameter(torch.FloatTensor(out_features, in_features))
        nn.init.xavier_uniform_(self.weight)

    def forward(self, input, label):
        # --------------------------- cos(theta) & phi(theta) ---------------------------

        if self.device_id == None:
            cosine = F.linear(F.normalize(input), F.normalize(self.weight))
        else:
            x = input
            sub_weights = torch.chunk(self.weight, len(self.device_id), dim=0)
            temp_x = x.cuda(self.device_id[0])
            weight = sub_weights[0].cuda(self.device_id[0])
            cosine = F.linear(F.normalize(temp_x), F.normalize(weight))
            for i in range(1, len(self.device_id)):
                temp_x = x.cuda(self.device_id[i])
                weight = sub_weights[i].cuda(self.device_id[i])
                cosine = torch.cat((cosine, F.linear(F.normalize(temp_x), F.normalize(weight)).cuda(self.device_id[0])),
                                   dim=1)
        phi = cosine - self.m
        # --------------------------- convert label to one-hot ---------------------------
        one_hot = torch.zeros(cosine.size())
        if self.device_id != None:
            one_hot = one_hot.cuda(self.device_id[0])
        # one_hot = one_hot.cuda() if cosine.is_cuda else one_hot

        one_hot.scatter_(1, label.view(-1, 1).long(), 1)
        # -------------torch.where(out_i = {x_i if condition_i else y_i) -------------
        output = (one_hot * phi) + (
                    (1.0 - one_hot) * cosine)  # you can use torch.where if your torch.__version__ is 0.4
        output *= self.s

        return output

    def __repr__(self):
        return self.__class__.__name__ + '(' \
               + 'in_features = ' + str(self.in_features) \
               + ', out_features = ' + str(self.out_features) \
               + ', s = ' + str(self.s) \
               + ', m = ' + str(self.m) + ')'

In [8]:
class Residual(nn.Module):
    def __init__(self, fn):
        super().__init__()
        self.fn = fn
    def forward(self, x, **kwargs):
        return self.fn(x, **kwargs) + x

In [9]:
class PreNorm(nn.Module):
    def __init__(self, dim, fn):
        super().__init__()
        self.norm = nn.LayerNorm(dim)
        self.fn = fn
    def forward(self, x, **kwargs):
        return self.fn(self.norm(x), **kwargs)

In [10]:
class FeedForward(nn.Module):
    def __init__(self, dim, hidden_dim, dropout = 0.):
        super().__init__()
        self.net = nn.Sequential(
            nn.Linear(dim, hidden_dim),
            nn.GELU(),
            nn.Dropout(dropout),
            nn.Linear(hidden_dim, dim),
            nn.Dropout(dropout)
        )
    def forward(self, x):
        return self.net(x)

In [11]:
class Attention(nn.Module):
    def __init__(self, dim, heads = 8, dim_head = 64, dropout = 0.):
        super().__init__()
        inner_dim = dim_head *  heads
        self.heads = heads
        self.scale = dim ** -0.5

        self.to_qkv = nn.Linear(dim, inner_dim * 3, bias = False)
        self.to_out = nn.Sequential(
            nn.Linear(inner_dim, dim),
            nn.Dropout(dropout)
        )

    def forward(self, x, mask = None):
        b, n, _, h = *x.shape, self.heads
        qkv = self.to_qkv(x).chunk(3, dim = -1)

        q, k, v = map(lambda t: rearrange(t, 'b n (h d) -> b h n d', h = h), qkv)
        dots = torch.einsum('bhid,bhjd->bhij', q, k) * self.scale
        mask_value = -torch.finfo(dots.dtype).max
        #embed()
        if mask is not None:
            mask = F.pad(mask.flatten(1), (1, 0), value = True)
            assert mask.shape[-1] == dots.shape[-1], 'mask has incorrect dimensions'
            mask = mask[:, None, :] * mask[:, :, None]
            dots.masked_fill_(~mask, mask_value)
            del mask

        attn = dots.softmax(dim=-1)

        out = torch.einsum('bhij,bhjd->bhid', attn, v)
        out = rearrange(out, 'b h n d -> b n (h d)')
        out =  self.to_out(out)

        return out

In [12]:
class Transformer(nn.Module):
    def __init__(self, dim, depth, heads, dim_head, mlp_dim, dropout):
        super().__init__()
        self.layers = nn.ModuleList([])
        for _ in range(depth):
            self.layers.append(nn.ModuleList([
                Residual(PreNorm(dim, Attention(dim, heads = heads, dim_head = dim_head, dropout = dropout))),
                Residual(PreNorm(dim, FeedForward(dim, mlp_dim, dropout = dropout)))
            ]))
    def forward(self, x, mask = None):
        for attn, ff in self.layers:
            x = attn(x, mask = mask)
            #embed()
            x = ff(x)
        return x

In [13]:
class ViTs_face(nn.Module):
    def __init__(self, *, loss_type, GPU_ID, num_class, image_size, patch_size, ac_patch_size,
                         pad, dim, depth, heads, mlp_dim, pool = 'mean', channels = 3, dim_head = 64, dropout = 0., emb_dropout = 0.):
        super().__init__()
        assert image_size % patch_size == 0, 'Image dimensions must be divisible by the patch size.'
        num_patches = (image_size // patch_size) ** 2
        patch_dim = channels * ac_patch_size ** 2
        assert num_patches > MIN_NUM_PATCHES, f'your number of patches ({num_patches}) is way too small for attention to be effective (at least 16). Try decreasing your patch size'
        assert pool in {'cls', 'mean'}, 'pool type must be either cls (cls token) or mean (mean pooling)'

        self.patch_size = patch_size
        self.soft_split = nn.Unfold(kernel_size=(ac_patch_size, ac_patch_size), stride=(self.patch_size, self.patch_size), padding=(pad, pad))


        self.pos_embedding = nn.Parameter(torch.randn(1, num_patches + 1, dim))
        self.patch_to_embedding = nn.Linear(patch_dim, dim)
        self.cls_token = nn.Parameter(torch.randn(1, 1, dim))
        self.dropout = nn.Dropout(emb_dropout)

        self.transformer = Transformer(dim, depth, heads, dim_head, mlp_dim, dropout)

        self.pool = pool
        self.to_latent = nn.Identity()

        self.mlp_head = nn.Sequential(
            nn.LayerNorm(dim),
        )
        self.loss_type = loss_type
        self.GPU_ID = GPU_ID
        if self.loss_type == 'None':
            print("no loss for vit_face")
        else:
            if self.loss_type == 'CosFace':
                self.loss = CosFace(in_features=dim, out_features=num_class, device_id=self.GPU_ID)

    def forward(self, img, label= None , mask = None):
        p = self.patch_size
        x = self.soft_split(img).transpose(1, 2)
        x = self.patch_to_embedding(x)
        b, n, _ = x.shape

        cls_tokens = repeat(self.cls_token, '() n d -> b n d', b = b)
        x = torch.cat((cls_tokens, x), dim=1)
        x += self.pos_embedding[:, :(n + 1)]
        x = self.dropout(x)
        x = self.transformer(x, mask)

        # y = x[:, 0]
        z = x[:, 1:].mean(dim = 1)

        # y = self.to_latent(y)
        # emb_y = self.mlp_head(y)
        z = self.to_latent(z)
        emb_z = self.mlp_head(z)
        # emb = torch.cat((emb_y, emb_z), dim=1)
        emb = emb_z
        if label is not None:
            x = self.loss(emb, label)
            return x, emb
        else:
            return emb

In [14]:
class ViT_plus(nn.Module):
    def __init__(self):
        super(ViT_plus, self).__init__()
        
        self.fc1 = nn.Linear(in_features=512, out_features=512)
        self.fc2 = nn.Linear(in_features=512, out_features=2)
        
    def forward(self, x):
        x = self.fc1(x)
        x_cosface = x
        x_classification = self.fc2(x)
        
        return x_cosface, x_classification

In [15]:
model = ViTs_face(
            loss_type='CosFace',
            GPU_ID=[device],
            num_class=93431,
            image_size=112,
            patch_size=8,
            ac_patch_size=12,
            pad=4,
            dim=512,
            depth=20,
            heads=8,
            mlp_dim=2048,
            dropout=0.1,
            emb_dropout=0.1
        ).to(device)
model.load_state_dict(
    torch.load("../Backbone_VITs_Epoch_2_Batch_12000_Time_2021-03-17-04-05_checkpoint.pth", map_location=device)
)

self.device_id [device(type='cuda', index=2)]


<All keys matched successfully>

In [16]:
for param in model.parameters():
    param.requires_grad = False

In [17]:
embeds = {}
model.eval()

with torch.no_grad():
    for img, label, file in train_data:
        img = img.to(device)
        embeds[file] = model(torch.unsqueeze(img, 0))

    for img, label, file in val_data:
        img = img.to(device)
        embeds[file] = model(torch.unsqueeze(img, 0))

In [18]:
best_accu = 0.0
def objective(trial):
    model_xtr = ViT_plus().to(device)
    
    loss_lr = trial.suggest_float("loss_learning_rate", 1e-4, 1e-2, log=True)
    cos_margin = losses.CosFaceLoss(2, 512).to(device)
    loss_optimizer = opt.AdamW(cos_margin.parameters(), lr=loss_lr)
    
    lr = trial.suggest_float("learning_rate", 1e-5, 1e-1, log=True)
    wd = trial.suggest_float('weight_decay', 1e-4, 1e-2, log=True)
    eps = trial.suggest_float("epsilon", 1e-9, 1e-7, log=True)
    optimizer = opt.AdamW(model_xtr.parameters(), lr=lr, eps=eps, weight_decay=wd)
    
    criterion = nn.CrossEntropyLoss()
    
    batch_size = trial.suggest_int('batch_size', 50, 300)
    num_epochs = trial.suggest_int('epochs', 10, 100)
    
    print("Learning rate for Loss: "+ str(loss_lr))
    print("Learning rate: "+ str(lr))
    print("Weight decay: "+ str(wd))
    print("Epsilon: "+ str(eps))
    print("Batch size: "+ str(batch_size))
    print("Number of epochs: "+ str(num_epochs))
    
    for epoch in tqdm(range(num_epochs), desc="Epochs"):
        train_loader = DataLoader(train_data, batch_size=batch_size, shuffle=True, num_workers=4)
        val_loader = DataLoader(val_data, batch_size=batch_size, shuffle=False, num_workers=4)
        
        # training loop
        running_loss = []
        running_accu = []
        
        model_xtr.train()
        for img, label, file in tqdm(train_loader, desc="Training", leave=False):
            img, label = img.to(device), label.to(device)

            x = file_to_embed(embeds, file)
            
            optimizer.zero_grad()
            embed, output = model_xtr(x)
            
            pred = torch.argmax(output, 1)
            accuracy = torch.eq(pred, label).sum() / len(img)

            class_loss = criterion(output, label)
            cos_loss = cos_margin(embed, label)
            loss = class_loss + cos_loss
            loss.backward()
            loss_optimizer.step()
            optimizer.step()

            running_accu.append(accuracy.cpu().detach().numpy())
            running_loss.append(loss.cpu().detach().numpy())
        print("Epoch: {}/{} - Loss: {:.4f} - Accuracy: {:.4f}".format(epoch+1, num_epochs, np.mean(running_loss), np.mean(running_accu)))
        
        # validation loop
        val_loss = []
        val_accu = []

        model_xtr.eval()
        with torch.no_grad():
            for img, label, file in tqdm(val_loader):
                img, label = img.to(device), label.to(device)
                
                x = file_to_embed(embeds, file)
                
                embed, output = model_xtr(x)
                
                pred = torch.argmax(output, 1)
                accuracy = torch.eq(pred, label).sum() / len(img)
                
                class_loss = criterion(output, label)
                cos_loss = cos_margin(embed, label)
                loss = class_loss + cos_loss
                
                val_accu.append(accuracy.cpu().detach().numpy())
                val_loss.append(loss.cpu().detach().numpy())
        val_accu = np.mean(val_accu)
        val_loss = np.mean(val_loss)
        print("Val Loss: {:.4f} - Val Accuracy: {:.4f}".format(val_loss, val_accu))
        
        trial.report(val_accu, epoch)
        if trial.should_prune():
            raise optuna.exceptions.TrialPruned()
    
    global best_accu
    if val_accu > best_accu:
        best_accu = val_accu
        print("Saving best model...")
        torch.save(model_xtr.state_dict(), "../vit_12-8_cosface_mean_only.pt")
            
    return val_accu

In [19]:
study = optuna.create_study(direction='maximize',
                            study_name='cosface-12-8-mean-only-vit-study',
                            storage='sqlite:///study2.db',
                            load_if_exists=True)
study.optimize(objective, n_trials=20)

pruned_trials = study.get_trials(deepcopy=False, states=[TrialState.PRUNED])
complete_trials = study.get_trials(deepcopy=False, states=[TrialState.COMPLETE])

# Display the study statistics
print("\nStudy statistics: ")
print("  Number of finished trials: ", len(study.trials))
print("  Number of pruned trials: ", len(pruned_trials))
print("  Number of complete trials: ", len(complete_trials))

[32m[I 2023-12-14 22:16:12,794][0m A new study created in RDB with name: cosface-12-8-mean-only-vit-study[0m


Learning rate for Loss: 0.0007572018927627318
Learning rate: 0.0013729418906665127
Weight decay: 0.006436609159123359
Epsilon: 9.49605063494801e-08
Batch size: 296
Number of epochs: 71


Epochs:   0%|          | 0/71 [00:00<?, ?it/s]
Training:   0%|          | 0/48 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/48 [00:02<01:44,  2.22s/it][A
Training:   4%|▍         | 2/48 [00:02<00:45,  1.01it/s][A
Training:   8%|▊         | 4/48 [00:02<00:18,  2.37it/s][A
Training:  10%|█         | 5/48 [00:03<00:28,  1.49it/s][A
Training:  12%|█▎        | 6/48 [00:03<00:21,  1.97it/s][A
Training:  17%|█▋        | 8/48 [00:03<00:11,  3.40it/s][A
Training:  21%|██        | 10/48 [00:05<00:20,  1.84it/s][A
Training:  23%|██▎       | 11/48 [00:05<00:16,  2.23it/s][A
Training:  25%|██▌       | 12/48 [00:06<00:13,  2.70it/s][A
Training:  27%|██▋       | 13/48 [00:07<00:19,  1.78it/s][A
Training:  29%|██▉       | 14/48 [00:07<00:16,  2.12it/s][A
Training:  35%|███▌      | 17/48 [00:08<00:14,  2.18it/s][A
Training:  38%|███▊      | 18/48 [00:09<00:13,  2.23it/s][A
Training:  42%|████▏     | 20/48 [00:09<00:08,  3.23it/s][A
Training:  44%|████▍     | 21/48 [00:10<00:12,  2.13i

Epoch: 1/71 - Loss: 9.8028 - Accuracy: 0.7304



  0%|          | 0/6 [00:00<?, ?it/s][A
 17%|█▋        | 1/6 [00:02<00:14,  2.83s/it][A
 33%|███▎      | 2/6 [00:02<00:04,  1.24s/it][A
 50%|█████     | 3/6 [00:03<00:02,  1.39it/s][A
100%|██████████| 6/6 [00:05<00:00,  1.16it/s][A
Epochs:   1%|▏         | 1/71 [00:29<34:29, 29.56s/it]

Val Loss: 5.0560 - Val Accuracy: 0.9053



Training:   0%|          | 0/48 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/48 [00:03<02:23,  3.05s/it][A
Training:   8%|▊         | 4/48 [00:03<00:27,  1.62it/s][A
Training:  12%|█▎        | 6/48 [00:05<00:33,  1.25it/s][A
Training:  15%|█▍        | 7/48 [00:05<00:26,  1.56it/s][A
Training:  17%|█▋        | 8/48 [00:05<00:20,  1.98it/s][A
Training:  19%|█▉        | 9/48 [00:06<00:29,  1.33it/s][A
Training:  23%|██▎       | 11/48 [00:07<00:16,  2.19it/s][A
Training:  25%|██▌       | 12/48 [00:07<00:14,  2.55it/s][A
Training:  27%|██▋       | 13/48 [00:09<00:26,  1.31it/s][A
Training:  29%|██▉       | 14/48 [00:09<00:20,  1.69it/s][A
Training:  31%|███▏      | 15/48 [00:09<00:15,  2.17it/s][A
Training:  33%|███▎      | 16/48 [00:09<00:11,  2.67it/s][A
Training:  35%|███▌      | 17/48 [00:11<00:22,  1.41it/s][A
Training:  40%|███▉      | 19/48 [00:11<00:12,  2.39it/s][A
Training:  44%|████▍     | 21/48 [00:13<00:16,  1.59it/s][A
Training:  46%|████▌     | 22/48 [00:1

Epoch: 2/71 - Loss: 4.5154 - Accuracy: 0.9178



  0%|          | 0/6 [00:00<?, ?it/s][A
 17%|█▋        | 1/6 [00:02<00:13,  2.61s/it][A
 33%|███▎      | 2/6 [00:02<00:04,  1.15s/it][A
 50%|█████     | 3/6 [00:02<00:02,  1.48it/s][A
100%|██████████| 6/6 [00:04<00:00,  1.26it/s][A
Epochs:   3%|▎         | 2/71 [01:00<34:57, 30.39s/it]

Val Loss: 4.6236 - Val Accuracy: 0.9155



Training:   0%|          | 0/48 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/48 [00:02<02:06,  2.68s/it][A
Training:   8%|▊         | 4/48 [00:02<00:23,  1.85it/s][A
Training:  12%|█▎        | 6/48 [00:04<00:31,  1.33it/s][A
Training:  17%|█▋        | 8/48 [00:05<00:19,  2.01it/s][A
Training:  19%|█▉        | 9/48 [00:06<00:29,  1.33it/s][A
Training:  23%|██▎       | 11/48 [00:06<00:18,  2.03it/s][A
Training:  27%|██▋       | 13/48 [00:08<00:22,  1.53it/s][A
Training:  35%|███▌      | 17/48 [00:10<00:16,  1.90it/s][A
Training:  38%|███▊      | 18/48 [00:10<00:13,  2.16it/s][A
Training:  40%|███▉      | 19/48 [00:10<00:11,  2.46it/s][A
Training:  42%|████▏     | 20/48 [00:10<00:09,  2.91it/s][A
Training:  44%|████▍     | 21/48 [00:12<00:19,  1.37it/s][A
Training:  46%|████▌     | 22/48 [00:12<00:15,  1.69it/s][A
Training:  50%|█████     | 24/48 [00:13<00:09,  2.64it/s][A
Training:  52%|█████▏    | 25/48 [00:14<00:15,  1.51it/s][A
Training:  54%|█████▍    | 26/48 [00:

Epoch: 3/71 - Loss: 4.2497 - Accuracy: 0.9238



  0%|          | 0/6 [00:00<?, ?it/s][A
 17%|█▋        | 1/6 [00:03<00:15,  3.10s/it][A
 67%|██████▋   | 4/6 [00:03<00:01,  1.60it/s][A
100%|██████████| 6/6 [00:04<00:00,  1.21it/s][A
Epochs:   4%|▍         | 3/71 [01:32<35:00, 30.89s/it]

Val Loss: 3.7737 - Val Accuracy: 0.9310



Training:   0%|          | 0/48 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/48 [00:02<02:02,  2.61s/it][A
Training:   6%|▋         | 3/48 [00:02<00:33,  1.34it/s][A
Training:  10%|█         | 5/48 [00:04<00:37,  1.14it/s][A
Training:  15%|█▍        | 7/48 [00:04<00:22,  1.83it/s][A
Training:  17%|█▋        | 8/48 [00:05<00:17,  2.25it/s][A
Training:  19%|█▉        | 9/48 [00:06<00:29,  1.31it/s][A
Training:  23%|██▎       | 11/48 [00:06<00:17,  2.09it/s][A
Training:  27%|██▋       | 13/48 [00:08<00:21,  1.62it/s][A
Training:  29%|██▉       | 14/48 [00:08<00:17,  1.97it/s][A
Training:  31%|███▏      | 15/48 [00:08<00:13,  2.36it/s][A
Training:  35%|███▌      | 17/48 [00:10<00:17,  1.73it/s][A
Training:  38%|███▊      | 18/48 [00:10<00:14,  2.09it/s][A
Training:  42%|████▏     | 20/48 [00:10<00:09,  3.02it/s][A
Training:  44%|████▍     | 21/48 [00:12<00:16,  1.62it/s][A
Training:  46%|████▌     | 22/48 [00:12<00:13,  1.89it/s][A
Training:  48%|████▊     | 23/48 [00:1

Epoch: 4/71 - Loss: 4.3774 - Accuracy: 0.9222



  0%|          | 0/6 [00:00<?, ?it/s][A
 17%|█▋        | 1/6 [00:02<00:14,  2.86s/it][A
100%|██████████| 6/6 [00:05<00:00,  1.19it/s][A
Epochs:   6%|▌         | 4/71 [02:02<34:30, 30.90s/it]

Val Loss: 4.5269 - Val Accuracy: 0.9218



Training:   0%|          | 0/48 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/48 [00:02<02:08,  2.73s/it][A
Training:   4%|▍         | 2/48 [00:02<00:56,  1.22s/it][A
Training:   6%|▋         | 3/48 [00:03<00:33,  1.36it/s][A
Training:   8%|▊         | 4/48 [00:03<00:22,  1.97it/s][A
Training:  10%|█         | 5/48 [00:05<00:48,  1.12s/it][A
Training:  12%|█▎        | 6/48 [00:05<00:32,  1.29it/s][A
Training:  15%|█▍        | 7/48 [00:05<00:23,  1.78it/s][A
Training:  19%|█▉        | 9/48 [00:07<00:24,  1.58it/s][A
Training:  21%|██        | 10/48 [00:07<00:19,  1.99it/s][A
Training:  25%|██▌       | 12/48 [00:07<00:12,  2.92it/s][A
Training:  27%|██▋       | 13/48 [00:08<00:19,  1.77it/s][A
Training:  29%|██▉       | 14/48 [00:09<00:19,  1.73it/s][A
Training:  33%|███▎      | 16/48 [00:09<00:11,  2.74it/s][A
Training:  35%|███▌      | 17/48 [00:10<00:18,  1.65it/s][A
Training:  38%|███▊      | 18/48 [00:11<00:19,  1.57it/s][A
Training:  40%|███▉      | 19/48 [00:11<

Epoch: 5/71 - Loss: 3.6925 - Accuracy: 0.9346



  0%|          | 0/6 [00:00<?, ?it/s][A
 17%|█▋        | 1/6 [00:02<00:13,  2.66s/it][A
 33%|███▎      | 2/6 [00:02<00:04,  1.16s/it][A
 50%|█████     | 3/6 [00:02<00:02,  1.47it/s][A
100%|██████████| 6/6 [00:04<00:00,  1.23it/s][A
Epochs:   7%|▋         | 5/71 [02:34<34:07, 31.02s/it]

Val Loss: 4.3729 - Val Accuracy: 0.9249



Training:   0%|          | 0/48 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/48 [00:02<02:05,  2.67s/it][A
Training:   4%|▍         | 2/48 [00:02<00:58,  1.26s/it][A
Training:   8%|▊         | 4/48 [00:03<00:22,  1.95it/s][A
Training:  10%|█         | 5/48 [00:04<00:35,  1.22it/s][A
Training:  12%|█▎        | 6/48 [00:04<00:26,  1.59it/s][A
Training:  15%|█▍        | 7/48 [00:04<00:19,  2.08it/s][A
Training:  19%|█▉        | 9/48 [00:06<00:27,  1.44it/s][A
Training:  21%|██        | 10/48 [00:07<00:23,  1.63it/s][A
Training:  23%|██▎       | 11/48 [00:07<00:17,  2.08it/s][A
Training:  27%|██▋       | 13/48 [00:08<00:20,  1.71it/s][A
Training:  29%|██▉       | 14/48 [00:09<00:19,  1.71it/s][A
Training:  31%|███▏      | 15/48 [00:09<00:15,  2.12it/s][A
Training:  33%|███▎      | 16/48 [00:09<00:12,  2.62it/s][A
Training:  35%|███▌      | 17/48 [00:11<00:21,  1.42it/s][A
Training:  38%|███▊      | 18/48 [00:11<00:17,  1.73it/s][A
Training:  40%|███▉      | 19/48 [00:11

Epoch: 6/71 - Loss: 3.6771 - Accuracy: 0.9336



  0%|          | 0/6 [00:00<?, ?it/s][A
 17%|█▋        | 1/6 [00:02<00:13,  2.71s/it][A
 33%|███▎      | 2/6 [00:02<00:04,  1.21s/it][A
 50%|█████     | 3/6 [00:03<00:02,  1.39it/s][A
 83%|████████▎ | 5/6 [00:04<00:00,  1.46it/s][A
100%|██████████| 6/6 [00:04<00:00,  1.32it/s][A
Epochs:   8%|▊         | 6/71 [03:05<33:33, 30.98s/it]

Val Loss: 4.2419 - Val Accuracy: 0.9276



Training:   0%|          | 0/48 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/48 [00:02<01:57,  2.50s/it][A
Training:   6%|▋         | 3/48 [00:02<00:31,  1.43it/s][A
Training:  10%|█         | 5/48 [00:04<00:30,  1.40it/s][A
Training:  15%|█▍        | 7/48 [00:04<00:17,  2.31it/s][A
Training:  19%|█▉        | 9/48 [00:05<00:23,  1.68it/s][A
Training:  23%|██▎       | 11/48 [00:06<00:15,  2.41it/s][A
Training:  27%|██▋       | 13/48 [00:07<00:18,  1.92it/s][A
Training:  31%|███▏      | 15/48 [00:07<00:12,  2.63it/s][A
Training:  33%|███▎      | 16/48 [00:07<00:10,  3.02it/s][A
Training:  35%|███▌      | 17/48 [00:09<00:19,  1.60it/s][A
Training:  40%|███▉      | 19/48 [00:09<00:12,  2.34it/s][A
Training:  42%|████▏     | 20/48 [00:09<00:10,  2.64it/s][A
Training:  44%|████▍     | 21/48 [00:11<00:18,  1.49it/s][A
Training:  46%|████▌     | 22/48 [00:11<00:13,  1.87it/s][A
Training:  48%|████▊     | 23/48 [00:11<00:10,  2.36it/s][A
Training:  52%|█████▏    | 25/48 [00:

Epoch: 7/71 - Loss: 3.7629 - Accuracy: 0.9338



  0%|          | 0/6 [00:00<?, ?it/s][A
 17%|█▋        | 1/6 [00:02<00:13,  2.70s/it][A
 50%|█████     | 3/6 [00:02<00:02,  1.33it/s][A
100%|██████████| 6/6 [00:04<00:00,  1.33it/s][A
Epochs:  10%|▉         | 7/71 [03:32<31:58, 29.98s/it]

Val Loss: 3.5672 - Val Accuracy: 0.9333



Training:   0%|          | 0/48 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/48 [00:02<01:45,  2.25s/it][A
Training:   6%|▋         | 3/48 [00:02<00:28,  1.58it/s][A
Training:  10%|█         | 5/48 [00:04<00:32,  1.31it/s][A
Training:  15%|█▍        | 7/48 [00:04<00:19,  2.08it/s][A
Training:  17%|█▋        | 8/48 [00:04<00:15,  2.50it/s][A
Training:  19%|█▉        | 9/48 [00:06<00:26,  1.46it/s][A
Training:  23%|██▎       | 11/48 [00:06<00:16,  2.30it/s][A
Training:  27%|██▋       | 13/48 [00:07<00:20,  1.71it/s][A
Training:  31%|███▏      | 15/48 [00:08<00:14,  2.33it/s][A
Training:  35%|███▌      | 17/48 [00:09<00:16,  1.92it/s][A
Training:  38%|███▊      | 18/48 [00:09<00:13,  2.24it/s][A
Training:  40%|███▉      | 19/48 [00:10<00:13,  2.14it/s][A
Training:  44%|████▍     | 21/48 [00:11<00:14,  1.93it/s][A
Training:  46%|████▌     | 22/48 [00:11<00:12,  2.16it/s][A
Training:  48%|████▊     | 23/48 [00:12<00:13,  1.85it/s][A
Training:  50%|█████     | 24/48 [00:1

Epoch: 8/71 - Loss: 3.3569 - Accuracy: 0.9393



  0%|          | 0/6 [00:00<?, ?it/s][A
 17%|█▋        | 1/6 [00:02<00:11,  2.36s/it][A
 50%|█████     | 3/6 [00:02<00:02,  1.48it/s][A
 67%|██████▋   | 4/6 [00:02<00:00,  2.07it/s][A
100%|██████████| 6/6 [00:04<00:00,  1.43it/s][A
Epochs:  11%|█▏        | 8/71 [04:02<31:11, 29.71s/it]

Val Loss: 3.5455 - Val Accuracy: 0.9355



Training:   0%|          | 0/48 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/48 [00:02<01:51,  2.36s/it][A
Training:   4%|▍         | 2/48 [00:02<00:55,  1.20s/it][A
Training:   8%|▊         | 4/48 [00:02<00:21,  2.01it/s][A
Training:  10%|█         | 5/48 [00:04<00:34,  1.26it/s][A
Training:  12%|█▎        | 6/48 [00:04<00:27,  1.53it/s][A
Training:  15%|█▍        | 7/48 [00:04<00:20,  2.00it/s][A
Training:  17%|█▋        | 8/48 [00:05<00:15,  2.56it/s][A
Training:  19%|█▉        | 9/48 [00:06<00:27,  1.42it/s][A
Training:  21%|██        | 10/48 [00:06<00:24,  1.56it/s][A
Training:  23%|██▎       | 11/48 [00:07<00:18,  2.03it/s][A
Training:  25%|██▌       | 12/48 [00:07<00:13,  2.60it/s][A
Training:  27%|██▋       | 13/48 [00:08<00:24,  1.45it/s][A
Training:  29%|██▉       | 14/48 [00:09<00:21,  1.61it/s][A
Training:  31%|███▏      | 15/48 [00:09<00:15,  2.15it/s][A
Training:  33%|███▎      | 16/48 [00:09<00:11,  2.79it/s][A
Training:  35%|███▌      | 17/48 [00:10<

Epoch: 9/71 - Loss: 3.3188 - Accuracy: 0.9406



  0%|          | 0/6 [00:00<?, ?it/s][A
 17%|█▋        | 1/6 [00:02<00:11,  2.33s/it][A
 33%|███▎      | 2/6 [00:02<00:04,  1.05s/it][A
 50%|█████     | 3/6 [00:02<00:01,  1.61it/s][A
100%|██████████| 6/6 [00:04<00:00,  1.44it/s][A
Epochs:  13%|█▎        | 9/71 [04:32<31:03, 30.05s/it]

Val Loss: 3.7831 - Val Accuracy: 0.9362



Training:   0%|          | 0/48 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/48 [00:02<02:05,  2.66s/it][A
Training:   6%|▋         | 3/48 [00:02<00:33,  1.35it/s][A
Training:  10%|█         | 5/48 [00:04<00:31,  1.35it/s][A
Training:  12%|█▎        | 6/48 [00:04<00:26,  1.58it/s][A
Training:  15%|█▍        | 7/48 [00:04<00:20,  2.04it/s][A
Training:  17%|█▋        | 8/48 [00:04<00:16,  2.49it/s][A
Training:  19%|█▉        | 9/48 [00:06<00:28,  1.39it/s][A
Training:  21%|██        | 10/48 [00:06<00:25,  1.51it/s][A
Training:  23%|██▎       | 11/48 [00:07<00:18,  1.99it/s][A
Training:  25%|██▌       | 12/48 [00:07<00:13,  2.61it/s][A
Training:  27%|██▋       | 13/48 [00:08<00:22,  1.54it/s][A
Training:  29%|██▉       | 14/48 [00:09<00:22,  1.51it/s][A
Training:  31%|███▏      | 15/48 [00:09<00:16,  2.00it/s][A
Training:  33%|███▎      | 16/48 [00:09<00:12,  2.61it/s][A
Training:  35%|███▌      | 17/48 [00:10<00:18,  1.66it/s][A
Training:  38%|███▊      | 18/48 [00:11

Epoch: 10/71 - Loss: 3.2399 - Accuracy: 0.9424



  0%|          | 0/6 [00:00<?, ?it/s][A
 17%|█▋        | 1/6 [00:02<00:13,  2.66s/it][A
100%|██████████| 6/6 [00:04<00:00,  1.25it/s][A
Epochs:  14%|█▍        | 10/71 [05:04<30:53, 30.38s/it]

Val Loss: 3.3675 - Val Accuracy: 0.9369



Training:   0%|          | 0/48 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/48 [00:02<01:50,  2.35s/it][A
Training:   4%|▍         | 2/48 [00:02<00:52,  1.15s/it][A
Training:   6%|▋         | 3/48 [00:02<00:31,  1.44it/s][A
Training:   8%|▊         | 4/48 [00:02<00:20,  2.15it/s][A
Training:  10%|█         | 5/48 [00:04<00:37,  1.16it/s][A
Training:  12%|█▎        | 6/48 [00:04<00:27,  1.55it/s][A
Training:  17%|█▋        | 8/48 [00:04<00:14,  2.82it/s][A
Training:  19%|█▉        | 9/48 [00:06<00:32,  1.22it/s][A
Training:  23%|██▎       | 11/48 [00:07<00:18,  2.02it/s][A
Training:  25%|██▌       | 12/48 [00:07<00:14,  2.41it/s][A
Training:  27%|██▋       | 13/48 [00:09<00:26,  1.33it/s][A
Training:  31%|███▏      | 15/48 [00:09<00:16,  2.04it/s][A
Training:  35%|███▌      | 17/48 [00:11<00:20,  1.50it/s][A
Training:  40%|███▉      | 19/48 [00:11<00:13,  2.13it/s][A
Training:  42%|████▏     | 20/48 [00:11<00:11,  2.45it/s][A
Training:  44%|████▍     | 21/48 [00:13<

Epoch: 11/71 - Loss: 3.2548 - Accuracy: 0.9422



  0%|          | 0/6 [00:00<?, ?it/s][A
 17%|█▋        | 1/6 [00:02<00:11,  2.37s/it][A
 33%|███▎      | 2/6 [00:02<00:04,  1.03s/it][A
 67%|██████▋   | 4/6 [00:02<00:00,  2.34it/s][A
100%|██████████| 6/6 [00:04<00:00,  1.36it/s][A
Epochs:  15%|█▌        | 11/71 [05:34<30:26, 30.43s/it]

Val Loss: 3.7303 - Val Accuracy: 0.9303



Training:   0%|          | 0/48 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/48 [00:02<02:12,  2.81s/it][A
Training:   4%|▍         | 2/48 [00:02<00:56,  1.24s/it][A
Training:   8%|▊         | 4/48 [00:03<00:22,  1.96it/s][A
Training:  10%|█         | 5/48 [00:04<00:35,  1.20it/s][A
Training:  12%|█▎        | 6/48 [00:04<00:26,  1.56it/s][A
Training:  17%|█▋        | 8/48 [00:05<00:15,  2.56it/s][A
Training:  19%|█▉        | 9/48 [00:06<00:25,  1.51it/s][A
Training:  21%|██        | 10/48 [00:06<00:22,  1.69it/s][A
Training:  23%|██▎       | 11/48 [00:07<00:17,  2.11it/s][A
Training:  25%|██▌       | 12/48 [00:07<00:17,  2.08it/s][A
Training:  27%|██▋       | 13/48 [00:08<00:23,  1.52it/s][A
Training:  29%|██▉       | 14/48 [00:09<00:22,  1.48it/s][A
Training:  33%|███▎      | 16/48 [00:09<00:15,  2.03it/s][A
Training:  35%|███▌      | 17/48 [00:10<00:17,  1.74it/s][A
Training:  38%|███▊      | 18/48 [00:11<00:18,  1.66it/s][A
Training:  42%|████▏     | 20/48 [00:12

Epoch: 12/71 - Loss: 3.1291 - Accuracy: 0.9430



  0%|          | 0/6 [00:00<?, ?it/s][A
 17%|█▋        | 1/6 [00:02<00:14,  2.85s/it][A
 50%|█████     | 3/6 [00:02<00:02,  1.28it/s][A
100%|██████████| 6/6 [00:05<00:00,  1.17it/s][A
Epochs:  17%|█▋        | 12/71 [06:06<30:20, 30.85s/it]

Val Loss: 3.4576 - Val Accuracy: 0.9397



Training:   0%|          | 0/48 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/48 [00:02<02:08,  2.74s/it][A
Training:   4%|▍         | 2/48 [00:02<00:54,  1.19s/it][A
Training:   6%|▋         | 3/48 [00:02<00:31,  1.43it/s][A
Training:   8%|▊         | 4/48 [00:03<00:21,  2.09it/s][A
Training:  10%|█         | 5/48 [00:05<00:44,  1.03s/it][A
Training:  12%|█▎        | 6/48 [00:05<00:30,  1.38it/s][A
Training:  17%|█▋        | 8/48 [00:05<00:16,  2.38it/s][A
Training:  19%|█▉        | 9/48 [00:07<00:28,  1.38it/s][A
Training:  21%|██        | 10/48 [00:07<00:21,  1.78it/s][A
Training:  25%|██▌       | 12/48 [00:07<00:12,  2.79it/s][A
Training:  27%|██▋       | 13/48 [00:09<00:26,  1.33it/s][A
Training:  29%|██▉       | 14/48 [00:09<00:20,  1.68it/s][A
Training:  31%|███▏      | 15/48 [00:09<00:15,  2.16it/s][A
Training:  33%|███▎      | 16/48 [00:09<00:11,  2.71it/s][A
Training:  35%|███▌      | 17/48 [00:11<00:23,  1.32it/s][A
Training:  38%|███▊      | 18/48 [00:11<

Epoch: 13/71 - Loss: 3.2912 - Accuracy: 0.9418



  0%|          | 0/6 [00:00<?, ?it/s][A
 17%|█▋        | 1/6 [00:02<00:14,  2.80s/it][A
 67%|██████▋   | 4/6 [00:02<00:01,  1.78it/s][A
100%|██████████| 6/6 [00:05<00:00,  1.17it/s][A
Epochs:  18%|█▊        | 13/71 [06:37<30:00, 31.04s/it]

Val Loss: 4.3436 - Val Accuracy: 0.9242



Training:   0%|          | 0/48 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/48 [00:02<02:16,  2.90s/it][A
Training:   6%|▋         | 3/48 [00:03<00:35,  1.27it/s][A
Training:  10%|█         | 5/48 [00:04<00:36,  1.17it/s][A
Training:  12%|█▎        | 6/48 [00:05<00:28,  1.47it/s][A
Training:  15%|█▍        | 7/48 [00:05<00:21,  1.92it/s][A
Training:  19%|█▉        | 9/48 [00:07<00:27,  1.42it/s][A
Training:  21%|██        | 10/48 [00:07<00:23,  1.62it/s][A
Training:  25%|██▌       | 12/48 [00:07<00:14,  2.44it/s][A
Training:  27%|██▋       | 13/48 [00:09<00:23,  1.49it/s][A
Training:  29%|██▉       | 14/48 [00:09<00:19,  1.72it/s][A
Training:  31%|███▏      | 15/48 [00:09<00:15,  2.11it/s][A
Training:  33%|███▎      | 16/48 [00:09<00:12,  2.64it/s][A
Training:  35%|███▌      | 17/48 [00:11<00:22,  1.35it/s][A
Training:  38%|███▊      | 18/48 [00:11<00:19,  1.57it/s][A
Training:  40%|███▉      | 19/48 [00:12<00:15,  1.81it/s][A
Training:  42%|████▏     | 20/48 [00:1

Epoch: 14/71 - Loss: 3.0925 - Accuracy: 0.9444



  0%|          | 0/6 [00:00<?, ?it/s][A
 17%|█▋        | 1/6 [00:02<00:11,  2.26s/it][A
 33%|███▎      | 2/6 [00:02<00:04,  1.02s/it][A
100%|██████████| 6/6 [00:04<00:00,  1.36it/s][A
Epochs:  20%|█▉        | 14/71 [07:08<29:16, 30.81s/it]

Val Loss: 3.4795 - Val Accuracy: 0.9368



Training:   0%|          | 0/48 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/48 [00:02<02:12,  2.81s/it][A
Training:   4%|▍         | 2/48 [00:02<00:56,  1.22s/it][A
Training:   8%|▊         | 4/48 [00:03<00:22,  1.97it/s][A
Training:  10%|█         | 5/48 [00:04<00:39,  1.09it/s][A
Training:  15%|█▍        | 7/48 [00:05<00:21,  1.95it/s][A
Training:  19%|█▉        | 9/48 [00:07<00:28,  1.37it/s][A
Training:  21%|██        | 10/48 [00:07<00:23,  1.65it/s][A
Training:  23%|██▎       | 11/48 [00:07<00:18,  2.04it/s][A
Training:  27%|██▋       | 13/48 [00:09<00:22,  1.58it/s][A
Training:  29%|██▉       | 14/48 [00:09<00:18,  1.83it/s][A
Training:  31%|███▏      | 15/48 [00:09<00:14,  2.25it/s][A
Training:  33%|███▎      | 16/48 [00:09<00:11,  2.76it/s][A
Training:  35%|███▌      | 17/48 [00:11<00:19,  1.55it/s][A
Training:  38%|███▊      | 18/48 [00:11<00:18,  1.66it/s][A
Training:  40%|███▉      | 19/48 [00:11<00:13,  2.17it/s][A
Training:  44%|████▍     | 21/48 [00:1

Epoch: 15/71 - Loss: 2.9899 - Accuracy: 0.9464



  0%|          | 0/6 [00:00<?, ?it/s][A
 17%|█▋        | 1/6 [00:02<00:12,  2.55s/it][A
 33%|███▎      | 2/6 [00:02<00:04,  1.24s/it][A
 50%|█████     | 3/6 [00:03<00:02,  1.36it/s][A
 83%|████████▎ | 5/6 [00:04<00:00,  1.40it/s][A
100%|██████████| 6/6 [00:04<00:00,  1.27it/s][A
Epochs:  21%|██        | 15/71 [07:39<28:49, 30.88s/it]

Val Loss: 3.4072 - Val Accuracy: 0.9367



Training:   0%|          | 0/48 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/48 [00:02<02:14,  2.86s/it][A
Training:   6%|▋         | 3/48 [00:03<00:37,  1.19it/s][A
Training:   8%|▊         | 4/48 [00:03<00:25,  1.70it/s][A
Training:  10%|█         | 5/48 [00:05<00:43,  1.01s/it][A
Training:  15%|█▍        | 7/48 [00:05<00:22,  1.81it/s][A
Training:  19%|█▉        | 9/48 [00:07<00:31,  1.25it/s][A
Training:  25%|██▌       | 12/48 [00:07<00:16,  2.22it/s][A
Training:  29%|██▉       | 14/48 [00:09<00:20,  1.62it/s][A
Training:  33%|███▎      | 16/48 [00:09<00:14,  2.21it/s][A
Training:  35%|███▌      | 17/48 [00:11<00:21,  1.42it/s][A
Training:  38%|███▊      | 18/48 [00:11<00:17,  1.67it/s][A
Training:  40%|███▉      | 19/48 [00:12<00:14,  2.00it/s][A
Training:  42%|████▏     | 20/48 [00:12<00:11,  2.41it/s][A
Training:  44%|████▍     | 21/48 [00:14<00:20,  1.29it/s][A
Training:  46%|████▌     | 22/48 [00:14<00:15,  1.66it/s][A
Training:  48%|████▊     | 23/48 [00:1

Epoch: 16/71 - Loss: 2.8822 - Accuracy: 0.9489



  0%|          | 0/6 [00:00<?, ?it/s][A
 17%|█▋        | 1/6 [00:02<00:12,  2.53s/it][A
 67%|██████▋   | 4/6 [00:02<00:01,  1.97it/s][A
100%|██████████| 6/6 [00:04<00:00,  1.32it/s][A
Epochs:  23%|██▎       | 16/71 [08:09<28:11, 30.75s/it]

Val Loss: 3.3930 - Val Accuracy: 0.9441



Training:   0%|          | 0/48 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/48 [00:02<02:17,  2.92s/it][A
Training:   6%|▋         | 3/48 [00:03<00:36,  1.24it/s][A
Training:  10%|█         | 5/48 [00:04<00:35,  1.20it/s][A
Training:  12%|█▎        | 6/48 [00:04<00:26,  1.56it/s][A
Training:  17%|█▋        | 8/48 [00:05<00:15,  2.54it/s][A
Training:  19%|█▉        | 9/48 [00:06<00:27,  1.41it/s][A
Training:  21%|██        | 10/48 [00:06<00:21,  1.80it/s][A
Training:  25%|██▌       | 12/48 [00:07<00:12,  2.80it/s][A
Training:  27%|██▋       | 13/48 [00:08<00:23,  1.48it/s][A
Training:  31%|███▏      | 15/48 [00:08<00:14,  2.30it/s][A
Training:  33%|███▎      | 16/48 [00:09<00:12,  2.47it/s][A
Training:  35%|███▌      | 17/48 [00:10<00:19,  1.62it/s][A
Training:  38%|███▊      | 18/48 [00:10<00:14,  2.05it/s][A
Training:  40%|███▉      | 19/48 [00:10<00:11,  2.56it/s][A
Training:  42%|████▏     | 20/48 [00:10<00:10,  2.80it/s][A
Training:  44%|████▍     | 21/48 [00:1

Epoch: 17/71 - Loss: 3.0500 - Accuracy: 0.9446



  0%|          | 0/6 [00:00<?, ?it/s][A
 17%|█▋        | 1/6 [00:02<00:11,  2.21s/it][A
 33%|███▎      | 2/6 [00:02<00:04,  1.02s/it][A
 67%|██████▋   | 4/6 [00:02<00:00,  2.25it/s][A
100%|██████████| 6/6 [00:04<00:00,  1.44it/s][A
Epochs:  24%|██▍       | 17/71 [08:37<26:54, 29.90s/it]

Val Loss: 3.3420 - Val Accuracy: 0.9406



Training:   0%|          | 0/48 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/48 [00:02<01:50,  2.36s/it][A
Training:   6%|▋         | 3/48 [00:02<00:31,  1.44it/s][A
Training:   8%|▊         | 4/48 [00:02<00:22,  2.00it/s][A
Training:  10%|█         | 5/48 [00:04<00:40,  1.05it/s][A
Training:  12%|█▎        | 6/48 [00:04<00:28,  1.45it/s][A
Training:  15%|█▍        | 7/48 [00:04<00:20,  1.96it/s][A
Training:  17%|█▋        | 8/48 [00:04<00:15,  2.59it/s][A
Training:  19%|█▉        | 9/48 [00:06<00:30,  1.27it/s][A
Training:  21%|██        | 10/48 [00:06<00:22,  1.72it/s][A
Training:  23%|██▎       | 11/48 [00:06<00:16,  2.21it/s][A
Training:  25%|██▌       | 12/48 [00:07<00:12,  2.86it/s][A
Training:  27%|██▋       | 13/48 [00:08<00:24,  1.43it/s][A
Training:  31%|███▏      | 15/48 [00:08<00:13,  2.37it/s][A
Training:  35%|███▌      | 17/48 [00:10<00:18,  1.71it/s][A
Training:  38%|███▊      | 18/48 [00:10<00:14,  2.04it/s][A
Training:  44%|████▍     | 21/48 [00:12<

Epoch: 18/71 - Loss: 2.9225 - Accuracy: 0.9463



  0%|          | 0/6 [00:00<?, ?it/s][A
 17%|█▋        | 1/6 [00:02<00:12,  2.54s/it][A
 50%|█████     | 3/6 [00:02<00:02,  1.42it/s][A
100%|██████████| 6/6 [00:04<00:00,  1.32it/s][A
Epochs:  25%|██▌       | 18/71 [09:06<26:01, 29.47s/it]

Val Loss: 3.6431 - Val Accuracy: 0.9312



Training:   0%|          | 0/48 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/48 [00:02<02:04,  2.64s/it][A
Training:   8%|▊         | 4/48 [00:02<00:23,  1.85it/s][A
Training:  12%|█▎        | 6/48 [00:04<00:30,  1.40it/s][A
Training:  17%|█▋        | 8/48 [00:04<00:19,  2.06it/s][A
Training:  19%|█▉        | 9/48 [00:06<00:28,  1.39it/s][A
Training:  21%|██        | 10/48 [00:06<00:22,  1.66it/s][A
Training:  23%|██▎       | 11/48 [00:06<00:17,  2.08it/s][A
Training:  25%|██▌       | 12/48 [00:06<00:13,  2.62it/s][A
Training:  27%|██▋       | 13/48 [00:08<00:24,  1.42it/s][A
Training:  29%|██▉       | 14/48 [00:08<00:20,  1.66it/s][A
Training:  33%|███▎      | 16/48 [00:09<00:12,  2.65it/s][A
Training:  35%|███▌      | 17/48 [00:10<00:19,  1.62it/s][A
Training:  38%|███▊      | 18/48 [00:10<00:17,  1.73it/s][A
Training:  40%|███▉      | 19/48 [00:11<00:13,  2.13it/s][A
Training:  42%|████▏     | 20/48 [00:11<00:10,  2.64it/s][A
Training:  44%|████▍     | 21/48 [00:

Epoch: 19/71 - Loss: 2.9970 - Accuracy: 0.9444



  0%|          | 0/6 [00:00<?, ?it/s][A
 17%|█▋        | 1/6 [00:02<00:12,  2.57s/it][A
 50%|█████     | 3/6 [00:02<00:02,  1.38it/s][A
100%|██████████| 6/6 [00:04<00:00,  1.33it/s][A
Epochs:  27%|██▋       | 19/71 [09:34<25:23, 29.31s/it]

Val Loss: 3.6691 - Val Accuracy: 0.9374



Training:   0%|          | 0/48 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/48 [00:02<02:00,  2.57s/it][A
Training:   6%|▋         | 3/48 [00:02<00:32,  1.40it/s][A
Training:  10%|█         | 5/48 [00:04<00:34,  1.23it/s][A
Training:  15%|█▍        | 7/48 [00:04<00:21,  1.88it/s][A
Training:  17%|█▋        | 8/48 [00:04<00:17,  2.29it/s][A
Training:  19%|█▉        | 9/48 [00:06<00:29,  1.31it/s][A
Training:  23%|██▎       | 11/48 [00:06<00:17,  2.08it/s][A
Training:  27%|██▋       | 13/48 [00:08<00:22,  1.58it/s][A
Training:  31%|███▏      | 15/48 [00:08<00:15,  2.18it/s][A
Training:  35%|███▌      | 17/48 [00:10<00:18,  1.69it/s][A
Training:  38%|███▊      | 18/48 [00:10<00:15,  2.00it/s][A
Training:  40%|███▉      | 19/48 [00:10<00:12,  2.25it/s][A
Training:  44%|████▍     | 21/48 [00:12<00:14,  1.91it/s][A
Training:  48%|████▊     | 23/48 [00:12<00:11,  2.27it/s][A
Training:  50%|█████     | 24/48 [00:12<00:08,  2.67it/s][A
Training:  52%|█████▏    | 25/48 [00:1

Epoch: 20/71 - Loss: 2.8901 - Accuracy: 0.9472



  0%|          | 0/6 [00:00<?, ?it/s][A
 17%|█▋        | 1/6 [00:02<00:12,  2.60s/it][A
 50%|█████     | 3/6 [00:02<00:02,  1.40it/s][A
100%|██████████| 6/6 [00:04<00:00,  1.33it/s][A
Epochs:  28%|██▊       | 20/71 [10:03<24:50, 29.22s/it]

Val Loss: 3.6407 - Val Accuracy: 0.9403



Training:   0%|          | 0/48 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/48 [00:02<01:42,  2.18s/it][A
Training:   4%|▍         | 2/48 [00:02<00:43,  1.05it/s][A
Training:   8%|▊         | 4/48 [00:02<00:18,  2.41it/s][A
Training:  10%|█         | 5/48 [00:03<00:31,  1.35it/s][A
Training:  12%|█▎        | 6/48 [00:04<00:23,  1.79it/s][A
Training:  15%|█▍        | 7/48 [00:04<00:21,  1.94it/s][A
Training:  17%|█▋        | 8/48 [00:04<00:17,  2.35it/s][A
Training:  19%|█▉        | 9/48 [00:05<00:26,  1.48it/s][A
Training:  23%|██▎       | 11/48 [00:06<00:18,  2.00it/s][A
Training:  25%|██▌       | 12/48 [00:06<00:14,  2.43it/s][A
Training:  27%|██▋       | 13/48 [00:07<00:22,  1.59it/s][A
Training:  29%|██▉       | 14/48 [00:08<00:17,  1.89it/s][A
Training:  31%|███▏      | 15/48 [00:08<00:15,  2.18it/s][A
Training:  33%|███▎      | 16/48 [00:08<00:13,  2.31it/s][A
Training:  35%|███▌      | 17/48 [00:09<00:19,  1.62it/s][A
Training:  38%|███▊      | 18/48 [00:10<

Epoch: 21/71 - Loss: 2.8864 - Accuracy: 0.9461



  0%|          | 0/6 [00:00<?, ?it/s][A
 17%|█▋        | 1/6 [00:02<00:12,  2.41s/it][A
 50%|█████     | 3/6 [00:02<00:01,  1.51it/s][A
100%|██████████| 6/6 [00:04<00:00,  1.39it/s][A
Epochs:  30%|██▉       | 21/71 [10:32<24:10, 29.01s/it]

Val Loss: 3.3732 - Val Accuracy: 0.9391



Training:   0%|          | 0/48 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/48 [00:02<01:58,  2.52s/it][A
Training:   4%|▍         | 2/48 [00:02<00:51,  1.11s/it][A
Training:   6%|▋         | 3/48 [00:02<00:29,  1.53it/s][A
Training:  10%|█         | 5/48 [00:04<00:30,  1.42it/s][A
Training:  15%|█▍        | 7/48 [00:04<00:17,  2.36it/s][A
Training:  19%|█▉        | 9/48 [00:06<00:23,  1.67it/s][A
Training:  23%|██▎       | 11/48 [00:06<00:14,  2.47it/s][A
Training:  27%|██▋       | 13/48 [00:07<00:18,  1.85it/s][A
Training:  31%|███▏      | 15/48 [00:08<00:12,  2.56it/s][A
Training:  33%|███▎      | 16/48 [00:08<00:10,  2.98it/s][A
Training:  35%|███▌      | 17/48 [00:09<00:18,  1.70it/s][A
Training:  40%|███▉      | 19/48 [00:09<00:11,  2.54it/s][A
Training:  42%|████▏     | 20/48 [00:09<00:09,  3.00it/s][A
Training:  44%|████▍     | 21/48 [00:11<00:18,  1.45it/s][A
Training:  46%|████▌     | 22/48 [00:11<00:14,  1.83it/s][A
Training:  50%|█████     | 24/48 [00:1

Epoch: 22/71 - Loss: 2.9584 - Accuracy: 0.9455



  0%|          | 0/6 [00:00<?, ?it/s][A
 17%|█▋        | 1/6 [00:02<00:12,  2.59s/it][A
 50%|█████     | 3/6 [00:02<00:02,  1.40it/s][A
100%|██████████| 6/6 [00:04<00:00,  1.26it/s][A
Epochs:  31%|███       | 22/71 [11:02<23:54, 29.27s/it]

Val Loss: 3.5333 - Val Accuracy: 0.9355



Training:   0%|          | 0/48 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/48 [00:03<02:26,  3.11s/it][A
Training:   8%|▊         | 4/48 [00:03<00:27,  1.62it/s][A
Training:  12%|█▎        | 6/48 [00:05<00:35,  1.18it/s][A
Training:  17%|█▋        | 8/48 [00:05<00:21,  1.82it/s][A
Training:  21%|██        | 10/48 [00:07<00:27,  1.39it/s][A
Training:  23%|██▎       | 11/48 [00:07<00:22,  1.68it/s][A
Training:  25%|██▌       | 12/48 [00:07<00:17,  2.00it/s][A
Training:  27%|██▋       | 13/48 [00:09<00:29,  1.19it/s][A
Training:  31%|███▏      | 15/48 [00:10<00:17,  1.90it/s][A
Training:  35%|███▌      | 17/48 [00:11<00:20,  1.48it/s][A
Training:  38%|███▊      | 18/48 [00:12<00:17,  1.76it/s][A
Training:  40%|███▉      | 19/48 [00:12<00:13,  2.12it/s][A
Training:  42%|████▏     | 20/48 [00:12<00:11,  2.40it/s][A
Training:  44%|████▍     | 21/48 [00:13<00:17,  1.55it/s][A
Training:  50%|█████     | 24/48 [00:13<00:08,  2.88it/s][A
Training:  52%|█████▏    | 25/48 [00

Epoch: 23/71 - Loss: 2.8004 - Accuracy: 0.9464



  0%|          | 0/6 [00:00<?, ?it/s][A
 17%|█▋        | 1/6 [00:02<00:13,  2.69s/it][A
 67%|██████▋   | 4/6 [00:02<00:01,  1.84it/s][A
100%|██████████| 6/6 [00:04<00:00,  1.32it/s][A
Epochs:  32%|███▏      | 23/71 [11:33<23:47, 29.73s/it]

Val Loss: 3.8553 - Val Accuracy: 0.9352



Training:   0%|          | 0/48 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/48 [00:02<02:00,  2.56s/it][A
Training:   4%|▍         | 2/48 [00:02<00:56,  1.24s/it][A
Training:   8%|▊         | 4/48 [00:03<00:22,  2.00it/s][A
Training:  10%|█         | 5/48 [00:04<00:36,  1.18it/s][A
Training:  12%|█▎        | 6/48 [00:04<00:27,  1.55it/s][A
Training:  17%|█▋        | 8/48 [00:04<00:14,  2.72it/s][A
Training:  21%|██        | 10/48 [00:06<00:21,  1.76it/s][A
Training:  25%|██▌       | 12/48 [00:06<00:15,  2.38it/s][A
Training:  27%|██▋       | 13/48 [00:08<00:22,  1.56it/s][A
Training:  29%|██▉       | 14/48 [00:08<00:18,  1.85it/s][A
Training:  33%|███▎      | 16/48 [00:08<00:12,  2.66it/s][A
Training:  35%|███▌      | 17/48 [00:10<00:19,  1.60it/s][A
Training:  40%|███▉      | 19/48 [00:10<00:12,  2.32it/s][A
Training:  42%|████▏     | 20/48 [00:11<00:12,  2.26it/s][A
Training:  44%|████▍     | 21/48 [00:12<00:18,  1.50it/s][A
Training:  50%|█████     | 24/48 [00:1

Epoch: 24/71 - Loss: 2.7943 - Accuracy: 0.9477



  0%|          | 0/6 [00:00<?, ?it/s][A
 17%|█▋        | 1/6 [00:02<00:13,  2.64s/it][A
 33%|███▎      | 2/6 [00:02<00:04,  1.15s/it][A
 67%|██████▋   | 4/6 [00:02<00:00,  2.13it/s][A
100%|██████████| 6/6 [00:04<00:00,  1.24it/s][A
Epochs:  34%|███▍      | 24/71 [12:03<23:19, 29.77s/it]

Val Loss: 3.4870 - Val Accuracy: 0.9411



Training:   0%|          | 0/48 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/48 [00:02<01:51,  2.37s/it][A
Training:   4%|▍         | 2/48 [00:02<00:48,  1.05s/it][A
Training:   8%|▊         | 4/48 [00:02<00:19,  2.31it/s][A
Training:  10%|█         | 5/48 [00:04<00:35,  1.21it/s][A
Training:  12%|█▎        | 6/48 [00:04<00:28,  1.49it/s][A
Training:  15%|█▍        | 7/48 [00:04<00:22,  1.80it/s][A
Training:  19%|█▉        | 9/48 [00:06<00:22,  1.72it/s][A
Training:  21%|██        | 10/48 [00:06<00:20,  1.87it/s][A
Training:  23%|██▎       | 11/48 [00:06<00:17,  2.08it/s][A
Training:  27%|██▋       | 13/48 [00:08<00:18,  1.91it/s][A
Training:  29%|██▉       | 14/48 [00:08<00:17,  1.90it/s][A
Training:  31%|███▏      | 15/48 [00:08<00:14,  2.24it/s][A
Training:  33%|███▎      | 16/48 [00:08<00:11,  2.76it/s][A
Training:  35%|███▌      | 17/48 [00:10<00:20,  1.48it/s][A
Training:  38%|███▊      | 18/48 [00:10<00:16,  1.87it/s][A
Training:  40%|███▉      | 19/48 [00:10

Epoch: 25/71 - Loss: 2.7157 - Accuracy: 0.9500



  0%|          | 0/6 [00:00<?, ?it/s][A
 17%|█▋        | 1/6 [00:02<00:11,  2.35s/it][A
 33%|███▎      | 2/6 [00:02<00:04,  1.24s/it][A
 67%|██████▋   | 4/6 [00:02<00:01,  2.00it/s][A
 83%|████████▎ | 5/6 [00:04<00:00,  1.34it/s][A
100%|██████████| 6/6 [00:04<00:00,  1.20it/s][A
Epochs:  35%|███▌      | 25/71 [12:33<22:53, 29.86s/it]

Val Loss: 3.3313 - Val Accuracy: 0.9470



Training:   0%|          | 0/48 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/48 [00:02<02:08,  2.73s/it][A
Training:   4%|▍         | 2/48 [00:02<00:57,  1.25s/it][A
Training:   6%|▋         | 3/48 [00:03<00:33,  1.34it/s][A
Training:  10%|█         | 5/48 [00:04<00:36,  1.16it/s][A
Training:  12%|█▎        | 6/48 [00:05<00:27,  1.54it/s][A
Training:  15%|█▍        | 7/48 [00:05<00:20,  2.01it/s][A
Training:  19%|█▉        | 9/48 [00:06<00:21,  1.83it/s][A
Training:  25%|██▌       | 12/48 [00:06<00:10,  3.41it/s][A
Training:  29%|██▉       | 14/48 [00:08<00:16,  2.04it/s][A
Training:  31%|███▏      | 15/48 [00:08<00:14,  2.23it/s][A
Training:  33%|███▎      | 16/48 [00:08<00:12,  2.66it/s][A
Training:  35%|███▌      | 17/48 [00:10<00:18,  1.68it/s][A
Training:  40%|███▉      | 19/48 [00:10<00:12,  2.35it/s][A
Training:  44%|████▍     | 21/48 [00:12<00:16,  1.69it/s][A
Training:  46%|████▌     | 22/48 [00:12<00:13,  1.99it/s][A
Training:  48%|████▊     | 23/48 [00:12

Epoch: 26/71 - Loss: 2.7935 - Accuracy: 0.9479



  0%|          | 0/6 [00:00<?, ?it/s][A
 17%|█▋        | 1/6 [00:02<00:12,  2.57s/it][A
 33%|███▎      | 2/6 [00:02<00:04,  1.15s/it][A
 67%|██████▋   | 4/6 [00:02<00:00,  2.05it/s][A
100%|██████████| 6/6 [00:04<00:00,  1.26it/s][A
Epochs:  37%|███▋      | 26/71 [13:03<22:25, 29.91s/it]

Val Loss: 3.6331 - Val Accuracy: 0.9351



Training:   0%|          | 0/48 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/48 [00:02<01:49,  2.33s/it][A
Training:   6%|▋         | 3/48 [00:02<00:29,  1.53it/s][A
Training:   8%|▊         | 4/48 [00:02<00:20,  2.15it/s][A
Training:  10%|█         | 5/48 [00:04<00:40,  1.07it/s][A
Training:  17%|█▋        | 8/48 [00:04<00:17,  2.30it/s][A
Training:  19%|█▉        | 9/48 [00:05<00:23,  1.65it/s][A
Training:  21%|██        | 10/48 [00:06<00:21,  1.79it/s][A
Training:  23%|██▎       | 11/48 [00:06<00:16,  2.24it/s][A
Training:  25%|██▌       | 12/48 [00:06<00:13,  2.74it/s][A
Training:  27%|██▋       | 13/48 [00:07<00:21,  1.67it/s][A
Training:  29%|██▉       | 14/48 [00:08<00:21,  1.55it/s][A
Training:  33%|███▎      | 16/48 [00:08<00:12,  2.59it/s][A
Training:  35%|███▌      | 17/48 [00:09<00:16,  1.87it/s][A
Training:  38%|███▊      | 18/48 [00:10<00:18,  1.58it/s][A
Training:  40%|███▉      | 19/48 [00:10<00:14,  2.00it/s][A
Training:  42%|████▏     | 20/48 [00:1

Epoch: 27/71 - Loss: 2.7041 - Accuracy: 0.9481



  0%|          | 0/6 [00:00<?, ?it/s][A
 17%|█▋        | 1/6 [00:02<00:12,  2.42s/it][A
 50%|█████     | 3/6 [00:02<00:02,  1.49it/s][A
100%|██████████| 6/6 [00:04<00:00,  1.31it/s][A
Epochs:  38%|███▊      | 27/71 [13:32<21:53, 29.85s/it]

Val Loss: 3.6573 - Val Accuracy: 0.9369



Training:   0%|          | 0/48 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/48 [00:02<01:48,  2.32s/it][A
Training:   4%|▍         | 2/48 [00:02<00:47,  1.04s/it][A
Training:   6%|▋         | 3/48 [00:02<00:28,  1.59it/s][A
Training:   8%|▊         | 4/48 [00:02<00:18,  2.34it/s][A
Training:  10%|█         | 5/48 [00:04<00:33,  1.28it/s][A
Training:  12%|█▎        | 6/48 [00:04<00:23,  1.77it/s][A
Training:  17%|█▋        | 8/48 [00:04<00:12,  3.12it/s][A
Training:  19%|█▉        | 9/48 [00:05<00:25,  1.56it/s][A
Training:  21%|██        | 10/48 [00:06<00:21,  1.73it/s][A
Training:  25%|██▌       | 12/48 [00:06<00:12,  2.77it/s][A
Training:  27%|██▋       | 13/48 [00:07<00:18,  1.92it/s][A
Training:  29%|██▉       | 14/48 [00:08<00:18,  1.82it/s][A
Training:  35%|███▌      | 17/48 [00:09<00:13,  2.29it/s][A
Training:  38%|███▊      | 18/48 [00:10<00:15,  1.92it/s][A
Training:  44%|████▍     | 21/48 [00:11<00:12,  2.11it/s][A
Training:  46%|████▌     | 22/48 [00:11<

Epoch: 28/71 - Loss: 2.8947 - Accuracy: 0.9443



  0%|          | 0/6 [00:00<?, ?it/s][A
 17%|█▋        | 1/6 [00:02<00:12,  2.49s/it][A
 50%|█████     | 3/6 [00:02<00:02,  1.46it/s][A
100%|██████████| 6/6 [00:04<00:00,  1.42it/s][A
Epochs:  39%|███▉      | 28/71 [14:01<21:08, 29.51s/it]

Val Loss: 3.5221 - Val Accuracy: 0.9380



Training:   0%|          | 0/48 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/48 [00:02<01:55,  2.46s/it][A
Training:   4%|▍         | 2/48 [00:02<00:50,  1.09s/it][A
Training:   6%|▋         | 3/48 [00:03<00:35,  1.28it/s][A
Training:  10%|█         | 5/48 [00:04<00:31,  1.35it/s][A
Training:  12%|█▎        | 6/48 [00:04<00:25,  1.64it/s][A
Training:  17%|█▋        | 8/48 [00:04<00:14,  2.76it/s][A
Training:  19%|█▉        | 9/48 [00:06<00:23,  1.65it/s][A
Training:  21%|██        | 10/48 [00:06<00:19,  1.91it/s][A
Training:  23%|██▎       | 11/48 [00:06<00:17,  2.14it/s][A
Training:  27%|██▋       | 13/48 [00:07<00:18,  1.93it/s][A
Training:  29%|██▉       | 14/48 [00:08<00:16,  2.01it/s][A
Training:  31%|███▏      | 15/48 [00:08<00:14,  2.29it/s][A
Training:  35%|███▌      | 17/48 [00:10<00:16,  1.85it/s][A
Training:  38%|███▊      | 18/48 [00:10<00:14,  2.07it/s][A
Training:  40%|███▉      | 19/48 [00:10<00:11,  2.47it/s][A
Training:  44%|████▍     | 21/48 [00:12

Epoch: 29/71 - Loss: 2.7741 - Accuracy: 0.9494



  0%|          | 0/6 [00:00<?, ?it/s][A
 17%|█▋        | 1/6 [00:02<00:11,  2.34s/it][A
 33%|███▎      | 2/6 [00:02<00:04,  1.12s/it][A
 83%|████████▎ | 5/6 [00:04<00:00,  1.49it/s][A
100%|██████████| 6/6 [00:04<00:00,  1.34it/s][A
Epochs:  41%|████      | 29/71 [14:31<20:39, 29.52s/it]

Val Loss: 3.4961 - Val Accuracy: 0.9396



Training:   0%|          | 0/48 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/48 [00:02<01:47,  2.29s/it][A
Training:   6%|▋         | 3/48 [00:02<00:29,  1.54it/s][A
Training:   8%|▊         | 4/48 [00:02<00:20,  2.10it/s][A
Training:  10%|█         | 5/48 [00:04<00:36,  1.17it/s][A
Training:  15%|█▍        | 7/48 [00:04<00:19,  2.05it/s][A
Training:  17%|█▋        | 8/48 [00:04<00:16,  2.48it/s][A
Training:  19%|█▉        | 9/48 [00:06<00:30,  1.29it/s][A
Training:  23%|██▎       | 11/48 [00:06<00:17,  2.14it/s][A
Training:  27%|██▋       | 13/48 [00:08<00:24,  1.40it/s][A
Training:  31%|███▏      | 15/48 [00:08<00:16,  2.05it/s][A
Training:  35%|███▌      | 17/48 [00:10<00:20,  1.54it/s][A
Training:  40%|███▉      | 19/48 [00:10<00:13,  2.16it/s][A
Training:  42%|████▏     | 20/48 [00:11<00:11,  2.51it/s][A
Training:  44%|████▍     | 21/48 [00:12<00:17,  1.55it/s][A
Training:  48%|████▊     | 23/48 [00:12<00:11,  2.27it/s][A
Training:  52%|█████▏    | 25/48 [00:14

Epoch: 30/71 - Loss: 2.9896 - Accuracy: 0.9438



  0%|          | 0/6 [00:00<?, ?it/s][A
 17%|█▋        | 1/6 [00:02<00:12,  2.52s/it][A
 67%|██████▋   | 4/6 [00:02<00:01,  1.97it/s][A
100%|██████████| 6/6 [00:04<00:00,  1.39it/s][A
Epochs:  42%|████▏     | 30/71 [15:00<20:05, 29.41s/it]

Val Loss: 3.6075 - Val Accuracy: 0.9361



Training:   0%|          | 0/48 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/48 [00:02<01:42,  2.19s/it][A
Training:   4%|▍         | 2/48 [00:02<00:47,  1.04s/it][A
Training:  10%|█         | 5/48 [00:04<00:30,  1.40it/s][A
Training:  15%|█▍        | 7/48 [00:04<00:20,  1.96it/s][A
Training:  19%|█▉        | 9/48 [00:06<00:23,  1.64it/s][A
Training:  21%|██        | 10/48 [00:06<00:19,  1.97it/s][A
Training:  23%|██▎       | 11/48 [00:06<00:15,  2.40it/s][A
Training:  25%|██▌       | 12/48 [00:06<00:12,  2.94it/s][A
Training:  27%|██▋       | 13/48 [00:08<00:23,  1.47it/s][A
Training:  29%|██▉       | 14/48 [00:08<00:19,  1.73it/s][A
Training:  33%|███▎      | 16/48 [00:08<00:11,  2.72it/s][A
Training:  35%|███▌      | 17/48 [00:10<00:19,  1.56it/s][A
Training:  38%|███▊      | 18/48 [00:10<00:17,  1.68it/s][A
Training:  40%|███▉      | 19/48 [00:10<00:13,  2.11it/s][A
Training:  44%|████▍     | 21/48 [00:12<00:15,  1.77it/s][A
Training:  46%|████▌     | 22/48 [00:

Epoch: 31/71 - Loss: 2.9114 - Accuracy: 0.9443



  0%|          | 0/6 [00:00<?, ?it/s][A
 17%|█▋        | 1/6 [00:02<00:10,  2.15s/it][A
 33%|███▎      | 2/6 [00:02<00:03,  1.06it/s][A
 67%|██████▋   | 4/6 [00:02<00:00,  2.41it/s][A
100%|██████████| 6/6 [00:04<00:00,  1.48it/s][A
Epochs:  44%|████▎     | 31/71 [15:29<19:31, 29.30s/it]

Val Loss: 4.6023 - Val Accuracy: 0.9173



Training:   0%|          | 0/48 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/48 [00:02<01:39,  2.12s/it][A
Training:   4%|▍         | 2/48 [00:02<00:45,  1.01it/s][A
Training:   6%|▋         | 3/48 [00:02<00:27,  1.64it/s][A
Training:  10%|█         | 5/48 [00:04<00:34,  1.26it/s][A
Training:  12%|█▎        | 6/48 [00:04<00:24,  1.68it/s][A
Training:  15%|█▍        | 7/48 [00:04<00:18,  2.21it/s][A
Training:  19%|█▉        | 9/48 [00:06<00:24,  1.60it/s][A
Training:  23%|██▎       | 11/48 [00:06<00:16,  2.18it/s][A
Training:  25%|██▌       | 12/48 [00:06<00:13,  2.63it/s][A
Training:  27%|██▋       | 13/48 [00:08<00:22,  1.53it/s][A
Training:  31%|███▏      | 15/48 [00:08<00:14,  2.23it/s][A
Training:  33%|███▎      | 16/48 [00:08<00:12,  2.62it/s][A
Training:  35%|███▌      | 17/48 [00:10<00:20,  1.51it/s][A
Training:  38%|███▊      | 18/48 [00:10<00:15,  1.90it/s][A
Training:  42%|████▏     | 20/48 [00:10<00:10,  2.73it/s][A
Training:  44%|████▍     | 21/48 [00:12

Epoch: 32/71 - Loss: 2.8644 - Accuracy: 0.9437



  0%|          | 0/6 [00:00<?, ?it/s][A
 17%|█▋        | 1/6 [00:02<00:12,  2.46s/it][A
100%|██████████| 6/6 [00:04<00:00,  1.44it/s][A
Epochs:  45%|████▌     | 32/71 [15:57<18:51, 29.01s/it]

Val Loss: 3.3395 - Val Accuracy: 0.9407



Training:   0%|          | 0/48 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/48 [00:02<01:47,  2.29s/it][A
Training:   6%|▋         | 3/48 [00:02<00:29,  1.53it/s][A
Training:   8%|▊         | 4/48 [00:02<00:23,  1.89it/s][A
Training:  10%|█         | 5/48 [00:04<00:34,  1.26it/s][A
Training:  12%|█▎        | 6/48 [00:04<00:27,  1.50it/s][A
Training:  15%|█▍        | 7/48 [00:04<00:20,  1.97it/s][A
Training:  17%|█▋        | 8/48 [00:05<00:18,  2.15it/s][A
Training:  19%|█▉        | 9/48 [00:06<00:24,  1.59it/s][A
Training:  21%|██        | 10/48 [00:06<00:23,  1.62it/s][A
Training:  23%|██▎       | 11/48 [00:06<00:17,  2.15it/s][A
Training:  25%|██▌       | 12/48 [00:06<00:13,  2.72it/s][A
Training:  27%|██▋       | 13/48 [00:08<00:21,  1.64it/s][A
Training:  29%|██▉       | 14/48 [00:08<00:19,  1.76it/s][A
Training:  31%|███▏      | 15/48 [00:08<00:14,  2.33it/s][A
Training:  33%|███▎      | 16/48 [00:08<00:12,  2.52it/s][A
Training:  35%|███▌      | 17/48 [00:09<

Epoch: 33/71 - Loss: 2.7868 - Accuracy: 0.9489



  0%|          | 0/6 [00:00<?, ?it/s][A
 17%|█▋        | 1/6 [00:02<00:10,  2.15s/it][A
 67%|██████▋   | 4/6 [00:02<00:00,  2.28it/s][A
100%|██████████| 6/6 [00:04<00:00,  1.46it/s][A
Epochs:  46%|████▋     | 33/71 [16:26<18:17, 28.89s/it]

Val Loss: 4.8900 - Val Accuracy: 0.9108



Training:   0%|          | 0/48 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/48 [00:02<02:03,  2.62s/it][A
Training:   4%|▍         | 2/48 [00:02<00:54,  1.18s/it][A
Training:  10%|█         | 5/48 [00:04<00:34,  1.25it/s][A
Training:  12%|█▎        | 6/48 [00:04<00:26,  1.61it/s][A
Training:  15%|█▍        | 7/48 [00:04<00:20,  2.02it/s][A
Training:  19%|█▉        | 9/48 [00:06<00:27,  1.43it/s][A
Training:  21%|██        | 10/48 [00:07<00:21,  1.79it/s][A
Training:  23%|██▎       | 11/48 [00:07<00:16,  2.22it/s][A
Training:  27%|██▋       | 13/48 [00:08<00:22,  1.55it/s][A
Training:  31%|███▏      | 15/48 [00:09<00:15,  2.18it/s][A
Training:  33%|███▎      | 16/48 [00:09<00:12,  2.58it/s][A
Training:  35%|███▌      | 17/48 [00:11<00:22,  1.40it/s][A
Training:  38%|███▊      | 18/48 [00:11<00:16,  1.78it/s][A
Training:  44%|████▍     | 21/48 [00:12<00:14,  1.92it/s][A
Training:  46%|████▌     | 22/48 [00:13<00:12,  2.01it/s][A
Training:  50%|█████     | 24/48 [00:1

Epoch: 34/71 - Loss: 2.7256 - Accuracy: 0.9487



  0%|          | 0/6 [00:00<?, ?it/s][A
 17%|█▋        | 1/6 [00:02<00:11,  2.33s/it][A
 50%|█████     | 3/6 [00:02<00:01,  1.55it/s][A
100%|██████████| 6/6 [00:04<00:00,  1.41it/s][A
Epochs:  48%|████▊     | 34/71 [16:55<17:55, 29.08s/it]

Val Loss: 3.5732 - Val Accuracy: 0.9362



Training:   0%|          | 0/48 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/48 [00:02<01:54,  2.43s/it][A
Training:   4%|▍         | 2/48 [00:02<00:49,  1.08s/it][A
Training:   8%|▊         | 4/48 [00:02<00:19,  2.26it/s][A
Training:  10%|█         | 5/48 [00:04<00:38,  1.11it/s][A
Training:  12%|█▎        | 6/48 [00:04<00:27,  1.52it/s][A
Training:  17%|█▋        | 8/48 [00:04<00:14,  2.67it/s][A
Training:  21%|██        | 10/48 [00:06<00:23,  1.64it/s][A
Training:  23%|██▎       | 11/48 [00:06<00:18,  1.98it/s][A
Training:  25%|██▌       | 12/48 [00:07<00:14,  2.41it/s][A
Training:  27%|██▋       | 13/48 [00:08<00:25,  1.37it/s][A
Training:  29%|██▉       | 14/48 [00:08<00:19,  1.76it/s][A
Training:  31%|███▏      | 15/48 [00:08<00:14,  2.27it/s][A
Training:  35%|███▌      | 17/48 [00:10<00:19,  1.60it/s][A
Training:  40%|███▉      | 19/48 [00:10<00:11,  2.42it/s][A
Training:  44%|████▍     | 21/48 [00:12<00:14,  1.80it/s][A
Training:  46%|████▌     | 22/48 [00:1

Epoch: 35/71 - Loss: 2.7202 - Accuracy: 0.9471



  0%|          | 0/6 [00:00<?, ?it/s][A
 17%|█▋        | 1/6 [00:02<00:11,  2.35s/it][A
 33%|███▎      | 2/6 [00:02<00:04,  1.03s/it][A
 67%|██████▋   | 4/6 [00:02<00:00,  2.29it/s][A
100%|██████████| 6/6 [00:04<00:00,  1.39it/s][A
Epochs:  49%|████▉     | 35/71 [17:24<17:18, 28.86s/it]

Val Loss: 3.3497 - Val Accuracy: 0.9418



Training:   0%|          | 0/48 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/48 [00:02<01:59,  2.55s/it][A
Training:   4%|▍         | 2/48 [00:02<00:51,  1.11s/it][A
Training:   8%|▊         | 4/48 [00:02<00:21,  2.07it/s][A
Training:  10%|█         | 5/48 [00:04<00:34,  1.23it/s][A
Training:  12%|█▎        | 6/48 [00:04<00:25,  1.65it/s][A
Training:  15%|█▍        | 7/48 [00:04<00:18,  2.20it/s][A
Training:  17%|█▋        | 8/48 [00:04<00:13,  2.88it/s][A
Training:  19%|█▉        | 9/48 [00:06<00:27,  1.40it/s][A
Training:  21%|██        | 10/48 [00:06<00:20,  1.84it/s][A
Training:  23%|██▎       | 11/48 [00:06<00:15,  2.40it/s][A
Training:  27%|██▋       | 13/48 [00:08<00:23,  1.47it/s][A
Training:  31%|███▏      | 15/48 [00:08<00:14,  2.30it/s][A
Training:  35%|███▌      | 17/48 [00:10<00:18,  1.64it/s][A
Training:  38%|███▊      | 18/48 [00:10<00:15,  1.97it/s][A
Training:  42%|████▏     | 20/48 [00:10<00:09,  2.84it/s][A
Training:  44%|████▍     | 21/48 [00:12<

Epoch: 36/71 - Loss: 2.6650 - Accuracy: 0.9487



  0%|          | 0/6 [00:00<?, ?it/s][A
 17%|█▋        | 1/6 [00:02<00:12,  2.50s/it][A
100%|██████████| 6/6 [00:04<00:00,  1.37it/s][A
Epochs:  51%|█████     | 36/71 [17:52<16:46, 28.75s/it]

Val Loss: 3.5308 - Val Accuracy: 0.9379



Training:   0%|          | 0/48 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/48 [00:02<01:48,  2.31s/it][A
Training:   4%|▍         | 2/48 [00:02<00:49,  1.09s/it][A
Training:  10%|█         | 5/48 [00:04<00:32,  1.32it/s][A
Training:  12%|█▎        | 6/48 [00:04<00:28,  1.50it/s][A
Training:  15%|█▍        | 7/48 [00:04<00:21,  1.90it/s][A
Training:  19%|█▉        | 9/48 [00:06<00:25,  1.51it/s][A
Training:  21%|██        | 10/48 [00:06<00:20,  1.82it/s][A
Training:  27%|██▋       | 13/48 [00:08<00:19,  1.80it/s][A
Training:  29%|██▉       | 14/48 [00:08<00:17,  1.96it/s][A
Training:  33%|███▎      | 16/48 [00:09<00:11,  2.78it/s][A
Training:  35%|███▌      | 17/48 [00:10<00:16,  1.84it/s][A
Training:  38%|███▊      | 18/48 [00:10<00:15,  1.93it/s][A
Training:  40%|███▉      | 19/48 [00:10<00:12,  2.35it/s][A
Training:  42%|████▏     | 20/48 [00:11<00:10,  2.80it/s][A
Training:  44%|████▍     | 21/48 [00:12<00:19,  1.41it/s][A
Training:  48%|████▊     | 23/48 [00:1

Epoch: 37/71 - Loss: 2.6626 - Accuracy: 0.9491



  0%|          | 0/6 [00:00<?, ?it/s][A
 17%|█▋        | 1/6 [00:02<00:11,  2.30s/it][A
 33%|███▎      | 2/6 [00:02<00:04,  1.11s/it][A
 50%|█████     | 3/6 [00:02<00:01,  1.54it/s][A
 67%|██████▋   | 4/6 [00:02<00:00,  2.28it/s][A
100%|██████████| 6/6 [00:04<00:00,  1.43it/s][A
Epochs:  52%|█████▏    | 37/71 [18:20<16:09, 28.52s/it]

Val Loss: 3.3636 - Val Accuracy: 0.9413



Training:   0%|          | 0/48 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/48 [00:02<02:00,  2.56s/it][A
Training:   4%|▍         | 2/48 [00:02<00:53,  1.17s/it][A
Training:   6%|▋         | 3/48 [00:02<00:30,  1.46it/s][A
Training:   8%|▊         | 4/48 [00:02<00:19,  2.20it/s][A
Training:  10%|█         | 5/48 [00:04<00:36,  1.17it/s][A
Training:  12%|█▎        | 6/48 [00:04<00:25,  1.63it/s][A
Training:  15%|█▍        | 7/48 [00:04<00:18,  2.22it/s][A
Training:  17%|█▋        | 8/48 [00:04<00:13,  2.95it/s][A
Training:  19%|█▉        | 9/48 [00:06<00:25,  1.55it/s][A
Training:  21%|██        | 10/48 [00:06<00:19,  1.93it/s][A
Training:  27%|██▋       | 13/48 [00:07<00:17,  1.99it/s][A
Training:  29%|██▉       | 14/48 [00:08<00:18,  1.86it/s][A
Training:  31%|███▏      | 15/48 [00:08<00:14,  2.29it/s][A
Training:  35%|███▌      | 17/48 [00:09<00:15,  2.00it/s][A
Training:  38%|███▊      | 18/48 [00:10<00:17,  1.76it/s][A
Training:  40%|███▉      | 19/48 [00:10<0

Epoch: 38/71 - Loss: 2.6336 - Accuracy: 0.9485



  0%|          | 0/6 [00:00<?, ?it/s][A
 17%|█▋        | 1/6 [00:02<00:13,  2.72s/it][A
 67%|██████▋   | 4/6 [00:02<00:01,  1.83it/s][A
100%|██████████| 6/6 [00:04<00:00,  1.33it/s][A
Epochs:  54%|█████▎    | 38/71 [18:49<15:46, 28.70s/it]

Val Loss: 3.5581 - Val Accuracy: 0.9351



Training:   0%|          | 0/48 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/48 [00:02<02:02,  2.61s/it][A
Training:   4%|▍         | 2/48 [00:02<00:53,  1.17s/it][A
Training:   8%|▊         | 4/48 [00:02<00:21,  2.07it/s][A
Training:  10%|█         | 5/48 [00:04<00:36,  1.18it/s][A
Training:  12%|█▎        | 6/48 [00:04<00:26,  1.60it/s][A
Training:  17%|█▋        | 8/48 [00:04<00:14,  2.77it/s][A
Training:  19%|█▉        | 9/48 [00:06<00:27,  1.41it/s][A
Training:  23%|██▎       | 11/48 [00:06<00:16,  2.19it/s][A
Training:  25%|██▌       | 12/48 [00:06<00:13,  2.66it/s][A
Training:  27%|██▋       | 13/48 [00:08<00:22,  1.53it/s][A
Training:  29%|██▉       | 14/48 [00:08<00:17,  1.94it/s][A
Training:  31%|███▏      | 15/48 [00:08<00:13,  2.46it/s][A
Training:  35%|███▌      | 17/48 [00:10<00:18,  1.65it/s][A
Training:  38%|███▊      | 18/48 [00:10<00:14,  2.04it/s][A
Training:  40%|███▉      | 19/48 [00:10<00:11,  2.55it/s][A
Training:  44%|████▍     | 21/48 [00:12

Epoch: 39/71 - Loss: 2.5289 - Accuracy: 0.9520



  0%|          | 0/6 [00:00<?, ?it/s][A
 17%|█▋        | 1/6 [00:02<00:12,  2.53s/it][A
100%|██████████| 6/6 [00:04<00:00,  1.36it/s][A
Epochs:  55%|█████▍    | 39/71 [19:18<15:17, 28.67s/it]

Val Loss: 3.2861 - Val Accuracy: 0.9416



Training:   0%|          | 0/48 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/48 [00:02<01:59,  2.55s/it][A
Training:   4%|▍         | 2/48 [00:02<00:52,  1.14s/it][A
Training:   8%|▊         | 4/48 [00:02<00:20,  2.13it/s][A
Training:  10%|█         | 5/48 [00:04<00:36,  1.19it/s][A
Training:  12%|█▎        | 6/48 [00:04<00:26,  1.61it/s][A
Training:  15%|█▍        | 7/48 [00:04<00:19,  2.12it/s][A
Training:  17%|█▋        | 8/48 [00:04<00:14,  2.75it/s][A
Training:  19%|█▉        | 9/48 [00:06<00:30,  1.26it/s][A
Training:  21%|██        | 10/48 [00:06<00:22,  1.71it/s][A
Training:  25%|██▌       | 12/48 [00:06<00:12,  2.96it/s][A
Training:  29%|██▉       | 14/48 [00:08<00:19,  1.76it/s][A
Training:  33%|███▎      | 16/48 [00:08<00:12,  2.61it/s][A
Training:  38%|███▊      | 18/48 [00:10<00:16,  1.77it/s][A
Training:  42%|████▏     | 20/48 [00:10<00:11,  2.49it/s][A
Training:  44%|████▍     | 21/48 [00:11<00:14,  1.88it/s][A
Training:  46%|████▌     | 22/48 [00:12<

Epoch: 40/71 - Loss: 2.6364 - Accuracy: 0.9488



  0%|          | 0/6 [00:00<?, ?it/s][A
 17%|█▋        | 1/6 [00:02<00:13,  2.70s/it][A
 50%|█████     | 3/6 [00:02<00:02,  1.34it/s][A
100%|██████████| 6/6 [00:04<00:00,  1.27it/s][A
Epochs:  56%|█████▋    | 40/71 [19:47<14:49, 28.68s/it]

Val Loss: 3.6434 - Val Accuracy: 0.9366



Training:   0%|          | 0/48 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/48 [00:02<01:44,  2.21s/it][A
Training:   4%|▍         | 2/48 [00:02<00:47,  1.04s/it][A
Training:   6%|▋         | 3/48 [00:02<00:28,  1.56it/s][A
Training:  10%|█         | 5/48 [00:04<00:31,  1.36it/s][A
Training:  12%|█▎        | 6/48 [00:04<00:24,  1.71it/s][A
Training:  15%|█▍        | 7/48 [00:04<00:19,  2.10it/s][A
Training:  19%|█▉        | 9/48 [00:06<00:23,  1.68it/s][A
Training:  21%|██        | 10/48 [00:06<00:19,  1.91it/s][A
Training:  23%|██▎       | 11/48 [00:06<00:15,  2.39it/s][A
Training:  25%|██▌       | 12/48 [00:06<00:12,  2.94it/s][A
Training:  27%|██▋       | 13/48 [00:08<00:24,  1.42it/s][A
Training:  31%|███▏      | 15/48 [00:08<00:13,  2.36it/s][A
Training:  35%|███▌      | 17/48 [00:09<00:15,  1.96it/s][A
Training:  38%|███▊      | 18/48 [00:10<00:14,  2.05it/s][A
Training:  40%|███▉      | 19/48 [00:10<00:12,  2.33it/s][A
Training:  44%|████▍     | 21/48 [00:11

Epoch: 41/71 - Loss: 2.6068 - Accuracy: 0.9499



  0%|          | 0/6 [00:00<?, ?it/s][A
 17%|█▋        | 1/6 [00:02<00:12,  2.49s/it][A
 33%|███▎      | 2/6 [00:02<00:04,  1.09s/it][A
 67%|██████▋   | 4/6 [00:02<00:00,  2.26it/s][A
100%|██████████| 6/6 [00:04<00:00,  1.37it/s][A
Epochs:  58%|█████▊    | 41/71 [20:14<14:11, 28.38s/it]

Val Loss: 3.4327 - Val Accuracy: 0.9395



Training:   0%|          | 0/48 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/48 [00:02<01:43,  2.20s/it][A
Training:   8%|▊         | 4/48 [00:02<00:20,  2.13it/s][A
Training:  10%|█         | 5/48 [00:04<00:38,  1.11it/s][A
Training:  12%|█▎        | 6/48 [00:04<00:28,  1.48it/s][A
Training:  15%|█▍        | 7/48 [00:04<00:21,  1.94it/s][A
Training:  19%|█▉        | 9/48 [00:06<00:27,  1.43it/s][A
Training:  23%|██▎       | 11/48 [00:06<00:16,  2.18it/s][A
Training:  27%|██▋       | 13/48 [00:08<00:20,  1.71it/s][A
Training:  29%|██▉       | 14/48 [00:08<00:17,  1.92it/s][A
Training:  31%|███▏      | 15/48 [00:08<00:14,  2.35it/s][A
Training:  35%|███▌      | 17/48 [00:09<00:15,  1.95it/s][A
Training:  38%|███▊      | 18/48 [00:10<00:15,  2.00it/s][A
Training:  40%|███▉      | 19/48 [00:10<00:11,  2.46it/s][A
Training:  42%|████▏     | 20/48 [00:10<00:09,  3.02it/s][A
Training:  44%|████▍     | 21/48 [00:11<00:16,  1.67it/s][A
Training:  46%|████▌     | 22/48 [00:1

Epoch: 42/71 - Loss: 2.7068 - Accuracy: 0.9472



  0%|          | 0/6 [00:00<?, ?it/s][A
 17%|█▋        | 1/6 [00:02<00:12,  2.41s/it][A
 50%|█████     | 3/6 [00:02<00:02,  1.49it/s][A
100%|██████████| 6/6 [00:04<00:00,  1.36it/s][A
Epochs:  59%|█████▉    | 42/71 [20:43<13:44, 28.42s/it]

Val Loss: 3.7917 - Val Accuracy: 0.9388



Training:   0%|          | 0/48 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/48 [00:02<01:58,  2.52s/it][A
Training:   4%|▍         | 2/48 [00:02<00:53,  1.15s/it][A
Training:   6%|▋         | 3/48 [00:02<00:31,  1.44it/s][A
Training:  10%|█         | 5/48 [00:04<00:34,  1.25it/s][A
Training:  12%|█▎        | 6/48 [00:04<00:25,  1.63it/s][A
Training:  15%|█▍        | 7/48 [00:04<00:19,  2.13it/s][A
Training:  19%|█▉        | 9/48 [00:06<00:25,  1.53it/s][A
Training:  21%|██        | 10/48 [00:06<00:21,  1.80it/s][A
Training:  25%|██▌       | 12/48 [00:07<00:13,  2.71it/s][A
Training:  27%|██▋       | 13/48 [00:08<00:20,  1.67it/s][A
Training:  29%|██▉       | 14/48 [00:08<00:18,  1.83it/s][A
Training:  33%|███▎      | 16/48 [00:09<00:11,  2.88it/s][A
Training:  35%|███▌      | 17/48 [00:10<00:19,  1.62it/s][A
Training:  38%|███▊      | 18/48 [00:10<00:15,  2.00it/s][A
Training:  40%|███▉      | 19/48 [00:10<00:11,  2.46it/s][A
Training:  42%|████▏     | 20/48 [00:10

Epoch: 43/71 - Loss: 2.6085 - Accuracy: 0.9494



  0%|          | 0/6 [00:00<?, ?it/s][A
 17%|█▋        | 1/6 [00:02<00:12,  2.51s/it][A
 33%|███▎      | 2/6 [00:02<00:04,  1.10s/it][A
 67%|██████▋   | 4/6 [00:02<00:00,  2.19it/s][A
100%|██████████| 6/6 [00:04<00:00,  1.34it/s][A
Epochs:  61%|██████    | 43/71 [21:11<13:18, 28.52s/it]

Val Loss: 3.4021 - Val Accuracy: 0.9388



Training:   0%|          | 0/48 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/48 [00:02<01:47,  2.29s/it][A
Training:   4%|▍         | 2/48 [00:02<00:53,  1.15s/it][A
Training:   8%|▊         | 4/48 [00:02<00:21,  2.03it/s][A
Training:  10%|█         | 5/48 [00:04<00:31,  1.37it/s][A
Training:  12%|█▎        | 6/48 [00:04<00:25,  1.62it/s][A
Training:  15%|█▍        | 7/48 [00:04<00:19,  2.12it/s][A
Training:  19%|█▉        | 9/48 [00:06<00:23,  1.65it/s][A
Training:  21%|██        | 10/48 [00:06<00:20,  1.85it/s][A
Training:  25%|██▌       | 12/48 [00:06<00:12,  2.92it/s][A
Training:  27%|██▋       | 13/48 [00:07<00:20,  1.74it/s][A
Training:  29%|██▉       | 14/48 [00:08<00:19,  1.73it/s][A
Training:  31%|███▏      | 15/48 [00:08<00:15,  2.16it/s][A
Training:  33%|███▎      | 16/48 [00:08<00:11,  2.70it/s][A
Training:  35%|███▌      | 17/48 [00:09<00:17,  1.77it/s][A
Training:  38%|███▊      | 18/48 [00:10<00:17,  1.69it/s][A
Training:  40%|███▉      | 19/48 [00:10

Epoch: 44/71 - Loss: 2.4830 - Accuracy: 0.9522



  0%|          | 0/6 [00:00<?, ?it/s][A
 17%|█▋        | 1/6 [00:02<00:11,  2.23s/it][A
 33%|███▎      | 2/6 [00:02<00:04,  1.12s/it][A
 83%|████████▎ | 5/6 [00:04<00:00,  1.48it/s][A
100%|██████████| 6/6 [00:04<00:00,  1.39it/s][A
Epochs:  62%|██████▏   | 44/71 [21:40<12:52, 28.63s/it]

Val Loss: 3.8589 - Val Accuracy: 0.9283



Training:   0%|          | 0/48 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/48 [00:02<01:58,  2.53s/it][A
Training:   6%|▋         | 3/48 [00:02<00:33,  1.35it/s][A
Training:   8%|▊         | 4/48 [00:02<00:23,  1.89it/s][A
Training:  10%|█         | 5/48 [00:04<00:36,  1.16it/s][A
Training:  15%|█▍        | 7/48 [00:04<00:19,  2.11it/s][A
Training:  19%|█▉        | 9/48 [00:06<00:24,  1.56it/s][A
Training:  21%|██        | 10/48 [00:06<00:19,  1.93it/s][A
Training:  23%|██▎       | 11/48 [00:06<00:15,  2.39it/s][A
Training:  27%|██▋       | 13/48 [00:08<00:20,  1.74it/s][A
Training:  29%|██▉       | 14/48 [00:08<00:16,  2.11it/s][A
Training:  35%|███▌      | 17/48 [00:10<00:17,  1.79it/s][A
Training:  38%|███▊      | 18/48 [00:10<00:14,  2.06it/s][A
Training:  40%|███▉      | 19/48 [00:10<00:11,  2.45it/s][A
Training:  42%|████▏     | 20/48 [00:10<00:09,  2.98it/s][A
Training:  44%|████▍     | 21/48 [00:12<00:17,  1.57it/s][A
Training:  46%|████▌     | 22/48 [00:1

Epoch: 45/71 - Loss: 2.6421 - Accuracy: 0.9480



  0%|          | 0/6 [00:00<?, ?it/s][A
 17%|█▋        | 1/6 [00:02<00:10,  2.19s/it][A
 33%|███▎      | 2/6 [00:02<00:03,  1.00it/s][A
 67%|██████▋   | 4/6 [00:02<00:00,  2.47it/s][A
100%|██████████| 6/6 [00:04<00:00,  1.49it/s][A
Epochs:  63%|██████▎   | 45/71 [22:08<12:20, 28.47s/it]

Val Loss: 3.4342 - Val Accuracy: 0.9379



Training:   0%|          | 0/48 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/48 [00:02<01:46,  2.26s/it][A
Training:   4%|▍         | 2/48 [00:02<00:47,  1.04s/it][A
Training:   6%|▋         | 3/48 [00:02<00:27,  1.63it/s][A
Training:  10%|█         | 5/48 [00:04<00:29,  1.45it/s][A
Training:  12%|█▎        | 6/48 [00:04<00:23,  1.78it/s][A
Training:  19%|█▉        | 9/48 [00:05<00:20,  1.88it/s][A
Training:  21%|██        | 10/48 [00:06<00:17,  2.13it/s][A
Training:  25%|██▌       | 12/48 [00:06<00:11,  3.14it/s][A
Training:  27%|██▋       | 13/48 [00:07<00:19,  1.75it/s][A
Training:  29%|██▉       | 14/48 [00:08<00:17,  1.91it/s][A
Training:  31%|███▏      | 15/48 [00:08<00:13,  2.38it/s][A
Training:  33%|███▎      | 16/48 [00:08<00:10,  2.92it/s][A
Training:  35%|███▌      | 17/48 [00:09<00:19,  1.59it/s][A
Training:  38%|███▊      | 18/48 [00:10<00:16,  1.79it/s][A
Training:  42%|████▏     | 20/48 [00:10<00:09,  2.94it/s][A
Training:  44%|████▍     | 21/48 [00:1

Epoch: 46/71 - Loss: 2.5062 - Accuracy: 0.9492



  0%|          | 0/6 [00:00<?, ?it/s][A
 17%|█▋        | 1/6 [00:02<00:12,  2.42s/it][A
 50%|█████     | 3/6 [00:02<00:02,  1.49it/s][A
100%|██████████| 6/6 [00:04<00:00,  1.46it/s][A
Epochs:  65%|██████▍   | 46/71 [22:37<11:52, 28.52s/it]

Val Loss: 3.2542 - Val Accuracy: 0.9413



Training:   0%|          | 0/48 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/48 [00:02<01:38,  2.11s/it][A
Training:   4%|▍         | 2/48 [00:02<00:43,  1.05it/s][A
Training:   8%|▊         | 4/48 [00:02<00:17,  2.46it/s][A
Training:  10%|█         | 5/48 [00:04<00:33,  1.28it/s][A
Training:  12%|█▎        | 6/48 [00:04<00:24,  1.73it/s][A
Training:  15%|█▍        | 7/48 [00:04<00:17,  2.28it/s][A
Training:  17%|█▋        | 8/48 [00:04<00:13,  2.92it/s][A
Training:  19%|█▉        | 9/48 [00:06<00:29,  1.33it/s][A
Training:  21%|██        | 10/48 [00:06<00:21,  1.76it/s][A
Training:  25%|██▌       | 12/48 [00:06<00:12,  2.85it/s][A
Training:  27%|██▋       | 13/48 [00:07<00:22,  1.55it/s][A
Training:  31%|███▏      | 15/48 [00:08<00:13,  2.39it/s][A
Training:  33%|███▎      | 16/48 [00:08<00:11,  2.89it/s][A
Training:  35%|███▌      | 17/48 [00:10<00:22,  1.37it/s][A
Training:  40%|███▉      | 19/48 [00:10<00:13,  2.15it/s][A
Training:  42%|████▏     | 20/48 [00:10<

Epoch: 47/71 - Loss: 2.5523 - Accuracy: 0.9518



  0%|          | 0/6 [00:00<?, ?it/s][A
 17%|█▋        | 1/6 [00:02<00:12,  2.55s/it][A
 33%|███▎      | 2/6 [00:02<00:04,  1.13s/it][A
 67%|██████▋   | 4/6 [00:02<00:00,  2.18it/s][A
100%|██████████| 6/6 [00:04<00:00,  1.42it/s][A
Epochs:  66%|██████▌   | 47/71 [23:07<11:32, 28.87s/it]

Val Loss: 3.5449 - Val Accuracy: 0.9400



Training:   0%|          | 0/48 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/48 [00:02<01:44,  2.23s/it][A
Training:   4%|▍         | 2/48 [00:02<00:45,  1.00it/s][A
Training:   6%|▋         | 3/48 [00:02<00:26,  1.68it/s][A
Training:  10%|█         | 5/48 [00:04<00:31,  1.39it/s][A
Training:  12%|█▎        | 6/48 [00:04<00:26,  1.60it/s][A
Training:  15%|█▍        | 7/48 [00:04<00:19,  2.09it/s][A
Training:  19%|█▉        | 9/48 [00:05<00:21,  1.81it/s][A
Training:  21%|██        | 10/48 [00:06<00:20,  1.81it/s][A
Training:  23%|██▎       | 11/48 [00:06<00:18,  1.96it/s][A
Training:  27%|██▋       | 13/48 [00:07<00:18,  1.90it/s][A
Training:  29%|██▉       | 14/48 [00:08<00:19,  1.78it/s][A
Training:  31%|███▏      | 15/48 [00:08<00:14,  2.22it/s][A
Training:  33%|███▎      | 16/48 [00:08<00:11,  2.77it/s][A
Training:  35%|███▌      | 17/48 [00:09<00:14,  2.11it/s][A
Training:  38%|███▊      | 18/48 [00:10<00:17,  1.67it/s][A
Training:  40%|███▉      | 19/48 [00:10

Epoch: 48/71 - Loss: 2.4538 - Accuracy: 0.9521



  0%|          | 0/6 [00:00<?, ?it/s][A
 17%|█▋        | 1/6 [00:02<00:11,  2.23s/it][A
 50%|█████     | 3/6 [00:02<00:01,  1.62it/s][A
100%|██████████| 6/6 [00:03<00:00,  1.54it/s][A
Epochs:  68%|██████▊   | 48/71 [23:36<11:07, 29.04s/it]

Val Loss: 3.3245 - Val Accuracy: 0.9402



Training:   0%|          | 0/48 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/48 [00:02<01:55,  2.45s/it][A
Training:   4%|▍         | 2/48 [00:02<00:49,  1.08s/it][A
Training:   8%|▊         | 4/48 [00:02<00:19,  2.20it/s][A
Training:  10%|█         | 5/48 [00:04<00:33,  1.28it/s][A
Training:  15%|█▍        | 7/48 [00:04<00:18,  2.24it/s][A
Training:  19%|█▉        | 9/48 [00:06<00:25,  1.51it/s][A
Training:  21%|██        | 10/48 [00:06<00:20,  1.84it/s][A
Training:  23%|██▎       | 11/48 [00:06<00:16,  2.29it/s][A
Training:  25%|██▌       | 12/48 [00:06<00:12,  2.84it/s][A
Training:  27%|██▋       | 13/48 [00:08<00:23,  1.49it/s][A
Training:  31%|███▏      | 15/48 [00:08<00:13,  2.47it/s][A
Training:  35%|███▌      | 17/48 [00:10<00:18,  1.68it/s][A
Training:  38%|███▊      | 18/48 [00:10<00:14,  2.04it/s][A
Training:  40%|███▉      | 19/48 [00:10<00:11,  2.50it/s][A
Training:  42%|████▏     | 20/48 [00:10<00:09,  3.02it/s][A
Training:  44%|████▍     | 21/48 [00:1

Epoch: 49/71 - Loss: 2.4952 - Accuracy: 0.9524



  0%|          | 0/6 [00:00<?, ?it/s][A
 17%|█▋        | 1/6 [00:02<00:12,  2.49s/it][A
 67%|██████▋   | 4/6 [00:02<00:01,  1.98it/s][A
100%|██████████| 6/6 [00:04<00:00,  1.36it/s][A
Epochs:  69%|██████▉   | 49/71 [24:04<10:33, 28.81s/it]

Val Loss: 3.4617 - Val Accuracy: 0.9356



Training:   0%|          | 0/48 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/48 [00:02<02:05,  2.66s/it][A
Training:   6%|▋         | 3/48 [00:02<00:32,  1.37it/s][A
Training:  10%|█         | 5/48 [00:04<00:36,  1.17it/s][A
Training:  15%|█▍        | 7/48 [00:04<00:21,  1.90it/s][A
Training:  19%|█▉        | 9/48 [00:06<00:24,  1.57it/s][A
Training:  21%|██        | 10/48 [00:06<00:20,  1.87it/s][A
Training:  23%|██▎       | 11/48 [00:06<00:16,  2.30it/s][A
Training:  27%|██▋       | 13/48 [00:08<00:22,  1.57it/s][A
Training:  29%|██▉       | 14/48 [00:08<00:17,  1.92it/s][A
Training:  33%|███▎      | 16/48 [00:08<00:11,  2.79it/s][A
Training:  35%|███▌      | 17/48 [00:10<00:18,  1.68it/s][A
Training:  38%|███▊      | 18/48 [00:10<00:16,  1.85it/s][A
Training:  42%|████▏     | 20/48 [00:10<00:09,  2.88it/s][A
Training:  44%|████▍     | 21/48 [00:12<00:16,  1.59it/s][A
Training:  46%|████▌     | 22/48 [00:12<00:14,  1.78it/s][A
Training:  48%|████▊     | 23/48 [00:

Epoch: 50/71 - Loss: 2.5993 - Accuracy: 0.9490



  0%|          | 0/6 [00:00<?, ?it/s][A
 17%|█▋        | 1/6 [00:02<00:12,  2.50s/it][A
 50%|█████     | 3/6 [00:02<00:02,  1.44it/s][A
100%|██████████| 6/6 [00:04<00:00,  1.32it/s][A
Epochs:  70%|███████   | 50/71 [24:34<10:11, 29.11s/it]

Val Loss: 3.3859 - Val Accuracy: 0.9439



Training:   0%|          | 0/48 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/48 [00:02<02:11,  2.79s/it][A
Training:   6%|▋         | 3/48 [00:02<00:34,  1.29it/s][A
Training:  10%|█         | 5/48 [00:04<00:38,  1.11it/s][A
Training:  12%|█▎        | 6/48 [00:05<00:29,  1.45it/s][A
Training:  15%|█▍        | 7/48 [00:05<00:21,  1.89it/s][A
Training:  19%|█▉        | 9/48 [00:06<00:25,  1.52it/s][A
Training:  21%|██        | 10/48 [00:06<00:19,  1.91it/s][A
Training:  23%|██▎       | 11/48 [00:07<00:15,  2.40it/s][A
Training:  25%|██▌       | 12/48 [00:07<00:12,  2.87it/s][A
Training:  27%|██▋       | 13/48 [00:08<00:25,  1.36it/s][A
Training:  29%|██▉       | 14/48 [00:09<00:19,  1.77it/s][A
Training:  33%|███▎      | 16/48 [00:09<00:11,  2.88it/s][A
Training:  35%|███▌      | 17/48 [00:10<00:21,  1.48it/s][A
Training:  40%|███▉      | 19/48 [00:11<00:12,  2.35it/s][A
Training:  42%|████▏     | 20/48 [00:11<00:10,  2.66it/s][A
Training:  44%|████▍     | 21/48 [00:1

Epoch: 51/71 - Loss: 2.7369 - Accuracy: 0.9467



  0%|          | 0/6 [00:00<?, ?it/s][A
 17%|█▋        | 1/6 [00:02<00:11,  2.33s/it][A
 50%|█████     | 3/6 [00:02<00:01,  1.55it/s][A
100%|██████████| 6/6 [00:04<00:00,  1.37it/s][A
Epochs:  72%|███████▏  | 51/71 [25:03<09:42, 29.14s/it]

Val Loss: 3.8796 - Val Accuracy: 0.9327



Training:   0%|          | 0/48 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/48 [00:02<01:39,  2.12s/it][A
Training:   4%|▍         | 2/48 [00:02<00:47,  1.04s/it][A
Training:   6%|▋         | 3/48 [00:02<00:29,  1.54it/s][A
Training:   8%|▊         | 4/48 [00:02<00:19,  2.24it/s][A
Training:  10%|█         | 5/48 [00:04<00:34,  1.26it/s][A
Training:  12%|█▎        | 6/48 [00:04<00:26,  1.59it/s][A
Training:  17%|█▋        | 8/48 [00:04<00:14,  2.69it/s][A
Training:  19%|█▉        | 9/48 [00:06<00:25,  1.53it/s][A
Training:  21%|██        | 10/48 [00:06<00:20,  1.84it/s][A
Training:  23%|██▎       | 11/48 [00:06<00:15,  2.32it/s][A
Training:  25%|██▌       | 12/48 [00:06<00:12,  2.81it/s][A
Training:  27%|██▋       | 13/48 [00:08<00:24,  1.45it/s][A
Training:  29%|██▉       | 14/48 [00:08<00:18,  1.88it/s][A
Training:  33%|███▎      | 16/48 [00:08<00:13,  2.42it/s][A
Training:  35%|███▌      | 17/48 [00:10<00:19,  1.57it/s][A
Training:  40%|███▉      | 19/48 [00:10<

Epoch: 52/71 - Loss: 2.5032 - Accuracy: 0.9519



  0%|          | 0/6 [00:00<?, ?it/s][A
 17%|█▋        | 1/6 [00:02<00:12,  2.54s/it][A
100%|██████████| 6/6 [00:04<00:00,  1.37it/s][A
Epochs:  73%|███████▎  | 52/71 [25:32<09:12, 29.08s/it]

Val Loss: 3.3892 - Val Accuracy: 0.9391



Training:   0%|          | 0/48 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/48 [00:02<01:42,  2.17s/it][A
Training:   4%|▍         | 2/48 [00:02<00:46,  1.02s/it][A
Training:   8%|▊         | 4/48 [00:02<00:19,  2.25it/s][A
Training:  10%|█         | 5/48 [00:04<00:39,  1.10it/s][A
Training:  12%|█▎        | 6/48 [00:04<00:27,  1.51it/s][A
Training:  17%|█▋        | 8/48 [00:04<00:15,  2.64it/s][A
Training:  21%|██        | 10/48 [00:06<00:24,  1.55it/s][A
Training:  23%|██▎       | 11/48 [00:06<00:19,  1.91it/s][A
Training:  25%|██▌       | 12/48 [00:07<00:15,  2.36it/s][A
Training:  27%|██▋       | 13/48 [00:08<00:25,  1.37it/s][A
Training:  33%|███▎      | 16/48 [00:08<00:11,  2.67it/s][A
Training:  38%|███▊      | 18/48 [00:10<00:17,  1.75it/s][A
Training:  40%|███▉      | 19/48 [00:10<00:14,  2.07it/s][A
Training:  44%|████▍     | 21/48 [00:12<00:17,  1.59it/s][A
Training:  48%|████▊     | 23/48 [00:12<00:11,  2.17it/s][A
Training:  52%|█████▏    | 25/48 [00:1

Epoch: 53/71 - Loss: 2.6100 - Accuracy: 0.9485



  0%|          | 0/6 [00:00<?, ?it/s][A
 17%|█▋        | 1/6 [00:02<00:12,  2.60s/it][A
 50%|█████     | 3/6 [00:02<00:02,  1.39it/s][A
100%|██████████| 6/6 [00:04<00:00,  1.33it/s][A
Epochs:  75%|███████▍  | 53/71 [26:02<08:44, 29.15s/it]

Val Loss: 3.3596 - Val Accuracy: 0.9384



Training:   0%|          | 0/48 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/48 [00:02<02:10,  2.79s/it][A
Training:   4%|▍         | 2/48 [00:02<00:55,  1.21s/it][A
Training:   8%|▊         | 4/48 [00:03<00:22,  1.95it/s][A
Training:  10%|█         | 5/48 [00:04<00:37,  1.13it/s][A
Training:  15%|█▍        | 7/48 [00:04<00:20,  1.95it/s][A
Training:  19%|█▉        | 9/48 [00:06<00:24,  1.61it/s][A
Training:  21%|██        | 10/48 [00:06<00:19,  1.98it/s][A
Training:  25%|██▌       | 12/48 [00:06<00:12,  2.86it/s][A
Training:  27%|██▋       | 13/48 [00:08<00:23,  1.49it/s][A
Training:  31%|███▏      | 15/48 [00:08<00:14,  2.20it/s][A
Training:  33%|███▎      | 16/48 [00:09<00:12,  2.62it/s][A
Training:  35%|███▌      | 17/48 [00:10<00:18,  1.64it/s][A
Training:  38%|███▊      | 18/48 [00:10<00:14,  2.05it/s][A
Training:  40%|███▉      | 19/48 [00:10<00:11,  2.56it/s][A
Training:  42%|████▏     | 20/48 [00:11<00:13,  2.10it/s][A
Training:  44%|████▍     | 21/48 [00:1

Epoch: 54/71 - Loss: 2.4928 - Accuracy: 0.9510



  0%|          | 0/6 [00:00<?, ?it/s][A
 17%|█▋        | 1/6 [00:02<00:12,  2.47s/it][A
 50%|█████     | 3/6 [00:02<00:02,  1.34it/s][A
100%|██████████| 6/6 [00:04<00:00,  1.31it/s][A
Epochs:  76%|███████▌  | 54/71 [26:31<08:15, 29.12s/it]

Val Loss: 4.2604 - Val Accuracy: 0.9296



Training:   0%|          | 0/48 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/48 [00:02<02:19,  2.96s/it][A
Training:   6%|▋         | 3/48 [00:03<00:36,  1.22it/s][A
Training:   8%|▊         | 4/48 [00:03<00:25,  1.73it/s][A
Training:  10%|█         | 5/48 [00:04<00:39,  1.08it/s][A
Training:  15%|█▍        | 7/48 [00:05<00:21,  1.91it/s][A
Training:  19%|█▉        | 9/48 [00:07<00:28,  1.35it/s][A
Training:  23%|██▎       | 11/48 [00:07<00:19,  1.91it/s][A
Training:  25%|██▌       | 12/48 [00:07<00:15,  2.28it/s][A
Training:  27%|██▋       | 13/48 [00:09<00:25,  1.40it/s][A
Training:  31%|███▏      | 15/48 [00:09<00:15,  2.16it/s][A
Training:  35%|███▌      | 17/48 [00:11<00:19,  1.58it/s][A
Training:  38%|███▊      | 18/48 [00:11<00:15,  1.88it/s][A
Training:  40%|███▉      | 19/48 [00:12<00:17,  1.70it/s][A
Training:  44%|████▍     | 21/48 [00:13<00:17,  1.54it/s][A
Training:  46%|████▌     | 22/48 [00:13<00:13,  1.87it/s][A
Training:  48%|████▊     | 23/48 [00:1

Epoch: 55/71 - Loss: 2.5117 - Accuracy: 0.9506



  0%|          | 0/6 [00:00<?, ?it/s][A
 17%|█▋        | 1/6 [00:02<00:12,  2.51s/it][A
 67%|██████▋   | 4/6 [00:02<00:01,  1.98it/s][A
100%|██████████| 6/6 [00:04<00:00,  1.38it/s][A
Epochs:  77%|███████▋  | 55/71 [27:02<07:55, 29.73s/it]

Val Loss: 3.2863 - Val Accuracy: 0.9390



Training:   0%|          | 0/48 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/48 [00:02<01:45,  2.24s/it][A
Training:   4%|▍         | 2/48 [00:02<00:47,  1.02s/it][A
Training:   6%|▋         | 3/48 [00:02<00:27,  1.63it/s][A
Training:   8%|▊         | 4/48 [00:02<00:18,  2.32it/s][A
Training:  10%|█         | 5/48 [00:04<00:36,  1.16it/s][A
Training:  15%|█▍        | 7/48 [00:04<00:19,  2.12it/s][A
Training:  19%|█▉        | 9/48 [00:06<00:23,  1.65it/s][A
Training:  21%|██        | 10/48 [00:06<00:18,  2.02it/s][A
Training:  25%|██▌       | 12/48 [00:06<00:11,  3.10it/s][A
Training:  27%|██▋       | 13/48 [00:08<00:23,  1.49it/s][A
Training:  31%|███▏      | 15/48 [00:08<00:14,  2.27it/s][A
Training:  35%|███▌      | 17/48 [00:09<00:16,  1.88it/s][A
Training:  38%|███▊      | 18/48 [00:10<00:14,  2.02it/s][A
Training:  40%|███▉      | 19/48 [00:10<00:13,  2.08it/s][A
Training:  42%|████▏     | 20/48 [00:10<00:11,  2.44it/s][A
Training:  44%|████▍     | 21/48 [00:12

Epoch: 56/71 - Loss: 2.4412 - Accuracy: 0.9507



  0%|          | 0/6 [00:00<?, ?it/s][A
 17%|█▋        | 1/6 [00:02<00:13,  2.73s/it][A
 33%|███▎      | 2/6 [00:02<00:04,  1.25s/it][A
100%|██████████| 6/6 [00:04<00:00,  1.29it/s][A
Epochs:  79%|███████▉  | 56/71 [27:32<07:27, 29.84s/it]

Val Loss: 3.2848 - Val Accuracy: 0.9428



Training:   0%|          | 0/48 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/48 [00:02<02:01,  2.58s/it][A
Training:   6%|▋         | 3/48 [00:02<00:34,  1.29it/s][A
Training:  10%|█         | 5/48 [00:04<00:34,  1.26it/s][A
Training:  12%|█▎        | 6/48 [00:04<00:25,  1.63it/s][A
Training:  17%|█▋        | 8/48 [00:04<00:14,  2.68it/s][A
Training:  19%|█▉        | 9/48 [00:06<00:25,  1.54it/s][A
Training:  21%|██        | 10/48 [00:06<00:19,  1.94it/s][A
Training:  23%|██▎       | 11/48 [00:06<00:17,  2.09it/s][A
Training:  27%|██▋       | 13/48 [00:07<00:18,  1.92it/s][A
Training:  29%|██▉       | 14/48 [00:08<00:16,  2.12it/s][A
Training:  31%|███▏      | 15/48 [00:08<00:16,  1.96it/s][A
Training:  35%|███▌      | 17/48 [00:09<00:14,  2.07it/s][A
Training:  38%|███▊      | 18/48 [00:10<00:16,  1.84it/s][A
Training:  40%|███▉      | 19/48 [00:11<00:19,  1.51it/s][A
Training:  42%|████▏     | 20/48 [00:11<00:14,  1.87it/s][A
Training:  44%|████▍     | 21/48 [00:1

Epoch: 57/71 - Loss: 2.4832 - Accuracy: 0.9497



  0%|          | 0/6 [00:00<?, ?it/s][A
 17%|█▋        | 1/6 [00:02<00:12,  2.43s/it][A
 50%|█████     | 3/6 [00:02<00:02,  1.50it/s][A
100%|██████████| 6/6 [00:04<00:00,  1.38it/s][A
Epochs:  80%|████████  | 57/71 [28:02<06:59, 29.95s/it]

Val Loss: 3.5949 - Val Accuracy: 0.9388



Training:   0%|          | 0/48 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/48 [00:02<01:58,  2.52s/it][A
Training:   4%|▍         | 2/48 [00:02<00:52,  1.13s/it][A
Training:   6%|▋         | 3/48 [00:02<00:30,  1.48it/s][A
Training:   8%|▊         | 4/48 [00:02<00:20,  2.15it/s][A
Training:  10%|█         | 5/48 [00:04<00:34,  1.24it/s][A
Training:  12%|█▎        | 6/48 [00:04<00:26,  1.58it/s][A
Training:  15%|█▍        | 7/48 [00:04<00:18,  2.17it/s][A
Training:  19%|█▉        | 9/48 [00:06<00:22,  1.75it/s][A
Training:  21%|██        | 10/48 [00:06<00:22,  1.70it/s][A
Training:  25%|██▌       | 12/48 [00:06<00:13,  2.69it/s][A
Training:  27%|██▋       | 13/48 [00:08<00:19,  1.84it/s][A
Training:  29%|██▉       | 14/48 [00:08<00:19,  1.79it/s][A
Training:  31%|███▏      | 15/48 [00:09<00:16,  1.98it/s][A
Training:  35%|███▌      | 17/48 [00:10<00:17,  1.73it/s][A
Training:  38%|███▊      | 18/48 [00:10<00:17,  1.74it/s][A
Training:  44%|████▍     | 21/48 [00:12<

Epoch: 58/71 - Loss: 2.4351 - Accuracy: 0.9514



  0%|          | 0/6 [00:00<?, ?it/s][A
 17%|█▋        | 1/6 [00:02<00:12,  2.42s/it][A
 33%|███▎      | 2/6 [00:02<00:04,  1.07s/it][A
 50%|█████     | 3/6 [00:02<00:01,  1.59it/s][A
100%|██████████| 6/6 [00:04<00:00,  1.36it/s][A
Epochs:  82%|████████▏ | 58/71 [28:32<06:28, 29.91s/it]

Val Loss: 3.2844 - Val Accuracy: 0.9384



Training:   0%|          | 0/48 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/48 [00:02<01:53,  2.41s/it][A
Training:   4%|▍         | 2/48 [00:02<00:48,  1.06s/it][A
Training:  10%|█         | 5/48 [00:04<00:30,  1.42it/s][A
Training:  12%|█▎        | 6/48 [00:04<00:24,  1.74it/s][A
Training:  15%|█▍        | 7/48 [00:04<00:18,  2.19it/s][A
Training:  17%|█▋        | 8/48 [00:04<00:14,  2.75it/s][A
Training:  19%|█▉        | 9/48 [00:06<00:25,  1.55it/s][A
Training:  21%|██        | 10/48 [00:06<00:24,  1.57it/s][A
Training:  23%|██▎       | 11/48 [00:06<00:17,  2.07it/s][A
Training:  25%|██▌       | 12/48 [00:07<00:15,  2.31it/s][A
Training:  27%|██▋       | 13/48 [00:08<00:25,  1.38it/s][A
Training:  29%|██▉       | 14/48 [00:09<00:27,  1.22it/s][A
Training:  31%|███▏      | 15/48 [00:09<00:20,  1.60it/s][A
Training:  35%|███▌      | 17/48 [00:10<00:17,  1.81it/s][A
Training:  38%|███▊      | 18/48 [00:11<00:18,  1.63it/s][A
Training:  42%|████▏     | 20/48 [00:11

Epoch: 59/71 - Loss: 2.3716 - Accuracy: 0.9526



  0%|          | 0/6 [00:00<?, ?it/s][A
 17%|█▋        | 1/6 [00:02<00:12,  2.47s/it][A
 33%|███▎      | 2/6 [00:02<00:04,  1.11s/it][A
100%|██████████| 6/6 [00:04<00:00,  1.36it/s][A
Epochs:  83%|████████▎ | 59/71 [29:02<05:59, 29.94s/it]

Val Loss: 3.4321 - Val Accuracy: 0.9379



Training:   0%|          | 0/48 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/48 [00:02<01:54,  2.43s/it][A
Training:   4%|▍         | 2/48 [00:02<00:49,  1.08s/it][A
Training:   8%|▊         | 4/48 [00:02<00:20,  2.13it/s][A
Training:  10%|█         | 5/48 [00:04<00:37,  1.14it/s][A
Training:  17%|█▋        | 8/48 [00:04<00:15,  2.51it/s][A
Training:  21%|██        | 10/48 [00:06<00:22,  1.70it/s][A
Training:  23%|██▎       | 11/48 [00:06<00:18,  2.01it/s][A
Training:  27%|██▋       | 13/48 [00:08<00:23,  1.47it/s][A
Training:  31%|███▏      | 15/48 [00:08<00:15,  2.12it/s][A
Training:  35%|███▌      | 17/48 [00:10<00:19,  1.63it/s][A
Training:  38%|███▊      | 18/48 [00:10<00:15,  1.92it/s][A
Training:  42%|████▏     | 20/48 [00:10<00:10,  2.78it/s][A
Training:  44%|████▍     | 21/48 [00:12<00:17,  1.54it/s][A
Training:  50%|█████     | 24/48 [00:12<00:08,  2.70it/s][A
Training:  54%|█████▍    | 26/48 [00:14<00:11,  1.85it/s][A
Training:  56%|█████▋    | 27/48 [00:

Epoch: 60/71 - Loss: 2.4221 - Accuracy: 0.9518



  0%|          | 0/6 [00:00<?, ?it/s][A
 17%|█▋        | 1/6 [00:02<00:12,  2.44s/it][A
 33%|███▎      | 2/6 [00:02<00:04,  1.09s/it][A
100%|██████████| 6/6 [00:04<00:00,  1.38it/s][A
Epochs:  85%|████████▍ | 60/71 [29:30<05:23, 29.42s/it]

Val Loss: 3.3986 - Val Accuracy: 0.9390



Training:   0%|          | 0/48 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/48 [00:02<01:43,  2.21s/it][A
Training:   6%|▋         | 3/48 [00:02<00:28,  1.56it/s][A
Training:   8%|▊         | 4/48 [00:02<00:20,  2.18it/s][A
Training:  10%|█         | 5/48 [00:04<00:35,  1.20it/s][A
Training:  15%|█▍        | 7/48 [00:04<00:26,  1.56it/s][A
Training:  19%|█▉        | 9/48 [00:06<00:24,  1.58it/s][A
Training:  23%|██▎       | 11/48 [00:06<00:18,  1.95it/s][A
Training:  25%|██▌       | 12/48 [00:06<00:15,  2.32it/s][A
Training:  27%|██▋       | 13/48 [00:08<00:21,  1.64it/s][A
Training:  31%|███▏      | 15/48 [00:08<00:15,  2.08it/s][A
Training:  33%|███▎      | 16/48 [00:08<00:12,  2.50it/s][A
Training:  35%|███▌      | 17/48 [00:10<00:20,  1.53it/s][A
Training:  40%|███▉      | 19/48 [00:10<00:14,  2.02it/s][A
Training:  42%|████▏     | 20/48 [00:10<00:11,  2.46it/s][A
Training:  44%|████▍     | 21/48 [00:12<00:17,  1.53it/s][A
Training:  46%|████▌     | 22/48 [00:1

Epoch: 61/71 - Loss: 2.4078 - Accuracy: 0.9511



  0%|          | 0/6 [00:00<?, ?it/s][A
 17%|█▋        | 1/6 [00:02<00:11,  2.39s/it][A
 50%|█████     | 3/6 [00:02<00:02,  1.48it/s][A
 83%|████████▎ | 5/6 [00:03<00:00,  1.48it/s][A
100%|██████████| 6/6 [00:04<00:00,  1.32it/s][A
Epochs:  86%|████████▌ | 61/71 [30:00<04:55, 29.53s/it]

Val Loss: 3.4861 - Val Accuracy: 0.9394



Training:   0%|          | 0/48 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/48 [00:02<01:47,  2.29s/it][A
Training:   4%|▍         | 2/48 [00:02<00:46,  1.01s/it][A
Training:   8%|▊         | 4/48 [00:02<00:18,  2.35it/s][A
Training:  10%|█         | 5/48 [00:04<00:35,  1.20it/s][A
Training:  15%|█▍        | 7/48 [00:05<00:25,  1.63it/s][A
Training:  19%|█▉        | 9/48 [00:06<00:27,  1.43it/s][A
Training:  21%|██        | 10/48 [00:06<00:21,  1.76it/s][A
Training:  23%|██▎       | 11/48 [00:06<00:17,  2.15it/s][A
Training:  25%|██▌       | 12/48 [00:07<00:13,  2.67it/s][A
Training:  27%|██▋       | 13/48 [00:08<00:26,  1.34it/s][A
Training:  29%|██▉       | 14/48 [00:08<00:19,  1.75it/s][A
Training:  33%|███▎      | 16/48 [00:09<00:10,  2.92it/s][A
Training:  35%|███▌      | 17/48 [00:10<00:22,  1.40it/s][A
Training:  40%|███▉      | 19/48 [00:11<00:13,  2.16it/s][A
Training:  44%|████▍     | 21/48 [00:12<00:16,  1.59it/s][A
Training:  46%|████▌     | 22/48 [00:1

Epoch: 62/71 - Loss: 2.4019 - Accuracy: 0.9524



  0%|          | 0/6 [00:00<?, ?it/s][A
 17%|█▋        | 1/6 [00:02<00:11,  2.29s/it][A
 50%|█████     | 3/6 [00:02<00:01,  1.54it/s][A
100%|██████████| 6/6 [00:04<00:00,  1.34it/s][A
Epochs:  87%|████████▋ | 62/71 [30:29<04:24, 29.42s/it]

Val Loss: 3.4092 - Val Accuracy: 0.9383



Training:   0%|          | 0/48 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/48 [00:02<02:11,  2.79s/it][A
Training:   6%|▋         | 3/48 [00:02<00:35,  1.25it/s][A
Training:  10%|█         | 5/48 [00:05<00:39,  1.09it/s][A
Training:  15%|█▍        | 7/48 [00:05<00:23,  1.77it/s][A
Training:  19%|█▉        | 9/48 [00:07<00:27,  1.43it/s][A
Training:  21%|██        | 10/48 [00:07<00:23,  1.64it/s][A
Training:  27%|██▋       | 13/48 [00:09<00:21,  1.66it/s][A
Training:  29%|██▉       | 14/48 [00:09<00:18,  1.85it/s][A
Training:  35%|███▌      | 17/48 [00:11<00:18,  1.67it/s][A
Training:  42%|████▏     | 20/48 [00:11<00:10,  2.58it/s][A
Training:  44%|████▍     | 21/48 [00:13<00:16,  1.67it/s][A
Training:  48%|████▊     | 23/48 [00:13<00:11,  2.27it/s][A
Training:  52%|█████▏    | 25/48 [00:15<00:12,  1.82it/s][A
Training:  54%|█████▍    | 26/48 [00:15<00:10,  2.05it/s][A
Training:  58%|█████▊    | 28/48 [00:15<00:07,  2.86it/s][A
Training:  60%|██████    | 29/48 [00:

Epoch: 63/71 - Loss: 2.4560 - Accuracy: 0.9503



  0%|          | 0/6 [00:00<?, ?it/s][A
 17%|█▋        | 1/6 [00:02<00:12,  2.46s/it][A
 50%|█████     | 3/6 [00:02<00:02,  1.43it/s][A
100%|██████████| 6/6 [00:04<00:00,  1.42it/s][A
Epochs:  89%|████████▊ | 63/71 [30:58<03:54, 29.33s/it]

Val Loss: 3.2852 - Val Accuracy: 0.9402



Training:   0%|          | 0/48 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/48 [00:02<01:56,  2.48s/it][A
Training:   8%|▊         | 4/48 [00:02<00:22,  1.92it/s][A
Training:  10%|█         | 5/48 [00:04<00:38,  1.10it/s][A
Training:  12%|█▎        | 6/48 [00:05<00:33,  1.27it/s][A
Training:  15%|█▍        | 7/48 [00:05<00:24,  1.66it/s][A
Training:  19%|█▉        | 9/48 [00:07<00:32,  1.22it/s][A
Training:  23%|██▎       | 11/48 [00:07<00:19,  1.90it/s][A
Training:  27%|██▋       | 13/48 [00:09<00:22,  1.53it/s][A
Training:  31%|███▏      | 15/48 [00:09<00:14,  2.21it/s][A
Training:  35%|███▌      | 17/48 [00:11<00:18,  1.68it/s][A
Training:  40%|███▉      | 19/48 [00:11<00:12,  2.33it/s][A
Training:  44%|████▍     | 21/48 [00:13<00:15,  1.71it/s][A
Training:  48%|████▊     | 23/48 [00:13<00:10,  2.33it/s][A
Training:  52%|█████▏    | 25/48 [00:15<00:13,  1.76it/s][A
Training:  54%|█████▍    | 26/48 [00:15<00:10,  2.04it/s][A
Training:  56%|█████▋    | 27/48 [00:1

Epoch: 64/71 - Loss: 2.4527 - Accuracy: 0.9519



  0%|          | 0/6 [00:00<?, ?it/s][A
 17%|█▋        | 1/6 [00:02<00:11,  2.20s/it][A
 50%|█████     | 3/6 [00:02<00:01,  1.60it/s][A
100%|██████████| 6/6 [00:04<00:00,  1.45it/s][A
Epochs:  90%|█████████ | 64/71 [31:28<03:25, 29.36s/it]

Val Loss: 3.2501 - Val Accuracy: 0.9423



Training:   0%|          | 0/48 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/48 [00:02<01:55,  2.46s/it][A
Training:   4%|▍         | 2/48 [00:02<00:49,  1.09s/it][A
Training:   8%|▊         | 4/48 [00:02<00:19,  2.20it/s][A
Training:  10%|█         | 5/48 [00:04<00:36,  1.18it/s][A
Training:  12%|█▎        | 6/48 [00:04<00:26,  1.61it/s][A
Training:  17%|█▋        | 8/48 [00:04<00:14,  2.67it/s][A
Training:  19%|█▉        | 9/48 [00:06<00:32,  1.20it/s][A
Training:  27%|██▋       | 13/48 [00:08<00:21,  1.64it/s][A
Training:  29%|██▉       | 14/48 [00:08<00:17,  1.91it/s][A
Training:  35%|███▌      | 17/48 [00:10<00:17,  1.82it/s][A
Training:  40%|███▉      | 19/48 [00:10<00:12,  2.41it/s][A
Training:  42%|████▏     | 20/48 [00:10<00:10,  2.75it/s][A
Training:  44%|████▍     | 21/48 [00:12<00:15,  1.70it/s][A
Training:  48%|████▊     | 23/48 [00:12<00:10,  2.42it/s][A
Training:  52%|█████▏    | 25/48 [00:14<00:11,  1.92it/s][A
Training:  54%|█████▍    | 26/48 [00:14

Epoch: 65/71 - Loss: 2.6452 - Accuracy: 0.9474



  0%|          | 0/6 [00:00<?, ?it/s][A
 17%|█▋        | 1/6 [00:02<00:11,  2.35s/it][A
 67%|██████▋   | 4/6 [00:02<00:00,  2.09it/s][A
100%|██████████| 6/6 [00:04<00:00,  1.43it/s][A
Epochs:  92%|█████████▏| 65/71 [31:56<02:54, 29.02s/it]

Val Loss: 3.7872 - Val Accuracy: 0.9360



Training:   0%|          | 0/48 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/48 [00:02<01:50,  2.34s/it][A
Training:   4%|▍         | 2/48 [00:02<00:47,  1.03s/it][A
Training:   6%|▋         | 3/48 [00:02<00:27,  1.64it/s][A
Training:   8%|▊         | 4/48 [00:02<00:18,  2.40it/s][A
Training:  10%|█         | 5/48 [00:04<00:38,  1.11it/s][A
Training:  12%|█▎        | 6/48 [00:04<00:26,  1.58it/s][A
Training:  15%|█▍        | 7/48 [00:04<00:19,  2.14it/s][A
Training:  17%|█▋        | 8/48 [00:04<00:15,  2.58it/s][A
Training:  19%|█▉        | 9/48 [00:06<00:24,  1.62it/s][A
Training:  21%|██        | 10/48 [00:06<00:18,  2.08it/s][A
Training:  23%|██▎       | 11/48 [00:06<00:16,  2.28it/s][A
Training:  27%|██▋       | 13/48 [00:07<00:19,  1.82it/s][A
Training:  29%|██▉       | 14/48 [00:08<00:15,  2.13it/s][A
Training:  31%|███▏      | 15/48 [00:08<00:15,  2.19it/s][A
Training:  33%|███▎      | 16/48 [00:08<00:11,  2.74it/s][A
Training:  35%|███▌      | 17/48 [00:09<0

Epoch: 66/71 - Loss: 2.6557 - Accuracy: 0.9449



  0%|          | 0/6 [00:00<?, ?it/s][A
 17%|█▋        | 1/6 [00:02<00:10,  2.08s/it][A
 33%|███▎      | 2/6 [00:02<00:03,  1.09it/s][A
 50%|█████     | 3/6 [00:02<00:02,  1.22it/s][A
100%|██████████| 6/6 [00:04<00:00,  1.41it/s][A
Epochs:  93%|█████████▎| 66/71 [32:24<02:23, 28.69s/it]

Val Loss: 3.2428 - Val Accuracy: 0.9406



Training:   0%|          | 0/48 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/48 [00:02<01:59,  2.55s/it][A
Training:   4%|▍         | 2/48 [00:02<00:51,  1.13s/it][A
Training:   6%|▋         | 3/48 [00:02<00:29,  1.51it/s][A
Training:  10%|█         | 5/48 [00:04<00:30,  1.39it/s][A
Training:  12%|█▎        | 6/48 [00:04<00:25,  1.65it/s][A
Training:  17%|█▋        | 8/48 [00:04<00:14,  2.79it/s][A
Training:  19%|█▉        | 9/48 [00:06<00:24,  1.61it/s][A
Training:  21%|██        | 10/48 [00:06<00:23,  1.60it/s][A
Training:  25%|██▌       | 12/48 [00:07<00:14,  2.52it/s][A
Training:  27%|██▋       | 13/48 [00:08<00:18,  1.86it/s][A
Training:  29%|██▉       | 14/48 [00:08<00:20,  1.64it/s][A
Training:  31%|███▏      | 15/48 [00:08<00:15,  2.07it/s][A
Training:  35%|███▌      | 17/48 [00:10<00:15,  2.00it/s][A
Training:  38%|███▊      | 18/48 [00:10<00:16,  1.82it/s][A
Training:  42%|████▏     | 20/48 [00:10<00:09,  2.84it/s][A
Training:  44%|████▍     | 21/48 [00:11

Epoch: 67/71 - Loss: 2.3828 - Accuracy: 0.9529



  0%|          | 0/6 [00:00<?, ?it/s][A
 17%|█▋        | 1/6 [00:02<00:12,  2.47s/it][A
 50%|█████     | 3/6 [00:02<00:02,  1.43it/s][A
100%|██████████| 6/6 [00:04<00:00,  1.36it/s][A
Epochs:  94%|█████████▍| 67/71 [32:53<01:54, 28.68s/it]

Val Loss: 3.2917 - Val Accuracy: 0.9418



Training:   0%|          | 0/48 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/48 [00:02<02:02,  2.61s/it][A
Training:   6%|▋         | 3/48 [00:02<00:32,  1.37it/s][A
Training:   8%|▊         | 4/48 [00:02<00:22,  1.94it/s][A
Training:  10%|█         | 5/48 [00:04<00:39,  1.08it/s][A
Training:  15%|█▍        | 7/48 [00:04<00:21,  1.91it/s][A
Training:  17%|█▋        | 8/48 [00:04<00:16,  2.40it/s][A
Training:  19%|█▉        | 9/48 [00:06<00:28,  1.37it/s][A
Training:  25%|██▌       | 12/48 [00:06<00:13,  2.71it/s][A
Training:  27%|██▋       | 13/48 [00:08<00:21,  1.66it/s][A
Training:  31%|███▏      | 15/48 [00:08<00:13,  2.43it/s][A
Training:  33%|███▎      | 16/48 [00:08<00:11,  2.87it/s][A
Training:  35%|███▌      | 17/48 [00:09<00:16,  1.84it/s][A
Training:  38%|███▊      | 18/48 [00:09<00:13,  2.30it/s][A
Training:  42%|████▏     | 20/48 [00:10<00:08,  3.16it/s][A
Training:  44%|████▍     | 21/48 [00:11<00:15,  1.75it/s][A
Training:  48%|████▊     | 23/48 [00:11

Epoch: 68/71 - Loss: 2.3291 - Accuracy: 0.9533



  0%|          | 0/6 [00:00<?, ?it/s][A
 17%|█▋        | 1/6 [00:02<00:14,  2.88s/it][A
 50%|█████     | 3/6 [00:03<00:02,  1.15it/s][A
 67%|██████▋   | 4/6 [00:03<00:01,  1.43it/s][A
100%|██████████| 6/6 [00:04<00:00,  1.29it/s][A
Epochs:  96%|█████████▌| 68/71 [33:20<01:25, 28.45s/it]

Val Loss: 3.4084 - Val Accuracy: 0.9345



Training:   0%|          | 0/48 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/48 [00:02<02:14,  2.87s/it][A
Training:   4%|▍         | 2/48 [00:03<01:02,  1.36s/it][A
Training:   6%|▋         | 3/48 [00:03<00:35,  1.26it/s][A
Training:  10%|█         | 5/48 [00:04<00:33,  1.29it/s][A
Training:  12%|█▎        | 6/48 [00:05<00:26,  1.57it/s][A
Training:  19%|█▉        | 9/48 [00:06<00:23,  1.66it/s][A
Training:  21%|██        | 10/48 [00:07<00:19,  1.91it/s][A
Training:  23%|██▎       | 11/48 [00:07<00:16,  2.31it/s][A
Training:  27%|██▋       | 13/48 [00:08<00:18,  1.84it/s][A
Training:  29%|██▉       | 14/48 [00:08<00:15,  2.23it/s][A
Training:  33%|███▎      | 16/48 [00:08<00:09,  3.33it/s][A
Training:  35%|███▌      | 17/48 [00:10<00:18,  1.69it/s][A
Training:  38%|███▊      | 18/48 [00:10<00:14,  2.10it/s][A
Training:  42%|████▏     | 20/48 [00:10<00:08,  3.21it/s][A
Training:  44%|████▍     | 21/48 [00:12<00:16,  1.64it/s][A
Training:  46%|████▌     | 22/48 [00:1

Epoch: 69/71 - Loss: 2.4174 - Accuracy: 0.9503



  0%|          | 0/6 [00:00<?, ?it/s][A
 17%|█▋        | 1/6 [00:02<00:12,  2.44s/it][A
 33%|███▎      | 2/6 [00:02<00:04,  1.16s/it][A
 50%|█████     | 3/6 [00:02<00:02,  1.34it/s][A
 67%|██████▋   | 4/6 [00:03<00:01,  1.44it/s][A
100%|██████████| 6/6 [00:04<00:00,  1.39it/s][A
Epochs:  97%|█████████▋| 69/71 [33:49<00:56, 28.39s/it]

Val Loss: 3.2562 - Val Accuracy: 0.9402



Training:   0%|          | 0/48 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/48 [00:03<02:29,  3.17s/it][A
Training:   6%|▋         | 3/48 [00:03<00:39,  1.15it/s][A
Training:  10%|█         | 5/48 [00:05<00:38,  1.11it/s][A
Training:  12%|█▎        | 6/48 [00:05<00:28,  1.46it/s][A
Training:  17%|█▋        | 8/48 [00:05<00:16,  2.43it/s][A
Training:  21%|██        | 10/48 [00:07<00:22,  1.69it/s][A
Training:  25%|██▌       | 12/48 [00:07<00:14,  2.49it/s][A
Training:  29%|██▉       | 14/48 [00:08<00:18,  1.83it/s][A
Training:  31%|███▏      | 15/48 [00:09<00:15,  2.17it/s][A
Training:  35%|███▌      | 17/48 [00:10<00:18,  1.65it/s][A
Training:  42%|████▏     | 20/48 [00:10<00:10,  2.74it/s][A
Training:  46%|████▌     | 22/48 [00:12<00:12,  2.02it/s][A
Training:  52%|█████▏    | 25/48 [00:14<00:12,  1.80it/s][A
Training:  54%|█████▍    | 26/48 [00:14<00:10,  2.06it/s][A
Training:  60%|██████    | 29/48 [00:16<00:10,  1.78it/s][A
Training:  65%|██████▍   | 31/48 [00:

Epoch: 70/71 - Loss: 2.3260 - Accuracy: 0.9538



  0%|          | 0/6 [00:00<?, ?it/s][A
 17%|█▋        | 1/6 [00:02<00:13,  2.72s/it][A
 33%|███▎      | 2/6 [00:02<00:04,  1.19s/it][A
 67%|██████▋   | 4/6 [00:03<00:01,  1.97it/s][A
 83%|████████▎ | 5/6 [00:04<00:00,  1.27it/s][A
100%|██████████| 6/6 [00:04<00:00,  1.27it/s][A
Epochs:  99%|█████████▊| 70/71 [34:18<00:28, 28.58s/it]

Val Loss: 3.4542 - Val Accuracy: 0.9402



Training:   0%|          | 0/48 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/48 [00:03<02:36,  3.33s/it][A
Training:   4%|▍         | 2/48 [00:03<01:06,  1.44s/it][A
Training:   8%|▊         | 4/48 [00:03<00:25,  1.75it/s][A
Training:  12%|█▎        | 6/48 [00:05<00:31,  1.35it/s][A
Training:  15%|█▍        | 7/48 [00:05<00:24,  1.70it/s][A
Training:  17%|█▋        | 8/48 [00:05<00:18,  2.18it/s][A
Training:  19%|█▉        | 9/48 [00:07<00:27,  1.42it/s][A
Training:  21%|██        | 10/48 [00:07<00:20,  1.87it/s][A
Training:  23%|██▎       | 11/48 [00:07<00:15,  2.35it/s][A
Training:  25%|██▌       | 12/48 [00:07<00:11,  3.00it/s][A
Training:  27%|██▋       | 13/48 [00:08<00:23,  1.47it/s][A
Training:  29%|██▉       | 14/48 [00:09<00:17,  1.93it/s][A
Training:  31%|███▏      | 15/48 [00:09<00:13,  2.44it/s][A
Training:  35%|███▌      | 17/48 [00:10<00:17,  1.78it/s][A
Training:  42%|████▏     | 20/48 [00:10<00:08,  3.26it/s][A
Training:  44%|████▍     | 21/48 [00:12

Epoch: 71/71 - Loss: 2.3277 - Accuracy: 0.9531



  0%|          | 0/6 [00:00<?, ?it/s][A
 17%|█▋        | 1/6 [00:02<00:14,  2.94s/it][A
 50%|█████     | 3/6 [00:03<00:02,  1.21it/s][A
100%|██████████| 6/6 [00:04<00:00,  1.24it/s][A
Epochs: 100%|██████████| 71/71 [34:47<00:00, 29.40s/it]


Val Loss: 3.3994 - Val Accuracy: 0.9373
Saving best model...


[32m[I 2023-12-14 22:51:00,887][0m Trial 0 finished with value: 0.9373385310173035 and parameters: {'loss_learning_rate': 0.0007572018927627318, 'learning_rate': 0.0013729418906665127, 'weight_decay': 0.006436609159123359, 'epsilon': 9.49605063494801e-08, 'batch_size': 296, 'epochs': 71}. Best is trial 0 with value: 0.9373385310173035.[0m


Learning rate for Loss: 0.00015990828325747049
Learning rate: 0.005697946086593603
Weight decay: 0.0001473649085987928
Epsilon: 4.963406823015153e-09
Batch size: 77
Number of epochs: 12


Epochs:   0%|          | 0/12 [00:00<?, ?it/s]
Training:   0%|          | 0/182 [00:00<?, ?it/s][A
Training:   1%|          | 1/182 [00:00<02:25,  1.24it/s][A
Training:   2%|▏         | 4/182 [00:00<00:32,  5.50it/s][A
Training:   3%|▎         | 6/182 [00:01<00:33,  5.25it/s][A
Training:   5%|▍         | 9/182 [00:01<00:29,  5.77it/s][A
Training:   7%|▋         | 12/182 [00:01<00:19,  8.54it/s][A
Training:   8%|▊         | 14/182 [00:02<00:22,  7.48it/s][A
Training:   9%|▉         | 17/182 [00:02<00:22,  7.23it/s][A
Training:  12%|█▏        | 21/182 [00:03<00:21,  7.64it/s][A
Training:  14%|█▎        | 25/182 [00:03<00:21,  7.28it/s][A
Training:  15%|█▌        | 28/182 [00:03<00:17,  8.99it/s][A
Training:  16%|█▋        | 30/182 [00:04<00:21,  7.07it/s][A
Training:  18%|█▊        | 32/182 [00:04<00:18,  8.14it/s][A
Training:  19%|█▊        | 34/182 [00:04<00:22,  6.69it/s][A
Training:  20%|█▉        | 36/182 [00:05<00:18,  7.98it/s][A
Training:  21%|██        | 38/182 [0

Epoch: 1/12 - Loss: 9.5630 - Accuracy: 0.8386



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:17,  1.25it/s][A
 17%|█▋        | 4/23 [00:00<00:03,  5.49it/s][A
 26%|██▌       | 6/23 [00:01<00:03,  5.17it/s][A
 35%|███▍      | 8/23 [00:01<00:02,  6.92it/s][A
 43%|████▎     | 10/23 [00:01<00:02,  6.03it/s][A
 57%|█████▋    | 13/23 [00:02<00:01,  6.16it/s][A
 65%|██████▌   | 15/23 [00:02<00:01,  7.49it/s][A
 74%|███████▍  | 17/23 [00:02<00:00,  7.34it/s][A
 83%|████████▎ | 19/23 [00:03<00:00,  7.13it/s][A
 91%|█████████▏| 21/23 [00:03<00:00,  7.24it/s][A
100%|██████████| 23/23 [00:03<00:00,  6.55it/s][A
Epochs:   8%|▊         | 1/12 [00:26<04:56, 26.97s/it]

Val Loss: 7.3239 - Val Accuracy: 0.8565



Training:   0%|          | 0/182 [00:00<?, ?it/s][A
Training:   1%|          | 1/182 [00:00<02:45,  1.09it/s][A
Training:   2%|▏         | 3/182 [00:01<00:50,  3.52it/s][A
Training:   3%|▎         | 5/182 [00:01<00:39,  4.45it/s][A
Training:   4%|▍         | 8/182 [00:01<00:22,  7.63it/s][A
Training:   5%|▌         | 10/182 [00:01<00:28,  6.01it/s][A
Training:   7%|▋         | 13/182 [00:02<00:27,  6.11it/s][A
Training:   9%|▉         | 17/182 [00:02<00:24,  6.82it/s][A
Training:  11%|█         | 20/182 [00:03<00:17,  9.02it/s][A
Training:  12%|█▏        | 22/182 [00:03<00:21,  7.60it/s][A
Training:  14%|█▎        | 25/182 [00:03<00:21,  7.20it/s][A
Training:  16%|█▌        | 29/182 [00:04<00:20,  7.41it/s][A
Training:  18%|█▊        | 33/182 [00:04<00:18,  8.05it/s][A
Training:  20%|██        | 37/182 [00:05<00:16,  8.57it/s][A
Training:  21%|██        | 38/182 [00:05<00:17,  8.28it/s][A
Training:  22%|██▏       | 40/182 [00:05<00:14,  9.55it/s][A
Training:  23%|██▎  

Epoch: 2/12 - Loss: 4.7988 - Accuracy: 0.9065



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:21,  1.01it/s][A
 17%|█▋        | 4/23 [00:01<00:04,  4.62it/s][A
 26%|██▌       | 6/23 [00:01<00:03,  4.94it/s][A
 35%|███▍      | 8/23 [00:01<00:02,  6.87it/s][A
 43%|████▎     | 10/23 [00:02<00:02,  5.50it/s][A
 57%|█████▋    | 13/23 [00:02<00:01,  5.52it/s][A
 74%|███████▍  | 17/23 [00:03<00:00,  6.35it/s][A
100%|██████████| 23/23 [00:03<00:00,  6.17it/s][A
Epochs:  17%|█▋        | 2/12 [00:54<04:33, 27.40s/it]

Val Loss: 4.1475 - Val Accuracy: 0.9130



Training:   0%|          | 0/182 [00:00<?, ?it/s][A
Training:   1%|          | 1/182 [00:00<02:44,  1.10it/s][A
Training:   2%|▏         | 3/182 [00:01<00:52,  3.44it/s][A
Training:   3%|▎         | 5/182 [00:01<00:39,  4.44it/s][A
Training:   4%|▍         | 7/182 [00:01<00:27,  6.29it/s][A
Training:   5%|▍         | 9/182 [00:02<00:34,  5.00it/s][A
Training:   7%|▋         | 13/182 [00:02<00:27,  6.16it/s][A
Training:   9%|▉         | 17/182 [00:02<00:22,  7.47it/s][A
Training:  11%|█         | 20/182 [00:03<00:16,  9.62it/s][A
Training:  12%|█▏        | 22/182 [00:03<00:18,  8.85it/s][A
Training:  14%|█▎        | 25/182 [00:03<00:20,  7.85it/s][A
Training:  15%|█▍        | 27/182 [00:03<00:17,  8.83it/s][A
Training:  16%|█▌        | 29/182 [00:04<00:18,  8.30it/s][A
Training:  18%|█▊        | 32/182 [00:04<00:14, 10.08it/s][A
Training:  19%|█▊        | 34/182 [00:04<00:18,  8.17it/s][A
Training:  20%|█▉        | 36/182 [00:04<00:16,  8.94it/s][A
Training:  21%|██    

Epoch: 3/12 - Loss: 4.2397 - Accuracy: 0.9163



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:20,  1.10it/s][A
 13%|█▎        | 3/23 [00:01<00:05,  3.45it/s][A
 22%|██▏       | 5/23 [00:01<00:03,  4.69it/s][A
 30%|███       | 7/23 [00:01<00:02,  6.52it/s][A
 39%|███▉      | 9/23 [00:01<00:02,  6.22it/s][A
 52%|█████▏    | 12/23 [00:01<00:01,  8.81it/s][A
 61%|██████    | 14/23 [00:02<00:01,  6.98it/s][A
 74%|███████▍  | 17/23 [00:02<00:00,  7.69it/s][A
 78%|███████▊  | 18/23 [00:02<00:00,  7.25it/s][A
100%|██████████| 23/23 [00:03<00:00,  6.73it/s][A
Epochs:  25%|██▌       | 3/12 [01:21<04:06, 27.35s/it]

Val Loss: 3.8109 - Val Accuracy: 0.9221



Training:   0%|          | 0/182 [00:00<?, ?it/s][A
Training:   1%|          | 1/182 [00:00<02:36,  1.16it/s][A
Training:   2%|▏         | 4/182 [00:00<00:34,  5.17it/s][A
Training:   3%|▎         | 6/182 [00:01<00:39,  4.48it/s][A
Training:   5%|▍         | 9/182 [00:02<00:36,  4.75it/s][A
Training:   6%|▌         | 11/182 [00:02<00:27,  6.21it/s][A
Training:   7%|▋         | 13/182 [00:02<00:28,  5.89it/s][A
Training:   9%|▉         | 16/182 [00:02<00:19,  8.45it/s][A
Training:  10%|▉         | 18/182 [00:02<00:20,  8.10it/s][A
Training:  12%|█▏        | 21/182 [00:03<00:20,  7.88it/s][A
Training:  13%|█▎        | 23/182 [00:03<00:17,  9.04it/s][A
Training:  14%|█▎        | 25/182 [00:03<00:20,  7.67it/s][A
Training:  15%|█▌        | 28/182 [00:04<00:15,  9.98it/s][A
Training:  16%|█▋        | 30/182 [00:04<00:22,  6.85it/s][A
Training:  18%|█▊        | 32/182 [00:04<00:18,  8.27it/s][A
Training:  19%|█▊        | 34/182 [00:05<00:21,  6.91it/s][A
Training:  20%|█▉   

Epoch: 4/12 - Loss: 3.8191 - Accuracy: 0.9271



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:19,  1.12it/s][A
 17%|█▋        | 4/23 [00:01<00:04,  4.73it/s][A
 26%|██▌       | 6/23 [00:01<00:03,  4.96it/s][A
 39%|███▉      | 9/23 [00:01<00:02,  5.33it/s][A
 52%|█████▏    | 12/23 [00:02<00:01,  7.48it/s][A
 61%|██████    | 14/23 [00:02<00:01,  6.62it/s][A
 65%|██████▌   | 15/23 [00:02<00:01,  6.50it/s][A
 74%|███████▍  | 17/23 [00:03<00:01,  5.79it/s][A
 83%|████████▎ | 19/23 [00:03<00:00,  7.11it/s][A
100%|██████████| 23/23 [00:03<00:00,  5.90it/s][A
Epochs:  33%|███▎      | 4/12 [01:49<03:40, 27.54s/it]

Val Loss: 3.9813 - Val Accuracy: 0.9297



Training:   0%|          | 0/182 [00:00<?, ?it/s][A
Training:   1%|          | 1/182 [00:00<02:46,  1.09it/s][A
Training:   2%|▏         | 3/182 [00:01<00:50,  3.55it/s][A
Training:   3%|▎         | 5/182 [00:01<00:41,  4.29it/s][A
Training:   4%|▍         | 8/182 [00:01<00:22,  7.67it/s][A
Training:   5%|▌         | 10/182 [00:01<00:27,  6.18it/s][A
Training:   7%|▋         | 13/182 [00:02<00:23,  7.08it/s][A
Training:   8%|▊         | 15/182 [00:02<00:20,  8.05it/s][A
Training:   9%|▉         | 17/182 [00:02<00:21,  7.76it/s][A
Training:  10%|▉         | 18/182 [00:02<00:21,  7.70it/s][A
Training:  12%|█▏        | 21/182 [00:03<00:20,  7.99it/s][A
Training:  13%|█▎        | 24/182 [00:03<00:14, 10.95it/s][A
Training:  14%|█▍        | 26/182 [00:03<00:17,  9.04it/s][A
Training:  16%|█▌        | 29/182 [00:04<00:16,  9.06it/s][A
Training:  17%|█▋        | 31/182 [00:04<00:14, 10.31it/s][A
Training:  18%|█▊        | 33/182 [00:04<00:16,  9.30it/s][A
Training:  19%|█▉   

Epoch: 5/12 - Loss: 3.8157 - Accuracy: 0.9243



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:18,  1.22it/s][A
 13%|█▎        | 3/23 [00:00<00:05,  3.96it/s][A
 22%|██▏       | 5/23 [00:01<00:03,  5.11it/s][A
 26%|██▌       | 6/23 [00:01<00:03,  5.36it/s][A
 39%|███▉      | 9/23 [00:01<00:02,  6.34it/s][A
 43%|████▎     | 10/23 [00:01<00:02,  6.31it/s][A
 57%|█████▋    | 13/23 [00:02<00:01,  6.10it/s][A
 74%|███████▍  | 17/23 [00:02<00:00,  7.02it/s][A
100%|██████████| 23/23 [00:03<00:00,  6.35it/s][A
Epochs:  42%|████▏     | 5/12 [02:17<03:12, 27.44s/it]

Val Loss: 3.9200 - Val Accuracy: 0.9218



Training:   0%|          | 0/182 [00:00<?, ?it/s][A
Training:   1%|          | 1/182 [00:00<02:45,  1.09it/s][A
Training:   2%|▏         | 3/182 [00:01<00:49,  3.59it/s][A
Training:   3%|▎         | 5/182 [00:01<00:39,  4.44it/s][A
Training:   4%|▍         | 8/182 [00:01<00:21,  7.96it/s][A
Training:   5%|▌         | 10/182 [00:01<00:27,  6.29it/s][A
Training:   7%|▋         | 12/182 [00:02<00:21,  7.84it/s][A
Training:   8%|▊         | 14/182 [00:02<00:23,  7.03it/s][A
Training:   9%|▉         | 16/182 [00:02<00:20,  8.29it/s][A
Training:  10%|▉         | 18/182 [00:02<00:22,  7.22it/s][A
Training:  11%|█         | 20/182 [00:03<00:18,  8.89it/s][A
Training:  12%|█▏        | 22/182 [00:03<00:23,  6.69it/s][A
Training:  13%|█▎        | 24/182 [00:03<00:19,  8.13it/s][A
Training:  14%|█▍        | 26/182 [00:04<00:22,  6.88it/s][A
Training:  15%|█▍        | 27/182 [00:04<00:21,  7.10it/s][A
Training:  16%|█▌        | 29/182 [00:04<00:22,  6.91it/s][A
Training:  18%|█▊   

Epoch: 6/12 - Loss: 3.5845 - Accuracy: 0.9293



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:20,  1.08it/s][A
 22%|██▏       | 5/23 [00:01<00:04,  4.21it/s][A
 35%|███▍      | 8/23 [00:01<00:02,  6.82it/s][A
 43%|████▎     | 10/23 [00:01<00:02,  6.38it/s][A
 48%|████▊     | 11/23 [00:02<00:01,  6.65it/s][A
 57%|█████▋    | 13/23 [00:02<00:01,  6.19it/s][A
 65%|██████▌   | 15/23 [00:02<00:01,  6.83it/s][A
 74%|███████▍  | 17/23 [00:02<00:00,  6.94it/s][A
 83%|████████▎ | 19/23 [00:03<00:00,  7.58it/s][A
100%|██████████| 23/23 [00:03<00:00,  6.67it/s][A
Epochs:  50%|█████     | 6/12 [02:43<02:43, 27.20s/it]

Val Loss: 3.9438 - Val Accuracy: 0.9212



Training:   0%|          | 0/182 [00:00<?, ?it/s][A
Training:   1%|          | 1/182 [00:00<02:44,  1.10it/s][A
Training:   2%|▏         | 4/182 [00:01<00:36,  4.88it/s][A
Training:   3%|▎         | 6/182 [00:01<00:36,  4.79it/s][A
Training:   5%|▍         | 9/182 [00:02<00:36,  4.78it/s][A
Training:   7%|▋         | 12/182 [00:02<00:23,  7.10it/s][A
Training:   8%|▊         | 14/182 [00:02<00:28,  5.98it/s][A
Training:   9%|▉         | 17/182 [00:03<00:27,  6.01it/s][A
Training:  12%|█▏        | 21/182 [00:03<00:24,  6.47it/s][A
Training:  14%|█▎        | 25/182 [00:04<00:23,  6.56it/s][A
Training:  16%|█▌        | 29/182 [00:04<00:22,  6.77it/s][A
Training:  18%|█▊        | 32/182 [00:05<00:17,  8.37it/s][A
Training:  19%|█▊        | 34/182 [00:05<00:20,  7.12it/s][A
Training:  20%|██        | 37/182 [00:05<00:21,  6.61it/s][A
Training:  23%|██▎       | 41/182 [00:06<00:19,  7.24it/s][A
Training:  24%|██▍       | 44/182 [00:06<00:15,  8.99it/s][A
Training:  25%|██▌  

Epoch: 7/12 - Loss: 3.6910 - Accuracy: 0.9228



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:01<00:22,  1.04s/it][A
 22%|██▏       | 5/23 [00:01<00:05,  3.35it/s][A
 35%|███▍      | 8/23 [00:01<00:02,  5.78it/s][A
 43%|████▎     | 10/23 [00:02<00:02,  5.50it/s][A
 57%|█████▋    | 13/23 [00:02<00:01,  5.45it/s][A
 70%|██████▉   | 16/23 [00:02<00:00,  7.70it/s][A
 78%|███████▊  | 18/23 [00:03<00:00,  6.92it/s][A
100%|██████████| 23/23 [00:03<00:00,  5.97it/s][A
Epochs:  58%|█████▊    | 7/12 [03:11<02:16, 27.37s/it]

Val Loss: 3.7473 - Val Accuracy: 0.9277



Training:   0%|          | 0/182 [00:00<?, ?it/s][A
Training:   1%|          | 1/182 [00:00<02:44,  1.10it/s][A
Training:   2%|▏         | 3/182 [00:01<00:51,  3.47it/s][A
Training:   3%|▎         | 5/182 [00:01<00:41,  4.32it/s][A
Training:   4%|▍         | 7/182 [00:01<00:28,  6.24it/s][A
Training:   5%|▍         | 9/182 [00:01<00:29,  5.79it/s][A
Training:   6%|▌         | 11/182 [00:02<00:23,  7.31it/s][A
Training:   7%|▋         | 13/182 [00:02<00:26,  6.34it/s][A
Training:   8%|▊         | 14/182 [00:02<00:26,  6.30it/s][A
Training:   9%|▉         | 17/182 [00:02<00:21,  7.73it/s][A
Training:  10%|▉         | 18/182 [00:03<00:25,  6.51it/s][A
Training:  11%|█         | 20/182 [00:03<00:19,  8.34it/s][A
Training:  12%|█▏        | 22/182 [00:03<00:24,  6.61it/s][A
Training:  13%|█▎        | 24/182 [00:03<00:19,  8.20it/s][A
Training:  14%|█▍        | 26/182 [00:04<00:23,  6.55it/s][A
Training:  16%|█▌        | 29/182 [00:04<00:18,  8.40it/s][A
Training:  17%|█▋    

Epoch: 8/12 - Loss: 3.6998 - Accuracy: 0.9213



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:01<00:23,  1.08s/it][A
  9%|▊         | 2/23 [00:01<00:10,  1.94it/s][A
 22%|██▏       | 5/23 [00:01<00:04,  4.31it/s][A
 26%|██▌       | 6/23 [00:01<00:03,  4.98it/s][A
 39%|███▉      | 9/23 [00:02<00:02,  5.72it/s][A
 57%|█████▋    | 13/23 [00:02<00:01,  6.48it/s][A
 70%|██████▉   | 16/23 [00:02<00:00,  8.61it/s][A
 78%|███████▊  | 18/23 [00:03<00:00,  7.22it/s][A
 87%|████████▋ | 20/23 [00:03<00:00,  8.67it/s][A
100%|██████████| 23/23 [00:03<00:00,  6.08it/s][A
Epochs:  67%|██████▋   | 8/12 [03:39<01:50, 27.64s/it]

Val Loss: 3.8913 - Val Accuracy: 0.9350



Training:   0%|          | 0/182 [00:00<?, ?it/s][A
Training:   1%|          | 1/182 [00:00<02:41,  1.12it/s][A
Training:   2%|▏         | 3/182 [00:01<00:51,  3.49it/s][A
Training:   3%|▎         | 5/182 [00:01<00:39,  4.45it/s][A
Training:   4%|▍         | 7/182 [00:01<00:26,  6.57it/s][A
Training:   5%|▍         | 9/182 [00:01<00:27,  6.18it/s][A
Training:   6%|▌         | 11/182 [00:01<00:21,  7.96it/s][A
Training:   7%|▋         | 13/182 [00:02<00:26,  6.49it/s][A
Training:   8%|▊         | 15/182 [00:02<00:20,  8.10it/s][A
Training:   9%|▉         | 17/182 [00:02<00:25,  6.48it/s][A
Training:  10%|█         | 19/182 [00:03<00:20,  8.04it/s][A
Training:  12%|█▏        | 21/182 [00:03<00:23,  6.95it/s][A
Training:  13%|█▎        | 23/182 [00:03<00:19,  8.13it/s][A
Training:  14%|█▎        | 25/182 [00:03<00:23,  6.73it/s][A
Training:  15%|█▌        | 28/182 [00:04<00:18,  8.13it/s][A
Training:  16%|█▌        | 29/182 [00:04<00:20,  7.56it/s][A
Training:  17%|█▋    

Epoch: 9/12 - Loss: 3.5056 - Accuracy: 0.9285



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:20,  1.05it/s][A
 22%|██▏       | 5/23 [00:01<00:04,  4.21it/s][A
 39%|███▉      | 9/23 [00:01<00:02,  5.43it/s][A
 48%|████▊     | 11/23 [00:02<00:01,  6.60it/s][A
 57%|█████▋    | 13/23 [00:02<00:01,  6.05it/s][A
 65%|██████▌   | 15/23 [00:02<00:01,  6.73it/s][A
 74%|███████▍  | 17/23 [00:02<00:00,  6.90it/s][A
 83%|████████▎ | 19/23 [00:03<00:00,  7.78it/s][A
 91%|█████████▏| 21/23 [00:03<00:00,  7.61it/s][A
100%|██████████| 23/23 [00:03<00:00,  6.31it/s][A
Epochs:  75%|███████▌  | 9/12 [04:06<01:21, 27.31s/it]

Val Loss: 3.6481 - Val Accuracy: 0.9209



Training:   0%|          | 0/182 [00:00<?, ?it/s][A
Training:   1%|          | 1/182 [00:01<03:01,  1.00s/it][A
Training:   3%|▎         | 5/182 [00:01<00:47,  3.72it/s][A
Training:   5%|▍         | 9/182 [00:02<00:33,  5.13it/s][A
Training:   6%|▌         | 11/182 [00:02<00:26,  6.46it/s][A
Training:   7%|▋         | 13/182 [00:02<00:28,  5.96it/s][A
Training:   9%|▉         | 16/182 [00:02<00:19,  8.35it/s][A
Training:  10%|▉         | 18/182 [00:03<00:23,  6.94it/s][A
Training:  12%|█▏        | 21/182 [00:03<00:25,  6.36it/s][A
Training:  13%|█▎        | 24/182 [00:03<00:18,  8.48it/s][A
Training:  14%|█▍        | 26/182 [00:04<00:21,  7.41it/s][A
Training:  15%|█▌        | 28/182 [00:04<00:22,  6.96it/s][A
Training:  16%|█▌        | 29/182 [00:04<00:22,  6.70it/s][A
Training:  17%|█▋        | 31/182 [00:05<00:22,  6.84it/s][A
Training:  18%|█▊        | 33/182 [00:05<00:21,  7.08it/s][A
Training:  19%|█▉        | 35/182 [00:05<00:22,  6.62it/s][A
Training:  20%|██  

Epoch: 10/12 - Loss: 3.3026 - Accuracy: 0.9323



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:20,  1.05it/s][A
 17%|█▋        | 4/23 [00:01<00:04,  4.73it/s][A
 26%|██▌       | 6/23 [00:01<00:03,  5.09it/s][A
 35%|███▍      | 8/23 [00:01<00:02,  6.38it/s][A
 43%|████▎     | 10/23 [00:02<00:02,  5.84it/s][A
 48%|████▊     | 11/23 [00:02<00:02,  5.80it/s][A
 57%|█████▋    | 13/23 [00:02<00:01,  6.27it/s][A
 65%|██████▌   | 15/23 [00:02<00:01,  6.96it/s][A
 74%|███████▍  | 17/23 [00:02<00:00,  6.97it/s][A
 83%|████████▎ | 19/23 [00:03<00:00,  6.85it/s][A
100%|██████████| 23/23 [00:03<00:00,  6.29it/s][A
Epochs:  83%|████████▎ | 10/12 [04:34<00:54, 27.45s/it]

Val Loss: 3.3063 - Val Accuracy: 0.9407



Training:   0%|          | 0/182 [00:00<?, ?it/s][A
Training:   1%|          | 1/182 [00:00<02:47,  1.08it/s][A
Training:   2%|▏         | 3/182 [00:01<00:51,  3.49it/s][A
Training:   3%|▎         | 5/182 [00:01<00:40,  4.35it/s][A
Training:   3%|▎         | 6/182 [00:01<00:38,  4.63it/s][A
Training:   4%|▍         | 8/182 [00:01<00:25,  6.76it/s][A
Training:   5%|▌         | 10/182 [00:02<00:30,  5.72it/s][A
Training:   7%|▋         | 13/182 [00:02<00:22,  7.58it/s][A
Training:   8%|▊         | 14/182 [00:02<00:26,  6.43it/s][A
Training:   9%|▉         | 17/182 [00:02<00:19,  8.48it/s][A
Training:  10%|█         | 19/182 [00:03<00:19,  8.38it/s][A
Training:  12%|█▏        | 21/182 [00:03<00:18,  8.56it/s][A
Training:  12%|█▏        | 22/182 [00:03<00:22,  7.12it/s][A
Training:  13%|█▎        | 24/182 [00:03<00:18,  8.60it/s][A
Training:  14%|█▎        | 25/182 [00:03<00:21,  7.37it/s][A
Training:  14%|█▍        | 26/182 [00:04<00:21,  7.15it/s][A
Training:  15%|█▌    

Epoch: 11/12 - Loss: 3.1843 - Accuracy: 0.9350



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:17,  1.23it/s][A
  9%|▊         | 2/23 [00:00<00:08,  2.45it/s][A
 22%|██▏       | 5/23 [00:01<00:03,  5.05it/s][A
 26%|██▌       | 6/23 [00:01<00:03,  5.52it/s][A
 39%|███▉      | 9/23 [00:01<00:02,  6.41it/s][A
 48%|████▊     | 11/23 [00:01<00:01,  7.53it/s][A
 57%|█████▋    | 13/23 [00:02<00:01,  6.27it/s][A
 65%|██████▌   | 15/23 [00:02<00:01,  7.00it/s][A
 74%|███████▍  | 17/23 [00:02<00:00,  6.77it/s][A
 83%|████████▎ | 19/23 [00:03<00:00,  7.13it/s][A
 91%|█████████▏| 21/23 [00:03<00:00,  7.28it/s][A
100%|██████████| 23/23 [00:03<00:00,  6.26it/s][A
Epochs:  92%|█████████▏| 11/12 [05:01<00:27, 27.49s/it]

Val Loss: 4.0672 - Val Accuracy: 0.9209



Training:   0%|          | 0/182 [00:00<?, ?it/s][A
Training:   1%|          | 1/182 [00:00<02:55,  1.03it/s][A
Training:   2%|▏         | 3/182 [00:01<00:51,  3.45it/s][A
Training:   3%|▎         | 5/182 [00:01<00:44,  3.99it/s][A
Training:   4%|▍         | 8/182 [00:01<00:24,  7.13it/s][A
Training:   5%|▌         | 10/182 [00:02<00:26,  6.38it/s][A
Training:   7%|▋         | 13/182 [00:02<00:23,  7.05it/s][A
Training:   9%|▉         | 16/182 [00:02<00:17,  9.58it/s][A
Training:  10%|▉         | 18/182 [00:03<00:24,  6.73it/s][A
Training:  12%|█▏        | 21/182 [00:03<00:25,  6.20it/s][A
Training:  13%|█▎        | 23/182 [00:03<00:21,  7.47it/s][A
Training:  14%|█▎        | 25/182 [00:04<00:26,  5.98it/s][A
Training:  15%|█▌        | 28/182 [00:04<00:19,  7.79it/s][A
Training:  16%|█▋        | 30/182 [00:04<00:21,  6.94it/s][A
Training:  18%|█▊        | 33/182 [00:05<00:23,  6.30it/s][A
Training:  19%|█▉        | 35/182 [00:05<00:19,  7.61it/s][A
Training:  20%|██   

Epoch: 12/12 - Loss: 3.2701 - Accuracy: 0.9262



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:19,  1.13it/s][A
  9%|▊         | 2/23 [00:01<00:09,  2.28it/s][A
 17%|█▋        | 4/23 [00:01<00:03,  4.94it/s][A
 26%|██▌       | 6/23 [00:01<00:03,  5.54it/s][A
 35%|███▍      | 8/23 [00:01<00:02,  6.54it/s][A
 39%|███▉      | 9/23 [00:01<00:02,  6.38it/s][A
 43%|████▎     | 10/23 [00:01<00:01,  6.72it/s][A
 52%|█████▏    | 12/23 [00:02<00:01,  7.19it/s][A
 61%|██████    | 14/23 [00:02<00:01,  8.20it/s][A
 65%|██████▌   | 15/23 [00:02<00:01,  7.26it/s][A
 70%|██████▉   | 16/23 [00:02<00:00,  7.06it/s][A
 83%|████████▎ | 19/23 [00:03<00:00,  7.42it/s][A
 87%|████████▋ | 20/23 [00:03<00:00,  7.66it/s][A
100%|██████████| 23/23 [00:03<00:00,  6.28it/s][A
Epochs: 100%|██████████| 12/12 [05:28<00:00, 27.41s/it]


Val Loss: 3.6441 - Val Accuracy: 0.9331


[32m[I 2023-12-14 22:56:30,425][0m Trial 1 finished with value: 0.9330719709396362 and parameters: {'loss_learning_rate': 0.00015990828325747049, 'learning_rate': 0.005697946086593603, 'weight_decay': 0.0001473649085987928, 'epsilon': 4.963406823015153e-09, 'batch_size': 77, 'epochs': 12}. Best is trial 0 with value: 0.9373385310173035.[0m


Learning rate for Loss: 0.000515322161093277
Learning rate: 0.01295417626729335
Weight decay: 0.00010094083028756503
Epsilon: 3.4787628785215855e-08
Batch size: 111
Number of epochs: 33


Epochs:   0%|          | 0/33 [00:00<?, ?it/s]
Training:   0%|          | 0/126 [00:00<?, ?it/s][A
Training:   1%|          | 1/126 [00:01<02:15,  1.09s/it][A
Training:   2%|▏         | 3/126 [00:01<00:41,  2.96it/s][A
Training:   4%|▍         | 5/126 [00:01<00:36,  3.27it/s][A
Training:   6%|▋         | 8/126 [00:01<00:20,  5.77it/s][A
Training:   8%|▊         | 10/126 [00:02<00:23,  5.03it/s][A
Training:   9%|▊         | 11/126 [00:02<00:23,  4.86it/s][A
Training:  10%|█         | 13/126 [00:03<00:26,  4.25it/s][A
Training:  13%|█▎        | 16/126 [00:03<00:17,  6.36it/s][A
Training:  13%|█▎        | 17/126 [00:04<00:27,  3.91it/s][A
Training:  14%|█▍        | 18/126 [00:04<00:24,  4.43it/s][A
Training:  16%|█▌        | 20/126 [00:04<00:17,  5.89it/s][A
Training:  17%|█▋        | 21/126 [00:05<00:27,  3.81it/s][A
Training:  19%|█▉        | 24/126 [00:05<00:16,  6.25it/s][A
Training:  21%|██        | 26/126 [00:05<00:18,  5.37it/s][A
Training:  22%|██▏       | 28/126 [0

Epoch: 1/33 - Loss: 10.7777 - Accuracy: 0.8106



  0%|          | 0/16 [00:00<?, ?it/s][A
  6%|▋         | 1/16 [00:00<00:13,  1.12it/s][A
 12%|█▎        | 2/16 [00:01<00:06,  2.14it/s][A
 31%|███▏      | 5/16 [00:01<00:02,  3.83it/s][A
 38%|███▊      | 6/16 [00:01<00:02,  3.92it/s][A
 50%|█████     | 8/16 [00:01<00:01,  5.75it/s][A
 56%|█████▋    | 9/16 [00:02<00:01,  4.76it/s][A
 62%|██████▎   | 10/16 [00:02<00:01,  4.45it/s][A
 75%|███████▌  | 12/16 [00:02<00:00,  6.55it/s][A
100%|██████████| 16/16 [00:03<00:00,  4.76it/s][A
Epochs:   3%|▎         | 1/33 [00:26<14:13, 26.68s/it]

Val Loss: 4.5930 - Val Accuracy: 0.9097



Training:   0%|          | 0/126 [00:00<?, ?it/s][A
Training:   1%|          | 1/126 [00:01<02:10,  1.04s/it][A
Training:   2%|▏         | 3/126 [00:01<00:39,  3.09it/s][A
Training:   4%|▍         | 5/126 [00:01<00:33,  3.56it/s][A
Training:   5%|▍         | 6/126 [00:01<00:28,  4.26it/s][A
Training:   6%|▌         | 7/126 [00:01<00:23,  5.03it/s][A
Training:   7%|▋         | 9/126 [00:02<00:29,  3.97it/s][A
Training:   9%|▊         | 11/126 [00:02<00:22,  5.22it/s][A
Training:  10%|█         | 13/126 [00:03<00:24,  4.57it/s][A
Training:  12%|█▏        | 15/126 [00:03<00:21,  5.08it/s][A
Training:  13%|█▎        | 17/126 [00:03<00:22,  4.95it/s][A
Training:  15%|█▌        | 19/126 [00:04<00:21,  5.04it/s][A
Training:  17%|█▋        | 21/126 [00:04<00:18,  5.53it/s][A
Training:  18%|█▊        | 23/126 [00:05<00:19,  5.38it/s][A
Training:  20%|█▉        | 25/126 [00:05<00:19,  5.06it/s][A
Training:  21%|██▏       | 27/126 [00:05<00:18,  5.41it/s][A
Training:  23%|██▎    

Epoch: 2/33 - Loss: 5.2297 - Accuracy: 0.8958



  0%|          | 0/16 [00:00<?, ?it/s][A
  6%|▋         | 1/16 [00:00<00:13,  1.13it/s][A
 12%|█▎        | 2/16 [00:01<00:06,  2.03it/s][A
 31%|███▏      | 5/16 [00:01<00:02,  4.07it/s][A
 38%|███▊      | 6/16 [00:01<00:02,  3.95it/s][A
 56%|█████▋    | 9/16 [00:02<00:01,  4.92it/s][A
 62%|██████▎   | 10/16 [00:02<00:01,  4.18it/s][A
 81%|████████▏ | 13/16 [00:03<00:00,  5.16it/s][A
100%|██████████| 16/16 [00:03<00:00,  4.49it/s][A
Epochs:   6%|▌         | 2/33 [00:53<13:54, 26.91s/it]

Val Loss: 6.1992 - Val Accuracy: 0.8924



Training:   0%|          | 0/126 [00:00<?, ?it/s][A
Training:   1%|          | 1/126 [00:00<02:01,  1.03it/s][A
Training:   2%|▏         | 2/126 [00:01<01:04,  1.91it/s][A
Training:   4%|▍         | 5/126 [00:01<00:29,  4.07it/s][A
Training:   5%|▍         | 6/126 [00:01<00:30,  3.88it/s][A
Training:   6%|▌         | 7/126 [00:02<00:26,  4.52it/s][A
Training:   7%|▋         | 9/126 [00:02<00:22,  5.22it/s][A
Training:   8%|▊         | 10/126 [00:02<00:25,  4.47it/s][A
Training:  10%|█         | 13/126 [00:03<00:22,  4.98it/s][A
Training:  11%|█         | 14/126 [00:03<00:27,  4.12it/s][A
Training:  13%|█▎        | 16/126 [00:03<00:19,  5.68it/s][A
Training:  13%|█▎        | 17/126 [00:04<00:22,  4.80it/s][A
Training:  14%|█▍        | 18/126 [00:04<00:25,  4.32it/s][A
Training:  17%|█▋        | 21/126 [00:04<00:19,  5.41it/s][A
Training:  17%|█▋        | 22/126 [00:04<00:20,  5.15it/s][A
Training:  19%|█▉        | 24/126 [00:05<00:15,  6.78it/s][A
Training:  20%|█▉     

Epoch: 3/33 - Loss: 4.3175 - Accuracy: 0.9135



  0%|          | 0/16 [00:00<?, ?it/s][A
  6%|▋         | 1/16 [00:01<00:21,  1.41s/it][A
 19%|█▉        | 3/16 [00:01<00:05,  2.43it/s][A
 31%|███▏      | 5/16 [00:02<00:04,  2.75it/s][A
 44%|████▍     | 7/16 [00:02<00:02,  4.32it/s][A
 56%|█████▋    | 9/16 [00:03<00:02,  3.46it/s][A
100%|██████████| 16/16 [00:03<00:00,  4.02it/s][A
Epochs:   9%|▉         | 3/33 [01:22<13:50, 27.68s/it]

Val Loss: 3.8972 - Val Accuracy: 0.9320



Training:   0%|          | 0/126 [00:00<?, ?it/s][A
Training:   1%|          | 1/126 [00:01<02:23,  1.15s/it][A
Training:   2%|▏         | 2/126 [00:01<01:14,  1.66it/s][A
Training:   3%|▎         | 4/126 [00:01<00:33,  3.69it/s][A
Training:   4%|▍         | 5/126 [00:02<00:40,  2.98it/s][A
Training:   6%|▌         | 7/126 [00:02<00:25,  4.72it/s][A
Training:   7%|▋         | 9/126 [00:02<00:27,  4.23it/s][A
Training:   8%|▊         | 10/126 [00:02<00:24,  4.74it/s][A
Training:  10%|█         | 13/126 [00:03<00:22,  4.91it/s][A
Training:  11%|█         | 14/126 [00:03<00:21,  5.23it/s][A
Training:  12%|█▏        | 15/126 [00:03<00:21,  5.20it/s][A
Training:  13%|█▎        | 17/126 [00:04<00:23,  4.68it/s][A
Training:  15%|█▌        | 19/126 [00:04<00:19,  5.52it/s][A
Training:  17%|█▋        | 21/126 [00:05<00:22,  4.68it/s][A
Training:  18%|█▊        | 23/126 [00:05<00:20,  5.15it/s][A
Training:  20%|█▉        | 25/126 [00:05<00:22,  4.45it/s][A
Training:  21%|██▏    

Epoch: 4/33 - Loss: 4.1275 - Accuracy: 0.9144



  0%|          | 0/16 [00:00<?, ?it/s][A
  6%|▋         | 1/16 [00:01<00:21,  1.44s/it][A
 31%|███▏      | 5/16 [00:02<00:03,  2.80it/s][A
 50%|█████     | 8/16 [00:02<00:01,  4.85it/s][A
 62%|██████▎   | 10/16 [00:02<00:01,  4.23it/s][A
 75%|███████▌  | 12/16 [00:02<00:00,  5.59it/s][A
100%|██████████| 16/16 [00:03<00:00,  4.37it/s][A
Epochs:  12%|█▏        | 4/33 [01:50<13:29, 27.90s/it]

Val Loss: 5.0806 - Val Accuracy: 0.9196



Training:   0%|          | 0/126 [00:00<?, ?it/s][A
Training:   1%|          | 1/126 [00:01<02:22,  1.14s/it][A
Training:   2%|▏         | 2/126 [00:01<01:07,  1.84it/s][A
Training:   3%|▎         | 4/126 [00:01<00:29,  4.16it/s][A
Training:   5%|▍         | 6/126 [00:02<00:34,  3.43it/s][A
Training:   6%|▋         | 8/126 [00:02<00:23,  4.96it/s][A
Training:   8%|▊         | 10/126 [00:02<00:31,  3.71it/s][A
Training:  10%|█         | 13/126 [00:03<00:27,  4.08it/s][A
Training:  13%|█▎        | 16/126 [00:03<00:18,  5.92it/s][A
Training:  14%|█▍        | 18/126 [00:04<00:24,  4.46it/s][A
Training:  16%|█▌        | 20/126 [00:04<00:19,  5.50it/s][A
Training:  17%|█▋        | 22/126 [00:05<00:24,  4.29it/s][A
Training:  19%|█▉        | 24/126 [00:05<00:18,  5.47it/s][A
Training:  21%|██        | 26/126 [00:06<00:24,  4.14it/s][A
Training:  22%|██▏       | 28/126 [00:06<00:18,  5.34it/s][A
Training:  24%|██▍       | 30/126 [00:07<00:22,  4.23it/s][A
Training:  25%|██▌   

Epoch: 5/33 - Loss: 3.8889 - Accuracy: 0.9174



  0%|          | 0/16 [00:00<?, ?it/s][A
  6%|▋         | 1/16 [00:01<00:21,  1.40s/it][A
 19%|█▉        | 3/16 [00:01<00:05,  2.48it/s][A
 31%|███▏      | 5/16 [00:02<00:03,  2.87it/s][A
 44%|████▍     | 7/16 [00:02<00:02,  4.45it/s][A
 56%|█████▋    | 9/16 [00:02<00:01,  3.82it/s][A
 69%|██████▉   | 11/16 [00:02<00:00,  5.30it/s][A
 81%|████████▏ | 13/16 [00:03<00:00,  4.19it/s][A
100%|██████████| 16/16 [00:03<00:00,  4.07it/s][A
Epochs:  15%|█▌        | 5/33 [02:18<13:04, 28.01s/it]

Val Loss: 3.8946 - Val Accuracy: 0.8979



Training:   0%|          | 0/126 [00:00<?, ?it/s][A
Training:   1%|          | 1/126 [00:01<02:33,  1.23s/it][A
Training:   2%|▏         | 3/126 [00:01<00:44,  2.74it/s][A
Training:   4%|▍         | 5/126 [00:01<00:40,  2.97it/s][A
Training:   7%|▋         | 9/126 [00:02<00:31,  3.77it/s][A
Training:  10%|▉         | 12/126 [00:02<00:19,  5.71it/s][A
Training:  11%|█         | 14/126 [00:03<00:26,  4.25it/s][A
Training:  13%|█▎        | 16/126 [00:03<00:20,  5.41it/s][A
Training:  14%|█▍        | 18/126 [00:04<00:27,  3.99it/s][A
Training:  16%|█▌        | 20/126 [00:04<00:20,  5.16it/s][A
Training:  17%|█▋        | 22/126 [00:05<00:23,  4.47it/s][A
Training:  20%|█▉        | 25/126 [00:06<00:22,  4.55it/s][A
Training:  21%|██▏       | 27/126 [00:06<00:17,  5.55it/s][A
Training:  23%|██▎       | 29/126 [00:06<00:18,  5.27it/s][A
Training:  25%|██▌       | 32/126 [00:06<00:14,  6.27it/s][A
Training:  26%|██▌       | 33/126 [00:07<00:17,  5.37it/s][A
Training:  27%|██▋  

Epoch: 6/33 - Loss: 3.6587 - Accuracy: 0.9231



  0%|          | 0/16 [00:00<?, ?it/s][A
  6%|▋         | 1/16 [00:01<00:19,  1.28s/it][A
 31%|███▏      | 5/16 [00:02<00:03,  2.86it/s][A
 44%|████▍     | 7/16 [00:02<00:02,  4.09it/s][A
 56%|█████▋    | 9/16 [00:02<00:01,  3.79it/s][A
 75%|███████▌  | 12/16 [00:02<00:00,  5.95it/s][A
100%|██████████| 16/16 [00:03<00:00,  4.32it/s][A
Epochs:  18%|█▊        | 6/33 [02:47<12:42, 28.26s/it]

Val Loss: 3.7748 - Val Accuracy: 0.9321



Training:   0%|          | 0/126 [00:00<?, ?it/s][A
Training:   1%|          | 1/126 [00:01<02:36,  1.25s/it][A
Training:   2%|▏         | 3/126 [00:01<00:45,  2.70it/s][A
Training:   4%|▍         | 5/126 [00:01<00:39,  3.04it/s][A
Training:   6%|▌         | 7/126 [00:02<00:25,  4.64it/s][A
Training:   7%|▋         | 9/126 [00:02<00:28,  4.08it/s][A
Training:  10%|▉         | 12/126 [00:02<00:18,  6.31it/s][A
Training:  11%|█         | 14/126 [00:03<00:22,  5.09it/s][A
Training:  13%|█▎        | 16/126 [00:03<00:17,  6.43it/s][A
Training:  14%|█▍        | 18/126 [00:04<00:24,  4.33it/s][A
Training:  17%|█▋        | 21/126 [00:05<00:25,  4.16it/s][A
Training:  18%|█▊        | 23/126 [00:05<00:19,  5.15it/s][A
Training:  20%|█▉        | 25/126 [00:05<00:20,  4.93it/s][A
Training:  22%|██▏       | 28/126 [00:05<00:13,  7.16it/s][A
Training:  24%|██▍       | 30/126 [00:06<00:16,  5.67it/s][A
Training:  26%|██▌       | 33/126 [00:06<00:17,  5.31it/s][A
Training:  29%|██▊   

Epoch: 7/33 - Loss: 3.6192 - Accuracy: 0.9242



  0%|          | 0/16 [00:00<?, ?it/s][A
  6%|▋         | 1/16 [00:01<00:17,  1.15s/it][A
 31%|███▏      | 5/16 [00:01<00:03,  3.28it/s][A
 50%|█████     | 8/16 [00:01<00:01,  5.55it/s][A
 62%|██████▎   | 10/16 [00:02<00:01,  4.30it/s][A
 81%|████████▏ | 13/16 [00:03<00:00,  4.46it/s][A
100%|██████████| 16/16 [00:03<00:00,  4.59it/s][A
Epochs:  21%|██        | 7/33 [03:14<12:05, 27.91s/it]

Val Loss: 3.7049 - Val Accuracy: 0.9312



Training:   0%|          | 0/126 [00:00<?, ?it/s][A
Training:   1%|          | 1/126 [00:01<02:40,  1.28s/it][A
Training:   2%|▏         | 2/126 [00:01<01:12,  1.71it/s][A
Training:   3%|▎         | 4/126 [00:01<00:31,  3.91it/s][A
Training:   5%|▍         | 6/126 [00:02<00:30,  3.94it/s][A
Training:   6%|▋         | 8/126 [00:02<00:20,  5.79it/s][A
Training:   8%|▊         | 10/126 [00:02<00:24,  4.69it/s][A
Training:  10%|█         | 13/126 [00:03<00:24,  4.59it/s][A
Training:  13%|█▎        | 17/126 [00:04<00:22,  4.76it/s][A
Training:  14%|█▍        | 18/126 [00:04<00:21,  5.02it/s][A
Training:  16%|█▌        | 20/126 [00:04<00:17,  6.19it/s][A
Training:  17%|█▋        | 21/126 [00:04<00:20,  5.11it/s][A
Training:  17%|█▋        | 22/126 [00:05<00:22,  4.62it/s][A
Training:  18%|█▊        | 23/126 [00:05<00:19,  5.22it/s][A
Training:  20%|█▉        | 25/126 [00:05<00:17,  5.74it/s][A
Training:  21%|██        | 26/126 [00:05<00:20,  4.90it/s][A
Training:  23%|██▎   

Epoch: 8/33 - Loss: 3.3971 - Accuracy: 0.9291



  0%|          | 0/16 [00:00<?, ?it/s][A
  6%|▋         | 1/16 [00:01<00:17,  1.18s/it][A
 25%|██▌       | 4/16 [00:01<00:03,  3.80it/s][A
 38%|███▊      | 6/16 [00:01<00:02,  3.42it/s][A
 50%|█████     | 8/16 [00:02<00:01,  4.98it/s][A
 62%|██████▎   | 10/16 [00:02<00:01,  4.07it/s][A
100%|██████████| 16/16 [00:03<00:00,  4.41it/s][A
Epochs:  24%|██▍       | 8/33 [03:41<11:28, 27.52s/it]

Val Loss: 3.5809 - Val Accuracy: 0.9257



Training:   0%|          | 0/126 [00:00<?, ?it/s][A
Training:   1%|          | 1/126 [00:01<02:17,  1.10s/it][A
Training:   2%|▏         | 3/126 [00:01<00:43,  2.84it/s][A
Training:   4%|▍         | 5/126 [00:01<00:37,  3.20it/s][A
Training:   5%|▍         | 6/126 [00:02<00:32,  3.67it/s][A
Training:   6%|▋         | 8/126 [00:02<00:21,  5.44it/s][A
Training:   7%|▋         | 9/126 [00:02<00:28,  4.05it/s][A
Training:   8%|▊         | 10/126 [00:02<00:25,  4.46it/s][A
Training:  10%|▉         | 12/126 [00:02<00:17,  6.47it/s][A
Training:  10%|█         | 13/126 [00:03<00:25,  4.42it/s][A
Training:  11%|█         | 14/126 [00:03<00:23,  4.82it/s][A
Training:  13%|█▎        | 16/126 [00:03<00:15,  7.00it/s][A
Training:  14%|█▍        | 18/126 [00:04<00:22,  4.81it/s][A
Training:  16%|█▌        | 20/126 [00:04<00:16,  6.29it/s][A
Training:  17%|█▋        | 22/126 [00:04<00:21,  4.74it/s][A
Training:  20%|█▉        | 25/126 [00:05<00:17,  5.65it/s][A
Training:  21%|██     

Epoch: 9/33 - Loss: 3.4265 - Accuracy: 0.9271



  0%|          | 0/16 [00:00<?, ?it/s][A
  6%|▋         | 1/16 [00:01<00:19,  1.29s/it][A
 12%|█▎        | 2/16 [00:01<00:09,  1.54it/s][A
 19%|█▉        | 3/16 [00:01<00:05,  2.34it/s][A
 31%|███▏      | 5/16 [00:02<00:03,  3.26it/s][A
 38%|███▊      | 6/16 [00:02<00:02,  3.99it/s][A
 44%|████▍     | 7/16 [00:02<00:02,  4.05it/s][A
 56%|█████▋    | 9/16 [00:02<00:01,  4.69it/s][A
 62%|██████▎   | 10/16 [00:02<00:01,  5.14it/s][A
 69%|██████▉   | 11/16 [00:03<00:01,  4.35it/s][A
 81%|████████▏ | 13/16 [00:03<00:00,  5.47it/s][A
100%|██████████| 16/16 [00:04<00:00,  3.99it/s][A
Epochs:  27%|██▋       | 9/33 [04:08<10:55, 27.30s/it]

Val Loss: 3.6052 - Val Accuracy: 0.9266



Training:   0%|          | 0/126 [00:00<?, ?it/s][A
Training:   1%|          | 1/126 [00:01<02:04,  1.01it/s][A
Training:   2%|▏         | 2/126 [00:01<01:00,  2.04it/s][A
Training:   3%|▎         | 4/126 [00:01<00:27,  4.43it/s][A
Training:   4%|▍         | 5/126 [00:01<00:37,  3.21it/s][A
Training:   6%|▋         | 8/126 [00:01<00:19,  6.15it/s][A
Training:   8%|▊         | 10/126 [00:02<00:26,  4.39it/s][A
Training:  10%|█         | 13/126 [00:03<00:26,  4.32it/s][A
Training:  12%|█▏        | 15/126 [00:03<00:20,  5.42it/s][A
Training:  13%|█▎        | 17/126 [00:03<00:21,  5.07it/s][A
Training:  15%|█▌        | 19/126 [00:04<00:17,  6.24it/s][A
Training:  16%|█▌        | 20/126 [00:04<00:16,  6.44it/s][A
Training:  17%|█▋        | 21/126 [00:04<00:23,  4.48it/s][A
Training:  18%|█▊        | 23/126 [00:04<00:18,  5.48it/s][A
Training:  20%|█▉        | 25/126 [00:05<00:22,  4.40it/s][A
Training:  21%|██▏       | 27/126 [00:05<00:17,  5.56it/s][A
Training:  23%|██▎   

Epoch: 10/33 - Loss: 3.4614 - Accuracy: 0.9247



  0%|          | 0/16 [00:00<?, ?it/s][A
  6%|▋         | 1/16 [00:01<00:18,  1.25s/it][A
 31%|███▏      | 5/16 [00:01<00:03,  3.11it/s][A
 38%|███▊      | 6/16 [00:02<00:02,  3.64it/s][A
 50%|█████     | 8/16 [00:02<00:01,  5.39it/s][A
 62%|██████▎   | 10/16 [00:02<00:01,  4.42it/s][A
 81%|████████▏ | 13/16 [00:03<00:00,  4.57it/s][A
100%|██████████| 16/16 [00:03<00:00,  4.46it/s][A
Epochs:  30%|███       | 10/33 [04:35<10:30, 27.42s/it]

Val Loss: 8.8320 - Val Accuracy: 0.9159



Training:   0%|          | 0/126 [00:00<?, ?it/s][A
Training:   1%|          | 1/126 [00:01<02:42,  1.30s/it][A
Training:   2%|▏         | 3/126 [00:01<00:47,  2.59it/s][A
Training:   4%|▍         | 5/126 [00:01<00:38,  3.15it/s][A
Training:   6%|▌         | 7/126 [00:02<00:26,  4.47it/s][A
Training:   6%|▋         | 8/126 [00:02<00:24,  4.85it/s][A
Training:   7%|▋         | 9/126 [00:02<00:29,  3.94it/s][A
Training:   9%|▊         | 11/126 [00:02<00:20,  5.64it/s][A
Training:  10%|▉         | 12/126 [00:02<00:19,  5.87it/s][A
Training:  10%|█         | 13/126 [00:03<00:26,  4.27it/s][A
Training:  12%|█▏        | 15/126 [00:03<00:18,  5.94it/s][A
Training:  13%|█▎        | 16/126 [00:03<00:19,  5.79it/s][A
Training:  13%|█▎        | 17/126 [00:04<00:26,  4.15it/s][A
Training:  15%|█▌        | 19/126 [00:04<00:18,  5.72it/s][A
Training:  17%|█▋        | 21/126 [00:05<00:24,  4.20it/s][A
Training:  18%|█▊        | 23/126 [00:05<00:18,  5.65it/s][A
Training:  20%|█▉     

Epoch: 11/33 - Loss: 4.0274 - Accuracy: 0.9231



  0%|          | 0/16 [00:00<?, ?it/s][A
  6%|▋         | 1/16 [00:01<00:16,  1.11s/it][A
 19%|█▉        | 3/16 [00:01<00:04,  2.89it/s][A
 31%|███▏      | 5/16 [00:01<00:03,  3.24it/s][A
 44%|████▍     | 7/16 [00:02<00:01,  4.59it/s][A
 56%|█████▋    | 9/16 [00:02<00:01,  4.23it/s][A
 62%|██████▎   | 10/16 [00:02<00:01,  4.61it/s][A
 81%|████████▏ | 13/16 [00:03<00:00,  4.84it/s][A
100%|██████████| 16/16 [00:03<00:00,  4.45it/s][A
Epochs:  33%|███▎      | 11/33 [05:02<09:58, 27.20s/it]

Val Loss: 4.0563 - Val Accuracy: 0.9323



Training:   0%|          | 0/126 [00:00<?, ?it/s][A
Training:   1%|          | 1/126 [00:01<02:35,  1.24s/it][A
Training:   2%|▏         | 3/126 [00:01<00:45,  2.69it/s][A
Training:   4%|▍         | 5/126 [00:01<00:40,  3.02it/s][A
Training:   6%|▌         | 7/126 [00:02<00:25,  4.63it/s][A
Training:   7%|▋         | 9/126 [00:02<00:29,  4.02it/s][A
Training:  10%|▉         | 12/126 [00:02<00:18,  6.32it/s][A
Training:  11%|█         | 14/126 [00:03<00:25,  4.45it/s][A
Training:  13%|█▎        | 16/126 [00:03<00:19,  5.60it/s][A
Training:  14%|█▍        | 18/126 [00:04<00:26,  4.10it/s][A
Training:  16%|█▌        | 20/126 [00:04<00:19,  5.35it/s][A
Training:  17%|█▋        | 22/126 [00:05<00:23,  4.46it/s][A
Training:  19%|█▉        | 24/126 [00:05<00:17,  5.71it/s][A
Training:  21%|██        | 26/126 [00:06<00:24,  4.09it/s][A
Training:  22%|██▏       | 28/126 [00:06<00:19,  5.14it/s][A
Training:  23%|██▎       | 29/126 [00:06<00:24,  4.01it/s][A
Training:  25%|██▍   

Epoch: 12/33 - Loss: 4.6011 - Accuracy: 0.9243



  0%|          | 0/16 [00:00<?, ?it/s][A
  6%|▋         | 1/16 [00:01<00:20,  1.34s/it][A
 19%|█▉        | 3/16 [00:01<00:05,  2.58it/s][A
 31%|███▏      | 5/16 [00:02<00:03,  3.00it/s][A
 56%|█████▋    | 9/16 [00:02<00:01,  3.78it/s][A
 75%|███████▌  | 12/16 [00:03<00:00,  5.55it/s][A
100%|██████████| 16/16 [00:03<00:00,  4.29it/s][A
Epochs:  36%|███▋      | 12/33 [05:30<09:33, 27.29s/it]

Val Loss: 3.6201 - Val Accuracy: 0.8830



Training:   0%|          | 0/126 [00:00<?, ?it/s][A
Training:   1%|          | 1/126 [00:01<02:26,  1.18s/it][A
Training:   2%|▏         | 3/126 [00:01<00:43,  2.84it/s][A
Training:   4%|▍         | 5/126 [00:01<00:41,  2.91it/s][A
Training:   6%|▌         | 7/126 [00:02<00:26,  4.50it/s][A
Training:   7%|▋         | 9/126 [00:02<00:29,  3.92it/s][A
Training:   9%|▊         | 11/126 [00:02<00:21,  5.34it/s][A
Training:  10%|█         | 13/126 [00:03<00:25,  4.41it/s][A
Training:  12%|█▏        | 15/126 [00:03<00:18,  5.88it/s][A
Training:  13%|█▎        | 17/126 [00:04<00:23,  4.73it/s][A
Training:  17%|█▋        | 21/126 [00:04<00:19,  5.28it/s][A
Training:  18%|█▊        | 23/126 [00:04<00:16,  6.42it/s][A
Training:  20%|█▉        | 25/126 [00:05<00:21,  4.71it/s][A
Training:  22%|██▏       | 28/126 [00:05<00:14,  6.64it/s][A
Training:  24%|██▍       | 30/126 [00:06<00:19,  4.99it/s][A
Training:  25%|██▌       | 32/126 [00:06<00:15,  6.17it/s][A
Training:  27%|██▋   

Epoch: 13/33 - Loss: 3.2360 - Accuracy: 0.9298



  0%|          | 0/16 [00:00<?, ?it/s][A
  6%|▋         | 1/16 [00:01<00:17,  1.15s/it][A
 19%|█▉        | 3/16 [00:01<00:04,  2.85it/s][A
 25%|██▌       | 4/16 [00:01<00:03,  3.77it/s][A
 31%|███▏      | 5/16 [00:01<00:03,  3.14it/s][A
 50%|█████     | 8/16 [00:02<00:01,  5.03it/s][A
 56%|█████▋    | 9/16 [00:02<00:01,  3.90it/s][A
 69%|██████▉   | 11/16 [00:02<00:00,  5.63it/s][A
 81%|████████▏ | 13/16 [00:03<00:00,  4.51it/s][A
100%|██████████| 16/16 [00:03<00:00,  4.26it/s][A
Epochs:  39%|███▉      | 13/33 [05:57<09:04, 27.22s/it]

Val Loss: 3.3879 - Val Accuracy: 0.9356



Training:   0%|          | 0/126 [00:00<?, ?it/s][A
Training:   1%|          | 1/126 [00:01<02:09,  1.04s/it][A
Training:   2%|▏         | 2/126 [00:01<01:02,  1.98it/s][A
Training:   3%|▎         | 4/126 [00:01<00:27,  4.37it/s][A
Training:   4%|▍         | 5/126 [00:01<00:34,  3.53it/s][A
Training:   6%|▌         | 7/126 [00:01<00:24,  4.94it/s][A
Training:   7%|▋         | 9/126 [00:02<00:25,  4.66it/s][A
Training:   8%|▊         | 10/126 [00:02<00:23,  4.94it/s][A
Training:  10%|▉         | 12/126 [00:02<00:17,  6.39it/s][A
Training:  10%|█         | 13/126 [00:03<00:27,  4.18it/s][A
Training:  12%|█▏        | 15/126 [00:03<00:19,  5.75it/s][A
Training:  13%|█▎        | 17/126 [00:03<00:21,  5.08it/s][A
Training:  15%|█▌        | 19/126 [00:03<00:16,  6.68it/s][A
Training:  17%|█▋        | 21/126 [00:04<00:21,  4.99it/s][A
Training:  19%|█▉        | 24/126 [00:04<00:13,  7.53it/s][A
Training:  21%|██        | 26/126 [00:05<00:18,  5.31it/s][A
Training:  22%|██▏    

Epoch: 14/33 - Loss: 3.5865 - Accuracy: 0.9242



  0%|          | 0/16 [00:00<?, ?it/s][A
  6%|▋         | 1/16 [00:01<00:16,  1.12s/it][A
 31%|███▏      | 5/16 [00:01<00:03,  3.42it/s][A
 50%|█████     | 8/16 [00:01<00:01,  5.75it/s][A
 62%|██████▎   | 10/16 [00:02<00:01,  4.75it/s][A
 75%|███████▌  | 12/16 [00:02<00:00,  6.02it/s][A
100%|██████████| 16/16 [00:03<00:00,  4.69it/s][A
Epochs:  42%|████▏     | 14/33 [06:23<08:34, 27.05s/it]

Val Loss: 3.4300 - Val Accuracy: 0.9263



Training:   0%|          | 0/126 [00:00<?, ?it/s][A
Training:   1%|          | 1/126 [00:01<02:17,  1.10s/it][A
Training:   2%|▏         | 2/126 [00:01<01:09,  1.77it/s][A
Training:   3%|▎         | 4/126 [00:01<00:30,  4.05it/s][A
Training:   4%|▍         | 5/126 [00:01<00:32,  3.77it/s][A
Training:   5%|▍         | 6/126 [00:01<00:29,  4.03it/s][A
Training:   7%|▋         | 9/126 [00:02<00:23,  4.94it/s][A
Training:   8%|▊         | 10/126 [00:02<00:22,  5.25it/s][A
Training:  10%|▉         | 12/126 [00:02<00:17,  6.57it/s][A
Training:  10%|█         | 13/126 [00:03<00:23,  4.86it/s][A
Training:  11%|█         | 14/126 [00:03<00:24,  4.65it/s][A
Training:  13%|█▎        | 16/126 [00:03<00:17,  6.33it/s][A
Training:  13%|█▎        | 17/126 [00:03<00:21,  4.97it/s][A
Training:  14%|█▍        | 18/126 [00:04<00:19,  5.65it/s][A
Training:  16%|█▌        | 20/126 [00:04<00:19,  5.36it/s][A
Training:  17%|█▋        | 21/126 [00:04<00:22,  4.61it/s][A
Training:  18%|█▊     

Epoch: 15/33 - Loss: 3.3032 - Accuracy: 0.9263



  0%|          | 0/16 [00:00<?, ?it/s][A
  6%|▋         | 1/16 [00:01<00:15,  1.01s/it][A
 19%|█▉        | 3/16 [00:01<00:03,  3.32it/s][A
 31%|███▏      | 5/16 [00:01<00:03,  3.48it/s][A
 38%|███▊      | 6/16 [00:01<00:02,  3.94it/s][A
 50%|█████     | 8/16 [00:01<00:01,  6.02it/s][A
 62%|██████▎   | 10/16 [00:02<00:01,  4.62it/s][A
 75%|███████▌  | 12/16 [00:02<00:00,  6.01it/s][A
 88%|████████▊ | 14/16 [00:03<00:00,  4.95it/s][A
100%|██████████| 16/16 [00:03<00:00,  4.51it/s][A
Epochs:  45%|████▌     | 15/33 [06:51<08:09, 27.20s/it]

Val Loss: 3.7079 - Val Accuracy: 0.8621



Training:   0%|          | 0/126 [00:00<?, ?it/s][A
Training:   1%|          | 1/126 [00:01<02:22,  1.14s/it][A
Training:   2%|▏         | 2/126 [00:01<01:05,  1.88it/s][A
Training:   4%|▍         | 5/126 [00:01<00:35,  3.43it/s][A
Training:   5%|▍         | 6/126 [00:01<00:29,  4.09it/s][A
Training:   7%|▋         | 9/126 [00:02<00:23,  4.91it/s][A
Training:   8%|▊         | 10/126 [00:02<00:22,  5.08it/s][A
Training:  10%|▉         | 12/126 [00:02<00:17,  6.58it/s][A
Training:  10%|█         | 13/126 [00:03<00:25,  4.49it/s][A
Training:  11%|█         | 14/126 [00:03<00:23,  4.78it/s][A
Training:  13%|█▎        | 16/126 [00:03<00:17,  6.41it/s][A
Training:  13%|█▎        | 17/126 [00:04<00:26,  4.09it/s][A
Training:  15%|█▌        | 19/126 [00:04<00:19,  5.53it/s][A
Training:  17%|█▋        | 21/126 [00:04<00:23,  4.49it/s][A
Training:  18%|█▊        | 23/126 [00:04<00:17,  6.04it/s][A
Training:  20%|█▉        | 25/126 [00:05<00:22,  4.55it/s][A
Training:  21%|██▏   

Epoch: 16/33 - Loss: 3.1219 - Accuracy: 0.9307



  0%|          | 0/16 [00:00<?, ?it/s][A
  6%|▋         | 1/16 [00:01<00:18,  1.25s/it][A
 25%|██▌       | 4/16 [00:01<00:03,  3.45it/s][A
 31%|███▏      | 5/16 [00:01<00:03,  2.89it/s][A
 44%|████▍     | 7/16 [00:02<00:01,  4.61it/s][A
 56%|█████▋    | 9/16 [00:02<00:01,  3.79it/s][A
 69%|██████▉   | 11/16 [00:02<00:00,  5.20it/s][A
100%|██████████| 16/16 [00:03<00:00,  4.47it/s][A
Epochs:  48%|████▊     | 16/33 [07:18<07:41, 27.13s/it]

Val Loss: 3.5751 - Val Accuracy: 0.9365



Training:   0%|          | 0/126 [00:00<?, ?it/s][A
Training:   1%|          | 1/126 [00:01<02:37,  1.26s/it][A
Training:   2%|▏         | 3/126 [00:01<00:49,  2.49it/s][A
Training:   4%|▍         | 5/126 [00:02<00:41,  2.92it/s][A
Training:   6%|▋         | 8/126 [00:02<00:22,  5.24it/s][A
Training:   8%|▊         | 10/126 [00:02<00:24,  4.65it/s][A
Training:  10%|▉         | 12/126 [00:02<00:18,  6.05it/s][A
Training:  11%|█         | 14/126 [00:03<00:25,  4.36it/s][A
Training:  13%|█▎        | 17/126 [00:04<00:24,  4.48it/s][A
Training:  15%|█▌        | 19/126 [00:04<00:19,  5.44it/s][A
Training:  17%|█▋        | 21/126 [00:05<00:24,  4.28it/s][A
Training:  17%|█▋        | 22/126 [00:05<00:22,  4.67it/s][A
Training:  19%|█▉        | 24/126 [00:05<00:16,  6.07it/s][A
Training:  21%|██        | 26/126 [00:06<00:23,  4.26it/s][A
Training:  22%|██▏       | 28/126 [00:06<00:17,  5.58it/s][A
Training:  24%|██▍       | 30/126 [00:06<00:22,  4.30it/s][A
Training:  26%|██▌  

Epoch: 17/33 - Loss: 3.3038 - Accuracy: 0.9276



  0%|          | 0/16 [00:00<?, ?it/s][A
  6%|▋         | 1/16 [00:01<00:16,  1.12s/it][A
 12%|█▎        | 2/16 [00:01<00:07,  1.87it/s][A
 31%|███▏      | 5/16 [00:01<00:03,  3.62it/s][A
 38%|███▊      | 6/16 [00:02<00:02,  3.63it/s][A
 56%|█████▋    | 9/16 [00:02<00:01,  4.97it/s][A
 62%|██████▎   | 10/16 [00:02<00:01,  4.02it/s][A
 81%|████████▏ | 13/16 [00:03<00:00,  5.62it/s][A
100%|██████████| 16/16 [00:03<00:00,  4.28it/s][A
Epochs:  52%|█████▏    | 17/33 [07:45<07:15, 27.19s/it]

Val Loss: 3.4576 - Val Accuracy: 0.9354



Training:   0%|          | 0/126 [00:00<?, ?it/s][A
Training:   1%|          | 1/126 [00:01<02:27,  1.18s/it][A
Training:   2%|▏         | 3/126 [00:01<00:42,  2.88it/s][A
Training:   4%|▍         | 5/126 [00:01<00:41,  2.93it/s][A
Training:   6%|▋         | 8/126 [00:02<00:22,  5.28it/s][A
Training:   8%|▊         | 10/126 [00:02<00:28,  4.02it/s][A
Training:  10%|▉         | 12/126 [00:02<00:21,  5.36it/s][A
Training:  11%|█         | 14/126 [00:03<00:25,  4.42it/s][A
Training:  13%|█▎        | 16/126 [00:03<00:19,  5.63it/s][A
Training:  14%|█▍        | 18/126 [00:04<00:24,  4.48it/s][A
Training:  17%|█▋        | 21/126 [00:04<00:20,  5.12it/s][A
Training:  18%|█▊        | 23/126 [00:04<00:16,  6.13it/s][A
Training:  20%|█▉        | 25/126 [00:05<00:18,  5.33it/s][A
Training:  21%|██        | 26/126 [00:05<00:17,  5.76it/s][A
Training:  22%|██▏       | 28/126 [00:05<00:13,  7.24it/s][A
Training:  24%|██▍       | 30/126 [00:06<00:17,  5.52it/s][A
Training:  26%|██▌  

Epoch: 18/33 - Loss: 3.1875 - Accuracy: 0.9278



  0%|          | 0/16 [00:00<?, ?it/s][A
  6%|▋         | 1/16 [00:01<00:15,  1.04s/it][A
 19%|█▉        | 3/16 [00:01<00:04,  3.19it/s][A
 31%|███▏      | 5/16 [00:01<00:03,  3.13it/s][A
 44%|████▍     | 7/16 [00:02<00:01,  4.55it/s][A
 56%|█████▋    | 9/16 [00:02<00:01,  4.05it/s][A
 75%|███████▌  | 12/16 [00:02<00:00,  6.29it/s][A
100%|██████████| 16/16 [00:03<00:00,  4.71it/s][A
Epochs:  55%|█████▍    | 18/33 [08:12<06:44, 26.95s/it]

Val Loss: 3.5022 - Val Accuracy: 0.9352



Training:   0%|          | 0/126 [00:00<?, ?it/s][A
Training:   1%|          | 1/126 [00:01<02:17,  1.10s/it][A
Training:   4%|▍         | 5/126 [00:01<00:37,  3.20it/s][A
Training:   6%|▋         | 8/126 [00:01<00:21,  5.57it/s][A
Training:   8%|▊         | 10/126 [00:02<00:29,  3.96it/s][A
Training:  10%|▉         | 12/126 [00:02<00:21,  5.19it/s][A
Training:  11%|█         | 14/126 [00:03<00:25,  4.42it/s][A
Training:  13%|█▎        | 17/126 [00:04<00:24,  4.52it/s][A
Training:  15%|█▌        | 19/126 [00:04<00:19,  5.63it/s][A
Training:  17%|█▋        | 21/126 [00:04<00:22,  4.68it/s][A
Training:  17%|█▋        | 22/126 [00:04<00:20,  5.13it/s][A
Training:  19%|█▉        | 24/126 [00:05<00:15,  6.69it/s][A
Training:  21%|██        | 26/126 [00:05<00:19,  5.04it/s][A
Training:  22%|██▏       | 28/126 [00:05<00:15,  6.46it/s][A
Training:  24%|██▍       | 30/126 [00:06<00:19,  5.02it/s][A
Training:  25%|██▌       | 32/126 [00:06<00:15,  6.22it/s][A
Training:  27%|██▋ 

Epoch: 19/33 - Loss: 3.3561 - Accuracy: 0.9233



  0%|          | 0/16 [00:00<?, ?it/s][A
  6%|▋         | 1/16 [00:01<00:16,  1.11s/it][A
 25%|██▌       | 4/16 [00:01<00:02,  4.20it/s][A
 38%|███▊      | 6/16 [00:01<00:02,  3.55it/s][A
 56%|█████▋    | 9/16 [00:02<00:01,  3.99it/s][A
100%|██████████| 16/16 [00:03<00:00,  4.72it/s][A
Epochs:  58%|█████▊    | 19/33 [08:39<06:18, 27.04s/it]

Val Loss: 3.5068 - Val Accuracy: 0.9434



Training:   0%|          | 0/126 [00:00<?, ?it/s][A
Training:   1%|          | 1/126 [00:01<02:42,  1.30s/it][A
Training:   3%|▎         | 4/126 [00:01<00:35,  3.46it/s][A
Training:   5%|▍         | 6/126 [00:02<00:38,  3.16it/s][A
Training:   7%|▋         | 9/126 [00:02<00:25,  4.55it/s][A
Training:   8%|▊         | 10/126 [00:02<00:28,  4.07it/s][A
Training:  10%|█         | 13/126 [00:03<00:22,  5.11it/s][A
Training:  11%|█         | 14/126 [00:03<00:22,  4.99it/s][A
Training:  13%|█▎        | 16/126 [00:03<00:17,  6.35it/s][A
Training:  13%|█▎        | 17/126 [00:04<00:25,  4.33it/s][A
Training:  14%|█▍        | 18/126 [00:04<00:23,  4.51it/s][A
Training:  16%|█▌        | 20/126 [00:04<00:17,  6.06it/s][A
Training:  17%|█▋        | 21/126 [00:04<00:21,  4.85it/s][A
Training:  17%|█▋        | 22/126 [00:05<00:23,  4.34it/s][A
Training:  19%|█▉        | 24/126 [00:05<00:16,  6.29it/s][A
Training:  20%|█▉        | 25/126 [00:05<00:20,  4.99it/s][A
Training:  21%|██   

Epoch: 20/33 - Loss: 5.5452 - Accuracy: 0.9194



  0%|          | 0/16 [00:00<?, ?it/s][A
  6%|▋         | 1/16 [00:01<00:17,  1.16s/it][A
 19%|█▉        | 3/16 [00:01<00:04,  2.94it/s][A
 31%|███▏      | 5/16 [00:01<00:03,  3.13it/s][A
 44%|████▍     | 7/16 [00:02<00:01,  4.66it/s][A
 56%|█████▋    | 9/16 [00:02<00:01,  4.40it/s][A
 62%|██████▎   | 10/16 [00:02<00:01,  4.73it/s][A
 75%|███████▌  | 12/16 [00:02<00:00,  6.53it/s][A
100%|██████████| 16/16 [00:03<00:00,  4.52it/s][A
Epochs:  61%|██████    | 20/33 [09:06<05:52, 27.13s/it]

Val Loss: 3.5983 - Val Accuracy: 0.9302



Training:   0%|          | 0/126 [00:00<?, ?it/s][A
Training:   1%|          | 1/126 [00:01<02:13,  1.07s/it][A
Training:   2%|▏         | 3/126 [00:01<00:40,  3.02it/s][A
Training:   3%|▎         | 4/126 [00:01<00:30,  3.94it/s][A
Training:   4%|▍         | 5/126 [00:01<00:35,  3.40it/s][A
Training:   6%|▌         | 7/126 [00:01<00:22,  5.32it/s][A
Training:   7%|▋         | 9/126 [00:02<00:27,  4.22it/s][A
Training:   8%|▊         | 10/126 [00:02<00:24,  4.75it/s][A
Training:  10%|▉         | 12/126 [00:02<00:17,  6.70it/s][A
Training:  11%|█         | 14/126 [00:03<00:25,  4.32it/s][A
Training:  13%|█▎        | 17/126 [00:04<00:26,  4.17it/s][A
Training:  14%|█▍        | 18/126 [00:04<00:23,  4.62it/s][A
Training:  15%|█▌        | 19/126 [00:04<00:20,  5.12it/s][A
Training:  17%|█▋        | 21/126 [00:04<00:22,  4.76it/s][A
Training:  18%|█▊        | 23/126 [00:05<00:17,  6.04it/s][A
Training:  20%|█▉        | 25/126 [00:05<00:20,  4.83it/s][A
Training:  21%|██▏    

Epoch: 21/33 - Loss: 2.9502 - Accuracy: 0.9302



  0%|          | 0/16 [00:00<?, ?it/s][A
  6%|▋         | 1/16 [00:01<00:16,  1.07s/it][A
 31%|███▏      | 5/16 [00:01<00:03,  3.54it/s][A
 38%|███▊      | 6/16 [00:01<00:02,  3.97it/s][A
 56%|█████▋    | 9/16 [00:02<00:01,  4.56it/s][A
 62%|██████▎   | 10/16 [00:02<00:01,  4.85it/s][A
 81%|████████▏ | 13/16 [00:03<00:00,  5.15it/s][A
100%|██████████| 16/16 [00:03<00:00,  4.57it/s][A
Epochs:  64%|██████▎   | 21/33 [09:33<05:24, 27.04s/it]

Val Loss: 3.6647 - Val Accuracy: 0.9227



Training:   0%|          | 0/126 [00:00<?, ?it/s][A
Training:   1%|          | 1/126 [00:01<02:07,  1.02s/it][A
Training:   3%|▎         | 4/126 [00:01<00:30,  4.03it/s][A
Training:   4%|▍         | 5/126 [00:01<00:39,  3.07it/s][A
Training:   5%|▍         | 6/126 [00:01<00:32,  3.74it/s][A
Training:   6%|▋         | 8/126 [00:02<00:20,  5.63it/s][A
Training:   7%|▋         | 9/126 [00:02<00:29,  3.95it/s][A
Training:   8%|▊         | 10/126 [00:02<00:25,  4.52it/s][A
Training:  10%|▉         | 12/126 [00:02<00:16,  6.71it/s][A
Training:  11%|█         | 14/126 [00:03<00:26,  4.29it/s][A
Training:  13%|█▎        | 17/126 [00:03<00:19,  5.51it/s][A
Training:  14%|█▍        | 18/126 [00:04<00:22,  4.71it/s][A
Training:  17%|█▋        | 21/126 [00:04<00:16,  6.45it/s][A
Training:  17%|█▋        | 22/126 [00:04<00:22,  4.59it/s][A
Training:  19%|█▉        | 24/126 [00:05<00:16,  6.01it/s][A
Training:  21%|██        | 26/126 [00:05<00:21,  4.75it/s][A
Training:  22%|██▏    

Epoch: 22/33 - Loss: 3.1663 - Accuracy: 0.9310



  0%|          | 0/16 [00:00<?, ?it/s][A
  6%|▋         | 1/16 [00:01<00:20,  1.34s/it][A
 31%|███▏      | 5/16 [00:01<00:03,  2.98it/s][A
 44%|████▍     | 7/16 [00:02<00:02,  4.34it/s][A
 56%|█████▋    | 9/16 [00:02<00:01,  3.88it/s][A
100%|██████████| 16/16 [00:03<00:00,  4.55it/s][A
Epochs:  67%|██████▋   | 22/33 [10:00<04:56, 26.95s/it]

Val Loss: 4.6115 - Val Accuracy: 0.9282



Training:   0%|          | 0/126 [00:00<?, ?it/s][A
Training:   1%|          | 1/126 [00:01<02:07,  1.02s/it][A
Training:   2%|▏         | 2/126 [00:01<01:00,  2.06it/s][A
Training:   3%|▎         | 4/126 [00:01<00:26,  4.64it/s][A
Training:   5%|▍         | 6/126 [00:01<00:27,  4.40it/s][A
Training:   6%|▋         | 8/126 [00:01<00:19,  5.95it/s][A
Training:   7%|▋         | 9/126 [00:02<00:28,  4.17it/s][A
Training:  10%|▉         | 12/126 [00:02<00:17,  6.54it/s][A
Training:  11%|█         | 14/126 [00:03<00:20,  5.54it/s][A
Training:  13%|█▎        | 16/126 [00:03<00:17,  6.44it/s][A
Training:  13%|█▎        | 17/126 [00:03<00:23,  4.57it/s][A
Training:  14%|█▍        | 18/126 [00:03<00:22,  4.82it/s][A
Training:  16%|█▌        | 20/126 [00:04<00:18,  5.77it/s][A
Training:  17%|█▋        | 21/126 [00:04<00:23,  4.56it/s][A
Training:  17%|█▋        | 22/126 [00:04<00:20,  5.17it/s][A
Training:  18%|█▊        | 23/126 [00:04<00:18,  5.63it/s][A
Training:  19%|█▉     

Epoch: 23/33 - Loss: 3.6708 - Accuracy: 0.9262



  0%|          | 0/16 [00:00<?, ?it/s][A
  6%|▋         | 1/16 [00:01<00:19,  1.28s/it][A
 19%|█▉        | 3/16 [00:01<00:04,  2.65it/s][A
 31%|███▏      | 5/16 [00:02<00:03,  2.77it/s][A
 56%|█████▋    | 9/16 [00:02<00:01,  3.92it/s][A
100%|██████████| 16/16 [00:03<00:00,  4.50it/s][A
Epochs:  70%|██████▉   | 23/33 [10:27<04:30, 27.02s/it]

Val Loss: 3.9557 - Val Accuracy: 0.8686



Training:   0%|          | 0/126 [00:00<?, ?it/s][A
Training:   1%|          | 1/126 [00:01<02:20,  1.12s/it][A
Training:   3%|▎         | 4/126 [00:01<00:31,  3.93it/s][A
Training:   5%|▍         | 6/126 [00:01<00:34,  3.48it/s][A
Training:   6%|▋         | 8/126 [00:02<00:23,  4.95it/s][A
Training:   8%|▊         | 10/126 [00:02<00:29,  3.99it/s][A
Training:  10%|▉         | 12/126 [00:02<00:20,  5.46it/s][A
Training:  11%|█         | 14/126 [00:03<00:26,  4.17it/s][A
Training:  13%|█▎        | 17/126 [00:04<00:25,  4.19it/s][A
Training:  15%|█▌        | 19/126 [00:04<00:20,  5.22it/s][A
Training:  17%|█▋        | 21/126 [00:05<00:23,  4.48it/s][A
Training:  20%|█▉        | 25/126 [00:05<00:21,  4.60it/s][A
Training:  21%|██▏       | 27/126 [00:05<00:17,  5.59it/s][A
Training:  23%|██▎       | 29/126 [00:06<00:20,  4.80it/s][A
Training:  25%|██▍       | 31/126 [00:06<00:15,  5.99it/s][A
Training:  26%|██▌       | 33/126 [00:07<00:17,  5.42it/s][A
Training:  29%|██▉  

Epoch: 24/33 - Loss: 3.2194 - Accuracy: 0.9287



  0%|          | 0/16 [00:00<?, ?it/s][A
  6%|▋         | 1/16 [00:01<00:15,  1.06s/it][A
 25%|██▌       | 4/16 [00:01<00:02,  4.38it/s][A
 38%|███▊      | 6/16 [00:01<00:02,  3.88it/s][A
 50%|█████     | 8/16 [00:01<00:01,  5.16it/s][A
 62%|██████▎   | 10/16 [00:02<00:01,  4.46it/s][A
100%|██████████| 16/16 [00:03<00:00,  4.85it/s][A
Epochs:  73%|███████▎  | 24/33 [10:54<04:03, 27.01s/it]

Val Loss: 3.6277 - Val Accuracy: 0.9089



Training:   0%|          | 0/126 [00:00<?, ?it/s][A
Training:   1%|          | 1/126 [00:01<02:22,  1.14s/it][A
Training:   3%|▎         | 4/126 [00:01<00:30,  3.99it/s][A
Training:   5%|▍         | 6/126 [00:01<00:34,  3.50it/s][A
Training:   7%|▋         | 9/126 [00:02<00:30,  3.86it/s][A
Training:  10%|█         | 13/126 [00:03<00:27,  4.11it/s][A
Training:  13%|█▎        | 16/126 [00:03<00:19,  5.66it/s][A
Training:  14%|█▍        | 18/126 [00:04<00:25,  4.31it/s][A
Training:  16%|█▌        | 20/126 [00:04<00:20,  5.27it/s][A
Training:  17%|█▋        | 22/126 [00:05<00:22,  4.60it/s][A
Training:  20%|█▉        | 25/126 [00:05<00:21,  4.73it/s][A
Training:  22%|██▏       | 28/126 [00:05<00:14,  6.59it/s][A
Training:  24%|██▍       | 30/126 [00:06<00:20,  4.61it/s][A
Training:  25%|██▌       | 32/126 [00:06<00:16,  5.56it/s][A
Training:  27%|██▋       | 34/126 [00:07<00:18,  4.90it/s][A
Training:  29%|██▊       | 36/126 [00:07<00:14,  6.07it/s][A
Training:  30%|███  

Epoch: 25/33 - Loss: 3.3799 - Accuracy: 0.9321



  0%|          | 0/16 [00:00<?, ?it/s][A
  6%|▋         | 1/16 [00:00<00:13,  1.08it/s][A
 12%|█▎        | 2/16 [00:01<00:06,  2.24it/s][A
 31%|███▏      | 5/16 [00:01<00:02,  4.40it/s][A
 38%|███▊      | 6/16 [00:01<00:02,  4.71it/s][A
 56%|█████▋    | 9/16 [00:02<00:01,  5.35it/s][A
 62%|██████▎   | 10/16 [00:02<00:01,  5.34it/s][A
 81%|████████▏ | 13/16 [00:02<00:00,  5.15it/s][A
100%|██████████| 16/16 [00:03<00:00,  4.98it/s][A
Epochs:  76%|███████▌  | 25/33 [11:21<03:35, 26.96s/it]

Val Loss: 4.2134 - Val Accuracy: 0.9425



Training:   0%|          | 0/126 [00:00<?, ?it/s][A
Training:   1%|          | 1/126 [00:01<02:13,  1.07s/it][A
Training:   2%|▏         | 3/126 [00:01<00:39,  3.13it/s][A
Training:   4%|▍         | 5/126 [00:01<00:37,  3.22it/s][A
Training:   7%|▋         | 9/126 [00:02<00:24,  4.77it/s][A
Training:   8%|▊         | 10/126 [00:02<00:22,  5.14it/s][A
Training:  10%|█         | 13/126 [00:03<00:22,  4.93it/s][A
Training:  11%|█         | 14/126 [00:03<00:21,  5.17it/s][A
Training:  13%|█▎        | 17/126 [00:03<00:21,  4.97it/s][A
Training:  14%|█▍        | 18/126 [00:04<00:20,  5.32it/s][A
Training:  16%|█▌        | 20/126 [00:04<00:15,  6.64it/s][A
Training:  17%|█▋        | 21/126 [00:04<00:21,  4.82it/s][A
Training:  17%|█▋        | 22/126 [00:04<00:22,  4.61it/s][A
Training:  20%|█▉        | 25/126 [00:05<00:19,  5.28it/s][A
Training:  21%|██        | 26/126 [00:05<00:18,  5.28it/s][A
Training:  23%|██▎       | 29/126 [00:06<00:19,  4.97it/s][A
Training:  24%|██▍  

Epoch: 26/33 - Loss: 3.3397 - Accuracy: 0.9302



  0%|          | 0/16 [00:00<?, ?it/s][A
  6%|▋         | 1/16 [00:01<00:15,  1.05s/it][A
 25%|██▌       | 4/16 [00:01<00:02,  4.28it/s][A
 38%|███▊      | 6/16 [00:01<00:02,  3.56it/s][A
 56%|█████▋    | 9/16 [00:02<00:01,  3.82it/s][A
 75%|███████▌  | 12/16 [00:02<00:00,  5.91it/s][A
100%|██████████| 16/16 [00:03<00:00,  4.54it/s][A
Epochs:  79%|███████▉  | 26/33 [11:48<03:09, 27.02s/it]

Val Loss: 3.9272 - Val Accuracy: 0.9272



Training:   0%|          | 0/126 [00:00<?, ?it/s][A
Training:   1%|          | 1/126 [00:01<02:29,  1.19s/it][A
Training:   2%|▏         | 3/126 [00:01<00:43,  2.85it/s][A
Training:   4%|▍         | 5/126 [00:01<00:33,  3.57it/s][A
Training:   6%|▌         | 7/126 [00:01<00:23,  5.14it/s][A
Training:   6%|▋         | 8/126 [00:02<00:23,  4.99it/s][A
Training:   7%|▋         | 9/126 [00:02<00:25,  4.65it/s][A
Training:   8%|▊         | 10/126 [00:02<00:21,  5.31it/s][A
Training:  10%|▉         | 12/126 [00:02<00:20,  5.46it/s][A
Training:  10%|█         | 13/126 [00:03<00:24,  4.64it/s][A
Training:  11%|█         | 14/126 [00:03<00:23,  4.71it/s][A
Training:  13%|█▎        | 16/126 [00:03<00:21,  5.20it/s][A
Training:  13%|█▎        | 17/126 [00:03<00:21,  5.10it/s][A
Training:  15%|█▌        | 19/126 [00:04<00:17,  6.16it/s][A
Training:  16%|█▌        | 20/126 [00:04<00:18,  5.65it/s][A
Training:  17%|█▋        | 21/126 [00:04<00:20,  5.02it/s][A
Training:  18%|█▊     

Epoch: 27/33 - Loss: 7.7330 - Accuracy: 0.9116



  0%|          | 0/16 [00:00<?, ?it/s][A
  6%|▋         | 1/16 [00:00<00:14,  1.03it/s][A
 12%|█▎        | 2/16 [00:01<00:07,  1.99it/s][A
 31%|███▏      | 5/16 [00:01<00:02,  3.73it/s][A
 38%|███▊      | 6/16 [00:01<00:02,  3.87it/s][A
 50%|█████     | 8/16 [00:02<00:01,  5.82it/s][A
 56%|█████▋    | 9/16 [00:02<00:01,  5.16it/s][A
 62%|██████▎   | 10/16 [00:02<00:01,  5.27it/s][A
 81%|████████▏ | 13/16 [00:02<00:00,  5.46it/s][A
100%|██████████| 16/16 [00:03<00:00,  4.76it/s][A
Epochs:  82%|████████▏ | 27/33 [12:15<02:41, 26.93s/it]

Val Loss: 4.2932 - Val Accuracy: 0.9056



Training:   0%|          | 0/126 [00:00<?, ?it/s][A
Training:   1%|          | 1/126 [00:01<02:26,  1.18s/it][A
Training:   3%|▎         | 4/126 [00:01<00:30,  3.95it/s][A
Training:   5%|▍         | 6/126 [00:01<00:32,  3.67it/s][A
Training:   7%|▋         | 9/126 [00:02<00:27,  4.30it/s][A
Training:   8%|▊         | 10/126 [00:02<00:26,  4.30it/s][A
Training:  10%|▉         | 12/126 [00:02<00:19,  5.71it/s][A
Training:  10%|█         | 13/126 [00:03<00:24,  4.52it/s][A
Training:  11%|█         | 14/126 [00:03<00:23,  4.68it/s][A
Training:  12%|█▏        | 15/126 [00:03<00:20,  5.31it/s][A
Training:  13%|█▎        | 17/126 [00:03<00:21,  5.11it/s][A
Training:  14%|█▍        | 18/126 [00:04<00:20,  5.21it/s][A
Training:  16%|█▌        | 20/126 [00:04<00:15,  7.03it/s][A
Training:  17%|█▋        | 21/126 [00:04<00:18,  5.61it/s][A
Training:  17%|█▋        | 22/126 [00:04<00:19,  5.25it/s][A
Training:  19%|█▉        | 24/126 [00:04<00:13,  7.36it/s][A
Training:  20%|█▉   

Epoch: 28/33 - Loss: 3.0529 - Accuracy: 0.9326



  0%|          | 0/16 [00:00<?, ?it/s][A
  6%|▋         | 1/16 [00:00<00:14,  1.02it/s][A
 12%|█▎        | 2/16 [00:01<00:07,  1.92it/s][A
 31%|███▏      | 5/16 [00:01<00:02,  3.88it/s][A
 38%|███▊      | 6/16 [00:01<00:02,  4.20it/s][A
 56%|█████▋    | 9/16 [00:02<00:01,  4.76it/s][A
 62%|██████▎   | 10/16 [00:02<00:01,  4.86it/s][A
 81%|████████▏ | 13/16 [00:03<00:00,  5.40it/s][A
100%|██████████| 16/16 [00:03<00:00,  4.68it/s][A
Epochs:  85%|████████▍ | 28/33 [12:42<02:14, 26.96s/it]

Val Loss: 3.5156 - Val Accuracy: 0.9159



Training:   0%|          | 0/126 [00:00<?, ?it/s][A
Training:   1%|          | 1/126 [00:00<01:54,  1.09it/s][A
Training:   2%|▏         | 2/126 [00:01<00:54,  2.26it/s][A
Training:   3%|▎         | 4/126 [00:01<00:24,  5.05it/s][A
Training:   5%|▍         | 6/126 [00:01<00:28,  4.27it/s][A
Training:   6%|▋         | 8/126 [00:01<00:20,  5.72it/s][A
Training:   7%|▋         | 9/126 [00:02<00:26,  4.41it/s][A
Training:   8%|▊         | 10/126 [00:02<00:26,  4.37it/s][A
Training:  10%|█         | 13/126 [00:02<00:20,  5.56it/s][A
Training:  11%|█         | 14/126 [00:03<00:21,  5.13it/s][A
Training:  13%|█▎        | 17/126 [00:03<00:19,  5.59it/s][A
Training:  14%|█▍        | 18/126 [00:03<00:21,  5.07it/s][A
Training:  17%|█▋        | 21/126 [00:04<00:18,  5.63it/s][A
Training:  17%|█▋        | 22/126 [00:04<00:19,  5.37it/s][A
Training:  19%|█▉        | 24/126 [00:04<00:15,  6.74it/s][A
Training:  20%|█▉        | 25/126 [00:05<00:19,  5.20it/s][A
Training:  21%|██     

Epoch: 29/33 - Loss: 2.9331 - Accuracy: 0.9338



  0%|          | 0/16 [00:00<?, ?it/s][A
  6%|▋         | 1/16 [00:00<00:14,  1.04it/s][A
 25%|██▌       | 4/16 [00:01<00:02,  4.64it/s][A
 38%|███▊      | 6/16 [00:01<00:02,  4.04it/s][A
 50%|█████     | 8/16 [00:01<00:01,  5.32it/s][A
 62%|██████▎   | 10/16 [00:02<00:01,  4.98it/s][A
 75%|███████▌  | 12/16 [00:02<00:00,  6.53it/s][A
100%|██████████| 16/16 [00:02<00:00,  5.46it/s][A
Epochs:  88%|████████▊ | 29/33 [13:08<01:47, 26.76s/it]

Val Loss: 3.5779 - Val Accuracy: 0.9325



Training:   0%|          | 0/126 [00:00<?, ?it/s][A
Training:   1%|          | 1/126 [00:00<02:00,  1.04it/s][A
Training:   2%|▏         | 3/126 [00:01<00:36,  3.35it/s][A
Training:   4%|▍         | 5/126 [00:01<00:33,  3.57it/s][A
Training:   6%|▌         | 7/126 [00:01<00:22,  5.34it/s][A
Training:   7%|▋         | 9/126 [00:02<00:28,  4.14it/s][A
Training:   9%|▊         | 11/126 [00:02<00:20,  5.59it/s][A
Training:  10%|█         | 13/126 [00:03<00:25,  4.45it/s][A
Training:  13%|█▎        | 16/126 [00:03<00:16,  6.76it/s][A
Training:  14%|█▍        | 18/126 [00:03<00:18,  5.71it/s][A
Training:  16%|█▌        | 20/126 [00:03<00:14,  7.10it/s][A
Training:  17%|█▋        | 22/126 [00:04<00:18,  5.55it/s][A
Training:  20%|█▉        | 25/126 [00:04<00:18,  5.48it/s][A
Training:  22%|██▏       | 28/126 [00:05<00:14,  6.77it/s][A
Training:  23%|██▎       | 29/126 [00:05<00:17,  5.44it/s][A
Training:  25%|██▌       | 32/126 [00:05<00:14,  6.66it/s][A
Training:  26%|██▌   

Epoch: 30/33 - Loss: 2.9782 - Accuracy: 0.9383



  0%|          | 0/16 [00:00<?, ?it/s][A
  6%|▋         | 1/16 [00:01<00:15,  1.05s/it][A
 12%|█▎        | 2/16 [00:01<00:07,  1.99it/s][A
 25%|██▌       | 4/16 [00:01<00:02,  4.28it/s][A
 31%|███▏      | 5/16 [00:01<00:03,  3.31it/s][A
 38%|███▊      | 6/16 [00:01<00:02,  3.69it/s][A
 50%|█████     | 8/16 [00:02<00:01,  5.51it/s][A
 56%|█████▋    | 9/16 [00:02<00:01,  4.11it/s][A
 62%|██████▎   | 10/16 [00:02<00:01,  3.98it/s][A
 75%|███████▌  | 12/16 [00:02<00:00,  5.96it/s][A
 81%|████████▏ | 13/16 [00:03<00:00,  5.05it/s][A
100%|██████████| 16/16 [00:03<00:00,  4.40it/s][A
Epochs:  91%|█████████ | 30/33 [13:34<01:20, 26.68s/it]

Val Loss: 5.1230 - Val Accuracy: 0.9259



Training:   0%|          | 0/126 [00:00<?, ?it/s][A
Training:   1%|          | 1/126 [00:01<02:30,  1.21s/it][A
Training:   2%|▏         | 3/126 [00:01<00:43,  2.83it/s][A
Training:   4%|▍         | 5/126 [00:02<00:41,  2.88it/s][A
Training:   6%|▌         | 7/126 [00:02<00:26,  4.44it/s][A
Training:   7%|▋         | 9/126 [00:02<00:32,  3.59it/s][A
Training:   9%|▊         | 11/126 [00:03<00:23,  4.82it/s][A
Training:  10%|█         | 13/126 [00:03<00:27,  4.09it/s][A
Training:  12%|█▏        | 15/126 [00:03<00:20,  5.44it/s][A
Training:  13%|█▎        | 17/126 [00:04<00:22,  4.77it/s][A
Training:  15%|█▌        | 19/126 [00:04<00:17,  6.17it/s][A
Training:  17%|█▋        | 21/126 [00:04<00:21,  4.98it/s][A
Training:  20%|█▉        | 25/126 [00:05<00:19,  5.16it/s][A
Training:  23%|██▎       | 29/126 [00:06<00:18,  5.17it/s][A
Training:  26%|██▌       | 33/126 [00:07<00:17,  5.29it/s][A
Training:  28%|██▊       | 35/126 [00:07<00:14,  6.18it/s][A
Training:  29%|██▉   

Epoch: 31/33 - Loss: 2.8394 - Accuracy: 0.9358



  0%|          | 0/16 [00:00<?, ?it/s][A
  6%|▋         | 1/16 [00:01<00:17,  1.19s/it][A
 12%|█▎        | 2/16 [00:01<00:07,  1.76it/s][A
 31%|███▏      | 5/16 [00:01<00:03,  3.21it/s][A
 50%|█████     | 8/16 [00:02<00:01,  5.73it/s][A
 62%|██████▎   | 10/16 [00:02<00:01,  4.64it/s][A
100%|██████████| 16/16 [00:03<00:00,  4.55it/s][A
Epochs:  94%|█████████▍| 31/33 [14:02<00:54, 27.01s/it]

Val Loss: 3.1671 - Val Accuracy: 0.9332



Training:   0%|          | 0/126 [00:00<?, ?it/s][A
Training:   1%|          | 1/126 [00:01<02:05,  1.00s/it][A
Training:   3%|▎         | 4/126 [00:01<00:27,  4.41it/s][A
Training:   5%|▍         | 6/126 [00:01<00:29,  4.06it/s][A
Training:   7%|▋         | 9/126 [00:02<00:30,  3.87it/s][A
Training:   9%|▊         | 11/126 [00:02<00:22,  5.10it/s][A
Training:  10%|█         | 13/126 [00:03<00:23,  4.72it/s][A
Training:  12%|█▏        | 15/126 [00:03<00:19,  5.55it/s][A
Training:  13%|█▎        | 17/126 [00:03<00:22,  4.82it/s][A
Training:  15%|█▌        | 19/126 [00:04<00:20,  5.13it/s][A
Training:  17%|█▋        | 21/126 [00:04<00:17,  5.95it/s][A
Training:  18%|█▊        | 23/126 [00:04<00:18,  5.49it/s][A
Training:  20%|█▉        | 25/126 [00:05<00:15,  6.37it/s][A
Training:  21%|██▏       | 27/126 [00:05<00:18,  5.29it/s][A
Training:  23%|██▎       | 29/126 [00:05<00:14,  6.65it/s][A
Training:  25%|██▍       | 31/126 [00:06<00:17,  5.38it/s][A
Training:  27%|██▋  

Epoch: 32/33 - Loss: 2.8201 - Accuracy: 0.9393



  0%|          | 0/16 [00:00<?, ?it/s][A
  6%|▋         | 1/16 [00:01<00:17,  1.15s/it][A
 25%|██▌       | 4/16 [00:01<00:02,  4.04it/s][A
 38%|███▊      | 6/16 [00:01<00:02,  3.61it/s][A
 50%|█████     | 8/16 [00:02<00:01,  4.56it/s][A
 56%|█████▋    | 9/16 [00:02<00:01,  3.60it/s][A
 69%|██████▉   | 11/16 [00:02<00:00,  5.17it/s][A
100%|██████████| 16/16 [00:03<00:00,  4.52it/s][A
Epochs:  97%|█████████▋| 32/33 [14:29<00:26, 26.87s/it]

Val Loss: 3.7395 - Val Accuracy: 0.9283



Training:   0%|          | 0/126 [00:00<?, ?it/s][A
Training:   1%|          | 1/126 [00:01<02:09,  1.04s/it][A
Training:   2%|▏         | 3/126 [00:01<00:40,  3.01it/s][A
Training:   4%|▍         | 5/126 [00:01<00:34,  3.51it/s][A
Training:   5%|▍         | 6/126 [00:01<00:28,  4.22it/s][A
Training:   7%|▋         | 9/126 [00:02<00:26,  4.36it/s][A
Training:   8%|▊         | 10/126 [00:02<00:25,  4.54it/s][A
Training:  10%|█         | 13/126 [00:03<00:21,  5.32it/s][A
Training:  11%|█         | 14/126 [00:03<00:24,  4.49it/s][A
Training:  13%|█▎        | 16/126 [00:03<00:18,  5.92it/s][A
Training:  13%|█▎        | 17/126 [00:03<00:19,  5.56it/s][A
Training:  14%|█▍        | 18/126 [00:03<00:18,  5.89it/s][A
Training:  17%|█▋        | 21/126 [00:04<00:18,  5.62it/s][A
Training:  17%|█▋        | 22/126 [00:04<00:18,  5.68it/s][A
Training:  20%|█▉        | 25/126 [00:05<00:17,  5.69it/s][A
Training:  21%|██        | 26/126 [00:05<00:17,  5.79it/s][A
Training:  23%|██▎   

Epoch: 33/33 - Loss: 2.6253 - Accuracy: 0.9385



  0%|          | 0/16 [00:00<?, ?it/s][A
  6%|▋         | 1/16 [00:01<00:19,  1.27s/it][A
 25%|██▌       | 4/16 [00:01<00:03,  3.69it/s][A
 38%|███▊      | 6/16 [00:01<00:02,  3.76it/s][A
 56%|█████▋    | 9/16 [00:02<00:01,  3.66it/s][A
 75%|███████▌  | 12/16 [00:02<00:00,  5.66it/s][A
100%|██████████| 16/16 [00:03<00:00,  4.53it/s][A
Epochs: 100%|██████████| 33/33 [14:56<00:00, 27.17s/it]


Val Loss: 3.3435 - Val Accuracy: 0.9378
Saving best model...


[32m[I 2023-12-14 23:11:27,639][0m Trial 2 finished with value: 0.937753438949585 and parameters: {'loss_learning_rate': 0.000515322161093277, 'learning_rate': 0.01295417626729335, 'weight_decay': 0.00010094083028756503, 'epsilon': 3.4787628785215855e-08, 'batch_size': 111, 'epochs': 33}. Best is trial 2 with value: 0.937753438949585.[0m


Learning rate for Loss: 0.007241145783203654
Learning rate: 0.02124392374572327
Weight decay: 0.0004373342967663484
Epsilon: 8.320175162308942e-08
Batch size: 203
Number of epochs: 59


Epochs:   0%|          | 0/59 [00:00<?, ?it/s]
Training:   0%|          | 0/69 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/69 [00:01<01:45,  1.55s/it][A
Training:   3%|▎         | 2/69 [00:01<00:47,  1.42it/s][A
Training:   6%|▌         | 4/69 [00:01<00:19,  3.25it/s][A
Training:   7%|▋         | 5/69 [00:02<00:35,  1.80it/s][A
Training:  10%|█         | 7/69 [00:03<00:24,  2.57it/s][A
Training:  12%|█▏        | 8/69 [00:03<00:19,  3.15it/s][A
Training:  13%|█▎        | 9/69 [00:04<00:29,  2.04it/s][A
Training:  16%|█▌        | 11/69 [00:04<00:17,  3.25it/s][A
Training:  19%|█▉        | 13/69 [00:05<00:21,  2.56it/s][A
Training:  22%|██▏       | 15/69 [00:05<00:14,  3.62it/s][A
Training:  25%|██▍       | 17/69 [00:06<00:19,  2.67it/s][A
Training:  28%|██▊       | 19/69 [00:07<00:15,  3.27it/s][A
Training:  30%|███       | 21/69 [00:08<00:17,  2.69it/s][A
Training:  33%|███▎      | 23/69 [00:08<00:13,  3.45it/s][A
Training:  36%|███▌      | 25/69 [00:09<00:15,  2.86it

Epoch: 1/59 - Loss: 14.4922 - Accuracy: 0.7875



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:01<00:13,  1.65s/it][A
 22%|██▏       | 2/9 [00:01<00:05,  1.35it/s][A
 44%|████▍     | 4/9 [00:01<00:01,  3.08it/s][A
 56%|█████▌    | 5/9 [00:02<00:02,  1.91it/s][A
 67%|██████▋   | 6/9 [00:03<00:01,  2.51it/s][A
100%|██████████| 9/9 [00:03<00:00,  2.42it/s][A
Epochs:   2%|▏         | 1/59 [00:27<26:10, 27.08s/it]

Val Loss: 4.7358 - Val Accuracy: 0.8979



Training:   0%|          | 0/69 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/69 [00:01<01:47,  1.58s/it][A
Training:   4%|▍         | 3/69 [00:01<00:29,  2.20it/s][A
Training:   7%|▋         | 5/69 [00:02<00:31,  2.02it/s][A
Training:  10%|█         | 7/69 [00:02<00:19,  3.12it/s][A
Training:  12%|█▏        | 8/69 [00:03<00:16,  3.68it/s][A
Training:  13%|█▎        | 9/69 [00:04<00:30,  1.99it/s][A
Training:  16%|█▌        | 11/69 [00:04<00:18,  3.07it/s][A
Training:  19%|█▉        | 13/69 [00:05<00:21,  2.62it/s][A
Training:  22%|██▏       | 15/69 [00:05<00:14,  3.70it/s][A
Training:  25%|██▍       | 17/69 [00:06<00:19,  2.73it/s][A
Training:  29%|██▉       | 20/69 [00:06<00:11,  4.31it/s][A
Training:  32%|███▏      | 22/69 [00:08<00:17,  2.73it/s][A
Training:  36%|███▌      | 25/69 [00:09<00:16,  2.72it/s][A
Training:  38%|███▊      | 26/69 [00:09<00:14,  3.03it/s][A
Training:  41%|████      | 28/69 [00:09<00:10,  3.97it/s][A
Training:  42%|████▏     | 29/69 [00:1

Epoch: 2/59 - Loss: 4.8709 - Accuracy: 0.9148



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:02<00:17,  2.21s/it][A
 33%|███▎      | 3/9 [00:02<00:03,  1.61it/s][A
 56%|█████▌    | 5/9 [00:03<00:02,  1.68it/s][A
100%|██████████| 9/9 [00:04<00:00,  2.11it/s][A
Epochs:   3%|▎         | 2/59 [00:55<26:12, 27.58s/it]

Val Loss: 6.7161 - Val Accuracy: 0.9096



Training:   0%|          | 0/69 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/69 [00:01<02:05,  1.85s/it][A
Training:   4%|▍         | 3/69 [00:02<00:35,  1.87it/s][A
Training:   7%|▋         | 5/69 [00:03<00:34,  1.86it/s][A
Training:   9%|▊         | 6/69 [00:03<00:28,  2.20it/s][A
Training:  12%|█▏        | 8/69 [00:03<00:17,  3.43it/s][A
Training:  13%|█▎        | 9/69 [00:04<00:27,  2.22it/s][A
Training:  14%|█▍        | 10/69 [00:04<00:23,  2.50it/s][A
Training:  16%|█▌        | 11/69 [00:04<00:19,  2.99it/s][A
Training:  19%|█▉        | 13/69 [00:05<00:19,  2.82it/s][A
Training:  20%|██        | 14/69 [00:05<00:17,  3.23it/s][A
Training:  22%|██▏       | 15/69 [00:06<00:16,  3.24it/s][A
Training:  23%|██▎       | 16/69 [00:06<00:13,  3.82it/s][A
Training:  25%|██▍       | 17/69 [00:06<00:18,  2.87it/s][A
Training:  26%|██▌       | 18/69 [00:07<00:18,  2.78it/s][A
Training:  28%|██▊       | 19/69 [00:07<00:16,  3.05it/s][A
Training:  30%|███       | 21/69 [00:0

Epoch: 3/59 - Loss: 4.4409 - Accuracy: 0.9223



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:01<00:14,  1.81s/it][A
 22%|██▏       | 2/9 [00:01<00:05,  1.22it/s][A
 56%|█████▌    | 5/9 [00:03<00:02,  1.92it/s][A
 67%|██████▋   | 6/9 [00:03<00:01,  2.31it/s][A
 89%|████████▉ | 8/9 [00:03<00:00,  3.58it/s][A
100%|██████████| 9/9 [00:03<00:00,  2.28it/s][A
Epochs:   5%|▌         | 3/59 [01:22<25:46, 27.62s/it]

Val Loss: 4.0227 - Val Accuracy: 0.9255



Training:   0%|          | 0/69 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/69 [00:01<02:04,  1.83s/it][A
Training:   3%|▎         | 2/69 [00:01<00:55,  1.20it/s][A
Training:   6%|▌         | 4/69 [00:02<00:23,  2.77it/s][A
Training:   7%|▋         | 5/69 [00:02<00:33,  1.94it/s][A
Training:   9%|▊         | 6/69 [00:03<00:27,  2.29it/s][A
Training:  13%|█▎        | 9/69 [00:04<00:21,  2.77it/s][A
Training:  14%|█▍        | 10/69 [00:04<00:20,  2.90it/s][A
Training:  19%|█▉        | 13/69 [00:05<00:17,  3.12it/s][A
Training:  20%|██        | 14/69 [00:05<00:19,  2.80it/s][A
Training:  23%|██▎       | 16/69 [00:06<00:13,  3.85it/s][A
Training:  25%|██▍       | 17/69 [00:06<00:16,  3.10it/s][A
Training:  26%|██▌       | 18/69 [00:07<00:18,  2.74it/s][A
Training:  29%|██▉       | 20/69 [00:07<00:12,  3.97it/s][A
Training:  30%|███       | 21/69 [00:07<00:14,  3.27it/s][A
Training:  32%|███▏      | 22/69 [00:08<00:19,  2.45it/s][A
Training:  35%|███▍      | 24/69 [00:0

Epoch: 4/59 - Loss: 4.2097 - Accuracy: 0.9338



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:01<00:12,  1.54s/it][A
 22%|██▏       | 2/9 [00:01<00:04,  1.41it/s][A
 33%|███▎      | 3/9 [00:01<00:03,  1.99it/s][A
 56%|█████▌    | 5/9 [00:02<00:01,  2.03it/s][A
 78%|███████▊  | 7/9 [00:03<00:00,  3.09it/s][A
100%|██████████| 9/9 [00:03<00:00,  2.45it/s][A
Epochs:   7%|▋         | 4/59 [01:49<25:03, 27.34s/it]

Val Loss: 3.7421 - Val Accuracy: 0.9224



Training:   0%|          | 0/69 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/69 [00:01<01:47,  1.59s/it][A
Training:   4%|▍         | 3/69 [00:01<00:30,  2.17it/s][A
Training:   7%|▋         | 5/69 [00:02<00:34,  1.87it/s][A
Training:  10%|█         | 7/69 [00:03<00:21,  2.95it/s][A
Training:  13%|█▎        | 9/69 [00:04<00:24,  2.41it/s][A
Training:  16%|█▌        | 11/69 [00:04<00:16,  3.47it/s][A
Training:  19%|█▉        | 13/69 [00:05<00:21,  2.63it/s][A
Training:  22%|██▏       | 15/69 [00:05<00:15,  3.57it/s][A
Training:  25%|██▍       | 17/69 [00:06<00:18,  2.78it/s][A
Training:  28%|██▊       | 19/69 [00:06<00:13,  3.76it/s][A
Training:  30%|███       | 21/69 [00:07<00:15,  3.05it/s][A
Training:  32%|███▏      | 22/69 [00:08<00:16,  2.83it/s][A
Training:  35%|███▍      | 24/69 [00:08<00:11,  3.78it/s][A
Training:  36%|███▌      | 25/69 [00:08<00:13,  3.16it/s][A
Training:  38%|███▊      | 26/69 [00:09<00:15,  2.78it/s][A
Training:  42%|████▏     | 29/69 [00:

Epoch: 5/59 - Loss: 3.8035 - Accuracy: 0.9316



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:01<00:13,  1.74s/it][A
 22%|██▏       | 2/9 [00:01<00:05,  1.19it/s][A
 33%|███▎      | 3/9 [00:02<00:03,  1.93it/s][A
 56%|█████▌    | 5/9 [00:03<00:02,  1.95it/s][A
 67%|██████▋   | 6/9 [00:03<00:01,  2.34it/s][A
 89%|████████▉ | 8/9 [00:03<00:00,  3.75it/s][A
100%|██████████| 9/9 [00:03<00:00,  2.36it/s][A
Epochs:   8%|▊         | 5/59 [02:16<24:18, 27.02s/it]

Val Loss: 3.6859 - Val Accuracy: 0.9317



Training:   0%|          | 0/69 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/69 [00:01<01:52,  1.66s/it][A
Training:   4%|▍         | 3/69 [00:01<00:31,  2.08it/s][A
Training:   7%|▋         | 5/69 [00:02<00:31,  2.06it/s][A
Training:   9%|▊         | 6/69 [00:02<00:25,  2.47it/s][A
Training:  13%|█▎        | 9/69 [00:04<00:23,  2.54it/s][A
Training:  14%|█▍        | 10/69 [00:04<00:20,  2.90it/s][A
Training:  17%|█▋        | 12/69 [00:04<00:14,  4.06it/s][A
Training:  19%|█▉        | 13/69 [00:05<00:20,  2.74it/s][A
Training:  20%|██        | 14/69 [00:05<00:20,  2.65it/s][A
Training:  22%|██▏       | 15/69 [00:05<00:16,  3.20it/s][A
Training:  25%|██▍       | 17/69 [00:06<00:14,  3.67it/s][A
Training:  26%|██▌       | 18/69 [00:07<00:21,  2.39it/s][A
Training:  29%|██▉       | 20/69 [00:07<00:14,  3.50it/s][A
Training:  32%|███▏      | 22/69 [00:08<00:18,  2.53it/s][A
Training:  35%|███▍      | 24/69 [00:08<00:12,  3.48it/s][A
Training:  36%|███▌      | 25/69 [00:

Epoch: 6/59 - Loss: 3.5628 - Accuracy: 0.9367



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:01<00:13,  1.71s/it][A
 33%|███▎      | 3/9 [00:01<00:02,  2.04it/s][A
 56%|█████▌    | 5/9 [00:03<00:02,  1.77it/s][A
100%|██████████| 9/9 [00:03<00:00,  2.35it/s][A
Epochs:  10%|█         | 6/59 [02:42<23:44, 26.87s/it]

Val Loss: 3.8169 - Val Accuracy: 0.9301



Training:   0%|          | 0/69 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/69 [00:01<02:01,  1.79s/it][A
Training:   6%|▌         | 4/69 [00:01<00:24,  2.69it/s][A
Training:   9%|▊         | 6/69 [00:03<00:29,  2.13it/s][A
Training:  13%|█▎        | 9/69 [00:04<00:27,  2.21it/s][A
Training:  16%|█▌        | 11/69 [00:04<00:19,  2.98it/s][A
Training:  19%|█▉        | 13/69 [00:05<00:22,  2.49it/s][A
Training:  20%|██        | 14/69 [00:05<00:19,  2.87it/s][A
Training:  23%|██▎       | 16/69 [00:05<00:13,  3.80it/s][A
Training:  25%|██▍       | 17/69 [00:06<00:19,  2.68it/s][A
Training:  29%|██▉       | 20/69 [00:07<00:12,  3.83it/s][A
Training:  30%|███       | 21/69 [00:08<00:19,  2.42it/s][A
Training:  32%|███▏      | 22/69 [00:08<00:16,  2.81it/s][A
Training:  35%|███▍      | 24/69 [00:08<00:12,  3.68it/s][A
Training:  36%|███▌      | 25/69 [00:09<00:17,  2.53it/s][A
Training:  39%|███▉      | 27/69 [00:09<00:11,  3.70it/s][A
Training:  41%|████      | 28/69 [00

Epoch: 7/59 - Loss: 3.5527 - Accuracy: 0.9340



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:01<00:13,  1.68s/it][A
 33%|███▎      | 3/9 [00:01<00:03,  1.99it/s][A
 56%|█████▌    | 5/9 [00:03<00:02,  1.75it/s][A
100%|██████████| 9/9 [00:03<00:00,  2.28it/s][A
Epochs:  12%|█▏        | 7/59 [03:10<23:33, 27.18s/it]

Val Loss: 4.0611 - Val Accuracy: 0.9356



Training:   0%|          | 0/69 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/69 [00:01<01:47,  1.58s/it][A
Training:   4%|▍         | 3/69 [00:01<00:30,  2.18it/s][A
Training:   7%|▋         | 5/69 [00:02<00:33,  1.89it/s][A
Training:  12%|█▏        | 8/69 [00:03<00:16,  3.65it/s][A
Training:  14%|█▍        | 10/69 [00:04<00:24,  2.44it/s][A
Training:  19%|█▉        | 13/69 [00:05<00:21,  2.60it/s][A
Training:  20%|██        | 14/69 [00:05<00:18,  2.93it/s][A
Training:  23%|██▎       | 16/69 [00:05<00:13,  4.02it/s][A
Training:  26%|██▌       | 18/69 [00:06<00:18,  2.79it/s][A
Training:  29%|██▉       | 20/69 [00:07<00:13,  3.64it/s][A
Training:  30%|███       | 21/69 [00:07<00:18,  2.60it/s][A
Training:  32%|███▏      | 22/69 [00:08<00:17,  2.76it/s][A
Training:  35%|███▍      | 24/69 [00:08<00:12,  3.66it/s][A
Training:  36%|███▌      | 25/69 [00:09<00:17,  2.55it/s][A
Training:  38%|███▊      | 26/69 [00:09<00:16,  2.62it/s][A
Training:  41%|████      | 28/69 [00

Epoch: 8/59 - Loss: 3.5649 - Accuracy: 0.9345



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:01<00:15,  1.91s/it][A
 33%|███▎      | 3/9 [00:02<00:03,  1.86it/s][A
 56%|█████▌    | 5/9 [00:03<00:02,  1.67it/s][A
100%|██████████| 9/9 [00:04<00:00,  2.11it/s][A
Epochs:  14%|█▎        | 8/59 [03:38<23:21, 27.47s/it]

Val Loss: 4.2020 - Val Accuracy: 0.9215



Training:   0%|          | 0/69 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/69 [00:01<01:52,  1.65s/it][A
Training:   6%|▌         | 4/69 [00:01<00:22,  2.91it/s][A
Training:   9%|▊         | 6/69 [00:03<00:31,  2.03it/s][A
Training:  12%|█▏        | 8/69 [00:03<00:20,  2.98it/s][A
Training:  14%|█▍        | 10/69 [00:04<00:24,  2.44it/s][A
Training:  17%|█▋        | 12/69 [00:04<00:17,  3.30it/s][A
Training:  19%|█▉        | 13/69 [00:05<00:23,  2.37it/s][A
Training:  25%|██▍       | 17/69 [00:06<00:17,  3.02it/s][A
Training:  26%|██▌       | 18/69 [00:06<00:15,  3.28it/s][A
Training:  29%|██▉       | 20/69 [00:06<00:11,  4.37it/s][A
Training:  30%|███       | 21/69 [00:07<00:17,  2.79it/s][A
Training:  32%|███▏      | 22/69 [00:08<00:16,  2.85it/s][A
Training:  35%|███▍      | 24/69 [00:08<00:10,  4.12it/s][A
Training:  36%|███▌      | 25/69 [00:08<00:15,  2.91it/s][A
Training:  38%|███▊      | 26/69 [00:09<00:14,  3.00it/s][A
Training:  42%|████▏     | 29/69 [00

Epoch: 9/59 - Loss: 3.4284 - Accuracy: 0.9323



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:01<00:14,  1.80s/it][A
 22%|██▏       | 2/9 [00:01<00:05,  1.24it/s][A
 56%|█████▌    | 5/9 [00:03<00:02,  1.89it/s][A
100%|██████████| 9/9 [00:03<00:00,  2.30it/s][A
Epochs:  15%|█▌        | 9/59 [04:06<22:55, 27.52s/it]

Val Loss: 4.2487 - Val Accuracy: 0.9301



Training:   0%|          | 0/69 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/69 [00:01<02:02,  1.80s/it][A
Training:   3%|▎         | 2/69 [00:01<00:54,  1.23it/s][A
Training:   6%|▌         | 4/69 [00:02<00:21,  2.97it/s][A
Training:   9%|▊         | 6/69 [00:03<00:27,  2.32it/s][A
Training:  10%|█         | 7/69 [00:03<00:21,  2.85it/s][A
Training:  13%|█▎        | 9/69 [00:04<00:26,  2.30it/s][A
Training:  16%|█▌        | 11/69 [00:04<00:17,  3.28it/s][A
Training:  19%|█▉        | 13/69 [00:05<00:23,  2.36it/s][A
Training:  25%|██▍       | 17/69 [00:07<00:19,  2.73it/s][A
Training:  28%|██▊       | 19/69 [00:07<00:14,  3.48it/s][A
Training:  30%|███       | 21/69 [00:08<00:19,  2.50it/s][A
Training:  33%|███▎      | 23/69 [00:08<00:14,  3.24it/s][A
Training:  36%|███▌      | 25/69 [00:09<00:17,  2.56it/s][A
Training:  41%|████      | 28/69 [00:10<00:10,  3.88it/s][A
Training:  43%|████▎     | 30/69 [00:11<00:13,  2.88it/s][A
Training:  46%|████▋     | 32/69 [00:1

Epoch: 10/59 - Loss: 3.5231 - Accuracy: 0.9302



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:01<00:14,  1.86s/it][A
 33%|███▎      | 3/9 [00:02<00:03,  1.86it/s][A
 56%|█████▌    | 5/9 [00:03<00:02,  1.81it/s][A
 78%|███████▊  | 7/9 [00:03<00:00,  2.82it/s][A
100%|██████████| 9/9 [00:03<00:00,  2.25it/s][A
Epochs:  17%|█▋        | 10/59 [04:34<22:42, 27.80s/it]

Val Loss: 3.5769 - Val Accuracy: 0.9293



Training:   0%|          | 0/69 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/69 [00:01<02:09,  1.90s/it][A
Training:   6%|▌         | 4/69 [00:02<00:25,  2.57it/s][A
Training:   9%|▊         | 6/69 [00:03<00:31,  1.99it/s][A
Training:  12%|█▏        | 8/69 [00:03<00:20,  3.02it/s][A
Training:  14%|█▍        | 10/69 [00:04<00:26,  2.25it/s][A
Training:  19%|█▉        | 13/69 [00:05<00:23,  2.39it/s][A
Training:  23%|██▎       | 16/69 [00:06<00:14,  3.62it/s][A
Training:  26%|██▌       | 18/69 [00:07<00:19,  2.56it/s][A
Training:  29%|██▉       | 20/69 [00:07<00:14,  3.31it/s][A
Training:  32%|███▏      | 22/69 [00:08<00:17,  2.64it/s][A
Training:  36%|███▌      | 25/69 [00:09<00:15,  2.89it/s][A
Training:  38%|███▊      | 26/69 [00:09<00:14,  2.99it/s][A
Training:  41%|████      | 28/69 [00:10<00:10,  3.85it/s][A
Training:  42%|████▏     | 29/69 [00:10<00:15,  2.67it/s][A
Training:  43%|████▎     | 30/69 [00:11<00:14,  2.67it/s][A
Training:  46%|████▋     | 32/69 [00

Epoch: 11/59 - Loss: 3.3004 - Accuracy: 0.9316



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:01<00:11,  1.50s/it][A
 33%|███▎      | 3/9 [00:01<00:02,  2.31it/s][A
 56%|█████▌    | 5/9 [00:02<00:02,  1.87it/s][A
 78%|███████▊  | 7/9 [00:03<00:00,  2.92it/s][A
100%|██████████| 9/9 [00:03<00:00,  2.39it/s][A
Epochs:  19%|█▊        | 11/59 [05:02<22:19, 27.91s/it]

Val Loss: 3.5032 - Val Accuracy: 0.9356



Training:   0%|          | 0/69 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/69 [00:01<01:35,  1.41s/it][A
Training:   4%|▍         | 3/69 [00:01<00:27,  2.37it/s][A
Training:   7%|▋         | 5/69 [00:02<00:31,  2.02it/s][A
Training:   9%|▊         | 6/69 [00:02<00:24,  2.55it/s][A
Training:  10%|█         | 7/69 [00:03<00:21,  2.82it/s][A
Training:  13%|█▎        | 9/69 [00:03<00:23,  2.58it/s][A
Training:  16%|█▌        | 11/69 [00:04<00:16,  3.53it/s][A
Training:  19%|█▉        | 13/69 [00:05<00:21,  2.64it/s][A
Training:  20%|██        | 14/69 [00:05<00:18,  2.98it/s][A
Training:  22%|██▏       | 15/69 [00:05<00:16,  3.34it/s][A
Training:  25%|██▍       | 17/69 [00:06<00:20,  2.55it/s][A
Training:  26%|██▌       | 18/69 [00:06<00:17,  2.90it/s][A
Training:  30%|███       | 21/69 [00:07<00:16,  2.85it/s][A
Training:  32%|███▏      | 22/69 [00:08<00:15,  3.11it/s][A
Training:  35%|███▍      | 24/69 [00:08<00:10,  4.23it/s][A
Training:  36%|███▌      | 25/69 [00:0

Epoch: 12/59 - Loss: 3.1570 - Accuracy: 0.9399



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:01<00:12,  1.59s/it][A
 33%|███▎      | 3/9 [00:01<00:02,  2.19it/s][A
 56%|█████▌    | 5/9 [00:02<00:02,  1.99it/s][A
100%|██████████| 9/9 [00:03<00:00,  2.58it/s][A
Epochs:  20%|██        | 12/59 [05:29<21:39, 27.66s/it]

Val Loss: 3.8910 - Val Accuracy: 0.9379



Training:   0%|          | 0/69 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/69 [00:01<01:33,  1.37s/it][A
Training:   4%|▍         | 3/69 [00:01<00:26,  2.50it/s][A
Training:   7%|▋         | 5/69 [00:02<00:31,  2.06it/s][A
Training:  10%|█         | 7/69 [00:02<00:20,  3.07it/s][A
Training:  13%|█▎        | 9/69 [00:03<00:24,  2.43it/s][A
Training:  16%|█▌        | 11/69 [00:04<00:17,  3.38it/s][A
Training:  17%|█▋        | 12/69 [00:04<00:15,  3.73it/s][A
Training:  19%|█▉        | 13/69 [00:05<00:27,  2.03it/s][A
Training:  20%|██        | 14/69 [00:05<00:21,  2.51it/s][A
Training:  23%|██▎       | 16/69 [00:05<00:13,  3.80it/s][A
Training:  25%|██▍       | 17/69 [00:06<00:23,  2.17it/s][A
Training:  29%|██▉       | 20/69 [00:07<00:12,  3.93it/s][A
Training:  32%|███▏      | 22/69 [00:08<00:18,  2.53it/s][A
Training:  36%|███▌      | 25/69 [00:09<00:17,  2.57it/s][A
Training:  38%|███▊      | 26/69 [00:09<00:14,  2.91it/s][A
Training:  41%|████      | 28/69 [00:

Epoch: 13/59 - Loss: 5.6108 - Accuracy: 0.9207



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:01<00:12,  1.56s/it][A
 56%|█████▌    | 5/9 [00:02<00:02,  1.97it/s][A
100%|██████████| 9/9 [00:03<00:00,  2.54it/s][A
Epochs:  22%|██▏       | 13/59 [05:57<21:16, 27.75s/it]

Val Loss: 7.9450 - Val Accuracy: 0.9136



Training:   0%|          | 0/69 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/69 [00:01<01:45,  1.55s/it][A
Training:   3%|▎         | 2/69 [00:01<00:47,  1.42it/s][A
Training:   6%|▌         | 4/69 [00:01<00:19,  3.27it/s][A
Training:   7%|▋         | 5/69 [00:02<00:29,  2.16it/s][A
Training:   9%|▊         | 6/69 [00:02<00:25,  2.46it/s][A
Training:  12%|█▏        | 8/69 [00:03<00:15,  4.00it/s][A
Training:  13%|█▎        | 9/69 [00:04<00:26,  2.27it/s][A
Training:  14%|█▍        | 10/69 [00:04<00:21,  2.68it/s][A
Training:  16%|█▌        | 11/69 [00:04<00:17,  3.26it/s][A
Training:  19%|█▉        | 13/69 [00:05<00:23,  2.34it/s][A
Training:  20%|██        | 14/69 [00:05<00:19,  2.81it/s][A
Training:  23%|██▎       | 16/69 [00:05<00:13,  3.96it/s][A
Training:  25%|██▍       | 17/69 [00:06<00:20,  2.56it/s][A
Training:  26%|██▌       | 18/69 [00:06<00:18,  2.78it/s][A
Training:  29%|██▉       | 20/69 [00:07<00:14,  3.48it/s][A
Training:  30%|███       | 21/69 [00:07

Epoch: 14/59 - Loss: 3.9280 - Accuracy: 0.9200



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:01<00:12,  1.62s/it][A
 33%|███▎      | 3/9 [00:01<00:02,  2.18it/s][A
 56%|█████▌    | 5/9 [00:02<00:02,  1.83it/s][A
100%|██████████| 9/9 [00:03<00:00,  2.31it/s][A
Epochs:  24%|██▎       | 14/59 [06:25<20:49, 27.78s/it]

Val Loss: 3.3150 - Val Accuracy: 0.9301



Training:   0%|          | 0/69 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/69 [00:01<01:39,  1.47s/it][A
Training:   3%|▎         | 2/69 [00:01<00:44,  1.50it/s][A
Training:   7%|▋         | 5/69 [00:02<00:31,  2.05it/s][A
Training:   9%|▊         | 6/69 [00:02<00:24,  2.56it/s][A
Training:  10%|█         | 7/69 [00:03<00:19,  3.17it/s][A
Training:  13%|█▎        | 9/69 [00:04<00:26,  2.26it/s][A
Training:  16%|█▌        | 11/69 [00:04<00:17,  3.34it/s][A
Training:  19%|█▉        | 13/69 [00:05<00:21,  2.67it/s][A
Training:  22%|██▏       | 15/69 [00:05<00:15,  3.58it/s][A
Training:  25%|██▍       | 17/69 [00:06<00:19,  2.61it/s][A
Training:  28%|██▊       | 19/69 [00:06<00:14,  3.45it/s][A
Training:  30%|███       | 21/69 [00:08<00:18,  2.63it/s][A
Training:  33%|███▎      | 23/69 [00:08<00:13,  3.45it/s][A
Training:  36%|███▌      | 25/69 [00:09<00:16,  2.72it/s][A
Training:  39%|███▉      | 27/69 [00:09<00:11,  3.66it/s][A
Training:  42%|████▏     | 29/69 [00:1

Epoch: 15/59 - Loss: 3.0437 - Accuracy: 0.9340



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:01<00:13,  1.64s/it][A
 33%|███▎      | 3/9 [00:01<00:02,  2.09it/s][A
 56%|█████▌    | 5/9 [00:02<00:01,  2.05it/s][A
 67%|██████▋   | 6/9 [00:02<00:01,  2.58it/s][A
100%|██████████| 9/9 [00:03<00:00,  2.55it/s][A
Epochs:  25%|██▌       | 15/59 [06:53<20:23, 27.80s/it]

Val Loss: 3.8521 - Val Accuracy: 0.9357



Training:   0%|          | 0/69 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/69 [00:01<02:03,  1.82s/it][A
Training:   4%|▍         | 3/69 [00:01<00:35,  1.87it/s][A
Training:   7%|▋         | 5/69 [00:03<00:35,  1.81it/s][A
Training:  10%|█         | 7/69 [00:03<00:21,  2.84it/s][A
Training:  13%|█▎        | 9/69 [00:04<00:26,  2.23it/s][A
Training:  16%|█▌        | 11/69 [00:04<00:18,  3.16it/s][A
Training:  19%|█▉        | 13/69 [00:05<00:22,  2.52it/s][A
Training:  20%|██        | 14/69 [00:06<00:20,  2.70it/s][A
Training:  23%|██▎       | 16/69 [00:06<00:14,  3.76it/s][A
Training:  25%|██▍       | 17/69 [00:07<00:21,  2.45it/s][A
Training:  26%|██▌       | 18/69 [00:07<00:18,  2.72it/s][A
Training:  30%|███       | 21/69 [00:08<00:18,  2.64it/s][A
Training:  32%|███▏      | 22/69 [00:08<00:15,  3.06it/s][A
Training:  35%|███▍      | 24/69 [00:08<00:10,  4.19it/s][A
Training:  36%|███▌      | 25/69 [00:09<00:18,  2.34it/s][A
Training:  39%|███▉      | 27/69 [00:

Epoch: 16/59 - Loss: 7.3930 - Accuracy: 0.9207



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:01<00:11,  1.46s/it][A
 44%|████▍     | 4/9 [00:01<00:01,  3.01it/s][A
 56%|█████▌    | 5/9 [00:02<00:02,  1.73it/s][A
100%|██████████| 9/9 [00:03<00:00,  2.49it/s][A
Epochs:  27%|██▋       | 16/59 [07:21<19:55, 27.81s/it]

Val Loss: 13.3956 - Val Accuracy: 0.8974



Training:   0%|          | 0/69 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/69 [00:01<01:55,  1.70s/it][A
Training:   4%|▍         | 3/69 [00:01<00:31,  2.09it/s][A
Training:   7%|▋         | 5/69 [00:02<00:33,  1.92it/s][A
Training:  12%|█▏        | 8/69 [00:03<00:16,  3.76it/s][A
Training:  14%|█▍        | 10/69 [00:04<00:25,  2.33it/s][A
Training:  17%|█▋        | 12/69 [00:04<00:17,  3.17it/s][A
Training:  20%|██        | 14/69 [00:05<00:22,  2.49it/s][A
Training:  25%|██▍       | 17/69 [00:07<00:21,  2.47it/s][A
Training:  29%|██▉       | 20/69 [00:07<00:13,  3.65it/s][A
Training:  32%|███▏      | 22/69 [00:08<00:17,  2.61it/s][A
Training:  35%|███▍      | 24/69 [00:08<00:13,  3.36it/s][A
Training:  38%|███▊      | 26/69 [00:09<00:16,  2.61it/s][A
Training:  39%|███▉      | 27/69 [00:10<00:14,  2.92it/s][A
Training:  42%|████▏     | 29/69 [00:11<00:16,  2.49it/s][A
Training:  46%|████▋     | 32/69 [00:11<00:09,  3.89it/s][A
Training:  49%|████▉     | 34/69 [00

Epoch: 17/59 - Loss: 4.7126 - Accuracy: 0.9174



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:01<00:12,  1.53s/it][A
 44%|████▍     | 4/9 [00:01<00:01,  3.11it/s][A
 67%|██████▋   | 6/9 [00:03<00:01,  2.00it/s][A
100%|██████████| 9/9 [00:03<00:00,  2.30it/s][A
Epochs:  29%|██▉       | 17/59 [07:49<19:32, 27.92s/it]

Val Loss: 3.3710 - Val Accuracy: 0.8883



Training:   0%|          | 0/69 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/69 [00:01<01:49,  1.61s/it][A
Training:   4%|▍         | 3/69 [00:01<00:31,  2.10it/s][A
Training:   6%|▌         | 4/69 [00:01<00:22,  2.89it/s][A
Training:   7%|▋         | 5/69 [00:02<00:38,  1.66it/s][A
Training:   9%|▊         | 6/69 [00:03<00:28,  2.22it/s][A
Training:  12%|█▏        | 8/69 [00:03<00:15,  3.84it/s][A
Training:  14%|█▍        | 10/69 [00:04<00:25,  2.33it/s][A
Training:  17%|█▋        | 12/69 [00:04<00:16,  3.36it/s][A
Training:  19%|█▉        | 13/69 [00:05<00:25,  2.17it/s][A
Training:  22%|██▏       | 15/69 [00:05<00:16,  3.19it/s][A
Training:  25%|██▍       | 17/69 [00:07<00:21,  2.42it/s][A
Training:  26%|██▌       | 18/69 [00:07<00:17,  2.85it/s][A
Training:  29%|██▉       | 20/69 [00:07<00:12,  3.95it/s][A
Training:  30%|███       | 21/69 [00:08<00:21,  2.25it/s][A
Training:  33%|███▎      | 23/69 [00:08<00:14,  3.24it/s][A
Training:  36%|███▌      | 25/69 [00:0

Epoch: 18/59 - Loss: 3.0515 - Accuracy: 0.9308



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:01<00:14,  1.86s/it][A
 33%|███▎      | 3/9 [00:01<00:03,  1.89it/s][A
 56%|█████▌    | 5/9 [00:03<00:02,  1.77it/s][A
100%|██████████| 9/9 [00:03<00:00,  2.35it/s][A
Epochs:  31%|███       | 18/59 [08:17<19:04, 27.92s/it]

Val Loss: 3.9018 - Val Accuracy: 0.9290



Training:   0%|          | 0/69 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/69 [00:01<02:06,  1.85s/it][A
Training:   3%|▎         | 2/69 [00:01<00:55,  1.21it/s][A
Training:   6%|▌         | 4/69 [00:02<00:23,  2.81it/s][A
Training:   7%|▋         | 5/69 [00:03<00:38,  1.66it/s][A
Training:  10%|█         | 7/69 [00:03<00:21,  2.91it/s][A
Training:  13%|█▎        | 9/69 [00:04<00:26,  2.26it/s][A
Training:  16%|█▌        | 11/69 [00:04<00:17,  3.27it/s][A
Training:  19%|█▉        | 13/69 [00:05<00:22,  2.46it/s][A
Training:  20%|██        | 14/69 [00:05<00:19,  2.89it/s][A
Training:  22%|██▏       | 15/69 [00:06<00:15,  3.38it/s][A
Training:  25%|██▍       | 17/69 [00:07<00:19,  2.62it/s][A
Training:  26%|██▌       | 18/69 [00:07<00:16,  3.06it/s][A
Training:  29%|██▉       | 20/69 [00:07<00:11,  4.30it/s][A
Training:  30%|███       | 21/69 [00:08<00:20,  2.32it/s][A
Training:  33%|███▎      | 23/69 [00:08<00:13,  3.36it/s][A
Training:  35%|███▍      | 24/69 [00:0

Epoch: 19/59 - Loss: 2.9994 - Accuracy: 0.9338



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:01<00:12,  1.52s/it][A
 22%|██▏       | 2/9 [00:01<00:05,  1.33it/s][A
 56%|█████▌    | 5/9 [00:02<00:01,  2.09it/s][A
 67%|██████▋   | 6/9 [00:03<00:01,  2.28it/s][A
100%|██████████| 9/9 [00:03<00:00,  2.52it/s][A
Epochs:  32%|███▏      | 19/59 [08:45<18:39, 27.98s/it]

Val Loss: 4.0149 - Val Accuracy: 0.9414



Training:   0%|          | 0/69 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/69 [00:01<01:44,  1.54s/it][A
Training:   3%|▎         | 2/69 [00:01<00:54,  1.24it/s][A
Training:   6%|▌         | 4/69 [00:01<00:22,  2.92it/s][A
Training:   7%|▋         | 5/69 [00:03<00:35,  1.79it/s][A
Training:   9%|▊         | 6/69 [00:03<00:30,  2.09it/s][A
Training:  13%|█▎        | 9/69 [00:04<00:25,  2.35it/s][A
Training:  16%|█▌        | 11/69 [00:04<00:17,  3.30it/s][A
Training:  19%|█▉        | 13/69 [00:05<00:21,  2.55it/s][A
Training:  22%|██▏       | 15/69 [00:05<00:15,  3.47it/s][A
Training:  23%|██▎       | 16/69 [00:06<00:13,  3.93it/s][A
Training:  25%|██▍       | 17/69 [00:07<00:23,  2.23it/s][A
Training:  28%|██▊       | 19/69 [00:07<00:15,  3.30it/s][A
Training:  30%|███       | 21/69 [00:08<00:18,  2.59it/s][A
Training:  35%|███▍      | 24/69 [00:08<00:10,  4.24it/s][A
Training:  38%|███▊      | 26/69 [00:09<00:12,  3.35it/s][A
Training:  41%|████      | 28/69 [00:0

Epoch: 20/59 - Loss: 5.9875 - Accuracy: 0.9156



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:01<00:11,  1.50s/it][A
 33%|███▎      | 3/9 [00:01<00:02,  2.27it/s][A
 44%|████▍     | 4/9 [00:01<00:01,  2.85it/s][A
 56%|█████▌    | 5/9 [00:03<00:02,  1.60it/s][A
 78%|███████▊  | 7/9 [00:03<00:00,  2.87it/s][A
100%|██████████| 9/9 [00:03<00:00,  2.45it/s][A
Epochs:  34%|███▍      | 20/59 [09:12<17:59, 27.67s/it]

Val Loss: 3.6737 - Val Accuracy: 0.9215



Training:   0%|          | 0/69 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/69 [00:01<01:53,  1.67s/it][A
Training:   3%|▎         | 2/69 [00:01<00:51,  1.31it/s][A
Training:   6%|▌         | 4/69 [00:01<00:21,  2.98it/s][A
Training:   7%|▋         | 5/69 [00:03<00:39,  1.62it/s][A
Training:  12%|█▏        | 8/69 [00:03<00:17,  3.40it/s][A
Training:  14%|█▍        | 10/69 [00:04<00:23,  2.54it/s][A
Training:  17%|█▋        | 12/69 [00:04<00:16,  3.53it/s][A
Training:  19%|█▉        | 13/69 [00:05<00:26,  2.15it/s][A
Training:  22%|██▏       | 15/69 [00:05<00:17,  3.12it/s][A
Training:  25%|██▍       | 17/69 [00:07<00:20,  2.50it/s][A
Training:  26%|██▌       | 18/69 [00:07<00:17,  2.87it/s][A
Training:  28%|██▊       | 19/69 [00:07<00:14,  3.39it/s][A
Training:  30%|███       | 21/69 [00:08<00:18,  2.64it/s][A
Training:  32%|███▏      | 22/69 [00:08<00:18,  2.49it/s][A
Training:  35%|███▍      | 24/69 [00:08<00:12,  3.65it/s][A
Training:  36%|███▌      | 25/69 [00:

Epoch: 21/59 - Loss: 3.2033 - Accuracy: 0.9280



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:01<00:14,  1.87s/it][A
 44%|████▍     | 4/9 [00:02<00:01,  2.54it/s][A
 67%|██████▋   | 6/9 [00:03<00:01,  2.23it/s][A
100%|██████████| 9/9 [00:03<00:00,  2.40it/s][A
Epochs:  36%|███▌      | 21/59 [09:40<17:33, 27.72s/it]

Val Loss: 3.9480 - Val Accuracy: 0.9021



Training:   0%|          | 0/69 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/69 [00:01<02:12,  1.95s/it][A
Training:   4%|▍         | 3/69 [00:02<00:35,  1.84it/s][A
Training:   7%|▋         | 5/69 [00:03<00:37,  1.69it/s][A
Training:  10%|█         | 7/69 [00:03<00:23,  2.65it/s][A
Training:  13%|█▎        | 9/69 [00:04<00:29,  2.04it/s][A
Training:  16%|█▌        | 11/69 [00:04<00:19,  2.96it/s][A
Training:  19%|█▉        | 13/69 [00:06<00:24,  2.25it/s][A
Training:  20%|██        | 14/69 [00:06<00:20,  2.64it/s][A
Training:  23%|██▎       | 16/69 [00:06<00:14,  3.66it/s][A
Training:  25%|██▍       | 17/69 [00:07<00:21,  2.42it/s][A
Training:  28%|██▊       | 19/69 [00:07<00:14,  3.49it/s][A
Training:  30%|███       | 21/69 [00:09<00:21,  2.23it/s][A
Training:  33%|███▎      | 23/69 [00:09<00:14,  3.15it/s][A
Training:  36%|███▌      | 25/69 [00:10<00:17,  2.46it/s][A
Training:  38%|███▊      | 26/69 [00:10<00:15,  2.85it/s][A
Training:  39%|███▉      | 27/69 [00:

Epoch: 22/59 - Loss: 2.9203 - Accuracy: 0.9312



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:01<00:13,  1.65s/it][A
 33%|███▎      | 3/9 [00:01<00:02,  2.03it/s][A
 56%|█████▌    | 5/9 [00:03<00:02,  1.75it/s][A
100%|██████████| 9/9 [00:03<00:00,  2.38it/s][A
Epochs:  37%|███▋      | 22/59 [10:08<17:10, 27.84s/it]

Val Loss: 3.4453 - Val Accuracy: 0.9208



Training:   0%|          | 0/69 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/69 [00:01<02:01,  1.79s/it][A
Training:   3%|▎         | 2/69 [00:01<00:53,  1.24it/s][A
Training:   4%|▍         | 3/69 [00:02<00:32,  2.01it/s][A
Training:   7%|▋         | 5/69 [00:03<00:34,  1.85it/s][A
Training:  10%|█         | 7/69 [00:03<00:20,  3.00it/s][A
Training:  13%|█▎        | 9/69 [00:04<00:28,  2.12it/s][A
Training:  16%|█▌        | 11/69 [00:04<00:18,  3.11it/s][A
Training:  19%|█▉        | 13/69 [00:05<00:21,  2.61it/s][A
Training:  22%|██▏       | 15/69 [00:05<00:15,  3.58it/s][A
Training:  25%|██▍       | 17/69 [00:07<00:19,  2.68it/s][A
Training:  28%|██▊       | 19/69 [00:07<00:13,  3.58it/s][A
Training:  30%|███       | 21/69 [00:08<00:18,  2.54it/s][A
Training:  35%|███▍      | 24/69 [00:08<00:11,  3.85it/s][A
Training:  38%|███▊      | 26/69 [00:09<00:15,  2.84it/s][A
Training:  41%|████      | 28/69 [00:10<00:11,  3.65it/s][A
Training:  42%|████▏     | 29/69 [00:1

Epoch: 23/59 - Loss: 2.9472 - Accuracy: 0.9259



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:01<00:13,  1.72s/it][A
 44%|████▍     | 4/9 [00:01<00:01,  2.81it/s][A
 67%|██████▋   | 6/9 [00:03<00:01,  2.15it/s][A
100%|██████████| 9/9 [00:03<00:00,  2.37it/s][A
Epochs:  39%|███▉      | 23/59 [10:35<16:34, 27.63s/it]

Val Loss: 3.7917 - Val Accuracy: 0.9241



Training:   0%|          | 0/69 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/69 [00:01<01:57,  1.73s/it][A
Training:   3%|▎         | 2/69 [00:01<00:52,  1.27it/s][A
Training:   6%|▌         | 4/69 [00:02<00:22,  2.92it/s][A
Training:   7%|▋         | 5/69 [00:03<00:39,  1.63it/s][A
Training:  10%|█         | 7/69 [00:03<00:22,  2.71it/s][A
Training:  13%|█▎        | 9/69 [00:04<00:28,  2.14it/s][A
Training:  16%|█▌        | 11/69 [00:04<00:19,  3.03it/s][A
Training:  19%|█▉        | 13/69 [00:06<00:23,  2.37it/s][A
Training:  22%|██▏       | 15/69 [00:06<00:16,  3.23it/s][A
Training:  25%|██▍       | 17/69 [00:07<00:19,  2.68it/s][A
Training:  29%|██▉       | 20/69 [00:07<00:11,  4.20it/s][A
Training:  32%|███▏      | 22/69 [00:08<00:15,  2.99it/s][A
Training:  35%|███▍      | 24/69 [00:08<00:11,  3.85it/s][A
Training:  38%|███▊      | 26/69 [00:10<00:16,  2.62it/s][A
Training:  39%|███▉      | 27/69 [00:10<00:14,  2.98it/s][A
Training:  42%|████▏     | 29/69 [00:1

Epoch: 24/59 - Loss: 2.7152 - Accuracy: 0.9398



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:01<00:14,  1.80s/it][A
 33%|███▎      | 3/9 [00:01<00:03,  1.96it/s][A
 56%|█████▌    | 5/9 [00:02<00:01,  2.07it/s][A
 67%|██████▋   | 6/9 [00:02<00:01,  2.52it/s][A
 89%|████████▉ | 8/9 [00:03<00:00,  3.79it/s][A
100%|██████████| 9/9 [00:03<00:00,  2.50it/s][A
Epochs:  41%|████      | 24/59 [11:02<16:03, 27.53s/it]

Val Loss: 3.4572 - Val Accuracy: 0.9264



Training:   0%|          | 0/69 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/69 [00:01<02:03,  1.81s/it][A
Training:   6%|▌         | 4/69 [00:02<00:26,  2.41it/s][A
Training:   7%|▋         | 5/69 [00:03<00:37,  1.70it/s][A
Training:  12%|█▏        | 8/69 [00:03<00:20,  3.00it/s][A
Training:  13%|█▎        | 9/69 [00:04<00:27,  2.16it/s][A
Training:  16%|█▌        | 11/69 [00:04<00:18,  3.11it/s][A
Training:  17%|█▋        | 12/69 [00:04<00:16,  3.37it/s][A
Training:  19%|█▉        | 13/69 [00:05<00:26,  2.14it/s][A
Training:  22%|██▏       | 15/69 [00:06<00:16,  3.21it/s][A
Training:  23%|██▎       | 16/69 [00:06<00:14,  3.61it/s][A
Training:  25%|██▍       | 17/69 [00:07<00:22,  2.27it/s][A
Training:  26%|██▌       | 18/69 [00:07<00:18,  2.79it/s][A
Training:  29%|██▉       | 20/69 [00:07<00:11,  4.18it/s][A
Training:  30%|███       | 21/69 [00:08<00:21,  2.19it/s][A
Training:  33%|███▎      | 23/69 [00:08<00:14,  3.27it/s][A
Training:  36%|███▌      | 25/69 [00:

Epoch: 25/59 - Loss: 3.2434 - Accuracy: 0.9309



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:01<00:14,  1.81s/it][A
 33%|███▎      | 3/9 [00:01<00:03,  1.89it/s][A
 56%|█████▌    | 5/9 [00:03<00:02,  1.83it/s][A
100%|██████████| 9/9 [00:03<00:00,  2.31it/s][A
Epochs:  42%|████▏     | 25/59 [11:30<15:35, 27.52s/it]

Val Loss: 3.9384 - Val Accuracy: 0.9321



Training:   0%|          | 0/69 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/69 [00:01<02:04,  1.83s/it][A
Training:   4%|▍         | 3/69 [00:01<00:34,  1.92it/s][A
Training:   6%|▌         | 4/69 [00:02<00:24,  2.66it/s][A
Training:   7%|▋         | 5/69 [00:03<00:39,  1.61it/s][A
Training:   9%|▊         | 6/69 [00:03<00:28,  2.19it/s][A
Training:  12%|█▏        | 8/69 [00:03<00:16,  3.68it/s][A
Training:  13%|█▎        | 9/69 [00:04<00:29,  2.05it/s][A
Training:  16%|█▌        | 11/69 [00:04<00:18,  3.07it/s][A
Training:  19%|█▉        | 13/69 [00:05<00:23,  2.43it/s][A
Training:  22%|██▏       | 15/69 [00:06<00:15,  3.39it/s][A
Training:  23%|██▎       | 16/69 [00:06<00:13,  3.90it/s][A
Training:  25%|██▍       | 17/69 [00:07<00:22,  2.30it/s][A
Training:  28%|██▊       | 19/69 [00:07<00:15,  3.32it/s][A
Training:  30%|███       | 21/69 [00:08<00:19,  2.48it/s][A
Training:  33%|███▎      | 23/69 [00:08<00:14,  3.26it/s][A
Training:  36%|███▌      | 25/69 [00:09

Epoch: 26/59 - Loss: 3.3482 - Accuracy: 0.9283



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:02<00:16,  2.03s/it][A
 33%|███▎      | 3/9 [00:02<00:03,  1.76it/s][A
 56%|█████▌    | 5/9 [00:03<00:02,  1.82it/s][A
100%|██████████| 9/9 [00:03<00:00,  2.33it/s][A
Epochs:  44%|████▍     | 26/59 [11:57<15:09, 27.56s/it]

Val Loss: 5.7662 - Val Accuracy: 0.9399



Training:   0%|          | 0/69 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/69 [00:01<01:58,  1.75s/it][A
Training:   3%|▎         | 2/69 [00:01<00:52,  1.28it/s][A
Training:   4%|▍         | 3/69 [00:02<00:32,  2.02it/s][A
Training:   6%|▌         | 4/69 [00:02<00:22,  2.84it/s][A
Training:   7%|▋         | 5/69 [00:03<00:36,  1.75it/s][A
Training:  10%|█         | 7/69 [00:03<00:20,  2.98it/s][A
Training:  13%|█▎        | 9/69 [00:04<00:24,  2.43it/s][A
Training:  14%|█▍        | 10/69 [00:04<00:20,  2.91it/s][A
Training:  17%|█▋        | 12/69 [00:04<00:13,  4.35it/s][A
Training:  19%|█▉        | 13/69 [00:05<00:24,  2.33it/s][A
Training:  20%|██        | 14/69 [00:05<00:19,  2.77it/s][A
Training:  23%|██▎       | 16/69 [00:06<00:14,  3.78it/s][A
Training:  25%|██▍       | 17/69 [00:07<00:21,  2.43it/s][A
Training:  26%|██▌       | 18/69 [00:07<00:18,  2.73it/s][A
Training:  28%|██▊       | 19/69 [00:07<00:15,  3.33it/s][A
Training:  30%|███       | 21/69 [00:08

Epoch: 27/59 - Loss: 5.2136 - Accuracy: 0.9212



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:01<00:14,  1.85s/it][A
 22%|██▏       | 2/9 [00:01<00:05,  1.20it/s][A
 56%|█████▌    | 5/9 [00:02<00:01,  2.17it/s][A
 67%|██████▋   | 6/9 [00:03<00:01,  2.35it/s][A
 89%|████████▉ | 8/9 [00:03<00:00,  3.63it/s][A
100%|██████████| 9/9 [00:03<00:00,  2.40it/s][A
Epochs:  46%|████▌     | 27/59 [12:25<14:41, 27.55s/it]

Val Loss: 4.3481 - Val Accuracy: 0.9255



Training:   0%|          | 0/69 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/69 [00:01<01:39,  1.46s/it][A
Training:   7%|▋         | 5/69 [00:02<00:29,  2.15it/s][A
Training:  10%|█         | 7/69 [00:02<00:20,  3.02it/s][A
Training:  13%|█▎        | 9/69 [00:04<00:26,  2.28it/s][A
Training:  16%|█▌        | 11/69 [00:04<00:18,  3.14it/s][A
Training:  19%|█▉        | 13/69 [00:05<00:21,  2.58it/s][A
Training:  22%|██▏       | 15/69 [00:05<00:15,  3.48it/s][A
Training:  25%|██▍       | 17/69 [00:06<00:19,  2.66it/s][A
Training:  28%|██▊       | 19/69 [00:06<00:14,  3.53it/s][A
Training:  30%|███       | 21/69 [00:07<00:18,  2.66it/s][A
Training:  32%|███▏      | 22/69 [00:08<00:15,  3.05it/s][A
Training:  36%|███▌      | 25/69 [00:09<00:16,  2.70it/s][A
Training:  39%|███▉      | 27/69 [00:09<00:11,  3.53it/s][A
Training:  41%|████      | 28/69 [00:09<00:10,  3.97it/s][A
Training:  42%|████▏     | 29/69 [00:10<00:15,  2.60it/s][A
Training:  45%|████▍     | 31/69 [00

Epoch: 28/59 - Loss: 5.2680 - Accuracy: 0.9169



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:01<00:12,  1.61s/it][A
 33%|███▎      | 3/9 [00:01<00:02,  2.17it/s][A
 56%|█████▌    | 5/9 [00:02<00:01,  2.12it/s][A
 67%|██████▋   | 6/9 [00:02<00:01,  2.44it/s][A
100%|██████████| 9/9 [00:03<00:00,  2.60it/s][A
Epochs:  47%|████▋     | 28/59 [12:52<14:06, 27.31s/it]

Val Loss: 3.8387 - Val Accuracy: 0.9252



Training:   0%|          | 0/69 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/69 [00:01<02:04,  1.83s/it][A
Training:   3%|▎         | 2/69 [00:01<00:54,  1.22it/s][A
Training:   4%|▍         | 3/69 [00:02<00:32,  2.04it/s][A
Training:   7%|▋         | 5/69 [00:03<00:36,  1.75it/s][A
Training:  10%|█         | 7/69 [00:03<00:21,  2.86it/s][A
Training:  13%|█▎        | 9/69 [00:04<00:28,  2.13it/s][A
Training:  19%|█▉        | 13/69 [00:06<00:21,  2.61it/s][A
Training:  20%|██        | 14/69 [00:06<00:18,  2.93it/s][A
Training:  23%|██▎       | 16/69 [00:06<00:14,  3.78it/s][A
Training:  25%|██▍       | 17/69 [00:07<00:18,  2.76it/s][A
Training:  26%|██▌       | 18/69 [00:07<00:16,  3.10it/s][A
Training:  28%|██▊       | 19/69 [00:07<00:13,  3.62it/s][A
Training:  30%|███       | 21/69 [00:08<00:17,  2.73it/s][A
Training:  33%|███▎      | 23/69 [00:08<00:13,  3.33it/s][A
Training:  35%|███▍      | 24/69 [00:08<00:11,  3.84it/s][A
Training:  36%|███▌      | 25/69 [00:0

Epoch: 29/59 - Loss: 2.9099 - Accuracy: 0.9377



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:01<00:14,  1.80s/it][A
 56%|█████▌    | 5/9 [00:03<00:02,  1.86it/s][A
 67%|██████▋   | 6/9 [00:03<00:01,  2.20it/s][A
 89%|████████▉ | 8/9 [00:03<00:00,  3.30it/s][A
100%|██████████| 9/9 [00:03<00:00,  2.34it/s][A
Epochs:  49%|████▉     | 29/59 [13:20<13:47, 27.57s/it]

Val Loss: 3.1461 - Val Accuracy: 0.9336



Training:   0%|          | 0/69 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/69 [00:01<01:49,  1.60s/it][A
Training:   4%|▍         | 3/69 [00:01<00:36,  1.82it/s][A
Training:   7%|▋         | 5/69 [00:03<00:34,  1.88it/s][A
Training:   9%|▊         | 6/69 [00:03<00:27,  2.33it/s][A
Training:  10%|█         | 7/69 [00:03<00:21,  2.84it/s][A
Training:  13%|█▎        | 9/69 [00:04<00:25,  2.37it/s][A
Training:  14%|█▍        | 10/69 [00:04<00:20,  2.85it/s][A
Training:  16%|█▌        | 11/69 [00:04<00:18,  3.11it/s][A
Training:  19%|█▉        | 13/69 [00:05<00:22,  2.46it/s][A
Training:  22%|██▏       | 15/69 [00:06<00:16,  3.28it/s][A
Training:  25%|██▍       | 17/69 [00:06<00:18,  2.83it/s][A
Training:  26%|██▌       | 18/69 [00:07<00:16,  3.09it/s][A
Training:  28%|██▊       | 19/69 [00:07<00:16,  3.06it/s][A
Training:  29%|██▉       | 20/69 [00:07<00:13,  3.61it/s][A
Training:  30%|███       | 21/69 [00:08<00:19,  2.47it/s][A
Training:  32%|███▏      | 22/69 [00:0

Epoch: 30/59 - Loss: 3.6438 - Accuracy: 0.9318



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:01<00:12,  1.54s/it][A
 22%|██▏       | 2/9 [00:01<00:04,  1.41it/s][A
 33%|███▎      | 3/9 [00:01<00:02,  2.24it/s][A
 56%|█████▌    | 5/9 [00:02<00:01,  2.03it/s][A
 67%|██████▋   | 6/9 [00:03<00:01,  2.44it/s][A
 89%|████████▉ | 8/9 [00:03<00:00,  4.04it/s][A
100%|██████████| 9/9 [00:03<00:00,  2.45it/s][A
Epochs:  51%|█████     | 30/59 [13:48<13:23, 27.71s/it]

Val Loss: 17.3435 - Val Accuracy: 0.9255



Training:   0%|          | 0/69 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/69 [00:01<01:57,  1.73s/it][A
Training:   3%|▎         | 2/69 [00:01<00:53,  1.26it/s][A
Training:   4%|▍         | 3/69 [00:02<00:33,  1.98it/s][A
Training:   6%|▌         | 4/69 [00:02<00:22,  2.84it/s][A
Training:   7%|▋         | 5/69 [00:03<00:35,  1.81it/s][A
Training:  10%|█         | 7/69 [00:03<00:20,  2.98it/s][A
Training:  13%|█▎        | 9/69 [00:04<00:24,  2.46it/s][A
Training:  16%|█▌        | 11/69 [00:04<00:16,  3.48it/s][A
Training:  17%|█▋        | 12/69 [00:04<00:15,  3.68it/s][A
Training:  19%|█▉        | 13/69 [00:05<00:24,  2.33it/s][A
Training:  20%|██        | 14/69 [00:05<00:20,  2.74it/s][A
Training:  22%|██▏       | 15/69 [00:05<00:16,  3.37it/s][A
Training:  23%|██▎       | 16/69 [00:06<00:15,  3.51it/s][A
Training:  25%|██▍       | 17/69 [00:06<00:21,  2.38it/s][A
Training:  26%|██▌       | 18/69 [00:07<00:18,  2.83it/s][A
Training:  29%|██▉       | 20/69 [00:07

Epoch: 31/59 - Loss: 10.5755 - Accuracy: 0.9189



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:01<00:12,  1.62s/it][A
 44%|████▍     | 4/9 [00:01<00:01,  2.95it/s][A
 67%|██████▋   | 6/9 [00:02<00:01,  2.44it/s][A
100%|██████████| 9/9 [00:03<00:00,  2.64it/s][A
Epochs:  53%|█████▎    | 31/59 [14:15<12:47, 27.42s/it]

Val Loss: 4.3832 - Val Accuracy: 0.7771



Training:   0%|          | 0/69 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/69 [00:01<02:04,  1.83s/it][A
Training:   7%|▋         | 5/69 [00:03<00:33,  1.88it/s][A
Training:  12%|█▏        | 8/69 [00:03<00:17,  3.40it/s][A
Training:  14%|█▍        | 10/69 [00:04<00:25,  2.28it/s][A
Training:  17%|█▋        | 12/69 [00:04<00:18,  3.07it/s][A
Training:  20%|██        | 14/69 [00:05<00:22,  2.48it/s][A
Training:  23%|██▎       | 16/69 [00:06<00:15,  3.38it/s][A
Training:  26%|██▌       | 18/69 [00:07<00:19,  2.58it/s][A
Training:  29%|██▉       | 20/69 [00:07<00:14,  3.46it/s][A
Training:  32%|███▏      | 22/69 [00:08<00:18,  2.49it/s][A
Training:  33%|███▎      | 23/69 [00:08<00:16,  2.87it/s][A
Training:  35%|███▍      | 24/69 [00:08<00:13,  3.32it/s][A
Training:  36%|███▌      | 25/69 [00:09<00:19,  2.30it/s][A
Training:  39%|███▉      | 27/69 [00:09<00:12,  3.39it/s][A
Training:  42%|████▏     | 29/69 [00:11<00:15,  2.63it/s][A
Training:  48%|████▊     | 33/69 [0

Epoch: 32/59 - Loss: 3.2987 - Accuracy: 0.9307



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:01<00:13,  1.74s/it][A
 33%|███▎      | 3/9 [00:01<00:03,  1.97it/s][A
 56%|█████▌    | 5/9 [00:02<00:02,  1.95it/s][A
 78%|███████▊  | 7/9 [00:03<00:00,  3.02it/s][A
 89%|████████▉ | 8/9 [00:03<00:00,  3.55it/s][A
100%|██████████| 9/9 [00:03<00:00,  2.39it/s][A
Epochs:  54%|█████▍    | 32/59 [14:42<12:20, 27.44s/it]

Val Loss: 3.2936 - Val Accuracy: 0.9326



Training:   0%|          | 0/69 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/69 [00:01<02:03,  1.82s/it][A
Training:   3%|▎         | 2/69 [00:01<00:54,  1.22it/s][A
Training:   6%|▌         | 4/69 [00:02<00:22,  2.90it/s][A
Training:   9%|▊         | 6/69 [00:03<00:29,  2.13it/s][A
Training:  12%|█▏        | 8/69 [00:03<00:18,  3.23it/s][A
Training:  13%|█▎        | 9/69 [00:04<00:28,  2.13it/s][A
Training:  14%|█▍        | 10/69 [00:04<00:24,  2.39it/s][A
Training:  19%|█▉        | 13/69 [00:05<00:20,  2.74it/s][A
Training:  20%|██        | 14/69 [00:06<00:19,  2.77it/s][A
Training:  22%|██▏       | 15/69 [00:06<00:16,  3.27it/s][A
Training:  25%|██▍       | 17/69 [00:07<00:19,  2.68it/s][A
Training:  26%|██▌       | 18/69 [00:07<00:20,  2.49it/s][A
Training:  29%|██▉       | 20/69 [00:07<00:13,  3.64it/s][A
Training:  30%|███       | 21/69 [00:08<00:15,  3.14it/s][A
Training:  32%|███▏      | 22/69 [00:08<00:18,  2.52it/s][A
Training:  35%|███▍      | 24/69 [00:0

Epoch: 33/59 - Loss: 2.8951 - Accuracy: 0.9300



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:02<00:16,  2.03s/it][A
 22%|██▏       | 2/9 [00:02<00:06,  1.10it/s][A
 44%|████▍     | 4/9 [00:02<00:01,  2.57it/s][A
 56%|█████▌    | 5/9 [00:03<00:02,  1.75it/s][A
100%|██████████| 9/9 [00:04<00:00,  2.16it/s][A
Epochs:  56%|█████▌    | 33/59 [15:10<11:56, 27.57s/it]

Val Loss: 3.2544 - Val Accuracy: 0.9271



Training:   0%|          | 0/69 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/69 [00:01<02:07,  1.88s/it][A
Training:   4%|▍         | 3/69 [00:02<00:35,  1.85it/s][A
Training:   6%|▌         | 4/69 [00:02<00:26,  2.42it/s][A
Training:   7%|▋         | 5/69 [00:03<00:39,  1.63it/s][A
Training:   9%|▊         | 6/69 [00:03<00:29,  2.14it/s][A
Training:  12%|█▏        | 8/69 [00:03<00:17,  3.41it/s][A
Training:  13%|█▎        | 9/69 [00:04<00:29,  2.02it/s][A
Training:  14%|█▍        | 10/69 [00:04<00:23,  2.56it/s][A
Training:  16%|█▌        | 11/69 [00:04<00:18,  3.16it/s][A
Training:  19%|█▉        | 13/69 [00:06<00:26,  2.12it/s][A
Training:  20%|██        | 14/69 [00:06<00:21,  2.59it/s][A
Training:  23%|██▎       | 16/69 [00:06<00:13,  3.89it/s][A
Training:  25%|██▍       | 17/69 [00:07<00:20,  2.50it/s][A
Training:  28%|██▊       | 19/69 [00:07<00:13,  3.73it/s][A
Training:  29%|██▉       | 20/69 [00:07<00:12,  4.04it/s][A
Training:  30%|███       | 21/69 [00:08

Epoch: 34/59 - Loss: 2.6708 - Accuracy: 0.9392



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:01<00:13,  1.74s/it][A
 33%|███▎      | 3/9 [00:01<00:03,  1.97it/s][A
 56%|█████▌    | 5/9 [00:03<00:02,  1.79it/s][A
 78%|███████▊  | 7/9 [00:03<00:00,  2.87it/s][A
100%|██████████| 9/9 [00:03<00:00,  2.31it/s][A
Epochs:  58%|█████▊    | 34/59 [15:38<11:35, 27.82s/it]

Val Loss: 4.0324 - Val Accuracy: 0.9414



Training:   0%|          | 0/69 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/69 [00:01<02:06,  1.86s/it][A
Training:   3%|▎         | 2/69 [00:01<00:55,  1.20it/s][A
Training:   6%|▌         | 4/69 [00:02<00:24,  2.71it/s][A
Training:   7%|▋         | 5/69 [00:03<00:35,  1.79it/s][A
Training:   9%|▊         | 6/69 [00:03<00:30,  2.06it/s][A
Training:  10%|█         | 7/69 [00:03<00:22,  2.71it/s][A
Training:  13%|█▎        | 9/69 [00:04<00:24,  2.40it/s][A
Training:  14%|█▍        | 10/69 [00:04<00:20,  2.94it/s][A
Training:  16%|█▌        | 11/69 [00:04<00:17,  3.36it/s][A
Training:  19%|█▉        | 13/69 [00:05<00:22,  2.54it/s][A
Training:  22%|██▏       | 15/69 [00:06<00:16,  3.23it/s][A
Training:  25%|██▍       | 17/69 [00:07<00:19,  2.66it/s][A
Training:  28%|██▊       | 19/69 [00:07<00:17,  2.87it/s][A
Training:  30%|███       | 21/69 [00:08<00:17,  2.70it/s][A
Training:  33%|███▎      | 23/69 [00:08<00:14,  3.27it/s][A
Training:  36%|███▌      | 25/69 [00:09

Epoch: 35/59 - Loss: 4.9275 - Accuracy: 0.9221



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:01<00:13,  1.63s/it][A
 22%|██▏       | 2/9 [00:01<00:05,  1.34it/s][A
 33%|███▎      | 3/9 [00:01<00:02,  2.21it/s][A
 56%|█████▌    | 5/9 [00:02<00:02,  1.99it/s][A
 78%|███████▊  | 7/9 [00:03<00:00,  3.04it/s][A
100%|██████████| 9/9 [00:03<00:00,  2.42it/s][A
Epochs:  59%|█████▉    | 35/59 [16:06<11:05, 27.72s/it]

Val Loss: 3.6767 - Val Accuracy: 0.9178



Training:   0%|          | 0/69 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/69 [00:01<02:00,  1.77s/it][A
Training:   3%|▎         | 2/69 [00:02<01:02,  1.07it/s][A
Training:   6%|▌         | 4/69 [00:02<00:26,  2.47it/s][A
Training:   7%|▋         | 5/69 [00:03<00:34,  1.85it/s][A
Training:   9%|▊         | 6/69 [00:03<00:27,  2.26it/s][A
Training:  13%|█▎        | 9/69 [00:04<00:21,  2.82it/s][A
Training:  14%|█▍        | 10/69 [00:04<00:20,  2.85it/s][A
Training:  17%|█▋        | 12/69 [00:04<00:13,  4.20it/s][A
Training:  19%|█▉        | 13/69 [00:05<00:18,  3.04it/s][A
Training:  20%|██        | 14/69 [00:05<00:20,  2.69it/s][A
Training:  23%|██▎       | 16/69 [00:06<00:13,  3.95it/s][A
Training:  25%|██▍       | 17/69 [00:06<00:18,  2.80it/s][A
Training:  26%|██▌       | 18/69 [00:07<00:20,  2.48it/s][A
Training:  30%|███       | 21/69 [00:08<00:15,  3.08it/s][A
Training:  32%|███▏      | 22/69 [00:08<00:16,  2.92it/s][A
Training:  35%|███▍      | 24/69 [00:0

Epoch: 36/59 - Loss: 2.7233 - Accuracy: 0.9360



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:01<00:13,  1.65s/it][A
 44%|████▍     | 4/9 [00:01<00:01,  2.80it/s][A
 67%|██████▋   | 6/9 [00:02<00:01,  2.28it/s][A
 78%|███████▊  | 7/9 [00:03<00:00,  2.62it/s][A
 89%|████████▉ | 8/9 [00:03<00:00,  2.83it/s][A
100%|██████████| 9/9 [00:03<00:00,  2.44it/s][A
Epochs:  61%|██████    | 36/59 [16:34<10:36, 27.70s/it]

Val Loss: 3.5581 - Val Accuracy: 0.9286



Training:   0%|          | 0/69 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/69 [00:01<01:57,  1.72s/it][A
Training:   3%|▎         | 2/69 [00:01<00:51,  1.30it/s][A
Training:   6%|▌         | 4/69 [00:01<00:21,  3.01it/s][A
Training:   7%|▋         | 5/69 [00:03<00:39,  1.61it/s][A
Training:   9%|▊         | 6/69 [00:03<00:29,  2.15it/s][A
Training:  10%|█         | 7/69 [00:03<00:22,  2.80it/s][A
Training:  13%|█▎        | 9/69 [00:04<00:23,  2.53it/s][A
Training:  14%|█▍        | 10/69 [00:04<00:19,  3.10it/s][A
Training:  17%|█▋        | 12/69 [00:04<00:12,  4.73it/s][A
Training:  20%|██        | 14/69 [00:05<00:19,  2.76it/s][A
Training:  25%|██▍       | 17/69 [00:07<00:20,  2.55it/s][A
Training:  28%|██▊       | 19/69 [00:07<00:14,  3.41it/s][A
Training:  30%|███       | 21/69 [00:08<00:18,  2.67it/s][A
Training:  32%|███▏      | 22/69 [00:08<00:15,  3.06it/s][A
Training:  35%|███▍      | 24/69 [00:08<00:10,  4.21it/s][A
Training:  38%|███▊      | 26/69 [00:09

Epoch: 37/59 - Loss: 3.2074 - Accuracy: 0.9422



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:01<00:12,  1.62s/it][A
 33%|███▎      | 3/9 [00:01<00:02,  2.02it/s][A
 56%|█████▌    | 5/9 [00:03<00:02,  1.80it/s][A
100%|██████████| 9/9 [00:03<00:00,  2.33it/s][A
Epochs:  63%|██████▎   | 37/59 [17:01<10:09, 27.70s/it]

Val Loss: 7.5259 - Val Accuracy: 0.9271



Training:   0%|          | 0/69 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/69 [00:01<02:01,  1.79s/it][A
Training:   4%|▍         | 3/69 [00:01<00:34,  1.92it/s][A
Training:   6%|▌         | 4/69 [00:02<00:24,  2.65it/s][A
Training:   7%|▋         | 5/69 [00:03<00:36,  1.76it/s][A
Training:  10%|█         | 7/69 [00:03<00:20,  3.05it/s][A
Training:  12%|█▏        | 8/69 [00:03<00:16,  3.59it/s][A
Training:  13%|█▎        | 9/69 [00:04<00:30,  1.96it/s][A
Training:  16%|█▌        | 11/69 [00:04<00:18,  3.12it/s][A
Training:  19%|█▉        | 13/69 [00:05<00:23,  2.35it/s][A
Training:  23%|██▎       | 16/69 [00:05<00:13,  3.88it/s][A
Training:  26%|██▌       | 18/69 [00:07<00:18,  2.73it/s][A
Training:  29%|██▉       | 20/69 [00:07<00:14,  3.50it/s][A
Training:  30%|███       | 21/69 [00:08<00:18,  2.66it/s][A
Training:  33%|███▎      | 23/69 [00:08<00:13,  3.32it/s][A
Training:  35%|███▍      | 24/69 [00:08<00:13,  3.42it/s][A
Training:  36%|███▌      | 25/69 [00:09

Epoch: 38/59 - Loss: 3.9026 - Accuracy: 0.9296



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:01<00:11,  1.45s/it][A
 22%|██▏       | 2/9 [00:01<00:05,  1.23it/s][A
 56%|█████▌    | 5/9 [00:02<00:01,  2.02it/s][A
 67%|██████▋   | 6/9 [00:03<00:01,  2.25it/s][A
 89%|████████▉ | 8/9 [00:03<00:00,  3.54it/s][A
100%|██████████| 9/9 [00:03<00:00,  2.43it/s][A
Epochs:  64%|██████▍   | 38/59 [17:29<09:44, 27.82s/it]

Val Loss: 3.3899 - Val Accuracy: 0.9140



Training:   0%|          | 0/69 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/69 [00:01<01:53,  1.67s/it][A
Training:   4%|▍         | 3/69 [00:01<00:32,  2.04it/s][A
Training:   7%|▋         | 5/69 [00:03<00:35,  1.80it/s][A
Training:   9%|▊         | 6/69 [00:03<00:27,  2.26it/s][A
Training:  13%|█▎        | 9/69 [00:04<00:23,  2.51it/s][A
Training:  16%|█▌        | 11/69 [00:04<00:16,  3.43it/s][A
Training:  19%|█▉        | 13/69 [00:05<00:21,  2.63it/s][A
Training:  20%|██        | 14/69 [00:05<00:18,  3.05it/s][A
Training:  22%|██▏       | 15/69 [00:05<00:15,  3.44it/s][A
Training:  25%|██▍       | 17/69 [00:06<00:20,  2.51it/s][A
Training:  29%|██▉       | 20/69 [00:07<00:11,  4.18it/s][A
Training:  32%|███▏      | 22/69 [00:08<00:15,  3.04it/s][A
Training:  35%|███▍      | 24/69 [00:08<00:11,  4.05it/s][A
Training:  38%|███▊      | 26/69 [00:09<00:15,  2.76it/s][A
Training:  39%|███▉      | 27/69 [00:09<00:13,  3.07it/s][A
Training:  42%|████▏     | 29/69 [00:

Epoch: 39/59 - Loss: 2.6440 - Accuracy: 0.9403



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:01<00:14,  1.79s/it][A
 22%|██▏       | 2/9 [00:01<00:05,  1.23it/s][A
 56%|█████▌    | 5/9 [00:03<00:02,  1.77it/s][A
100%|██████████| 9/9 [00:04<00:00,  2.23it/s][A
Epochs:  66%|██████▌   | 39/59 [17:56<09:10, 27.55s/it]

Val Loss: 3.2510 - Val Accuracy: 0.9288



Training:   0%|          | 0/69 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/69 [00:01<01:43,  1.53s/it][A
Training:   3%|▎         | 2/69 [00:01<00:47,  1.41it/s][A
Training:   6%|▌         | 4/69 [00:01<00:21,  3.08it/s][A
Training:   7%|▋         | 5/69 [00:02<00:32,  2.00it/s][A
Training:  10%|█         | 7/69 [00:02<00:18,  3.32it/s][A
Training:  13%|█▎        | 9/69 [00:04<00:25,  2.39it/s][A
Training:  16%|█▌        | 11/69 [00:04<00:17,  3.36it/s][A
Training:  17%|█▋        | 12/69 [00:04<00:14,  3.86it/s][A
Training:  19%|█▉        | 13/69 [00:05<00:25,  2.20it/s][A
Training:  23%|██▎       | 16/69 [00:05<00:13,  4.03it/s][A
Training:  26%|██▌       | 18/69 [00:06<00:19,  2.67it/s][A
Training:  29%|██▉       | 20/69 [00:07<00:13,  3.56it/s][A
Training:  32%|███▏      | 22/69 [00:08<00:18,  2.60it/s][A
Training:  35%|███▍      | 24/69 [00:08<00:12,  3.53it/s][A
Training:  38%|███▊      | 26/69 [00:09<00:17,  2.45it/s][A
Training:  39%|███▉      | 27/69 [00:0

Epoch: 40/59 - Loss: 4.8536 - Accuracy: 0.9326



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:01<00:13,  1.68s/it][A
 22%|██▏       | 2/9 [00:01<00:05,  1.33it/s][A
 44%|████▍     | 4/9 [00:01<00:01,  3.18it/s][A
 67%|██████▋   | 6/9 [00:03<00:01,  2.25it/s][A
100%|██████████| 9/9 [00:03<00:00,  2.37it/s][A
Epochs:  68%|██████▊   | 40/59 [18:24<08:43, 27.53s/it]

Val Loss: 13.5723 - Val Accuracy: 0.9180



Training:   0%|          | 0/69 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/69 [00:01<01:50,  1.63s/it][A
Training:   3%|▎         | 2/69 [00:01<00:49,  1.35it/s][A
Training:   4%|▍         | 3/69 [00:01<00:29,  2.21it/s][A
Training:   7%|▋         | 5/69 [00:02<00:32,  1.97it/s][A
Training:   9%|▊         | 6/69 [00:03<00:24,  2.55it/s][A
Training:  13%|█▎        | 9/69 [00:04<00:23,  2.59it/s][A
Training:  14%|█▍        | 10/69 [00:04<00:19,  2.98it/s][A
Training:  19%|█▉        | 13/69 [00:05<00:19,  2.92it/s][A
Training:  20%|██        | 14/69 [00:05<00:17,  3.14it/s][A
Training:  23%|██▎       | 16/69 [00:05<00:12,  4.35it/s][A
Training:  25%|██▍       | 17/69 [00:06<00:18,  2.83it/s][A
Training:  28%|██▊       | 19/69 [00:06<00:12,  3.89it/s][A
Training:  29%|██▉       | 20/69 [00:07<00:13,  3.73it/s][A
Training:  30%|███       | 21/69 [00:08<00:21,  2.23it/s][A
Training:  33%|███▎      | 23/69 [00:08<00:14,  3.28it/s][A
Training:  35%|███▍      | 24/69 [00:0

Epoch: 41/59 - Loss: 4.4470 - Accuracy: 0.9288



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:01<00:12,  1.62s/it][A
 22%|██▏       | 2/9 [00:01<00:05,  1.35it/s][A
 33%|███▎      | 3/9 [00:01<00:02,  2.18it/s][A
 56%|█████▌    | 5/9 [00:03<00:02,  1.89it/s][A
100%|██████████| 9/9 [00:03<00:00,  2.30it/s][A
Epochs:  69%|██████▉   | 41/59 [18:51<08:14, 27.46s/it]

Val Loss: 3.4199 - Val Accuracy: 0.9377



Training:   0%|          | 0/69 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/69 [00:01<01:48,  1.60s/it][A
Training:   3%|▎         | 2/69 [00:01<00:49,  1.34it/s][A
Training:   7%|▋         | 5/69 [00:02<00:31,  2.04it/s][A
Training:   9%|▊         | 6/69 [00:03<00:25,  2.49it/s][A
Training:  12%|█▏        | 8/69 [00:03<00:16,  3.73it/s][A
Training:  13%|█▎        | 9/69 [00:04<00:27,  2.19it/s][A
Training:  14%|█▍        | 10/69 [00:04<00:21,  2.69it/s][A
Training:  17%|█▋        | 12/69 [00:04<00:14,  3.96it/s][A
Training:  19%|█▉        | 13/69 [00:05<00:24,  2.26it/s][A
Training:  22%|██▏       | 15/69 [00:05<00:15,  3.44it/s][A
Training:  25%|██▍       | 17/69 [00:06<00:19,  2.61it/s][A
Training:  28%|██▊       | 19/69 [00:07<00:14,  3.49it/s][A
Training:  30%|███       | 21/69 [00:08<00:18,  2.58it/s][A
Training:  33%|███▎      | 23/69 [00:08<00:13,  3.40it/s][A
Training:  35%|███▍      | 24/69 [00:08<00:11,  3.77it/s][A
Training:  36%|███▌      | 25/69 [00:0

Epoch: 42/59 - Loss: 2.8774 - Accuracy: 0.9393



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:01<00:13,  1.72s/it][A
 44%|████▍     | 4/9 [00:01<00:01,  2.75it/s][A
 67%|██████▋   | 6/9 [00:03<00:01,  2.12it/s][A
100%|██████████| 9/9 [00:03<00:00,  2.28it/s][A
Epochs:  71%|███████   | 42/59 [19:19<07:47, 27.53s/it]

Val Loss: 5.2810 - Val Accuracy: 0.8222



Training:   0%|          | 0/69 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/69 [00:01<01:34,  1.39s/it][A
Training:   3%|▎         | 2/69 [00:01<00:42,  1.57it/s][A
Training:   6%|▌         | 4/69 [00:01<00:17,  3.64it/s][A
Training:   9%|▊         | 6/69 [00:03<00:29,  2.12it/s][A
Training:  12%|█▏        | 8/69 [00:03<00:18,  3.23it/s][A
Training:  13%|█▎        | 9/69 [00:04<00:30,  2.00it/s][A
Training:  16%|█▌        | 11/69 [00:04<00:19,  3.03it/s][A
Training:  19%|█▉        | 13/69 [00:05<00:23,  2.36it/s][A
Training:  22%|██▏       | 15/69 [00:05<00:16,  3.25it/s][A
Training:  25%|██▍       | 17/69 [00:07<00:21,  2.41it/s][A
Training:  28%|██▊       | 19/69 [00:07<00:15,  3.28it/s][A
Training:  29%|██▉       | 20/69 [00:07<00:13,  3.64it/s][A
Training:  30%|███       | 21/69 [00:08<00:21,  2.20it/s][A
Training:  33%|███▎      | 23/69 [00:08<00:14,  3.16it/s][A
Training:  36%|███▌      | 25/69 [00:09<00:18,  2.34it/s][A
Training:  42%|████▏     | 29/69 [00:1

Epoch: 43/59 - Loss: 3.0810 - Accuracy: 0.9298



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:01<00:11,  1.48s/it][A
 22%|██▏       | 2/9 [00:01<00:04,  1.44it/s][A
 33%|███▎      | 3/9 [00:01<00:02,  2.31it/s][A
 56%|█████▌    | 5/9 [00:02<00:01,  2.39it/s][A
 67%|██████▋   | 6/9 [00:02<00:01,  2.71it/s][A
 89%|████████▉ | 8/9 [00:02<00:00,  4.33it/s][A
100%|██████████| 9/9 [00:03<00:00,  2.80it/s][A
Epochs:  73%|███████▎  | 43/59 [19:46<07:18, 27.41s/it]

Val Loss: 5.1089 - Val Accuracy: 0.9377



Training:   0%|          | 0/69 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/69 [00:01<01:58,  1.74s/it][A
Training:   3%|▎         | 2/69 [00:01<00:52,  1.29it/s][A
Training:   4%|▍         | 3/69 [00:01<00:32,  2.04it/s][A
Training:   7%|▋         | 5/69 [00:03<00:33,  1.92it/s][A
Training:   9%|▊         | 6/69 [00:03<00:25,  2.47it/s][A
Training:  12%|█▏        | 8/69 [00:03<00:15,  3.90it/s][A
Training:  13%|█▎        | 9/69 [00:04<00:26,  2.23it/s][A
Training:  16%|█▌        | 11/69 [00:04<00:16,  3.46it/s][A
Training:  19%|█▉        | 13/69 [00:05<00:23,  2.35it/s][A
Training:  20%|██        | 14/69 [00:05<00:20,  2.74it/s][A
Training:  23%|██▎       | 16/69 [00:06<00:13,  3.95it/s][A
Training:  25%|██▍       | 17/69 [00:07<00:20,  2.51it/s][A
Training:  28%|██▊       | 19/69 [00:07<00:13,  3.59it/s][A
Training:  30%|███       | 21/69 [00:08<00:18,  2.58it/s][A
Training:  32%|███▏      | 22/69 [00:08<00:15,  2.96it/s][A
Training:  35%|███▍      | 24/69 [00:08

Epoch: 44/59 - Loss: 3.0969 - Accuracy: 0.9351



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:01<00:15,  1.93s/it][A
 56%|█████▌    | 5/9 [00:03<00:02,  1.90it/s][A
100%|██████████| 9/9 [00:03<00:00,  2.38it/s][A
Epochs:  75%|███████▍  | 44/59 [20:14<06:52, 27.53s/it]

Val Loss: 3.4205 - Val Accuracy: 0.9332



Training:   0%|          | 0/69 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/69 [00:01<02:13,  1.96s/it][A
Training:   4%|▍         | 3/69 [00:02<00:36,  1.83it/s][A
Training:   7%|▋         | 5/69 [00:03<00:38,  1.67it/s][A
Training:  10%|█         | 7/69 [00:03<00:23,  2.61it/s][A
Training:  13%|█▎        | 9/69 [00:04<00:29,  2.07it/s][A
Training:  17%|█▋        | 12/69 [00:04<00:16,  3.49it/s][A
Training:  20%|██        | 14/69 [00:06<00:21,  2.59it/s][A
Training:  23%|██▎       | 16/69 [00:06<00:15,  3.40it/s][A
Training:  25%|██▍       | 17/69 [00:07<00:22,  2.33it/s][A
Training:  26%|██▌       | 18/69 [00:07<00:18,  2.72it/s][A
Training:  28%|██▊       | 19/69 [00:07<00:15,  3.21it/s][A
Training:  30%|███       | 21/69 [00:08<00:20,  2.30it/s][A
Training:  33%|███▎      | 23/69 [00:09<00:14,  3.28it/s][A
Training:  36%|███▌      | 25/69 [00:10<00:17,  2.47it/s][A
Training:  38%|███▊      | 26/69 [00:10<00:14,  2.87it/s][A
Training:  42%|████▏     | 29/69 [00:

Epoch: 45/59 - Loss: 2.4905 - Accuracy: 0.9445



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:01<00:13,  1.70s/it][A
 44%|████▍     | 4/9 [00:01<00:01,  2.83it/s][A
 67%|██████▋   | 6/9 [00:03<00:01,  2.18it/s][A
 78%|███████▊  | 7/9 [00:03<00:00,  2.67it/s][A
100%|██████████| 9/9 [00:03<00:00,  2.38it/s][A
Epochs:  76%|███████▋  | 45/59 [20:42<06:26, 27.62s/it]

Val Loss: 3.4213 - Val Accuracy: 0.9250



Training:   0%|          | 0/69 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/69 [00:02<02:27,  2.17s/it][A
Training:   6%|▌         | 4/69 [00:02<00:28,  2.25it/s][A
Training:   9%|▊         | 6/69 [00:03<00:31,  1.97it/s][A
Training:  12%|█▏        | 8/69 [00:03<00:20,  2.92it/s][A
Training:  14%|█▍        | 10/69 [00:04<00:26,  2.21it/s][A
Training:  17%|█▋        | 12/69 [00:05<00:18,  3.01it/s][A
Training:  19%|█▉        | 13/69 [00:06<00:25,  2.17it/s][A
Training:  22%|██▏       | 15/69 [00:06<00:17,  3.15it/s][A
Training:  25%|██▍       | 17/69 [00:07<00:22,  2.26it/s][A
Training:  28%|██▊       | 19/69 [00:07<00:15,  3.15it/s][A
Training:  30%|███       | 21/69 [00:09<00:20,  2.38it/s][A
Training:  33%|███▎      | 23/69 [00:09<00:14,  3.24it/s][A
Training:  36%|███▌      | 25/69 [00:10<00:17,  2.46it/s][A
Training:  38%|███▊      | 26/69 [00:10<00:15,  2.83it/s][A
Training:  42%|████▏     | 29/69 [00:11<00:14,  2.72it/s][A
Training:  43%|████▎     | 30/69 [00

Epoch: 46/59 - Loss: 2.5311 - Accuracy: 0.9404



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:01<00:13,  1.69s/it][A
 33%|███▎      | 3/9 [00:01<00:02,  2.03it/s][A
 56%|█████▌    | 5/9 [00:03<00:02,  1.83it/s][A
 78%|███████▊  | 7/9 [00:03<00:00,  2.72it/s][A
100%|██████████| 9/9 [00:04<00:00,  2.23it/s][A
Epochs:  78%|███████▊  | 46/59 [21:09<05:59, 27.68s/it]

Val Loss: 3.4858 - Val Accuracy: 0.9304



Training:   0%|          | 0/69 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/69 [00:01<02:01,  1.78s/it][A
Training:   3%|▎         | 2/69 [00:01<00:54,  1.24it/s][A
Training:   4%|▍         | 3/69 [00:02<00:32,  2.04it/s][A
Training:   6%|▌         | 4/69 [00:02<00:22,  2.89it/s][A
Training:   7%|▋         | 5/69 [00:03<00:33,  1.90it/s][A
Training:   9%|▊         | 6/69 [00:03<00:25,  2.47it/s][A
Training:  10%|█         | 7/69 [00:03<00:20,  3.06it/s][A
Training:  13%|█▎        | 9/69 [00:04<00:27,  2.20it/s][A
Training:  17%|█▋        | 12/69 [00:04<00:14,  3.90it/s][A
Training:  19%|█▉        | 13/69 [00:05<00:24,  2.31it/s][A
Training:  20%|██        | 14/69 [00:05<00:19,  2.76it/s][A
Training:  23%|██▎       | 16/69 [00:06<00:13,  3.95it/s][A
Training:  25%|██▍       | 17/69 [00:07<00:22,  2.30it/s][A
Training:  26%|██▌       | 18/69 [00:07<00:18,  2.77it/s][A
Training:  29%|██▉       | 20/69 [00:07<00:12,  3.96it/s][A
Training:  30%|███       | 21/69 [00:08<

Epoch: 47/59 - Loss: 2.8645 - Accuracy: 0.9303



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:01<00:14,  1.76s/it][A
 22%|██▏       | 2/9 [00:02<00:06,  1.13it/s][A
 56%|█████▌    | 5/9 [00:03<00:01,  2.02it/s][A
 67%|██████▋   | 6/9 [00:03<00:01,  2.36it/s][A
100%|██████████| 9/9 [00:03<00:00,  2.41it/s][A
Epochs:  80%|███████▉  | 47/59 [21:37<05:31, 27.60s/it]

Val Loss: 3.8311 - Val Accuracy: 0.9383



Training:   0%|          | 0/69 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/69 [00:01<02:08,  1.89s/it][A
Training:   4%|▍         | 3/69 [00:02<00:36,  1.82it/s][A
Training:   7%|▋         | 5/69 [00:03<00:33,  1.91it/s][A
Training:   9%|▊         | 6/69 [00:03<00:25,  2.43it/s][A
Training:  10%|█         | 7/69 [00:03<00:21,  2.94it/s][A
Training:  13%|█▎        | 9/69 [00:04<00:25,  2.34it/s][A
Training:  14%|█▍        | 10/69 [00:04<00:21,  2.74it/s][A
Training:  16%|█▌        | 11/69 [00:04<00:18,  3.11it/s][A
Training:  17%|█▋        | 12/69 [00:04<00:15,  3.66it/s][A
Training:  19%|█▉        | 13/69 [00:05<00:26,  2.12it/s][A
Training:  20%|██        | 14/69 [00:06<00:22,  2.48it/s][A
Training:  22%|██▏       | 15/69 [00:06<00:19,  2.83it/s][A
Training:  25%|██▍       | 17/69 [00:07<00:22,  2.31it/s][A
Training:  28%|██▊       | 19/69 [00:07<00:14,  3.34it/s][A
Training:  30%|███       | 21/69 [00:08<00:18,  2.53it/s][A
Training:  33%|███▎      | 23/69 [00:0

Epoch: 48/59 - Loss: 5.7583 - Accuracy: 0.9199



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:01<00:14,  1.83s/it][A
 22%|██▏       | 2/9 [00:01<00:05,  1.21it/s][A
 44%|████▍     | 4/9 [00:02<00:01,  2.80it/s][A
 56%|█████▌    | 5/9 [00:03<00:02,  1.61it/s][A
 78%|███████▊  | 7/9 [00:03<00:00,  2.84it/s][A
100%|██████████| 9/9 [00:04<00:00,  2.18it/s][A
Epochs:  81%|████████▏ | 48/59 [22:04<05:03, 27.56s/it]

Val Loss: 6.3848 - Val Accuracy: 0.9215



Training:   0%|          | 0/69 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/69 [00:01<02:01,  1.78s/it][A
Training:   4%|▍         | 3/69 [00:01<00:35,  1.86it/s][A
Training:   6%|▌         | 4/69 [00:02<00:25,  2.53it/s][A
Training:   7%|▋         | 5/69 [00:03<00:42,  1.51it/s][A
Training:  10%|█         | 7/69 [00:03<00:23,  2.63it/s][A
Training:  13%|█▎        | 9/69 [00:04<00:29,  2.04it/s][A
Training:  16%|█▌        | 11/69 [00:04<00:19,  2.99it/s][A
Training:  19%|█▉        | 13/69 [00:06<00:23,  2.37it/s][A
Training:  25%|██▍       | 17/69 [00:07<00:19,  2.67it/s][A
Training:  30%|███       | 21/69 [00:08<00:17,  2.79it/s][A
Training:  33%|███▎      | 23/69 [00:08<00:13,  3.45it/s][A
Training:  36%|███▌      | 25/69 [00:10<00:16,  2.62it/s][A
Training:  39%|███▉      | 27/69 [00:10<00:12,  3.32it/s][A
Training:  42%|████▏     | 29/69 [00:11<00:14,  2.67it/s][A
Training:  45%|████▍     | 31/69 [00:11<00:10,  3.47it/s][A
Training:  48%|████▊     | 33/69 [00:1

Epoch: 49/59 - Loss: 3.3554 - Accuracy: 0.9311



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:01<00:14,  1.81s/it][A
 44%|████▍     | 4/9 [00:01<00:01,  2.67it/s][A
 67%|██████▋   | 6/9 [00:03<00:01,  1.99it/s][A
100%|██████████| 9/9 [00:03<00:00,  2.31it/s][A
Epochs:  83%|████████▎ | 49/59 [22:32<04:35, 27.57s/it]

Val Loss: 3.4015 - Val Accuracy: 0.9164



Training:   0%|          | 0/69 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/69 [00:01<01:57,  1.73s/it][A
Training:   3%|▎         | 2/69 [00:01<00:52,  1.28it/s][A
Training:   6%|▌         | 4/69 [00:02<00:22,  2.90it/s][A
Training:   7%|▋         | 5/69 [00:03<00:39,  1.62it/s][A
Training:  12%|█▏        | 8/69 [00:03<00:17,  3.49it/s][A
Training:  14%|█▍        | 10/69 [00:04<00:24,  2.44it/s][A
Training:  19%|█▉        | 13/69 [00:05<00:23,  2.41it/s][A
Training:  22%|██▏       | 15/69 [00:06<00:16,  3.19it/s][A
Training:  25%|██▍       | 17/69 [00:07<00:21,  2.38it/s][A
Training:  28%|██▊       | 19/69 [00:07<00:15,  3.15it/s][A
Training:  30%|███       | 21/69 [00:08<00:19,  2.52it/s][A
Training:  33%|███▎      | 23/69 [00:08<00:13,  3.29it/s][A
Training:  36%|███▌      | 25/69 [00:10<00:16,  2.61it/s][A
Training:  39%|███▉      | 27/69 [00:10<00:12,  3.37it/s][A
Training:  41%|████      | 28/69 [00:10<00:11,  3.68it/s][A
Training:  42%|████▏     | 29/69 [00:

Epoch: 50/59 - Loss: 2.6116 - Accuracy: 0.9382



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:01<00:13,  1.66s/it][A
 33%|███▎      | 3/9 [00:01<00:02,  2.04it/s][A
 44%|████▍     | 4/9 [00:02<00:01,  2.61it/s][A
 56%|█████▌    | 5/9 [00:03<00:02,  1.61it/s][A
 67%|██████▋   | 6/9 [00:03<00:01,  2.13it/s][A
100%|██████████| 9/9 [00:03<00:00,  2.32it/s][A
Epochs:  85%|████████▍ | 50/59 [23:00<04:08, 27.62s/it]

Val Loss: 3.4805 - Val Accuracy: 0.9394



Training:   0%|          | 0/69 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/69 [00:01<02:13,  1.97s/it][A
Training:   4%|▍         | 3/69 [00:02<00:36,  1.80it/s][A
Training:   7%|▋         | 5/69 [00:03<00:39,  1.60it/s][A
Training:  10%|█         | 7/69 [00:03<00:24,  2.56it/s][A
Training:  13%|█▎        | 9/69 [00:04<00:29,  2.04it/s][A
Training:  16%|█▌        | 11/69 [00:05<00:19,  2.91it/s][A
Training:  19%|█▉        | 13/69 [00:06<00:22,  2.46it/s][A
Training:  22%|██▏       | 15/69 [00:06<00:15,  3.39it/s][A
Training:  25%|██▍       | 17/69 [00:07<00:19,  2.69it/s][A
Training:  28%|██▊       | 19/69 [00:07<00:13,  3.64it/s][A
Training:  30%|███       | 21/69 [00:08<00:16,  2.83it/s][A
Training:  33%|███▎      | 23/69 [00:08<00:12,  3.79it/s][A
Training:  36%|███▌      | 25/69 [00:09<00:15,  2.76it/s][A
Training:  38%|███▊      | 26/69 [00:09<00:13,  3.13it/s][A
Training:  41%|████      | 28/69 [00:10<00:09,  4.18it/s][A
Training:  42%|████▏     | 29/69 [00:

Epoch: 51/59 - Loss: 3.1232 - Accuracy: 0.9348



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:01<00:12,  1.56s/it][A
 22%|██▏       | 2/9 [00:01<00:05,  1.35it/s][A
 44%|████▍     | 4/9 [00:01<00:01,  3.23it/s][A
 67%|██████▋   | 6/9 [00:03<00:01,  2.11it/s][A
100%|██████████| 9/9 [00:03<00:00,  2.47it/s][A
Epochs:  86%|████████▋ | 51/59 [23:27<03:40, 27.61s/it]

Val Loss: 3.4436 - Val Accuracy: 0.9377



Training:   0%|          | 0/69 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/69 [00:01<01:55,  1.70s/it][A
Training:   4%|▍         | 3/69 [00:01<00:31,  2.09it/s][A
Training:   7%|▋         | 5/69 [00:02<00:34,  1.87it/s][A
Training:  10%|█         | 7/69 [00:03<00:20,  2.99it/s][A
Training:  13%|█▎        | 9/69 [00:04<00:26,  2.24it/s][A
Training:  14%|█▍        | 10/69 [00:04<00:22,  2.61it/s][A
Training:  16%|█▌        | 11/69 [00:04<00:18,  3.13it/s][A
Training:  19%|█▉        | 13/69 [00:05<00:24,  2.24it/s][A
Training:  20%|██        | 14/69 [00:05<00:20,  2.71it/s][A
Training:  23%|██▎       | 16/69 [00:06<00:13,  3.84it/s][A
Training:  25%|██▍       | 17/69 [00:07<00:21,  2.43it/s][A
Training:  26%|██▌       | 18/69 [00:07<00:17,  2.89it/s][A
Training:  28%|██▊       | 19/69 [00:07<00:15,  3.33it/s][A
Training:  29%|██▉       | 20/69 [00:07<00:12,  3.99it/s][A
Training:  30%|███       | 21/69 [00:08<00:24,  1.93it/s][A
Training:  32%|███▏      | 22/69 [00:

Epoch: 52/59 - Loss: 4.1630 - Accuracy: 0.9317



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:01<00:14,  1.85s/it][A
 22%|██▏       | 2/9 [00:01<00:05,  1.21it/s][A
 44%|████▍     | 4/9 [00:02<00:01,  2.80it/s][A
 56%|█████▌    | 5/9 [00:03<00:02,  1.72it/s][A
 78%|███████▊  | 7/9 [00:03<00:00,  2.92it/s][A
100%|██████████| 9/9 [00:04<00:00,  2.23it/s][A
Epochs:  88%|████████▊ | 52/59 [23:55<03:12, 27.57s/it]

Val Loss: 8.2528 - Val Accuracy: 0.9372



Training:   0%|          | 0/69 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/69 [00:01<01:48,  1.60s/it][A
Training:   6%|▌         | 4/69 [00:01<00:21,  3.02it/s][A
Training:   9%|▊         | 6/69 [00:03<00:32,  1.91it/s][A
Training:  10%|█         | 7/69 [00:03<00:26,  2.35it/s][A
Training:  13%|█▎        | 9/69 [00:04<00:30,  1.97it/s][A
Training:  16%|█▌        | 11/69 [00:04<00:20,  2.90it/s][A
Training:  19%|█▉        | 13/69 [00:05<00:23,  2.34it/s][A
Training:  22%|██▏       | 15/69 [00:06<00:16,  3.21it/s][A
Training:  25%|██▍       | 17/69 [00:07<00:21,  2.43it/s][A
Training:  28%|██▊       | 19/69 [00:07<00:15,  3.27it/s][A
Training:  30%|███       | 21/69 [00:08<00:19,  2.48it/s][A
Training:  33%|███▎      | 23/69 [00:08<00:13,  3.36it/s][A
Training:  36%|███▌      | 25/69 [00:10<00:17,  2.47it/s][A
Training:  39%|███▉      | 27/69 [00:10<00:12,  3.30it/s][A
Training:  42%|████▏     | 29/69 [00:11<00:16,  2.46it/s][A
Training:  48%|████▊     | 33/69 [00:

Epoch: 53/59 - Loss: 4.3827 - Accuracy: 0.9296



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:01<00:13,  1.64s/it][A
 22%|██▏       | 2/9 [00:01<00:05,  1.28it/s][A
 56%|█████▌    | 5/9 [00:03<00:02,  1.93it/s][A
 78%|███████▊  | 7/9 [00:03<00:00,  3.00it/s][A
100%|██████████| 9/9 [00:03<00:00,  2.28it/s][A
Epochs:  90%|████████▉ | 53/59 [24:23<02:46, 27.74s/it]

Val Loss: 3.3190 - Val Accuracy: 0.9242



Training:   0%|          | 0/69 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/69 [00:01<02:14,  1.98s/it][A
Training:   4%|▍         | 3/69 [00:02<00:38,  1.73it/s][A
Training:   7%|▋         | 5/69 [00:03<00:38,  1.67it/s][A
Training:   9%|▊         | 6/69 [00:03<00:29,  2.14it/s][A
Training:  12%|█▏        | 8/69 [00:03<00:17,  3.44it/s][A
Training:  14%|█▍        | 10/69 [00:04<00:22,  2.63it/s][A
Training:  17%|█▋        | 12/69 [00:04<00:15,  3.68it/s][A
Training:  19%|█▉        | 13/69 [00:05<00:24,  2.33it/s][A
Training:  20%|██        | 14/69 [00:06<00:20,  2.65it/s][A
Training:  23%|██▎       | 16/69 [00:06<00:14,  3.78it/s][A
Training:  25%|██▍       | 17/69 [00:07<00:23,  2.21it/s][A
Training:  28%|██▊       | 19/69 [00:07<00:15,  3.18it/s][A
Training:  30%|███       | 21/69 [00:08<00:19,  2.42it/s][A
Training:  33%|███▎      | 23/69 [00:08<00:13,  3.36it/s][A
Training:  36%|███▌      | 25/69 [00:10<00:17,  2.51it/s][A
Training:  39%|███▉      | 27/69 [00:

Epoch: 54/59 - Loss: 2.8723 - Accuracy: 0.9364



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:01<00:14,  1.79s/it][A
 22%|██▏       | 2/9 [00:01<00:05,  1.25it/s][A
 33%|███▎      | 3/9 [00:02<00:02,  2.01it/s][A
 56%|█████▌    | 5/9 [00:02<00:01,  2.08it/s][A
 67%|██████▋   | 6/9 [00:03<00:01,  2.41it/s][A
 89%|████████▉ | 8/9 [00:03<00:00,  3.97it/s][A
100%|██████████| 9/9 [00:03<00:00,  2.37it/s][A
Epochs:  92%|█████████▏| 54/59 [24:50<02:18, 27.67s/it]

Val Loss: 3.3244 - Val Accuracy: 0.9403



Training:   0%|          | 0/69 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/69 [00:01<02:13,  1.96s/it][A
Training:   3%|▎         | 2/69 [00:02<00:58,  1.14it/s][A
Training:   4%|▍         | 3/69 [00:02<00:35,  1.85it/s][A
Training:   6%|▌         | 4/69 [00:02<00:25,  2.57it/s][A
Training:   7%|▋         | 5/69 [00:03<00:33,  1.93it/s][A
Training:   9%|▊         | 6/69 [00:03<00:24,  2.61it/s][A
Training:  13%|█▎        | 9/69 [00:04<00:20,  2.87it/s][A
Training:  14%|█▍        | 10/69 [00:04<00:18,  3.18it/s][A
Training:  17%|█▋        | 12/69 [00:04<00:12,  4.63it/s][A
Training:  19%|█▉        | 13/69 [00:05<00:23,  2.42it/s][A
Training:  20%|██        | 14/69 [00:05<00:19,  2.85it/s][A
Training:  22%|██▏       | 15/69 [00:05<00:15,  3.44it/s][A
Training:  25%|██▍       | 17/69 [00:06<00:17,  2.91it/s][A
Training:  26%|██▌       | 18/69 [00:07<00:18,  2.72it/s][A
Training:  28%|██▊       | 19/69 [00:07<00:15,  3.21it/s][A
Training:  30%|███       | 21/69 [00:08

Epoch: 55/59 - Loss: 2.5962 - Accuracy: 0.9371



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:01<00:15,  1.92s/it][A
 44%|████▍     | 4/9 [00:02<00:01,  2.50it/s][A
 67%|██████▋   | 6/9 [00:03<00:01,  2.00it/s][A
100%|██████████| 9/9 [00:04<00:00,  2.19it/s][A
Epochs:  93%|█████████▎| 55/59 [25:18<01:50, 27.64s/it]

Val Loss: 3.4556 - Val Accuracy: 0.9368



Training:   0%|          | 0/69 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/69 [00:01<02:05,  1.85s/it][A
Training:   4%|▍         | 3/69 [00:02<00:36,  1.79it/s][A
Training:   7%|▋         | 5/69 [00:03<00:35,  1.82it/s][A
Training:   9%|▊         | 6/69 [00:03<00:27,  2.28it/s][A
Training:  10%|█         | 7/69 [00:03<00:22,  2.79it/s][A
Training:  13%|█▎        | 9/69 [00:04<00:24,  2.40it/s][A
Training:  16%|█▌        | 11/69 [00:04<00:16,  3.55it/s][A
Training:  19%|█▉        | 13/69 [00:05<00:22,  2.49it/s][A
Training:  22%|██▏       | 15/69 [00:05<00:15,  3.41it/s][A
Training:  23%|██▎       | 16/69 [00:06<00:13,  3.90it/s][A
Training:  25%|██▍       | 17/69 [00:07<00:23,  2.19it/s][A
Training:  28%|██▊       | 19/69 [00:07<00:15,  3.19it/s][A
Training:  30%|███       | 21/69 [00:08<00:21,  2.28it/s][A
Training:  33%|███▎      | 23/69 [00:08<00:14,  3.23it/s][A
Training:  36%|███▌      | 25/69 [00:10<00:18,  2.35it/s][A
Training:  42%|████▏     | 29/69 [00:1

Epoch: 56/59 - Loss: 2.5193 - Accuracy: 0.9399



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:01<00:13,  1.64s/it][A
 33%|███▎      | 3/9 [00:01<00:02,  2.06it/s][A
 56%|█████▌    | 5/9 [00:02<00:02,  1.91it/s][A
 78%|███████▊  | 7/9 [00:03<00:00,  3.08it/s][A
100%|██████████| 9/9 [00:03<00:00,  2.31it/s][A
Epochs:  95%|█████████▍| 56/59 [25:46<01:23, 27.84s/it]

Val Loss: 3.4587 - Val Accuracy: 0.9399



Training:   0%|          | 0/69 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/69 [00:01<01:57,  1.72s/it][A
Training:   3%|▎         | 2/69 [00:01<00:52,  1.28it/s][A
Training:   6%|▌         | 4/69 [00:01<00:21,  3.08it/s][A
Training:   9%|▊         | 6/69 [00:03<00:30,  2.10it/s][A
Training:  12%|█▏        | 8/69 [00:03<00:19,  3.15it/s][A
Training:  13%|█▎        | 9/69 [00:04<00:30,  1.98it/s][A
Training:  16%|█▌        | 11/69 [00:04<00:19,  3.04it/s][A
Training:  19%|█▉        | 13/69 [00:05<00:23,  2.42it/s][A
Training:  20%|██        | 14/69 [00:05<00:19,  2.86it/s][A
Training:  22%|██▏       | 15/69 [00:06<00:16,  3.37it/s][A
Training:  25%|██▍       | 17/69 [00:07<00:21,  2.42it/s][A
Training:  28%|██▊       | 19/69 [00:07<00:14,  3.43it/s][A
Training:  30%|███       | 21/69 [00:08<00:17,  2.76it/s][A
Training:  32%|███▏      | 22/69 [00:08<00:15,  3.09it/s][A
Training:  36%|███▌      | 25/69 [00:09<00:13,  3.17it/s][A
Training:  38%|███▊      | 26/69 [00:0

Epoch: 57/59 - Loss: 2.8221 - Accuracy: 0.9340



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:01<00:13,  1.74s/it][A
 44%|████▍     | 4/9 [00:01<00:01,  2.79it/s][A
 67%|██████▋   | 6/9 [00:03<00:01,  2.07it/s][A
100%|██████████| 9/9 [00:03<00:00,  2.34it/s][A
Epochs:  97%|█████████▋| 57/59 [26:13<00:55, 27.63s/it]

Val Loss: 3.4383 - Val Accuracy: 0.9416



Training:   0%|          | 0/69 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/69 [00:01<01:56,  1.72s/it][A
Training:   6%|▌         | 4/69 [00:01<00:25,  2.52it/s][A
Training:   7%|▋         | 5/69 [00:03<00:39,  1.62it/s][A
Training:  10%|█         | 7/69 [00:03<00:23,  2.69it/s][A
Training:  12%|█▏        | 8/69 [00:03<00:20,  2.99it/s][A
Training:  13%|█▎        | 9/69 [00:04<00:32,  1.82it/s][A
Training:  16%|█▌        | 11/69 [00:04<00:19,  2.90it/s][A
Training:  17%|█▋        | 12/69 [00:04<00:16,  3.41it/s][A
Training:  19%|█▉        | 13/69 [00:05<00:26,  2.13it/s][A
Training:  20%|██        | 14/69 [00:06<00:22,  2.47it/s][A
Training:  23%|██▎       | 16/69 [00:06<00:13,  3.86it/s][A
Training:  25%|██▍       | 17/69 [00:07<00:19,  2.62it/s][A
Training:  26%|██▌       | 18/69 [00:07<00:22,  2.23it/s][A
Training:  28%|██▊       | 19/69 [00:07<00:17,  2.78it/s][A
Training:  29%|██▉       | 20/69 [00:07<00:14,  3.40it/s][A
Training:  30%|███       | 21/69 [00:0

Epoch: 58/59 - Loss: 2.5329 - Accuracy: 0.9412



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:01<00:13,  1.74s/it][A
 33%|███▎      | 3/9 [00:01<00:03,  1.98it/s][A
 56%|█████▌    | 5/9 [00:03<00:02,  1.85it/s][A
100%|██████████| 9/9 [00:03<00:00,  2.39it/s][A
Epochs:  98%|█████████▊| 58/59 [26:41<00:27, 27.60s/it]

Val Loss: 3.2763 - Val Accuracy: 0.9237



Training:   0%|          | 0/69 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/69 [00:01<01:50,  1.62s/it][A
Training:   4%|▍         | 3/69 [00:01<00:31,  2.10it/s][A
Training:   7%|▋         | 5/69 [00:02<00:33,  1.88it/s][A
Training:   9%|▊         | 6/69 [00:03<00:26,  2.38it/s][A
Training:  10%|█         | 7/69 [00:03<00:21,  2.92it/s][A
Training:  13%|█▎        | 9/69 [00:04<00:27,  2.18it/s][A
Training:  17%|█▋        | 12/69 [00:04<00:14,  3.94it/s][A
Training:  20%|██        | 14/69 [00:05<00:19,  2.84it/s][A
Training:  23%|██▎       | 16/69 [00:05<00:14,  3.77it/s][A
Training:  26%|██▌       | 18/69 [00:06<00:18,  2.75it/s][A
Training:  28%|██▊       | 19/69 [00:07<00:15,  3.13it/s][A
Training:  30%|███       | 21/69 [00:08<00:19,  2.46it/s][A
Training:  33%|███▎      | 23/69 [00:08<00:13,  3.35it/s][A
Training:  35%|███▍      | 24/69 [00:08<00:11,  3.78it/s][A
Training:  36%|███▌      | 25/69 [00:09<00:19,  2.31it/s][A
Training:  38%|███▊      | 26/69 [00:0

Epoch: 59/59 - Loss: 2.6466 - Accuracy: 0.9353



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:01<00:13,  1.73s/it][A
 44%|████▍     | 4/9 [00:01<00:01,  2.58it/s][A
 56%|█████▌    | 5/9 [00:03<00:02,  1.64it/s][A
 89%|████████▉ | 8/9 [00:03<00:00,  3.06it/s][A
100%|██████████| 9/9 [00:03<00:00,  2.27it/s][A
Epochs: 100%|██████████| 59/59 [27:08<00:00, 27.61s/it]


Val Loss: 5.4045 - Val Accuracy: 0.9135


[32m[I 2023-12-14 23:38:37,064][0m Trial 3 finished with value: 0.9134652018547058 and parameters: {'loss_learning_rate': 0.007241145783203654, 'learning_rate': 0.02124392374572327, 'weight_decay': 0.0004373342967663484, 'epsilon': 8.320175162308942e-08, 'batch_size': 203, 'epochs': 59}. Best is trial 2 with value: 0.937753438949585.[0m


Learning rate for Loss: 0.00029022607343956355
Learning rate: 3.3347055279343715e-05
Weight decay: 0.00013857639851633783
Epsilon: 5.910646219604286e-09
Batch size: 125
Number of epochs: 38


Epochs:   0%|          | 0/38 [00:00<?, ?it/s]
Training:   0%|          | 0/112 [00:00<?, ?it/s][A
Training:   1%|          | 1/112 [00:01<02:51,  1.55s/it][A
Training:   3%|▎         | 3/112 [00:01<00:48,  2.26it/s][A
Training:   4%|▍         | 5/112 [00:02<00:39,  2.70it/s][A
Training:   6%|▋         | 7/112 [00:02<00:26,  4.03it/s][A
Training:   8%|▊         | 9/112 [00:03<00:28,  3.62it/s][A
Training:  10%|▉         | 11/112 [00:03<00:20,  4.88it/s][A
Training:  12%|█▏        | 13/112 [00:03<00:24,  4.01it/s][A
Training:  14%|█▍        | 16/112 [00:04<00:16,  5.99it/s][A
Training:  16%|█▌        | 18/112 [00:04<00:22,  4.19it/s][A
Training:  18%|█▊        | 20/112 [00:05<00:17,  5.15it/s][A
Training:  19%|█▉        | 21/112 [00:05<00:24,  3.77it/s][A
Training:  20%|█▉        | 22/112 [00:05<00:21,  4.20it/s][A
Training:  21%|██▏       | 24/112 [00:05<00:15,  5.71it/s][A
Training:  22%|██▏       | 25/112 [00:06<00:22,  3.93it/s][A
Training:  24%|██▍       | 27/112 [00

Epoch: 1/38 - Loss: 19.4141 - Accuracy: 0.6124



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:15,  1.19s/it][A
 21%|██▏       | 3/14 [00:01<00:03,  2.85it/s][A
 36%|███▌      | 5/14 [00:01<00:03,  2.96it/s][A
 50%|█████     | 7/14 [00:02<00:01,  4.58it/s][A
 64%|██████▍   | 9/14 [00:02<00:01,  3.35it/s][A
 79%|███████▊  | 11/14 [00:03<00:00,  4.72it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.65it/s][A
Epochs:   3%|▎         | 1/38 [00:28<17:24, 28.24s/it]

Val Loss: 15.0819 - Val Accuracy: 0.7680



Training:   0%|          | 0/112 [00:00<?, ?it/s][A
Training:   1%|          | 1/112 [00:01<02:03,  1.11s/it][A
Training:   3%|▎         | 3/112 [00:01<00:38,  2.86it/s][A
Training:   4%|▍         | 5/112 [00:01<00:33,  3.22it/s][A
Training:   5%|▌         | 6/112 [00:01<00:28,  3.71it/s][A
Training:   7%|▋         | 8/112 [00:02<00:18,  5.66it/s][A
Training:   9%|▉         | 10/112 [00:02<00:25,  3.97it/s][A
Training:  11%|█         | 12/112 [00:02<00:18,  5.43it/s][A
Training:  12%|█▎        | 14/112 [00:03<00:26,  3.72it/s][A
Training:  14%|█▍        | 16/112 [00:03<00:19,  4.87it/s][A
Training:  15%|█▌        | 17/112 [00:04<00:27,  3.40it/s][A
Training:  17%|█▋        | 19/112 [00:04<00:19,  4.78it/s][A
Training:  19%|█▉        | 21/112 [00:05<00:21,  4.19it/s][A
Training:  21%|██        | 23/112 [00:05<00:16,  5.47it/s][A
Training:  22%|██▏       | 25/112 [00:06<00:19,  4.49it/s][A
Training:  24%|██▍       | 27/112 [00:06<00:14,  5.84it/s][A
Training:  26%|██▌   

Epoch: 2/38 - Loss: 11.2783 - Accuracy: 0.8067



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:14,  1.13s/it][A
 14%|█▍        | 2/14 [00:01<00:06,  1.84it/s][A
 36%|███▌      | 5/14 [00:01<00:02,  3.17it/s][A
 43%|████▎     | 6/14 [00:02<00:02,  3.83it/s][A
 64%|██████▍   | 9/14 [00:02<00:01,  4.47it/s][A
 71%|███████▏  | 10/14 [00:02<00:00,  4.31it/s][A
 93%|█████████▎| 13/14 [00:03<00:00,  5.20it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.72it/s][A
Epochs:   5%|▌         | 2/38 [00:55<16:46, 27.95s/it]

Val Loss: 9.0953 - Val Accuracy: 0.8682



Training:   0%|          | 0/112 [00:00<?, ?it/s][A
Training:   1%|          | 1/112 [00:01<02:30,  1.35s/it][A
Training:   3%|▎         | 3/112 [00:01<00:44,  2.47it/s][A
Training:   4%|▍         | 5/112 [00:02<00:39,  2.69it/s][A
Training:   8%|▊         | 9/112 [00:02<00:26,  3.91it/s][A
Training:   9%|▉         | 10/112 [00:03<00:23,  4.30it/s][A
Training:  11%|█         | 12/112 [00:03<00:17,  5.66it/s][A
Training:  12%|█▏        | 13/112 [00:03<00:24,  3.96it/s][A
Training:  12%|█▎        | 14/112 [00:03<00:24,  4.01it/s][A
Training:  15%|█▌        | 17/112 [00:04<00:20,  4.68it/s][A
Training:  16%|█▌        | 18/112 [00:04<00:23,  4.07it/s][A
Training:  18%|█▊        | 20/112 [00:04<00:16,  5.53it/s][A
Training:  19%|█▉        | 21/112 [00:05<00:19,  4.75it/s][A
Training:  20%|█▉        | 22/112 [00:05<00:20,  4.45it/s][A
Training:  21%|██▏       | 24/112 [00:05<00:14,  6.19it/s][A
Training:  22%|██▏       | 25/112 [00:06<00:20,  4.30it/s][A
Training:  23%|██▎  

Epoch: 3/38 - Loss: 8.3429 - Accuracy: 0.8655



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:16,  1.26s/it][A
 21%|██▏       | 3/14 [00:01<00:04,  2.62it/s][A
 36%|███▌      | 5/14 [00:02<00:03,  2.81it/s][A
 50%|█████     | 7/14 [00:02<00:01,  4.31it/s][A
 64%|██████▍   | 9/14 [00:02<00:01,  3.63it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.81it/s][A
Epochs:   8%|▊         | 3/38 [01:23<16:15, 27.88s/it]

Val Loss: 7.5433 - Val Accuracy: 0.8917



Training:   0%|          | 0/112 [00:00<?, ?it/s][A
Training:   1%|          | 1/112 [00:01<02:10,  1.17s/it][A
Training:   3%|▎         | 3/112 [00:01<00:39,  2.77it/s][A
Training:   4%|▍         | 5/112 [00:02<00:41,  2.57it/s][A
Training:   6%|▋         | 7/112 [00:02<00:26,  3.93it/s][A
Training:   8%|▊         | 9/112 [00:03<00:29,  3.45it/s][A
Training:  12%|█▏        | 13/112 [00:03<00:26,  3.80it/s][A
Training:  15%|█▌        | 17/112 [00:04<00:22,  4.23it/s][A
Training:  17%|█▋        | 19/112 [00:04<00:18,  5.12it/s][A
Training:  19%|█▉        | 21/112 [00:05<00:22,  4.09it/s][A
Training:  21%|██▏       | 24/112 [00:05<00:15,  5.70it/s][A
Training:  23%|██▎       | 26/112 [00:06<00:19,  4.41it/s][A
Training:  26%|██▌       | 29/112 [00:07<00:21,  3.92it/s][A
Training:  28%|██▊       | 31/112 [00:07<00:16,  4.84it/s][A
Training:  29%|██▉       | 33/112 [00:08<00:19,  3.99it/s][A
Training:  32%|███▏      | 36/112 [00:08<00:13,  5.77it/s][A
Training:  34%|███▍  

Epoch: 4/38 - Loss: 7.0494 - Accuracy: 0.8882



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:17,  1.31s/it][A
 21%|██▏       | 3/14 [00:01<00:04,  2.49it/s][A
 29%|██▊       | 4/14 [00:01<00:02,  3.36it/s][A
 36%|███▌      | 5/14 [00:02<00:03,  2.81it/s][A
 43%|████▎     | 6/14 [00:02<00:02,  3.08it/s][A
 57%|█████▋    | 8/14 [00:02<00:01,  5.16it/s][A
 71%|███████▏  | 10/14 [00:03<00:01,  3.63it/s][A
 93%|█████████▎| 13/14 [00:03<00:00,  4.73it/s][A
100%|██████████| 14/14 [00:04<00:00,  3.47it/s][A
Epochs:  11%|█         | 4/38 [01:52<15:54, 28.07s/it]

Val Loss: 6.5711 - Val Accuracy: 0.8998



Training:   0%|          | 0/112 [00:00<?, ?it/s][A
Training:   1%|          | 1/112 [00:01<02:23,  1.30s/it][A
Training:   3%|▎         | 3/112 [00:01<00:42,  2.59it/s][A
Training:   4%|▍         | 5/112 [00:02<00:39,  2.71it/s][A
Training:   6%|▋         | 7/112 [00:02<00:26,  3.99it/s][A
Training:   8%|▊         | 9/112 [00:02<00:26,  3.90it/s][A
Training:  11%|█         | 12/112 [00:03<00:17,  5.65it/s][A
Training:  12%|█▏        | 13/112 [00:03<00:23,  4.14it/s][A
Training:  13%|█▎        | 15/112 [00:03<00:17,  5.41it/s][A
Training:  14%|█▍        | 16/112 [00:04<00:19,  4.99it/s][A
Training:  15%|█▌        | 17/112 [00:04<00:25,  3.69it/s][A
Training:  17%|█▋        | 19/112 [00:04<00:17,  5.34it/s][A
Training:  18%|█▊        | 20/112 [00:04<00:17,  5.12it/s][A
Training:  19%|█▉        | 21/112 [00:05<00:25,  3.60it/s][A
Training:  21%|██        | 23/112 [00:05<00:17,  5.12it/s][A
Training:  21%|██▏       | 24/112 [00:05<00:17,  5.01it/s][A
Training:  22%|██▏   

Epoch: 5/38 - Loss: 6.2536 - Accuracy: 0.9000



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:15,  1.20s/it][A
 14%|█▍        | 2/14 [00:01<00:06,  1.75it/s][A
 36%|███▌      | 5/14 [00:01<00:02,  3.18it/s][A
 43%|████▎     | 6/14 [00:02<00:02,  3.64it/s][A
 64%|██████▍   | 9/14 [00:02<00:01,  3.67it/s][A
 86%|████████▌ | 12/14 [00:03<00:00,  5.80it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.53it/s][A
Epochs:  13%|█▎        | 5/38 [02:20<15:28, 28.14s/it]

Val Loss: 5.9249 - Val Accuracy: 0.9083



Training:   0%|          | 0/112 [00:00<?, ?it/s][A
Training:   1%|          | 1/112 [00:01<02:06,  1.14s/it][A
Training:   2%|▏         | 2/112 [00:01<00:58,  1.90it/s][A
Training:   4%|▍         | 5/112 [00:01<00:32,  3.27it/s][A
Training:   7%|▋         | 8/112 [00:02<00:19,  5.40it/s][A
Training:   8%|▊         | 9/112 [00:02<00:28,  3.56it/s][A
Training:  10%|▉         | 11/112 [00:02<00:20,  4.97it/s][A
Training:  12%|█▏        | 13/112 [00:03<00:25,  3.83it/s][A
Training:  12%|█▎        | 14/112 [00:03<00:22,  4.31it/s][A
Training:  13%|█▎        | 15/112 [00:03<00:20,  4.81it/s][A
Training:  15%|█▌        | 17/112 [00:04<00:21,  4.38it/s][A
Training:  16%|█▌        | 18/112 [00:04<00:19,  4.81it/s][A
Training:  18%|█▊        | 20/112 [00:04<00:14,  6.21it/s][A
Training:  19%|█▉        | 21/112 [00:05<00:19,  4.72it/s][A
Training:  20%|█▉        | 22/112 [00:05<00:18,  4.83it/s][A
Training:  21%|██▏       | 24/112 [00:05<00:13,  6.64it/s][A
Training:  22%|██▏   

Epoch: 6/38 - Loss: 5.7011 - Accuracy: 0.9069



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:16,  1.24s/it][A
 29%|██▊       | 4/14 [00:01<00:02,  3.74it/s][A
 43%|████▎     | 6/14 [00:02<00:02,  3.12it/s][A
 50%|█████     | 7/14 [00:02<00:01,  3.70it/s][A
 64%|██████▍   | 9/14 [00:02<00:01,  3.46it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.81it/s][A
Epochs:  16%|█▌        | 6/38 [02:48<14:56, 28.01s/it]

Val Loss: 5.4790 - Val Accuracy: 0.9146



Training:   0%|          | 0/112 [00:00<?, ?it/s][A
Training:   1%|          | 1/112 [00:01<02:42,  1.46s/it][A
Training:   4%|▎         | 4/112 [00:01<00:33,  3.23it/s][A
Training:   5%|▌         | 6/112 [00:02<00:33,  3.12it/s][A
Training:   7%|▋         | 8/112 [00:02<00:23,  4.41it/s][A
Training:   9%|▉         | 10/112 [00:03<00:26,  3.85it/s][A
Training:  12%|█▏        | 13/112 [00:03<00:25,  3.81it/s][A
Training:  13%|█▎        | 15/112 [00:03<00:20,  4.82it/s][A
Training:  15%|█▌        | 17/112 [00:04<00:25,  3.79it/s][A
Training:  17%|█▋        | 19/112 [00:04<00:18,  4.97it/s][A
Training:  19%|█▉        | 21/112 [00:05<00:22,  4.07it/s][A
Training:  21%|██▏       | 24/112 [00:05<00:14,  6.03it/s][A
Training:  23%|██▎       | 26/112 [00:06<00:17,  4.88it/s][A
Training:  26%|██▌       | 29/112 [00:07<00:19,  4.37it/s][A
Training:  28%|██▊       | 31/112 [00:07<00:14,  5.47it/s][A
Training:  29%|██▉       | 33/112 [00:08<00:19,  4.15it/s][A
Training:  31%|███▏ 

Epoch: 7/38 - Loss: 5.2943 - Accuracy: 0.9138



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:16,  1.28s/it][A
 29%|██▊       | 4/14 [00:01<00:02,  3.56it/s][A
 43%|████▎     | 6/14 [00:02<00:02,  3.46it/s][A
 64%|██████▍   | 9/14 [00:02<00:01,  3.56it/s][A
 79%|███████▊  | 11/14 [00:02<00:00,  4.80it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.77it/s][A
Epochs:  18%|█▊        | 7/38 [03:16<14:27, 27.99s/it]

Val Loss: 5.2242 - Val Accuracy: 0.9118



Training:   0%|          | 0/112 [00:00<?, ?it/s][A
Training:   1%|          | 1/112 [00:01<02:15,  1.22s/it][A
Training:   4%|▎         | 4/112 [00:01<00:28,  3.80it/s][A
Training:   5%|▌         | 6/112 [00:01<00:30,  3.53it/s][A
Training:   7%|▋         | 8/112 [00:02<00:20,  5.08it/s][A
Training:   9%|▉         | 10/112 [00:02<00:25,  3.94it/s][A
Training:  10%|▉         | 11/112 [00:02<00:22,  4.48it/s][A
Training:  12%|█▏        | 13/112 [00:03<00:27,  3.60it/s][A
Training:  13%|█▎        | 15/112 [00:03<00:20,  4.67it/s][A
Training:  15%|█▌        | 17/112 [00:04<00:23,  4.07it/s][A
Training:  17%|█▋        | 19/112 [00:04<00:17,  5.37it/s][A
Training:  19%|█▉        | 21/112 [00:05<00:20,  4.53it/s][A
Training:  20%|█▉        | 22/112 [00:05<00:19,  4.71it/s][A
Training:  22%|██▏       | 25/112 [00:05<00:18,  4.63it/s][A
Training:  23%|██▎       | 26/112 [00:06<00:16,  5.10it/s][A
Training:  26%|██▌       | 29/112 [00:06<00:19,  4.35it/s][A
Training:  28%|██▊  

Epoch: 8/38 - Loss: 4.9758 - Accuracy: 0.9179



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:15,  1.18s/it][A
 29%|██▊       | 4/14 [00:01<00:02,  3.96it/s][A
 43%|████▎     | 6/14 [00:02<00:02,  2.99it/s][A
 57%|█████▋    | 8/14 [00:02<00:01,  4.32it/s][A
 71%|███████▏  | 10/14 [00:03<00:01,  3.59it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.60it/s][A
Epochs:  21%|██        | 8/38 [03:43<13:56, 27.88s/it]

Val Loss: 5.0113 - Val Accuracy: 0.9175



Training:   0%|          | 0/112 [00:00<?, ?it/s][A
Training:   1%|          | 1/112 [00:01<01:50,  1.00it/s][A
Training:   3%|▎         | 3/112 [00:01<00:35,  3.05it/s][A
Training:   4%|▍         | 5/112 [00:01<00:32,  3.25it/s][A
Training:   6%|▋         | 7/112 [00:01<00:22,  4.60it/s][A
Training:   8%|▊         | 9/112 [00:02<00:26,  3.94it/s][A
Training:   9%|▉         | 10/112 [00:02<00:22,  4.51it/s][A
Training:  10%|▉         | 11/112 [00:02<00:20,  5.03it/s][A
Training:  12%|█▏        | 13/112 [00:03<00:25,  3.95it/s][A
Training:  13%|█▎        | 15/112 [00:03<00:18,  5.28it/s][A
Training:  15%|█▌        | 17/112 [00:04<00:23,  4.07it/s][A
Training:  17%|█▋        | 19/112 [00:04<00:17,  5.27it/s][A
Training:  19%|█▉        | 21/112 [00:05<00:21,  4.33it/s][A
Training:  21%|██        | 23/112 [00:05<00:15,  5.74it/s][A
Training:  22%|██▏       | 25/112 [00:06<00:21,  4.11it/s][A
Training:  24%|██▍       | 27/112 [00:06<00:16,  5.10it/s][A
Training:  25%|██▌   

Epoch: 9/38 - Loss: 4.7365 - Accuracy: 0.9210



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:16,  1.27s/it][A
 29%|██▊       | 4/14 [00:01<00:02,  3.66it/s][A
 43%|████▎     | 6/14 [00:02<00:02,  2.82it/s][A
 64%|██████▍   | 9/14 [00:02<00:01,  3.52it/s][A
 71%|███████▏  | 10/14 [00:03<00:01,  4.00it/s][A
 86%|████████▌ | 12/14 [00:03<00:00,  5.11it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.60it/s][A
Epochs:  24%|██▎       | 9/38 [04:11<13:25, 27.77s/it]

Val Loss: 4.7623 - Val Accuracy: 0.9215



Training:   0%|          | 0/112 [00:00<?, ?it/s][A
Training:   1%|          | 1/112 [00:01<02:12,  1.19s/it][A
Training:   3%|▎         | 3/112 [00:01<00:38,  2.84it/s][A
Training:   4%|▍         | 5/112 [00:02<00:42,  2.50it/s][A
Training:   5%|▌         | 6/112 [00:02<00:33,  3.12it/s][A
Training:   7%|▋         | 8/112 [00:02<00:21,  4.87it/s][A
Training:   9%|▉         | 10/112 [00:03<00:26,  3.92it/s][A
Training:  11%|█         | 12/112 [00:03<00:18,  5.33it/s][A
Training:  12%|█▎        | 14/112 [00:03<00:22,  4.37it/s][A
Training:  15%|█▌        | 17/112 [00:04<00:23,  3.99it/s][A
Training:  18%|█▊        | 20/112 [00:04<00:15,  5.87it/s][A
Training:  20%|█▉        | 22/112 [00:05<00:19,  4.72it/s][A
Training:  22%|██▏       | 25/112 [00:06<00:19,  4.54it/s][A
Training:  24%|██▍       | 27/112 [00:06<00:15,  5.54it/s][A
Training:  26%|██▌       | 29/112 [00:07<00:18,  4.37it/s][A
Training:  28%|██▊       | 31/112 [00:07<00:15,  5.19it/s][A
Training:  29%|██▉   

Epoch: 10/38 - Loss: 4.5248 - Accuracy: 0.9238



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:13,  1.04s/it][A
 21%|██▏       | 3/14 [00:01<00:03,  3.24it/s][A
 36%|███▌      | 5/14 [00:01<00:03,  2.94it/s][A
 57%|█████▋    | 8/14 [00:02<00:01,  4.67it/s][A
 64%|██████▍   | 9/14 [00:02<00:01,  3.58it/s][A
 86%|████████▌ | 12/14 [00:02<00:00,  5.23it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.96it/s][A
Epochs:  26%|██▋       | 10/38 [04:38<12:56, 27.73s/it]

Val Loss: 4.5935 - Val Accuracy: 0.9210



Training:   0%|          | 0/112 [00:00<?, ?it/s][A
Training:   1%|          | 1/112 [00:01<02:14,  1.21s/it][A
Training:   2%|▏         | 2/112 [00:01<01:02,  1.76it/s][A
Training:   4%|▍         | 5/112 [00:02<00:39,  2.70it/s][A
Training:   6%|▋         | 7/112 [00:02<00:25,  4.04it/s][A
Training:   8%|▊         | 9/112 [00:03<00:31,  3.25it/s][A
Training:  10%|▉         | 11/112 [00:03<00:22,  4.50it/s][A
Training:  12%|█▏        | 13/112 [00:03<00:23,  4.20it/s][A
Training:  14%|█▍        | 16/112 [00:03<00:14,  6.43it/s][A
Training:  16%|█▌        | 18/112 [00:04<00:21,  4.41it/s][A
Training:  19%|█▉        | 21/112 [00:05<00:22,  4.09it/s][A
Training:  21%|██▏       | 24/112 [00:05<00:15,  5.67it/s][A
Training:  23%|██▎       | 26/112 [00:06<00:18,  4.55it/s][A
Training:  26%|██▌       | 29/112 [00:07<00:21,  3.92it/s][A
Training:  28%|██▊       | 31/112 [00:07<00:16,  4.85it/s][A
Training:  29%|██▉       | 33/112 [00:08<00:18,  4.34it/s][A
Training:  32%|███▏  

Epoch: 11/38 - Loss: 4.3725 - Accuracy: 0.9262



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:13,  1.02s/it][A
 36%|███▌      | 5/14 [00:01<00:02,  3.28it/s][A
 50%|█████     | 7/14 [00:01<00:01,  4.56it/s][A
 64%|██████▍   | 9/14 [00:02<00:01,  3.86it/s][A
100%|██████████| 14/14 [00:03<00:00,  4.22it/s][A
Epochs:  29%|██▉       | 11/38 [05:05<12:23, 27.53s/it]

Val Loss: 4.5367 - Val Accuracy: 0.9181



Training:   0%|          | 0/112 [00:00<?, ?it/s][A
Training:   1%|          | 1/112 [00:01<02:20,  1.26s/it][A
Training:   3%|▎         | 3/112 [00:01<00:40,  2.69it/s][A
Training:   4%|▍         | 5/112 [00:02<00:39,  2.73it/s][A
Training:   5%|▌         | 6/112 [00:02<00:32,  3.27it/s][A
Training:   7%|▋         | 8/112 [00:02<00:20,  5.06it/s][A
Training:   9%|▉         | 10/112 [00:03<00:27,  3.78it/s][A
Training:  12%|█▏        | 13/112 [00:03<00:24,  4.09it/s][A
Training:  12%|█▎        | 14/112 [00:03<00:21,  4.56it/s][A
Training:  14%|█▍        | 16/112 [00:04<00:16,  5.69it/s][A
Training:  15%|█▌        | 17/112 [00:04<00:23,  4.00it/s][A
Training:  17%|█▋        | 19/112 [00:04<00:16,  5.50it/s][A
Training:  19%|█▉        | 21/112 [00:05<00:22,  3.99it/s][A
Training:  21%|██▏       | 24/112 [00:05<00:14,  6.00it/s][A
Training:  23%|██▎       | 26/112 [00:06<00:19,  4.42it/s][A
Training:  25%|██▌       | 28/112 [00:06<00:15,  5.31it/s][A
Training:  26%|██▌   

Epoch: 12/38 - Loss: 4.2412 - Accuracy: 0.9284



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:16,  1.24s/it][A
 29%|██▊       | 4/14 [00:01<00:03,  3.06it/s][A
 36%|███▌      | 5/14 [00:01<00:03,  2.96it/s][A
 50%|█████     | 7/14 [00:02<00:01,  4.70it/s][A
 57%|█████▋    | 8/14 [00:02<00:01,  4.90it/s][A
 64%|██████▍   | 9/14 [00:02<00:01,  3.40it/s][A
 86%|████████▌ | 12/14 [00:03<00:00,  5.65it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.78it/s][A
Epochs:  32%|███▏      | 12/38 [05:33<11:58, 27.62s/it]

Val Loss: 4.3772 - Val Accuracy: 0.9215



Training:   0%|          | 0/112 [00:00<?, ?it/s][A
Training:   1%|          | 1/112 [00:01<02:31,  1.36s/it][A
Training:   4%|▍         | 5/112 [00:02<00:38,  2.74it/s][A
Training:   6%|▋         | 7/112 [00:02<00:26,  4.00it/s][A
Training:   8%|▊         | 9/112 [00:02<00:29,  3.49it/s][A
Training:   9%|▉         | 10/112 [00:03<00:25,  3.93it/s][A
Training:  11%|█         | 12/112 [00:03<00:19,  5.19it/s][A
Training:  12%|█▏        | 13/112 [00:03<00:26,  3.68it/s][A
Training:  14%|█▍        | 16/112 [00:03<00:15,  6.13it/s][A
Training:  16%|█▌        | 18/112 [00:04<00:20,  4.63it/s][A
Training:  19%|█▉        | 21/112 [00:05<00:21,  4.30it/s][A
Training:  21%|██        | 23/112 [00:05<00:16,  5.45it/s][A
Training:  22%|██▏       | 25/112 [00:06<00:19,  4.42it/s][A
Training:  24%|██▍       | 27/112 [00:06<00:15,  5.43it/s][A
Training:  26%|██▌       | 29/112 [00:07<00:19,  4.35it/s][A
Training:  28%|██▊       | 31/112 [00:07<00:14,  5.49it/s][A
Training:  29%|██▉  

Epoch: 13/38 - Loss: 4.1254 - Accuracy: 0.9314



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:19,  1.48s/it][A
 21%|██▏       | 3/14 [00:01<00:04,  2.35it/s][A
 36%|███▌      | 5/14 [00:02<00:03,  2.87it/s][A
 50%|█████     | 7/14 [00:02<00:01,  4.11it/s][A
 64%|██████▍   | 9/14 [00:02<00:01,  3.90it/s][A
 79%|███████▊  | 11/14 [00:03<00:00,  4.84it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.64it/s][A
Epochs:  34%|███▍      | 13/38 [06:01<11:32, 27.70s/it]

Val Loss: 4.3511 - Val Accuracy: 0.9186



Training:   0%|          | 0/112 [00:00<?, ?it/s][A
Training:   1%|          | 1/112 [00:01<02:23,  1.29s/it][A
Training:   2%|▏         | 2/112 [00:01<01:06,  1.65it/s][A
Training:   4%|▍         | 5/112 [00:02<00:34,  3.15it/s][A
Training:   5%|▌         | 6/112 [00:02<00:28,  3.69it/s][A
Training:   7%|▋         | 8/112 [00:02<00:21,  4.94it/s][A
Training:   8%|▊         | 9/112 [00:02<00:24,  4.16it/s][A
Training:   9%|▉         | 10/112 [00:02<00:24,  4.22it/s][A
Training:  11%|█         | 12/112 [00:03<00:18,  5.31it/s][A
Training:  12%|█▏        | 13/112 [00:03<00:24,  4.11it/s][A
Training:  13%|█▎        | 15/112 [00:03<00:16,  5.93it/s][A
Training:  14%|█▍        | 16/112 [00:04<00:18,  5.26it/s][A
Training:  15%|█▌        | 17/112 [00:04<00:24,  3.83it/s][A
Training:  17%|█▋        | 19/112 [00:04<00:17,  5.32it/s][A
Training:  18%|█▊        | 20/112 [00:04<00:16,  5.59it/s][A
Training:  19%|█▉        | 21/112 [00:05<00:21,  4.21it/s][A
Training:  20%|█▉     

Epoch: 14/38 - Loss: 4.0392 - Accuracy: 0.9330



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:17,  1.32s/it][A
 21%|██▏       | 3/14 [00:01<00:04,  2.61it/s][A
 36%|███▌      | 5/14 [00:02<00:03,  2.93it/s][A
 43%|████▎     | 6/14 [00:02<00:02,  3.08it/s][A
 50%|█████     | 7/14 [00:02<00:01,  3.60it/s][A
 64%|██████▍   | 9/14 [00:03<00:01,  3.61it/s][A
 71%|███████▏  | 10/14 [00:03<00:00,  4.14it/s][A
100%|██████████| 14/14 [00:04<00:00,  3.46it/s][A
Epochs:  37%|███▋      | 14/38 [06:30<11:09, 27.92s/it]

Val Loss: 4.2266 - Val Accuracy: 0.9284



Training:   0%|          | 0/112 [00:00<?, ?it/s][A
Training:   1%|          | 1/112 [00:00<01:47,  1.03it/s][A
Training:   2%|▏         | 2/112 [00:01<00:55,  1.98it/s][A
Training:   4%|▍         | 5/112 [00:01<00:28,  3.73it/s][A
Training:   5%|▌         | 6/112 [00:02<00:31,  3.33it/s][A
Training:   6%|▋         | 7/112 [00:02<00:26,  4.02it/s][A
Training:   8%|▊         | 9/112 [00:02<00:25,  4.10it/s][A
Training:   9%|▉         | 10/112 [00:02<00:25,  4.01it/s][A
Training:  12%|█▏        | 13/112 [00:03<00:20,  4.80it/s][A
Training:  12%|█▎        | 14/112 [00:03<00:23,  4.18it/s][A
Training:  13%|█▎        | 15/112 [00:03<00:20,  4.71it/s][A
Training:  15%|█▌        | 17/112 [00:04<00:16,  5.80it/s][A
Training:  16%|█▌        | 18/112 [00:04<00:22,  4.22it/s][A
Training:  17%|█▋        | 19/112 [00:04<00:22,  4.11it/s][A
Training:  19%|█▉        | 21/112 [00:05<00:16,  5.67it/s][A
Training:  20%|█▉        | 22/112 [00:05<00:21,  4.28it/s][A
Training:  21%|██     

Epoch: 15/38 - Loss: 3.9466 - Accuracy: 0.9331



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:13,  1.01s/it][A
 21%|██▏       | 3/14 [00:01<00:03,  3.24it/s][A
 36%|███▌      | 5/14 [00:01<00:02,  3.41it/s][A
 50%|█████     | 7/14 [00:01<00:01,  5.16it/s][A
 64%|██████▍   | 9/14 [00:02<00:01,  3.95it/s][A
 86%|████████▌ | 12/14 [00:02<00:00,  6.30it/s][A
100%|██████████| 14/14 [00:03<00:00,  4.09it/s][A
Epochs:  39%|███▉      | 15/38 [06:57<10:39, 27.80s/it]

Val Loss: 4.1366 - Val Accuracy: 0.9278



Training:   0%|          | 0/112 [00:00<?, ?it/s][A
Training:   1%|          | 1/112 [00:01<02:02,  1.10s/it][A
Training:   4%|▍         | 5/112 [00:01<00:37,  2.88it/s][A
Training:   6%|▋         | 7/112 [00:02<00:25,  4.06it/s][A
Training:   8%|▊         | 9/112 [00:02<00:28,  3.59it/s][A
Training:  10%|▉         | 11/112 [00:02<00:20,  4.84it/s][A
Training:  12%|█▏        | 13/112 [00:03<00:26,  3.79it/s][A
Training:  14%|█▍        | 16/112 [00:03<00:17,  5.52it/s][A
Training:  16%|█▌        | 18/112 [00:04<00:20,  4.67it/s][A
Training:  18%|█▊        | 20/112 [00:04<00:15,  5.77it/s][A
Training:  19%|█▉        | 21/112 [00:05<00:22,  4.04it/s][A
Training:  21%|██▏       | 24/112 [00:05<00:14,  6.23it/s][A
Training:  23%|██▎       | 26/112 [00:06<00:20,  4.22it/s][A
Training:  25%|██▌       | 28/112 [00:06<00:15,  5.39it/s][A
Training:  27%|██▋       | 30/112 [00:07<00:21,  3.75it/s][A
Training:  29%|██▊       | 32/112 [00:07<00:16,  4.83it/s][A
Training:  30%|███  

Epoch: 16/38 - Loss: 3.8558 - Accuracy: 0.9344



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:14,  1.08s/it][A
 14%|█▍        | 2/14 [00:01<00:06,  1.83it/s][A
 29%|██▊       | 4/14 [00:01<00:02,  4.23it/s][A
 43%|████▎     | 6/14 [00:02<00:02,  3.32it/s][A
 57%|█████▋    | 8/14 [00:02<00:01,  4.98it/s][A
 71%|███████▏  | 10/14 [00:03<00:01,  3.57it/s][A
 93%|█████████▎| 13/14 [00:03<00:00,  4.73it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.71it/s][A
Epochs:  42%|████▏     | 16/38 [07:25<10:11, 27.81s/it]

Val Loss: 4.1690 - Val Accuracy: 0.9221



Training:   0%|          | 0/112 [00:00<?, ?it/s][A
Training:   1%|          | 1/112 [00:01<02:12,  1.19s/it][A
Training:   4%|▎         | 4/112 [00:01<00:28,  3.79it/s][A
Training:   5%|▌         | 6/112 [00:02<00:31,  3.38it/s][A
Training:   6%|▋         | 7/112 [00:02<00:26,  3.94it/s][A
Training:   8%|▊         | 9/112 [00:02<00:31,  3.32it/s][A
Training:  10%|▉         | 11/112 [00:03<00:21,  4.61it/s][A
Training:  12%|█▏        | 13/112 [00:03<00:26,  3.80it/s][A
Training:  13%|█▎        | 15/112 [00:03<00:19,  5.07it/s][A
Training:  15%|█▌        | 17/112 [00:04<00:23,  4.08it/s][A
Training:  16%|█▌        | 18/112 [00:04<00:20,  4.57it/s][A
Training:  18%|█▊        | 20/112 [00:04<00:15,  6.06it/s][A
Training:  20%|█▉        | 22/112 [00:05<00:19,  4.63it/s][A
Training:  21%|██▏       | 24/112 [00:05<00:14,  6.03it/s][A
Training:  23%|██▎       | 26/112 [00:06<00:19,  4.44it/s][A
Training:  25%|██▌       | 28/112 [00:06<00:14,  5.79it/s][A
Training:  27%|██▋   

Epoch: 17/38 - Loss: 3.8174 - Accuracy: 0.9364



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:15,  1.18s/it][A
 29%|██▊       | 4/14 [00:01<00:02,  3.91it/s][A
 43%|████▎     | 6/14 [00:02<00:02,  3.21it/s][A
 57%|█████▋    | 8/14 [00:02<00:01,  4.49it/s][A
 71%|███████▏  | 10/14 [00:02<00:01,  3.66it/s][A
 86%|████████▌ | 12/14 [00:03<00:00,  4.83it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.75it/s][A
Epochs:  45%|████▍     | 17/38 [07:53<09:44, 27.81s/it]

Val Loss: 4.0509 - Val Accuracy: 0.9284



Training:   0%|          | 0/112 [00:00<?, ?it/s][A
Training:   1%|          | 1/112 [00:01<02:20,  1.27s/it][A
Training:   2%|▏         | 2/112 [00:01<01:04,  1.70it/s][A
Training:   4%|▎         | 4/112 [00:01<00:27,  3.95it/s][A
Training:   5%|▌         | 6/112 [00:02<00:35,  3.00it/s][A
Training:   7%|▋         | 8/112 [00:02<00:22,  4.55it/s][A
Training:   9%|▉         | 10/112 [00:03<00:28,  3.56it/s][A
Training:  12%|█▏        | 13/112 [00:03<00:24,  3.98it/s][A
Training:  14%|█▍        | 16/112 [00:03<00:16,  5.95it/s][A
Training:  16%|█▌        | 18/112 [00:04<00:22,  4.17it/s][A
Training:  19%|█▉        | 21/112 [00:05<00:23,  3.94it/s][A
Training:  21%|██        | 23/112 [00:05<00:18,  4.88it/s][A
Training:  22%|██▏       | 25/112 [00:06<00:21,  4.01it/s][A
Training:  24%|██▍       | 27/112 [00:06<00:16,  5.12it/s][A
Training:  26%|██▌       | 29/112 [00:07<00:18,  4.43it/s][A
Training:  29%|██▊       | 32/112 [00:07<00:12,  6.29it/s][A
Training:  30%|███   

Epoch: 18/38 - Loss: 3.7638 - Accuracy: 0.9365



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:16,  1.28s/it][A
 21%|██▏       | 3/14 [00:01<00:04,  2.62it/s][A
 36%|███▌      | 5/14 [00:02<00:03,  2.53it/s][A
 57%|█████▋    | 8/14 [00:02<00:01,  4.79it/s][A
 71%|███████▏  | 10/14 [00:03<00:01,  3.84it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.77it/s][A
Epochs:  47%|████▋     | 18/38 [08:20<09:13, 27.69s/it]

Val Loss: 3.9903 - Val Accuracy: 0.9261



Training:   0%|          | 0/112 [00:00<?, ?it/s][A
Training:   1%|          | 1/112 [00:01<02:18,  1.25s/it][A
Training:   3%|▎         | 3/112 [00:01<00:41,  2.62it/s][A
Training:   4%|▍         | 5/112 [00:02<00:40,  2.64it/s][A
Training:   6%|▋         | 7/112 [00:02<00:25,  4.12it/s][A
Training:   8%|▊         | 9/112 [00:02<00:28,  3.60it/s][A
Training:  11%|█         | 12/112 [00:03<00:17,  5.64it/s][A
Training:  12%|█▎        | 14/112 [00:03<00:22,  4.42it/s][A
Training:  14%|█▍        | 16/112 [00:03<00:17,  5.58it/s][A
Training:  16%|█▌        | 18/112 [00:04<00:21,  4.37it/s][A
Training:  18%|█▊        | 20/112 [00:04<00:16,  5.60it/s][A
Training:  20%|█▉        | 22/112 [00:05<00:22,  4.09it/s][A
Training:  21%|██▏       | 24/112 [00:05<00:16,  5.18it/s][A
Training:  22%|██▏       | 25/112 [00:06<00:20,  4.18it/s][A
Training:  23%|██▎       | 26/112 [00:06<00:20,  4.30it/s][A
Training:  25%|██▌       | 28/112 [00:06<00:14,  5.79it/s][A
Training:  26%|██▌   

Epoch: 19/38 - Loss: 3.7164 - Accuracy: 0.9378



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:17,  1.36s/it][A
 36%|███▌      | 5/14 [00:02<00:03,  2.82it/s][A
 64%|██████▍   | 9/14 [00:02<00:01,  4.00it/s][A
 79%|███████▊  | 11/14 [00:02<00:00,  5.13it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.80it/s][A
Epochs:  50%|█████     | 19/38 [08:48<08:45, 27.68s/it]

Val Loss: 3.9408 - Val Accuracy: 0.9290



Training:   0%|          | 0/112 [00:00<?, ?it/s][A
Training:   1%|          | 1/112 [00:01<02:27,  1.33s/it][A
Training:   3%|▎         | 3/112 [00:01<00:43,  2.52it/s][A
Training:   4%|▍         | 5/112 [00:02<00:35,  2.98it/s][A
Training:   6%|▋         | 7/112 [00:02<00:23,  4.47it/s][A
Training:   8%|▊         | 9/112 [00:02<00:26,  3.84it/s][A
Training:  11%|█         | 12/112 [00:03<00:17,  5.77it/s][A
Training:  12%|█▏        | 13/112 [00:03<00:24,  4.06it/s][A
Training:  12%|█▎        | 14/112 [00:03<00:21,  4.58it/s][A
Training:  14%|█▍        | 16/112 [00:03<00:15,  6.07it/s][A
Training:  15%|█▌        | 17/112 [00:04<00:24,  3.93it/s][A
Training:  18%|█▊        | 20/112 [00:04<00:14,  6.17it/s][A
Training:  20%|█▉        | 22/112 [00:05<00:19,  4.68it/s][A
Training:  21%|██        | 23/112 [00:05<00:17,  5.18it/s][A
Training:  22%|██▏       | 25/112 [00:05<00:19,  4.36it/s][A
Training:  25%|██▌       | 28/112 [00:06<00:12,  6.47it/s][A
Training:  27%|██▋   

Epoch: 20/38 - Loss: 3.6343 - Accuracy: 0.9395



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:13,  1.01s/it][A
 14%|█▍        | 2/14 [00:01<00:07,  1.71it/s][A
 36%|███▌      | 5/14 [00:01<00:02,  3.65it/s][A
 43%|████▎     | 6/14 [00:01<00:02,  3.74it/s][A
 57%|█████▋    | 8/14 [00:02<00:01,  5.61it/s][A
 64%|██████▍   | 9/14 [00:02<00:00,  5.03it/s][A
 71%|███████▏  | 10/14 [00:02<00:00,  4.13it/s][A
 86%|████████▌ | 12/14 [00:02<00:00,  5.71it/s][A
 93%|█████████▎| 13/14 [00:03<00:00,  5.03it/s][A
100%|██████████| 14/14 [00:03<00:00,  4.04it/s][A
Epochs:  53%|█████▎    | 20/38 [09:15<08:15, 27.52s/it]

Val Loss: 3.9449 - Val Accuracy: 0.9273



Training:   0%|          | 0/112 [00:00<?, ?it/s][A
Training:   1%|          | 1/112 [00:01<02:09,  1.17s/it][A
Training:   3%|▎         | 3/112 [00:01<00:38,  2.80it/s][A
Training:   4%|▍         | 5/112 [00:01<00:34,  3.12it/s][A
Training:   7%|▋         | 8/112 [00:02<00:18,  5.68it/s][A
Training:   9%|▉         | 10/112 [00:02<00:23,  4.33it/s][A
Training:  11%|█         | 12/112 [00:02<00:18,  5.53it/s][A
Training:  12%|█▎        | 14/112 [00:03<00:23,  4.13it/s][A
Training:  14%|█▍        | 16/112 [00:03<00:19,  5.02it/s][A
Training:  15%|█▌        | 17/112 [00:04<00:26,  3.63it/s][A
Training:  18%|█▊        | 20/112 [00:04<00:17,  5.11it/s][A
Training:  19%|█▉        | 21/112 [00:05<00:22,  4.09it/s][A
Training:  21%|██        | 23/112 [00:05<00:16,  5.43it/s][A
Training:  21%|██▏       | 24/112 [00:05<00:15,  5.63it/s][A
Training:  22%|██▏       | 25/112 [00:05<00:21,  4.06it/s][A
Training:  24%|██▍       | 27/112 [00:06<00:14,  5.81it/s][A
Training:  26%|██▌  

Epoch: 21/38 - Loss: 3.5984 - Accuracy: 0.9388



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:16,  1.30s/it][A
 21%|██▏       | 3/14 [00:01<00:04,  2.60it/s][A
 36%|███▌      | 5/14 [00:02<00:03,  2.65it/s][A
 50%|█████     | 7/14 [00:02<00:01,  4.02it/s][A
 64%|██████▍   | 9/14 [00:03<00:01,  3.49it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.69it/s][A
Epochs:  55%|█████▌    | 21/38 [09:43<07:47, 27.53s/it]

Val Loss: 3.8951 - Val Accuracy: 0.9273



Training:   0%|          | 0/112 [00:00<?, ?it/s][A
Training:   1%|          | 1/112 [00:01<02:48,  1.52s/it][A
Training:   3%|▎         | 3/112 [00:01<00:47,  2.31it/s][A
Training:   4%|▍         | 5/112 [00:02<00:40,  2.61it/s][A
Training:   6%|▋         | 7/112 [00:02<00:26,  4.02it/s][A
Training:   8%|▊         | 9/112 [00:03<00:29,  3.55it/s][A
Training:  12%|█▏        | 13/112 [00:03<00:24,  4.02it/s][A
Training:  14%|█▍        | 16/112 [00:04<00:16,  5.76it/s][A
Training:  16%|█▌        | 18/112 [00:04<00:21,  4.34it/s][A
Training:  19%|█▉        | 21/112 [00:05<00:20,  4.40it/s][A
Training:  21%|██▏       | 24/112 [00:05<00:14,  6.07it/s][A
Training:  23%|██▎       | 26/112 [00:06<00:17,  4.99it/s][A
Training:  26%|██▌       | 29/112 [00:07<00:18,  4.45it/s][A
Training:  28%|██▊       | 31/112 [00:07<00:14,  5.40it/s][A
Training:  29%|██▉       | 33/112 [00:07<00:18,  4.25it/s][A
Training:  33%|███▎      | 37/112 [00:08<00:17,  4.24it/s][A
Training:  37%|███▋  

Epoch: 22/38 - Loss: 3.5707 - Accuracy: 0.9401



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:14,  1.11s/it][A
 14%|█▍        | 2/14 [00:01<00:06,  1.82it/s][A
 36%|███▌      | 5/14 [00:02<00:02,  3.06it/s][A
 43%|████▎     | 6/14 [00:02<00:02,  3.48it/s][A
 64%|██████▍   | 9/14 [00:02<00:01,  3.77it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.72it/s][A
Epochs:  58%|█████▊    | 22/38 [10:10<07:22, 27.65s/it]

Val Loss: 3.8421 - Val Accuracy: 0.9325



Training:   0%|          | 0/112 [00:00<?, ?it/s][A
Training:   1%|          | 1/112 [00:01<02:00,  1.08s/it][A
Training:   2%|▏         | 2/112 [00:01<00:58,  1.87it/s][A
Training:   4%|▍         | 5/112 [00:01<00:32,  3.29it/s][A
Training:   6%|▋         | 7/112 [00:02<00:21,  4.79it/s][A
Training:   8%|▊         | 9/112 [00:02<00:24,  4.19it/s][A
Training:   9%|▉         | 10/112 [00:02<00:21,  4.69it/s][A
Training:  11%|█         | 12/112 [00:02<00:16,  6.14it/s][A
Training:  12%|█▏        | 13/112 [00:03<00:24,  4.01it/s][A
Training:  12%|█▎        | 14/112 [00:03<00:21,  4.55it/s][A
Training:  15%|█▌        | 17/112 [00:04<00:19,  4.78it/s][A
Training:  17%|█▋        | 19/112 [00:04<00:15,  6.06it/s][A
Training:  19%|█▉        | 21/112 [00:04<00:18,  4.92it/s][A
Training:  20%|█▉        | 22/112 [00:05<00:17,  5.28it/s][A
Training:  22%|██▏       | 25/112 [00:05<00:17,  4.94it/s][A
Training:  23%|██▎       | 26/112 [00:05<00:16,  5.20it/s][A
Training:  26%|██▌   

Epoch: 23/38 - Loss: 3.5308 - Accuracy: 0.9408



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:15,  1.16s/it][A
 36%|███▌      | 5/14 [00:01<00:03,  2.95it/s][A
 57%|█████▋    | 8/14 [00:02<00:01,  5.11it/s][A
 71%|███████▏  | 10/14 [00:02<00:01,  3.84it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.62it/s][A
Epochs:  61%|██████    | 23/38 [10:38<06:54, 27.61s/it]

Val Loss: 3.8370 - Val Accuracy: 0.9295



Training:   0%|          | 0/112 [00:00<?, ?it/s][A
Training:   1%|          | 1/112 [00:01<02:39,  1.44s/it][A
Training:   3%|▎         | 3/112 [00:01<00:47,  2.28it/s][A
Training:   4%|▍         | 5/112 [00:02<00:41,  2.57it/s][A
Training:   7%|▋         | 8/112 [00:02<00:22,  4.66it/s][A
Training:   9%|▉         | 10/112 [00:03<00:26,  3.78it/s][A
Training:  12%|█▏        | 13/112 [00:03<00:25,  3.88it/s][A
Training:  13%|█▎        | 15/112 [00:04<00:19,  5.02it/s][A
Training:  15%|█▌        | 17/112 [00:04<00:24,  3.91it/s][A
Training:  17%|█▋        | 19/112 [00:04<00:18,  5.05it/s][A
Training:  19%|█▉        | 21/112 [00:05<00:25,  3.58it/s][A
Training:  21%|██        | 23/112 [00:06<00:19,  4.67it/s][A
Training:  22%|██▏       | 25/112 [00:06<00:20,  4.18it/s][A
Training:  24%|██▍       | 27/112 [00:06<00:15,  5.42it/s][A
Training:  26%|██▌       | 29/112 [00:07<00:19,  4.29it/s][A
Training:  28%|██▊       | 31/112 [00:07<00:14,  5.57it/s][A
Training:  29%|██▉  

Epoch: 24/38 - Loss: 3.5068 - Accuracy: 0.9403



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:16,  1.27s/it][A
 29%|██▊       | 4/14 [00:01<00:02,  3.72it/s][A
 43%|████▎     | 6/14 [00:01<00:02,  3.62it/s][A
 57%|█████▋    | 8/14 [00:02<00:01,  5.14it/s][A
 71%|███████▏  | 10/14 [00:02<00:01,  3.91it/s][A
 86%|████████▌ | 12/14 [00:02<00:00,  5.36it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.82it/s][A
Epochs:  63%|██████▎   | 24/38 [11:06<06:27, 27.64s/it]

Val Loss: 3.7719 - Val Accuracy: 0.9302



Training:   0%|          | 0/112 [00:00<?, ?it/s][A
Training:   1%|          | 1/112 [00:01<02:15,  1.22s/it][A
Training:   3%|▎         | 3/112 [00:01<00:39,  2.75it/s][A
Training:   4%|▍         | 5/112 [00:01<00:33,  3.19it/s][A
Training:   6%|▋         | 7/112 [00:02<00:22,  4.75it/s][A
Training:   8%|▊         | 9/112 [00:02<00:24,  4.28it/s][A
Training:   9%|▉         | 10/112 [00:02<00:21,  4.68it/s][A
Training:  12%|█▏        | 13/112 [00:03<00:21,  4.68it/s][A
Training:  12%|█▎        | 14/112 [00:03<00:19,  5.10it/s][A
Training:  14%|█▍        | 16/112 [00:03<00:14,  6.64it/s][A
Training:  15%|█▌        | 17/112 [00:04<00:21,  4.44it/s][A
Training:  16%|█▌        | 18/112 [00:04<00:21,  4.41it/s][A
Training:  18%|█▊        | 20/112 [00:04<00:15,  5.84it/s][A
Training:  19%|█▉        | 21/112 [00:04<00:20,  4.42it/s][A
Training:  20%|█▉        | 22/112 [00:05<00:22,  4.09it/s][A
Training:  21%|██▏       | 24/112 [00:05<00:15,  5.73it/s][A
Training:  22%|██▏   

Epoch: 25/38 - Loss: 3.4513 - Accuracy: 0.9412



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:14,  1.12s/it][A
 14%|█▍        | 2/14 [00:01<00:06,  1.89it/s][A
 36%|███▌      | 5/14 [00:01<00:02,  3.20it/s][A
 43%|████▎     | 6/14 [00:02<00:02,  3.81it/s][A
 64%|██████▍   | 9/14 [00:02<00:01,  4.14it/s][A
 71%|███████▏  | 10/14 [00:02<00:00,  4.64it/s][A
 86%|████████▌ | 12/14 [00:02<00:00,  6.14it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.83it/s][A
Epochs:  66%|██████▌   | 25/38 [11:33<05:57, 27.53s/it]

Val Loss: 3.7932 - Val Accuracy: 0.9278



Training:   0%|          | 0/112 [00:00<?, ?it/s][A
Training:   1%|          | 1/112 [00:01<02:04,  1.12s/it][A
Training:   3%|▎         | 3/112 [00:01<00:37,  2.90it/s][A
Training:   4%|▍         | 5/112 [00:01<00:35,  2.99it/s][A
Training:   6%|▋         | 7/112 [00:02<00:24,  4.26it/s][A
Training:   8%|▊         | 9/112 [00:02<00:28,  3.61it/s][A
Training:  10%|▉         | 11/112 [00:02<00:20,  4.90it/s][A
Training:  12%|█▏        | 13/112 [00:03<00:24,  4.06it/s][A
Training:  13%|█▎        | 15/112 [00:03<00:18,  5.33it/s][A
Training:  15%|█▌        | 17/112 [00:04<00:22,  4.21it/s][A
Training:  17%|█▋        | 19/112 [00:04<00:17,  5.22it/s][A
Training:  18%|█▊        | 20/112 [00:04<00:16,  5.68it/s][A
Training:  19%|█▉        | 21/112 [00:05<00:22,  4.06it/s][A
Training:  20%|█▉        | 22/112 [00:05<00:20,  4.37it/s][A
Training:  21%|██        | 23/112 [00:05<00:17,  5.05it/s][A
Training:  22%|██▏       | 25/112 [00:06<00:20,  4.34it/s][A
Training:  23%|██▎   

Epoch: 26/38 - Loss: 3.4346 - Accuracy: 0.9419



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:14,  1.12s/it][A
 21%|██▏       | 3/14 [00:01<00:03,  2.99it/s][A
 36%|███▌      | 5/14 [00:02<00:03,  2.51it/s][A
 50%|█████     | 7/14 [00:02<00:01,  3.85it/s][A
 64%|██████▍   | 9/14 [00:02<00:01,  3.45it/s][A
 79%|███████▊  | 11/14 [00:03<00:00,  4.82it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.59it/s][A
Epochs:  68%|██████▊   | 26/38 [12:01<05:31, 27.62s/it]

Val Loss: 3.7780 - Val Accuracy: 0.9348



Training:   0%|          | 0/112 [00:00<?, ?it/s][A
Training:   1%|          | 1/112 [00:01<02:27,  1.33s/it][A
Training:   4%|▎         | 4/112 [00:01<00:30,  3.52it/s][A
Training:   5%|▌         | 6/112 [00:02<00:32,  3.26it/s][A
Training:   8%|▊         | 9/112 [00:02<00:27,  3.78it/s][A
Training:   9%|▉         | 10/112 [00:02<00:23,  4.25it/s][A
Training:  12%|█▏        | 13/112 [00:03<00:21,  4.58it/s][A
Training:  13%|█▎        | 15/112 [00:03<00:16,  5.93it/s][A
Training:  15%|█▌        | 17/112 [00:04<00:23,  4.12it/s][A
Training:  17%|█▋        | 19/112 [00:04<00:17,  5.21it/s][A
Training:  19%|█▉        | 21/112 [00:05<00:23,  3.81it/s][A
Training:  21%|██        | 23/112 [00:05<00:18,  4.76it/s][A
Training:  22%|██▏       | 25/112 [00:06<00:20,  4.24it/s][A
Training:  26%|██▌       | 29/112 [00:06<00:17,  4.79it/s][A
Training:  29%|██▊       | 32/112 [00:07<00:12,  6.52it/s][A
Training:  30%|███       | 34/112 [00:07<00:16,  4.83it/s][A
Training:  32%|███▏ 

Epoch: 27/38 - Loss: 3.4095 - Accuracy: 0.9423



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:14,  1.09s/it][A
 29%|██▊       | 4/14 [00:01<00:02,  4.09it/s][A
 43%|████▎     | 6/14 [00:01<00:02,  3.65it/s][A
 64%|██████▍   | 9/14 [00:02<00:01,  4.23it/s][A
 71%|███████▏  | 10/14 [00:02<00:00,  4.38it/s][A
 86%|████████▌ | 12/14 [00:02<00:00,  5.77it/s][A
 93%|█████████▎| 13/14 [00:03<00:00,  5.17it/s][A
100%|██████████| 14/14 [00:03<00:00,  4.06it/s][A
Epochs:  71%|███████   | 27/38 [12:28<05:01, 27.38s/it]

Val Loss: 3.8404 - Val Accuracy: 0.9336



Training:   0%|          | 0/112 [00:00<?, ?it/s][A
Training:   1%|          | 1/112 [00:01<02:30,  1.36s/it][A
Training:   3%|▎         | 3/112 [00:01<00:43,  2.49it/s][A
Training:   4%|▍         | 5/112 [00:02<00:38,  2.75it/s][A
Training:   7%|▋         | 8/112 [00:02<00:20,  5.16it/s][A
Training:   9%|▉         | 10/112 [00:03<00:25,  3.97it/s][A
Training:  12%|█▏        | 13/112 [00:03<00:21,  4.56it/s][A
Training:  12%|█▎        | 14/112 [00:03<00:21,  4.58it/s][A
Training:  14%|█▍        | 16/112 [00:03<00:16,  5.65it/s][A
Training:  15%|█▌        | 17/112 [00:04<00:19,  4.91it/s][A
Training:  16%|█▌        | 18/112 [00:04<00:25,  3.74it/s][A
Training:  18%|█▊        | 20/112 [00:04<00:18,  5.03it/s][A
Training:  20%|█▉        | 22/112 [00:05<00:24,  3.67it/s][A
Training:  22%|██▏       | 25/112 [00:05<00:14,  5.85it/s][A
Training:  24%|██▍       | 27/112 [00:06<00:20,  4.10it/s][A
Training:  26%|██▌       | 29/112 [00:06<00:15,  5.21it/s][A
Training:  28%|██▊  

Epoch: 28/38 - Loss: 3.3587 - Accuracy: 0.9433



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:14,  1.12s/it][A
 21%|██▏       | 3/14 [00:01<00:03,  2.90it/s][A
 36%|███▌      | 5/14 [00:01<00:02,  3.05it/s][A
 50%|█████     | 7/14 [00:02<00:01,  4.55it/s][A
 64%|██████▍   | 9/14 [00:02<00:01,  3.59it/s][A
 79%|███████▊  | 11/14 [00:02<00:00,  4.98it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.64it/s][A
Epochs:  74%|███████▎  | 28/38 [12:56<04:35, 27.54s/it]

Val Loss: 3.7012 - Val Accuracy: 0.9376



Training:   0%|          | 0/112 [00:00<?, ?it/s][A
Training:   1%|          | 1/112 [00:01<02:23,  1.29s/it][A
Training:   4%|▍         | 5/112 [00:01<00:35,  3.01it/s][A
Training:   6%|▋         | 7/112 [00:02<00:24,  4.33it/s][A
Training:   8%|▊         | 9/112 [00:02<00:26,  3.95it/s][A
Training:  10%|▉         | 11/112 [00:02<00:19,  5.26it/s][A
Training:  12%|█▏        | 13/112 [00:03<00:26,  3.80it/s][A
Training:  14%|█▍        | 16/112 [00:03<00:16,  5.85it/s][A
Training:  16%|█▌        | 18/112 [00:04<00:22,  4.24it/s][A
Training:  18%|█▊        | 20/112 [00:04<00:17,  5.37it/s][A
Training:  20%|█▉        | 22/112 [00:05<00:20,  4.39it/s][A
Training:  22%|██▏       | 25/112 [00:06<00:20,  4.14it/s][A
Training:  24%|██▍       | 27/112 [00:06<00:16,  5.21it/s][A
Training:  26%|██▌       | 29/112 [00:06<00:19,  4.21it/s][A
Training:  29%|██▉       | 33/112 [00:07<00:18,  4.35it/s][A
Training:  31%|███▏      | 35/112 [00:07<00:14,  5.35it/s][A
Training:  33%|███▎ 

Epoch: 29/38 - Loss: 3.3433 - Accuracy: 0.9432



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:18,  1.41s/it][A
 36%|███▌      | 5/14 [00:02<00:03,  2.46it/s][A
 64%|██████▍   | 9/14 [00:03<00:01,  3.48it/s][A
 79%|███████▊  | 11/14 [00:03<00:00,  4.52it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.60it/s][A
Epochs:  76%|███████▋  | 29/38 [13:23<04:07, 27.50s/it]

Val Loss: 3.6713 - Val Accuracy: 0.9336



Training:   0%|          | 0/112 [00:00<?, ?it/s][A
Training:   1%|          | 1/112 [00:00<01:50,  1.01it/s][A
Training:   3%|▎         | 3/112 [00:01<00:38,  2.84it/s][A
Training:   4%|▍         | 5/112 [00:01<00:32,  3.24it/s][A
Training:   6%|▋         | 7/112 [00:01<00:22,  4.68it/s][A
Training:   8%|▊         | 9/112 [00:02<00:28,  3.62it/s][A
Training:  10%|▉         | 11/112 [00:02<00:21,  4.75it/s][A
Training:  12%|█▏        | 13/112 [00:03<00:23,  4.24it/s][A
Training:  13%|█▎        | 15/112 [00:03<00:18,  5.13it/s][A
Training:  15%|█▌        | 17/112 [00:04<00:21,  4.49it/s][A
Training:  17%|█▋        | 19/112 [00:04<00:18,  5.02it/s][A
Training:  19%|█▉        | 21/112 [00:05<00:20,  4.43it/s][A
Training:  21%|██        | 23/112 [00:05<00:17,  5.21it/s][A
Training:  22%|██▏       | 25/112 [00:05<00:19,  4.43it/s][A
Training:  24%|██▍       | 27/112 [00:06<00:15,  5.38it/s][A
Training:  26%|██▌       | 29/112 [00:06<00:19,  4.17it/s][A
Training:  28%|██▊   

Epoch: 30/38 - Loss: 3.3225 - Accuracy: 0.9439



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:17,  1.35s/it][A
 36%|███▌      | 5/14 [00:02<00:03,  2.88it/s][A
 50%|█████     | 7/14 [00:02<00:01,  3.82it/s][A
 64%|██████▍   | 9/14 [00:02<00:01,  3.72it/s][A
 79%|███████▊  | 11/14 [00:02<00:00,  5.10it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.71it/s][A
Epochs:  79%|███████▉  | 30/38 [13:51<03:41, 27.74s/it]

Val Loss: 3.6881 - Val Accuracy: 0.9341



Training:   0%|          | 0/112 [00:00<?, ?it/s][A
Training:   1%|          | 1/112 [00:01<02:08,  1.16s/it][A
Training:   2%|▏         | 2/112 [00:01<00:59,  1.84it/s][A
Training:   4%|▍         | 5/112 [00:02<00:35,  3.00it/s][A
Training:   6%|▋         | 7/112 [00:02<00:23,  4.47it/s][A
Training:   8%|▊         | 9/112 [00:03<00:30,  3.33it/s][A
Training:   9%|▉         | 10/112 [00:03<00:26,  3.80it/s][A
Training:  11%|█         | 12/112 [00:03<00:19,  5.13it/s][A
Training:  12%|█▏        | 13/112 [00:03<00:25,  3.95it/s][A
Training:  15%|█▌        | 17/112 [00:04<00:21,  4.34it/s][A
Training:  18%|█▊        | 20/112 [00:04<00:14,  6.31it/s][A
Training:  20%|█▉        | 22/112 [00:05<00:19,  4.56it/s][A
Training:  22%|██▏       | 25/112 [00:06<00:21,  4.14it/s][A
Training:  26%|██▌       | 29/112 [00:07<00:20,  4.06it/s][A
Training:  29%|██▊       | 32/112 [00:07<00:14,  5.39it/s][A
Training:  30%|███       | 34/112 [00:08<00:17,  4.53it/s][A
Training:  32%|███▏  

Epoch: 31/38 - Loss: 3.3117 - Accuracy: 0.9428



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:00<00:11,  1.11it/s][A
 21%|██▏       | 3/14 [00:01<00:03,  3.66it/s][A
 36%|███▌      | 5/14 [00:01<00:02,  3.39it/s][A
 43%|████▎     | 6/14 [00:01<00:02,  3.52it/s][A
 57%|█████▋    | 8/14 [00:02<00:01,  5.42it/s][A
 71%|███████▏  | 10/14 [00:02<00:00,  4.15it/s][A
 79%|███████▊  | 11/14 [00:02<00:00,  4.21it/s][A
 93%|█████████▎| 13/14 [00:03<00:00,  4.61it/s][A
100%|██████████| 14/14 [00:03<00:00,  4.05it/s][A
Epochs:  82%|████████▏ | 31/38 [14:18<03:12, 27.52s/it]

Val Loss: 3.6193 - Val Accuracy: 0.9359



Training:   0%|          | 0/112 [00:00<?, ?it/s][A
Training:   1%|          | 1/112 [00:01<02:06,  1.14s/it][A
Training:   3%|▎         | 3/112 [00:01<00:37,  2.94it/s][A
Training:   4%|▍         | 5/112 [00:01<00:37,  2.87it/s][A
Training:   5%|▌         | 6/112 [00:02<00:30,  3.48it/s][A
Training:   7%|▋         | 8/112 [00:02<00:19,  5.42it/s][A
Training:   9%|▉         | 10/112 [00:03<00:28,  3.56it/s][A
Training:  10%|▉         | 11/112 [00:03<00:24,  4.07it/s][A
Training:  12%|█▏        | 13/112 [00:03<00:28,  3.47it/s][A
Training:  13%|█▎        | 15/112 [00:04<00:20,  4.73it/s][A
Training:  15%|█▌        | 17/112 [00:04<00:22,  4.15it/s][A
Training:  16%|█▌        | 18/112 [00:04<00:21,  4.42it/s][A
Training:  18%|█▊        | 20/112 [00:04<00:15,  5.91it/s][A
Training:  19%|█▉        | 21/112 [00:05<00:21,  4.28it/s][A
Training:  20%|█▉        | 22/112 [00:05<00:20,  4.41it/s][A
Training:  21%|██▏       | 24/112 [00:05<00:14,  6.10it/s][A
Training:  22%|██▏   

Epoch: 32/38 - Loss: 3.3043 - Accuracy: 0.9441



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:17,  1.36s/it][A
 21%|██▏       | 3/14 [00:01<00:04,  2.53it/s][A
 36%|███▌      | 5/14 [00:02<00:03,  2.83it/s][A
 50%|█████     | 7/14 [00:02<00:01,  4.43it/s][A
 64%|██████▍   | 9/14 [00:03<00:01,  3.43it/s][A
 79%|███████▊  | 11/14 [00:03<00:00,  4.69it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.69it/s][A
Epochs:  84%|████████▍ | 32/38 [14:46<02:45, 27.62s/it]

Val Loss: 3.6405 - Val Accuracy: 0.9336



Training:   0%|          | 0/112 [00:00<?, ?it/s][A
Training:   1%|          | 1/112 [00:01<02:17,  1.23s/it][A
Training:   3%|▎         | 3/112 [00:01<00:41,  2.62it/s][A
Training:   4%|▍         | 5/112 [00:02<00:38,  2.79it/s][A
Training:   6%|▋         | 7/112 [00:02<00:25,  4.16it/s][A
Training:   7%|▋         | 8/112 [00:02<00:21,  4.78it/s][A
Training:   8%|▊         | 9/112 [00:02<00:31,  3.29it/s][A
Training:  10%|▉         | 11/112 [00:03<00:20,  4.93it/s][A
Training:  12%|█▏        | 13/112 [00:03<00:24,  4.12it/s][A
Training:  12%|█▎        | 14/112 [00:03<00:21,  4.50it/s][A
Training:  14%|█▍        | 16/112 [00:03<00:15,  6.21it/s][A
Training:  16%|█▌        | 18/112 [00:04<00:21,  4.47it/s][A
Training:  19%|█▉        | 21/112 [00:05<00:20,  4.43it/s][A
Training:  20%|█▉        | 22/112 [00:05<00:19,  4.70it/s][A
Training:  21%|██▏       | 24/112 [00:05<00:14,  6.09it/s][A
Training:  22%|██▏       | 25/112 [00:06<00:21,  4.11it/s][A
Training:  23%|██▎    

Epoch: 33/38 - Loss: 3.2552 - Accuracy: 0.9445



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:15,  1.16s/it][A
 21%|██▏       | 3/14 [00:01<00:03,  2.81it/s][A
 36%|███▌      | 5/14 [00:02<00:03,  2.83it/s][A
 50%|█████     | 7/14 [00:02<00:01,  4.21it/s][A
 64%|██████▍   | 9/14 [00:02<00:01,  3.58it/s][A
 86%|████████▌ | 12/14 [00:02<00:00,  5.87it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.83it/s][A
Epochs:  87%|████████▋ | 33/38 [15:14<02:17, 27.55s/it]

Val Loss: 3.6164 - Val Accuracy: 0.9353



Training:   0%|          | 0/112 [00:00<?, ?it/s][A
Training:   1%|          | 1/112 [00:01<02:12,  1.19s/it][A
Training:   2%|▏         | 2/112 [00:01<01:09,  1.58it/s][A
Training:   4%|▎         | 4/112 [00:01<00:29,  3.67it/s][A
Training:   4%|▍         | 5/112 [00:01<00:34,  3.14it/s][A
Training:   5%|▌         | 6/112 [00:02<00:29,  3.60it/s][A
Training:   8%|▊         | 9/112 [00:02<00:26,  3.88it/s][A
Training:  10%|▉         | 11/112 [00:02<00:18,  5.41it/s][A
Training:  12%|█▏        | 13/112 [00:03<00:22,  4.48it/s][A
Training:  12%|█▎        | 14/112 [00:03<00:21,  4.65it/s][A
Training:  14%|█▍        | 16/112 [00:03<00:15,  6.21it/s][A
Training:  15%|█▌        | 17/112 [00:04<00:18,  5.02it/s][A
Training:  16%|█▌        | 18/112 [00:04<00:23,  4.00it/s][A
Training:  18%|█▊        | 20/112 [00:04<00:16,  5.54it/s][A
Training:  19%|█▉        | 21/112 [00:05<00:18,  4.92it/s][A
Training:  20%|█▉        | 22/112 [00:05<00:23,  3.83it/s][A
Training:  22%|██▏    

Epoch: 34/38 - Loss: 3.2236 - Accuracy: 0.9446



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:18,  1.42s/it][A
 29%|██▊       | 4/14 [00:01<00:03,  3.30it/s][A
 43%|████▎     | 6/14 [00:02<00:02,  3.47it/s][A
 57%|█████▋    | 8/14 [00:02<00:01,  4.89it/s][A
 71%|███████▏  | 10/14 [00:02<00:01,  3.94it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.76it/s][A
Epochs:  89%|████████▉ | 34/38 [15:41<01:50, 27.57s/it]

Val Loss: 3.6247 - Val Accuracy: 0.9347



Training:   0%|          | 0/112 [00:00<?, ?it/s][A
Training:   1%|          | 1/112 [00:01<02:30,  1.35s/it][A
Training:   3%|▎         | 3/112 [00:01<00:44,  2.46it/s][A
Training:   4%|▍         | 5/112 [00:02<00:40,  2.64it/s][A
Training:   8%|▊         | 9/112 [00:03<00:28,  3.66it/s][A
Training:  10%|▉         | 11/112 [00:03<00:21,  4.67it/s][A
Training:  12%|█▏        | 13/112 [00:03<00:22,  4.33it/s][A
Training:  12%|█▎        | 14/112 [00:03<00:23,  4.19it/s][A
Training:  15%|█▌        | 17/112 [00:04<00:20,  4.69it/s][A
Training:  16%|█▌        | 18/112 [00:04<00:20,  4.63it/s][A
Training:  19%|█▉        | 21/112 [00:05<00:19,  4.67it/s][A
Training:  20%|█▉        | 22/112 [00:05<00:17,  5.08it/s][A
Training:  21%|██▏       | 24/112 [00:05<00:13,  6.49it/s][A
Training:  22%|██▏       | 25/112 [00:06<00:19,  4.38it/s][A
Training:  23%|██▎       | 26/112 [00:06<00:17,  4.82it/s][A
Training:  25%|██▌       | 28/112 [00:06<00:12,  6.55it/s][A
Training:  26%|██▌  

Epoch: 35/38 - Loss: 3.2261 - Accuracy: 0.9448



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:14,  1.11s/it][A
 21%|██▏       | 3/14 [00:01<00:03,  2.96it/s][A
 36%|███▌      | 5/14 [00:01<00:03,  2.92it/s][A
 43%|████▎     | 6/14 [00:02<00:02,  3.34it/s][A
 64%|██████▍   | 9/14 [00:02<00:01,  4.16it/s][A
 71%|███████▏  | 10/14 [00:03<00:01,  3.93it/s][A
 93%|█████████▎| 13/14 [00:03<00:00,  5.31it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.89it/s][A
Epochs:  92%|█████████▏| 35/38 [16:08<01:21, 27.32s/it]

Val Loss: 3.6186 - Val Accuracy: 0.9341



Training:   0%|          | 0/112 [00:00<?, ?it/s][A
Training:   1%|          | 1/112 [00:01<02:39,  1.43s/it][A
Training:   3%|▎         | 3/112 [00:01<00:45,  2.39it/s][A
Training:   4%|▍         | 5/112 [00:02<00:44,  2.43it/s][A
Training:   6%|▋         | 7/112 [00:02<00:27,  3.79it/s][A
Training:   8%|▊         | 9/112 [00:03<00:30,  3.43it/s][A
Training:  10%|▉         | 11/112 [00:03<00:20,  4.81it/s][A
Training:  12%|█▏        | 13/112 [00:03<00:24,  4.07it/s][A
Training:  14%|█▍        | 16/112 [00:04<00:15,  6.17it/s][A
Training:  16%|█▌        | 18/112 [00:04<00:20,  4.61it/s][A
Training:  18%|█▊        | 20/112 [00:04<00:16,  5.68it/s][A
Training:  20%|█▉        | 22/112 [00:05<00:22,  4.08it/s][A
Training:  21%|██▏       | 24/112 [00:05<00:17,  5.15it/s][A
Training:  23%|██▎       | 26/112 [00:06<00:21,  3.97it/s][A
Training:  26%|██▌       | 29/112 [00:07<00:19,  4.29it/s][A
Training:  29%|██▊       | 32/112 [00:07<00:13,  6.10it/s][A
Training:  30%|███   

Epoch: 36/38 - Loss: 3.1975 - Accuracy: 0.9459



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:18,  1.44s/it][A
 21%|██▏       | 3/14 [00:01<00:04,  2.41it/s][A
 36%|███▌      | 5/14 [00:02<00:03,  2.56it/s][A
 64%|██████▍   | 9/14 [00:03<00:01,  3.77it/s][A
 71%|███████▏  | 10/14 [00:03<00:00,  4.14it/s][A
 93%|█████████▎| 13/14 [00:03<00:00,  4.88it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.69it/s][A
Epochs:  95%|█████████▍| 36/38 [16:35<00:54, 27.28s/it]

Val Loss: 3.6173 - Val Accuracy: 0.9336



Training:   0%|          | 0/112 [00:00<?, ?it/s][A
Training:   1%|          | 1/112 [00:01<02:38,  1.43s/it][A
Training:   3%|▎         | 3/112 [00:01<00:48,  2.27it/s][A
Training:   4%|▍         | 5/112 [00:02<00:41,  2.60it/s][A
Training:   6%|▋         | 7/112 [00:02<00:26,  3.96it/s][A
Training:   8%|▊         | 9/112 [00:03<00:31,  3.27it/s][A
Training:  10%|▉         | 11/112 [00:03<00:22,  4.56it/s][A
Training:  12%|█▏        | 13/112 [00:04<00:25,  3.90it/s][A
Training:  13%|█▎        | 15/112 [00:04<00:18,  5.13it/s][A
Training:  15%|█▌        | 17/112 [00:04<00:23,  3.98it/s][A
Training:  17%|█▋        | 19/112 [00:05<00:18,  5.11it/s][A
Training:  18%|█▊        | 20/112 [00:05<00:16,  5.47it/s][A
Training:  19%|█▉        | 21/112 [00:05<00:25,  3.53it/s][A
Training:  21%|██        | 23/112 [00:05<00:18,  4.79it/s][A
Training:  22%|██▏       | 25/112 [00:06<00:23,  3.71it/s][A
Training:  24%|██▍       | 27/112 [00:06<00:17,  4.92it/s][A
Training:  26%|██▌   

Epoch: 37/38 - Loss: 3.2105 - Accuracy: 0.9458



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:16,  1.31s/it][A
 36%|███▌      | 5/14 [00:02<00:03,  2.89it/s][A
 57%|█████▋    | 8/14 [00:02<00:01,  4.88it/s][A
 71%|███████▏  | 10/14 [00:02<00:00,  4.12it/s][A
 79%|███████▊  | 11/14 [00:02<00:00,  4.54it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.82it/s][A
Epochs:  97%|█████████▋| 37/38 [17:03<00:27, 27.35s/it]

Val Loss: 3.5611 - Val Accuracy: 0.9393



Training:   0%|          | 0/112 [00:00<?, ?it/s][A
Training:   1%|          | 1/112 [00:01<02:04,  1.12s/it][A
Training:   2%|▏         | 2/112 [00:01<01:03,  1.73it/s][A
Training:   4%|▍         | 5/112 [00:01<00:30,  3.56it/s][A
Training:   5%|▌         | 6/112 [00:02<00:29,  3.61it/s][A
Training:   7%|▋         | 8/112 [00:02<00:19,  5.21it/s][A
Training:   8%|▊         | 9/112 [00:02<00:22,  4.63it/s][A
Training:   9%|▉         | 10/112 [00:03<00:28,  3.56it/s][A
Training:  11%|█         | 12/112 [00:03<00:19,  5.11it/s][A
Training:  12%|█▏        | 13/112 [00:03<00:20,  4.77it/s][A
Training:  12%|█▎        | 14/112 [00:03<00:25,  3.90it/s][A
Training:  14%|█▍        | 16/112 [00:03<00:16,  5.79it/s][A
Training:  15%|█▌        | 17/112 [00:04<00:19,  4.84it/s][A
Training:  16%|█▌        | 18/112 [00:04<00:21,  4.32it/s][A
Training:  17%|█▋        | 19/112 [00:04<00:20,  4.63it/s][A
Training:  19%|█▉        | 21/112 [00:05<00:16,  5.40it/s][A
Training:  20%|█▉     

Epoch: 38/38 - Loss: 3.1772 - Accuracy: 0.9456



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:16,  1.27s/it][A
 29%|██▊       | 4/14 [00:01<00:02,  3.59it/s][A
 43%|████▎     | 6/14 [00:02<00:02,  3.12it/s][A
 57%|█████▋    | 8/14 [00:02<00:01,  4.56it/s][A
 71%|███████▏  | 10/14 [00:03<00:01,  3.59it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.64it/s][A
Epochs: 100%|██████████| 38/38 [17:30<00:00, 27.64s/it]
[32m[I 2023-12-14 23:56:07,976][0m Trial 4 finished with value: 0.9364524483680725 and parameters: {'loss_learning_rate': 0.00029022607343956355, 'learning_rate': 3.3347055279343715e-05, 'weight_decay': 0.00013857639851633783, 'epsilon': 5.910646219604286e-09, 'batch_size': 125, 'epochs': 38}. Best is trial 2 with value: 0.937753438949585.[0m


Val Loss: 3.5450 - Val Accuracy: 0.9365
Learning rate for Loss: 0.0002832058738344144
Learning rate: 0.00011278137650122777
Weight decay: 0.0002977809527118104
Epsilon: 7.382678812537027e-09
Batch size: 237
Number of epochs: 93


Epochs:   0%|          | 0/93 [00:00<?, ?it/s]
Training:   0%|          | 0/59 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/59 [00:01<01:42,  1.77s/it][A
Training:   3%|▎         | 2/59 [00:01<00:48,  1.17it/s][A
Training:   7%|▋         | 4/59 [00:02<00:20,  2.73it/s][A
Training:   8%|▊         | 5/59 [00:03<00:33,  1.63it/s][A
Training:  10%|█         | 6/59 [00:03<00:25,  2.09it/s][A
Training:  12%|█▏        | 7/59 [00:03<00:19,  2.63it/s][A
Training:  15%|█▌        | 9/59 [00:04<00:25,  1.96it/s][A
Training:  19%|█▊        | 11/59 [00:05<00:16,  2.91it/s][A
Training:  20%|██        | 12/59 [00:05<00:13,  3.43it/s][A
Training:  22%|██▏       | 13/59 [00:06<00:26,  1.75it/s][A
Training:  24%|██▎       | 14/59 [00:06<00:20,  2.19it/s][A
Training:  25%|██▌       | 15/59 [00:07<00:16,  2.59it/s][A
Training:  27%|██▋       | 16/59 [00:07<00:13,  3.26it/s][A
Training:  29%|██▉       | 17/59 [00:08<00:21,  1.98it/s][A
Training:  32%|███▏      | 19/59 [00:08<00:15,  2.58it

Epoch: 1/93 - Loss: 17.2352 - Accuracy: 0.6870



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:13,  1.92s/it][A
 50%|█████     | 4/8 [00:02<00:01,  2.51it/s][A
100%|██████████| 8/8 [00:03<00:00,  2.37it/s][A
Epochs:   0%|          | 0/93 [00:26<?, ?it/s]
[32m[I 2023-12-14 23:56:35,362][0m Trial 5 pruned. [0m


Val Loss: 10.3484 - Val Accuracy: 0.8175
Learning rate for Loss: 0.0017564699894723073
Learning rate: 0.058555390724633616
Weight decay: 0.008655274995683308
Epsilon: 9.75318218586541e-08
Batch size: 77
Number of epochs: 10


Epochs:   0%|          | 0/10 [00:00<?, ?it/s]
Training:   0%|          | 0/182 [00:00<?, ?it/s][A
Training:   1%|          | 1/182 [00:01<03:12,  1.06s/it][A
Training:   2%|▏         | 3/182 [00:01<00:57,  3.12it/s][A
Training:   3%|▎         | 5/182 [00:01<00:42,  4.13it/s][A
Training:   4%|▍         | 8/182 [00:01<00:24,  7.13it/s][A
Training:   5%|▌         | 10/182 [00:02<00:26,  6.53it/s][A
Training:   7%|▋         | 13/182 [00:02<00:24,  7.02it/s][A
Training:   8%|▊         | 15/182 [00:02<00:19,  8.58it/s][A
Training:   9%|▉         | 17/182 [00:02<00:22,  7.20it/s][A
Training:  10%|█         | 19/182 [00:03<00:19,  8.29it/s][A
Training:  12%|█▏        | 21/182 [00:03<00:21,  7.63it/s][A
Training:  13%|█▎        | 23/182 [00:03<00:19,  8.04it/s][A
Training:  14%|█▎        | 25/182 [00:03<00:22,  6.91it/s][A
Training:  15%|█▍        | 27/182 [00:04<00:18,  8.33it/s][A
Training:  16%|█▌        | 29/182 [00:04<00:22,  6.85it/s][A
Training:  18%|█▊        | 32/182 [0

Epoch: 1/10 - Loss: 39.7771 - Accuracy: 0.8178



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:21,  1.02it/s][A
 17%|█▋        | 4/23 [00:01<00:04,  4.52it/s][A
 26%|██▌       | 6/23 [00:01<00:03,  4.85it/s][A
 35%|███▍      | 8/23 [00:01<00:02,  6.44it/s][A
 43%|████▎     | 10/23 [00:01<00:02,  6.14it/s][A
 52%|█████▏    | 12/23 [00:02<00:01,  7.53it/s][A
 61%|██████    | 14/23 [00:02<00:01,  7.39it/s][A
 70%|██████▉   | 16/23 [00:02<00:00,  7.99it/s][A
 74%|███████▍  | 17/23 [00:02<00:00,  7.29it/s][A
 83%|████████▎ | 19/23 [00:03<00:00,  7.82it/s][A
 87%|████████▋ | 20/23 [00:03<00:00,  7.83it/s][A
100%|██████████| 23/23 [00:03<00:00,  6.59it/s][A
Epochs:   0%|          | 0/10 [00:26<?, ?it/s]
[32m[I 2023-12-14 23:57:02,804][0m Trial 6 pruned. [0m


Val Loss: 5.8399 - Val Accuracy: 0.8427
Learning rate for Loss: 0.00013480632548787101
Learning rate: 0.02548000545586087
Weight decay: 0.004207939458037113
Epsilon: 6.651857252565762e-08
Batch size: 54
Number of epochs: 71


Epochs:   0%|          | 0/71 [00:00<?, ?it/s]
Training:   0%|          | 0/259 [00:00<?, ?it/s][A
Training:   0%|          | 1/259 [00:00<03:28,  1.24it/s][A
Training:   2%|▏         | 5/259 [00:01<00:48,  5.29it/s][A
Training:   3%|▎         | 8/259 [00:01<00:29,  8.58it/s][A
Training:   4%|▍         | 10/259 [00:01<00:29,  8.44it/s][A
Training:   5%|▌         | 13/259 [00:01<00:26,  9.27it/s][A
Training:   7%|▋         | 17/259 [00:02<00:22, 10.95it/s][A
Training:   8%|▊         | 20/259 [00:02<00:19, 12.21it/s][A
Training:   8%|▊         | 22/259 [00:02<00:21, 11.12it/s][A
Training:   9%|▉         | 24/259 [00:02<00:18, 12.41it/s][A
Training:  10%|█         | 26/259 [00:02<00:22, 10.44it/s][A
Training:  11%|█         | 29/259 [00:03<00:20, 11.05it/s][A
Training:  12%|█▏        | 31/259 [00:03<00:20, 11.23it/s][A
Training:  13%|█▎        | 33/259 [00:03<00:23,  9.48it/s][A
Training:  14%|█▎        | 35/259 [00:03<00:21, 10.60it/s][A
Training:  14%|█▍        | 37/259 [

Epoch: 1/71 - Loss: 12.1695 - Accuracy: 0.8158



  0%|          | 0/33 [00:00<?, ?it/s][A
  3%|▎         | 1/33 [00:00<00:21,  1.49it/s][A
 15%|█▌        | 5/33 [00:00<00:04,  6.29it/s][A
 24%|██▍       | 8/33 [00:01<00:02,  8.95it/s][A
 30%|███       | 10/33 [00:01<00:02,  8.28it/s][A
 36%|███▋      | 12/33 [00:01<00:02,  9.32it/s][A
 42%|████▏     | 14/33 [00:01<00:01,  9.67it/s][A
 48%|████▊     | 16/33 [00:01<00:01, 10.99it/s][A
 55%|█████▍    | 18/33 [00:02<00:01, 10.00it/s][A
 61%|██████    | 20/33 [00:02<00:01, 10.71it/s][A
 67%|██████▋   | 22/33 [00:02<00:01,  9.84it/s][A
 76%|███████▌  | 25/33 [00:02<00:00,  9.69it/s][A
 85%|████████▍ | 28/33 [00:02<00:00, 12.35it/s][A
100%|██████████| 33/33 [00:03<00:00,  9.71it/s][A
Epochs:   1%|▏         | 1/71 [00:27<32:11, 27.59s/it]

Val Loss: 5.8189 - Val Accuracy: 0.9070



Training:   0%|          | 0/259 [00:00<?, ?it/s][A
Training:   0%|          | 1/259 [00:00<03:02,  1.41it/s][A
Training:   2%|▏         | 4/259 [00:00<00:42,  6.01it/s][A
Training:   2%|▏         | 6/259 [00:00<00:32,  7.84it/s][A
Training:   3%|▎         | 8/259 [00:01<00:25,  9.70it/s][A
Training:   4%|▍         | 10/259 [00:01<00:26,  9.35it/s][A
Training:   5%|▍         | 12/259 [00:01<00:26,  9.24it/s][A
Training:   5%|▌         | 14/259 [00:01<00:25,  9.63it/s][A
Training:   6%|▌         | 16/259 [00:01<00:24, 10.00it/s][A
Training:   7%|▋         | 18/259 [00:02<00:23, 10.42it/s][A
Training:   8%|▊         | 20/259 [00:02<00:23,  9.97it/s][A
Training:   8%|▊         | 22/259 [00:02<00:23, 10.02it/s][A
Training:   9%|▉         | 24/259 [00:02<00:23,  9.90it/s][A
Training:  10%|█         | 26/259 [00:02<00:20, 11.10it/s][A
Training:  11%|█         | 28/259 [00:03<00:20, 11.50it/s][A
Training:  12%|█▏        | 30/259 [00:03<00:21, 10.70it/s][A
Training:  12%|█▏   

Epoch: 2/71 - Loss: 5.0588 - Accuracy: 0.8852



  0%|          | 0/33 [00:00<?, ?it/s][A
  3%|▎         | 1/33 [00:00<00:21,  1.47it/s][A
 15%|█▌        | 5/33 [00:01<00:05,  5.40it/s][A
 27%|██▋       | 9/33 [00:01<00:03,  7.77it/s][A
 39%|███▉      | 13/33 [00:01<00:02,  8.69it/s][A
 52%|█████▏    | 17/33 [00:02<00:01,  8.67it/s][A
 64%|██████▎   | 21/33 [00:02<00:01,  9.34it/s][A
 76%|███████▌  | 25/33 [00:03<00:00,  9.36it/s][A
 85%|████████▍ | 28/33 [00:03<00:00, 11.43it/s][A
 91%|█████████ | 30/33 [00:03<00:00, 10.94it/s][A
100%|██████████| 33/33 [00:03<00:00,  9.14it/s][A
Epochs:   1%|▏         | 1/71 [00:54<1:03:37, 54.53s/it]
[32m[I 2023-12-14 23:57:57,905][0m Trial 7 pruned. [0m


Val Loss: 4.3696 - Val Accuracy: 0.8862
Learning rate for Loss: 0.0002096756314496251
Learning rate: 0.02713994637058365
Weight decay: 0.0015961140401311632
Epsilon: 1.1953849586282226e-08
Batch size: 201
Number of epochs: 64


Epochs:   0%|          | 0/64 [00:00<?, ?it/s]
Training:   0%|          | 0/70 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/70 [00:01<01:47,  1.55s/it][A
Training:   3%|▎         | 2/70 [00:01<00:54,  1.26it/s][A
Training:   7%|▋         | 5/70 [00:02<00:30,  2.14it/s][A
Training:   9%|▊         | 6/70 [00:03<00:28,  2.29it/s][A
Training:  10%|█         | 7/70 [00:03<00:22,  2.86it/s][A
Training:  13%|█▎        | 9/70 [00:04<00:26,  2.29it/s][A
Training:  14%|█▍        | 10/70 [00:04<00:22,  2.68it/s][A
Training:  17%|█▋        | 12/70 [00:04<00:14,  3.95it/s][A
Training:  19%|█▊        | 13/70 [00:05<00:23,  2.38it/s][A
Training:  23%|██▎       | 16/70 [00:05<00:12,  4.29it/s][A
Training:  26%|██▌       | 18/70 [00:07<00:19,  2.74it/s][A
Training:  30%|███       | 21/70 [00:08<00:19,  2.54it/s][A
Training:  34%|███▍      | 24/70 [00:08<00:12,  3.82it/s][A
Training:  37%|███▋      | 26/70 [00:09<00:15,  2.85it/s][A
Training:  40%|████      | 28/70 [00:09<00:11,  3.65i

Epoch: 1/64 - Loss: 15.5175 - Accuracy: 0.7928



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:01<00:11,  1.45s/it][A
 33%|███▎      | 3/9 [00:01<00:02,  2.38it/s][A
 56%|█████▌    | 5/9 [00:02<00:02,  1.82it/s][A
100%|██████████| 9/9 [00:03<00:00,  2.40it/s][A
Epochs:   0%|          | 0/64 [00:27<?, ?it/s]
[32m[I 2023-12-14 23:58:25,835][0m Trial 8 pruned. [0m


Val Loss: 5.4889 - Val Accuracy: 0.8764
Learning rate for Loss: 0.00016092774588079742
Learning rate: 0.002952527785624987
Weight decay: 0.0004422628981911029
Epsilon: 1.2457860298352204e-09
Batch size: 51
Number of epochs: 18


Epochs:   0%|          | 0/18 [00:00<?, ?it/s]
Training:   0%|          | 0/274 [00:00<?, ?it/s][A
Training:   0%|          | 1/274 [00:00<04:04,  1.11it/s][A
Training:   1%|          | 3/274 [00:01<01:15,  3.57it/s][A
Training:   2%|▏         | 5/274 [00:01<00:49,  5.47it/s][A
Training:   3%|▎         | 8/274 [00:01<00:28,  9.31it/s][A
Training:   4%|▎         | 10/274 [00:01<00:29,  8.90it/s][A
Training:   5%|▍         | 13/274 [00:01<00:27,  9.39it/s][A
Training:   6%|▌         | 17/274 [00:02<00:26,  9.71it/s][A
Training:   8%|▊         | 21/274 [00:02<00:25,  9.78it/s][A
Training:   9%|▉         | 24/274 [00:02<00:21, 11.65it/s][A
Training:   9%|▉         | 26/274 [00:03<00:24, 10.22it/s][A
Training:  11%|█         | 29/274 [00:03<00:22, 10.78it/s][A
Training:  12%|█▏        | 33/274 [00:03<00:20, 11.57it/s][A
Training:  14%|█▎        | 37/274 [00:03<00:19, 12.40it/s][A
Training:  15%|█▍        | 41/274 [00:04<00:17, 13.37it/s][A
Training:  16%|█▋        | 45/274 [0

Epoch: 1/18 - Loss: 8.2216 - Accuracy: 0.8616



  0%|          | 0/35 [00:00<?, ?it/s][A
  3%|▎         | 1/35 [00:00<00:20,  1.66it/s][A
  6%|▌         | 2/35 [00:00<00:10,  3.15it/s][A
 14%|█▍        | 5/35 [00:00<00:03,  7.51it/s][A
 20%|██        | 7/35 [00:01<00:03,  8.75it/s][A
 26%|██▌       | 9/35 [00:01<00:02,  9.86it/s][A
 31%|███▏      | 11/35 [00:01<00:02,  9.49it/s][A
 40%|████      | 14/35 [00:01<00:02,  8.77it/s][A
 49%|████▊     | 17/35 [00:01<00:01, 11.63it/s][A
 54%|█████▍    | 19/35 [00:02<00:01, 10.04it/s][A
 63%|██████▎   | 22/35 [00:02<00:01,  9.83it/s][A
 71%|███████▏  | 25/35 [00:02<00:00, 11.89it/s][A
 77%|███████▋  | 27/35 [00:02<00:00, 11.25it/s][A
 83%|████████▎ | 29/35 [00:03<00:00, 11.44it/s][A
 91%|█████████▏| 32/35 [00:03<00:00, 14.27it/s][A
100%|██████████| 35/35 [00:03<00:00,  9.72it/s][A
Epochs:   6%|▌         | 1/18 [00:27<07:48, 27.53s/it]

Val Loss: 5.4478 - Val Accuracy: 0.9199



Training:   0%|          | 0/274 [00:00<?, ?it/s][A
Training:   0%|          | 1/274 [00:00<02:42,  1.68it/s][A
Training:   1%|▏         | 4/274 [00:00<00:42,  6.41it/s][A
Training:   2%|▏         | 6/274 [00:00<00:32,  8.34it/s][A
Training:   3%|▎         | 8/274 [00:01<00:26, 10.17it/s][A
Training:   4%|▎         | 10/274 [00:01<00:26, 10.14it/s][A
Training:   4%|▍         | 12/274 [00:01<00:24, 10.51it/s][A
Training:   5%|▌         | 14/274 [00:01<00:21, 12.01it/s][A
Training:   6%|▌         | 16/274 [00:01<00:21, 12.19it/s][A
Training:   7%|▋         | 18/274 [00:01<00:23, 10.81it/s][A
Training:   8%|▊         | 21/274 [00:02<00:19, 12.91it/s][A
Training:   8%|▊         | 23/274 [00:02<00:19, 12.57it/s][A
Training:   9%|▉         | 25/274 [00:02<00:19, 12.76it/s][A
Training:  10%|▉         | 27/274 [00:02<00:19, 12.78it/s][A
Training:  11%|█         | 29/274 [00:02<00:20, 12.18it/s][A
Training:  11%|█▏        | 31/274 [00:02<00:21, 11.52it/s][A
Training:  12%|█▏   

Epoch: 2/18 - Loss: 4.6355 - Accuracy: 0.9075



  0%|          | 0/35 [00:00<?, ?it/s][A
  3%|▎         | 1/35 [00:00<00:24,  1.36it/s][A
 11%|█▏        | 4/35 [00:00<00:05,  5.80it/s][A
 17%|█▋        | 6/35 [00:01<00:04,  6.87it/s][A
 26%|██▌       | 9/35 [00:01<00:03,  6.86it/s][A
 37%|███▋      | 13/35 [00:01<00:02,  8.56it/s][A
 49%|████▊     | 17/35 [00:02<00:01,  9.34it/s][A
 60%|██████    | 21/35 [00:02<00:01, 10.75it/s][A
 66%|██████▌   | 23/35 [00:02<00:01, 11.57it/s][A
 71%|███████▏  | 25/35 [00:02<00:00, 11.50it/s][A
 77%|███████▋  | 27/35 [00:02<00:00, 12.78it/s][A
 83%|████████▎ | 29/35 [00:03<00:00, 11.81it/s][A
 91%|█████████▏| 32/35 [00:03<00:00, 13.43it/s][A
100%|██████████| 35/35 [00:03<00:00,  9.89it/s][A
Epochs:  11%|█         | 2/18 [00:54<07:16, 27.29s/it]

Val Loss: 4.5052 - Val Accuracy: 0.9186



Training:   0%|          | 0/274 [00:00<?, ?it/s][A
Training:   0%|          | 1/274 [00:00<03:27,  1.31it/s][A
Training:   1%|          | 2/274 [00:00<01:49,  2.49it/s][A
Training:   2%|▏         | 5/274 [00:01<00:42,  6.37it/s][A
Training:   3%|▎         | 7/274 [00:01<00:34,  7.79it/s][A
Training:   3%|▎         | 9/274 [00:01<00:29,  9.03it/s][A
Training:   4%|▍         | 11/274 [00:01<00:32,  8.02it/s][A
Training:   5%|▌         | 14/274 [00:01<00:23, 11.22it/s][A
Training:   6%|▌         | 16/274 [00:02<00:26,  9.90it/s][A
Training:   7%|▋         | 19/274 [00:02<00:24, 10.58it/s][A
Training:   8%|▊         | 21/274 [00:02<00:21, 11.62it/s][A
Training:   8%|▊         | 23/274 [00:02<00:22, 11.30it/s][A
Training:   9%|▉         | 25/274 [00:02<00:20, 11.94it/s][A
Training:  10%|▉         | 27/274 [00:03<00:21, 11.54it/s][A
Training:  11%|█         | 29/274 [00:03<00:20, 11.79it/s][A
Training:  11%|█▏        | 31/274 [00:03<00:20, 11.61it/s][A
Training:  12%|█▏    

Epoch: 3/18 - Loss: 4.2085 - Accuracy: 0.9141



  0%|          | 0/35 [00:00<?, ?it/s][A
  3%|▎         | 1/35 [00:00<00:24,  1.39it/s][A
 11%|█▏        | 4/35 [00:00<00:05,  5.69it/s][A
 17%|█▋        | 6/35 [00:01<00:03,  7.39it/s][A
 23%|██▎       | 8/35 [00:01<00:03,  8.71it/s][A
 29%|██▊       | 10/35 [00:01<00:02,  8.86it/s][A
 34%|███▍      | 12/35 [00:01<00:02, 10.33it/s][A
 40%|████      | 14/35 [00:01<00:02, 10.36it/s][A
 46%|████▌     | 16/35 [00:01<00:01, 11.85it/s][A
 51%|█████▏    | 18/35 [00:02<00:01,  9.93it/s][A
 60%|██████    | 21/35 [00:02<00:01, 11.62it/s][A
 66%|██████▌   | 23/35 [00:02<00:01, 10.96it/s][A
 71%|███████▏  | 25/35 [00:02<00:00, 11.22it/s][A
 77%|███████▋  | 27/35 [00:02<00:00, 11.23it/s][A
 83%|████████▎ | 29/35 [00:02<00:00, 12.39it/s][A
 89%|████████▊ | 31/35 [00:03<00:00, 10.70it/s][A
100%|██████████| 35/35 [00:03<00:00,  9.80it/s][A
Epochs:  17%|█▋        | 3/18 [01:22<06:52, 27.49s/it]

Val Loss: 3.9007 - Val Accuracy: 0.9361



Training:   0%|          | 0/274 [00:00<?, ?it/s][A
Training:   0%|          | 1/274 [00:00<03:45,  1.21it/s][A
Training:   1%|▏         | 4/274 [00:00<00:51,  5.28it/s][A
Training:   2%|▏         | 6/274 [00:01<00:40,  6.69it/s][A
Training:   3%|▎         | 9/274 [00:01<00:34,  7.70it/s][A
Training:   4%|▍         | 11/274 [00:01<00:28,  9.22it/s][A
Training:   5%|▍         | 13/274 [00:01<00:29,  9.00it/s][A
Training:   5%|▌         | 15/274 [00:01<00:24, 10.71it/s][A
Training:   6%|▌         | 17/274 [00:02<00:25,  9.89it/s][A
Training:   7%|▋         | 19/274 [00:02<00:23, 10.98it/s][A
Training:   8%|▊         | 21/274 [00:02<00:20, 12.21it/s][A
Training:   8%|▊         | 23/274 [00:02<00:22, 11.10it/s][A
Training:   9%|▉         | 26/274 [00:03<00:25,  9.60it/s][A
Training:  11%|█         | 30/274 [00:03<00:25,  9.75it/s][A
Training:  12%|█▏        | 34/274 [00:03<00:24,  9.73it/s][A
Training:  14%|█▎        | 37/274 [00:03<00:20, 11.58it/s][A
Training:  14%|█▍   

Epoch: 4/18 - Loss: 3.9466 - Accuracy: 0.9213



  0%|          | 0/35 [00:00<?, ?it/s][A
  3%|▎         | 1/35 [00:00<00:23,  1.46it/s][A
 11%|█▏        | 4/35 [00:00<00:04,  6.22it/s][A
 17%|█▋        | 6/35 [00:01<00:04,  6.99it/s][A
 26%|██▌       | 9/35 [00:01<00:03,  8.04it/s][A
 37%|███▋      | 13/35 [00:01<00:02,  9.40it/s][A
 49%|████▊     | 17/35 [00:02<00:01,  9.84it/s][A
 57%|█████▋    | 20/35 [00:02<00:01, 12.25it/s][A
 63%|██████▎   | 22/35 [00:02<00:01, 10.94it/s][A
 71%|███████▏  | 25/35 [00:02<00:00, 10.08it/s][A
 83%|████████▎ | 29/35 [00:03<00:00, 10.36it/s][A
100%|██████████| 35/35 [00:03<00:00,  9.81it/s][A
Epochs:  22%|██▏       | 4/18 [01:49<06:23, 27.37s/it]

Val Loss: 3.7330 - Val Accuracy: 0.9345



Training:   0%|          | 0/274 [00:00<?, ?it/s][A
Training:   0%|          | 1/274 [00:00<02:32,  1.80it/s][A
Training:   1%|▏         | 4/274 [00:00<00:37,  7.27it/s][A
Training:   2%|▏         | 6/274 [00:00<00:37,  7.13it/s][A
Training:   3%|▎         | 9/274 [00:01<00:32,  8.25it/s][A
Training:   4%|▍         | 12/274 [00:01<00:22, 11.64it/s][A
Training:   5%|▌         | 14/274 [00:01<00:24, 10.58it/s][A
Training:   6%|▌         | 17/274 [00:01<00:26,  9.78it/s][A
Training:   7%|▋         | 19/274 [00:02<00:22, 11.23it/s][A
Training:   8%|▊         | 21/274 [00:02<00:27,  9.37it/s][A
Training:   8%|▊         | 23/274 [00:02<00:24, 10.45it/s][A
Training:   9%|▉         | 25/274 [00:02<00:26,  9.42it/s][A
Training:  11%|█         | 29/274 [00:03<00:23, 10.36it/s][A
Training:  11%|█▏        | 31/274 [00:03<00:22, 10.88it/s][A
Training:  12%|█▏        | 33/274 [00:03<00:25,  9.34it/s][A
Training:  14%|█▎        | 37/274 [00:03<00:23, 10.13it/s][A
Training:  15%|█▍   

Epoch: 5/18 - Loss: 3.6525 - Accuracy: 0.9279



  0%|          | 0/35 [00:00<?, ?it/s][A
  3%|▎         | 1/35 [00:00<00:19,  1.71it/s][A
 14%|█▍        | 5/35 [00:00<00:04,  6.70it/s][A
 26%|██▌       | 9/35 [00:01<00:03,  8.20it/s][A
 37%|███▋      | 13/35 [00:01<00:02,  9.23it/s][A
 49%|████▊     | 17/35 [00:02<00:01,  9.83it/s][A
 60%|██████    | 21/35 [00:02<00:01,  9.97it/s][A
 71%|███████▏  | 25/35 [00:02<00:00, 10.48it/s][A
 83%|████████▎ | 29/35 [00:03<00:00, 10.88it/s][A
 91%|█████████▏| 32/35 [00:03<00:00, 12.99it/s][A
100%|██████████| 35/35 [00:03<00:00,  9.93it/s][A
Epochs:  28%|██▊       | 5/18 [02:16<05:55, 27.36s/it]

Val Loss: 3.6912 - Val Accuracy: 0.9311



Training:   0%|          | 0/274 [00:00<?, ?it/s][A
Training:   0%|          | 1/274 [00:00<03:03,  1.48it/s][A
Training:   2%|▏         | 5/274 [00:00<00:41,  6.41it/s][A
Training:   3%|▎         | 8/274 [00:01<00:27,  9.82it/s][A
Training:   4%|▎         | 10/274 [00:01<00:28,  9.25it/s][A
Training:   4%|▍         | 12/274 [00:01<00:26,  9.85it/s][A
Training:   5%|▌         | 14/274 [00:01<00:24, 10.53it/s][A
Training:   6%|▌         | 16/274 [00:01<00:24, 10.61it/s][A
Training:   7%|▋         | 18/274 [00:02<00:28,  9.05it/s][A
Training:   7%|▋         | 20/274 [00:02<00:23, 10.66it/s][A
Training:   8%|▊         | 22/274 [00:02<00:29,  8.67it/s][A
Training:   9%|▉         | 25/274 [00:02<00:28,  8.69it/s][A
Training:  10%|█         | 28/274 [00:03<00:21, 11.38it/s][A
Training:  11%|█         | 30/274 [00:03<00:21, 11.55it/s][A
Training:  12%|█▏        | 32/274 [00:03<00:18, 12.85it/s][A
Training:  12%|█▏        | 34/274 [00:03<00:20, 11.56it/s][A
Training:  13%|█▎  

Epoch: 6/18 - Loss: 3.7399 - Accuracy: 0.9255



  0%|          | 0/35 [00:00<?, ?it/s][A
  3%|▎         | 1/35 [00:00<00:24,  1.39it/s][A
 14%|█▍        | 5/35 [00:01<00:05,  5.35it/s][A
 26%|██▌       | 9/35 [00:01<00:03,  7.81it/s][A
 37%|███▋      | 13/35 [00:01<00:02,  9.09it/s][A
 49%|████▊     | 17/35 [00:02<00:01, 11.05it/s][A
 57%|█████▋    | 20/35 [00:02<00:01, 13.33it/s][A
 63%|██████▎   | 22/35 [00:02<00:01, 12.44it/s][A
 69%|██████▊   | 24/35 [00:02<00:00, 13.19it/s][A
 74%|███████▍  | 26/35 [00:02<00:00, 11.30it/s][A
 83%|████████▎ | 29/35 [00:02<00:00, 11.72it/s][A
 89%|████████▊ | 31/35 [00:03<00:00, 12.36it/s][A
 94%|█████████▍| 33/35 [00:03<00:00, 11.39it/s][A
100%|██████████| 35/35 [00:03<00:00,  9.89it/s][A
Epochs:  33%|███▎      | 6/18 [02:44<05:29, 27.49s/it]

Val Loss: 4.3675 - Val Accuracy: 0.8856



Training:   0%|          | 0/274 [00:00<?, ?it/s][A
Training:   0%|          | 1/274 [00:00<03:48,  1.19it/s][A
Training:   2%|▏         | 5/274 [00:01<00:51,  5.21it/s][A
Training:   3%|▎         | 8/274 [00:01<00:32,  8.16it/s][A
Training:   4%|▎         | 10/274 [00:01<00:29,  8.89it/s][A
Training:   5%|▍         | 13/274 [00:01<00:29,  8.94it/s][A
Training:   6%|▌         | 17/274 [00:02<00:26,  9.86it/s][A
Training:   8%|▊         | 21/274 [00:02<00:24, 10.44it/s][A
Training:   9%|▉         | 25/274 [00:02<00:23, 10.76it/s][A
Training:  10%|█         | 28/274 [00:03<00:19, 12.45it/s][A
Training:  11%|█         | 30/274 [00:03<00:21, 11.16it/s][A
Training:  12%|█▏        | 33/274 [00:03<00:22, 10.50it/s][A
Training:  13%|█▎        | 36/274 [00:03<00:18, 12.57it/s][A
Training:  14%|█▍        | 38/274 [00:03<00:20, 11.52it/s][A
Training:  15%|█▍        | 41/274 [00:04<00:21, 10.84it/s][A
Training:  16%|█▋        | 45/274 [00:04<00:20, 11.16it/s][A
Training:  18%|█▊  

Epoch: 7/18 - Loss: 3.5937 - Accuracy: 0.9298



  0%|          | 0/35 [00:00<?, ?it/s][A
  3%|▎         | 1/35 [00:00<00:16,  2.05it/s][A
  6%|▌         | 2/35 [00:00<00:09,  3.50it/s][A
 14%|█▍        | 5/35 [00:00<00:03,  8.41it/s][A
 20%|██        | 7/35 [00:00<00:02,  9.50it/s][A
 26%|██▌       | 9/35 [00:01<00:02,  9.51it/s][A
 31%|███▏      | 11/35 [00:01<00:02, 10.37it/s][A
 37%|███▋      | 13/35 [00:01<00:02,  9.87it/s][A
 43%|████▎     | 15/35 [00:01<00:01, 11.64it/s][A
 49%|████▊     | 17/35 [00:01<00:01,  9.41it/s][A
 60%|██████    | 21/35 [00:02<00:01, 10.29it/s][A
 71%|███████▏  | 25/35 [00:02<00:00, 10.79it/s][A
 83%|████████▎ | 29/35 [00:02<00:00, 11.19it/s][A
100%|██████████| 35/35 [00:03<00:00, 10.14it/s][A
Epochs:  39%|███▉      | 7/18 [03:12<05:01, 27.45s/it]

Val Loss: 3.5995 - Val Accuracy: 0.9384



Training:   0%|          | 0/274 [00:00<?, ?it/s][A
Training:   0%|          | 1/274 [00:00<03:33,  1.28it/s][A
Training:   2%|▏         | 5/274 [00:01<00:50,  5.36it/s][A
Training:   3%|▎         | 8/274 [00:01<00:30,  8.70it/s][A
Training:   4%|▎         | 10/274 [00:01<00:33,  7.99it/s][A
Training:   4%|▍         | 12/274 [00:01<00:28,  9.08it/s][A
Training:   5%|▌         | 14/274 [00:01<00:26,  9.76it/s][A
Training:   6%|▌         | 16/274 [00:01<00:22, 11.56it/s][A
Training:   7%|▋         | 18/274 [00:02<00:24, 10.39it/s][A
Training:   8%|▊         | 21/274 [00:02<00:25,  9.74it/s][A
Training:   8%|▊         | 23/274 [00:02<00:22, 11.23it/s][A
Training:   9%|▉         | 25/274 [00:02<00:26,  9.31it/s][A
Training:  10%|█         | 28/274 [00:03<00:20, 12.30it/s][A
Training:  11%|█         | 30/274 [00:03<00:21, 11.11it/s][A
Training:  12%|█▏        | 33/274 [00:03<00:21, 11.12it/s][A
Training:  13%|█▎        | 36/274 [00:03<00:17, 13.91it/s][A
Training:  14%|█▍  

Epoch: 8/18 - Loss: 3.2700 - Accuracy: 0.9386



  0%|          | 0/35 [00:00<?, ?it/s][A
  3%|▎         | 1/35 [00:00<00:19,  1.73it/s][A
  6%|▌         | 2/35 [00:00<00:09,  3.34it/s][A
 14%|█▍        | 5/35 [00:00<00:03,  7.91it/s][A
 26%|██▌       | 9/35 [00:01<00:02, 10.37it/s][A
 31%|███▏      | 11/35 [00:01<00:02, 11.09it/s][A
 37%|███▋      | 13/35 [00:01<00:02, 10.71it/s][A
 43%|████▎     | 15/35 [00:01<00:01, 10.69it/s][A
 49%|████▊     | 17/35 [00:01<00:01, 12.36it/s][A
 54%|█████▍    | 19/35 [00:01<00:01, 11.51it/s][A
 60%|██████    | 21/35 [00:02<00:01, 13.10it/s][A
 66%|██████▌   | 23/35 [00:02<00:01, 10.94it/s][A
 71%|███████▏  | 25/35 [00:02<00:00, 12.29it/s][A
 77%|███████▋  | 27/35 [00:02<00:00, 11.95it/s][A
 83%|████████▎ | 29/35 [00:02<00:00, 12.28it/s][A
 89%|████████▊ | 31/35 [00:02<00:00, 12.56it/s][A
 94%|█████████▍| 33/35 [00:03<00:00, 13.56it/s][A
100%|██████████| 35/35 [00:03<00:00, 10.22it/s][A
Epochs:  44%|████▍     | 8/18 [03:39<04:33, 27.38s/it]

Val Loss: 4.0700 - Val Accuracy: 0.9369



Training:   0%|          | 0/274 [00:00<?, ?it/s][A
Training:   0%|          | 1/274 [00:00<03:36,  1.26it/s][A
Training:   2%|▏         | 5/274 [00:01<00:45,  5.97it/s][A
Training:   3%|▎         | 8/274 [00:01<00:27,  9.59it/s][A
Training:   4%|▎         | 10/274 [00:01<00:31,  8.43it/s][A
Training:   5%|▍         | 13/274 [00:01<00:29,  8.92it/s][A
Training:   6%|▌         | 16/274 [00:01<00:21, 11.90it/s][A
Training:   7%|▋         | 18/274 [00:02<00:26,  9.59it/s][A
Training:   8%|▊         | 21/274 [00:02<00:26,  9.48it/s][A
Training:   9%|▉         | 24/274 [00:02<00:20, 12.09it/s][A
Training:   9%|▉         | 26/274 [00:02<00:23, 10.62it/s][A
Training:  11%|█         | 29/274 [00:03<00:23, 10.37it/s][A
Training:  12%|█▏        | 33/274 [00:03<00:22, 10.84it/s][A
Training:  14%|█▎        | 37/274 [00:03<00:22, 10.45it/s][A
Training:  15%|█▍        | 41/274 [00:04<00:22, 10.54it/s][A
Training:  16%|█▌        | 44/274 [00:04<00:18, 12.46it/s][A
Training:  17%|█▋  

Epoch: 9/18 - Loss: 3.3242 - Accuracy: 0.9354



  0%|          | 0/35 [00:00<?, ?it/s][A
  3%|▎         | 1/35 [00:00<00:23,  1.46it/s][A
 14%|█▍        | 5/35 [00:00<00:04,  6.90it/s][A
 23%|██▎       | 8/35 [00:01<00:02, 10.36it/s][A
 29%|██▊       | 10/35 [00:01<00:02, 10.58it/s][A
 37%|███▋      | 13/35 [00:01<00:02, 10.47it/s][A
 49%|████▊     | 17/35 [00:01<00:01, 11.11it/s][A
 60%|██████    | 21/35 [00:02<00:01, 11.03it/s][A
 71%|███████▏  | 25/35 [00:02<00:00, 10.49it/s][A
 83%|████████▎ | 29/35 [00:02<00:00, 10.54it/s][A
100%|██████████| 35/35 [00:03<00:00, 10.22it/s][A
Epochs:  50%|█████     | 9/18 [04:06<04:06, 27.41s/it]

Val Loss: 3.6396 - Val Accuracy: 0.9324



Training:   0%|          | 0/274 [00:00<?, ?it/s][A
Training:   0%|          | 1/274 [00:00<03:08,  1.45it/s][A
Training:   1%|          | 3/274 [00:00<00:59,  4.52it/s][A
Training:   2%|▏         | 5/274 [00:00<00:41,  6.50it/s][A
Training:   3%|▎         | 7/274 [00:01<00:31,  8.59it/s][A
Training:   3%|▎         | 9/274 [00:01<00:29,  8.96it/s][A
Training:   4%|▍         | 11/274 [00:01<00:24, 10.54it/s][A
Training:   5%|▍         | 13/274 [00:01<00:27,  9.56it/s][A
Training:   6%|▌         | 17/274 [00:02<00:24, 10.51it/s][A
Training:   8%|▊         | 21/274 [00:02<00:23, 10.89it/s][A
Training:   9%|▉         | 24/274 [00:02<00:18, 13.49it/s][A
Training:   9%|▉         | 26/274 [00:02<00:20, 12.04it/s][A
Training:  11%|█         | 29/274 [00:02<00:18, 13.08it/s][A
Training:  11%|█▏        | 31/274 [00:03<00:21, 11.45it/s][A
Training:  12%|█▏        | 33/274 [00:03<00:22, 10.80it/s][A
Training:  13%|█▎        | 35/274 [00:03<00:22, 10.50it/s][A
Training:  14%|█▍    

Epoch: 10/18 - Loss: 3.2382 - Accuracy: 0.9360



  0%|          | 0/35 [00:00<?, ?it/s][A
  3%|▎         | 1/35 [00:00<00:22,  1.53it/s][A
 11%|█▏        | 4/35 [00:00<00:05,  5.66it/s][A
 14%|█▍        | 5/35 [00:01<00:05,  5.93it/s][A
 23%|██▎       | 8/35 [00:01<00:03,  8.71it/s][A
 29%|██▊       | 10/35 [00:01<00:02,  9.85it/s][A
 34%|███▍      | 12/35 [00:01<00:02,  8.78it/s][A
 43%|████▎     | 15/35 [00:01<00:01, 11.91it/s][A
 49%|████▊     | 17/35 [00:02<00:01, 10.45it/s][A
 57%|█████▋    | 20/35 [00:02<00:01, 10.80it/s][A
 69%|██████▊   | 24/35 [00:02<00:00, 11.40it/s][A
 77%|███████▋  | 27/35 [00:02<00:00, 14.07it/s][A
 83%|████████▎ | 29/35 [00:02<00:00, 11.76it/s][A
100%|██████████| 35/35 [00:03<00:00, 10.40it/s][A
Epochs:  56%|█████▌    | 10/18 [04:34<03:39, 27.45s/it]

Val Loss: 3.5071 - Val Accuracy: 0.9265



Training:   0%|          | 0/274 [00:00<?, ?it/s][A
Training:   0%|          | 1/274 [00:00<03:45,  1.21it/s][A
Training:   1%|          | 2/274 [00:01<02:11,  2.08it/s][A
Training:   2%|▏         | 6/274 [00:01<00:48,  5.57it/s][A
Training:   4%|▎         | 10/274 [00:01<00:38,  6.86it/s][A
Training:   5%|▌         | 14/274 [00:02<00:30,  8.44it/s][A
Training:   7%|▋         | 18/274 [00:02<00:28,  9.01it/s][A
Training:   8%|▊         | 22/274 [00:02<00:25, 10.04it/s][A
Training:   9%|▉         | 26/274 [00:03<00:24, 10.14it/s][A
Training:  11%|█         | 29/274 [00:03<00:20, 12.22it/s][A
Training:  11%|█▏        | 31/274 [00:03<00:21, 11.20it/s][A
Training:  12%|█▏        | 34/274 [00:03<00:21, 11.40it/s][A
Training:  14%|█▍        | 38/274 [00:04<00:18, 12.52it/s][A
Training:  15%|█▍        | 41/274 [00:04<00:15, 14.58it/s][A
Training:  16%|█▌        | 43/274 [00:04<00:19, 12.08it/s][A
Training:  16%|█▋        | 45/274 [00:04<00:17, 13.15it/s][A
Training:  17%|█▋  

Epoch: 11/18 - Loss: 3.2492 - Accuracy: 0.9357



  0%|          | 0/35 [00:00<?, ?it/s][A
  3%|▎         | 1/35 [00:00<00:25,  1.34it/s][A
 14%|█▍        | 5/35 [00:01<00:05,  5.63it/s][A
 26%|██▌       | 9/35 [00:01<00:03,  7.23it/s][A
 37%|███▋      | 13/35 [00:01<00:02,  8.82it/s][A
 49%|████▊     | 17/35 [00:02<00:01,  9.36it/s][A
 60%|██████    | 21/35 [00:02<00:01,  9.72it/s][A
 71%|███████▏  | 25/35 [00:02<00:00, 10.78it/s][A
 83%|████████▎ | 29/35 [00:03<00:00, 11.63it/s][A
100%|██████████| 35/35 [00:03<00:00, 10.00it/s][A
Epochs:  61%|██████    | 11/18 [05:02<03:13, 27.58s/it]

Val Loss: 4.0542 - Val Accuracy: 0.9317



Training:   0%|          | 0/274 [00:00<?, ?it/s][A
Training:   0%|          | 1/274 [00:00<03:11,  1.43it/s][A
Training:   2%|▏         | 5/274 [00:01<00:47,  5.65it/s][A
Training:   3%|▎         | 8/274 [00:01<00:29,  9.10it/s][A
Training:   4%|▎         | 10/274 [00:01<00:28,  9.24it/s][A
Training:   5%|▍         | 13/274 [00:01<00:28,  9.23it/s][A
Training:   6%|▌         | 17/274 [00:02<00:25, 10.04it/s][A
Training:   7%|▋         | 20/274 [00:02<00:19, 12.70it/s][A
Training:   8%|▊         | 22/274 [00:02<00:22, 11.16it/s][A
Training:   9%|▉         | 25/274 [00:02<00:21, 11.37it/s][A
Training:  11%|█         | 29/274 [00:02<00:19, 12.51it/s][A
Training:  12%|█▏        | 32/274 [00:03<00:16, 14.51it/s][A
Training:  12%|█▏        | 34/274 [00:03<00:21, 11.00it/s][A
Training:  14%|█▎        | 37/274 [00:03<00:22, 10.75it/s][A
Training:  15%|█▍        | 41/274 [00:04<00:21, 10.78it/s][A
Training:  16%|█▌        | 44/274 [00:04<00:17, 12.93it/s][A
Training:  17%|█▋  

Epoch: 12/18 - Loss: 3.2874 - Accuracy: 0.9337



  0%|          | 0/35 [00:00<?, ?it/s][A
  3%|▎         | 1/35 [00:00<00:24,  1.41it/s][A
  6%|▌         | 2/35 [00:00<00:12,  2.74it/s][A
 14%|█▍        | 5/35 [00:01<00:04,  6.44it/s][A
 23%|██▎       | 8/35 [00:01<00:02,  9.81it/s][A
 29%|██▊       | 10/35 [00:01<00:02,  9.38it/s][A
 37%|███▋      | 13/35 [00:01<00:02,  9.42it/s][A
 49%|████▊     | 17/35 [00:02<00:01, 10.57it/s][A
 57%|█████▋    | 20/35 [00:02<00:01, 13.24it/s][A
 63%|██████▎   | 22/35 [00:02<00:01, 10.84it/s][A
 71%|███████▏  | 25/35 [00:02<00:01,  9.35it/s][A
 83%|████████▎ | 29/35 [00:03<00:00, 10.01it/s][A
100%|██████████| 35/35 [00:03<00:00,  9.52it/s][A
Epochs:  67%|██████▋   | 12/18 [05:29<02:44, 27.42s/it]

Val Loss: 3.5053 - Val Accuracy: 0.9384



Training:   0%|          | 0/274 [00:00<?, ?it/s][A
Training:   0%|          | 1/274 [00:00<03:36,  1.26it/s][A
Training:   2%|▏         | 5/274 [00:01<00:48,  5.55it/s][A
Training:   3%|▎         | 7/274 [00:01<00:35,  7.45it/s][A
Training:   3%|▎         | 9/274 [00:01<00:32,  8.04it/s][A
Training:   4%|▍         | 11/274 [00:01<00:27,  9.42it/s][A
Training:   5%|▍         | 13/274 [00:01<00:25, 10.25it/s][A
Training:   5%|▌         | 15/274 [00:01<00:21, 12.04it/s][A
Training:   6%|▌         | 17/274 [00:02<00:22, 11.43it/s][A
Training:   7%|▋         | 19/274 [00:02<00:19, 12.82it/s][A
Training:   8%|▊         | 21/274 [00:02<00:19, 13.16it/s][A
Training:   8%|▊         | 23/274 [00:02<00:24, 10.31it/s][A
Training:   9%|▉         | 26/274 [00:02<00:27,  8.89it/s][A
Training:  11%|█         | 29/274 [00:03<00:21, 11.65it/s][A
Training:  11%|█▏        | 31/274 [00:03<00:22, 10.90it/s][A
Training:  12%|█▏        | 34/274 [00:03<00:25,  9.50it/s][A
Training:  14%|█▎   

Epoch: 13/18 - Loss: 3.1300 - Accuracy: 0.9354



  0%|          | 0/35 [00:00<?, ?it/s][A
  3%|▎         | 1/35 [00:00<00:21,  1.55it/s][A
 11%|█▏        | 4/35 [00:00<00:05,  5.86it/s][A
 17%|█▋        | 6/35 [00:00<00:03,  7.81it/s][A
 23%|██▎       | 8/35 [00:01<00:02,  9.20it/s][A
 29%|██▊       | 10/35 [00:01<00:02, 10.10it/s][A
 34%|███▍      | 12/35 [00:01<00:02, 10.53it/s][A
 40%|████      | 14/35 [00:01<00:01, 11.15it/s][A
 46%|████▌     | 16/35 [00:01<00:01, 11.55it/s][A
 51%|█████▏    | 18/35 [00:01<00:01, 11.16it/s][A
 57%|█████▋    | 20/35 [00:02<00:01, 11.80it/s][A
 63%|██████▎   | 22/35 [00:02<00:01, 11.76it/s][A
 69%|██████▊   | 24/35 [00:02<00:01, 10.42it/s][A
 77%|███████▋  | 27/35 [00:02<00:00, 10.57it/s][A
 83%|████████▎ | 29/35 [00:02<00:00, 11.14it/s][A
 89%|████████▊ | 31/35 [00:03<00:00,  9.92it/s][A
100%|██████████| 35/35 [00:03<00:00,  9.93it/s][A
Epochs:  72%|███████▏  | 13/18 [05:56<02:17, 27.43s/it]

Val Loss: 3.5408 - Val Accuracy: 0.9395



Training:   0%|          | 0/274 [00:00<?, ?it/s][A
Training:   0%|          | 1/274 [00:00<02:46,  1.63it/s][A
Training:   1%|          | 2/274 [00:00<01:27,  3.09it/s][A
Training:   2%|▏         | 5/274 [00:00<00:35,  7.66it/s][A
Training:   3%|▎         | 7/274 [00:01<00:27,  9.58it/s][A
Training:   3%|▎         | 9/274 [00:01<00:24, 10.66it/s][A
Training:   4%|▍         | 11/274 [00:01<00:26,  9.92it/s][A
Training:   5%|▍         | 13/274 [00:01<00:23, 10.89it/s][A
Training:   5%|▌         | 15/274 [00:01<00:20, 12.75it/s][A
Training:   6%|▌         | 17/274 [00:01<00:21, 12.18it/s][A
Training:   7%|▋         | 19/274 [00:02<00:23, 10.98it/s][A
Training:   8%|▊         | 21/274 [00:02<00:23, 10.99it/s][A
Training:   8%|▊         | 23/274 [00:02<00:22, 10.98it/s][A
Training:   9%|▉         | 25/274 [00:02<00:21, 11.46it/s][A
Training:  10%|▉         | 27/274 [00:02<00:26,  9.41it/s][A
Training:  11%|█         | 29/274 [00:03<00:22, 11.10it/s][A
Training:  11%|█▏    

Epoch: 14/18 - Loss: 3.0944 - Accuracy: 0.9367



  0%|          | 0/35 [00:00<?, ?it/s][A
  3%|▎         | 1/35 [00:00<00:24,  1.37it/s][A
 14%|█▍        | 5/35 [00:01<00:05,  5.64it/s][A
 26%|██▌       | 9/35 [00:01<00:03,  8.20it/s][A
 37%|███▋      | 13/35 [00:01<00:02, 10.13it/s][A
 46%|████▌     | 16/35 [00:01<00:01, 12.52it/s][A
 51%|█████▏    | 18/35 [00:01<00:01, 11.30it/s][A
 60%|██████    | 21/35 [00:02<00:01, 10.34it/s][A
 66%|██████▌   | 23/35 [00:02<00:01, 11.22it/s][A
 71%|███████▏  | 25/35 [00:02<00:00, 10.94it/s][A
 77%|███████▋  | 27/35 [00:02<00:00, 11.49it/s][A
 83%|████████▎ | 29/35 [00:03<00:00,  8.86it/s][A
100%|██████████| 35/35 [00:03<00:00,  9.63it/s][A
Epochs:  78%|███████▊  | 14/18 [06:24<01:50, 27.56s/it]

Val Loss: 3.3588 - Val Accuracy: 0.9384



Training:   0%|          | 0/274 [00:00<?, ?it/s][A
Training:   0%|          | 1/274 [00:00<03:13,  1.41it/s][A
Training:   1%|          | 3/274 [00:00<01:00,  4.45it/s][A
Training:   2%|▏         | 5/274 [00:01<00:43,  6.13it/s][A
Training:   3%|▎         | 9/274 [00:01<00:30,  8.76it/s][A
Training:   4%|▍         | 11/274 [00:01<00:25, 10.48it/s][A
Training:   5%|▍         | 13/274 [00:01<00:27,  9.46it/s][A
Training:   5%|▌         | 15/274 [00:01<00:24, 10.65it/s][A
Training:   6%|▌         | 17/274 [00:02<00:23, 11.06it/s][A
Training:   7%|▋         | 19/274 [00:02<00:20, 12.54it/s][A
Training:   8%|▊         | 21/274 [00:02<00:26,  9.40it/s][A
Training:   9%|▉         | 25/274 [00:02<00:24, 10.33it/s][A
Training:  11%|█         | 29/274 [00:03<00:23, 10.38it/s][A
Training:  11%|█▏        | 31/274 [00:03<00:21, 11.36it/s][A
Training:  12%|█▏        | 33/274 [00:03<00:22, 10.72it/s][A
Training:  13%|█▎        | 36/274 [00:03<00:17, 13.38it/s][A
Training:  14%|█▍   

Epoch: 15/18 - Loss: 3.1496 - Accuracy: 0.9367



  0%|          | 0/35 [00:00<?, ?it/s][A
  3%|▎         | 1/35 [00:00<00:19,  1.79it/s][A
 11%|█▏        | 4/35 [00:00<00:04,  6.40it/s][A
 17%|█▋        | 6/35 [00:00<00:03,  7.70it/s][A
 23%|██▎       | 8/35 [00:01<00:03,  8.55it/s][A
 29%|██▊       | 10/35 [00:01<00:02,  8.83it/s][A
 37%|███▋      | 13/35 [00:01<00:02, 10.11it/s][A
 43%|████▎     | 15/35 [00:01<00:01, 11.36it/s][A
 49%|████▊     | 17/35 [00:01<00:01, 10.67it/s][A
 54%|█████▍    | 19/35 [00:02<00:01, 12.09it/s][A
 60%|██████    | 21/35 [00:02<00:01, 12.03it/s][A
 66%|██████▌   | 23/35 [00:02<00:00, 12.99it/s][A
 71%|███████▏  | 25/35 [00:02<00:00, 13.68it/s][A
 77%|███████▋  | 27/35 [00:02<00:00, 12.22it/s][A
 86%|████████▌ | 30/35 [00:02<00:00, 12.10it/s][A
 94%|█████████▍| 33/35 [00:03<00:00, 14.52it/s][A
100%|██████████| 35/35 [00:03<00:00, 10.53it/s][A
Epochs:  83%|████████▎ | 15/18 [06:51<01:22, 27.48s/it]

Val Loss: 3.3533 - Val Accuracy: 0.9401



Training:   0%|          | 0/274 [00:00<?, ?it/s][A
Training:   0%|          | 1/274 [00:00<03:09,  1.44it/s][A
Training:   1%|          | 2/274 [00:00<01:50,  2.45it/s][A
Training:   1%|▏         | 4/274 [00:01<00:49,  5.45it/s][A
Training:   2%|▏         | 6/274 [00:01<00:43,  6.12it/s][A
Training:   3%|▎         | 9/274 [00:01<00:27,  9.50it/s][A
Training:   4%|▍         | 11/274 [00:01<00:27,  9.40it/s][A
Training:   5%|▍         | 13/274 [00:01<00:25, 10.11it/s][A
Training:   5%|▌         | 15/274 [00:02<00:25, 10.15it/s][A
Training:   6%|▌         | 17/274 [00:02<00:25, 10.09it/s][A
Training:   7%|▋         | 19/274 [00:02<00:24, 10.42it/s][A
Training:   8%|▊         | 21/274 [00:02<00:23, 10.60it/s][A
Training:   8%|▊         | 23/274 [00:02<00:22, 11.40it/s][A
Training:   9%|▉         | 25/274 [00:02<00:19, 12.57it/s][A
Training:  10%|▉         | 27/274 [00:02<00:18, 13.11it/s][A
Training:  11%|█         | 29/274 [00:03<00:17, 13.77it/s][A
Training:  11%|█▏    

Epoch: 16/18 - Loss: 3.0190 - Accuracy: 0.9393



  0%|          | 0/35 [00:00<?, ?it/s][A
  3%|▎         | 1/35 [00:00<00:24,  1.41it/s][A
 14%|█▍        | 5/35 [00:01<00:05,  5.31it/s][A
 26%|██▌       | 9/35 [00:01<00:03,  7.10it/s][A
 37%|███▋      | 13/35 [00:01<00:02,  9.04it/s][A
 49%|████▊     | 17/35 [00:02<00:01,  9.73it/s][A
 60%|██████    | 21/35 [00:02<00:01, 10.38it/s][A
 71%|███████▏  | 25/35 [00:02<00:00, 11.01it/s][A
 83%|████████▎ | 29/35 [00:03<00:00, 11.59it/s][A
100%|██████████| 35/35 [00:03<00:00, 10.03it/s][A
Epochs:  89%|████████▉ | 16/18 [07:18<00:54, 27.33s/it]

Val Loss: 3.3115 - Val Accuracy: 0.9339



Training:   0%|          | 0/274 [00:00<?, ?it/s][A
Training:   0%|          | 1/274 [00:00<03:30,  1.30it/s][A
Training:   1%|          | 3/274 [00:00<01:04,  4.21it/s][A
Training:   2%|▏         | 5/274 [00:01<00:49,  5.40it/s][A
Training:   3%|▎         | 8/274 [00:01<00:29,  9.14it/s][A
Training:   4%|▎         | 10/274 [00:01<00:31,  8.35it/s][A
Training:   4%|▍         | 12/274 [00:01<00:26, 10.02it/s][A
Training:   5%|▌         | 14/274 [00:02<00:31,  8.18it/s][A
Training:   6%|▌         | 16/274 [00:02<00:26,  9.92it/s][A
Training:   7%|▋         | 18/274 [00:02<00:27,  9.42it/s][A
Training:   8%|▊         | 21/274 [00:02<00:24, 10.49it/s][A
Training:   9%|▉         | 25/274 [00:02<00:22, 11.30it/s][A
Training:  11%|█         | 29/274 [00:03<00:20, 11.94it/s][A
Training:  12%|█▏        | 33/274 [00:03<00:18, 13.15it/s][A
Training:  13%|█▎        | 35/274 [00:03<00:17, 14.05it/s][A
Training:  14%|█▎        | 37/274 [00:03<00:20, 11.70it/s][A
Training:  15%|█▍   

Epoch: 17/18 - Loss: 2.9579 - Accuracy: 0.9395



  0%|          | 0/35 [00:00<?, ?it/s][A
  3%|▎         | 1/35 [00:00<00:24,  1.37it/s][A
 11%|█▏        | 4/35 [00:00<00:05,  6.01it/s][A
 17%|█▋        | 6/35 [00:01<00:04,  6.29it/s][A
 26%|██▌       | 9/35 [00:01<00:03,  8.34it/s][A
 31%|███▏      | 11/35 [00:01<00:02,  9.63it/s][A
 37%|███▋      | 13/35 [00:01<00:02,  9.47it/s][A
 49%|████▊     | 17/35 [00:02<00:01, 11.10it/s][A
 60%|██████    | 21/35 [00:02<00:01, 11.61it/s][A
 71%|███████▏  | 25/35 [00:02<00:00, 12.66it/s][A
 83%|████████▎ | 29/35 [00:02<00:00, 13.95it/s][A
 91%|█████████▏| 32/35 [00:02<00:00, 16.00it/s][A
100%|██████████| 35/35 [00:03<00:00, 10.48it/s][A
Epochs:  94%|█████████▍| 17/18 [07:46<00:27, 27.34s/it]

Val Loss: 3.5190 - Val Accuracy: 0.9380



Training:   0%|          | 0/274 [00:00<?, ?it/s][A
Training:   0%|          | 1/274 [00:00<03:39,  1.24it/s][A
Training:   1%|▏         | 4/274 [00:00<00:51,  5.24it/s][A
Training:   2%|▏         | 6/274 [00:01<00:43,  6.14it/s][A
Training:   3%|▎         | 9/274 [00:01<00:34,  7.71it/s][A
Training:   4%|▍         | 11/274 [00:01<00:28,  9.21it/s][A
Training:   5%|▍         | 13/274 [00:01<00:29,  8.71it/s][A
Training:   5%|▌         | 15/274 [00:01<00:25, 10.34it/s][A
Training:   6%|▌         | 17/274 [00:02<00:24, 10.32it/s][A
Training:   7%|▋         | 19/274 [00:02<00:21, 11.87it/s][A
Training:   8%|▊         | 21/274 [00:02<00:23, 10.80it/s][A
Training:   8%|▊         | 23/274 [00:02<00:20, 12.05it/s][A
Training:   9%|▉         | 25/274 [00:02<00:22, 10.93it/s][A
Training:  10%|▉         | 27/274 [00:03<00:22, 10.91it/s][A
Training:  11%|█         | 29/274 [00:03<00:20, 11.70it/s][A
Training:  11%|█▏        | 31/274 [00:03<00:22, 11.02it/s][A
Training:  12%|█▏   

Epoch: 18/18 - Loss: 2.9052 - Accuracy: 0.9390



  0%|          | 0/35 [00:00<?, ?it/s][A
  3%|▎         | 1/35 [00:00<00:22,  1.49it/s][A
 14%|█▍        | 5/35 [00:01<00:05,  5.35it/s][A
 26%|██▌       | 9/35 [00:01<00:03,  8.27it/s][A
 34%|███▍      | 12/35 [00:01<00:02, 11.24it/s][A
 40%|████      | 14/35 [00:01<00:02, 10.11it/s][A
 49%|████▊     | 17/35 [00:02<00:01, 10.05it/s][A
 60%|██████    | 21/35 [00:02<00:01, 10.65it/s][A
 71%|███████▏  | 25/35 [00:02<00:00, 11.55it/s][A
 83%|████████▎ | 29/35 [00:02<00:00, 12.00it/s][A
100%|██████████| 35/35 [00:03<00:00, 10.24it/s][A
Epochs: 100%|██████████| 18/18 [08:13<00:00, 27.41s/it]


Val Loss: 3.7839 - Val Accuracy: 0.9266


[32m[I 2023-12-15 00:06:39,925][0m Trial 9 finished with value: 0.9266106486320496 and parameters: {'loss_learning_rate': 0.00016092774588079742, 'learning_rate': 0.002952527785624987, 'weight_decay': 0.0004422628981911029, 'epsilon': 1.2457860298352204e-09, 'batch_size': 51, 'epochs': 18}. Best is trial 2 with value: 0.937753438949585.[0m


Learning rate for Loss: 0.0010478711028608547
Learning rate: 0.00020392119265454287
Weight decay: 0.0015091576033363992
Epsilon: 2.04163723324564e-08
Batch size: 135
Number of epochs: 34


Epochs:   0%|          | 0/34 [00:00<?, ?it/s]
Training:   0%|          | 0/104 [00:00<?, ?it/s][A
Training:   1%|          | 1/104 [00:01<02:01,  1.18s/it][A
Training:   2%|▏         | 2/104 [00:01<00:56,  1.81it/s][A
Training:   4%|▍         | 4/104 [00:01<00:25,  3.96it/s][A
Training:   5%|▍         | 5/104 [00:02<00:36,  2.73it/s][A
Training:   7%|▋         | 7/104 [00:02<00:21,  4.42it/s][A
Training:   9%|▊         | 9/104 [00:02<00:25,  3.78it/s][A
Training:  10%|▉         | 10/104 [00:03<00:23,  4.07it/s][A
Training:  12%|█▏        | 12/104 [00:03<00:15,  5.83it/s][A
Training:  13%|█▎        | 14/104 [00:03<00:23,  3.83it/s][A
Training:  15%|█▌        | 16/104 [00:04<00:17,  5.09it/s][A
Training:  16%|█▋        | 17/104 [00:04<00:20,  4.15it/s][A
Training:  17%|█▋        | 18/104 [00:04<00:22,  3.88it/s][A
Training:  20%|██        | 21/104 [00:05<00:18,  4.49it/s][A
Training:  21%|██        | 22/104 [00:05<00:20,  4.00it/s][A
Training:  24%|██▍       | 25/104 [00:

Epoch: 1/34 - Loss: 10.4300 - Accuracy: 0.7892



  0%|          | 0/13 [00:00<?, ?it/s][A
  8%|▊         | 1/13 [00:01<00:13,  1.15s/it][A
 15%|█▌        | 2/13 [00:01<00:07,  1.46it/s][A
 31%|███       | 4/13 [00:01<00:02,  3.46it/s][A
 38%|███▊      | 5/13 [00:02<00:02,  3.00it/s][A
 46%|████▌     | 6/13 [00:02<00:02,  2.65it/s][A
 69%|██████▉   | 9/13 [00:02<00:00,  4.16it/s][A
 77%|███████▋  | 10/13 [00:03<00:00,  3.69it/s][A
100%|██████████| 13/13 [00:03<00:00,  3.46it/s][A
Epochs:   3%|▎         | 1/34 [00:27<15:09, 27.57s/it]

Val Loss: 5.8551 - Val Accuracy: 0.9038



Training:   0%|          | 0/104 [00:00<?, ?it/s][A
Training:   1%|          | 1/104 [00:01<02:18,  1.34s/it][A
Training:   2%|▏         | 2/104 [00:01<01:18,  1.30it/s][A
Training:   5%|▍         | 5/104 [00:02<00:31,  3.16it/s][A
Training:   6%|▌         | 6/104 [00:02<00:33,  2.95it/s][A
Training:   9%|▊         | 9/104 [00:03<00:23,  3.98it/s][A
Training:  10%|▉         | 10/104 [00:03<00:25,  3.64it/s][A
Training:  12%|█▏        | 12/104 [00:03<00:18,  4.97it/s][A
Training:  12%|█▎        | 13/104 [00:03<00:20,  4.51it/s][A
Training:  13%|█▎        | 14/104 [00:04<00:21,  4.19it/s][A
Training:  15%|█▌        | 16/104 [00:04<00:15,  5.85it/s][A
Training:  16%|█▋        | 17/104 [00:04<00:20,  4.34it/s][A
Training:  17%|█▋        | 18/104 [00:05<00:21,  3.98it/s][A
Training:  20%|██        | 21/104 [00:05<00:18,  4.58it/s][A
Training:  21%|██        | 22/104 [00:05<00:19,  4.25it/s][A
Training:  22%|██▏       | 23/104 [00:06<00:17,  4.74it/s][A
Training:  24%|██▍   

Epoch: 2/34 - Loss: 5.2575 - Accuracy: 0.9103



  0%|          | 0/13 [00:00<?, ?it/s][A
  8%|▊         | 1/13 [00:01<00:15,  1.32s/it][A
 38%|███▊      | 5/13 [00:02<00:02,  2.89it/s][A
 46%|████▌     | 6/13 [00:02<00:02,  3.43it/s][A
 62%|██████▏   | 8/13 [00:02<00:00,  5.06it/s][A
 77%|███████▋  | 10/13 [00:02<00:00,  4.07it/s][A
100%|██████████| 13/13 [00:03<00:00,  3.70it/s][A
Epochs:   6%|▌         | 2/34 [00:55<14:40, 27.52s/it]

Val Loss: 4.5764 - Val Accuracy: 0.9158



Training:   0%|          | 0/104 [00:00<?, ?it/s][A
Training:   1%|          | 1/104 [00:01<02:14,  1.31s/it][A
Training:   2%|▏         | 2/104 [00:01<01:02,  1.64it/s][A
Training:   4%|▍         | 4/104 [00:01<00:26,  3.82it/s][A
Training:   6%|▌         | 6/104 [00:02<00:30,  3.17it/s][A
Training:   8%|▊         | 8/104 [00:02<00:20,  4.80it/s][A
Training:  10%|▉         | 10/104 [00:03<00:23,  3.97it/s][A
Training:  12%|█▎        | 13/104 [00:04<00:25,  3.59it/s][A
Training:  14%|█▍        | 15/104 [00:04<00:18,  4.70it/s][A
Training:  16%|█▋        | 17/104 [00:04<00:22,  3.88it/s][A
Training:  17%|█▋        | 18/104 [00:04<00:20,  4.17it/s][A
Training:  20%|██        | 21/104 [00:05<00:20,  4.14it/s][A
Training:  23%|██▎       | 24/104 [00:05<00:13,  5.96it/s][A
Training:  25%|██▌       | 26/104 [00:06<00:15,  4.92it/s][A
Training:  27%|██▋       | 28/104 [00:06<00:12,  5.93it/s][A
Training:  28%|██▊       | 29/104 [00:07<00:17,  4.19it/s][A
Training:  29%|██▉   

Epoch: 3/34 - Loss: 4.3991 - Accuracy: 0.9249



  0%|          | 0/13 [00:00<?, ?it/s][A
  8%|▊         | 1/13 [00:01<00:13,  1.14s/it][A
 38%|███▊      | 5/13 [00:01<00:02,  3.06it/s][A
 69%|██████▉   | 9/13 [00:02<00:01,  3.82it/s][A
100%|██████████| 13/13 [00:03<00:00,  3.66it/s][A
Epochs:   6%|▌         | 2/34 [01:22<22:02, 41.34s/it]
[32m[I 2023-12-15 00:08:03,177][0m Trial 10 pruned. [0m


Val Loss: 4.4614 - Val Accuracy: 0.9232
Learning rate for Loss: 0.0005475502239825571
Learning rate: 0.0011125954409380188
Weight decay: 0.004132770040241243
Epsilon: 3.4960361296560697e-08
Batch size: 273
Number of epochs: 89


Epochs:   0%|          | 0/89 [00:00<?, ?it/s]
Training:   0%|          | 0/52 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/52 [00:02<01:57,  2.31s/it][A
Training:   4%|▍         | 2/52 [00:02<00:53,  1.08s/it][A
Training:  10%|▉         | 5/52 [00:04<00:32,  1.44it/s][A
Training:  12%|█▏        | 6/52 [00:04<00:27,  1.69it/s][A
Training:  13%|█▎        | 7/52 [00:04<00:21,  2.13it/s][A
Training:  15%|█▌        | 8/52 [00:04<00:16,  2.66it/s][A
Training:  17%|█▋        | 9/52 [00:06<00:27,  1.56it/s][A
Training:  19%|█▉        | 10/52 [00:06<00:21,  1.93it/s][A
Training:  23%|██▎       | 12/52 [00:06<00:12,  3.22it/s][A
Training:  25%|██▌       | 13/52 [00:07<00:23,  1.67it/s][A
Training:  29%|██▉       | 15/52 [00:08<00:14,  2.58it/s][A
Training:  33%|███▎      | 17/52 [00:09<00:18,  1.87it/s][A
Training:  37%|███▋      | 19/52 [00:09<00:12,  2.67it/s][A
Training:  38%|███▊      | 20/52 [00:09<00:10,  3.11it/s][A
Training:  40%|████      | 21/52 [00:11<00:18,  1.69it

Epoch: 1/89 - Loss: 10.2652 - Accuracy: 0.7907



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:11,  1.91s/it][A
 43%|████▎     | 3/7 [00:02<00:02,  1.81it/s][A
100%|██████████| 7/7 [00:03<00:00,  1.82it/s][A
Epochs:   1%|          | 1/89 [00:27<40:58, 27.94s/it]

Val Loss: 5.3800 - Val Accuracy: 0.9040



Training:   0%|          | 0/52 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/52 [00:02<01:54,  2.24s/it][A
Training:   4%|▍         | 2/52 [00:02<00:49,  1.02it/s][A
Training:  10%|▉         | 5/52 [00:04<00:34,  1.37it/s][A
Training:  12%|█▏        | 6/52 [00:04<00:26,  1.75it/s][A
Training:  13%|█▎        | 7/52 [00:04<00:20,  2.21it/s][A
Training:  15%|█▌        | 8/52 [00:04<00:15,  2.77it/s][A
Training:  17%|█▋        | 9/52 [00:05<00:28,  1.53it/s][A
Training:  21%|██        | 11/52 [00:06<00:16,  2.49it/s][A
Training:  25%|██▌       | 13/52 [00:07<00:22,  1.77it/s][A
Training:  29%|██▉       | 15/52 [00:08<00:14,  2.51it/s][A
Training:  33%|███▎      | 17/52 [00:09<00:18,  1.94it/s][A
Training:  35%|███▍      | 18/52 [00:09<00:14,  2.30it/s][A
Training:  37%|███▋      | 19/52 [00:09<00:12,  2.75it/s][A
Training:  40%|████      | 21/52 [00:11<00:15,  2.01it/s][A
Training:  46%|████▌     | 24/52 [00:11<00:08,  3.40it/s][A
Training:  50%|█████     | 26/52 [00:12

Epoch: 2/89 - Loss: 4.8948 - Accuracy: 0.9131



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:02<00:14,  2.39s/it][A
 43%|████▎     | 3/7 [00:02<00:02,  1.48it/s][A
100%|██████████| 7/7 [00:04<00:00,  1.66it/s][A
Epochs:   2%|▏         | 2/89 [00:55<40:36, 28.01s/it]

Val Loss: 4.5955 - Val Accuracy: 0.9147



Training:   0%|          | 0/52 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/52 [00:02<02:00,  2.35s/it][A
Training:   4%|▍         | 2/52 [00:02<00:56,  1.13s/it][A
Training:   6%|▌         | 3/52 [00:02<00:33,  1.47it/s][A
Training:  10%|▉         | 5/52 [00:04<00:33,  1.42it/s][A
Training:  12%|█▏        | 6/52 [00:04<00:27,  1.69it/s][A
Training:  13%|█▎        | 7/52 [00:04<00:20,  2.23it/s][A
Training:  17%|█▋        | 9/52 [00:06<00:25,  1.71it/s][A
Training:  19%|█▉        | 10/52 [00:06<00:22,  1.87it/s][A
Training:  23%|██▎       | 12/52 [00:06<00:13,  2.96it/s][A
Training:  25%|██▌       | 13/52 [00:08<00:22,  1.73it/s][A
Training:  27%|██▋       | 14/52 [00:08<00:19,  1.97it/s][A
Training:  29%|██▉       | 15/52 [00:08<00:15,  2.44it/s][A
Training:  33%|███▎      | 17/52 [00:09<00:18,  1.85it/s][A
Training:  35%|███▍      | 18/52 [00:10<00:17,  1.92it/s][A
Training:  40%|████      | 21/52 [00:11<00:14,  2.08it/s][A
Training:  42%|████▏     | 22/52 [00:11

Epoch: 3/89 - Loss: 4.2458 - Accuracy: 0.9251



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:02<00:13,  2.29s/it][A
 43%|████▎     | 3/7 [00:02<00:02,  1.53it/s][A
 57%|█████▋    | 4/7 [00:02<00:01,  2.11it/s][A
100%|██████████| 7/7 [00:04<00:00,  1.68it/s][A
Epochs:   3%|▎         | 3/89 [01:24<40:16, 28.10s/it]

Val Loss: 3.7845 - Val Accuracy: 0.9358



Training:   0%|          | 0/52 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/52 [00:02<01:46,  2.09s/it][A
Training:   6%|▌         | 3/52 [00:02<00:29,  1.68it/s][A
Training:  10%|▉         | 5/52 [00:03<00:29,  1.59it/s][A
Training:  12%|█▏        | 6/52 [00:04<00:27,  1.68it/s][A
Training:  15%|█▌        | 8/52 [00:04<00:16,  2.69it/s][A
Training:  17%|█▋        | 9/52 [00:05<00:21,  1.97it/s][A
Training:  19%|█▉        | 10/52 [00:05<00:24,  1.74it/s][A
Training:  23%|██▎       | 12/52 [00:06<00:14,  2.77it/s][A
Training:  25%|██▌       | 13/52 [00:06<00:17,  2.17it/s][A
Training:  27%|██▋       | 14/52 [00:07<00:21,  1.76it/s][A
Training:  33%|███▎      | 17/52 [00:08<00:14,  2.39it/s][A
Training:  35%|███▍      | 18/52 [00:09<00:17,  1.94it/s][A
Training:  37%|███▋      | 19/52 [00:09<00:14,  2.32it/s][A
Training:  40%|████      | 21/52 [00:10<00:10,  2.97it/s][A
Training:  42%|████▏     | 22/52 [00:11<00:16,  1.84it/s][A
Training:  44%|████▍     | 23/52 [00:1

Epoch: 4/89 - Loss: 3.9667 - Accuracy: 0.9298



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:02<00:13,  2.19s/it][A
 29%|██▊       | 2/7 [00:02<00:04,  1.03it/s][A
 43%|████▎     | 3/7 [00:02<00:02,  1.58it/s][A
 57%|█████▋    | 4/7 [00:02<00:01,  2.34it/s][A
 71%|███████▏  | 5/7 [00:03<00:01,  1.46it/s][A
100%|██████████| 7/7 [00:04<00:00,  1.71it/s][A
Epochs:   4%|▍         | 4/89 [01:52<39:49, 28.11s/it]

Val Loss: 3.6733 - Val Accuracy: 0.9341



Training:   0%|          | 0/52 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/52 [00:02<01:56,  2.29s/it][A
Training:   6%|▌         | 3/52 [00:02<00:31,  1.57it/s][A
Training:  10%|▉         | 5/52 [00:03<00:32,  1.44it/s][A
Training:  12%|█▏        | 6/52 [00:04<00:27,  1.67it/s][A
Training:  15%|█▌        | 8/52 [00:04<00:16,  2.71it/s][A
Training:  17%|█▋        | 9/52 [00:05<00:23,  1.83it/s][A
Training:  19%|█▉        | 10/52 [00:06<00:23,  1.81it/s][A
Training:  23%|██▎       | 12/52 [00:06<00:13,  2.87it/s][A
Training:  25%|██▌       | 13/52 [00:07<00:23,  1.68it/s][A
Training:  31%|███       | 16/52 [00:07<00:11,  3.13it/s][A
Training:  35%|███▍      | 18/52 [00:09<00:15,  2.17it/s][A
Training:  37%|███▋      | 19/52 [00:09<00:13,  2.46it/s][A
Training:  38%|███▊      | 20/52 [00:09<00:11,  2.90it/s][A
Training:  40%|████      | 21/52 [00:11<00:19,  1.57it/s][A
Training:  42%|████▏     | 22/52 [00:11<00:15,  1.97it/s][A
Training:  44%|████▍     | 23/52 [00:1

Epoch: 5/89 - Loss: 3.9500 - Accuracy: 0.9302



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:02<00:13,  2.29s/it][A
 43%|████▎     | 3/7 [00:02<00:02,  1.46it/s][A
 71%|███████▏  | 5/7 [00:03<00:01,  1.57it/s][A
100%|██████████| 7/7 [00:04<00:00,  1.73it/s][A
Epochs:   6%|▌         | 5/89 [02:19<39:07, 27.94s/it]

Val Loss: 4.0725 - Val Accuracy: 0.9189



Training:   0%|          | 0/52 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/52 [00:02<01:54,  2.24s/it][A
Training:   4%|▍         | 2/52 [00:02<00:55,  1.11s/it][A
Training:  10%|▉         | 5/52 [00:04<00:31,  1.48it/s][A
Training:  12%|█▏        | 6/52 [00:04<00:27,  1.66it/s][A
Training:  15%|█▌        | 8/52 [00:04<00:16,  2.62it/s][A
Training:  17%|█▋        | 9/52 [00:05<00:24,  1.76it/s][A
Training:  19%|█▉        | 10/52 [00:06<00:23,  1.81it/s][A
Training:  21%|██        | 11/52 [00:06<00:17,  2.28it/s][A
Training:  25%|██▌       | 13/52 [00:07<00:18,  2.14it/s][A
Training:  27%|██▋       | 14/52 [00:07<00:18,  2.07it/s][A
Training:  29%|██▉       | 15/52 [00:08<00:14,  2.57it/s][A
Training:  33%|███▎      | 17/52 [00:09<00:15,  2.20it/s][A
Training:  35%|███▍      | 18/52 [00:09<00:16,  2.04it/s][A
Training:  40%|████      | 21/52 [00:10<00:13,  2.31it/s][A
Training:  42%|████▏     | 22/52 [00:11<00:13,  2.22it/s][A
Training:  46%|████▌     | 24/52 [00:1

Epoch: 6/89 - Loss: 3.5114 - Accuracy: 0.9389



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:02<00:13,  2.25s/it][A
 29%|██▊       | 2/7 [00:02<00:05,  1.00s/it][A
100%|██████████| 7/7 [00:04<00:00,  1.66it/s][A
Epochs:   7%|▋         | 6/89 [02:47<38:35, 27.90s/it]

Val Loss: 4.8736 - Val Accuracy: 0.9142



Training:   0%|          | 0/52 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/52 [00:02<01:54,  2.24s/it][A
Training:   8%|▊         | 4/52 [00:02<00:22,  2.13it/s][A
Training:  12%|█▏        | 6/52 [00:04<00:29,  1.57it/s][A
Training:  13%|█▎        | 7/52 [00:04<00:23,  1.95it/s][A
Training:  17%|█▋        | 9/52 [00:05<00:25,  1.70it/s][A
Training:  19%|█▉        | 10/52 [00:05<00:20,  2.06it/s][A
Training:  23%|██▎       | 12/52 [00:05<00:13,  3.05it/s][A
Training:  25%|██▌       | 13/52 [00:07<00:21,  1.84it/s][A
Training:  27%|██▋       | 14/52 [00:07<00:17,  2.15it/s][A
Training:  29%|██▉       | 15/52 [00:07<00:13,  2.66it/s][A
Training:  31%|███       | 16/52 [00:07<00:12,  2.82it/s][A
Training:  33%|███▎      | 17/52 [00:09<00:21,  1.62it/s][A
Training:  35%|███▍      | 18/52 [00:09<00:17,  1.92it/s][A
Training:  38%|███▊      | 20/52 [00:09<00:10,  3.18it/s][A
Training:  40%|████      | 21/52 [00:10<00:17,  1.73it/s][A
Training:  44%|████▍     | 23/52 [00:

Epoch: 7/89 - Loss: 3.9039 - Accuracy: 0.9299



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:02<00:13,  2.31s/it][A
100%|██████████| 7/7 [00:03<00:00,  1.82it/s][A
Epochs:   8%|▊         | 7/89 [03:14<37:40, 27.57s/it]

Val Loss: 4.9024 - Val Accuracy: 0.9189



Training:   0%|          | 0/52 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/52 [00:02<01:53,  2.23s/it][A
Training:   4%|▍         | 2/52 [00:02<00:59,  1.20s/it][A
Training:  10%|▉         | 5/52 [00:03<00:30,  1.54it/s][A
Training:  12%|█▏        | 6/52 [00:04<00:30,  1.53it/s][A
Training:  17%|█▋        | 9/52 [00:05<00:22,  1.88it/s][A
Training:  19%|█▉        | 10/52 [00:06<00:20,  2.05it/s][A
Training:  23%|██▎       | 12/52 [00:06<00:13,  3.04it/s][A
Training:  25%|██▌       | 13/52 [00:07<00:21,  1.83it/s][A
Training:  27%|██▋       | 14/52 [00:08<00:19,  1.97it/s][A
Training:  33%|███▎      | 17/52 [00:09<00:16,  2.09it/s][A
Training:  35%|███▍      | 18/52 [00:09<00:15,  2.14it/s][A
Training:  37%|███▋      | 19/52 [00:09<00:13,  2.54it/s][A
Training:  38%|███▊      | 20/52 [00:10<00:10,  3.06it/s][A
Training:  40%|████      | 21/52 [00:11<00:17,  1.81it/s][A
Training:  42%|████▏     | 22/52 [00:11<00:15,  1.95it/s][A
Training:  44%|████▍     | 23/52 [00:

Epoch: 8/89 - Loss: 3.6304 - Accuracy: 0.9351



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:02<00:12,  2.14s/it][A
 29%|██▊       | 2/7 [00:02<00:05,  1.13s/it][A
 57%|█████▋    | 4/7 [00:02<00:01,  2.13it/s][A
 71%|███████▏  | 5/7 [00:03<00:01,  1.52it/s][A
100%|██████████| 7/7 [00:04<00:00,  1.66it/s][A
Epochs:   9%|▉         | 8/89 [03:43<37:38, 27.88s/it]

Val Loss: 3.5286 - Val Accuracy: 0.9350



Training:   0%|          | 0/52 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/52 [00:02<01:52,  2.20s/it][A
Training:   4%|▍         | 2/52 [00:02<00:49,  1.02it/s][A
Training:   8%|▊         | 4/52 [00:02<00:21,  2.22it/s][A
Training:  10%|▉         | 5/52 [00:03<00:33,  1.39it/s][A
Training:  12%|█▏        | 6/52 [00:04<00:24,  1.84it/s][A
Training:  15%|█▌        | 8/52 [00:04<00:14,  3.05it/s][A
Training:  17%|█▋        | 9/52 [00:05<00:25,  1.67it/s][A
Training:  19%|█▉        | 10/52 [00:05<00:20,  2.10it/s][A
Training:  23%|██▎       | 12/52 [00:05<00:11,  3.39it/s][A
Training:  27%|██▋       | 14/52 [00:07<00:20,  1.89it/s][A
Training:  31%|███       | 16/52 [00:07<00:13,  2.73it/s][A
Training:  33%|███▎      | 17/52 [00:09<00:22,  1.54it/s][A
Training:  35%|███▍      | 18/52 [00:09<00:17,  1.90it/s][A
Training:  38%|███▊      | 20/52 [00:09<00:11,  2.83it/s][A
Training:  40%|████      | 21/52 [00:11<00:18,  1.68it/s][A
Training:  44%|████▍     | 23/52 [00:11

Epoch: 9/89 - Loss: 3.3749 - Accuracy: 0.9388



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:02<00:15,  2.55s/it][A
 29%|██▊       | 2/7 [00:02<00:05,  1.11s/it][A
 57%|█████▋    | 4/7 [00:02<00:01,  2.23it/s][A
100%|██████████| 7/7 [00:04<00:00,  1.63it/s][A
Epochs:  10%|█         | 9/89 [04:11<37:19, 28.00s/it]

Val Loss: 3.8209 - Val Accuracy: 0.9302



Training:   0%|          | 0/52 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/52 [00:02<01:50,  2.18s/it][A
Training:   4%|▍         | 2/52 [00:02<00:48,  1.03it/s][A
Training:   8%|▊         | 4/52 [00:02<00:19,  2.44it/s][A
Training:  10%|▉         | 5/52 [00:03<00:33,  1.41it/s][A
Training:  12%|█▏        | 6/52 [00:04<00:25,  1.78it/s][A
Training:  13%|█▎        | 7/52 [00:04<00:18,  2.37it/s][A
Training:  17%|█▋        | 9/52 [00:05<00:26,  1.59it/s][A
Training:  19%|█▉        | 10/52 [00:06<00:21,  1.95it/s][A
Training:  25%|██▌       | 13/52 [00:07<00:19,  1.98it/s][A
Training:  27%|██▋       | 14/52 [00:07<00:17,  2.21it/s][A
Training:  31%|███       | 16/52 [00:07<00:11,  3.12it/s][A
Training:  33%|███▎      | 17/52 [00:09<00:20,  1.71it/s][A
Training:  37%|███▋      | 19/52 [00:09<00:12,  2.55it/s][A
Training:  38%|███▊      | 20/52 [00:09<00:10,  2.99it/s][A
Training:  40%|████      | 21/52 [00:11<00:19,  1.56it/s][A
Training:  44%|████▍     | 23/52 [00:11

Epoch: 10/89 - Loss: 3.2994 - Accuracy: 0.9408



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:02<00:12,  2.11s/it][A
 43%|████▎     | 3/7 [00:02<00:02,  1.66it/s][A
100%|██████████| 7/7 [00:03<00:00,  1.84it/s][A
Epochs:  11%|█         | 10/89 [04:39<36:55, 28.05s/it]

Val Loss: 3.3849 - Val Accuracy: 0.9434



Training:   0%|          | 0/52 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/52 [00:02<01:58,  2.32s/it][A
Training:   4%|▍         | 2/52 [00:02<00:51,  1.02s/it][A
Training:   8%|▊         | 4/52 [00:02<00:21,  2.26it/s][A
Training:  10%|▉         | 5/52 [00:04<00:35,  1.32it/s][A
Training:  13%|█▎        | 7/52 [00:04<00:20,  2.23it/s][A
Training:  15%|█▌        | 8/52 [00:04<00:16,  2.68it/s][A
Training:  17%|█▋        | 9/52 [00:05<00:26,  1.60it/s][A
Training:  19%|█▉        | 10/52 [00:05<00:20,  2.07it/s][A
Training:  23%|██▎       | 12/52 [00:06<00:12,  3.26it/s][A
Training:  25%|██▌       | 13/52 [00:07<00:23,  1.65it/s][A
Training:  29%|██▉       | 15/52 [00:07<00:14,  2.52it/s][A
Training:  33%|███▎      | 17/52 [00:09<00:17,  1.99it/s][A
Training:  35%|███▍      | 18/52 [00:09<00:14,  2.32it/s][A
Training:  38%|███▊      | 20/52 [00:09<00:09,  3.38it/s][A
Training:  40%|████      | 21/52 [00:10<00:16,  1.92it/s][A
Training:  42%|████▏     | 22/52 [00:11

Epoch: 11/89 - Loss: 3.2976 - Accuracy: 0.9410



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:02<00:13,  2.22s/it][A
 29%|██▊       | 2/7 [00:02<00:05,  1.01s/it][A
 71%|███████▏  | 5/7 [00:03<00:01,  1.62it/s][A
100%|██████████| 7/7 [00:04<00:00,  1.75it/s][A
Epochs:  12%|█▏        | 11/89 [05:07<36:18, 27.93s/it]

Val Loss: 3.5224 - Val Accuracy: 0.9373



Training:   0%|          | 0/52 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/52 [00:02<01:57,  2.30s/it][A
Training:   6%|▌         | 3/52 [00:02<00:34,  1.44it/s][A
Training:   8%|▊         | 4/52 [00:02<00:24,  1.94it/s][A
Training:  10%|▉         | 5/52 [00:04<00:40,  1.16it/s][A
Training:  12%|█▏        | 6/52 [00:04<00:28,  1.59it/s][A
Training:  15%|█▌        | 8/52 [00:04<00:15,  2.78it/s][A
Training:  17%|█▋        | 9/52 [00:06<00:27,  1.57it/s][A
Training:  21%|██        | 11/52 [00:06<00:17,  2.40it/s][A
Training:  25%|██▌       | 13/52 [00:07<00:21,  1.80it/s][A
Training:  27%|██▋       | 14/52 [00:07<00:17,  2.16it/s][A
Training:  29%|██▉       | 15/52 [00:08<00:15,  2.38it/s][A
Training:  33%|███▎      | 17/52 [00:09<00:18,  1.90it/s][A
Training:  37%|███▋      | 19/52 [00:09<00:13,  2.48it/s][A
Training:  40%|████      | 21/52 [00:11<00:14,  2.09it/s][A
Training:  44%|████▍     | 23/52 [00:11<00:11,  2.52it/s][A
Training:  48%|████▊     | 25/52 [00:13

Epoch: 12/89 - Loss: 3.1782 - Accuracy: 0.9417



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:02<00:12,  2.02s/it][A
 29%|██▊       | 2/7 [00:02<00:04,  1.10it/s][A
 43%|████▎     | 3/7 [00:02<00:02,  1.68it/s][A
 71%|███████▏  | 5/7 [00:03<00:01,  1.59it/s][A
100%|██████████| 7/7 [00:03<00:00,  1.77it/s][A
Epochs:  13%|█▎        | 12/89 [05:35<35:52, 27.96s/it]

Val Loss: 3.4918 - Val Accuracy: 0.9418



Training:   0%|          | 0/52 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/52 [00:02<01:53,  2.22s/it][A
Training:   4%|▍         | 2/52 [00:02<00:48,  1.02it/s][A
Training:   8%|▊         | 4/52 [00:02<00:20,  2.37it/s][A
Training:  10%|▉         | 5/52 [00:04<00:37,  1.26it/s][A
Training:  13%|█▎        | 7/52 [00:04<00:20,  2.18it/s][A
Training:  15%|█▌        | 8/52 [00:04<00:16,  2.66it/s][A
Training:  17%|█▋        | 9/52 [00:06<00:30,  1.43it/s][A
Training:  19%|█▉        | 10/52 [00:06<00:22,  1.85it/s][A
Training:  21%|██        | 11/52 [00:06<00:17,  2.37it/s][A
Training:  23%|██▎       | 12/52 [00:06<00:13,  2.98it/s][A
Training:  25%|██▌       | 13/52 [00:07<00:27,  1.43it/s][A
Training:  27%|██▋       | 14/52 [00:08<00:20,  1.87it/s][A
Training:  29%|██▉       | 15/52 [00:08<00:15,  2.45it/s][A
Training:  33%|███▎      | 17/52 [00:09<00:17,  1.98it/s][A
Training:  37%|███▋      | 19/52 [00:09<00:11,  3.00it/s][A
Training:  40%|████      | 21/52 [00:11

Epoch: 13/89 - Loss: 3.5100 - Accuracy: 0.9366



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:02<00:14,  2.37s/it][A
 43%|████▎     | 3/7 [00:02<00:02,  1.48it/s][A
 71%|███████▏  | 5/7 [00:04<00:01,  1.39it/s][A
100%|██████████| 7/7 [00:04<00:00,  1.62it/s][A
Epochs:  15%|█▍        | 13/89 [06:03<35:28, 28.01s/it]

Val Loss: 3.8102 - Val Accuracy: 0.9241



Training:   0%|          | 0/52 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/52 [00:02<01:54,  2.24s/it][A
Training:   4%|▍         | 2/52 [00:02<00:52,  1.05s/it][A
Training:   6%|▌         | 3/52 [00:02<00:30,  1.59it/s][A
Training:  10%|▉         | 5/52 [00:03<00:30,  1.56it/s][A
Training:  12%|█▏        | 6/52 [00:04<00:25,  1.79it/s][A
Training:  13%|█▎        | 7/52 [00:04<00:19,  2.34it/s][A
Training:  17%|█▋        | 9/52 [00:05<00:21,  1.96it/s][A
Training:  19%|█▉        | 10/52 [00:06<00:22,  1.85it/s][A
Training:  25%|██▌       | 13/52 [00:07<00:16,  2.31it/s][A
Training:  27%|██▋       | 14/52 [00:07<00:18,  2.06it/s][A
Training:  29%|██▉       | 15/52 [00:08<00:15,  2.47it/s][A
Training:  33%|███▎      | 17/52 [00:09<00:15,  2.26it/s][A
Training:  35%|███▍      | 18/52 [00:09<00:16,  2.02it/s][A
Training:  37%|███▋      | 19/52 [00:09<00:13,  2.47it/s][A
Training:  40%|████      | 21/52 [00:10<00:13,  2.26it/s][A
Training:  42%|████▏     | 22/52 [00:11

Epoch: 14/89 - Loss: 3.4153 - Accuracy: 0.9382



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:02<00:12,  2.16s/it][A
 43%|████▎     | 3/7 [00:02<00:02,  1.67it/s][A
 71%|███████▏  | 5/7 [00:03<00:01,  1.53it/s][A
100%|██████████| 7/7 [00:03<00:00,  1.79it/s][A
Epochs:  16%|█▌        | 14/89 [06:31<35:06, 28.09s/it]

Val Loss: 3.8583 - Val Accuracy: 0.9339



Training:   0%|          | 0/52 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/52 [00:02<02:02,  2.41s/it][A
Training:   4%|▍         | 2/52 [00:02<00:52,  1.06s/it][A
Training:   6%|▌         | 3/52 [00:02<00:30,  1.59it/s][A
Training:  10%|▉         | 5/52 [00:03<00:30,  1.52it/s][A
Training:  12%|█▏        | 6/52 [00:04<00:22,  2.01it/s][A
Training:  15%|█▌        | 8/52 [00:04<00:13,  3.27it/s][A
Training:  17%|█▋        | 9/52 [00:05<00:22,  1.95it/s][A
Training:  19%|█▉        | 10/52 [00:05<00:18,  2.23it/s][A
Training:  21%|██        | 11/52 [00:05<00:14,  2.82it/s][A
Training:  25%|██▌       | 13/52 [00:06<00:17,  2.19it/s][A
Training:  27%|██▋       | 14/52 [00:07<00:15,  2.50it/s][A
Training:  29%|██▉       | 15/52 [00:07<00:12,  2.94it/s][A
Training:  31%|███       | 16/52 [00:07<00:09,  3.60it/s][A
Training:  33%|███▎      | 17/52 [00:08<00:18,  1.85it/s][A
Training:  35%|███▍      | 18/52 [00:08<00:14,  2.32it/s][A
Training:  37%|███▋      | 19/52 [00:09

Epoch: 15/89 - Loss: 3.0500 - Accuracy: 0.9438



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:02<00:12,  2.13s/it][A
 29%|██▊       | 2/7 [00:02<00:04,  1.05it/s][A
 43%|████▎     | 3/7 [00:02<00:02,  1.76it/s][A
100%|██████████| 7/7 [00:04<00:00,  1.67it/s][A
Epochs:  17%|█▋        | 15/89 [06:59<34:25, 27.91s/it]

Val Loss: 3.5496 - Val Accuracy: 0.9399



Training:   0%|          | 0/52 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/52 [00:02<01:54,  2.25s/it][A
Training:   4%|▍         | 2/52 [00:02<00:49,  1.01it/s][A
Training:   6%|▌         | 3/52 [00:02<00:29,  1.68it/s][A
Training:  10%|▉         | 5/52 [00:04<00:36,  1.30it/s][A
Training:  13%|█▎        | 7/52 [00:04<00:20,  2.16it/s][A
Training:  17%|█▋        | 9/52 [00:06<00:25,  1.66it/s][A
Training:  19%|█▉        | 10/52 [00:06<00:20,  2.02it/s][A
Training:  21%|██        | 11/52 [00:06<00:16,  2.45it/s][A
Training:  23%|██▎       | 12/52 [00:06<00:13,  2.91it/s][A
Training:  25%|██▌       | 13/52 [00:08<00:25,  1.52it/s][A
Training:  31%|███       | 16/52 [00:08<00:11,  3.04it/s][A
Training:  35%|███▍      | 18/52 [00:09<00:17,  1.99it/s][A
Training:  38%|███▊      | 20/52 [00:09<00:11,  2.77it/s][A
Training:  42%|████▏     | 22/52 [00:11<00:14,  2.01it/s][A
Training:  44%|████▍     | 23/52 [00:11<00:12,  2.35it/s][A
Training:  48%|████▊     | 25/52 [00:1

Epoch: 16/89 - Loss: 3.0255 - Accuracy: 0.9459



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:02<00:14,  2.40s/it][A
 43%|████▎     | 3/7 [00:02<00:02,  1.46it/s][A
100%|██████████| 7/7 [00:04<00:00,  1.64it/s][A
Epochs:  18%|█▊        | 16/89 [07:27<34:12, 28.12s/it]

Val Loss: 3.3086 - Val Accuracy: 0.9437



Training:   0%|          | 0/52 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/52 [00:02<01:55,  2.26s/it][A
Training:   4%|▍         | 2/52 [00:02<00:53,  1.07s/it][A
Training:   6%|▌         | 3/52 [00:02<00:30,  1.59it/s][A
Training:  10%|▉         | 5/52 [00:03<00:30,  1.56it/s][A
Training:  12%|█▏        | 6/52 [00:04<00:26,  1.77it/s][A
Training:  15%|█▌        | 8/52 [00:04<00:15,  2.87it/s][A
Training:  17%|█▋        | 9/52 [00:05<00:23,  1.82it/s][A
Training:  19%|█▉        | 10/52 [00:05<00:21,  2.00it/s][A
Training:  21%|██        | 11/52 [00:06<00:16,  2.54it/s][A
Training:  23%|██▎       | 12/52 [00:06<00:12,  3.15it/s][A
Training:  25%|██▌       | 13/52 [00:07<00:25,  1.54it/s][A
Training:  27%|██▋       | 14/52 [00:07<00:19,  1.99it/s][A
Training:  29%|██▉       | 15/52 [00:07<00:14,  2.56it/s][A
Training:  33%|███▎      | 17/52 [00:09<00:18,  1.91it/s][A
Training:  35%|███▍      | 18/52 [00:09<00:15,  2.24it/s][A
Training:  37%|███▋      | 19/52 [00:09

Epoch: 17/89 - Loss: 2.8962 - Accuracy: 0.9472



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:02<00:13,  2.29s/it][A
 29%|██▊       | 2/7 [00:02<00:05,  1.01s/it][A
 57%|█████▋    | 4/7 [00:02<00:01,  2.45it/s][A
100%|██████████| 7/7 [00:04<00:00,  1.66it/s][A
Epochs:  19%|█▉        | 17/89 [07:56<34:01, 28.36s/it]

Val Loss: 3.5860 - Val Accuracy: 0.9384



Training:   0%|          | 0/52 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/52 [00:02<02:06,  2.48s/it][A
Training:   6%|▌         | 3/52 [00:02<00:34,  1.43it/s][A
Training:  10%|▉         | 5/52 [00:04<00:33,  1.39it/s][A
Training:  13%|█▎        | 7/52 [00:04<00:20,  2.20it/s][A
Training:  15%|█▌        | 8/52 [00:04<00:16,  2.66it/s][A
Training:  17%|█▋        | 9/52 [00:06<00:30,  1.42it/s][A
Training:  25%|██▌       | 13/52 [00:08<00:22,  1.73it/s][A
Training:  29%|██▉       | 15/52 [00:08<00:16,  2.30it/s][A
Training:  31%|███       | 16/52 [00:08<00:13,  2.66it/s][A
Training:  33%|███▎      | 17/52 [00:09<00:20,  1.74it/s][A
Training:  37%|███▋      | 19/52 [00:09<00:12,  2.56it/s][A
Training:  38%|███▊      | 20/52 [00:10<00:10,  2.92it/s][A
Training:  40%|████      | 21/52 [00:11<00:19,  1.60it/s][A
Training:  44%|████▍     | 23/52 [00:11<00:11,  2.45it/s][A
Training:  48%|████▊     | 25/52 [00:13<00:13,  1.94it/s][A
Training:  50%|█████     | 26/52 [00:1

Epoch: 18/89 - Loss: 3.1245 - Accuracy: 0.9429



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:02<00:13,  2.26s/it][A
 29%|██▊       | 2/7 [00:02<00:05,  1.01s/it][A
100%|██████████| 7/7 [00:04<00:00,  1.72it/s][A
Epochs:  20%|██        | 18/89 [08:24<33:17, 28.14s/it]

Val Loss: 4.5081 - Val Accuracy: 0.9190



Training:   0%|          | 0/52 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/52 [00:01<01:37,  1.92s/it][A
Training:   4%|▍         | 2/52 [00:02<00:42,  1.16it/s][A
Training:   6%|▌         | 3/52 [00:02<00:25,  1.95it/s][A
Training:   8%|▊         | 4/52 [00:02<00:16,  2.83it/s][A
Training:  10%|▉         | 5/52 [00:03<00:35,  1.34it/s][A
Training:  12%|█▏        | 6/52 [00:03<00:24,  1.89it/s][A
Training:  15%|█▌        | 8/52 [00:03<00:12,  3.40it/s][A
Training:  19%|█▉        | 10/52 [00:05<00:21,  1.99it/s][A
Training:  23%|██▎       | 12/52 [00:05<00:13,  2.86it/s][A
Training:  25%|██▌       | 13/52 [00:07<00:22,  1.71it/s][A
Training:  27%|██▋       | 14/52 [00:07<00:18,  2.11it/s][A
Training:  29%|██▉       | 15/52 [00:07<00:15,  2.40it/s][A
Training:  31%|███       | 16/52 [00:07<00:12,  2.94it/s][A
Training:  33%|███▎      | 17/52 [00:08<00:19,  1.75it/s][A
Training:  35%|███▍      | 18/52 [00:09<00:15,  2.14it/s][A
Training:  37%|███▋      | 19/52 [00:09

Epoch: 19/89 - Loss: 3.0954 - Accuracy: 0.9438



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:11,  1.97s/it][A
 29%|██▊       | 2/7 [00:02<00:05,  1.01s/it][A
 71%|███████▏  | 5/7 [00:03<00:01,  1.60it/s][A
100%|██████████| 7/7 [00:03<00:00,  1.77it/s][A
Epochs:  21%|██▏       | 19/89 [08:52<32:43, 28.05s/it]

Val Loss: 3.9647 - Val Accuracy: 0.9320



Training:   0%|          | 0/52 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/52 [00:02<01:53,  2.23s/it][A
Training:   6%|▌         | 3/52 [00:02<00:30,  1.61it/s][A
Training:  10%|▉         | 5/52 [00:04<00:34,  1.35it/s][A
Training:  15%|█▌        | 8/52 [00:04<00:16,  2.71it/s][A
Training:  19%|█▉        | 10/52 [00:06<00:23,  1.79it/s][A
Training:  23%|██▎       | 12/52 [00:06<00:16,  2.44it/s][A
Training:  27%|██▋       | 14/52 [00:07<00:21,  1.81it/s][A
Training:  33%|███▎      | 17/52 [00:09<00:20,  1.73it/s][A
Training:  37%|███▋      | 19/52 [00:09<00:14,  2.27it/s][A
Training:  38%|███▊      | 20/52 [00:10<00:12,  2.59it/s][A
Training:  40%|████      | 21/52 [00:11<00:18,  1.68it/s][A
Training:  44%|████▍     | 23/52 [00:11<00:12,  2.39it/s][A
Training:  48%|████▊     | 25/52 [00:13<00:14,  1.90it/s][A
Training:  52%|█████▏    | 27/52 [00:13<00:10,  2.38it/s][A
Training:  54%|█████▍    | 28/52 [00:13<00:08,  2.73it/s][A
Training:  56%|█████▌    | 29/52 [00

Epoch: 20/89 - Loss: 3.1178 - Accuracy: 0.9418



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:02<00:13,  2.27s/it][A
 43%|████▎     | 3/7 [00:02<00:02,  1.56it/s][A
100%|██████████| 7/7 [00:03<00:00,  1.83it/s][A
Epochs:  22%|██▏       | 20/89 [09:20<32:13, 28.02s/it]

Val Loss: 4.6537 - Val Accuracy: 0.9223



Training:   0%|          | 0/52 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/52 [00:02<01:53,  2.22s/it][A
Training:   4%|▍         | 2/52 [00:02<00:49,  1.00it/s][A
Training:   6%|▌         | 3/52 [00:02<00:29,  1.66it/s][A
Training:   8%|▊         | 4/52 [00:02<00:19,  2.47it/s][A
Training:  10%|▉         | 5/52 [00:03<00:30,  1.55it/s][A
Training:  12%|█▏        | 6/52 [00:03<00:22,  2.00it/s][A
Training:  13%|█▎        | 7/52 [00:04<00:16,  2.67it/s][A
Training:  15%|█▌        | 8/52 [00:04<00:15,  2.85it/s][A
Training:  17%|█▋        | 9/52 [00:05<00:27,  1.54it/s][A
Training:  19%|█▉        | 10/52 [00:05<00:20,  2.06it/s][A
Training:  23%|██▎       | 12/52 [00:05<00:12,  3.23it/s][A
Training:  25%|██▌       | 13/52 [00:07<00:24,  1.57it/s][A
Training:  29%|██▉       | 15/52 [00:07<00:15,  2.46it/s][A
Training:  31%|███       | 16/52 [00:07<00:12,  2.93it/s][A
Training:  33%|███▎      | 17/52 [00:09<00:21,  1.61it/s][A
Training:  38%|███▊      | 20/52 [00:09<0

Epoch: 21/89 - Loss: 2.9313 - Accuracy: 0.9452



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:02<00:12,  2.07s/it][A
 29%|██▊       | 2/7 [00:02<00:05,  1.10s/it][A
 71%|███████▏  | 5/7 [00:03<00:01,  1.69it/s][A
100%|██████████| 7/7 [00:04<00:00,  1.74it/s][A
Epochs:  24%|██▎       | 21/89 [09:48<31:43, 28.00s/it]

Val Loss: 3.6508 - Val Accuracy: 0.9384



Training:   0%|          | 0/52 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/52 [00:02<02:03,  2.42s/it][A
Training:   4%|▍         | 2/52 [00:02<00:52,  1.05s/it][A
Training:   6%|▌         | 3/52 [00:02<00:30,  1.60it/s][A
Training:   8%|▊         | 4/52 [00:02<00:20,  2.35it/s][A
Training:  10%|▉         | 5/52 [00:04<00:37,  1.25it/s][A
Training:  13%|█▎        | 7/52 [00:04<00:19,  2.28it/s][A
Training:  17%|█▋        | 9/52 [00:06<00:26,  1.62it/s][A
Training:  21%|██        | 11/52 [00:06<00:17,  2.40it/s][A
Training:  23%|██▎       | 12/52 [00:06<00:14,  2.84it/s][A
Training:  25%|██▌       | 13/52 [00:07<00:24,  1.60it/s][A
Training:  27%|██▋       | 14/52 [00:08<00:18,  2.01it/s][A
Training:  31%|███       | 16/52 [00:08<00:12,  2.83it/s][A
Training:  33%|███▎      | 17/52 [00:09<00:20,  1.72it/s][A
Training:  38%|███▊      | 20/52 [00:10<00:12,  2.62it/s][A
Training:  40%|████      | 21/52 [00:11<00:17,  1.80it/s][A
Training:  42%|████▏     | 22/52 [00:11

Epoch: 22/89 - Loss: 2.8477 - Accuracy: 0.9470



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:02<00:12,  2.10s/it][A
 57%|█████▋    | 4/7 [00:02<00:01,  2.28it/s][A
100%|██████████| 7/7 [00:03<00:00,  1.76it/s][A
Epochs:  25%|██▍       | 22/89 [10:16<31:16, 28.01s/it]

Val Loss: 3.6444 - Val Accuracy: 0.9352



Training:   0%|          | 0/52 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/52 [00:02<01:49,  2.15s/it][A
Training:   6%|▌         | 3/52 [00:02<00:33,  1.48it/s][A
Training:  10%|▉         | 5/52 [00:04<00:33,  1.38it/s][A
Training:  13%|█▎        | 7/52 [00:04<00:21,  2.11it/s][A
Training:  15%|█▌        | 8/52 [00:04<00:17,  2.56it/s][A
Training:  17%|█▋        | 9/52 [00:05<00:29,  1.47it/s][A
Training:  19%|█▉        | 10/52 [00:06<00:22,  1.88it/s][A
Training:  21%|██        | 11/52 [00:06<00:17,  2.28it/s][A
Training:  23%|██▎       | 12/52 [00:06<00:14,  2.85it/s][A
Training:  25%|██▌       | 13/52 [00:07<00:25,  1.56it/s][A
Training:  29%|██▉       | 15/52 [00:07<00:14,  2.47it/s][A
Training:  33%|███▎      | 17/52 [00:09<00:18,  1.93it/s][A
Training:  37%|███▋      | 19/52 [00:09<00:11,  2.76it/s][A
Training:  38%|███▊      | 20/52 [00:09<00:10,  3.15it/s][A
Training:  40%|████      | 21/52 [00:11<00:19,  1.62it/s][A
Training:  44%|████▍     | 23/52 [00:1

Epoch: 23/89 - Loss: 2.7856 - Accuracy: 0.9481



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:02<00:12,  2.01s/it][A
 43%|████▎     | 3/7 [00:02<00:02,  1.73it/s][A
100%|██████████| 7/7 [00:03<00:00,  1.80it/s][A
Epochs:  26%|██▌       | 23/89 [10:43<30:44, 27.95s/it]

Val Loss: 3.4791 - Val Accuracy: 0.9402



Training:   0%|          | 0/52 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/52 [00:02<01:50,  2.16s/it][A
Training:   6%|▌         | 3/52 [00:02<00:30,  1.63it/s][A
Training:  10%|▉         | 5/52 [00:03<00:33,  1.39it/s][A
Training:  15%|█▌        | 8/52 [00:04<00:17,  2.51it/s][A
Training:  17%|█▋        | 9/52 [00:05<00:25,  1.71it/s][A
Training:  19%|█▉        | 10/52 [00:05<00:21,  1.93it/s][A
Training:  23%|██▎       | 12/52 [00:06<00:13,  2.87it/s][A
Training:  25%|██▌       | 13/52 [00:07<00:21,  1.82it/s][A
Training:  27%|██▋       | 14/52 [00:07<00:18,  2.08it/s][A
Training:  31%|███       | 16/52 [00:07<00:12,  2.93it/s][A
Training:  33%|███▎      | 17/52 [00:09<00:18,  1.89it/s][A
Training:  35%|███▍      | 18/52 [00:09<00:15,  2.22it/s][A
Training:  37%|███▋      | 19/52 [00:09<00:12,  2.66it/s][A
Training:  38%|███▊      | 20/52 [00:09<00:10,  3.01it/s][A
Training:  40%|████      | 21/52 [00:10<00:17,  1.82it/s][A
Training:  42%|████▏     | 22/52 [00:

Epoch: 24/89 - Loss: 2.7895 - Accuracy: 0.9488



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:11,  1.97s/it][A
 29%|██▊       | 2/7 [00:02<00:05,  1.07s/it][A
 57%|█████▋    | 4/7 [00:02<00:01,  2.19it/s][A
 71%|███████▏  | 5/7 [00:03<00:01,  1.53it/s][A
100%|██████████| 7/7 [00:03<00:00,  1.75it/s][A
Epochs:  27%|██▋       | 24/89 [11:11<30:10, 27.85s/it]

Val Loss: 4.0596 - Val Accuracy: 0.9318



Training:   0%|          | 0/52 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/52 [00:02<01:48,  2.13s/it][A
Training:   4%|▍         | 2/52 [00:02<00:47,  1.05it/s][A
Training:   6%|▌         | 3/52 [00:02<00:29,  1.67it/s][A
Training:  10%|▉         | 5/52 [00:04<00:33,  1.40it/s][A
Training:  12%|█▏        | 6/52 [00:04<00:25,  1.81it/s][A
Training:  13%|█▎        | 7/52 [00:04<00:20,  2.24it/s][A
Training:  15%|█▌        | 8/52 [00:04<00:15,  2.86it/s][A
Training:  17%|█▋        | 9/52 [00:05<00:25,  1.67it/s][A
Training:  21%|██        | 11/52 [00:05<00:15,  2.62it/s][A
Training:  23%|██▎       | 12/52 [00:06<00:15,  2.55it/s][A
Training:  25%|██▌       | 13/52 [00:07<00:22,  1.72it/s][A
Training:  27%|██▋       | 14/52 [00:07<00:17,  2.12it/s][A
Training:  31%|███       | 16/52 [00:08<00:14,  2.47it/s][A
Training:  33%|███▎      | 17/52 [00:09<00:17,  1.98it/s][A
Training:  35%|███▍      | 18/52 [00:09<00:14,  2.35it/s][A
Training:  38%|███▊      | 20/52 [00:10<

Epoch: 25/89 - Loss: 2.9613 - Accuracy: 0.9459



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:02<00:14,  2.42s/it][A
 43%|████▎     | 3/7 [00:02<00:02,  1.47it/s][A
100%|██████████| 7/7 [00:04<00:00,  1.68it/s][A
Epochs:  28%|██▊       | 25/89 [11:39<29:53, 28.02s/it]

Val Loss: 5.2117 - Val Accuracy: 0.9123



Training:   0%|          | 0/52 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/52 [00:02<02:00,  2.36s/it][A
Training:   6%|▌         | 3/52 [00:02<00:32,  1.49it/s][A
Training:   8%|▊         | 4/52 [00:02<00:25,  1.92it/s][A
Training:  10%|▉         | 5/52 [00:04<00:37,  1.25it/s][A
Training:  12%|█▏        | 6/52 [00:04<00:28,  1.62it/s][A
Training:  13%|█▎        | 7/52 [00:04<00:20,  2.17it/s][A
Training:  15%|█▌        | 8/52 [00:04<00:17,  2.51it/s][A
Training:  17%|█▋        | 9/52 [00:05<00:24,  1.75it/s][A
Training:  19%|█▉        | 10/52 [00:05<00:19,  2.11it/s][A
Training:  23%|██▎       | 12/52 [00:06<00:14,  2.82it/s][A
Training:  25%|██▌       | 13/52 [00:07<00:18,  2.06it/s][A
Training:  27%|██▋       | 14/52 [00:07<00:16,  2.33it/s][A
Training:  29%|██▉       | 15/52 [00:07<00:13,  2.84it/s][A
Training:  31%|███       | 16/52 [00:08<00:15,  2.35it/s][A
Training:  33%|███▎      | 17/52 [00:09<00:17,  1.96it/s][A
Training:  35%|███▍      | 18/52 [00:09<

Epoch: 26/89 - Loss: 2.9010 - Accuracy: 0.9468



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:02<00:13,  2.27s/it][A
 71%|███████▏  | 5/7 [00:03<00:01,  1.49it/s][A
100%|██████████| 7/7 [00:04<00:00,  1.69it/s][A
Epochs:  29%|██▉       | 26/89 [12:07<29:13, 27.84s/it]

Val Loss: 3.6915 - Val Accuracy: 0.9358



Training:   0%|          | 0/52 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/52 [00:02<01:51,  2.19s/it][A
Training:   4%|▍         | 2/52 [00:02<00:51,  1.04s/it][A
Training:   8%|▊         | 4/52 [00:02<00:20,  2.35it/s][A
Training:  10%|▉         | 5/52 [00:03<00:33,  1.40it/s][A
Training:  13%|█▎        | 7/52 [00:04<00:18,  2.44it/s][A
Training:  17%|█▋        | 9/52 [00:05<00:25,  1.69it/s][A
Training:  21%|██        | 11/52 [00:05<00:16,  2.43it/s][A
Training:  25%|██▌       | 13/52 [00:07<00:22,  1.76it/s][A
Training:  29%|██▉       | 15/52 [00:07<00:14,  2.48it/s][A
Training:  31%|███       | 16/52 [00:07<00:12,  2.84it/s][A
Training:  33%|███▎      | 17/52 [00:09<00:19,  1.75it/s][A
Training:  37%|███▋      | 19/52 [00:09<00:12,  2.59it/s][A
Training:  38%|███▊      | 20/52 [00:09<00:10,  3.07it/s][A
Training:  40%|████      | 21/52 [00:11<00:18,  1.69it/s][A
Training:  42%|████▏     | 22/52 [00:11<00:14,  2.01it/s][A
Training:  44%|████▍     | 23/52 [00:1

Epoch: 27/89 - Loss: 2.8837 - Accuracy: 0.9463



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:02<00:12,  2.14s/it][A
 43%|████▎     | 3/7 [00:02<00:02,  1.65it/s][A
 57%|█████▋    | 4/7 [00:02<00:01,  2.28it/s][A
100%|██████████| 7/7 [00:04<00:00,  1.73it/s][A
Epochs:  30%|███       | 27/89 [12:35<28:52, 27.95s/it]

Val Loss: 3.2549 - Val Accuracy: 0.9421



Training:   0%|          | 0/52 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/52 [00:02<01:54,  2.25s/it][A
Training:   6%|▌         | 3/52 [00:02<00:32,  1.50it/s][A
Training:   8%|▊         | 4/52 [00:02<00:22,  2.10it/s][A
Training:  10%|▉         | 5/52 [00:03<00:35,  1.34it/s][A
Training:  13%|█▎        | 7/52 [00:03<00:18,  2.44it/s][A
Training:  17%|█▋        | 9/52 [00:05<00:25,  1.71it/s][A
Training:  19%|█▉        | 10/52 [00:05<00:20,  2.08it/s][A
Training:  23%|██▎       | 12/52 [00:05<00:13,  3.07it/s][A
Training:  25%|██▌       | 13/52 [00:07<00:21,  1.85it/s][A
Training:  29%|██▉       | 15/52 [00:07<00:14,  2.58it/s][A
Training:  33%|███▎      | 17/52 [00:08<00:17,  1.98it/s][A
Training:  35%|███▍      | 18/52 [00:09<00:15,  2.23it/s][A
Training:  40%|████      | 21/52 [00:10<00:14,  2.21it/s][A
Training:  42%|████▏     | 22/52 [00:10<00:12,  2.40it/s][A
Training:  46%|████▌     | 24/52 [00:10<00:08,  3.36it/s][A
Training:  48%|████▊     | 25/52 [00:1

Epoch: 28/89 - Loss: 2.8463 - Accuracy: 0.9484



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:02<00:14,  2.41s/it][A
 43%|████▎     | 3/7 [00:02<00:02,  1.46it/s][A
100%|██████████| 7/7 [00:04<00:00,  1.62it/s][A
Epochs:  31%|███▏      | 28/89 [13:03<28:25, 27.96s/it]

Val Loss: 4.2755 - Val Accuracy: 0.9310



Training:   0%|          | 0/52 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/52 [00:02<02:02,  2.41s/it][A
Training:   6%|▌         | 3/52 [00:02<00:32,  1.50it/s][A
Training:  10%|▉         | 5/52 [00:04<00:36,  1.30it/s][A
Training:  12%|█▏        | 6/52 [00:04<00:27,  1.68it/s][A
Training:  15%|█▌        | 8/52 [00:04<00:16,  2.67it/s][A
Training:  17%|█▋        | 9/52 [00:05<00:24,  1.73it/s][A
Training:  19%|█▉        | 10/52 [00:05<00:20,  2.08it/s][A
Training:  21%|██        | 11/52 [00:06<00:18,  2.27it/s][A
Training:  23%|██▎       | 12/52 [00:06<00:14,  2.81it/s][A
Training:  25%|██▌       | 13/52 [00:07<00:21,  1.80it/s][A
Training:  27%|██▋       | 14/52 [00:07<00:16,  2.25it/s][A
Training:  29%|██▉       | 15/52 [00:08<00:15,  2.44it/s][A
Training:  31%|███       | 16/52 [00:08<00:11,  3.03it/s][A
Training:  33%|███▎      | 17/52 [00:09<00:18,  1.90it/s][A
Training:  35%|███▍      | 18/52 [00:09<00:15,  2.13it/s][A
Training:  37%|███▋      | 19/52 [00:0

Epoch: 29/89 - Loss: 2.9080 - Accuracy: 0.9469



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:02<00:13,  2.22s/it][A
 29%|██▊       | 2/7 [00:02<00:05,  1.02s/it][A
 57%|█████▋    | 4/7 [00:02<00:01,  2.38it/s][A
100%|██████████| 7/7 [00:04<00:00,  1.72it/s][A
Epochs:  33%|███▎      | 29/89 [13:32<28:09, 28.17s/it]

Val Loss: 3.6679 - Val Accuracy: 0.9426



Training:   0%|          | 0/52 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/52 [00:02<01:51,  2.19s/it][A
Training:   4%|▍         | 2/52 [00:02<00:51,  1.03s/it][A
Training:   6%|▌         | 3/52 [00:02<00:31,  1.53it/s][A
Training:  10%|▉         | 5/52 [00:04<00:32,  1.44it/s][A
Training:  12%|█▏        | 6/52 [00:04<00:24,  1.86it/s][A
Training:  13%|█▎        | 7/52 [00:04<00:18,  2.41it/s][A
Training:  17%|█▋        | 9/52 [00:05<00:24,  1.76it/s][A
Training:  21%|██        | 11/52 [00:06<00:15,  2.65it/s][A
Training:  23%|██▎       | 12/52 [00:06<00:12,  3.15it/s][A
Training:  25%|██▌       | 13/52 [00:07<00:23,  1.66it/s][A
Training:  29%|██▉       | 15/52 [00:07<00:14,  2.53it/s][A
Training:  33%|███▎      | 17/52 [00:09<00:18,  1.89it/s][A
Training:  37%|███▋      | 19/52 [00:09<00:12,  2.69it/s][A
Training:  38%|███▊      | 20/52 [00:09<00:10,  3.10it/s][A
Training:  40%|████      | 21/52 [00:11<00:20,  1.54it/s][A
Training:  44%|████▍     | 23/52 [00:11

Epoch: 30/89 - Loss: 3.0670 - Accuracy: 0.9440



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:02<00:12,  2.12s/it][A
 43%|████▎     | 3/7 [00:02<00:02,  1.67it/s][A
100%|██████████| 7/7 [00:03<00:00,  1.80it/s][A
Epochs:  34%|███▎      | 30/89 [13:59<27:29, 27.97s/it]

Val Loss: 3.3932 - Val Accuracy: 0.9407



Training:   0%|          | 0/52 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/52 [00:02<01:46,  2.09s/it][A
Training:   4%|▍         | 2/52 [00:02<00:46,  1.08it/s][A
Training:   8%|▊         | 4/52 [00:02<00:18,  2.54it/s][A
Training:  10%|▉         | 5/52 [00:04<00:36,  1.28it/s][A
Training:  15%|█▌        | 8/52 [00:04<00:15,  2.80it/s][A
Training:  19%|█▉        | 10/52 [00:05<00:22,  1.88it/s][A
Training:  25%|██▌       | 13/52 [00:07<00:20,  1.93it/s][A
Training:  27%|██▋       | 14/52 [00:07<00:17,  2.22it/s][A
Training:  31%|███       | 16/52 [00:07<00:11,  3.01it/s][A
Training:  33%|███▎      | 17/52 [00:09<00:19,  1.82it/s][A
Training:  37%|███▋      | 19/52 [00:09<00:13,  2.52it/s][A
Training:  40%|████      | 21/52 [00:10<00:16,  1.87it/s][A
Training:  44%|████▍     | 23/52 [00:11<00:11,  2.55it/s][A
Training:  48%|████▊     | 25/52 [00:12<00:13,  1.99it/s][A
Training:  52%|█████▏    | 27/52 [00:12<00:09,  2.71it/s][A
Training:  56%|█████▌    | 29/52 [00:

Epoch: 31/89 - Loss: 2.6681 - Accuracy: 0.9500



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:02<00:15,  2.51s/it][A
 29%|██▊       | 2/7 [00:02<00:05,  1.12s/it][A
 43%|████▎     | 3/7 [00:02<00:02,  1.53it/s][A
100%|██████████| 7/7 [00:04<00:00,  1.61it/s][A
Epochs:  35%|███▍      | 31/89 [14:27<27:05, 28.02s/it]

Val Loss: 3.5886 - Val Accuracy: 0.9381



Training:   0%|          | 0/52 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/52 [00:02<01:58,  2.32s/it][A
Training:   4%|▍         | 2/52 [00:02<00:51,  1.03s/it][A
Training:   8%|▊         | 4/52 [00:02<00:20,  2.33it/s][A
Training:  10%|▉         | 5/52 [00:04<00:35,  1.31it/s][A
Training:  13%|█▎        | 7/52 [00:04<00:20,  2.23it/s][A
Training:  17%|█▋        | 9/52 [00:05<00:25,  1.70it/s][A
Training:  21%|██        | 11/52 [00:05<00:16,  2.52it/s][A
Training:  23%|██▎       | 12/52 [00:06<00:13,  2.98it/s][A
Training:  25%|██▌       | 13/52 [00:07<00:24,  1.59it/s][A
Training:  27%|██▋       | 14/52 [00:07<00:19,  1.98it/s][A
Training:  33%|███▎      | 17/52 [00:09<00:20,  1.73it/s][A
Training:  38%|███▊      | 20/52 [00:09<00:11,  2.87it/s][A
Training:  42%|████▏     | 22/52 [00:11<00:15,  1.96it/s][A
Training:  46%|████▌     | 24/52 [00:11<00:10,  2.57it/s][A
Training:  48%|████▊     | 25/52 [00:13<00:14,  1.82it/s][A
Training:  54%|█████▍    | 28/52 [00:1

Epoch: 32/89 - Loss: 2.8791 - Accuracy: 0.9465



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:02<00:14,  2.39s/it][A
 43%|████▎     | 3/7 [00:02<00:02,  1.48it/s][A
100%|██████████| 7/7 [00:04<00:00,  1.62it/s][A
Epochs:  36%|███▌      | 32/89 [14:56<26:47, 28.20s/it]

Val Loss: 3.7728 - Val Accuracy: 0.9317



Training:   0%|          | 0/52 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/52 [00:02<02:12,  2.59s/it][A
Training:   6%|▌         | 3/52 [00:02<00:35,  1.39it/s][A
Training:   8%|▊         | 4/52 [00:02<00:25,  1.89it/s][A
Training:  10%|▉         | 5/52 [00:04<00:40,  1.16it/s][A
Training:  13%|█▎        | 7/52 [00:04<00:22,  2.01it/s][A
Training:  15%|█▌        | 8/52 [00:04<00:17,  2.52it/s][A
Training:  17%|█▋        | 9/52 [00:06<00:31,  1.36it/s][A
Training:  21%|██        | 11/52 [00:06<00:17,  2.28it/s][A
Training:  25%|██▌       | 13/52 [00:08<00:22,  1.74it/s][A
Training:  29%|██▉       | 15/52 [00:08<00:14,  2.57it/s][A
Training:  33%|███▎      | 17/52 [00:09<00:19,  1.79it/s][A
Training:  37%|███▋      | 19/52 [00:10<00:13,  2.50it/s][A
Training:  40%|████      | 21/52 [00:11<00:16,  1.89it/s][A
Training:  44%|████▍     | 23/52 [00:11<00:11,  2.60it/s][A
Training:  48%|████▊     | 25/52 [00:13<00:13,  1.97it/s][A
Training:  50%|█████     | 26/52 [00:13

Epoch: 33/89 - Loss: 2.8877 - Accuracy: 0.9453



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:02<00:12,  2.16s/it][A
 43%|████▎     | 3/7 [00:02<00:02,  1.62it/s][A
100%|██████████| 7/7 [00:04<00:00,  1.72it/s][A
Epochs:  37%|███▋      | 33/89 [15:25<26:25, 28.31s/it]

Val Loss: 3.6506 - Val Accuracy: 0.9362



Training:   0%|          | 0/52 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/52 [00:02<02:00,  2.36s/it][A
Training:   4%|▍         | 2/52 [00:02<00:51,  1.04s/it][A
Training:   8%|▊         | 4/52 [00:02<00:20,  2.29it/s][A
Training:  10%|▉         | 5/52 [00:04<00:36,  1.28it/s][A
Training:  13%|█▎        | 7/52 [00:04<00:20,  2.23it/s][A
Training:  17%|█▋        | 9/52 [00:05<00:25,  1.70it/s][A
Training:  19%|█▉        | 10/52 [00:06<00:20,  2.07it/s][A
Training:  23%|██▎       | 12/52 [00:06<00:13,  3.02it/s][A
Training:  25%|██▌       | 13/52 [00:07<00:21,  1.84it/s][A
Training:  31%|███       | 16/52 [00:07<00:10,  3.31it/s][A
Training:  35%|███▍      | 18/52 [00:09<00:14,  2.35it/s][A
Training:  38%|███▊      | 20/52 [00:09<00:09,  3.21it/s][A
Training:  42%|████▏     | 22/52 [00:10<00:13,  2.20it/s][A
Training:  46%|████▌     | 24/52 [00:10<00:09,  3.01it/s][A
Training:  50%|█████     | 26/52 [00:12<00:12,  2.11it/s][A
Training:  52%|█████▏    | 27/52 [00:1

Epoch: 34/89 - Loss: 2.8194 - Accuracy: 0.9457



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:02<00:12,  2.05s/it][A
 43%|████▎     | 3/7 [00:02<00:02,  1.70it/s][A
 57%|█████▋    | 4/7 [00:02<00:01,  2.19it/s][A
100%|██████████| 7/7 [00:03<00:00,  1.88it/s][A
Epochs:  38%|███▊      | 34/89 [15:52<25:38, 27.98s/it]

Val Loss: 3.4456 - Val Accuracy: 0.9410



Training:   0%|          | 0/52 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/52 [00:02<02:02,  2.40s/it][A
Training:   4%|▍         | 2/52 [00:02<00:53,  1.06s/it][A
Training:   8%|▊         | 4/52 [00:02<00:20,  2.33it/s][A
Training:  12%|█▏        | 6/52 [00:04<00:27,  1.66it/s][A
Training:  17%|█▋        | 9/52 [00:06<00:26,  1.65it/s][A
Training:  21%|██        | 11/52 [00:06<00:17,  2.34it/s][A
Training:  25%|██▌       | 13/52 [00:08<00:22,  1.71it/s][A
Training:  29%|██▉       | 15/52 [00:08<00:15,  2.36it/s][A
Training:  33%|███▎      | 17/52 [00:09<00:18,  1.93it/s][A
Training:  35%|███▍      | 18/52 [00:09<00:15,  2.26it/s][A
Training:  40%|████      | 21/52 [00:11<00:14,  2.11it/s][A
Training:  48%|████▊     | 25/52 [00:12<00:12,  2.22it/s][A
Training:  50%|█████     | 26/52 [00:13<00:10,  2.48it/s][A
Training:  52%|█████▏    | 27/52 [00:13<00:09,  2.77it/s][A
Training:  56%|█████▌    | 29/52 [00:14<00:11,  2.01it/s][A
Training:  58%|█████▊    | 30/52 [00:

Epoch: 35/89 - Loss: 2.7397 - Accuracy: 0.9490



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:02<00:14,  2.43s/it][A
 43%|████▎     | 3/7 [00:02<00:02,  1.49it/s][A
 71%|███████▏  | 5/7 [00:03<00:01,  1.53it/s][A
 86%|████████▌ | 6/7 [00:04<00:00,  1.86it/s][A
100%|██████████| 7/7 [00:04<00:00,  1.61it/s][A
Epochs:  39%|███▉      | 35/89 [16:20<25:12, 28.01s/it]

Val Loss: 3.6364 - Val Accuracy: 0.9362



Training:   0%|          | 0/52 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/52 [00:02<01:53,  2.23s/it][A
Training:   4%|▍         | 2/52 [00:02<00:49,  1.02it/s][A
Training:   8%|▊         | 4/52 [00:02<00:20,  2.29it/s][A
Training:  10%|▉         | 5/52 [00:04<00:36,  1.29it/s][A
Training:  12%|█▏        | 6/52 [00:04<00:27,  1.64it/s][A
Training:  13%|█▎        | 7/52 [00:04<00:20,  2.19it/s][A
Training:  15%|█▌        | 8/52 [00:04<00:15,  2.77it/s][A
Training:  17%|█▋        | 9/52 [00:05<00:28,  1.51it/s][A
Training:  19%|█▉        | 10/52 [00:06<00:23,  1.79it/s][A
Training:  23%|██▎       | 12/52 [00:06<00:12,  3.08it/s][A
Training:  25%|██▌       | 13/52 [00:07<00:22,  1.72it/s][A
Training:  27%|██▋       | 14/52 [00:07<00:18,  2.11it/s][A
Training:  31%|███       | 16/52 [00:07<00:10,  3.41it/s][A
Training:  35%|███▍      | 18/52 [00:09<00:15,  2.18it/s][A
Training:  37%|███▋      | 19/52 [00:09<00:12,  2.60it/s][A
Training:  40%|████      | 21/52 [00:11<

Epoch: 36/89 - Loss: 2.7421 - Accuracy: 0.9492



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:02<00:12,  2.08s/it][A
 29%|██▊       | 2/7 [00:02<00:04,  1.07it/s][A
 57%|█████▋    | 4/7 [00:02<00:01,  2.48it/s][A
 71%|███████▏  | 5/7 [00:03<00:01,  1.42it/s][A
100%|██████████| 7/7 [00:04<00:00,  1.74it/s][A
Epochs:  40%|████      | 36/89 [16:48<24:51, 28.14s/it]

Val Loss: 3.4367 - Val Accuracy: 0.9412



Training:   0%|          | 0/52 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/52 [00:02<01:49,  2.15s/it][A
Training:   4%|▍         | 2/52 [00:02<00:48,  1.02it/s][A
Training:  10%|▉         | 5/52 [00:04<00:32,  1.45it/s][A
Training:  13%|█▎        | 7/52 [00:04<00:19,  2.26it/s][A
Training:  17%|█▋        | 9/52 [00:05<00:25,  1.69it/s][A
Training:  19%|█▉        | 10/52 [00:06<00:20,  2.02it/s][A
Training:  23%|██▎       | 12/52 [00:06<00:13,  3.03it/s][A
Training:  27%|██▋       | 14/52 [00:07<00:19,  2.00it/s][A
Training:  29%|██▉       | 15/52 [00:07<00:15,  2.37it/s][A
Training:  33%|███▎      | 17/52 [00:09<00:18,  1.86it/s][A
Training:  35%|███▍      | 18/52 [00:09<00:15,  2.17it/s][A
Training:  37%|███▋      | 19/52 [00:09<00:12,  2.63it/s][A
Training:  40%|████      | 21/52 [00:10<00:15,  2.02it/s][A
Training:  42%|████▏     | 22/52 [00:11<00:14,  2.11it/s][A
Training:  44%|████▍     | 23/52 [00:11<00:11,  2.55it/s][A
Training:  46%|████▌     | 24/52 [00:

Epoch: 37/89 - Loss: 2.7812 - Accuracy: 0.9472



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:02<00:14,  2.34s/it][A
 29%|██▊       | 2/7 [00:02<00:05,  1.03s/it][A
 57%|█████▋    | 4/7 [00:02<00:01,  2.29it/s][A
100%|██████████| 7/7 [00:04<00:00,  1.70it/s][A
Epochs:  42%|████▏     | 37/89 [17:17<24:29, 28.25s/it]

Val Loss: 3.5178 - Val Accuracy: 0.9397



Training:   0%|          | 0/52 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/52 [00:02<02:05,  2.46s/it][A
Training:   4%|▍         | 2/52 [00:02<00:54,  1.09s/it][A
Training:   8%|▊         | 4/52 [00:02<00:21,  2.20it/s][A
Training:  10%|▉         | 5/52 [00:04<00:33,  1.42it/s][A
Training:  13%|█▎        | 7/52 [00:04<00:18,  2.50it/s][A
Training:  17%|█▋        | 9/52 [00:05<00:23,  1.85it/s][A
Training:  21%|██        | 11/52 [00:05<00:15,  2.73it/s][A
Training:  25%|██▌       | 13/52 [00:07<00:22,  1.72it/s][A
Training:  29%|██▉       | 15/52 [00:07<00:15,  2.38it/s][A
Training:  33%|███▎      | 17/52 [00:09<00:18,  1.94it/s][A
Training:  37%|███▋      | 19/52 [00:09<00:12,  2.69it/s][A
Training:  40%|████      | 21/52 [00:11<00:15,  2.01it/s][A
Training:  42%|████▏     | 22/52 [00:11<00:12,  2.32it/s][A
Training:  44%|████▍     | 23/52 [00:11<00:10,  2.74it/s][A
Training:  48%|████▊     | 25/52 [00:12<00:13,  2.00it/s][A
Training:  50%|█████     | 26/52 [00:1

Epoch: 38/89 - Loss: 2.7279 - Accuracy: 0.9478



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:02<00:14,  2.35s/it][A
 71%|███████▏  | 5/7 [00:04<00:01,  1.39it/s][A
100%|██████████| 7/7 [00:04<00:00,  1.61it/s][A
Epochs:  43%|████▎     | 38/89 [17:44<23:50, 28.04s/it]

Val Loss: 3.2761 - Val Accuracy: 0.9444



Training:   0%|          | 0/52 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/52 [00:02<02:17,  2.69s/it][A
Training:   4%|▍         | 2/52 [00:02<00:59,  1.20s/it][A
Training:   6%|▌         | 3/52 [00:02<00:34,  1.43it/s][A
Training:   8%|▊         | 4/52 [00:03<00:22,  2.15it/s][A
Training:  10%|▉         | 5/52 [00:04<00:37,  1.24it/s][A
Training:  13%|█▎        | 7/52 [00:04<00:20,  2.23it/s][A
Training:  17%|█▋        | 9/52 [00:06<00:24,  1.78it/s][A
Training:  21%|██        | 11/52 [00:06<00:15,  2.60it/s][A
Training:  23%|██▎       | 12/52 [00:06<00:13,  3.05it/s][A
Training:  25%|██▌       | 13/52 [00:07<00:23,  1.63it/s][A
Training:  27%|██▋       | 14/52 [00:08<00:18,  2.02it/s][A
Training:  31%|███       | 16/52 [00:08<00:11,  3.15it/s][A
Training:  33%|███▎      | 17/52 [00:09<00:19,  1.80it/s][A
Training:  37%|███▋      | 19/52 [00:09<00:12,  2.69it/s][A
Training:  40%|████      | 21/52 [00:11<00:16,  1.87it/s][A
Training:  42%|████▏     | 22/52 [00:11

Epoch: 39/89 - Loss: 2.6837 - Accuracy: 0.9493



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:02<00:13,  2.19s/it][A
 43%|████▎     | 3/7 [00:02<00:02,  1.58it/s][A
100%|██████████| 7/7 [00:04<00:00,  1.69it/s][A
Epochs:  44%|████▍     | 39/89 [18:13<23:24, 28.09s/it]

Val Loss: 3.9288 - Val Accuracy: 0.9318



Training:   0%|          | 0/52 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/52 [00:02<02:01,  2.38s/it][A
Training:   4%|▍         | 2/52 [00:02<00:52,  1.05s/it][A
Training:   6%|▌         | 3/52 [00:02<00:30,  1.59it/s][A
Training:   8%|▊         | 4/52 [00:02<00:20,  2.37it/s][A
Training:  10%|▉         | 5/52 [00:03<00:33,  1.40it/s][A
Training:  12%|█▏        | 6/52 [00:04<00:23,  1.97it/s][A
Training:  15%|█▌        | 8/52 [00:04<00:12,  3.48it/s][A
Training:  17%|█▋        | 9/52 [00:05<00:27,  1.56it/s][A
Training:  19%|█▉        | 10/52 [00:05<00:21,  1.99it/s][A
Training:  23%|██▎       | 12/52 [00:06<00:12,  3.11it/s][A
Training:  25%|██▌       | 13/52 [00:07<00:22,  1.75it/s][A
Training:  29%|██▉       | 15/52 [00:07<00:13,  2.73it/s][A
Training:  33%|███▎      | 17/52 [00:09<00:18,  1.86it/s][A
Training:  37%|███▋      | 19/52 [00:09<00:12,  2.71it/s][A
Training:  40%|████      | 21/52 [00:11<00:17,  1.81it/s][A
Training:  42%|████▏     | 22/52 [00:11<

Epoch: 40/89 - Loss: 2.5615 - Accuracy: 0.9509



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:02<00:14,  2.39s/it][A
 43%|████▎     | 3/7 [00:02<00:02,  1.47it/s][A
 57%|█████▋    | 4/7 [00:02<00:01,  2.07it/s][A
100%|██████████| 7/7 [00:04<00:00,  1.62it/s][A
Epochs:  45%|████▍     | 40/89 [18:41<23:01, 28.20s/it]

Val Loss: 3.6526 - Val Accuracy: 0.9365



Training:   0%|          | 0/52 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/52 [00:02<01:59,  2.34s/it][A
Training:   6%|▌         | 3/52 [00:02<00:34,  1.43it/s][A
Training:   8%|▊         | 4/52 [00:02<00:24,  1.99it/s][A
Training:  10%|▉         | 5/52 [00:04<00:39,  1.18it/s][A
Training:  12%|█▏        | 6/52 [00:04<00:28,  1.62it/s][A
Training:  13%|█▎        | 7/52 [00:04<00:20,  2.17it/s][A
Training:  17%|█▋        | 9/52 [00:05<00:24,  1.78it/s][A
Training:  21%|██        | 11/52 [00:06<00:14,  2.76it/s][A
Training:  25%|██▌       | 13/52 [00:07<00:19,  1.96it/s][A
Training:  27%|██▋       | 14/52 [00:07<00:17,  2.17it/s][A
Training:  29%|██▉       | 15/52 [00:07<00:14,  2.64it/s][A
Training:  31%|███       | 16/52 [00:08<00:11,  3.18it/s][A
Training:  33%|███▎      | 17/52 [00:09<00:19,  1.81it/s][A
Training:  35%|███▍      | 18/52 [00:09<00:16,  2.06it/s][A
Training:  37%|███▋      | 19/52 [00:09<00:12,  2.64it/s][A
Training:  40%|████      | 21/52 [00:11

Epoch: 41/89 - Loss: 2.6688 - Accuracy: 0.9488



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:02<00:12,  2.11s/it][A
 29%|██▊       | 2/7 [00:02<00:04,  1.07it/s][A
 43%|████▎     | 3/7 [00:02<00:02,  1.75it/s][A
100%|██████████| 7/7 [00:04<00:00,  1.75it/s][A
Epochs:  46%|████▌     | 41/89 [19:09<22:27, 28.08s/it]

Val Loss: 3.3842 - Val Accuracy: 0.9402



Training:   0%|          | 0/52 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/52 [00:02<01:47,  2.10s/it][A
Training:   6%|▌         | 3/52 [00:02<00:30,  1.63it/s][A
Training:   8%|▊         | 4/52 [00:02<00:21,  2.21it/s][A
Training:  10%|▉         | 5/52 [00:03<00:35,  1.32it/s][A
Training:  12%|█▏        | 6/52 [00:03<00:25,  1.81it/s][A
Training:  13%|█▎        | 7/52 [00:04<00:19,  2.31it/s][A
Training:  15%|█▌        | 8/52 [00:04<00:14,  3.03it/s][A
Training:  17%|█▋        | 9/52 [00:05<00:30,  1.39it/s][A
Training:  21%|██        | 11/52 [00:05<00:17,  2.37it/s][A
Training:  23%|██▎       | 12/52 [00:06<00:13,  2.92it/s][A
Training:  25%|██▌       | 13/52 [00:07<00:25,  1.55it/s][A
Training:  29%|██▉       | 15/52 [00:07<00:15,  2.36it/s][A
Training:  31%|███       | 16/52 [00:07<00:12,  2.84it/s][A
Training:  33%|███▎      | 17/52 [00:09<00:21,  1.59it/s][A
Training:  35%|███▍      | 18/52 [00:09<00:16,  2.03it/s][A
Training:  37%|███▋      | 19/52 [00:09<

Epoch: 42/89 - Loss: 2.6449 - Accuracy: 0.9500



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:02<00:14,  2.40s/it][A
 43%|████▎     | 3/7 [00:02<00:02,  1.51it/s][A
100%|██████████| 7/7 [00:04<00:00,  1.74it/s][A
Epochs:  47%|████▋     | 42/89 [19:37<22:00, 28.09s/it]

Val Loss: 3.4862 - Val Accuracy: 0.9407



Training:   0%|          | 0/52 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/52 [00:02<02:04,  2.44s/it][A
Training:   4%|▍         | 2/52 [00:02<00:54,  1.08s/it][A
Training:   6%|▌         | 3/52 [00:02<00:32,  1.53it/s][A
Training:  10%|▉         | 5/52 [00:03<00:30,  1.55it/s][A
Training:  12%|█▏        | 6/52 [00:04<00:22,  2.02it/s][A
Training:  13%|█▎        | 7/52 [00:04<00:17,  2.60it/s][A
Training:  15%|█▌        | 8/52 [00:04<00:13,  3.29it/s][A
Training:  17%|█▋        | 9/52 [00:05<00:29,  1.46it/s][A
Training:  19%|█▉        | 10/52 [00:06<00:23,  1.80it/s][A
Training:  23%|██▎       | 12/52 [00:06<00:13,  2.90it/s][A
Training:  25%|██▌       | 13/52 [00:07<00:22,  1.76it/s][A
Training:  27%|██▋       | 14/52 [00:07<00:17,  2.23it/s][A
Training:  31%|███       | 16/52 [00:07<00:10,  3.49it/s][A
Training:  33%|███▎      | 17/52 [00:09<00:20,  1.68it/s][A
Training:  35%|███▍      | 18/52 [00:09<00:16,  2.09it/s][A
Training:  38%|███▊      | 20/52 [00:09<

Epoch: 43/89 - Loss: 2.5780 - Accuracy: 0.9502



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:02<00:14,  2.36s/it][A
 29%|██▊       | 2/7 [00:02<00:05,  1.04s/it][A
 57%|█████▋    | 4/7 [00:02<00:01,  2.27it/s][A
 71%|███████▏  | 5/7 [00:03<00:01,  1.49it/s][A
100%|██████████| 7/7 [00:04<00:00,  1.72it/s][A
Epochs:  48%|████▊     | 43/89 [20:05<21:26, 27.98s/it]

Val Loss: 3.7182 - Val Accuracy: 0.9373



Training:   0%|          | 0/52 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/52 [00:02<02:01,  2.38s/it][A
Training:   6%|▌         | 3/52 [00:02<00:32,  1.49it/s][A
Training:  10%|▉         | 5/52 [00:04<00:36,  1.28it/s][A
Training:  12%|█▏        | 6/52 [00:04<00:27,  1.67it/s][A
Training:  15%|█▌        | 8/52 [00:04<00:16,  2.67it/s][A
Training:  17%|█▋        | 9/52 [00:06<00:29,  1.48it/s][A
Training:  21%|██        | 11/52 [00:06<00:18,  2.22it/s][A
Training:  25%|██▌       | 13/52 [00:07<00:21,  1.78it/s][A
Training:  29%|██▉       | 15/52 [00:08<00:15,  2.44it/s][A
Training:  31%|███       | 16/52 [00:08<00:12,  2.84it/s][A
Training:  33%|███▎      | 17/52 [00:09<00:20,  1.69it/s][A
Training:  35%|███▍      | 18/52 [00:09<00:16,  2.07it/s][A
Training:  40%|████      | 21/52 [00:11<00:16,  1.94it/s][A
Training:  44%|████▍     | 23/52 [00:11<00:10,  2.73it/s][A
Training:  48%|████▊     | 25/52 [00:13<00:14,  1.92it/s][A
Training:  52%|█████▏    | 27/52 [00:1

Epoch: 44/89 - Loss: 2.6177 - Accuracy: 0.9491



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:02<00:13,  2.26s/it][A
 43%|████▎     | 3/7 [00:02<00:02,  1.60it/s][A
100%|██████████| 7/7 [00:04<00:00,  1.70it/s][A
Epochs:  49%|████▉     | 44/89 [20:33<21:04, 28.10s/it]

Val Loss: 3.8246 - Val Accuracy: 0.9315



Training:   0%|          | 0/52 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/52 [00:02<01:55,  2.26s/it][A
Training:   6%|▌         | 3/52 [00:02<00:37,  1.32it/s][A
Training:  10%|▉         | 5/52 [00:04<00:33,  1.38it/s][A
Training:  13%|█▎        | 7/52 [00:04<00:21,  2.05it/s][A
Training:  17%|█▋        | 9/52 [00:05<00:24,  1.72it/s][A
Training:  21%|██        | 11/52 [00:06<00:19,  2.14it/s][A
Training:  25%|██▌       | 13/52 [00:07<00:19,  2.02it/s][A
Training:  27%|██▋       | 14/52 [00:07<00:16,  2.28it/s][A
Training:  29%|██▉       | 15/52 [00:08<00:16,  2.29it/s][A
Training:  31%|███       | 16/52 [00:08<00:13,  2.74it/s][A
Training:  33%|███▎      | 17/52 [00:09<00:18,  1.86it/s][A
Training:  35%|███▍      | 18/52 [00:09<00:14,  2.31it/s][A
Training:  37%|███▋      | 19/52 [00:10<00:17,  1.94it/s][A
Training:  38%|███▊      | 20/52 [00:10<00:12,  2.46it/s][A
Training:  40%|████      | 21/52 [00:11<00:16,  1.91it/s][A
Training:  44%|████▍     | 23/52 [00:

Epoch: 45/89 - Loss: 2.6020 - Accuracy: 0.9505



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:02<00:13,  2.26s/it][A
 57%|█████▋    | 4/7 [00:02<00:01,  2.19it/s][A
100%|██████████| 7/7 [00:03<00:00,  1.77it/s][A
Epochs:  51%|█████     | 45/89 [21:01<20:39, 28.16s/it]

Val Loss: 3.6274 - Val Accuracy: 0.9410



Training:   0%|          | 0/52 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/52 [00:02<01:50,  2.16s/it][A
Training:   4%|▍         | 2/52 [00:02<00:48,  1.02it/s][A
Training:   6%|▌         | 3/52 [00:02<00:31,  1.58it/s][A
Training:   8%|▊         | 4/52 [00:02<00:20,  2.34it/s][A
Training:  10%|▉         | 5/52 [00:03<00:33,  1.39it/s][A
Training:  13%|█▎        | 7/52 [00:04<00:21,  2.06it/s][A
Training:  15%|█▌        | 8/52 [00:04<00:16,  2.62it/s][A
Training:  17%|█▋        | 9/52 [00:05<00:23,  1.81it/s][A
Training:  21%|██        | 11/52 [00:06<00:17,  2.37it/s][A
Training:  25%|██▌       | 13/52 [00:07<00:19,  1.96it/s][A
Training:  29%|██▉       | 15/52 [00:07<00:13,  2.66it/s][A
Training:  33%|███▎      | 17/52 [00:09<00:17,  1.97it/s][A
Training:  37%|███▋      | 19/52 [00:09<00:12,  2.67it/s][A
Training:  40%|████      | 21/52 [00:10<00:15,  1.97it/s][A
Training:  44%|████▍     | 23/52 [00:11<00:11,  2.62it/s][A
Training:  46%|████▌     | 24/52 [00:11<

Epoch: 46/89 - Loss: 2.6931 - Accuracy: 0.9474



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:02<00:14,  2.38s/it][A
 57%|█████▋    | 4/7 [00:02<00:01,  2.09it/s][A
100%|██████████| 7/7 [00:04<00:00,  1.66it/s][A
Epochs:  52%|█████▏    | 46/89 [21:29<20:09, 28.12s/it]

Val Loss: 3.4145 - Val Accuracy: 0.9423



Training:   0%|          | 0/52 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/52 [00:02<01:44,  2.05s/it][A
Training:   4%|▍         | 2/52 [00:02<00:48,  1.02it/s][A
Training:   8%|▊         | 4/52 [00:02<00:19,  2.47it/s][A
Training:  10%|▉         | 5/52 [00:03<00:33,  1.40it/s][A
Training:  13%|█▎        | 7/52 [00:04<00:20,  2.16it/s][A
Training:  17%|█▋        | 9/52 [00:05<00:25,  1.66it/s][A
Training:  21%|██        | 11/52 [00:06<00:17,  2.35it/s][A
Training:  23%|██▎       | 12/52 [00:06<00:14,  2.79it/s][A
Training:  25%|██▌       | 13/52 [00:07<00:23,  1.68it/s][A
Training:  29%|██▉       | 15/52 [00:07<00:14,  2.61it/s][A
Training:  33%|███▎      | 17/52 [00:09<00:21,  1.62it/s][A
Training:  37%|███▋      | 19/52 [00:09<00:14,  2.30it/s][A
Training:  40%|████      | 21/52 [00:11<00:17,  1.75it/s][A
Training:  46%|████▌     | 24/52 [00:11<00:09,  2.81it/s][A
Training:  50%|█████     | 26/52 [00:13<00:13,  1.94it/s][A
Training:  54%|█████▍    | 28/52 [00:1

Epoch: 47/89 - Loss: 2.5091 - Accuracy: 0.9517



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:02<00:13,  2.24s/it][A
 29%|██▊       | 2/7 [00:02<00:04,  1.00it/s][A
 57%|█████▋    | 4/7 [00:02<00:01,  2.43it/s][A
100%|██████████| 7/7 [00:04<00:00,  1.69it/s][A
Epochs:  53%|█████▎    | 47/89 [21:58<19:41, 28.14s/it]

Val Loss: 4.0200 - Val Accuracy: 0.9302



Training:   0%|          | 0/52 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/52 [00:02<01:43,  2.03s/it][A
Training:   4%|▍         | 2/52 [00:02<00:49,  1.01it/s][A
Training:  10%|▉         | 5/52 [00:03<00:30,  1.56it/s][A
Training:  12%|█▏        | 6/52 [00:04<00:28,  1.59it/s][A
Training:  15%|█▌        | 8/52 [00:04<00:17,  2.56it/s][A
Training:  17%|█▋        | 9/52 [00:05<00:22,  1.91it/s][A
Training:  19%|█▉        | 10/52 [00:06<00:23,  1.81it/s][A
Training:  25%|██▌       | 13/52 [00:07<00:20,  1.94it/s][A
Training:  27%|██▋       | 14/52 [00:08<00:19,  1.99it/s][A
Training:  29%|██▉       | 15/52 [00:08<00:15,  2.38it/s][A
Training:  33%|███▎      | 17/52 [00:09<00:16,  2.14it/s][A
Training:  35%|███▍      | 18/52 [00:09<00:16,  2.07it/s][A
Training:  37%|███▋      | 19/52 [00:09<00:13,  2.53it/s][A
Training:  40%|████      | 21/52 [00:10<00:13,  2.23it/s][A
Training:  42%|████▏     | 22/52 [00:11<00:15,  1.89it/s][A
Training:  46%|████▌     | 24/52 [00:1

Epoch: 48/89 - Loss: 2.6105 - Accuracy: 0.9495



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:02<00:15,  2.52s/it][A
 57%|█████▋    | 4/7 [00:02<00:01,  1.92it/s][A
100%|██████████| 7/7 [00:04<00:00,  1.67it/s][A
Epochs:  54%|█████▍    | 48/89 [22:26<19:16, 28.21s/it]

Val Loss: 4.2492 - Val Accuracy: 0.9331



Training:   0%|          | 0/52 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/52 [00:02<01:54,  2.25s/it][A
Training:   8%|▊         | 4/52 [00:02<00:22,  2.18it/s][A
Training:  12%|█▏        | 6/52 [00:04<00:29,  1.58it/s][A
Training:  17%|█▋        | 9/52 [00:05<00:26,  1.63it/s][A
Training:  25%|██▌       | 13/52 [00:07<00:19,  1.97it/s][A
Training:  29%|██▉       | 15/52 [00:07<00:15,  2.44it/s][A
Training:  31%|███       | 16/52 [00:07<00:13,  2.75it/s][A
Training:  33%|███▎      | 17/52 [00:09<00:18,  1.90it/s][A
Training:  37%|███▋      | 19/52 [00:09<00:13,  2.36it/s][A
Training:  38%|███▊      | 20/52 [00:09<00:11,  2.68it/s][A
Training:  40%|████      | 21/52 [00:10<00:17,  1.74it/s][A
Training:  44%|████▍     | 23/52 [00:11<00:11,  2.54it/s][A
Training:  48%|████▊     | 25/52 [00:12<00:14,  1.80it/s][A
Training:  52%|█████▏    | 27/52 [00:13<00:09,  2.54it/s][A
Training:  56%|█████▌    | 29/52 [00:14<00:11,  1.97it/s][A
Training:  60%|█████▉    | 31/52 [00

Epoch: 49/89 - Loss: 2.9434 - Accuracy: 0.9442



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:02<00:13,  2.26s/it][A
 29%|██▊       | 2/7 [00:02<00:04,  1.00it/s][A
 57%|█████▋    | 4/7 [00:02<00:01,  2.26it/s][A
 71%|███████▏  | 5/7 [00:03<00:01,  1.60it/s][A
100%|██████████| 7/7 [00:03<00:00,  1.78it/s][A
Epochs:  55%|█████▌    | 49/89 [22:53<18:34, 27.87s/it]

Val Loss: 3.4308 - Val Accuracy: 0.9404



Training:   0%|          | 0/52 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/52 [00:01<01:39,  1.95s/it][A
Training:   6%|▌         | 3/52 [00:02<00:27,  1.78it/s][A
Training:  10%|▉         | 5/52 [00:03<00:33,  1.42it/s][A
Training:  13%|█▎        | 7/52 [00:03<00:19,  2.31it/s][A
Training:  15%|█▌        | 8/52 [00:04<00:17,  2.57it/s][A
Training:  17%|█▋        | 9/52 [00:05<00:30,  1.43it/s][A
Training:  21%|██        | 11/52 [00:05<00:18,  2.24it/s][A
Training:  23%|██▎       | 12/52 [00:06<00:15,  2.59it/s][A
Training:  25%|██▌       | 13/52 [00:07<00:25,  1.54it/s][A
Training:  27%|██▋       | 14/52 [00:07<00:19,  1.91it/s][A
Training:  31%|███       | 16/52 [00:07<00:11,  3.02it/s][A
Training:  33%|███▎      | 17/52 [00:09<00:20,  1.73it/s][A
Training:  37%|███▋      | 19/52 [00:09<00:12,  2.66it/s][A
Training:  38%|███▊      | 20/52 [00:09<00:10,  3.13it/s][A
Training:  40%|████      | 21/52 [00:11<00:19,  1.60it/s][A
Training:  42%|████▏     | 22/52 [00:1

Epoch: 50/89 - Loss: 2.5144 - Accuracy: 0.9498



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:11,  1.91s/it][A
 29%|██▊       | 2/7 [00:02<00:04,  1.09it/s][A
 43%|████▎     | 3/7 [00:02<00:02,  1.63it/s][A
 71%|███████▏  | 5/7 [00:03<00:01,  1.71it/s][A
100%|██████████| 7/7 [00:04<00:00,  1.75it/s][A
Epochs:  56%|█████▌    | 50/89 [23:21<18:06, 27.86s/it]

Val Loss: 3.4052 - Val Accuracy: 0.9399



Training:   0%|          | 0/52 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/52 [00:02<01:57,  2.31s/it][A
Training:   6%|▌         | 3/52 [00:02<00:32,  1.50it/s][A
Training:  10%|▉         | 5/52 [00:04<00:34,  1.37it/s][A
Training:  13%|█▎        | 7/52 [00:04<00:20,  2.22it/s][A
Training:  17%|█▋        | 9/52 [00:05<00:24,  1.77it/s][A
Training:  25%|██▌       | 13/52 [00:07<00:19,  2.01it/s][A
Training:  29%|██▉       | 15/52 [00:07<00:14,  2.61it/s][A
Training:  33%|███▎      | 17/52 [00:09<00:17,  2.01it/s][A
Training:  35%|███▍      | 18/52 [00:09<00:14,  2.27it/s][A
Training:  38%|███▊      | 20/52 [00:09<00:10,  3.16it/s][A
Training:  40%|████      | 21/52 [00:10<00:16,  1.86it/s][A
Training:  42%|████▏     | 22/52 [00:11<00:13,  2.18it/s][A
Training:  46%|████▌     | 24/52 [00:11<00:09,  3.10it/s][A
Training:  48%|████▊     | 25/52 [00:12<00:14,  1.84it/s][A
Training:  50%|█████     | 26/52 [00:12<00:11,  2.21it/s][A
Training:  56%|█████▌    | 29/52 [00:

Epoch: 51/89 - Loss: 2.5193 - Accuracy: 0.9501



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:02<00:14,  2.43s/it][A
 43%|████▎     | 3/7 [00:02<00:02,  1.48it/s][A
100%|██████████| 7/7 [00:04<00:00,  1.68it/s][A
Epochs:  57%|█████▋    | 51/89 [23:48<17:33, 27.73s/it]

Val Loss: 3.2540 - Val Accuracy: 0.9436



Training:   0%|          | 0/52 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/52 [00:02<01:50,  2.17s/it][A
Training:   4%|▍         | 2/52 [00:02<00:53,  1.06s/it][A
Training:   8%|▊         | 4/52 [00:02<00:21,  2.23it/s][A
Training:  10%|▉         | 5/52 [00:04<00:34,  1.36it/s][A
Training:  12%|█▏        | 6/52 [00:04<00:28,  1.63it/s][A
Training:  13%|█▎        | 7/52 [00:04<00:20,  2.17it/s][A
Training:  15%|█▌        | 8/52 [00:04<00:15,  2.76it/s][A
Training:  17%|█▋        | 9/52 [00:05<00:26,  1.64it/s][A
Training:  19%|█▉        | 10/52 [00:06<00:24,  1.75it/s][A
Training:  23%|██▎       | 12/52 [00:06<00:13,  2.86it/s][A
Training:  25%|██▌       | 13/52 [00:07<00:20,  1.94it/s][A
Training:  27%|██▋       | 14/52 [00:08<00:20,  1.82it/s][A
Training:  29%|██▉       | 15/52 [00:08<00:16,  2.30it/s][A
Training:  33%|███▎      | 17/52 [00:09<00:18,  1.93it/s][A
Training:  35%|███▍      | 18/52 [00:10<00:18,  1.88it/s][A
Training:  40%|████      | 21/52 [00:11<

Epoch: 52/89 - Loss: 2.4600 - Accuracy: 0.9513



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:02<00:14,  2.36s/it][A
 43%|████▎     | 3/7 [00:02<00:02,  1.49it/s][A
 71%|███████▏  | 5/7 [00:04<00:01,  1.40it/s][A
100%|██████████| 7/7 [00:04<00:00,  1.63it/s][A
Epochs:  58%|█████▊    | 52/89 [24:17<17:16, 28.01s/it]

Val Loss: 3.2402 - Val Accuracy: 0.9415



Training:   0%|          | 0/52 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/52 [00:02<01:56,  2.29s/it][A
Training:   4%|▍         | 2/52 [00:02<00:52,  1.04s/it][A
Training:   6%|▌         | 3/52 [00:02<00:30,  1.60it/s][A
Training:   8%|▊         | 4/52 [00:02<00:21,  2.28it/s][A
Training:  10%|▉         | 5/52 [00:04<00:39,  1.20it/s][A
Training:  13%|█▎        | 7/52 [00:04<00:19,  2.29it/s][A
Training:  15%|█▌        | 8/52 [00:04<00:16,  2.61it/s][A
Training:  17%|█▋        | 9/52 [00:05<00:27,  1.58it/s][A
Training:  21%|██        | 11/52 [00:06<00:15,  2.59it/s][A
Training:  23%|██▎       | 12/52 [00:06<00:14,  2.84it/s][A
Training:  25%|██▌       | 13/52 [00:07<00:26,  1.47it/s][A
Training:  29%|██▉       | 15/52 [00:08<00:15,  2.37it/s][A
Training:  31%|███       | 16/52 [00:08<00:12,  2.81it/s][A
Training:  33%|███▎      | 17/52 [00:09<00:22,  1.56it/s][A
Training:  37%|███▋      | 19/52 [00:09<00:13,  2.48it/s][A
Training:  40%|████      | 21/52 [00:11<

Epoch: 53/89 - Loss: 2.5902 - Accuracy: 0.9501



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:02<00:12,  2.02s/it][A
 43%|████▎     | 3/7 [00:02<00:02,  1.78it/s][A
100%|██████████| 7/7 [00:04<00:00,  1.73it/s][A
Epochs:  60%|█████▉    | 53/89 [24:44<16:39, 27.77s/it]

Val Loss: 3.4618 - Val Accuracy: 0.9388



Training:   0%|          | 0/52 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/52 [00:02<01:49,  2.14s/it][A
Training:   6%|▌         | 3/52 [00:02<00:29,  1.66it/s][A
Training:   8%|▊         | 4/52 [00:02<00:21,  2.23it/s][A
Training:  10%|▉         | 5/52 [00:03<00:37,  1.25it/s][A
Training:  12%|█▏        | 6/52 [00:04<00:26,  1.71it/s][A
Training:  13%|█▎        | 7/52 [00:04<00:20,  2.15it/s][A
Training:  17%|█▋        | 9/52 [00:05<00:24,  1.73it/s][A
Training:  19%|█▉        | 10/52 [00:05<00:19,  2.14it/s][A
Training:  25%|██▌       | 13/52 [00:07<00:21,  1.80it/s][A
Training:  29%|██▉       | 15/52 [00:07<00:14,  2.49it/s][A
Training:  31%|███       | 16/52 [00:08<00:12,  2.90it/s][A
Training:  33%|███▎      | 17/52 [00:09<00:18,  1.91it/s][A
Training:  35%|███▍      | 18/52 [00:09<00:14,  2.34it/s][A
Training:  37%|███▋      | 19/52 [00:09<00:12,  2.63it/s][A
Training:  38%|███▊      | 20/52 [00:09<00:09,  3.26it/s][A
Training:  40%|████      | 21/52 [00:11

Epoch: 54/89 - Loss: 2.5941 - Accuracy: 0.9500



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:11,  1.86s/it][A
 29%|██▊       | 2/7 [00:02<00:04,  1.06it/s][A
 57%|█████▋    | 4/7 [00:02<00:01,  2.55it/s][A
 71%|███████▏  | 5/7 [00:03<00:01,  1.59it/s][A
100%|██████████| 7/7 [00:03<00:00,  1.79it/s][A
Epochs:  61%|██████    | 54/89 [25:12<16:12, 27.79s/it]

Val Loss: 3.3685 - Val Accuracy: 0.9412



Training:   0%|          | 0/52 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/52 [00:02<01:52,  2.22s/it][A
Training:   4%|▍         | 2/52 [00:02<00:49,  1.01it/s][A
Training:   8%|▊         | 4/52 [00:02<00:20,  2.34it/s][A
Training:  10%|▉         | 5/52 [00:04<00:37,  1.26it/s][A
Training:  12%|█▏        | 6/52 [00:04<00:27,  1.67it/s][A
Training:  13%|█▎        | 7/52 [00:04<00:20,  2.18it/s][A
Training:  17%|█▋        | 9/52 [00:06<00:26,  1.62it/s][A
Training:  19%|█▉        | 10/52 [00:06<00:21,  1.99it/s][A
Training:  21%|██        | 11/52 [00:06<00:16,  2.49it/s][A
Training:  23%|██▎       | 12/52 [00:06<00:13,  3.06it/s][A
Training:  25%|██▌       | 13/52 [00:07<00:24,  1.56it/s][A
Training:  27%|██▋       | 14/52 [00:08<00:18,  2.03it/s][A
Training:  31%|███       | 16/52 [00:08<00:10,  3.41it/s][A
Training:  33%|███▎      | 17/52 [00:09<00:22,  1.57it/s][A
Training:  38%|███▊      | 20/52 [00:09<00:10,  3.04it/s][A
Training:  42%|████▏     | 22/52 [00:11

Epoch: 55/89 - Loss: 2.4505 - Accuracy: 0.9502



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:02<00:13,  2.31s/it][A
 71%|███████▏  | 5/7 [00:03<00:01,  1.47it/s][A
100%|██████████| 7/7 [00:04<00:00,  1.70it/s][A
Epochs:  62%|██████▏   | 55/89 [25:40<15:50, 27.96s/it]

Val Loss: 3.2485 - Val Accuracy: 0.9438



Training:   0%|          | 0/52 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/52 [00:02<02:05,  2.45s/it][A
Training:   4%|▍         | 2/52 [00:02<00:53,  1.07s/it][A
Training:  10%|▉         | 5/52 [00:04<00:31,  1.50it/s][A
Training:  12%|█▏        | 6/52 [00:04<00:24,  1.90it/s][A
Training:  13%|█▎        | 7/52 [00:04<00:19,  2.27it/s][A
Training:  15%|█▌        | 8/52 [00:04<00:15,  2.81it/s][A
Training:  17%|█▋        | 9/52 [00:05<00:27,  1.56it/s][A
Training:  19%|█▉        | 10/52 [00:06<00:21,  1.99it/s][A
Training:  21%|██        | 11/52 [00:06<00:17,  2.31it/s][A
Training:  23%|██▎       | 12/52 [00:06<00:13,  2.97it/s][A
Training:  25%|██▌       | 13/52 [00:07<00:22,  1.73it/s][A
Training:  29%|██▉       | 15/52 [00:08<00:18,  2.01it/s][A
Training:  33%|███▎      | 17/52 [00:09<00:18,  1.93it/s][A
Training:  37%|███▋      | 19/52 [00:10<00:15,  2.10it/s][A
Training:  38%|███▊      | 20/52 [00:10<00:12,  2.50it/s][A
Training:  40%|████      | 21/52 [00:11

Epoch: 56/89 - Loss: 2.5001 - Accuracy: 0.9526



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:02<00:13,  2.27s/it][A
100%|██████████| 7/7 [00:03<00:00,  1.75it/s][A
Epochs:  63%|██████▎   | 56/89 [26:08<15:18, 27.85s/it]

Val Loss: 3.4925 - Val Accuracy: 0.9391



Training:   0%|          | 0/52 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/52 [00:02<01:51,  2.19s/it][A
Training:   8%|▊         | 4/52 [00:02<00:22,  2.14it/s][A
Training:  10%|▉         | 5/52 [00:03<00:36,  1.27it/s][A
Training:  13%|█▎        | 7/52 [00:04<00:21,  2.13it/s][A
Training:  15%|█▌        | 8/52 [00:04<00:18,  2.34it/s][A
Training:  17%|█▋        | 9/52 [00:05<00:30,  1.42it/s][A
Training:  19%|█▉        | 10/52 [00:06<00:23,  1.82it/s][A
Training:  23%|██▎       | 12/52 [00:06<00:14,  2.85it/s][A
Training:  25%|██▌       | 13/52 [00:07<00:23,  1.68it/s][A
Training:  29%|██▉       | 15/52 [00:07<00:14,  2.57it/s][A
Training:  33%|███▎      | 17/52 [00:09<00:17,  1.95it/s][A
Training:  37%|███▋      | 19/52 [00:09<00:12,  2.66it/s][A
Training:  40%|████      | 21/52 [00:10<00:15,  2.03it/s][A
Training:  46%|████▌     | 24/52 [00:11<00:08,  3.28it/s][A
Training:  50%|█████     | 26/52 [00:12<00:11,  2.18it/s][A
Training:  52%|█████▏    | 27/52 [00:1

Epoch: 57/89 - Loss: 2.4541 - Accuracy: 0.9517



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:02<00:12,  2.08s/it][A
 29%|██▊       | 2/7 [00:02<00:05,  1.03s/it][A
 57%|█████▋    | 4/7 [00:02<00:01,  2.36it/s][A
 71%|███████▏  | 5/7 [00:03<00:01,  1.54it/s][A
100%|██████████| 7/7 [00:04<00:00,  1.62it/s][A
Epochs:  64%|██████▍   | 57/89 [26:35<14:46, 27.70s/it]

Val Loss: 3.3084 - Val Accuracy: 0.9407



Training:   0%|          | 0/52 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/52 [00:02<02:00,  2.37s/it][A
Training:   8%|▊         | 4/52 [00:02<00:22,  2.09it/s][A
Training:  12%|█▏        | 6/52 [00:04<00:29,  1.54it/s][A
Training:  13%|█▎        | 7/52 [00:04<00:23,  1.89it/s][A
Training:  15%|█▌        | 8/52 [00:04<00:18,  2.34it/s][A
Training:  17%|█▋        | 9/52 [00:05<00:29,  1.44it/s][A
Training:  25%|██▌       | 13/52 [00:07<00:21,  1.81it/s][A
Training:  31%|███       | 16/52 [00:07<00:12,  2.85it/s][A
Training:  35%|███▍      | 18/52 [00:09<00:15,  2.18it/s][A
Training:  37%|███▋      | 19/52 [00:09<00:14,  2.32it/s][A
Training:  40%|████      | 21/52 [00:11<00:15,  1.97it/s][A
Training:  44%|████▍     | 23/52 [00:11<00:12,  2.28it/s][A
Training:  48%|████▊     | 25/52 [00:12<00:12,  2.13it/s][A
Training:  52%|█████▏    | 27/52 [00:12<00:09,  2.72it/s][A
Training:  56%|█████▌    | 29/52 [00:14<00:10,  2.10it/s][A
Training:  60%|█████▉    | 31/52 [00:1

Epoch: 58/89 - Loss: 2.6750 - Accuracy: 0.9477



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:02<00:15,  2.50s/it][A
 43%|████▎     | 3/7 [00:02<00:02,  1.40it/s][A
100%|██████████| 7/7 [00:04<00:00,  1.66it/s][A
Epochs:  65%|██████▌   | 58/89 [27:02<14:13, 27.52s/it]

Val Loss: 3.5608 - Val Accuracy: 0.9376



Training:   0%|          | 0/52 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/52 [00:02<01:51,  2.19s/it][A
Training:   4%|▍         | 2/52 [00:02<00:58,  1.17s/it][A
Training:   6%|▌         | 3/52 [00:02<00:34,  1.42it/s][A
Training:  10%|▉         | 5/52 [00:03<00:29,  1.58it/s][A
Training:  12%|█▏        | 6/52 [00:04<00:28,  1.63it/s][A
Training:  15%|█▌        | 8/52 [00:04<00:16,  2.68it/s][A
Training:  17%|█▋        | 9/52 [00:05<00:24,  1.77it/s][A
Training:  19%|█▉        | 10/52 [00:06<00:21,  1.92it/s][A
Training:  23%|██▎       | 12/52 [00:06<00:12,  3.10it/s][A
Training:  25%|██▌       | 13/52 [00:07<00:21,  1.79it/s][A
Training:  27%|██▋       | 14/52 [00:07<00:18,  2.07it/s][A
Training:  29%|██▉       | 15/52 [00:08<00:14,  2.58it/s][A
Training:  31%|███       | 16/52 [00:08<00:11,  3.01it/s][A
Training:  33%|███▎      | 17/52 [00:09<00:18,  1.89it/s][A
Training:  35%|███▍      | 18/52 [00:09<00:18,  1.82it/s][A
Training:  38%|███▊      | 20/52 [00:10

Epoch: 59/89 - Loss: 2.4615 - Accuracy: 0.9500



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:02<00:15,  2.52s/it][A
 29%|██▊       | 2/7 [00:02<00:05,  1.10s/it][A
 57%|█████▋    | 4/7 [00:02<00:01,  2.13it/s][A
 71%|███████▏  | 5/7 [00:04<00:01,  1.37it/s][A
100%|██████████| 7/7 [00:04<00:00,  1.57it/s][A
Epochs:  66%|██████▋   | 59/89 [27:30<13:49, 27.66s/it]

Val Loss: 3.3805 - Val Accuracy: 0.9383



Training:   0%|          | 0/52 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/52 [00:02<01:53,  2.23s/it][A
Training:   4%|▍         | 2/52 [00:02<00:51,  1.03s/it][A
Training:   8%|▊         | 4/52 [00:02<00:21,  2.27it/s][A
Training:  10%|▉         | 5/52 [00:04<00:35,  1.34it/s][A
Training:  12%|█▏        | 6/52 [00:04<00:28,  1.62it/s][A
Training:  17%|█▋        | 9/52 [00:05<00:23,  1.86it/s][A
Training:  19%|█▉        | 10/52 [00:06<00:25,  1.67it/s][A
Training:  23%|██▎       | 12/52 [00:06<00:16,  2.45it/s][A
Training:  25%|██▌       | 13/52 [00:07<00:18,  2.05it/s][A
Training:  27%|██▋       | 14/52 [00:08<00:21,  1.74it/s][A
Training:  31%|███       | 16/52 [00:08<00:13,  2.66it/s][A
Training:  33%|███▎      | 17/52 [00:09<00:14,  2.37it/s][A
Training:  35%|███▍      | 18/52 [00:10<00:20,  1.70it/s][A
Training:  37%|███▋      | 19/52 [00:10<00:15,  2.15it/s][A
Training:  38%|███▊      | 20/52 [00:10<00:11,  2.68it/s][A
Training:  40%|████      | 21/52 [00:1

Epoch: 60/89 - Loss: 2.5412 - Accuracy: 0.9495



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:02<00:14,  2.40s/it][A
 43%|████▎     | 3/7 [00:02<00:02,  1.41it/s][A
100%|██████████| 7/7 [00:04<00:00,  1.69it/s][A
Epochs:  67%|██████▋   | 60/89 [27:59<13:30, 27.95s/it]

Val Loss: 3.4887 - Val Accuracy: 0.9347



Training:   0%|          | 0/52 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/52 [00:02<01:50,  2.16s/it][A
Training:   4%|▍         | 2/52 [00:02<00:53,  1.08s/it][A
Training:   8%|▊         | 4/52 [00:02<00:20,  2.29it/s][A
Training:  10%|▉         | 5/52 [00:03<00:29,  1.59it/s][A
Training:  12%|█▏        | 6/52 [00:03<00:23,  1.98it/s][A
Training:  15%|█▌        | 8/52 [00:04<00:13,  3.33it/s][A
Training:  17%|█▋        | 9/52 [00:05<00:27,  1.57it/s][A
Training:  19%|█▉        | 10/52 [00:05<00:21,  1.99it/s][A
Training:  21%|██        | 11/52 [00:05<00:16,  2.46it/s][A
Training:  23%|██▎       | 12/52 [00:06<00:13,  3.00it/s][A
Training:  25%|██▌       | 13/52 [00:07<00:25,  1.53it/s][A
Training:  27%|██▋       | 14/52 [00:07<00:18,  2.01it/s][A
Training:  29%|██▉       | 15/52 [00:07<00:14,  2.60it/s][A
Training:  31%|███       | 16/52 [00:07<00:11,  3.26it/s][A
Training:  33%|███▎      | 17/52 [00:09<00:22,  1.54it/s][A
Training:  37%|███▋      | 19/52 [00:09

Epoch: 61/89 - Loss: 2.3853 - Accuracy: 0.9527



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:02<00:14,  2.36s/it][A
 43%|████▎     | 3/7 [00:02<00:02,  1.49it/s][A
 71%|███████▏  | 5/7 [00:04<00:01,  1.40it/s][A
100%|██████████| 7/7 [00:04<00:00,  1.62it/s][A
Epochs:  69%|██████▊   | 61/89 [28:27<13:01, 27.92s/it]

Val Loss: 3.3937 - Val Accuracy: 0.9402



Training:   0%|          | 0/52 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/52 [00:02<02:05,  2.47s/it][A
Training:   4%|▍         | 2/52 [00:02<00:54,  1.09s/it][A
Training:   8%|▊         | 4/52 [00:02<00:22,  2.14it/s][A
Training:  10%|▉         | 5/52 [00:04<00:37,  1.25it/s][A
Training:  12%|█▏        | 6/52 [00:04<00:27,  1.70it/s][A
Training:  13%|█▎        | 7/52 [00:04<00:19,  2.26it/s][A
Training:  17%|█▋        | 9/52 [00:06<00:26,  1.60it/s][A
Training:  21%|██        | 11/52 [00:06<00:16,  2.43it/s][A
Training:  25%|██▌       | 13/52 [00:08<00:21,  1.80it/s][A
Training:  29%|██▉       | 15/52 [00:08<00:14,  2.58it/s][A
Training:  33%|███▎      | 17/52 [00:09<00:19,  1.79it/s][A
Training:  38%|███▊      | 20/52 [00:10<00:11,  2.89it/s][A
Training:  42%|████▏     | 22/52 [00:11<00:14,  2.03it/s][A
Training:  48%|████▊     | 25/52 [00:13<00:13,  2.00it/s][A
Training:  52%|█████▏    | 27/52 [00:13<00:09,  2.60it/s][A
Training:  56%|█████▌    | 29/52 [00:14

Epoch: 62/89 - Loss: 2.4604 - Accuracy: 0.9502



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:02<00:14,  2.41s/it][A
 29%|██▊       | 2/7 [00:02<00:05,  1.05s/it][A
 43%|████▎     | 3/7 [00:02<00:02,  1.59it/s][A
 71%|███████▏  | 5/7 [00:04<00:01,  1.47it/s][A
100%|██████████| 7/7 [00:04<00:00,  1.61it/s][A
Epochs:  70%|██████▉   | 62/89 [28:55<12:38, 28.09s/it]

Val Loss: 3.3116 - Val Accuracy: 0.9412



Training:   0%|          | 0/52 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/52 [00:02<02:06,  2.48s/it][A
Training:   6%|▌         | 3/52 [00:02<00:34,  1.43it/s][A
Training:  10%|▉         | 5/52 [00:04<00:35,  1.34it/s][A
Training:  13%|█▎        | 7/52 [00:04<00:20,  2.20it/s][A
Training:  15%|█▌        | 8/52 [00:04<00:16,  2.65it/s][A
Training:  17%|█▋        | 9/52 [00:06<00:30,  1.40it/s][A
Training:  21%|██        | 11/52 [00:06<00:18,  2.16it/s][A
Training:  25%|██▌       | 13/52 [00:08<00:23,  1.66it/s][A
Training:  29%|██▉       | 15/52 [00:08<00:17,  2.10it/s][A
Training:  31%|███       | 16/52 [00:08<00:14,  2.47it/s][A
Training:  33%|███▎      | 17/52 [00:09<00:20,  1.67it/s][A
Training:  37%|███▋      | 19/52 [00:10<00:13,  2.41it/s][A
Training:  40%|████      | 21/52 [00:11<00:16,  1.83it/s][A
Training:  42%|████▏     | 22/52 [00:11<00:13,  2.16it/s][A
Training:  46%|████▌     | 24/52 [00:12<00:08,  3.12it/s][A
Training:  48%|████▊     | 25/52 [00:1

Epoch: 63/89 - Loss: 2.4022 - Accuracy: 0.9520



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:02<00:13,  2.29s/it][A
 43%|████▎     | 3/7 [00:02<00:02,  1.56it/s][A
100%|██████████| 7/7 [00:04<00:00,  1.69it/s][A
Epochs:  71%|███████   | 63/89 [29:24<12:18, 28.39s/it]

Val Loss: 3.3326 - Val Accuracy: 0.9397



Training:   0%|          | 0/52 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/52 [00:02<01:51,  2.19s/it][A
Training:   4%|▍         | 2/52 [00:02<00:51,  1.03s/it][A
Training:   6%|▌         | 3/52 [00:02<00:30,  1.62it/s][A
Training:  10%|▉         | 5/52 [00:04<00:33,  1.41it/s][A
Training:  12%|█▏        | 6/52 [00:04<00:27,  1.67it/s][A
Training:  15%|█▌        | 8/52 [00:04<00:15,  2.79it/s][A
Training:  17%|█▋        | 9/52 [00:05<00:24,  1.76it/s][A
Training:  19%|█▉        | 10/52 [00:06<00:22,  1.86it/s][A
Training:  21%|██        | 11/52 [00:06<00:17,  2.38it/s][A
Training:  25%|██▌       | 13/52 [00:07<00:19,  1.99it/s][A
Training:  27%|██▋       | 14/52 [00:08<00:18,  2.01it/s][A
Training:  31%|███       | 16/52 [00:08<00:12,  2.99it/s][A
Training:  33%|███▎      | 17/52 [00:09<00:20,  1.74it/s][A
Training:  35%|███▍      | 18/52 [00:09<00:16,  2.07it/s][A
Training:  38%|███▊      | 20/52 [00:09<00:10,  3.19it/s][A
Training:  40%|████      | 21/52 [00:11

Epoch: 64/89 - Loss: 2.4759 - Accuracy: 0.9501



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:02<00:12,  2.10s/it][A
 29%|██▊       | 2/7 [00:02<00:05,  1.02s/it][A
 43%|████▎     | 3/7 [00:02<00:02,  1.63it/s][A
 71%|███████▏  | 5/7 [00:03<00:01,  1.61it/s][A
100%|██████████| 7/7 [00:04<00:00,  1.70it/s][A
Epochs:  72%|███████▏  | 64/89 [29:53<11:50, 28.43s/it]

Val Loss: 3.4124 - Val Accuracy: 0.9362



Training:   0%|          | 0/52 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/52 [00:02<02:03,  2.41s/it][A
Training:   4%|▍         | 2/52 [00:02<00:52,  1.06s/it][A
Training:   8%|▊         | 4/52 [00:02<00:20,  2.35it/s][A
Training:  12%|█▏        | 6/52 [00:04<00:30,  1.49it/s][A
Training:  15%|█▌        | 8/52 [00:04<00:19,  2.30it/s][A
Training:  17%|█▋        | 9/52 [00:06<00:28,  1.50it/s][A
Training:  19%|█▉        | 10/52 [00:06<00:22,  1.87it/s][A
Training:  21%|██        | 11/52 [00:06<00:17,  2.34it/s][A
Training:  25%|██▌       | 13/52 [00:07<00:22,  1.76it/s][A
Training:  29%|██▉       | 15/52 [00:08<00:14,  2.61it/s][A
Training:  31%|███       | 16/52 [00:08<00:11,  3.08it/s][A
Training:  33%|███▎      | 17/52 [00:09<00:19,  1.78it/s][A
Training:  37%|███▋      | 19/52 [00:09<00:11,  2.80it/s][A
Training:  40%|████      | 21/52 [00:11<00:15,  1.97it/s][A
Training:  42%|████▏     | 22/52 [00:11<00:12,  2.34it/s][A
Training:  44%|████▍     | 23/52 [00:1

Epoch: 65/89 - Loss: 2.3858 - Accuracy: 0.9512



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:02<00:14,  2.35s/it][A
 43%|████▎     | 3/7 [00:02<00:02,  1.49it/s][A
100%|██████████| 7/7 [00:04<00:00,  1.66it/s][A
Epochs:  73%|███████▎  | 65/89 [30:21<11:20, 28.35s/it]

Val Loss: 3.4001 - Val Accuracy: 0.9357



Training:   0%|          | 0/52 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/52 [00:02<01:57,  2.31s/it][A
Training:   4%|▍         | 2/52 [00:02<00:53,  1.07s/it][A
Training:   8%|▊         | 4/52 [00:02<00:21,  2.21it/s][A
Training:  10%|▉         | 5/52 [00:04<00:36,  1.30it/s][A
Training:  12%|█▏        | 6/52 [00:04<00:26,  1.71it/s][A
Training:  15%|█▌        | 8/52 [00:04<00:14,  2.94it/s][A
Training:  17%|█▋        | 9/52 [00:06<00:28,  1.51it/s][A
Training:  21%|██        | 11/52 [00:06<00:17,  2.37it/s][A
Training:  25%|██▌       | 13/52 [00:07<00:20,  1.87it/s][A
Training:  29%|██▉       | 15/52 [00:07<00:13,  2.72it/s][A
Training:  31%|███       | 16/52 [00:07<00:11,  3.15it/s][A
Training:  33%|███▎      | 17/52 [00:09<00:20,  1.69it/s][A
Training:  37%|███▋      | 19/52 [00:09<00:12,  2.54it/s][A
Training:  38%|███▊      | 20/52 [00:09<00:10,  2.99it/s][A
Training:  40%|████      | 21/52 [00:11<00:18,  1.66it/s][A
Training:  42%|████▏     | 22/52 [00:11

Epoch: 66/89 - Loss: 2.6937 - Accuracy: 0.9468



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:02<00:13,  2.25s/it][A
 43%|████▎     | 3/7 [00:02<00:02,  1.53it/s][A
 57%|█████▋    | 4/7 [00:02<00:01,  2.13it/s][A
100%|██████████| 7/7 [00:04<00:00,  1.71it/s][A
Epochs:  74%|███████▍  | 66/89 [30:49<10:50, 28.29s/it]

Val Loss: 4.2701 - Val Accuracy: 0.9281



Training:   0%|          | 0/52 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/52 [00:02<02:04,  2.44s/it][A
Training:   8%|▊         | 4/52 [00:02<00:23,  2.00it/s][A
Training:  12%|█▏        | 6/52 [00:04<00:31,  1.46it/s][A
Training:  15%|█▌        | 8/52 [00:04<00:19,  2.21it/s][A
Training:  17%|█▋        | 9/52 [00:06<00:28,  1.51it/s][A
Training:  19%|█▉        | 10/52 [00:06<00:22,  1.88it/s][A
Training:  25%|██▌       | 13/52 [00:07<00:22,  1.73it/s][A
Training:  27%|██▋       | 14/52 [00:08<00:18,  2.00it/s][A
Training:  29%|██▉       | 15/52 [00:08<00:15,  2.40it/s][A
Training:  31%|███       | 16/52 [00:08<00:12,  2.89it/s][A
Training:  33%|███▎      | 17/52 [00:09<00:21,  1.62it/s][A
Training:  35%|███▍      | 18/52 [00:09<00:16,  2.06it/s][A
Training:  37%|███▋      | 19/52 [00:10<00:12,  2.56it/s][A
Training:  38%|███▊      | 20/52 [00:10<00:10,  3.12it/s][A
Training:  40%|████      | 21/52 [00:11<00:20,  1.53it/s][A
Training:  48%|████▊     | 25/52 [00:

Epoch: 67/89 - Loss: 2.8008 - Accuracy: 0.9458



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:02<00:13,  2.24s/it][A
100%|██████████| 7/7 [00:04<00:00,  1.72it/s][A
Epochs:  75%|███████▌  | 67/89 [31:18<10:26, 28.50s/it]

Val Loss: 3.7572 - Val Accuracy: 0.9355



Training:   0%|          | 0/52 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/52 [00:02<01:52,  2.20s/it][A
Training:   8%|▊         | 4/52 [00:02<00:21,  2.20it/s][A
Training:  12%|█▏        | 6/52 [00:04<00:28,  1.60it/s][A
Training:  13%|█▎        | 7/52 [00:04<00:22,  1.97it/s][A
Training:  15%|█▌        | 8/52 [00:04<00:17,  2.46it/s][A
Training:  17%|█▋        | 9/52 [00:05<00:30,  1.42it/s][A
Training:  21%|██        | 11/52 [00:05<00:18,  2.26it/s][A
Training:  23%|██▎       | 12/52 [00:06<00:14,  2.74it/s][A
Training:  25%|██▌       | 13/52 [00:07<00:24,  1.58it/s][A
Training:  29%|██▉       | 15/52 [00:07<00:15,  2.43it/s][A
Training:  33%|███▎      | 17/52 [00:09<00:19,  1.75it/s][A
Training:  35%|███▍      | 18/52 [00:09<00:16,  2.07it/s][A
Training:  37%|███▋      | 19/52 [00:09<00:13,  2.53it/s][A
Training:  40%|████      | 21/52 [00:11<00:18,  1.71it/s][A
Training:  48%|████▊     | 25/52 [00:13<00:13,  1.96it/s][A
Training:  52%|█████▏    | 27/52 [00:1

Epoch: 68/89 - Loss: 2.4631 - Accuracy: 0.9515



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:02<00:14,  2.40s/it][A
 57%|█████▋    | 4/7 [00:02<00:01,  2.06it/s][A
100%|██████████| 7/7 [00:04<00:00,  1.72it/s][A
Epochs:  76%|███████▋  | 68/89 [31:47<09:58, 28.48s/it]

Val Loss: 4.1848 - Val Accuracy: 0.9263



Training:   0%|          | 0/52 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/52 [00:02<01:51,  2.20s/it][A
Training:   4%|▍         | 2/52 [00:02<00:49,  1.01it/s][A
Training:   6%|▌         | 3/52 [00:02<00:29,  1.68it/s][A
Training:  10%|▉         | 5/52 [00:03<00:29,  1.58it/s][A
Training:  13%|█▎        | 7/52 [00:03<00:17,  2.65it/s][A
Training:  17%|█▋        | 9/52 [00:05<00:21,  2.00it/s][A
Training:  23%|██▎       | 12/52 [00:05<00:11,  3.35it/s][A
Training:  25%|██▌       | 13/52 [00:07<00:21,  1.79it/s][A
Training:  29%|██▉       | 15/52 [00:07<00:14,  2.55it/s][A
Training:  33%|███▎      | 17/52 [00:08<00:17,  1.98it/s][A
Training:  37%|███▋      | 19/52 [00:08<00:11,  2.75it/s][A
Training:  40%|████      | 21/52 [00:10<00:15,  2.02it/s][A
Training:  42%|████▏     | 22/52 [00:10<00:14,  2.11it/s][A
Training:  44%|████▍     | 23/52 [00:11<00:11,  2.51it/s][A
Training:  46%|████▌     | 24/52 [00:11<00:09,  2.96it/s][A
Training:  48%|████▊     | 25/52 [00:1

Epoch: 69/89 - Loss: 2.6888 - Accuracy: 0.9455



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:02<00:13,  2.19s/it][A
 43%|████▎     | 3/7 [00:02<00:02,  1.61it/s][A
 71%|███████▏  | 5/7 [00:03<00:01,  1.52it/s][A
100%|██████████| 7/7 [00:04<00:00,  1.75it/s][A
Epochs:  78%|███████▊  | 69/89 [32:14<09:22, 28.14s/it]

Val Loss: 3.3651 - Val Accuracy: 0.9394



Training:   0%|          | 0/52 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/52 [00:02<01:50,  2.17s/it][A
Training:   6%|▌         | 3/52 [00:02<00:30,  1.58it/s][A
Training:   8%|▊         | 4/52 [00:02<00:22,  2.17it/s][A
Training:  10%|▉         | 5/52 [00:03<00:32,  1.43it/s][A
Training:  12%|█▏        | 6/52 [00:03<00:23,  1.96it/s][A
Training:  13%|█▎        | 7/52 [00:04<00:20,  2.15it/s][A
Training:  17%|█▋        | 9/52 [00:05<00:22,  1.92it/s][A
Training:  19%|█▉        | 10/52 [00:05<00:19,  2.12it/s][A
Training:  21%|██        | 11/52 [00:06<00:18,  2.22it/s][A
Training:  23%|██▎       | 12/52 [00:06<00:14,  2.79it/s][A
Training:  25%|██▌       | 13/52 [00:07<00:22,  1.77it/s][A
Training:  27%|██▋       | 14/52 [00:07<00:18,  2.04it/s][A
Training:  29%|██▉       | 15/52 [00:07<00:17,  2.16it/s][A
Training:  33%|███▎      | 17/52 [00:09<00:17,  1.95it/s][A
Training:  35%|███▍      | 18/52 [00:09<00:14,  2.38it/s][A
Training:  37%|███▋      | 19/52 [00:09

Epoch: 70/89 - Loss: 2.5380 - Accuracy: 0.9487



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:02<00:14,  2.49s/it][A
 57%|█████▋    | 4/7 [00:02<00:01,  1.94it/s][A
100%|██████████| 7/7 [00:04<00:00,  1.70it/s][A
Epochs:  79%|███████▊  | 70/89 [32:42<08:55, 28.19s/it]

Val Loss: 3.3251 - Val Accuracy: 0.9378



Training:   0%|          | 0/52 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/52 [00:02<02:07,  2.50s/it][A
Training:   4%|▍         | 2/52 [00:02<00:54,  1.10s/it][A
Training:   8%|▊         | 4/52 [00:02<00:22,  2.17it/s][A
Training:  10%|▉         | 5/52 [00:04<00:33,  1.39it/s][A
Training:  12%|█▏        | 6/52 [00:04<00:25,  1.82it/s][A
Training:  15%|█▌        | 8/52 [00:04<00:15,  2.89it/s][A
Training:  17%|█▋        | 9/52 [00:06<00:28,  1.49it/s][A
Training:  19%|█▉        | 10/52 [00:06<00:21,  1.92it/s][A
Training:  23%|██▎       | 12/52 [00:06<00:13,  2.98it/s][A
Training:  25%|██▌       | 13/52 [00:08<00:25,  1.55it/s][A
Training:  29%|██▉       | 15/52 [00:08<00:15,  2.36it/s][A
Training:  31%|███       | 16/52 [00:08<00:12,  2.83it/s][A
Training:  33%|███▎      | 17/52 [00:09<00:22,  1.57it/s][A
Training:  38%|███▊      | 20/52 [00:10<00:10,  2.96it/s][A
Training:  42%|████▏     | 22/52 [00:11<00:15,  1.94it/s][A
Training:  44%|████▍     | 23/52 [00:11

Epoch: 71/89 - Loss: 2.6937 - Accuracy: 0.9451



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:02<00:13,  2.20s/it][A
 43%|████▎     | 3/7 [00:02<00:02,  1.62it/s][A
 71%|███████▏  | 5/7 [00:03<00:01,  1.48it/s][A
100%|██████████| 7/7 [00:04<00:00,  1.66it/s][A
Epochs:  80%|███████▉  | 71/89 [33:11<08:32, 28.45s/it]

Val Loss: 3.5744 - Val Accuracy: 0.9341



Training:   0%|          | 0/52 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/52 [00:02<01:54,  2.24s/it][A
Training:   6%|▌         | 3/52 [00:02<00:32,  1.52it/s][A
Training:   8%|▊         | 4/52 [00:02<00:22,  2.14it/s][A
Training:  10%|▉         | 5/52 [00:04<00:37,  1.27it/s][A
Training:  12%|█▏        | 6/52 [00:04<00:26,  1.74it/s][A
Training:  15%|█▌        | 8/52 [00:04<00:14,  2.94it/s][A
Training:  17%|█▋        | 9/52 [00:05<00:27,  1.56it/s][A
Training:  19%|█▉        | 10/52 [00:05<00:21,  1.98it/s][A
Training:  21%|██        | 11/52 [00:06<00:16,  2.49it/s][A
Training:  25%|██▌       | 13/52 [00:07<00:23,  1.65it/s][A
Training:  29%|██▉       | 15/52 [00:07<00:15,  2.45it/s][A
Training:  31%|███       | 16/52 [00:08<00:12,  2.91it/s][A
Training:  33%|███▎      | 17/52 [00:09<00:21,  1.65it/s][A
Training:  35%|███▍      | 18/52 [00:09<00:16,  2.02it/s][A
Training:  37%|███▋      | 19/52 [00:09<00:13,  2.53it/s][A
Training:  40%|████      | 21/52 [00:11

Epoch: 72/89 - Loss: 2.4880 - Accuracy: 0.9498



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:02<00:14,  2.37s/it][A
 43%|████▎     | 3/7 [00:02<00:02,  1.53it/s][A
100%|██████████| 7/7 [00:04<00:00,  1.66it/s][A
Epochs:  81%|████████  | 72/89 [33:40<08:02, 28.38s/it]

Val Loss: 3.3681 - Val Accuracy: 0.9420



Training:   0%|          | 0/52 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/52 [00:01<01:34,  1.86s/it][A
Training:   4%|▍         | 2/52 [00:02<00:43,  1.15it/s][A
Training:  10%|▉         | 5/52 [00:03<00:30,  1.55it/s][A
Training:  12%|█▏        | 6/52 [00:04<00:28,  1.60it/s][A
Training:  13%|█▎        | 7/52 [00:04<00:21,  2.05it/s][A
Training:  15%|█▌        | 8/52 [00:04<00:16,  2.62it/s][A
Training:  17%|█▋        | 9/52 [00:05<00:26,  1.65it/s][A
Training:  19%|█▉        | 10/52 [00:06<00:22,  1.83it/s][A
Training:  23%|██▎       | 12/52 [00:06<00:14,  2.85it/s][A
Training:  25%|██▌       | 13/52 [00:07<00:20,  1.89it/s][A
Training:  27%|██▋       | 14/52 [00:07<00:19,  1.92it/s][A
Training:  31%|███       | 16/52 [00:07<00:11,  3.10it/s][A
Training:  33%|███▎      | 17/52 [00:09<00:19,  1.83it/s][A
Training:  35%|███▍      | 18/52 [00:09<00:17,  2.00it/s][A
Training:  38%|███▊      | 20/52 [00:09<00:10,  3.09it/s][A
Training:  40%|████      | 21/52 [00:11

Epoch: 73/89 - Loss: 2.3796 - Accuracy: 0.9514



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:02<00:12,  2.15s/it][A
 57%|█████▋    | 4/7 [00:02<00:01,  2.17it/s][A
 71%|███████▏  | 5/7 [00:03<00:01,  1.51it/s][A
100%|██████████| 7/7 [00:03<00:00,  1.85it/s][A
Epochs:  82%|████████▏ | 73/89 [34:08<07:32, 28.28s/it]

Val Loss: 3.6312 - Val Accuracy: 0.9339



Training:   0%|          | 0/52 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/52 [00:02<01:54,  2.24s/it][A
Training:   4%|▍         | 2/52 [00:02<00:49,  1.01it/s][A
Training:   8%|▊         | 4/52 [00:02<00:20,  2.35it/s][A
Training:  10%|▉         | 5/52 [00:04<00:35,  1.31it/s][A
Training:  13%|█▎        | 7/52 [00:04<00:19,  2.33it/s][A
Training:  17%|█▋        | 9/52 [00:05<00:24,  1.74it/s][A
Training:  19%|█▉        | 10/52 [00:05<00:20,  2.09it/s][A
Training:  23%|██▎       | 12/52 [00:06<00:12,  3.17it/s][A
Training:  27%|██▋       | 14/52 [00:07<00:20,  1.85it/s][A
Training:  31%|███       | 16/52 [00:08<00:13,  2.64it/s][A
Training:  33%|███▎      | 17/52 [00:09<00:20,  1.68it/s][A
Training:  35%|███▍      | 18/52 [00:09<00:17,  1.91it/s][A
Training:  38%|███▊      | 20/52 [00:09<00:11,  2.87it/s][A
Training:  40%|████      | 21/52 [00:11<00:18,  1.71it/s][A
Training:  42%|████▏     | 22/52 [00:11<00:16,  1.85it/s][A
Training:  44%|████▍     | 23/52 [00:1

Epoch: 74/89 - Loss: 2.3605 - Accuracy: 0.9529



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:02<00:13,  2.19s/it][A
 43%|████▎     | 3/7 [00:02<00:02,  1.65it/s][A
 71%|███████▏  | 5/7 [00:03<00:01,  1.54it/s][A
100%|██████████| 7/7 [00:03<00:00,  1.78it/s][A
Epochs:  83%|████████▎ | 74/89 [34:36<07:04, 28.31s/it]

Val Loss: 3.3685 - Val Accuracy: 0.9373



Training:   0%|          | 0/52 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/52 [00:02<01:56,  2.29s/it][A
Training:   6%|▌         | 3/52 [00:02<00:33,  1.47it/s][A
Training:   8%|▊         | 4/52 [00:02<00:23,  2.08it/s][A
Training:  10%|▉         | 5/52 [00:04<00:39,  1.18it/s][A
Training:  13%|█▎        | 7/52 [00:04<00:20,  2.17it/s][A
Training:  17%|█▋        | 9/52 [00:06<00:26,  1.61it/s][A
Training:  21%|██        | 11/52 [00:06<00:16,  2.42it/s][A
Training:  25%|██▌       | 13/52 [00:07<00:20,  1.93it/s][A
Training:  27%|██▋       | 14/52 [00:07<00:16,  2.29it/s][A
Training:  33%|███▎      | 17/52 [00:09<00:17,  2.03it/s][A
Training:  35%|███▍      | 18/52 [00:09<00:15,  2.22it/s][A
Training:  37%|███▋      | 19/52 [00:09<00:12,  2.60it/s][A
Training:  40%|████      | 21/52 [00:11<00:15,  2.00it/s][A
Training:  42%|████▏     | 22/52 [00:11<00:13,  2.27it/s][A
Training:  44%|████▍     | 23/52 [00:11<00:10,  2.70it/s][A
Training:  46%|████▌     | 24/52 [00:1

Epoch: 75/89 - Loss: 2.4480 - Accuracy: 0.9508



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:02<00:13,  2.28s/it][A
 43%|████▎     | 3/7 [00:02<00:02,  1.52it/s][A
 71%|███████▏  | 5/7 [00:03<00:01,  1.45it/s][A
100%|██████████| 7/7 [00:04<00:00,  1.68it/s][A
Epochs:  84%|████████▍ | 75/89 [35:04<06:35, 28.26s/it]

Val Loss: 3.1932 - Val Accuracy: 0.9418



Training:   0%|          | 0/52 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/52 [00:02<01:57,  2.30s/it][A
Training:   6%|▌         | 3/52 [00:02<00:32,  1.50it/s][A
Training:   8%|▊         | 4/52 [00:02<00:22,  2.10it/s][A
Training:  10%|▉         | 5/52 [00:04<00:42,  1.11it/s][A
Training:  13%|█▎        | 7/52 [00:04<00:22,  2.01it/s][A
Training:  17%|█▋        | 9/52 [00:06<00:27,  1.54it/s][A
Training:  19%|█▉        | 10/52 [00:06<00:22,  1.88it/s][A
Training:  23%|██▎       | 12/52 [00:06<00:14,  2.85it/s][A
Training:  25%|██▌       | 13/52 [00:08<00:24,  1.59it/s][A
Training:  27%|██▋       | 14/52 [00:08<00:19,  1.99it/s][A
Training:  29%|██▉       | 15/52 [00:08<00:14,  2.47it/s][A
Training:  33%|███▎      | 17/52 [00:10<00:20,  1.71it/s][A
Training:  35%|███▍      | 18/52 [00:10<00:16,  2.05it/s][A
Training:  37%|███▋      | 19/52 [00:10<00:13,  2.52it/s][A
Training:  38%|███▊      | 20/52 [00:10<00:10,  3.13it/s][A
Training:  40%|████      | 21/52 [00:1

Epoch: 76/89 - Loss: 2.2537 - Accuracy: 0.9536



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:02<00:13,  2.17s/it][A
 43%|████▎     | 3/7 [00:02<00:02,  1.65it/s][A
 71%|███████▏  | 5/7 [00:03<00:01,  1.50it/s][A
100%|██████████| 7/7 [00:03<00:00,  1.76it/s][A
Epochs:  85%|████████▌ | 76/89 [35:32<06:05, 28.14s/it]

Val Loss: 3.2619 - Val Accuracy: 0.9404



Training:   0%|          | 0/52 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/52 [00:02<01:58,  2.32s/it][A
Training:   8%|▊         | 4/52 [00:02<00:23,  2.02it/s][A
Training:  10%|▉         | 5/52 [00:04<00:38,  1.22it/s][A
Training:  12%|█▏        | 6/52 [00:04<00:28,  1.61it/s][A
Training:  15%|█▌        | 8/52 [00:04<00:16,  2.71it/s][A
Training:  19%|█▉        | 10/52 [00:06<00:23,  1.80it/s][A
Training:  23%|██▎       | 12/52 [00:06<00:15,  2.60it/s][A
Training:  25%|██▌       | 13/52 [00:07<00:24,  1.59it/s][A
Training:  27%|██▋       | 14/52 [00:08<00:20,  1.87it/s][A
Training:  31%|███       | 16/52 [00:08<00:13,  2.75it/s][A
Training:  33%|███▎      | 17/52 [00:09<00:21,  1.60it/s][A
Training:  35%|███▍      | 18/52 [00:09<00:17,  1.96it/s][A
Training:  38%|███▊      | 20/52 [00:10<00:10,  3.04it/s][A
Training:  40%|████      | 21/52 [00:11<00:18,  1.66it/s][A
Training:  42%|████▏     | 22/52 [00:11<00:14,  2.03it/s][A
Training:  44%|████▍     | 23/52 [00:

Epoch: 77/89 - Loss: 2.2870 - Accuracy: 0.9550



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:02<00:13,  2.26s/it][A
 43%|████▎     | 3/7 [00:02<00:02,  1.56it/s][A
 71%|███████▏  | 5/7 [00:03<00:01,  1.44it/s][A
100%|██████████| 7/7 [00:04<00:00,  1.66it/s][A
Epochs:  87%|████████▋ | 77/89 [36:01<05:39, 28.30s/it]

Val Loss: 3.4807 - Val Accuracy: 0.9344



Training:   0%|          | 0/52 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/52 [00:02<01:58,  2.32s/it][A
Training:   6%|▌         | 3/52 [00:02<00:31,  1.54it/s][A
Training:   8%|▊         | 4/52 [00:02<00:23,  2.06it/s][A
Training:  10%|▉         | 5/52 [00:04<00:39,  1.19it/s][A
Training:  13%|█▎        | 7/52 [00:04<00:21,  2.11it/s][A
Training:  17%|█▋        | 9/52 [00:05<00:26,  1.63it/s][A
Training:  21%|██        | 11/52 [00:06<00:17,  2.40it/s][A
Training:  23%|██▎       | 12/52 [00:06<00:14,  2.75it/s][A
Training:  25%|██▌       | 13/52 [00:07<00:23,  1.67it/s][A
Training:  29%|██▉       | 15/52 [00:07<00:14,  2.58it/s][A
Training:  31%|███       | 16/52 [00:07<00:12,  2.96it/s][A
Training:  33%|███▎      | 17/52 [00:09<00:21,  1.61it/s][A
Training:  37%|███▋      | 19/52 [00:09<00:13,  2.50it/s][A
Training:  38%|███▊      | 20/52 [00:09<00:11,  2.72it/s][A
Training:  40%|████      | 21/52 [00:11<00:18,  1.64it/s][A
Training:  42%|████▏     | 22/52 [00:1

Epoch: 78/89 - Loss: 2.4459 - Accuracy: 0.9515



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:02<00:13,  2.25s/it][A
 29%|██▊       | 2/7 [00:02<00:05,  1.09s/it][A
 43%|████▎     | 3/7 [00:02<00:02,  1.53it/s][A
 71%|███████▏  | 5/7 [00:03<00:01,  1.54it/s][A
100%|██████████| 7/7 [00:04<00:00,  1.61it/s][A
Epochs:  88%|████████▊ | 78/89 [36:29<05:12, 28.44s/it]

Val Loss: 3.3116 - Val Accuracy: 0.9447



Training:   0%|          | 0/52 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/52 [00:02<01:58,  2.32s/it][A
Training:   6%|▌         | 3/52 [00:02<00:33,  1.46it/s][A
Training:   8%|▊         | 4/52 [00:02<00:23,  2.07it/s][A
Training:  10%|▉         | 5/52 [00:04<00:39,  1.20it/s][A
Training:  13%|█▎        | 7/52 [00:04<00:21,  2.05it/s][A
Training:  17%|█▋        | 9/52 [00:06<00:26,  1.64it/s][A
Training:  21%|██        | 11/52 [00:06<00:18,  2.20it/s][A
Training:  23%|██▎       | 12/52 [00:06<00:15,  2.60it/s][A
Training:  25%|██▌       | 13/52 [00:07<00:23,  1.64it/s][A
Training:  29%|██▉       | 15/52 [00:08<00:16,  2.24it/s][A
Training:  33%|███▎      | 17/52 [00:09<00:18,  1.87it/s][A
Training:  35%|███▍      | 18/52 [00:09<00:15,  2.20it/s][A
Training:  37%|███▋      | 19/52 [00:10<00:13,  2.40it/s][A
Training:  40%|████      | 21/52 [00:11<00:15,  2.03it/s][A
Training:  44%|████▍     | 23/52 [00:11<00:10,  2.66it/s][A
Training:  48%|████▊     | 25/52 [00:1

Epoch: 79/89 - Loss: 2.3716 - Accuracy: 0.9517



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:02<00:13,  2.24s/it][A
 29%|██▊       | 2/7 [00:02<00:05,  1.07s/it][A
 71%|███████▏  | 5/7 [00:03<00:01,  1.60it/s][A
100%|██████████| 7/7 [00:04<00:00,  1.60it/s][A
Epochs:  89%|████████▉ | 79/89 [36:58<04:45, 28.51s/it]

Val Loss: 3.2756 - Val Accuracy: 0.9404



Training:   0%|          | 0/52 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/52 [00:02<02:01,  2.38s/it][A
Training:   6%|▌         | 3/52 [00:02<00:32,  1.49it/s][A
Training:  10%|▉         | 5/52 [00:04<00:36,  1.30it/s][A
Training:  13%|█▎        | 7/52 [00:04<00:21,  2.08it/s][A
Training:  15%|█▌        | 8/52 [00:04<00:17,  2.50it/s][A
Training:  17%|█▋        | 9/52 [00:06<00:29,  1.46it/s][A
Training:  21%|██        | 11/52 [00:06<00:17,  2.28it/s][A
Training:  25%|██▌       | 13/52 [00:07<00:21,  1.80it/s][A
Training:  29%|██▉       | 15/52 [00:07<00:14,  2.63it/s][A
Training:  33%|███▎      | 17/52 [00:09<00:18,  1.85it/s][A
Training:  40%|████      | 21/52 [00:11<00:14,  2.13it/s][A
Training:  42%|████▏     | 22/52 [00:11<00:13,  2.28it/s][A
Training:  46%|████▌     | 24/52 [00:11<00:09,  3.09it/s][A
Training:  48%|████▊     | 25/52 [00:12<00:13,  1.98it/s][A
Training:  50%|█████     | 26/52 [00:13<00:12,  2.16it/s][A
Training:  52%|█████▏    | 27/52 [00:1

Epoch: 80/89 - Loss: 2.3236 - Accuracy: 0.9532



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:02<00:14,  2.35s/it][A
 43%|████▎     | 3/7 [00:02<00:02,  1.46it/s][A
 71%|███████▏  | 5/7 [00:03<00:01,  1.45it/s][A
100%|██████████| 7/7 [00:04<00:00,  1.65it/s][A
Epochs:  90%|████████▉ | 80/89 [37:27<04:16, 28.51s/it]

Val Loss: 3.4901 - Val Accuracy: 0.9383



Training:   0%|          | 0/52 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/52 [00:02<02:01,  2.38s/it][A
Training:   4%|▍         | 2/52 [00:02<00:52,  1.05s/it][A
Training:   8%|▊         | 4/52 [00:02<00:20,  2.29it/s][A
Training:  10%|▉         | 5/52 [00:04<00:38,  1.21it/s][A
Training:  12%|█▏        | 6/52 [00:04<00:28,  1.64it/s][A
Training:  15%|█▌        | 8/52 [00:04<00:15,  2.75it/s][A
Training:  17%|█▋        | 9/52 [00:06<00:27,  1.57it/s][A
Training:  21%|██        | 11/52 [00:06<00:16,  2.52it/s][A
Training:  23%|██▎       | 12/52 [00:06<00:13,  3.02it/s][A
Training:  25%|██▌       | 13/52 [00:08<00:26,  1.50it/s][A
Training:  27%|██▋       | 14/52 [00:08<00:20,  1.89it/s][A
Training:  29%|██▉       | 15/52 [00:08<00:15,  2.37it/s][A
Training:  31%|███       | 16/52 [00:08<00:12,  2.91it/s][A
Training:  33%|███▎      | 17/52 [00:09<00:21,  1.60it/s][A
Training:  37%|███▋      | 19/52 [00:09<00:12,  2.72it/s][A
Training:  40%|████      | 21/52 [00:11

Epoch: 81/89 - Loss: 2.3892 - Accuracy: 0.9509



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:02<00:13,  2.25s/it][A
 29%|██▊       | 2/7 [00:02<00:05,  1.01s/it][A
100%|██████████| 7/7 [00:04<00:00,  1.68it/s][A
Epochs:  91%|█████████ | 81/89 [37:55<03:47, 28.48s/it]

Val Loss: 3.3537 - Val Accuracy: 0.9397



Training:   0%|          | 0/52 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/52 [00:02<02:01,  2.37s/it][A
Training:   4%|▍         | 2/52 [00:02<00:52,  1.05s/it][A
Training:   6%|▌         | 3/52 [00:02<00:32,  1.50it/s][A
Training:  10%|▉         | 5/52 [00:04<00:33,  1.42it/s][A
Training:  13%|█▎        | 7/52 [00:04<00:21,  2.09it/s][A
Training:  15%|█▌        | 8/52 [00:04<00:17,  2.55it/s][A
Training:  17%|█▋        | 9/52 [00:05<00:26,  1.61it/s][A
Training:  19%|█▉        | 10/52 [00:06<00:20,  2.06it/s][A
Training:  21%|██        | 11/52 [00:06<00:19,  2.15it/s][A
Training:  25%|██▌       | 13/52 [00:07<00:22,  1.71it/s][A
Training:  27%|██▋       | 14/52 [00:08<00:17,  2.12it/s][A
Training:  29%|██▉       | 15/52 [00:08<00:17,  2.15it/s][A
Training:  33%|███▎      | 17/52 [00:09<00:19,  1.81it/s][A
Training:  35%|███▍      | 18/52 [00:10<00:15,  2.22it/s][A
Training:  37%|███▋      | 19/52 [00:10<00:12,  2.60it/s][A
Training:  40%|████      | 21/52 [00:11

Epoch: 82/89 - Loss: 2.3386 - Accuracy: 0.9544



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:02<00:14,  2.35s/it][A
 43%|████▎     | 3/7 [00:02<00:02,  1.43it/s][A
 71%|███████▏  | 5/7 [00:03<00:01,  1.45it/s][A
100%|██████████| 7/7 [00:04<00:00,  1.63it/s][A
Epochs:  92%|█████████▏| 82/89 [38:24<03:19, 28.49s/it]

Val Loss: 3.3249 - Val Accuracy: 0.9399



Training:   0%|          | 0/52 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/52 [00:02<02:00,  2.36s/it][A
Training:   4%|▍         | 2/52 [00:02<00:51,  1.03s/it][A
Training:   8%|▊         | 4/52 [00:02<00:20,  2.37it/s][A
Training:  12%|█▏        | 6/52 [00:04<00:26,  1.71it/s][A
Training:  15%|█▌        | 8/52 [00:04<00:16,  2.61it/s][A
Training:  17%|█▋        | 9/52 [00:05<00:28,  1.51it/s][A
Training:  23%|██▎       | 12/52 [00:06<00:14,  2.76it/s][A
Training:  27%|██▋       | 14/52 [00:07<00:19,  1.91it/s][A
Training:  31%|███       | 16/52 [00:07<00:13,  2.62it/s][A
Training:  33%|███▎      | 17/52 [00:09<00:20,  1.68it/s][A
Training:  37%|███▋      | 19/52 [00:09<00:13,  2.42it/s][A
Training:  40%|████      | 21/52 [00:11<00:16,  1.82it/s][A
Training:  46%|████▌     | 24/52 [00:11<00:09,  2.97it/s][A
Training:  50%|█████     | 26/52 [00:12<00:12,  2.13it/s][A
Training:  56%|█████▌    | 29/52 [00:14<00:12,  1.90it/s][A
Training:  58%|█████▊    | 30/52 [00:1

Epoch: 83/89 - Loss: 2.3105 - Accuracy: 0.9525



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:02<00:13,  2.19s/it][A
 29%|██▊       | 2/7 [00:02<00:04,  1.02it/s][A
 57%|█████▋    | 4/7 [00:02<00:01,  2.49it/s][A
100%|██████████| 7/7 [00:04<00:00,  1.71it/s][A
Epochs:  93%|█████████▎| 83/89 [38:52<02:50, 28.47s/it]

Val Loss: 3.3023 - Val Accuracy: 0.9388



Training:   0%|          | 0/52 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/52 [00:02<01:48,  2.13s/it][A
Training:   6%|▌         | 3/52 [00:02<00:30,  1.60it/s][A
Training:  10%|▉         | 5/52 [00:03<00:29,  1.59it/s][A
Training:  12%|█▏        | 6/52 [00:03<00:23,  1.98it/s][A
Training:  13%|█▎        | 7/52 [00:03<00:18,  2.47it/s][A
Training:  15%|█▌        | 8/52 [00:04<00:14,  3.03it/s][A
Training:  17%|█▋        | 9/52 [00:05<00:28,  1.53it/s][A
Training:  19%|█▉        | 10/52 [00:05<00:23,  1.75it/s][A
Training:  21%|██        | 11/52 [00:05<00:17,  2.29it/s][A
Training:  23%|██▎       | 12/52 [00:06<00:13,  2.90it/s][A
Training:  25%|██▌       | 13/52 [00:07<00:23,  1.69it/s][A
Training:  27%|██▋       | 14/52 [00:07<00:18,  2.08it/s][A
Training:  31%|███       | 16/52 [00:07<00:10,  3.38it/s][A
Training:  33%|███▎      | 17/52 [00:08<00:18,  1.90it/s][A
Training:  35%|███▍      | 18/52 [00:09<00:18,  1.88it/s][A
Training:  38%|███▊      | 20/52 [00:09

Epoch: 84/89 - Loss: 2.3095 - Accuracy: 0.9533



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:02<00:13,  2.30s/it][A
 43%|████▎     | 3/7 [00:02<00:02,  1.45it/s][A
 71%|███████▏  | 5/7 [00:03<00:01,  1.51it/s][A
100%|██████████| 7/7 [00:04<00:00,  1.73it/s][A
Epochs:  94%|█████████▍| 84/89 [39:20<02:21, 28.39s/it]

Val Loss: 3.3614 - Val Accuracy: 0.9423



Training:   0%|          | 0/52 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/52 [00:02<01:57,  2.31s/it][A
Training:   4%|▍         | 2/52 [00:02<00:50,  1.02s/it][A
Training:   8%|▊         | 4/52 [00:02<00:20,  2.30it/s][A
Training:  10%|▉         | 5/52 [00:03<00:33,  1.39it/s][A
Training:  12%|█▏        | 6/52 [00:04<00:24,  1.87it/s][A
Training:  13%|█▎        | 7/52 [00:04<00:18,  2.44it/s][A
Training:  15%|█▌        | 8/52 [00:04<00:14,  3.12it/s][A
Training:  17%|█▋        | 9/52 [00:05<00:28,  1.49it/s][A
Training:  19%|█▉        | 10/52 [00:05<00:21,  1.99it/s][A
Training:  23%|██▎       | 12/52 [00:06<00:12,  3.24it/s][A
Training:  25%|██▌       | 13/52 [00:07<00:23,  1.64it/s][A
Training:  29%|██▉       | 15/52 [00:07<00:14,  2.50it/s][A
Training:  31%|███       | 16/52 [00:07<00:12,  2.95it/s][A
Training:  33%|███▎      | 17/52 [00:09<00:22,  1.55it/s][A
Training:  37%|███▋      | 19/52 [00:09<00:13,  2.36it/s][A
Training:  40%|████      | 21/52 [00:11<

Epoch: 85/89 - Loss: 2.2776 - Accuracy: 0.9525



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:02<00:12,  2.08s/it][A
 29%|██▊       | 2/7 [00:02<00:04,  1.08it/s][A
 43%|████▎     | 3/7 [00:02<00:02,  1.79it/s][A
100%|██████████| 7/7 [00:04<00:00,  1.75it/s][A
Epochs:  96%|█████████▌| 85/89 [39:49<01:53, 28.44s/it]

Val Loss: 3.2668 - Val Accuracy: 0.9415



Training:   0%|          | 0/52 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/52 [00:02<02:09,  2.54s/it][A
Training:   4%|▍         | 2/52 [00:02<00:56,  1.12s/it][A
Training:   6%|▌         | 3/52 [00:02<00:33,  1.48it/s][A
Training:   8%|▊         | 4/52 [00:02<00:21,  2.22it/s][A
Training:  10%|▉         | 5/52 [00:04<00:35,  1.32it/s][A
Training:  13%|█▎        | 7/52 [00:04<00:17,  2.51it/s][A
Training:  17%|█▋        | 9/52 [00:05<00:23,  1.85it/s][A
Training:  19%|█▉        | 10/52 [00:05<00:18,  2.26it/s][A
Training:  23%|██▎       | 12/52 [00:06<00:11,  3.37it/s][A
Training:  25%|██▌       | 13/52 [00:07<00:21,  1.79it/s][A
Training:  31%|███       | 16/52 [00:07<00:11,  3.20it/s][A
Training:  35%|███▍      | 18/52 [00:09<00:16,  2.10it/s][A
Training:  38%|███▊      | 20/52 [00:09<00:11,  2.72it/s][A
Training:  40%|████      | 21/52 [00:11<00:17,  1.74it/s][A
Training:  44%|████▍     | 23/52 [00:11<00:11,  2.53it/s][A
Training:  46%|████▌     | 24/52 [00:11

Epoch: 86/89 - Loss: 2.2284 - Accuracy: 0.9537



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:02<00:13,  2.17s/it][A
 43%|████▎     | 3/7 [00:02<00:02,  1.65it/s][A
 71%|███████▏  | 5/7 [00:03<00:01,  1.45it/s][A
100%|██████████| 7/7 [00:04<00:00,  1.73it/s][A
Epochs:  97%|█████████▋| 86/89 [40:17<01:25, 28.46s/it]

Val Loss: 3.4536 - Val Accuracy: 0.9373



Training:   0%|          | 0/52 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/52 [00:02<01:53,  2.23s/it][A
Training:   4%|▍         | 2/52 [00:02<00:49,  1.01it/s][A
Training:   8%|▊         | 4/52 [00:02<00:20,  2.35it/s][A
Training:  10%|▉         | 5/52 [00:03<00:32,  1.44it/s][A
Training:  12%|█▏        | 6/52 [00:04<00:27,  1.67it/s][A
Training:  15%|█▌        | 8/52 [00:04<00:17,  2.50it/s][A
Training:  17%|█▋        | 9/52 [00:05<00:28,  1.53it/s][A
Training:  19%|█▉        | 10/52 [00:06<00:23,  1.80it/s][A
Training:  21%|██        | 11/52 [00:06<00:17,  2.29it/s][A
Training:  23%|██▎       | 12/52 [00:06<00:13,  2.90it/s][A
Training:  25%|██▌       | 13/52 [00:07<00:22,  1.75it/s][A
Training:  27%|██▋       | 14/52 [00:07<00:17,  2.12it/s][A
Training:  31%|███       | 16/52 [00:08<00:12,  2.93it/s][A
Training:  33%|███▎      | 17/52 [00:09<00:20,  1.69it/s][A
Training:  35%|███▍      | 18/52 [00:09<00:15,  2.13it/s][A
Training:  37%|███▋      | 19/52 [00:09

Epoch: 87/89 - Loss: 2.3290 - Accuracy: 0.9531



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:11,  1.96s/it][A
 29%|██▊       | 2/7 [00:02<00:04,  1.14it/s][A
 71%|███████▏  | 5/7 [00:03<00:01,  1.49it/s][A
100%|██████████| 7/7 [00:04<00:00,  1.71it/s][A
Epochs:  98%|█████████▊| 87/89 [40:46<00:56, 28.49s/it]

Val Loss: 3.2939 - Val Accuracy: 0.9418



Training:   0%|          | 0/52 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/52 [00:01<01:38,  1.93s/it][A
Training:   4%|▍         | 2/52 [00:02<00:43,  1.15it/s][A
Training:   6%|▌         | 3/52 [00:02<00:26,  1.84it/s][A
Training:   8%|▊         | 4/52 [00:02<00:18,  2.64it/s][A
Training:  10%|▉         | 5/52 [00:03<00:36,  1.29it/s][A
Training:  13%|█▎        | 7/52 [00:04<00:20,  2.25it/s][A
Training:  15%|█▌        | 8/52 [00:04<00:15,  2.80it/s][A
Training:  17%|█▋        | 9/52 [00:05<00:25,  1.66it/s][A
Training:  21%|██        | 11/52 [00:05<00:17,  2.39it/s][A
Training:  25%|██▌       | 13/52 [00:07<00:22,  1.77it/s][A
Training:  27%|██▋       | 14/52 [00:07<00:17,  2.15it/s][A
Training:  29%|██▉       | 15/52 [00:07<00:15,  2.38it/s][A
Training:  31%|███       | 16/52 [00:07<00:12,  2.94it/s][A
Training:  33%|███▎      | 17/52 [00:09<00:21,  1.65it/s][A
Training:  37%|███▋      | 19/52 [00:09<00:14,  2.35it/s][A
Training:  40%|████      | 21/52 [00:10<

Epoch: 88/89 - Loss: 2.3404 - Accuracy: 0.9522



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:02<00:12,  2.13s/it][A
100%|██████████| 7/7 [00:03<00:00,  1.76it/s][A
Epochs:  99%|█████████▉| 88/89 [41:14<00:28, 28.28s/it]

Val Loss: 3.5174 - Val Accuracy: 0.9379



Training:   0%|          | 0/52 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/52 [00:02<01:59,  2.34s/it][A
Training:   4%|▍         | 2/52 [00:02<00:51,  1.02s/it][A
Training:  10%|▉         | 5/52 [00:04<00:32,  1.43it/s][A
Training:  12%|█▏        | 6/52 [00:04<00:25,  1.82it/s][A
Training:  13%|█▎        | 7/52 [00:04<00:19,  2.29it/s][A
Training:  15%|█▌        | 8/52 [00:04<00:15,  2.85it/s][A
Training:  17%|█▋        | 9/52 [00:06<00:29,  1.46it/s][A
Training:  23%|██▎       | 12/52 [00:06<00:13,  3.02it/s][A
Training:  27%|██▋       | 14/52 [00:07<00:19,  1.92it/s][A
Training:  31%|███       | 16/52 [00:08<00:13,  2.64it/s][A
Training:  33%|███▎      | 17/52 [00:09<00:22,  1.58it/s][A
Training:  37%|███▋      | 19/52 [00:09<00:14,  2.30it/s][A
Training:  38%|███▊      | 20/52 [00:10<00:11,  2.72it/s][A
Training:  40%|████      | 21/52 [00:11<00:21,  1.46it/s][A
Training:  42%|████▏     | 22/52 [00:12<00:16,  1.82it/s][A
Training:  46%|████▌     | 24/52 [00:12

Epoch: 89/89 - Loss: 2.4302 - Accuracy: 0.9504



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:02<00:14,  2.39s/it][A
 43%|████▎     | 3/7 [00:02<00:02,  1.50it/s][A
100%|██████████| 7/7 [00:04<00:00,  1.66it/s][A
Epochs: 100%|██████████| 89/89 [41:42<00:00, 28.12s/it]


Val Loss: 3.3878 - Val Accuracy: 0.9404
Saving best model...


[32m[I 2023-12-15 00:49:46,864][0m Trial 11 finished with value: 0.9404187798500061 and parameters: {'loss_learning_rate': 0.0005475502239825571, 'learning_rate': 0.0011125954409380188, 'weight_decay': 0.004132770040241243, 'epsilon': 3.4960361296560697e-08, 'batch_size': 273, 'epochs': 89}. Best is trial 11 with value: 0.9404187798500061.[0m


Learning rate for Loss: 0.0005277050881421744
Learning rate: 0.0005432782772369768
Weight decay: 0.0027195407598362966
Epsilon: 2.9301992360816376e-08
Batch size: 285
Number of epochs: 96


Epochs:   0%|          | 0/96 [00:00<?, ?it/s]
Training:   0%|          | 0/50 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/50 [00:02<01:49,  2.24s/it][A
Training:   6%|▌         | 3/50 [00:02<00:29,  1.60it/s][A
Training:  10%|█         | 5/50 [00:03<00:31,  1.42it/s][A
Training:  14%|█▍        | 7/50 [00:04<00:19,  2.21it/s][A
Training:  16%|█▌        | 8/50 [00:04<00:15,  2.67it/s][A
Training:  18%|█▊        | 9/50 [00:06<00:29,  1.39it/s][A
Training:  20%|██        | 10/50 [00:06<00:22,  1.79it/s][A
Training:  24%|██▍       | 12/50 [00:06<00:13,  2.83it/s][A
Training:  26%|██▌       | 13/50 [00:07<00:23,  1.55it/s][A
Training:  30%|███       | 15/50 [00:08<00:14,  2.38it/s][A
Training:  32%|███▏      | 16/50 [00:08<00:11,  2.84it/s][A
Training:  34%|███▍      | 17/50 [00:09<00:22,  1.44it/s][A
Training:  36%|███▌      | 18/50 [00:10<00:17,  1.84it/s][A
Training:  38%|███▊      | 19/50 [00:10<00:13,  2.24it/s][A
Training:  42%|████▏     | 21/50 [00:11<00:17,  1.67i

Epoch: 1/96 - Loss: 10.0629 - Accuracy: 0.7895



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:02<00:15,  2.60s/it][A
 71%|███████▏  | 5/7 [00:04<00:01,  1.37it/s][A
100%|██████████| 7/7 [00:04<00:00,  1.56it/s][A
Epochs:   0%|          | 0/96 [00:29<?, ?it/s]
[32m[I 2023-12-15 00:50:16,451][0m Trial 12 pruned. [0m


Val Loss: 5.6724 - Val Accuracy: 0.8903
Learning rate for Loss: 0.002289514973902357
Learning rate: 0.007646092569651815
Weight decay: 0.0008053997913410849
Epsilon: 2.3212362162812156e-08
Batch size: 136
Number of epochs: 42


Epochs:   0%|          | 0/42 [00:00<?, ?it/s]
Training:   0%|          | 0/103 [00:00<?, ?it/s][A
Training:   1%|          | 1/103 [00:01<02:20,  1.37s/it][A
Training:   4%|▍         | 4/103 [00:01<00:29,  3.37it/s][A
Training:   6%|▌         | 6/103 [00:02<00:29,  3.29it/s][A
Training:   7%|▋         | 7/103 [00:02<00:31,  3.06it/s][A
Training:   9%|▊         | 9/103 [00:03<00:27,  3.38it/s][A
Training:  11%|█         | 11/103 [00:03<00:24,  3.72it/s][A
Training:  12%|█▏        | 12/103 [00:03<00:21,  4.25it/s][A
Training:  13%|█▎        | 13/103 [00:04<00:25,  3.58it/s][A
Training:  15%|█▍        | 15/103 [00:04<00:21,  4.00it/s][A
Training:  17%|█▋        | 17/103 [00:04<00:21,  3.93it/s][A
Training:  18%|█▊        | 19/103 [00:05<00:19,  4.37it/s][A
Training:  20%|██        | 21/103 [00:06<00:21,  3.75it/s][A
Training:  22%|██▏       | 23/103 [00:06<00:16,  4.95it/s][A
Training:  23%|██▎       | 24/103 [00:06<00:17,  4.64it/s][A
Training:  24%|██▍       | 25/103 [00

Epoch: 1/42 - Loss: 10.5662 - Accuracy: 0.8036



  0%|          | 0/13 [00:00<?, ?it/s][A
  8%|▊         | 1/13 [00:01<00:15,  1.26s/it][A
 31%|███       | 4/13 [00:01<00:02,  3.72it/s][A
 46%|████▌     | 6/13 [00:02<00:02,  2.83it/s][A
 62%|██████▏   | 8/13 [00:02<00:01,  4.17it/s][A
 77%|███████▋  | 10/13 [00:03<00:00,  3.73it/s][A
100%|██████████| 13/13 [00:03<00:00,  3.54it/s][A
Epochs:   0%|          | 0/42 [00:27<?, ?it/s]
[32m[I 2023-12-15 00:50:44,709][0m Trial 13 pruned. [0m


Val Loss: 5.0934 - Val Accuracy: 0.8861
Learning rate for Loss: 0.000464955048386433
Learning rate: 0.0008393612566801806
Weight decay: 0.00010595225339379551
Epsilon: 4.2768576402929346e-08
Batch size: 254
Number of epochs: 83


Epochs:   0%|          | 0/83 [00:00<?, ?it/s]
Training:   0%|          | 0/56 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/56 [00:01<01:46,  1.93s/it][A
Training:   4%|▎         | 2/56 [00:02<00:51,  1.05it/s][A
Training:   9%|▉         | 5/56 [00:03<00:29,  1.75it/s][A
Training:  11%|█         | 6/56 [00:03<00:25,  1.96it/s][A
Training:  14%|█▍        | 8/56 [00:03<00:16,  2.99it/s][A
Training:  16%|█▌        | 9/56 [00:05<00:25,  1.85it/s][A
Training:  18%|█▊        | 10/56 [00:05<00:23,  1.95it/s][A
Training:  21%|██▏       | 12/56 [00:05<00:14,  2.99it/s][A
Training:  23%|██▎       | 13/56 [00:06<00:21,  1.96it/s][A
Training:  25%|██▌       | 14/56 [00:07<00:18,  2.26it/s][A
Training:  27%|██▋       | 15/56 [00:07<00:14,  2.79it/s][A
Training:  29%|██▊       | 16/56 [00:07<00:11,  3.41it/s][A
Training:  30%|███       | 17/56 [00:08<00:19,  2.04it/s][A
Training:  32%|███▏      | 18/56 [00:08<00:19,  1.95it/s][A
Training:  36%|███▌      | 20/56 [00:09<00:11,  3.13i

Epoch: 1/83 - Loss: 9.6149 - Accuracy: 0.8003



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:02<00:15,  2.55s/it][A
 57%|█████▋    | 4/7 [00:02<00:01,  1.95it/s][A
100%|██████████| 7/7 [00:04<00:00,  1.63it/s][A
Epochs:   0%|          | 0/83 [00:28<?, ?it/s]
[32m[I 2023-12-15 00:51:14,121][0m Trial 14 pruned. [0m


Val Loss: 5.6151 - Val Accuracy: 0.9012
Learning rate for Loss: 0.0016723340404899286
Learning rate: 0.00297091543911568
Weight decay: 0.0030935162473622207
Epsilon: 1.3436697189792923e-08
Batch size: 156
Number of epochs: 48


Epochs:   0%|          | 0/48 [00:00<?, ?it/s]
Training:   0%|          | 0/90 [00:00<?, ?it/s][A
Training:   1%|          | 1/90 [00:01<02:07,  1.43s/it][A
Training:   4%|▍         | 4/90 [00:01<00:32,  2.65it/s][A
Training:   6%|▌         | 5/90 [00:02<00:41,  2.05it/s][A
Training:   9%|▉         | 8/90 [00:02<00:23,  3.50it/s][A
Training:  10%|█         | 9/90 [00:03<00:30,  2.70it/s][A
Training:  11%|█         | 10/90 [00:03<00:24,  3.24it/s][A
Training:  13%|█▎        | 12/90 [00:04<00:19,  3.99it/s][A
Training:  14%|█▍        | 13/90 [00:04<00:27,  2.83it/s][A
Training:  17%|█▋        | 15/90 [00:04<00:18,  4.15it/s][A
Training:  18%|█▊        | 16/90 [00:05<00:18,  3.96it/s][A
Training:  19%|█▉        | 17/90 [00:05<00:25,  2.83it/s][A
Training:  21%|██        | 19/90 [00:06<00:16,  4.19it/s][A
Training:  22%|██▏       | 20/90 [00:06<00:19,  3.61it/s][A
Training:  23%|██▎       | 21/90 [00:06<00:22,  3.00it/s][A
Training:  26%|██▌       | 23/90 [00:07<00:14,  4.51

Epoch: 1/48 - Loss: 8.5977 - Accuracy: 0.8215



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:16,  1.52s/it][A
 42%|████▏     | 5/12 [00:02<00:03,  2.22it/s][A
 67%|██████▋   | 8/12 [00:02<00:01,  3.92it/s][A
100%|██████████| 12/12 [00:03<00:00,  3.20it/s][A
Epochs:   2%|▏         | 1/48 [00:28<22:20, 28.51s/it]

Val Loss: 4.4888 - Val Accuracy: 0.9187



Training:   0%|          | 0/90 [00:00<?, ?it/s][A
Training:   1%|          | 1/90 [00:01<02:23,  1.61s/it][A
Training:   6%|▌         | 5/90 [00:02<00:41,  2.06it/s][A
Training:   9%|▉         | 8/90 [00:02<00:22,  3.64it/s][A
Training:  11%|█         | 10/90 [00:03<00:26,  3.00it/s][A
Training:  14%|█▍        | 13/90 [00:04<00:24,  3.14it/s][A
Training:  16%|█▌        | 14/90 [00:04<00:22,  3.43it/s][A
Training:  19%|█▉        | 17/90 [00:05<00:21,  3.43it/s][A
Training:  21%|██        | 19/90 [00:05<00:16,  4.21it/s][A
Training:  23%|██▎       | 21/90 [00:06<00:19,  3.46it/s][A
Training:  24%|██▍       | 22/90 [00:06<00:17,  3.85it/s][A
Training:  28%|██▊       | 25/90 [00:07<00:17,  3.79it/s][A
Training:  29%|██▉       | 26/90 [00:07<00:15,  4.22it/s][A
Training:  31%|███       | 28/90 [00:07<00:10,  5.64it/s][A
Training:  33%|███▎      | 30/90 [00:08<00:16,  3.75it/s][A
Training:  36%|███▌      | 32/90 [00:08<00:11,  4.89it/s][A
Training:  38%|███▊      | 34/90 [0

Epoch: 2/48 - Loss: 4.6448 - Accuracy: 0.9146



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:15,  1.40s/it][A
 17%|█▋        | 2/12 [00:01<00:06,  1.44it/s][A
 33%|███▎      | 4/12 [00:01<00:02,  3.36it/s][A
 42%|████▏     | 5/12 [00:02<00:03,  2.31it/s][A
 50%|█████     | 6/12 [00:02<00:02,  2.71it/s][A
 67%|██████▋   | 8/12 [00:02<00:00,  4.50it/s][A
 75%|███████▌  | 9/12 [00:03<00:01,  2.99it/s][A
100%|██████████| 12/12 [00:03<00:00,  3.13it/s][A
Epochs:   4%|▍         | 2/48 [00:56<21:25, 27.94s/it]

Val Loss: 3.9168 - Val Accuracy: 0.9336



Training:   0%|          | 0/90 [00:00<?, ?it/s][A
Training:   1%|          | 1/90 [00:01<02:03,  1.38s/it][A
Training:   3%|▎         | 3/90 [00:01<00:36,  2.42it/s][A
Training:   4%|▍         | 4/90 [00:01<00:27,  3.16it/s][A
Training:   6%|▌         | 5/90 [00:02<00:37,  2.29it/s][A
Training:   7%|▋         | 6/90 [00:02<00:30,  2.80it/s][A
Training:   9%|▉         | 8/90 [00:02<00:18,  4.50it/s][A
Training:  10%|█         | 9/90 [00:03<00:28,  2.82it/s][A
Training:  12%|█▏        | 11/90 [00:03<00:18,  4.38it/s][A
Training:  13%|█▎        | 12/90 [00:03<00:15,  4.93it/s][A
Training:  14%|█▍        | 13/90 [00:04<00:30,  2.50it/s][A
Training:  16%|█▌        | 14/90 [00:04<00:24,  3.11it/s][A
Training:  18%|█▊        | 16/90 [00:04<00:15,  4.72it/s][A
Training:  20%|██        | 18/90 [00:05<00:20,  3.52it/s][A
Training:  22%|██▏       | 20/90 [00:05<00:14,  4.82it/s][A
Training:  23%|██▎       | 21/90 [00:06<00:24,  2.86it/s][A
Training:  26%|██▌       | 23/90 [00:06

Epoch: 3/48 - Loss: 4.1600 - Accuracy: 0.9228



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:17,  1.59s/it][A
 33%|███▎      | 4/12 [00:01<00:02,  2.76it/s][A
 42%|████▏     | 5/12 [00:02<00:03,  2.24it/s][A
 58%|█████▊    | 7/12 [00:02<00:01,  3.48it/s][A
 67%|██████▋   | 8/12 [00:02<00:00,  4.11it/s][A
 75%|███████▌  | 9/12 [00:03<00:01,  2.89it/s][A
100%|██████████| 12/12 [00:03<00:00,  3.16it/s][A
Epochs:   6%|▋         | 3/48 [01:23<20:46, 27.69s/it]

Val Loss: 6.2952 - Val Accuracy: 0.8825



Training:   0%|          | 0/90 [00:00<?, ?it/s][A
Training:   1%|          | 1/90 [00:01<02:17,  1.54s/it][A
Training:   3%|▎         | 3/90 [00:01<00:38,  2.27it/s][A
Training:   6%|▌         | 5/90 [00:02<00:36,  2.36it/s][A
Training:   9%|▉         | 8/90 [00:02<00:20,  4.09it/s][A
Training:  10%|█         | 9/90 [00:03<00:27,  2.95it/s][A
Training:  11%|█         | 10/90 [00:03<00:24,  3.22it/s][A
Training:  13%|█▎        | 12/90 [00:03<00:19,  4.04it/s][A
Training:  14%|█▍        | 13/90 [00:04<00:24,  3.15it/s][A
Training:  16%|█▌        | 14/90 [00:04<00:21,  3.49it/s][A
Training:  18%|█▊        | 16/90 [00:05<00:18,  4.03it/s][A
Training:  19%|█▉        | 17/90 [00:05<00:22,  3.32it/s][A
Training:  20%|██        | 18/90 [00:05<00:18,  3.84it/s][A
Training:  21%|██        | 19/90 [00:05<00:16,  4.39it/s][A
Training:  22%|██▏       | 20/90 [00:06<00:18,  3.83it/s][A
Training:  23%|██▎       | 21/90 [00:06<00:20,  3.30it/s][A
Training:  24%|██▍       | 22/90 [00:

Epoch: 4/48 - Loss: 3.7943 - Accuracy: 0.9320



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:15,  1.42s/it][A
 25%|██▌       | 3/12 [00:01<00:03,  2.44it/s][A
 42%|████▏     | 5/12 [00:02<00:03,  2.19it/s][A
 67%|██████▋   | 8/12 [00:02<00:01,  3.90it/s][A
100%|██████████| 12/12 [00:03<00:00,  3.30it/s][A
Epochs:   8%|▊         | 4/48 [01:51<20:21, 27.77s/it]

Val Loss: 4.1244 - Val Accuracy: 0.9155



Training:   0%|          | 0/90 [00:00<?, ?it/s][A
Training:   1%|          | 1/90 [00:01<02:10,  1.46s/it][A
Training:   3%|▎         | 3/90 [00:01<00:36,  2.39it/s][A
Training:   6%|▌         | 5/90 [00:02<00:38,  2.21it/s][A
Training:   9%|▉         | 8/90 [00:02<00:19,  4.14it/s][A
Training:  11%|█         | 10/90 [00:03<00:25,  3.08it/s][A
Training:  13%|█▎        | 12/90 [00:03<00:18,  4.17it/s][A
Training:  16%|█▌        | 14/90 [00:04<00:25,  2.99it/s][A
Training:  17%|█▋        | 15/90 [00:04<00:21,  3.42it/s][A
Training:  19%|█▉        | 17/90 [00:05<00:24,  2.96it/s][A
Training:  21%|██        | 19/90 [00:06<00:18,  3.84it/s][A
Training:  23%|██▎       | 21/90 [00:06<00:22,  3.12it/s][A
Training:  28%|██▊       | 25/90 [00:08<00:19,  3.39it/s][A
Training:  31%|███       | 28/90 [00:08<00:12,  4.84it/s][A
Training:  33%|███▎      | 30/90 [00:09<00:16,  3.72it/s][A
Training:  36%|███▌      | 32/90 [00:09<00:12,  4.70it/s][A
Training:  38%|███▊      | 34/90 [00

Epoch: 5/48 - Loss: 4.0450 - Accuracy: 0.9232



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:15,  1.37s/it][A
 17%|█▋        | 2/12 [00:01<00:06,  1.52it/s][A
 33%|███▎      | 4/12 [00:01<00:02,  3.49it/s][A
 42%|████▏     | 5/12 [00:02<00:02,  2.53it/s][A
 50%|█████     | 6/12 [00:02<00:02,  2.86it/s][A
 75%|███████▌  | 9/12 [00:03<00:00,  3.38it/s][A
100%|██████████| 12/12 [00:03<00:00,  3.06it/s][A
Epochs:  10%|█         | 5/48 [02:19<19:57, 27.85s/it]

Val Loss: 3.9517 - Val Accuracy: 0.9323



Training:   0%|          | 0/90 [00:00<?, ?it/s][A
Training:   1%|          | 1/90 [00:01<02:20,  1.57s/it][A
Training:   3%|▎         | 3/90 [00:01<00:39,  2.22it/s][A
Training:   6%|▌         | 5/90 [00:02<00:37,  2.24it/s][A
Training:   8%|▊         | 7/90 [00:02<00:23,  3.50it/s][A
Training:  10%|█         | 9/90 [00:03<00:30,  2.65it/s][A
Training:  12%|█▏        | 11/90 [00:03<00:21,  3.71it/s][A
Training:  14%|█▍        | 13/90 [00:04<00:25,  3.06it/s][A
Training:  17%|█▋        | 15/90 [00:04<00:18,  4.15it/s][A
Training:  19%|█▉        | 17/90 [00:05<00:22,  3.18it/s][A
Training:  22%|██▏       | 20/90 [00:05<00:14,  4.90it/s][A
Training:  24%|██▍       | 22/90 [00:07<00:19,  3.46it/s][A
Training:  27%|██▋       | 24/90 [00:07<00:14,  4.49it/s][A
Training:  29%|██▉       | 26/90 [00:07<00:17,  3.62it/s][A
Training:  31%|███       | 28/90 [00:08<00:13,  4.71it/s][A
Training:  33%|███▎      | 30/90 [00:08<00:16,  3.57it/s][A
Training:  36%|███▌      | 32/90 [00:

Epoch: 6/48 - Loss: 3.6585 - Accuracy: 0.9335



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:15,  1.38s/it][A
 25%|██▌       | 3/12 [00:01<00:03,  2.47it/s][A
 33%|███▎      | 4/12 [00:01<00:02,  3.23it/s][A
 42%|████▏     | 5/12 [00:02<00:03,  2.24it/s][A
 58%|█████▊    | 7/12 [00:02<00:01,  3.84it/s][A
 75%|███████▌  | 9/12 [00:03<00:00,  3.09it/s][A
100%|██████████| 12/12 [00:03<00:00,  3.32it/s][A
Epochs:  12%|█▎        | 6/48 [02:47<19:31, 27.89s/it]

Val Loss: 4.0311 - Val Accuracy: 0.9280



Training:   0%|          | 0/90 [00:00<?, ?it/s][A
Training:   1%|          | 1/90 [00:01<02:21,  1.59s/it][A
Training:   4%|▍         | 4/90 [00:01<00:28,  3.04it/s][A
Training:   7%|▋         | 6/90 [00:02<00:34,  2.44it/s][A
Training:   9%|▉         | 8/90 [00:02<00:22,  3.58it/s][A
Training:  11%|█         | 10/90 [00:03<00:27,  2.87it/s][A
Training:  14%|█▍        | 13/90 [00:05<00:28,  2.71it/s][A
Training:  18%|█▊        | 16/90 [00:05<00:17,  4.12it/s][A
Training:  20%|██        | 18/90 [00:06<00:21,  3.35it/s][A
Training:  22%|██▏       | 20/90 [00:06<00:16,  4.20it/s][A
Training:  24%|██▍       | 22/90 [00:07<00:20,  3.38it/s][A
Training:  27%|██▋       | 24/90 [00:07<00:15,  4.30it/s][A
Training:  28%|██▊       | 25/90 [00:08<00:23,  2.72it/s][A
Training:  30%|███       | 27/90 [00:08<00:16,  3.75it/s][A
Training:  32%|███▏      | 29/90 [00:09<00:19,  3.20it/s][A
Training:  37%|███▋      | 33/90 [00:10<00:15,  3.67it/s][A
Training:  41%|████      | 37/90 [00

Epoch: 7/48 - Loss: 3.4247 - Accuracy: 0.9372



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:15,  1.44s/it][A
 33%|███▎      | 4/12 [00:01<00:02,  3.31it/s][A
 50%|█████     | 6/12 [00:02<00:02,  2.76it/s][A
100%|██████████| 12/12 [00:03<00:00,  3.39it/s][A
Epochs:  15%|█▍        | 7/48 [03:14<18:55, 27.71s/it]

Val Loss: 3.5545 - Val Accuracy: 0.9400



Training:   0%|          | 0/90 [00:00<?, ?it/s][A
Training:   1%|          | 1/90 [00:01<02:15,  1.52s/it][A
Training:   3%|▎         | 3/90 [00:01<00:39,  2.18it/s][A
Training:   6%|▌         | 5/90 [00:02<00:37,  2.29it/s][A
Training:   7%|▋         | 6/90 [00:02<00:30,  2.72it/s][A
Training:   9%|▉         | 8/90 [00:02<00:18,  4.35it/s][A
Training:  11%|█         | 10/90 [00:03<00:28,  2.83it/s][A
Training:  12%|█▏        | 11/90 [00:04<00:23,  3.33it/s][A
Training:  14%|█▍        | 13/90 [00:04<00:23,  3.34it/s][A
Training:  16%|█▌        | 14/90 [00:05<00:25,  2.99it/s][A
Training:  18%|█▊        | 16/90 [00:05<00:17,  4.25it/s][A
Training:  19%|█▉        | 17/90 [00:05<00:19,  3.75it/s][A
Training:  20%|██        | 18/90 [00:05<00:20,  3.50it/s][A
Training:  23%|██▎       | 21/90 [00:06<00:15,  4.50it/s][A
Training:  24%|██▍       | 22/90 [00:07<00:22,  3.03it/s][A
Training:  26%|██▌       | 23/90 [00:07<00:19,  3.51it/s][A
Training:  28%|██▊       | 25/90 [00:

Epoch: 8/48 - Loss: 3.2348 - Accuracy: 0.9419



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:14,  1.34s/it][A
 17%|█▋        | 2/12 [00:01<00:06,  1.52it/s][A
 42%|████▏     | 5/12 [00:02<00:02,  2.65it/s][A
 50%|█████     | 6/12 [00:02<00:02,  2.79it/s][A
 75%|███████▌  | 9/12 [00:03<00:00,  3.35it/s][A
100%|██████████| 12/12 [00:03<00:00,  3.23it/s][A
Epochs:  17%|█▋        | 8/48 [03:42<18:24, 27.61s/it]

Val Loss: 3.8344 - Val Accuracy: 0.9244



Training:   0%|          | 0/90 [00:00<?, ?it/s][A
Training:   1%|          | 1/90 [00:01<02:26,  1.65s/it][A
Training:   4%|▍         | 4/90 [00:01<00:29,  2.93it/s][A
Training:   7%|▋         | 6/90 [00:02<00:33,  2.53it/s][A
Training:  10%|█         | 9/90 [00:03<00:28,  2.85it/s][A
Training:  11%|█         | 10/90 [00:03<00:26,  3.01it/s][A
Training:  13%|█▎        | 12/90 [00:03<00:18,  4.21it/s][A
Training:  14%|█▍        | 13/90 [00:04<00:26,  2.90it/s][A
Training:  16%|█▌        | 14/90 [00:05<00:24,  3.05it/s][A
Training:  18%|█▊        | 16/90 [00:05<00:16,  4.51it/s][A
Training:  19%|█▉        | 17/90 [00:05<00:20,  3.53it/s][A
Training:  20%|██        | 18/90 [00:05<00:20,  3.44it/s][A
Training:  21%|██        | 19/90 [00:06<00:17,  4.02it/s][A
Training:  23%|██▎       | 21/90 [00:06<00:18,  3.71it/s][A
Training:  24%|██▍       | 22/90 [00:07<00:20,  3.35it/s][A
Training:  28%|██▊       | 25/90 [00:07<00:18,  3.59it/s][A
Training:  29%|██▉       | 26/90 [00

Epoch: 9/48 - Loss: 3.4740 - Accuracy: 0.9391



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:14,  1.30s/it][A
 17%|█▋        | 2/12 [00:01<00:06,  1.52it/s][A
 42%|████▏     | 5/12 [00:02<00:02,  2.79it/s][A
 50%|█████     | 6/12 [00:02<00:01,  3.31it/s][A
 67%|██████▋   | 8/12 [00:02<00:00,  4.97it/s][A
 75%|███████▌  | 9/12 [00:03<00:00,  3.42it/s][A
100%|██████████| 12/12 [00:03<00:00,  3.32it/s][A
Epochs:  19%|█▉        | 9/48 [04:09<17:52, 27.50s/it]

Val Loss: 4.0380 - Val Accuracy: 0.9241



Training:   0%|          | 0/90 [00:00<?, ?it/s][A
Training:   1%|          | 1/90 [00:01<02:08,  1.45s/it][A
Training:   2%|▏         | 2/90 [00:01<01:00,  1.44it/s][A
Training:   3%|▎         | 3/90 [00:01<00:37,  2.34it/s][A
Training:   6%|▌         | 5/90 [00:02<00:33,  2.56it/s][A
Training:   7%|▋         | 6/90 [00:02<00:28,  2.90it/s][A
Training:   9%|▉         | 8/90 [00:02<00:17,  4.60it/s][A
Training:  10%|█         | 9/90 [00:03<00:30,  2.65it/s][A
Training:  11%|█         | 10/90 [00:03<00:25,  3.08it/s][A
Training:  14%|█▍        | 13/90 [00:04<00:25,  3.03it/s][A
Training:  17%|█▋        | 15/90 [00:04<00:17,  4.21it/s][A
Training:  19%|█▉        | 17/90 [00:06<00:24,  3.00it/s][A
Training:  22%|██▏       | 20/90 [00:06<00:14,  4.69it/s][A
Training:  24%|██▍       | 22/90 [00:07<00:19,  3.47it/s][A
Training:  26%|██▌       | 23/90 [00:07<00:17,  3.87it/s][A
Training:  28%|██▊       | 25/90 [00:08<00:21,  3.03it/s][A
Training:  29%|██▉       | 26/90 [00:08

Epoch: 10/48 - Loss: 3.4341 - Accuracy: 0.9341



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:14,  1.31s/it][A
 33%|███▎      | 4/12 [00:01<00:02,  3.53it/s][A
 50%|█████     | 6/12 [00:02<00:01,  3.01it/s][A
 67%|██████▋   | 8/12 [00:02<00:00,  4.18it/s][A
100%|██████████| 12/12 [00:03<00:00,  3.46it/s][A
Epochs:  21%|██        | 10/48 [04:37<17:27, 27.57s/it]

Val Loss: 3.8350 - Val Accuracy: 0.9293



Training:   0%|          | 0/90 [00:00<?, ?it/s][A
Training:   1%|          | 1/90 [00:01<01:58,  1.33s/it][A
Training:   3%|▎         | 3/90 [00:01<00:34,  2.54it/s][A
Training:   6%|▌         | 5/90 [00:02<00:34,  2.46it/s][A
Training:   7%|▋         | 6/90 [00:02<00:27,  3.04it/s][A
Training:  10%|█         | 9/90 [00:03<00:24,  3.27it/s][A
Training:  11%|█         | 10/90 [00:03<00:23,  3.36it/s][A
Training:  13%|█▎        | 12/90 [00:03<00:16,  4.82it/s][A
Training:  14%|█▍        | 13/90 [00:04<00:22,  3.39it/s][A
Training:  16%|█▌        | 14/90 [00:04<00:20,  3.68it/s][A
Training:  19%|█▉        | 17/90 [00:05<00:18,  3.95it/s][A
Training:  20%|██        | 18/90 [00:05<00:17,  4.01it/s][A
Training:  23%|██▎       | 21/90 [00:06<00:15,  4.35it/s][A
Training:  24%|██▍       | 22/90 [00:06<00:18,  3.67it/s][A
Training:  27%|██▋       | 24/90 [00:06<00:13,  4.85it/s][A
Training:  28%|██▊       | 25/90 [00:07<00:18,  3.56it/s][A
Training:  29%|██▉       | 26/90 [00:

Epoch: 11/48 - Loss: 3.3190 - Accuracy: 0.9373



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:15,  1.41s/it][A
 25%|██▌       | 3/12 [00:01<00:03,  2.38it/s][A
 42%|████▏     | 5/12 [00:02<00:02,  2.48it/s][A
 67%|██████▋   | 8/12 [00:02<00:00,  4.73it/s][A
100%|██████████| 12/12 [00:03<00:00,  3.45it/s][A
Epochs:  23%|██▎       | 11/48 [05:03<16:48, 27.26s/it]

Val Loss: 3.5664 - Val Accuracy: 0.9283



Training:   0%|          | 0/90 [00:00<?, ?it/s][A
Training:   1%|          | 1/90 [00:01<02:28,  1.67s/it][A
Training:   2%|▏         | 2/90 [00:01<01:05,  1.34it/s][A
Training:   4%|▍         | 4/90 [00:01<00:27,  3.17it/s][A
Training:   7%|▋         | 6/90 [00:02<00:30,  2.77it/s][A
Training:  10%|█         | 9/90 [00:03<00:27,  2.94it/s][A
Training:  12%|█▏        | 11/90 [00:03<00:20,  3.94it/s][A
Training:  14%|█▍        | 13/90 [00:04<00:24,  3.09it/s][A
Training:  19%|█▉        | 17/90 [00:05<00:21,  3.32it/s][A
Training:  23%|██▎       | 21/90 [00:06<00:17,  3.94it/s][A
Training:  28%|██▊       | 25/90 [00:07<00:16,  3.95it/s][A
Training:  29%|██▉       | 26/90 [00:07<00:15,  4.14it/s][A
Training:  30%|███       | 27/90 [00:07<00:13,  4.52it/s][A
Training:  32%|███▏      | 29/90 [00:08<00:15,  3.82it/s][A
Training:  33%|███▎      | 30/90 [00:08<00:15,  3.83it/s][A
Training:  36%|███▌      | 32/90 [00:09<00:11,  4.97it/s][A
Training:  37%|███▋      | 33/90 [00:

Epoch: 12/48 - Loss: 3.1604 - Accuracy: 0.9403



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:15,  1.40s/it][A
 33%|███▎      | 4/12 [00:01<00:02,  3.28it/s][A
 50%|█████     | 6/12 [00:02<00:02,  2.88it/s][A
100%|██████████| 12/12 [00:03<00:00,  3.77it/s][A
Epochs:  25%|██▌       | 12/48 [05:30<16:19, 27.20s/it]

Val Loss: 3.4354 - Val Accuracy: 0.9394



Training:   0%|          | 0/90 [00:00<?, ?it/s][A
Training:   1%|          | 1/90 [00:01<02:19,  1.57s/it][A
Training:   3%|▎         | 3/90 [00:01<00:40,  2.15it/s][A
Training:   6%|▌         | 5/90 [00:02<00:37,  2.25it/s][A
Training:   8%|▊         | 7/90 [00:02<00:24,  3.40it/s][A
Training:  10%|█         | 9/90 [00:03<00:27,  2.92it/s][A
Training:  12%|█▏        | 11/90 [00:03<00:19,  3.96it/s][A
Training:  13%|█▎        | 12/90 [00:03<00:17,  4.45it/s][A
Training:  14%|█▍        | 13/90 [00:04<00:24,  3.10it/s][A
Training:  16%|█▌        | 14/90 [00:04<00:21,  3.46it/s][A
Training:  17%|█▋        | 15/90 [00:04<00:18,  4.01it/s][A
Training:  19%|█▉        | 17/90 [00:05<00:17,  4.24it/s][A
Training:  20%|██        | 18/90 [00:05<00:17,  4.06it/s][A
Training:  21%|██        | 19/90 [00:05<00:15,  4.52it/s][A
Training:  23%|██▎       | 21/90 [00:06<00:15,  4.56it/s][A
Training:  24%|██▍       | 22/90 [00:06<00:15,  4.28it/s][A
Training:  27%|██▋       | 24/90 [00:

Epoch: 13/48 - Loss: 3.3456 - Accuracy: 0.9350



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:15,  1.38s/it][A
 33%|███▎      | 4/12 [00:01<00:02,  3.35it/s][A
 50%|█████     | 6/12 [00:02<00:02,  2.76it/s][A
 67%|██████▋   | 8/12 [00:02<00:00,  4.07it/s][A
100%|██████████| 12/12 [00:03<00:00,  3.32it/s][A
Epochs:  27%|██▋       | 13/48 [05:57<15:52, 27.22s/it]

Val Loss: 3.4394 - Val Accuracy: 0.9421



Training:   0%|          | 0/90 [00:00<?, ?it/s][A
Training:   1%|          | 1/90 [00:01<01:53,  1.27s/it][A
Training:   2%|▏         | 2/90 [00:01<00:54,  1.61it/s][A
Training:   4%|▍         | 4/90 [00:01<00:23,  3.64it/s][A
Training:   6%|▌         | 5/90 [00:02<00:34,  2.49it/s][A
Training:   7%|▋         | 6/90 [00:02<00:28,  2.91it/s][A
Training:   9%|▉         | 8/90 [00:02<00:18,  4.37it/s][A
Training:  10%|█         | 9/90 [00:03<00:25,  3.14it/s][A
Training:  11%|█         | 10/90 [00:03<00:26,  2.99it/s][A
Training:  13%|█▎        | 12/90 [00:03<00:17,  4.51it/s][A
Training:  14%|█▍        | 13/90 [00:04<00:24,  3.09it/s][A
Training:  17%|█▋        | 15/90 [00:04<00:16,  4.62it/s][A
Training:  19%|█▉        | 17/90 [00:05<00:20,  3.50it/s][A
Training:  21%|██        | 19/90 [00:05<00:14,  4.80it/s][A
Training:  23%|██▎       | 21/90 [00:06<00:18,  3.77it/s][A
Training:  24%|██▍       | 22/90 [00:06<00:16,  4.06it/s][A
Training:  28%|██▊       | 25/90 [00:07

Epoch: 14/48 - Loss: 2.9002 - Accuracy: 0.9438



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:16,  1.50s/it][A
 25%|██▌       | 3/12 [00:01<00:04,  2.24it/s][A
 42%|████▏     | 5/12 [00:02<00:03,  2.28it/s][A
 58%|█████▊    | 7/12 [00:02<00:01,  3.55it/s][A
 67%|██████▋   | 8/12 [00:02<00:00,  4.11it/s][A
 75%|███████▌  | 9/12 [00:03<00:01,  2.83it/s][A
100%|██████████| 12/12 [00:03<00:00,  3.25it/s][A
Epochs:  29%|██▉       | 14/48 [06:24<15:21, 27.09s/it]

Val Loss: 3.7528 - Val Accuracy: 0.9275



Training:   0%|          | 0/90 [00:00<?, ?it/s][A
Training:   1%|          | 1/90 [00:01<01:52,  1.27s/it][A
Training:   2%|▏         | 2/90 [00:01<00:57,  1.53it/s][A
Training:   4%|▍         | 4/90 [00:01<00:24,  3.54it/s][A
Training:   6%|▌         | 5/90 [00:02<00:32,  2.59it/s][A
Training:   7%|▋         | 6/90 [00:02<00:29,  2.81it/s][A
Training:   9%|▉         | 8/90 [00:02<00:18,  4.53it/s][A
Training:  10%|█         | 9/90 [00:03<00:24,  3.27it/s][A
Training:  11%|█         | 10/90 [00:03<00:27,  2.94it/s][A
Training:  13%|█▎        | 12/90 [00:03<00:18,  4.29it/s][A
Training:  14%|█▍        | 13/90 [00:04<00:22,  3.45it/s][A
Training:  16%|█▌        | 14/90 [00:04<00:24,  3.14it/s][A
Training:  18%|█▊        | 16/90 [00:04<00:16,  4.56it/s][A
Training:  19%|█▉        | 17/90 [00:05<00:18,  3.90it/s][A
Training:  20%|██        | 18/90 [00:05<00:22,  3.24it/s][A
Training:  22%|██▏       | 20/90 [00:05<00:15,  4.53it/s][A
Training:  23%|██▎       | 21/90 [00:06

Epoch: 15/48 - Loss: 2.9916 - Accuracy: 0.9431



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:16,  1.46s/it][A
 25%|██▌       | 3/12 [00:01<00:03,  2.36it/s][A
 42%|████▏     | 5/12 [00:02<00:02,  2.56it/s][A
 58%|█████▊    | 7/12 [00:02<00:01,  3.99it/s][A
 75%|███████▌  | 9/12 [00:03<00:00,  3.27it/s][A
100%|██████████| 12/12 [00:03<00:00,  3.45it/s][A
Epochs:  31%|███▏      | 15/48 [06:51<14:48, 26.92s/it]

Val Loss: 3.6294 - Val Accuracy: 0.9355



Training:   0%|          | 0/90 [00:00<?, ?it/s][A
Training:   1%|          | 1/90 [00:01<02:13,  1.50s/it][A
Training:   3%|▎         | 3/90 [00:01<00:37,  2.33it/s][A
Training:   6%|▌         | 5/90 [00:02<00:36,  2.30it/s][A
Training:   8%|▊         | 7/90 [00:02<00:22,  3.63it/s][A
Training:  10%|█         | 9/90 [00:03<00:28,  2.85it/s][A
Training:  12%|█▏        | 11/90 [00:03<00:20,  3.85it/s][A
Training:  14%|█▍        | 13/90 [00:04<00:27,  2.83it/s][A
Training:  16%|█▌        | 14/90 [00:04<00:23,  3.21it/s][A
Training:  18%|█▊        | 16/90 [00:05<00:16,  4.38it/s][A
Training:  19%|█▉        | 17/90 [00:05<00:23,  3.05it/s][A
Training:  21%|██        | 19/90 [00:05<00:16,  4.38it/s][A
Training:  23%|██▎       | 21/90 [00:06<00:19,  3.47it/s][A
Training:  26%|██▌       | 23/90 [00:06<00:15,  4.37it/s][A
Training:  28%|██▊       | 25/90 [00:08<00:21,  3.07it/s][A
Training:  30%|███       | 27/90 [00:08<00:15,  4.03it/s][A
Training:  32%|███▏      | 29/90 [00:

Epoch: 16/48 - Loss: 3.0105 - Accuracy: 0.9417



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:14,  1.29s/it][A
 17%|█▋        | 2/12 [00:01<00:06,  1.50it/s][A
 33%|███▎      | 4/12 [00:01<00:02,  3.28it/s][A
 42%|████▏     | 5/12 [00:02<00:03,  2.26it/s][A
 67%|██████▋   | 8/12 [00:02<00:00,  4.27it/s][A
 75%|███████▌  | 9/12 [00:03<00:01,  2.90it/s][A
100%|██████████| 12/12 [00:03<00:00,  3.24it/s][A
Epochs:  33%|███▎      | 16/48 [07:19<14:31, 27.23s/it]

Val Loss: 3.7021 - Val Accuracy: 0.9339



Training:   0%|          | 0/90 [00:00<?, ?it/s][A
Training:   1%|          | 1/90 [00:01<02:11,  1.47s/it][A
Training:   3%|▎         | 3/90 [00:01<00:38,  2.24it/s][A
Training:   6%|▌         | 5/90 [00:02<00:37,  2.27it/s][A
Training:   7%|▋         | 6/90 [00:02<00:29,  2.81it/s][A
Training:   8%|▊         | 7/90 [00:02<00:23,  3.46it/s][A
Training:  10%|█         | 9/90 [00:03<00:27,  2.97it/s][A
Training:  11%|█         | 10/90 [00:03<00:24,  3.33it/s][A
Training:  13%|█▎        | 12/90 [00:03<00:16,  4.65it/s][A
Training:  14%|█▍        | 13/90 [00:04<00:25,  3.07it/s][A
Training:  17%|█▋        | 15/90 [00:04<00:19,  3.88it/s][A
Training:  19%|█▉        | 17/90 [00:05<00:22,  3.18it/s][A
Training:  21%|██        | 19/90 [00:06<00:18,  3.92it/s][A
Training:  23%|██▎       | 21/90 [00:06<00:19,  3.51it/s][A
Training:  24%|██▍       | 22/90 [00:06<00:17,  3.93it/s][A
Training:  28%|██▊       | 25/90 [00:07<00:17,  3.81it/s][A
Training:  29%|██▉       | 26/90 [00:0

Epoch: 17/48 - Loss: 2.9220 - Accuracy: 0.9423



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:14,  1.30s/it][A
 25%|██▌       | 3/12 [00:01<00:03,  2.50it/s][A
 42%|████▏     | 5/12 [00:02<00:02,  2.99it/s][A
 50%|█████     | 6/12 [00:02<00:02,  2.96it/s][A
 58%|█████▊    | 7/12 [00:02<00:01,  3.61it/s][A
 75%|███████▌  | 9/12 [00:03<00:00,  3.39it/s][A
100%|██████████| 12/12 [00:03<00:00,  3.30it/s][A
Epochs:  35%|███▌      | 17/48 [07:46<14:03, 27.20s/it]

Val Loss: 3.6202 - Val Accuracy: 0.9344



Training:   0%|          | 0/90 [00:00<?, ?it/s][A
Training:   1%|          | 1/90 [00:01<02:13,  1.50s/it][A
Training:   2%|▏         | 2/90 [00:01<01:00,  1.45it/s][A
Training:   4%|▍         | 4/90 [00:01<00:25,  3.34it/s][A
Training:   6%|▌         | 5/90 [00:02<00:35,  2.37it/s][A
Training:   8%|▊         | 7/90 [00:02<00:22,  3.69it/s][A
Training:  10%|█         | 9/90 [00:03<00:25,  3.18it/s][A
Training:  11%|█         | 10/90 [00:03<00:24,  3.26it/s][A
Training:  13%|█▎        | 12/90 [00:03<00:16,  4.77it/s][A
Training:  14%|█▍        | 13/90 [00:04<00:24,  3.21it/s][A
Training:  16%|█▌        | 14/90 [00:04<00:21,  3.58it/s][A
Training:  17%|█▋        | 15/90 [00:04<00:18,  3.97it/s][A
Training:  19%|█▉        | 17/90 [00:05<00:21,  3.47it/s][A
Training:  20%|██        | 18/90 [00:05<00:17,  4.00it/s][A
Training:  21%|██        | 19/90 [00:05<00:19,  3.69it/s][A
Training:  23%|██▎       | 21/90 [00:06<00:17,  3.87it/s][A
Training:  24%|██▍       | 22/90 [00:0

Epoch: 18/48 - Loss: 2.9154 - Accuracy: 0.9437



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:15,  1.41s/it][A
 33%|███▎      | 4/12 [00:01<00:02,  3.19it/s][A
 50%|█████     | 6/12 [00:02<00:02,  2.81it/s][A
 58%|█████▊    | 7/12 [00:02<00:01,  3.19it/s][A
 75%|███████▌  | 9/12 [00:03<00:01,  2.80it/s][A
100%|██████████| 12/12 [00:03<00:00,  3.26it/s][A
Epochs:  38%|███▊      | 18/48 [08:14<13:44, 27.49s/it]

Val Loss: 3.3297 - Val Accuracy: 0.9416



Training:   0%|          | 0/90 [00:00<?, ?it/s][A
Training:   1%|          | 1/90 [00:01<02:14,  1.51s/it][A
Training:   3%|▎         | 3/90 [00:01<00:37,  2.32it/s][A
Training:   6%|▌         | 5/90 [00:02<00:39,  2.14it/s][A
Training:   8%|▊         | 7/90 [00:02<00:25,  3.27it/s][A
Training:  10%|█         | 9/90 [00:03<00:29,  2.79it/s][A
Training:  12%|█▏        | 11/90 [00:03<00:20,  3.87it/s][A
Training:  14%|█▍        | 13/90 [00:05<00:29,  2.63it/s][A
Training:  16%|█▌        | 14/90 [00:05<00:24,  3.06it/s][A
Training:  19%|█▉        | 17/90 [00:06<00:24,  2.97it/s][A
Training:  22%|██▏       | 20/90 [00:06<00:15,  4.55it/s][A
Training:  24%|██▍       | 22/90 [00:07<00:19,  3.50it/s][A
Training:  28%|██▊       | 25/90 [00:08<00:18,  3.56it/s][A
Training:  30%|███       | 27/90 [00:08<00:14,  4.40it/s][A
Training:  32%|███▏      | 29/90 [00:09<00:16,  3.70it/s][A
Training:  37%|███▋      | 33/90 [00:09<00:14,  3.99it/s][A
Training:  39%|███▉      | 35/90 [00:

Epoch: 19/48 - Loss: 2.8084 - Accuracy: 0.9452



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:16,  1.50s/it][A
 33%|███▎      | 4/12 [00:01<00:02,  2.67it/s][A
 42%|████▏     | 5/12 [00:02<00:03,  2.23it/s][A
 50%|█████     | 6/12 [00:02<00:02,  2.69it/s][A
 67%|██████▋   | 8/12 [00:02<00:01,  3.68it/s][A
 75%|███████▌  | 9/12 [00:03<00:00,  3.00it/s][A
100%|██████████| 12/12 [00:03<00:00,  3.15it/s][A
Epochs:  40%|███▉      | 19/48 [08:41<13:09, 27.24s/it]

Val Loss: 3.7812 - Val Accuracy: 0.9253



Training:   0%|          | 0/90 [00:00<?, ?it/s][A
Training:   1%|          | 1/90 [00:01<02:15,  1.52s/it][A
Training:   2%|▏         | 2/90 [00:01<01:02,  1.41it/s][A
Training:   4%|▍         | 4/90 [00:01<00:26,  3.29it/s][A
Training:   6%|▌         | 5/90 [00:02<00:40,  2.10it/s][A
Training:   9%|▉         | 8/90 [00:02<00:19,  4.27it/s][A
Training:  11%|█         | 10/90 [00:03<00:24,  3.22it/s][A
Training:  13%|█▎        | 12/90 [00:03<00:17,  4.48it/s][A
Training:  16%|█▌        | 14/90 [00:04<00:24,  3.16it/s][A
Training:  18%|█▊        | 16/90 [00:04<00:17,  4.21it/s][A
Training:  20%|██        | 18/90 [00:05<00:21,  3.35it/s][A
Training:  22%|██▏       | 20/90 [00:05<00:15,  4.38it/s][A
Training:  23%|██▎       | 21/90 [00:06<00:22,  3.13it/s][A
Training:  26%|██▌       | 23/90 [00:06<00:15,  4.25it/s][A
Training:  28%|██▊       | 25/90 [00:07<00:18,  3.48it/s][A
Training:  30%|███       | 27/90 [00:07<00:13,  4.59it/s][A
Training:  32%|███▏      | 29/90 [00:

Epoch: 20/48 - Loss: 2.9617 - Accuracy: 0.9412



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:13,  1.24s/it][A
 25%|██▌       | 3/12 [00:01<00:03,  2.67it/s][A
 42%|████▏     | 5/12 [00:02<00:02,  2.36it/s][A
 58%|█████▊    | 7/12 [00:02<00:01,  3.74it/s][A
100%|██████████| 12/12 [00:03<00:00,  3.29it/s][A
Epochs:  42%|████▏     | 20/48 [09:08<12:47, 27.41s/it]

Val Loss: 3.8276 - Val Accuracy: 0.9323



Training:   0%|          | 0/90 [00:00<?, ?it/s][A
Training:   1%|          | 1/90 [00:01<02:04,  1.40s/it][A
Training:   4%|▍         | 4/90 [00:01<00:26,  3.30it/s][A
Training:   7%|▋         | 6/90 [00:02<00:31,  2.66it/s][A
Training:  10%|█         | 9/90 [00:03<00:30,  2.69it/s][A
Training:  11%|█         | 10/90 [00:03<00:25,  3.09it/s][A
Training:  13%|█▎        | 12/90 [00:03<00:17,  4.35it/s][A
Training:  16%|█▌        | 14/90 [00:04<00:23,  3.30it/s][A
Training:  19%|█▉        | 17/90 [00:05<00:22,  3.26it/s][A
Training:  21%|██        | 19/90 [00:05<00:17,  4.08it/s][A
Training:  23%|██▎       | 21/90 [00:06<00:19,  3.56it/s][A
Training:  26%|██▌       | 23/90 [00:06<00:14,  4.60it/s][A
Training:  28%|██▊       | 25/90 [00:07<00:17,  3.62it/s][A
Training:  30%|███       | 27/90 [00:07<00:14,  4.47it/s][A
Training:  32%|███▏      | 29/90 [00:08<00:17,  3.57it/s][A
Training:  33%|███▎      | 30/90 [00:08<00:14,  4.01it/s][A
Training:  36%|███▌      | 32/90 [00

Epoch: 21/48 - Loss: 2.7393 - Accuracy: 0.9467



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:17,  1.63s/it][A
 25%|██▌       | 3/12 [00:01<00:04,  2.06it/s][A
 42%|████▏     | 5/12 [00:02<00:03,  2.15it/s][A
 67%|██████▋   | 8/12 [00:02<00:00,  4.07it/s][A
100%|██████████| 12/12 [00:03<00:00,  3.07it/s][A
Epochs:  44%|████▍     | 21/48 [09:36<12:23, 27.55s/it]

Val Loss: 3.3516 - Val Accuracy: 0.9341



Training:   0%|          | 0/90 [00:00<?, ?it/s][A
Training:   1%|          | 1/90 [00:01<02:15,  1.52s/it][A
Training:   3%|▎         | 3/90 [00:01<00:39,  2.18it/s][A
Training:   6%|▌         | 5/90 [00:02<00:41,  2.03it/s][A
Training:   7%|▋         | 6/90 [00:02<00:32,  2.55it/s][A
Training:   9%|▉         | 8/90 [00:02<00:19,  4.10it/s][A
Training:  11%|█         | 10/90 [00:03<00:26,  3.05it/s][A
Training:  14%|█▍        | 13/90 [00:04<00:26,  2.93it/s][A
Training:  17%|█▋        | 15/90 [00:05<00:19,  3.87it/s][A
Training:  19%|█▉        | 17/90 [00:05<00:21,  3.41it/s][A
Training:  21%|██        | 19/90 [00:05<00:15,  4.54it/s][A
Training:  23%|██▎       | 21/90 [00:06<00:18,  3.66it/s][A
Training:  26%|██▌       | 23/90 [00:06<00:14,  4.65it/s][A
Training:  28%|██▊       | 25/90 [00:07<00:18,  3.61it/s][A
Training:  30%|███       | 27/90 [00:07<00:13,  4.59it/s][A
Training:  32%|███▏      | 29/90 [00:08<00:16,  3.68it/s][A
Training:  34%|███▍      | 31/90 [00:

Epoch: 22/48 - Loss: 2.7462 - Accuracy: 0.9442



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:14,  1.35s/it][A
 17%|█▋        | 2/12 [00:01<00:06,  1.59it/s][A
 33%|███▎      | 4/12 [00:01<00:02,  3.62it/s][A
 42%|████▏     | 5/12 [00:02<00:03,  2.27it/s][A
 58%|█████▊    | 7/12 [00:02<00:01,  3.69it/s][A
 75%|███████▌  | 9/12 [00:03<00:01,  2.74it/s][A
100%|██████████| 12/12 [00:03<00:00,  3.10it/s][A
Epochs:  46%|████▌     | 22/48 [10:04<11:57, 27.58s/it]

Val Loss: 3.3979 - Val Accuracy: 0.9410



Training:   0%|          | 0/90 [00:00<?, ?it/s][A
Training:   1%|          | 1/90 [00:01<02:13,  1.50s/it][A
Training:   3%|▎         | 3/90 [00:01<00:38,  2.27it/s][A
Training:   6%|▌         | 5/90 [00:02<00:35,  2.39it/s][A
Training:   8%|▊         | 7/90 [00:02<00:22,  3.77it/s][A
Training:  10%|█         | 9/90 [00:03<00:28,  2.85it/s][A
Training:  12%|█▏        | 11/90 [00:03<00:20,  3.92it/s][A
Training:  14%|█▍        | 13/90 [00:04<00:25,  3.06it/s][A
Training:  17%|█▋        | 15/90 [00:04<00:18,  4.10it/s][A
Training:  19%|█▉        | 17/90 [00:05<00:20,  3.48it/s][A
Training:  22%|██▏       | 20/90 [00:05<00:13,  5.37it/s][A
Training:  24%|██▍       | 22/90 [00:06<00:17,  3.94it/s][A
Training:  28%|██▊       | 25/90 [00:07<00:17,  3.72it/s][A
Training:  31%|███       | 28/90 [00:07<00:11,  5.18it/s][A
Training:  33%|███▎      | 30/90 [00:08<00:14,  4.21it/s][A
Training:  36%|███▌      | 32/90 [00:08<00:10,  5.29it/s][A
Training:  38%|███▊      | 34/90 [00:

Epoch: 23/48 - Loss: 2.7464 - Accuracy: 0.9455



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:12,  1.11s/it][A
 17%|█▋        | 2/12 [00:01<00:05,  1.92it/s][A
 42%|████▏     | 5/12 [00:01<00:02,  3.40it/s][A
 58%|█████▊    | 7/12 [00:02<00:01,  4.75it/s][A
 67%|██████▋   | 8/12 [00:02<00:00,  5.27it/s][A
100%|██████████| 12/12 [00:02<00:00,  4.23it/s][A
Epochs:  48%|████▊     | 23/48 [10:27<10:53, 26.14s/it]

Val Loss: 3.2637 - Val Accuracy: 0.9432



Training:   0%|          | 0/90 [00:00<?, ?it/s][A
Training:   1%|          | 1/90 [00:01<01:36,  1.08s/it][A
Training:   6%|▌         | 5/90 [00:01<00:28,  2.93it/s][A
Training:   9%|▉         | 8/90 [00:02<00:16,  5.00it/s][A
Training:  11%|█         | 10/90 [00:02<00:20,  3.93it/s][A
Training:  14%|█▍        | 13/90 [00:03<00:18,  4.16it/s][A
Training:  19%|█▉        | 17/90 [00:04<00:17,  4.18it/s][A
Training:  23%|██▎       | 21/90 [00:05<00:15,  4.51it/s][A
Training:  27%|██▋       | 24/90 [00:05<00:11,  5.94it/s][A
Training:  29%|██▉       | 26/90 [00:05<00:12,  5.04it/s][A
Training:  32%|███▏      | 29/90 [00:06<00:13,  4.64it/s][A
Training:  36%|███▌      | 32/90 [00:06<00:09,  6.23it/s][A
Training:  38%|███▊      | 34/90 [00:07<00:11,  4.83it/s][A
Training:  41%|████      | 37/90 [00:08<00:11,  4.49it/s][A
Training:  42%|████▏     | 38/90 [00:08<00:10,  4.77it/s][A
Training:  46%|████▌     | 41/90 [00:09<00:10,  4.84it/s][A
Training:  47%|████▋     | 42/90 [0

Epoch: 24/48 - Loss: 2.7260 - Accuracy: 0.9453



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:13,  1.24s/it][A
 33%|███▎      | 4/12 [00:01<00:02,  3.72it/s][A
 50%|█████     | 6/12 [00:02<00:01,  3.20it/s][A
100%|██████████| 12/12 [00:02<00:00,  4.13it/s][A
Epochs:  50%|█████     | 24/48 [10:48<09:53, 24.72s/it]

Val Loss: 4.0313 - Val Accuracy: 0.9096



Training:   0%|          | 0/90 [00:00<?, ?it/s][A
Training:   1%|          | 1/90 [00:01<01:51,  1.25s/it][A
Training:   6%|▌         | 5/90 [00:02<00:30,  2.83it/s][A
Training:   9%|▉         | 8/90 [00:02<00:16,  4.98it/s][A
Training:  11%|█         | 10/90 [00:02<00:21,  3.79it/s][A
Training:  14%|█▍        | 13/90 [00:03<00:22,  3.50it/s][A
Training:  19%|█▉        | 17/90 [00:04<00:17,  4.11it/s][A
Training:  21%|██        | 19/90 [00:04<00:14,  5.03it/s][A
Training:  23%|██▎       | 21/90 [00:05<00:15,  4.35it/s][A
Training:  27%|██▋       | 24/90 [00:05<00:11,  5.95it/s][A
Training:  29%|██▉       | 26/90 [00:06<00:13,  4.68it/s][A
Training:  31%|███       | 28/90 [00:06<00:10,  5.86it/s][A
Training:  33%|███▎      | 30/90 [00:07<00:13,  4.53it/s][A
Training:  37%|███▋      | 33/90 [00:07<00:12,  4.42it/s][A
Training:  41%|████      | 37/90 [00:08<00:11,  4.66it/s][A
Training:  46%|████▌     | 41/90 [00:09<00:10,  4.66it/s][A
Training:  49%|████▉     | 44/90 [0

Epoch: 25/48 - Loss: 2.8079 - Accuracy: 0.9441



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:11,  1.02s/it][A
 42%|████▏     | 5/12 [00:01<00:02,  3.11it/s][A
 67%|██████▋   | 8/12 [00:02<00:00,  5.06it/s][A
100%|██████████| 12/12 [00:02<00:00,  4.36it/s][A
Epochs:  52%|█████▏    | 25/48 [11:09<09:05, 23.71s/it]

Val Loss: 3.7310 - Val Accuracy: 0.9302



Training:   0%|          | 0/90 [00:00<?, ?it/s][A
Training:   1%|          | 1/90 [00:01<01:29,  1.01s/it][A
Training:   3%|▎         | 3/90 [00:01<00:26,  3.23it/s][A
Training:   6%|▌         | 5/90 [00:01<00:28,  3.01it/s][A
Training:   8%|▊         | 7/90 [00:01<00:18,  4.56it/s][A
Training:  10%|█         | 9/90 [00:02<00:22,  3.66it/s][A
Training:  12%|█▏        | 11/90 [00:02<00:15,  5.00it/s][A
Training:  14%|█▍        | 13/90 [00:03<00:19,  4.03it/s][A
Training:  17%|█▋        | 15/90 [00:03<00:14,  5.33it/s][A
Training:  19%|█▉        | 17/90 [00:04<00:16,  4.40it/s][A
Training:  21%|██        | 19/90 [00:04<00:13,  5.44it/s][A
Training:  23%|██▎       | 21/90 [00:05<00:15,  4.43it/s][A
Training:  26%|██▌       | 23/90 [00:05<00:11,  5.65it/s][A
Training:  28%|██▊       | 25/90 [00:05<00:14,  4.57it/s][A
Training:  29%|██▉       | 26/90 [00:05<00:12,  5.03it/s][A
Training:  31%|███       | 28/90 [00:06<00:09,  6.37it/s][A
Training:  32%|███▏      | 29/90 [00:

Epoch: 26/48 - Loss: 2.8911 - Accuracy: 0.9415



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:11,  1.06s/it][A
 33%|███▎      | 4/12 [00:01<00:01,  4.36it/s][A
 50%|█████     | 6/12 [00:01<00:01,  3.59it/s][A
 67%|██████▋   | 8/12 [00:02<00:00,  4.81it/s][A
100%|██████████| 12/12 [00:02<00:00,  4.28it/s][A
Epochs:  54%|█████▍    | 26/48 [11:30<08:23, 22.88s/it]

Val Loss: 3.2868 - Val Accuracy: 0.9440



Training:   0%|          | 0/90 [00:00<?, ?it/s][A
Training:   1%|          | 1/90 [00:01<01:37,  1.09s/it][A
Training:   3%|▎         | 3/90 [00:01<00:28,  3.04it/s][A
Training:   6%|▌         | 5/90 [00:01<00:28,  3.02it/s][A
Training:   7%|▋         | 6/90 [00:02<00:23,  3.60it/s][A
Training:   8%|▊         | 7/90 [00:02<00:19,  4.37it/s][A
Training:  10%|█         | 9/90 [00:02<00:22,  3.64it/s][A
Training:  11%|█         | 10/90 [00:03<00:21,  3.70it/s][A
Training:  14%|█▍        | 13/90 [00:03<00:17,  4.44it/s][A
Training:  16%|█▌        | 14/90 [00:03<00:17,  4.23it/s][A
Training:  19%|█▉        | 17/90 [00:04<00:15,  4.77it/s][A
Training:  20%|██        | 18/90 [00:04<00:17,  4.11it/s][A
Training:  22%|██▏       | 20/90 [00:04<00:12,  5.44it/s][A
Training:  23%|██▎       | 21/90 [00:05<00:14,  4.69it/s][A
Training:  24%|██▍       | 22/90 [00:05<00:16,  4.08it/s][A
Training:  28%|██▊       | 25/90 [00:06<00:12,  5.37it/s][A
Training:  29%|██▉       | 26/90 [00:0

Epoch: 27/48 - Loss: 2.7714 - Accuracy: 0.9450



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:00<00:07,  1.45it/s][A
 42%|████▏     | 5/12 [00:01<00:01,  4.60it/s][A
100%|██████████| 12/12 [00:01<00:00,  6.02it/s][A
Epochs:  56%|█████▋    | 27/48 [11:50<07:42, 22.01s/it]

Val Loss: 3.8131 - Val Accuracy: 0.9332



Training:   0%|          | 0/90 [00:00<?, ?it/s][A
Training:   1%|          | 1/90 [00:00<01:11,  1.24it/s][A
Training:   6%|▌         | 5/90 [00:01<00:19,  4.42it/s][A
Training:   8%|▊         | 7/90 [00:01<00:13,  6.07it/s][A
Training:  10%|█         | 9/90 [00:01<00:15,  5.16it/s][A
Training:  12%|█▏        | 11/90 [00:02<00:11,  6.86it/s][A
Training:  14%|█▍        | 13/90 [00:02<00:14,  5.34it/s][A
Training:  17%|█▋        | 15/90 [00:02<00:10,  6.90it/s][A
Training:  19%|█▉        | 17/90 [00:03<00:12,  6.07it/s][A
Training:  20%|██        | 18/90 [00:03<00:11,  6.41it/s][A
Training:  23%|██▎       | 21/90 [00:03<00:10,  6.71it/s][A
Training:  24%|██▍       | 22/90 [00:03<00:09,  6.88it/s][A
Training:  28%|██▊       | 25/90 [00:04<00:10,  6.48it/s][A
Training:  30%|███       | 27/90 [00:04<00:07,  7.91it/s][A
Training:  32%|███▏      | 29/90 [00:04<00:10,  5.88it/s][A
Training:  37%|███▋      | 33/90 [00:05<00:08,  6.45it/s][A
Training:  40%|████      | 36/90 [00

Epoch: 28/48 - Loss: 2.6710 - Accuracy: 0.9468



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:00<00:09,  1.22it/s][A
 42%|████▏     | 5/12 [00:01<00:01,  4.14it/s][A
100%|██████████| 12/12 [00:02<00:00,  5.73it/s][A
Epochs:  58%|█████▊    | 28/48 [12:07<06:45, 20.26s/it]

Val Loss: 3.3120 - Val Accuracy: 0.9394



Training:   0%|          | 0/90 [00:00<?, ?it/s][A
Training:   1%|          | 1/90 [00:00<01:08,  1.31it/s][A
Training:   6%|▌         | 5/90 [00:01<00:20,  4.08it/s][A
Training:  10%|█         | 9/90 [00:01<00:15,  5.36it/s][A
Training:  14%|█▍        | 13/90 [00:02<00:12,  5.96it/s][A
Training:  19%|█▉        | 17/90 [00:03<00:11,  6.51it/s][A
Training:  22%|██▏       | 20/90 [00:03<00:08,  8.25it/s][A
Training:  24%|██▍       | 22/90 [00:03<00:10,  6.32it/s][A
Training:  28%|██▊       | 25/90 [00:04<00:11,  5.80it/s][A
Training:  32%|███▏      | 29/90 [00:04<00:09,  6.42it/s][A
Training:  37%|███▋      | 33/90 [00:05<00:08,  6.65it/s][A
Training:  40%|████      | 36/90 [00:05<00:06,  8.37it/s][A
Training:  42%|████▏     | 38/90 [00:06<00:08,  6.43it/s][A
Training:  46%|████▌     | 41/90 [00:06<00:08,  6.08it/s][A
Training:  50%|█████     | 45/90 [00:07<00:06,  6.50it/s][A
Training:  53%|█████▎    | 48/90 [00:07<00:05,  8.22it/s][A
Training:  56%|█████▌    | 50/90 [0

Epoch: 29/48 - Loss: 2.7907 - Accuracy: 0.9426



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:00<00:09,  1.15it/s][A
 42%|████▏     | 5/12 [00:01<00:01,  3.71it/s][A
100%|██████████| 12/12 [00:02<00:00,  5.52it/s][A
Epochs:  60%|██████    | 29/48 [12:23<06:00, 18.96s/it]

Val Loss: 3.2897 - Val Accuracy: 0.9378



Training:   0%|          | 0/90 [00:00<?, ?it/s][A
Training:   1%|          | 1/90 [00:00<01:10,  1.27it/s][A
Training:   2%|▏         | 2/90 [00:00<00:34,  2.56it/s][A
Training:   6%|▌         | 5/90 [00:01<00:19,  4.33it/s][A
Training:   8%|▊         | 7/90 [00:01<00:13,  6.31it/s][A
Training:  10%|█         | 9/90 [00:01<00:15,  5.33it/s][A
Training:  13%|█▎        | 12/90 [00:02<00:09,  8.26it/s][A
Training:  16%|█▌        | 14/90 [00:02<00:11,  6.39it/s][A
Training:  19%|█▉        | 17/90 [00:03<00:11,  6.11it/s][A
Training:  20%|██        | 18/90 [00:03<00:11,  6.26it/s][A
Training:  23%|██▎       | 21/90 [00:03<00:11,  6.24it/s][A
Training:  26%|██▌       | 23/90 [00:03<00:09,  7.27it/s][A
Training:  28%|██▊       | 25/90 [00:04<00:09,  6.57it/s][A
Training:  30%|███       | 27/90 [00:04<00:08,  7.44it/s][A
Training:  32%|███▏      | 29/90 [00:04<00:09,  6.48it/s][A
Training:  34%|███▍      | 31/90 [00:04<00:07,  7.72it/s][A
Training:  37%|███▋      | 33/90 [00:

Epoch: 30/48 - Loss: 2.8633 - Accuracy: 0.9420



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:00<00:10,  1.08it/s][A
 42%|████▏     | 5/12 [00:01<00:01,  3.71it/s][A
100%|██████████| 12/12 [00:02<00:00,  5.65it/s][A
Epochs:  62%|██████▎   | 30/48 [12:38<05:24, 18.04s/it]

Val Loss: 3.7015 - Val Accuracy: 0.9334



Training:   0%|          | 0/90 [00:00<?, ?it/s][A
Training:   1%|          | 1/90 [00:00<01:16,  1.17it/s][A
Training:   6%|▌         | 5/90 [00:01<00:21,  3.90it/s][A
Training:  10%|█         | 9/90 [00:02<00:15,  5.25it/s][A
Training:  14%|█▍        | 13/90 [00:02<00:13,  5.84it/s][A
Training:  19%|█▉        | 17/90 [00:03<00:11,  6.15it/s][A
Training:  20%|██        | 18/90 [00:03<00:11,  6.43it/s][A
Training:  23%|██▎       | 21/90 [00:03<00:10,  6.44it/s][A
Training:  26%|██▌       | 23/90 [00:03<00:08,  7.49it/s][A
Training:  28%|██▊       | 25/90 [00:04<00:10,  6.45it/s][A
Training:  30%|███       | 27/90 [00:04<00:08,  7.82it/s][A
Training:  32%|███▏      | 29/90 [00:04<00:10,  6.02it/s][A
Training:  34%|███▍      | 31/90 [00:05<00:08,  7.33it/s][A
Training:  37%|███▋      | 33/90 [00:05<00:09,  5.95it/s][A
Training:  39%|███▉      | 35/90 [00:05<00:07,  7.23it/s][A
Training:  41%|████      | 37/90 [00:06<00:08,  6.57it/s][A
Training:  43%|████▎     | 39/90 [0

Epoch: 31/48 - Loss: 2.6842 - Accuracy: 0.9461



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:00<00:09,  1.22it/s][A
 42%|████▏     | 5/12 [00:01<00:01,  4.46it/s][A
100%|██████████| 12/12 [00:01<00:00,  6.24it/s][A
Epochs:  65%|██████▍   | 31/48 [12:54<04:53, 17.26s/it]

Val Loss: 3.6396 - Val Accuracy: 0.9267



Training:   0%|          | 0/90 [00:00<?, ?it/s][A
Training:   1%|          | 1/90 [00:00<01:20,  1.10it/s][A
Training:   6%|▌         | 5/90 [00:01<00:20,  4.09it/s][A
Training:  10%|█         | 9/90 [00:02<00:15,  5.25it/s][A
Training:  13%|█▎        | 12/90 [00:02<00:10,  7.53it/s][A
Training:  16%|█▌        | 14/90 [00:02<00:12,  5.87it/s][A
Training:  19%|█▉        | 17/90 [00:03<00:12,  5.69it/s][A
Training:  23%|██▎       | 21/90 [00:03<00:11,  6.06it/s][A
Training:  28%|██▊       | 25/90 [00:04<00:10,  6.21it/s][A
Training:  32%|███▏      | 29/90 [00:05<00:09,  6.26it/s][A
Training:  37%|███▋      | 33/90 [00:05<00:08,  6.58it/s][A
Training:  41%|████      | 37/90 [00:06<00:07,  6.82it/s][A
Training:  44%|████▍     | 40/90 [00:06<00:05,  8.44it/s][A
Training:  47%|████▋     | 42/90 [00:06<00:07,  6.74it/s][A
Training:  50%|█████     | 45/90 [00:07<00:07,  5.98it/s][A
Training:  54%|█████▍    | 49/90 [00:08<00:06,  6.34it/s][A
Training:  59%|█████▉    | 53/90 [0

Epoch: 32/48 - Loss: 2.6975 - Accuracy: 0.9447



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:00<00:08,  1.28it/s][A
 42%|████▏     | 5/12 [00:01<00:01,  4.10it/s][A
100%|██████████| 12/12 [00:02<00:00,  5.67it/s][A
Epochs:  67%|██████▋   | 32/48 [13:10<04:30, 16.92s/it]

Val Loss: 3.1072 - Val Accuracy: 0.9384



Training:   0%|          | 0/90 [00:00<?, ?it/s][A
Training:   1%|          | 1/90 [00:00<01:11,  1.24it/s][A
Training:   4%|▍         | 4/90 [00:00<00:16,  5.36it/s][A
Training:   7%|▋         | 6/90 [00:01<00:17,  4.77it/s][A
Training:  10%|█         | 9/90 [00:02<00:16,  4.78it/s][A
Training:  13%|█▎        | 12/90 [00:02<00:11,  7.04it/s][A
Training:  16%|█▌        | 14/90 [00:02<00:12,  5.88it/s][A
Training:  19%|█▉        | 17/90 [00:03<00:12,  5.68it/s][A
Training:  22%|██▏       | 20/90 [00:03<00:08,  7.84it/s][A
Training:  24%|██▍       | 22/90 [00:03<00:11,  5.98it/s][A
Training:  27%|██▋       | 24/90 [00:04<00:09,  7.21it/s][A
Training:  29%|██▉       | 26/90 [00:04<00:10,  5.99it/s][A
Training:  32%|███▏      | 29/90 [00:05<00:10,  5.85it/s][A
Training:  37%|███▋      | 33/90 [00:05<00:09,  6.26it/s][A
Training:  41%|████      | 37/90 [00:06<00:08,  5.98it/s][A
Training:  46%|████▌     | 41/90 [00:06<00:07,  6.41it/s][A
Training:  50%|█████     | 45/90 [00

Epoch: 33/48 - Loss: 2.5285 - Accuracy: 0.9495



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:00<00:09,  1.18it/s][A
 42%|████▏     | 5/12 [00:01<00:01,  4.04it/s][A
 67%|██████▋   | 8/12 [00:01<00:00,  6.78it/s][A
100%|██████████| 12/12 [00:02<00:00,  5.70it/s][A
Epochs:  69%|██████▉   | 33/48 [13:26<04:09, 16.64s/it]

Val Loss: 3.1416 - Val Accuracy: 0.9437



Training:   0%|          | 0/90 [00:00<?, ?it/s][A
Training:   1%|          | 1/90 [00:00<01:20,  1.11it/s][A
Training:   6%|▌         | 5/90 [00:01<00:21,  3.97it/s][A
Training:  10%|█         | 9/90 [00:01<00:15,  5.36it/s][A
Training:  13%|█▎        | 12/90 [00:02<00:10,  7.66it/s][A
Training:  16%|█▌        | 14/90 [00:02<00:13,  5.65it/s][A
Training:  19%|█▉        | 17/90 [00:03<00:13,  5.51it/s][A
Training:  23%|██▎       | 21/90 [00:03<00:11,  6.18it/s][A
Training:  28%|██▊       | 25/90 [00:04<00:09,  6.69it/s][A
Training:  32%|███▏      | 29/90 [00:04<00:09,  6.64it/s][A
Training:  37%|███▋      | 33/90 [00:05<00:08,  6.36it/s][A
Training:  41%|████      | 37/90 [00:06<00:07,  6.65it/s][A
Training:  46%|████▌     | 41/90 [00:06<00:07,  6.81it/s][A
Training:  50%|█████     | 45/90 [00:07<00:06,  6.64it/s][A
Training:  54%|█████▍    | 49/90 [00:07<00:06,  6.62it/s][A
Training:  59%|█████▉    | 53/90 [00:08<00:05,  6.91it/s][A
Training:  63%|██████▎   | 57/90 [0

Epoch: 34/48 - Loss: 2.4852 - Accuracy: 0.9510



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:00<00:09,  1.22it/s][A
 42%|████▏     | 5/12 [00:01<00:01,  4.07it/s][A
100%|██████████| 12/12 [00:02<00:00,  5.75it/s][A
Epochs:  71%|███████   | 34/48 [13:42<03:50, 16.47s/it]

Val Loss: 3.1412 - Val Accuracy: 0.9437



Training:   0%|          | 0/90 [00:00<?, ?it/s][A
Training:   1%|          | 1/90 [00:00<01:11,  1.25it/s][A
Training:   4%|▍         | 4/90 [00:00<00:15,  5.57it/s][A
Training:   7%|▋         | 6/90 [00:01<00:18,  4.57it/s][A
Training:  10%|█         | 9/90 [00:02<00:17,  4.72it/s][A
Training:  14%|█▍        | 13/90 [00:02<00:13,  5.79it/s][A
Training:  18%|█▊        | 16/90 [00:02<00:09,  7.96it/s][A
Training:  20%|██        | 18/90 [00:03<00:11,  6.25it/s][A
Training:  23%|██▎       | 21/90 [00:03<00:12,  5.52it/s][A
Training:  28%|██▊       | 25/90 [00:04<00:10,  5.93it/s][A
Training:  32%|███▏      | 29/90 [00:05<00:09,  6.27it/s][A
Training:  37%|███▋      | 33/90 [00:05<00:09,  6.23it/s][A
Training:  41%|████      | 37/90 [00:06<00:08,  6.40it/s][A
Training:  46%|████▌     | 41/90 [00:06<00:07,  6.67it/s][A
Training:  50%|█████     | 45/90 [00:07<00:06,  6.81it/s][A
Training:  54%|█████▍    | 49/90 [00:07<00:06,  6.81it/s][A
Training:  59%|█████▉    | 53/90 [00

Epoch: 35/48 - Loss: 2.5215 - Accuracy: 0.9489



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:00<00:08,  1.25it/s][A
 42%|████▏     | 5/12 [00:01<00:01,  4.39it/s][A
100%|██████████| 12/12 [00:01<00:00,  6.34it/s][A
Epochs:  73%|███████▎  | 35/48 [13:58<03:31, 16.24s/it]

Val Loss: 3.2986 - Val Accuracy: 0.9382



Training:   0%|          | 0/90 [00:00<?, ?it/s][A
Training:   1%|          | 1/90 [00:00<01:14,  1.20it/s][A
Training:   6%|▌         | 5/90 [00:01<00:22,  3.86it/s][A
Training:  10%|█         | 9/90 [00:02<00:15,  5.12it/s][A
Training:  14%|█▍        | 13/90 [00:02<00:13,  5.92it/s][A
Training:  19%|█▉        | 17/90 [00:03<00:11,  6.32it/s][A
Training:  23%|██▎       | 21/90 [00:03<00:11,  6.17it/s][A
Training:  27%|██▋       | 24/90 [00:03<00:08,  7.86it/s][A
Training:  29%|██▉       | 26/90 [00:04<00:09,  6.52it/s][A
Training:  32%|███▏      | 29/90 [00:04<00:09,  6.14it/s][A
Training:  37%|███▋      | 33/90 [00:05<00:09,  6.30it/s][A
Training:  41%|████      | 37/90 [00:06<00:08,  6.31it/s][A
Training:  46%|████▌     | 41/90 [00:06<00:07,  6.48it/s][A
Training:  50%|█████     | 45/90 [00:07<00:06,  6.74it/s][A
Training:  54%|█████▍    | 49/90 [00:07<00:06,  6.77it/s][A
Training:  59%|█████▉    | 53/90 [00:08<00:05,  6.80it/s][A
Training:  63%|██████▎   | 57/90 [0

Epoch: 36/48 - Loss: 2.5103 - Accuracy: 0.9476



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:00<00:09,  1.13it/s][A
 25%|██▌       | 3/12 [00:00<00:02,  3.72it/s][A
 42%|████▏     | 5/12 [00:01<00:01,  3.81it/s][A
100%|██████████| 12/12 [00:02<00:00,  5.60it/s][A
Epochs:  75%|███████▌  | 36/48 [14:14<03:13, 16.16s/it]

Val Loss: 3.1549 - Val Accuracy: 0.9421



Training:   0%|          | 0/90 [00:00<?, ?it/s][A
Training:   1%|          | 1/90 [00:00<01:17,  1.15it/s][A
Training:   6%|▌         | 5/90 [00:01<00:21,  3.98it/s][A
Training:  10%|█         | 9/90 [00:02<00:15,  5.23it/s][A
Training:  13%|█▎        | 12/90 [00:02<00:10,  7.49it/s][A
Training:  16%|█▌        | 14/90 [00:02<00:12,  5.92it/s][A
Training:  19%|█▉        | 17/90 [00:03<00:13,  5.54it/s][A
Training:  23%|██▎       | 21/90 [00:03<00:11,  5.98it/s][A
Training:  28%|██▊       | 25/90 [00:04<00:10,  6.17it/s][A
Training:  32%|███▏      | 29/90 [00:05<00:09,  6.47it/s][A
Training:  37%|███▋      | 33/90 [00:05<00:08,  6.65it/s][A
Training:  41%|████      | 37/90 [00:06<00:07,  6.81it/s][A
Training:  46%|████▌     | 41/90 [00:06<00:07,  6.91it/s][A
Training:  50%|█████     | 45/90 [00:07<00:06,  6.83it/s][A
Training:  54%|█████▍    | 49/90 [00:07<00:05,  6.89it/s][A
Training:  59%|█████▉    | 53/90 [00:08<00:05,  6.99it/s][A
Training:  63%|██████▎   | 57/90 [0

Epoch: 37/48 - Loss: 2.5179 - Accuracy: 0.9498



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:00<00:08,  1.30it/s][A
 42%|████▏     | 5/12 [00:01<00:01,  4.25it/s][A
100%|██████████| 12/12 [00:02<00:00,  5.87it/s][A
Epochs:  77%|███████▋  | 37/48 [14:30<02:57, 16.12s/it]

Val Loss: 3.1238 - Val Accuracy: 0.9360



Training:   0%|          | 0/90 [00:00<?, ?it/s][A
Training:   1%|          | 1/90 [00:00<01:10,  1.26it/s][A
Training:   6%|▌         | 5/90 [00:01<00:19,  4.39it/s][A
Training:   8%|▊         | 7/90 [00:01<00:13,  6.17it/s][A
Training:  10%|█         | 9/90 [00:01<00:16,  5.02it/s][A
Training:  11%|█         | 10/90 [00:02<00:15,  5.29it/s][A
Training:  14%|█▍        | 13/90 [00:02<00:13,  5.73it/s][A
Training:  16%|█▌        | 14/90 [00:02<00:12,  6.09it/s][A
Training:  19%|█▉        | 17/90 [00:03<00:11,  6.31it/s][A
Training:  21%|██        | 19/90 [00:03<00:09,  7.80it/s][A
Training:  23%|██▎       | 21/90 [00:03<00:10,  6.28it/s][A
Training:  24%|██▍       | 22/90 [00:03<00:10,  6.53it/s][A
Training:  28%|██▊       | 25/90 [00:04<00:09,  6.54it/s][A
Training:  29%|██▉       | 26/90 [00:04<00:09,  6.78it/s][A
Training:  32%|███▏      | 29/90 [00:04<00:09,  6.49it/s][A
Training:  33%|███▎      | 30/90 [00:05<00:08,  6.84it/s][A
Training:  37%|███▋      | 33/90 [00

Epoch: 38/48 - Loss: 2.6295 - Accuracy: 0.9468



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:00<00:09,  1.19it/s][A
 42%|████▏     | 5/12 [00:01<00:01,  3.94it/s][A
100%|██████████| 12/12 [00:02<00:00,  5.70it/s][A
Epochs:  79%|███████▉  | 38/48 [14:46<02:40, 16.10s/it]

Val Loss: 3.2641 - Val Accuracy: 0.9410



Training:   0%|          | 0/90 [00:00<?, ?it/s][A
Training:   1%|          | 1/90 [00:00<01:18,  1.14it/s][A
Training:   6%|▌         | 5/90 [00:01<00:20,  4.10it/s][A
Training:   9%|▉         | 8/90 [00:01<00:12,  6.66it/s][A
Training:  11%|█         | 10/90 [00:02<00:14,  5.33it/s][A
Training:  14%|█▍        | 13/90 [00:02<00:12,  6.02it/s][A
Training:  16%|█▌        | 14/90 [00:02<00:12,  6.29it/s][A
Training:  19%|█▉        | 17/90 [00:03<00:11,  6.25it/s][A
Training:  20%|██        | 18/90 [00:03<00:11,  6.31it/s][A
Training:  23%|██▎       | 21/90 [00:03<00:10,  6.36it/s][A
Training:  24%|██▍       | 22/90 [00:03<00:10,  6.44it/s][A
Training:  28%|██▊       | 25/90 [00:04<00:09,  6.77it/s][A
Training:  29%|██▉       | 26/90 [00:04<00:09,  7.04it/s][A
Training:  31%|███       | 28/90 [00:04<00:07,  8.34it/s][A
Training:  32%|███▏      | 29/90 [00:04<00:09,  6.62it/s][A
Training:  33%|███▎      | 30/90 [00:04<00:08,  6.85it/s][A
Training:  36%|███▌      | 32/90 [0

Epoch: 39/48 - Loss: 2.5893 - Accuracy: 0.9469



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:00<00:10,  1.08it/s][A
 42%|████▏     | 5/12 [00:01<00:01,  4.03it/s][A
100%|██████████| 12/12 [00:02<00:00,  5.77it/s][A
Epochs:  81%|████████▏ | 39/48 [15:01<02:23, 15.95s/it]

Val Loss: 3.2898 - Val Accuracy: 0.9355



Training:   0%|          | 0/90 [00:00<?, ?it/s][A
Training:   1%|          | 1/90 [00:00<01:08,  1.30it/s][A
Training:   6%|▌         | 5/90 [00:01<00:19,  4.41it/s][A
Training:  10%|█         | 9/90 [00:01<00:15,  5.30it/s][A
Training:  13%|█▎        | 12/90 [00:02<00:10,  7.62it/s][A
Training:  16%|█▌        | 14/90 [00:02<00:12,  6.04it/s][A
Training:  19%|█▉        | 17/90 [00:03<00:12,  5.81it/s][A
Training:  23%|██▎       | 21/90 [00:03<00:10,  6.35it/s][A
Training:  28%|██▊       | 25/90 [00:04<00:10,  6.36it/s][A
Training:  32%|███▏      | 29/90 [00:04<00:09,  6.33it/s][A
Training:  37%|███▋      | 33/90 [00:05<00:08,  6.55it/s][A
Training:  41%|████      | 37/90 [00:06<00:08,  6.53it/s][A
Training:  46%|████▌     | 41/90 [00:06<00:07,  6.82it/s][A
Training:  49%|████▉     | 44/90 [00:06<00:05,  8.46it/s][A
Training:  51%|█████     | 46/90 [00:07<00:06,  6.69it/s][A
Training:  54%|█████▍    | 49/90 [00:07<00:06,  6.28it/s][A
Training:  59%|█████▉    | 53/90 [0

Epoch: 40/48 - Loss: 2.5069 - Accuracy: 0.9484



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:00<00:08,  1.29it/s][A
 42%|████▏     | 5/12 [00:01<00:01,  4.13it/s][A
100%|██████████| 12/12 [00:02<00:00,  5.76it/s][A
Epochs:  83%|████████▎ | 40/48 [15:17<02:07, 15.97s/it]

Val Loss: 3.1227 - Val Accuracy: 0.9448



Training:   0%|          | 0/90 [00:00<?, ?it/s][A
Training:   1%|          | 1/90 [00:00<01:12,  1.23it/s][A
Training:   2%|▏         | 2/90 [00:00<00:37,  2.33it/s][A
Training:   6%|▌         | 5/90 [00:01<00:19,  4.43it/s][A
Training:   7%|▋         | 6/90 [00:01<00:16,  4.95it/s][A
Training:  10%|█         | 9/90 [00:02<00:14,  5.59it/s][A
Training:  11%|█         | 10/90 [00:02<00:14,  5.60it/s][A
Training:  14%|█▍        | 13/90 [00:02<00:11,  6.52it/s][A
Training:  16%|█▌        | 14/90 [00:02<00:12,  6.18it/s][A
Training:  19%|█▉        | 17/90 [00:03<00:10,  7.24it/s][A
Training:  20%|██        | 18/90 [00:03<00:11,  6.34it/s][A
Training:  23%|██▎       | 21/90 [00:03<00:09,  7.15it/s][A
Training:  24%|██▍       | 22/90 [00:03<00:10,  6.24it/s][A
Training:  28%|██▊       | 25/90 [00:04<00:09,  6.80it/s][A
Training:  29%|██▉       | 26/90 [00:04<00:10,  6.23it/s][A
Training:  32%|███▏      | 29/90 [00:04<00:09,  6.76it/s][A
Training:  33%|███▎      | 30/90 [00:

Epoch: 41/48 - Loss: 2.5000 - Accuracy: 0.9482



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:00<00:09,  1.18it/s][A
 33%|███▎      | 4/12 [00:00<00:01,  5.32it/s][A
 50%|█████     | 6/12 [00:01<00:01,  4.59it/s][A
100%|██████████| 12/12 [00:02<00:00,  5.64it/s][A
Epochs:  85%|████████▌ | 41/48 [15:33<01:51, 15.97s/it]

Val Loss: 3.2264 - Val Accuracy: 0.9387



Training:   0%|          | 0/90 [00:00<?, ?it/s][A
Training:   1%|          | 1/90 [00:00<01:14,  1.20it/s][A
Training:   6%|▌         | 5/90 [00:01<00:20,  4.12it/s][A
Training:   9%|▉         | 8/90 [00:01<00:11,  6.85it/s][A
Training:  11%|█         | 10/90 [00:02<00:14,  5.45it/s][A
Training:  14%|█▍        | 13/90 [00:02<00:13,  5.61it/s][A
Training:  19%|█▉        | 17/90 [00:03<00:12,  5.87it/s][A
Training:  23%|██▎       | 21/90 [00:03<00:11,  6.05it/s][A
Training:  27%|██▋       | 24/90 [00:03<00:08,  7.70it/s][A
Training:  29%|██▉       | 26/90 [00:04<00:09,  6.59it/s][A
Training:  32%|███▏      | 29/90 [00:04<00:09,  6.29it/s][A
Training:  36%|███▌      | 32/90 [00:05<00:07,  8.19it/s][A
Training:  38%|███▊      | 34/90 [00:05<00:08,  6.57it/s][A
Training:  41%|████      | 37/90 [00:06<00:08,  5.99it/s][A
Training:  46%|████▌     | 41/90 [00:06<00:07,  6.64it/s][A
Training:  50%|█████     | 45/90 [00:07<00:06,  6.85it/s][A
Training:  54%|█████▍    | 49/90 [0

Epoch: 42/48 - Loss: 2.4586 - Accuracy: 0.9490



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:00<00:10,  1.10it/s][A
 33%|███▎      | 4/12 [00:01<00:01,  4.99it/s][A
 50%|█████     | 6/12 [00:01<00:01,  4.32it/s][A
100%|██████████| 12/12 [00:02<00:00,  5.60it/s][A
Epochs:  88%|████████▊ | 42/48 [15:50<01:36, 16.02s/it]

Val Loss: 3.5066 - Val Accuracy: 0.9398



Training:   0%|          | 0/90 [00:00<?, ?it/s][A
Training:   1%|          | 1/90 [00:00<01:09,  1.28it/s][A
Training:   4%|▍         | 4/90 [00:00<00:15,  5.44it/s][A
Training:   7%|▋         | 6/90 [00:01<00:17,  4.70it/s][A
Training:  10%|█         | 9/90 [00:01<00:16,  4.96it/s][A
Training:  13%|█▎        | 12/90 [00:02<00:10,  7.36it/s][A
Training:  16%|█▌        | 14/90 [00:02<00:12,  6.04it/s][A
Training:  18%|█▊        | 16/90 [00:02<00:09,  7.49it/s][A
Training:  20%|██        | 18/90 [00:03<00:12,  5.81it/s][A
Training:  23%|██▎       | 21/90 [00:03<00:12,  5.61it/s][A
Training:  28%|██▊       | 25/90 [00:04<00:10,  6.22it/s][A
Training:  31%|███       | 28/90 [00:04<00:07,  8.12it/s][A
Training:  33%|███▎      | 30/90 [00:04<00:08,  6.94it/s][A
Training:  36%|███▌      | 32/90 [00:05<00:07,  8.22it/s][A
Training:  38%|███▊      | 34/90 [00:05<00:09,  6.07it/s][A
Training:  41%|████      | 37/90 [00:06<00:09,  5.78it/s][A
Training:  44%|████▍     | 40/90 [00

Epoch: 43/48 - Loss: 2.3901 - Accuracy: 0.9520



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:00<00:09,  1.14it/s][A
 33%|███▎      | 4/12 [00:01<00:01,  5.04it/s][A
 50%|█████     | 6/12 [00:01<00:01,  4.52it/s][A
100%|██████████| 12/12 [00:02<00:00,  5.78it/s][A
Epochs:  90%|████████▉ | 43/48 [16:05<01:19, 15.88s/it]

Val Loss: 3.2263 - Val Accuracy: 0.9403



Training:   0%|          | 0/90 [00:00<?, ?it/s][A
Training:   1%|          | 1/90 [00:00<01:04,  1.37it/s][A
Training:   6%|▌         | 5/90 [00:01<00:19,  4.41it/s][A
Training:   9%|▉         | 8/90 [00:01<00:11,  7.40it/s][A
Training:  11%|█         | 10/90 [00:01<00:13,  6.02it/s][A
Training:  14%|█▍        | 13/90 [00:02<00:12,  5.99it/s][A
Training:  18%|█▊        | 16/90 [00:02<00:08,  8.39it/s][A
Training:  20%|██        | 18/90 [00:03<00:11,  6.21it/s][A
Training:  22%|██▏       | 20/90 [00:03<00:09,  7.30it/s][A
Training:  24%|██▍       | 22/90 [00:03<00:11,  6.03it/s][A
Training:  28%|██▊       | 25/90 [00:04<00:11,  5.86it/s][A
Training:  32%|███▏      | 29/90 [00:04<00:09,  6.15it/s][A
Training:  36%|███▌      | 32/90 [00:04<00:07,  8.11it/s][A
Training:  38%|███▊      | 34/90 [00:05<00:08,  6.42it/s][A
Training:  40%|████      | 36/90 [00:05<00:07,  7.59it/s][A
Training:  42%|████▏     | 38/90 [00:06<00:08,  6.30it/s][A
Training:  44%|████▍     | 40/90 [0

Epoch: 44/48 - Loss: 2.6848 - Accuracy: 0.9435



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:00<00:09,  1.22it/s][A
 42%|████▏     | 5/12 [00:01<00:01,  4.30it/s][A
100%|██████████| 12/12 [00:02<00:00,  5.98it/s][A
Epochs:  92%|█████████▏| 44/48 [16:21<01:03, 15.83s/it]

Val Loss: 3.3150 - Val Accuracy: 0.9389



Training:   0%|          | 0/90 [00:00<?, ?it/s][A
Training:   1%|          | 1/90 [00:00<01:14,  1.20it/s][A
Training:   6%|▌         | 5/90 [00:01<00:20,  4.20it/s][A
Training:  10%|█         | 9/90 [00:02<00:16,  5.05it/s][A
Training:  14%|█▍        | 13/90 [00:02<00:13,  5.67it/s][A
Training:  18%|█▊        | 16/90 [00:02<00:09,  7.57it/s][A
Training:  20%|██        | 18/90 [00:03<00:11,  6.42it/s][A
Training:  23%|██▎       | 21/90 [00:03<00:11,  6.03it/s][A
Training:  28%|██▊       | 25/90 [00:04<00:10,  6.25it/s][A
Training:  32%|███▏      | 29/90 [00:04<00:09,  6.39it/s][A
Training:  37%|███▋      | 33/90 [00:05<00:08,  6.81it/s][A
Training:  40%|████      | 36/90 [00:05<00:06,  8.50it/s][A
Training:  42%|████▏     | 38/90 [00:06<00:07,  6.59it/s][A
Training:  46%|████▌     | 41/90 [00:06<00:08,  6.09it/s][A
Training:  50%|█████     | 45/90 [00:07<00:07,  6.39it/s][A
Training:  54%|█████▍    | 49/90 [00:07<00:06,  6.67it/s][A
Training:  59%|█████▉    | 53/90 [0

Epoch: 45/48 - Loss: 2.3970 - Accuracy: 0.9495



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:00<00:09,  1.18it/s][A
 42%|████▏     | 5/12 [00:01<00:01,  4.00it/s][A
100%|██████████| 12/12 [00:02<00:00,  5.76it/s][A
Epochs:  94%|█████████▍| 45/48 [16:37<00:47, 15.88s/it]

Val Loss: 3.6098 - Val Accuracy: 0.9291



Training:   0%|          | 0/90 [00:00<?, ?it/s][A
Training:   1%|          | 1/90 [00:00<01:16,  1.16it/s][A
Training:   4%|▍         | 4/90 [00:00<00:16,  5.13it/s][A
Training:   7%|▋         | 6/90 [00:01<00:18,  4.43it/s][A
Training:  10%|█         | 9/90 [00:02<00:16,  4.83it/s][A
Training:  14%|█▍        | 13/90 [00:02<00:13,  5.57it/s][A
Training:  19%|█▉        | 17/90 [00:03<00:12,  6.08it/s][A
Training:  23%|██▎       | 21/90 [00:03<00:10,  6.46it/s][A
Training:  28%|██▊       | 25/90 [00:04<00:09,  6.81it/s][A
Training:  32%|███▏      | 29/90 [00:04<00:08,  7.01it/s][A
Training:  37%|███▋      | 33/90 [00:05<00:08,  6.51it/s][A
Training:  41%|████      | 37/90 [00:06<00:07,  6.65it/s][A
Training:  46%|████▌     | 41/90 [00:06<00:07,  6.78it/s][A
Training:  50%|█████     | 45/90 [00:07<00:06,  6.99it/s][A
Training:  52%|█████▏    | 47/90 [00:07<00:05,  7.89it/s][A
Training:  54%|█████▍    | 49/90 [00:07<00:06,  6.62it/s][A
Training:  59%|█████▉    | 53/90 [00

Epoch: 46/48 - Loss: 2.4667 - Accuracy: 0.9474



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:00<00:10,  1.09it/s][A
 42%|████▏     | 5/12 [00:01<00:01,  3.97it/s][A
100%|██████████| 12/12 [00:02<00:00,  5.59it/s][A
Epochs:  96%|█████████▌| 46/48 [16:53<00:31, 15.91s/it]

Val Loss: 3.2369 - Val Accuracy: 0.9392



Training:   0%|          | 0/90 [00:00<?, ?it/s][A
Training:   1%|          | 1/90 [00:00<01:16,  1.16it/s][A
Training:   6%|▌         | 5/90 [00:01<00:20,  4.20it/s][A
Training:   9%|▉         | 8/90 [00:01<00:11,  7.05it/s][A
Training:  11%|█         | 10/90 [00:01<00:13,  6.05it/s][A
Training:  13%|█▎        | 12/90 [00:02<00:10,  7.34it/s][A
Training:  16%|█▌        | 14/90 [00:02<00:12,  5.94it/s][A
Training:  18%|█▊        | 16/90 [00:02<00:09,  7.55it/s][A
Training:  20%|██        | 18/90 [00:03<00:12,  5.68it/s][A
Training:  23%|██▎       | 21/90 [00:03<00:11,  6.00it/s][A
Training:  27%|██▋       | 24/90 [00:03<00:07,  8.41it/s][A
Training:  29%|██▉       | 26/90 [00:04<00:10,  6.11it/s][A
Training:  32%|███▏      | 29/90 [00:04<00:10,  5.77it/s][A
Training:  37%|███▋      | 33/90 [00:05<00:09,  6.15it/s][A
Training:  41%|████      | 37/90 [00:06<00:08,  6.44it/s][A
Training:  46%|████▌     | 41/90 [00:06<00:07,  6.52it/s][A
Training:  49%|████▉     | 44/90 [0

Epoch: 47/48 - Loss: 2.3387 - Accuracy: 0.9501



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:00<00:07,  1.39it/s][A
 42%|████▏     | 5/12 [00:01<00:01,  4.45it/s][A
 67%|██████▋   | 8/12 [00:01<00:00,  7.03it/s][A
100%|██████████| 12/12 [00:02<00:00,  5.92it/s][A
Epochs:  98%|█████████▊| 47/48 [17:08<00:15, 15.80s/it]

Val Loss: 3.1474 - Val Accuracy: 0.9448



Training:   0%|          | 0/90 [00:00<?, ?it/s][A
Training:   1%|          | 1/90 [00:00<01:14,  1.20it/s][A
Training:   6%|▌         | 5/90 [00:01<00:21,  3.99it/s][A
Training:   8%|▊         | 7/90 [00:01<00:15,  5.46it/s][A
Training:  10%|█         | 9/90 [00:02<00:16,  4.88it/s][A
Training:  14%|█▍        | 13/90 [00:02<00:11,  6.48it/s][A
Training:  19%|█▉        | 17/90 [00:02<00:10,  7.07it/s][A
Training:  22%|██▏       | 20/90 [00:03<00:07,  9.11it/s][A
Training:  24%|██▍       | 22/90 [00:03<00:10,  6.50it/s][A
Training:  28%|██▊       | 25/90 [00:04<00:11,  5.85it/s][A
Training:  32%|███▏      | 29/90 [00:04<00:09,  6.31it/s][A
Training:  37%|███▋      | 33/90 [00:05<00:08,  6.43it/s][A
Training:  41%|████      | 37/90 [00:06<00:08,  6.38it/s][A
Training:  46%|████▌     | 41/90 [00:06<00:07,  6.65it/s][A
Training:  50%|█████     | 45/90 [00:07<00:06,  6.98it/s][A
Training:  54%|█████▍    | 49/90 [00:07<00:06,  6.75it/s][A
Training:  59%|█████▉    | 53/90 [00

Epoch: 48/48 - Loss: 2.4154 - Accuracy: 0.9502



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:00<00:08,  1.29it/s][A
 33%|███▎      | 4/12 [00:00<00:01,  5.69it/s][A
 50%|█████     | 6/12 [00:01<00:01,  4.43it/s][A
100%|██████████| 12/12 [00:02<00:00,  5.81it/s][A
Epochs: 100%|██████████| 48/48 [17:24<00:00, 21.76s/it]
[32m[I 2023-12-15 01:08:39,388][0m Trial 15 finished with value: 0.9360263347625732 and parameters: {'loss_learning_rate': 0.0016723340404899286, 'learning_rate': 0.00297091543911568, 'weight_decay': 0.0030935162473622207, 'epsilon': 1.3436697189792923e-08, 'batch_size': 156, 'epochs': 48}. Best is trial 11 with value: 0.9404187798500061.[0m


Val Loss: 3.2265 - Val Accuracy: 0.9360
Learning rate for Loss: 0.004451198397636186
Learning rate: 0.09134641904547088
Weight decay: 0.0009169084310732388
Epsilon: 3.9767097546968835e-08
Batch size: 107
Number of epochs: 26


Epochs:   0%|          | 0/26 [00:00<?, ?it/s]
Training:   0%|          | 0/131 [00:00<?, ?it/s][A
Training:   1%|          | 1/131 [00:00<01:33,  1.38it/s][A
Training:   4%|▍         | 5/131 [00:01<00:25,  4.93it/s][A
Training:   7%|▋         | 9/131 [00:01<00:17,  6.96it/s][A
Training:  10%|▉         | 13/131 [00:01<00:14,  8.16it/s][A
Training:  13%|█▎        | 17/131 [00:02<00:12,  9.03it/s][A
Training:  16%|█▌        | 21/131 [00:02<00:11,  9.22it/s][A
Training:  18%|█▊        | 23/131 [00:02<00:10, 10.34it/s][A
Training:  19%|█▉        | 25/131 [00:03<00:12,  8.70it/s][A
Training:  22%|██▏       | 29/131 [00:03<00:11,  8.78it/s][A
Training:  25%|██▌       | 33/131 [00:03<00:10,  9.47it/s][A
Training:  28%|██▊       | 37/131 [00:04<00:09,  9.65it/s][A
Training:  31%|███▏      | 41/131 [00:04<00:09,  9.51it/s][A
Training:  34%|███▍      | 45/131 [00:05<00:08,  9.71it/s][A
Training:  37%|███▋      | 48/131 [00:05<00:07, 11.54it/s][A
Training:  38%|███▊      | 50/131 [

Epoch: 1/26 - Loss: 55.3374 - Accuracy: 0.7900



  0%|          | 0/17 [00:00<?, ?it/s][A
  6%|▌         | 1/17 [00:00<00:10,  1.56it/s][A
 29%|██▉       | 5/17 [00:01<00:02,  5.76it/s][A
 53%|█████▎    | 9/17 [00:01<00:01,  7.67it/s][A
 76%|███████▋  | 13/17 [00:01<00:00,  8.76it/s][A
100%|██████████| 17/17 [00:01<00:00,  8.78it/s][A
Epochs:   0%|          | 0/26 [00:16<?, ?it/s]
[32m[I 2023-12-15 01:08:55,717][0m Trial 16 pruned. [0m


Val Loss: 5.7275 - Val Accuracy: 0.8796
Learning rate for Loss: 0.0005260793851023105
Learning rate: 1.0731669565517476e-05
Weight decay: 0.00025583574342948745
Epsilon: 2.9895356764070386e-09
Batch size: 181
Number of epochs: 84


Epochs:   0%|          | 0/84 [00:00<?, ?it/s]
Training:   0%|          | 0/78 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/78 [00:01<01:17,  1.00s/it][A
Training:   6%|▋         | 5/78 [00:01<00:21,  3.44it/s][A
Training:  12%|█▏        | 9/78 [00:02<00:15,  4.32it/s][A
Training:  17%|█▋        | 13/78 [00:03<00:12,  5.04it/s][A
Training:  22%|██▏       | 17/78 [00:03<00:11,  5.49it/s][A
Training:  26%|██▌       | 20/78 [00:03<00:08,  6.89it/s][A
Training:  27%|██▋       | 21/78 [00:04<00:11,  4.78it/s][A
Training:  32%|███▏      | 25/78 [00:05<00:10,  5.12it/s][A
Training:  37%|███▋      | 29/78 [00:05<00:08,  5.51it/s][A
Training:  42%|████▏     | 33/78 [00:06<00:08,  5.62it/s][A
Training:  47%|████▋     | 37/78 [00:07<00:07,  5.67it/s][A
Training:  53%|█████▎    | 41/78 [00:07<00:06,  5.88it/s][A
Training:  56%|█████▋    | 44/78 [00:07<00:04,  7.35it/s][A
Training:  59%|█████▉    | 46/78 [00:08<00:05,  5.78it/s][A
Training:  63%|██████▎   | 49/78 [00:09<00:05,  5.

Epoch: 1/84 - Loss: 21.8242 - Accuracy: 0.5744



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:00<00:08,  1.11it/s][A
 50%|█████     | 5/10 [00:01<00:01,  3.33it/s][A
100%|██████████| 10/10 [00:02<00:00,  4.33it/s][A
Epochs:   0%|          | 0/84 [00:16<?, ?it/s]
[32m[I 2023-12-15 01:09:12,520][0m Trial 17 pruned. [0m


Val Loss: 21.0230 - Val Accuracy: 0.6198
Learning rate for Loss: 0.0009890707862992576
Learning rate: 0.0002620469185953932
Weight decay: 0.0018605104626275328
Epsilon: 5.1625657105462916e-08
Batch size: 247
Number of epochs: 50


Epochs:   0%|          | 0/50 [00:00<?, ?it/s]
Training:   0%|          | 0/57 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/57 [00:01<01:09,  1.24s/it][A
Training:   5%|▌         | 3/57 [00:01<00:19,  2.70it/s][A
Training:   9%|▉         | 5/57 [00:02<00:18,  2.81it/s][A
Training:  11%|█         | 6/57 [00:02<00:15,  3.39it/s][A
Training:  16%|█▌        | 9/57 [00:03<00:13,  3.56it/s][A
Training:  18%|█▊        | 10/57 [00:03<00:12,  3.86it/s][A
Training:  23%|██▎       | 13/57 [00:03<00:10,  4.02it/s][A
Training:  25%|██▍       | 14/57 [00:04<00:09,  4.37it/s][A
Training:  30%|██▉       | 17/57 [00:04<00:09,  4.12it/s][A
Training:  32%|███▏      | 18/57 [00:05<00:09,  4.26it/s][A
Training:  37%|███▋      | 21/57 [00:05<00:08,  4.05it/s][A
Training:  39%|███▊      | 22/57 [00:05<00:07,  4.46it/s][A
Training:  44%|████▍     | 25/57 [00:06<00:07,  4.31it/s][A
Training:  46%|████▌     | 26/57 [00:06<00:06,  4.64it/s][A
Training:  51%|█████     | 29/57 [00:07<00:06,  4.38

Epoch: 1/50 - Loss: 11.7784 - Accuracy: 0.7455



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:08,  1.18s/it][A
 50%|█████     | 4/8 [00:01<00:01,  3.80it/s][A
100%|██████████| 8/8 [00:02<00:00,  3.69it/s][A
Epochs:   0%|          | 0/50 [00:15<?, ?it/s]
[32m[I 2023-12-15 01:09:28,300][0m Trial 18 pruned. [0m


Val Loss: 7.0665 - Val Accuracy: 0.8811
Learning rate for Loss: 0.0004009011737522738
Learning rate: 0.011111878764147874
Weight decay: 0.0006245196613254969
Epsilon: 2.270185135099767e-08
Batch size: 100
Number of epochs: 27


Epochs:   0%|          | 0/27 [00:00<?, ?it/s]
Training:   0%|          | 0/140 [00:00<?, ?it/s][A
Training:   1%|          | 1/140 [00:00<01:32,  1.51it/s][A
Training:   4%|▎         | 5/140 [00:01<00:23,  5.63it/s][A
Training:   6%|▋         | 9/140 [00:01<00:15,  8.65it/s][A
Training:   9%|▉         | 13/140 [00:01<00:13,  9.76it/s][A
Training:  12%|█▏        | 17/140 [00:02<00:12, 10.01it/s][A
Training:  15%|█▌        | 21/140 [00:02<00:12,  9.90it/s][A
Training:  18%|█▊        | 25/140 [00:02<00:11,  9.91it/s][A
Training:  21%|██        | 29/140 [00:03<00:10, 10.43it/s][A
Training:  24%|██▎       | 33/140 [00:03<00:10, 10.54it/s][A
Training:  26%|██▋       | 37/140 [00:03<00:09, 10.64it/s][A
Training:  29%|██▉       | 41/140 [00:04<00:09, 10.76it/s][A
Training:  32%|███▏      | 45/140 [00:04<00:09, 10.37it/s][A
Training:  35%|███▌      | 49/140 [00:05<00:08, 10.58it/s][A
Training:  38%|███▊      | 53/140 [00:05<00:08, 10.59it/s][A
Training:  41%|████      | 57/140 [

Epoch: 1/27 - Loss: 12.3690 - Accuracy: 0.8058



  0%|          | 0/18 [00:00<?, ?it/s][A
  6%|▌         | 1/18 [00:00<00:10,  1.70it/s][A
 28%|██▊       | 5/18 [00:00<00:02,  6.12it/s][A
 50%|█████     | 9/18 [00:01<00:01,  7.55it/s][A
 72%|███████▏  | 13/18 [00:01<00:00,  8.49it/s][A
100%|██████████| 18/18 [00:02<00:00,  8.22it/s][A
Epochs:   4%|▎         | 1/27 [00:15<06:54, 15.95s/it]

Val Loss: 4.7440 - Val Accuracy: 0.9065



Training:   0%|          | 0/140 [00:00<?, ?it/s][A
Training:   1%|          | 1/140 [00:00<01:19,  1.74it/s][A
Training:   4%|▎         | 5/140 [00:00<00:20,  6.47it/s][A
Training:   6%|▋         | 9/140 [00:01<00:16,  7.79it/s][A
Training:   9%|▉         | 13/140 [00:01<00:14,  8.74it/s][A
Training:  11%|█▏        | 16/140 [00:01<00:10, 11.29it/s][A
Training:  13%|█▎        | 18/140 [00:02<00:13,  8.95it/s][A
Training:  15%|█▌        | 21/140 [00:02<00:13,  8.79it/s][A
Training:  18%|█▊        | 25/140 [00:02<00:11,  9.84it/s][A
Training:  21%|██        | 29/140 [00:03<00:11,  9.90it/s][A
Training:  24%|██▎       | 33/140 [00:03<00:10, 10.02it/s][A
Training:  26%|██▋       | 37/140 [00:04<00:09, 10.42it/s][A
Training:  28%|██▊       | 39/140 [00:04<00:08, 11.42it/s][A
Training:  29%|██▉       | 41/140 [00:04<00:09,  9.97it/s][A
Training:  32%|███▏      | 45/140 [00:04<00:09, 10.45it/s][A
Training:  35%|███▌      | 49/140 [00:05<00:08, 10.95it/s][A
Training:  37%|███▋

Epoch: 2/27 - Loss: 4.6570 - Accuracy: 0.9124



  0%|          | 0/18 [00:00<?, ?it/s][A
  6%|▌         | 1/18 [00:00<00:11,  1.51it/s][A
 28%|██▊       | 5/18 [00:01<00:02,  5.60it/s][A
 50%|█████     | 9/18 [00:01<00:01,  7.13it/s][A
 72%|███████▏  | 13/18 [00:01<00:00,  8.55it/s][A
100%|██████████| 18/18 [00:02<00:00,  8.12it/s][A
Epochs:   4%|▎         | 1/27 [00:31<13:51, 31.96s/it]
[32m[I 2023-12-15 01:10:00,652][0m Trial 19 pruned. [0m


Val Loss: 4.1993 - Val Accuracy: 0.8944

Study statistics: 
  Number of finished trials:  20
  Number of pruned trials:  12
  Number of complete trials:  8


In [20]:
print("Best trial:")
trial = study.best_trial

print("  Value: ", trial.value)

print("  Params: ")
for key, value in trial.params.items():
    print("    {}: {}".format(key, value))

Best trial:
  Value:  0.9404187798500061
  Params: 
    batch_size: 273
    epochs: 89
    epsilon: 3.4960361296560697e-08
    learning_rate: 0.0011125954409380188
    loss_learning_rate: 0.0005475502239825571
    weight_decay: 0.004132770040241243


In [None]:
# ViT P12-S8 CosFace Mean

Best trial:
Value:  0.9404187798500061
Params: 
batch_size: 273
epochs: 89
epsilon: 3.4960361296560697e-08
learning_rate: 0.0011125954409380188
loss_learning_rate: 0.0005475502239825571
weight_decay: 0.004132770040241243