In [1]:
import os
import random
import pandas as pd
import numpy as np
import mxnet as mx
import torch
import torch.nn as nn
import torch.nn.functional as F
import torch.optim as opt
from torch.utils.data import Dataset, DataLoader
from einops import rearrange, repeat
import optuna
from optuna.trial import TrialState
from tqdm import tqdm

In [2]:
def file_to_embed(embeds, file):
    emb = []
    for f in file:
        emb.append(embeds[f][0])
    return torch.stack(emb)

In [3]:
MIN_NUM_PATCHES = 16

In [4]:
device = torch.device("cuda:2" if torch.cuda.is_available() else "cpu")
device

device(type='cuda', index=2)

In [5]:
class AdienceDataset(Dataset):
    def __init__(self, annot_file, img_dir):
        self.img_lbls = pd.read_csv(annot_file, header=None)
        self.img_dir = img_dir
    
    def __len__(self):
        return len(self.img_lbls)
    
    def __getitem__(self, idx):
        img_file = self.img_lbls.iloc[idx, 0]
        img_path = os.path.join(self.img_dir, img_file)
        image = mx.image.imread(img_path)
        if image.shape[1] != 112:
            image = mx.image.resize_short(image, 112)
        image = mx.nd.transpose(image, axes=(2,0,1))
        image = torch.tensor(image.asnumpy()).type(torch.FloatTensor)
        label = self.img_lbls.iloc[idx, 1]

        return image, label, img_file

In [6]:
train_data = AdienceDataset("../train.csv", "../cropped_Adience/")
val_data = AdienceDataset("../val.csv", "../cropped_Adience/")

In [7]:
class CosFace(nn.Module):
    r"""Implement of CosFace (https://arxiv.org/pdf/1801.09414.pdf):
    Args:
        in_features: size of each input sample
        out_features: size of each output sample
        device_id: the ID of GPU where the model will be trained by model parallel.
                       if device_id=None, it will be trained on CPU without model parallel.
        s: norm of input feature
        m: margin
        cos(theta)-m
    """

    def __init__(self, in_features, out_features, device_id, s=64.0, m=0.35):
        super(CosFace, self).__init__()
        self.in_features = in_features
        self.out_features = out_features
        self.device_id = device_id
        self.s = s
        self.m = m
        print("self.device_id", self.device_id)
        self.weight = nn.Parameter(torch.FloatTensor(out_features, in_features))
        nn.init.xavier_uniform_(self.weight)

    def forward(self, input, label):
        # --------------------------- cos(theta) & phi(theta) ---------------------------

        if self.device_id == None:
            cosine = F.linear(F.normalize(input), F.normalize(self.weight))
        else:
            x = input
            sub_weights = torch.chunk(self.weight, len(self.device_id), dim=0)
            temp_x = x.cuda(self.device_id[0])
            weight = sub_weights[0].cuda(self.device_id[0])
            cosine = F.linear(F.normalize(temp_x), F.normalize(weight))
            for i in range(1, len(self.device_id)):
                temp_x = x.cuda(self.device_id[i])
                weight = sub_weights[i].cuda(self.device_id[i])
                cosine = torch.cat((cosine, F.linear(F.normalize(temp_x), F.normalize(weight)).cuda(self.device_id[0])),
                                   dim=1)
        phi = cosine - self.m
        # --------------------------- convert label to one-hot ---------------------------
        one_hot = torch.zeros(cosine.size())
        if self.device_id != None:
            one_hot = one_hot.cuda(self.device_id[0])
        # one_hot = one_hot.cuda() if cosine.is_cuda else one_hot

        one_hot.scatter_(1, label.view(-1, 1).long(), 1)
        # -------------torch.where(out_i = {x_i if condition_i else y_i) -------------
        output = (one_hot * phi) + (
                    (1.0 - one_hot) * cosine)  # you can use torch.where if your torch.__version__ is 0.4
        output *= self.s

        return output

    def __repr__(self):
        return self.__class__.__name__ + '(' \
               + 'in_features = ' + str(self.in_features) \
               + ', out_features = ' + str(self.out_features) \
               + ', s = ' + str(self.s) \
               + ', m = ' + str(self.m) + ')'

In [8]:
class Residual(nn.Module):
    def __init__(self, fn):
        super().__init__()
        self.fn = fn
    def forward(self, x, **kwargs):
        return self.fn(x, **kwargs) + x

In [9]:
class PreNorm(nn.Module):
    def __init__(self, dim, fn):
        super().__init__()
        self.norm = nn.LayerNorm(dim)
        self.fn = fn
    def forward(self, x, **kwargs):
        return self.fn(self.norm(x), **kwargs)

In [10]:
class FeedForward(nn.Module):
    def __init__(self, dim, hidden_dim, dropout = 0.):
        super().__init__()
        self.net = nn.Sequential(
            nn.Linear(dim, hidden_dim),
            nn.GELU(),
            nn.Dropout(dropout),
            nn.Linear(hidden_dim, dim),
            nn.Dropout(dropout)
        )
    def forward(self, x):
        return self.net(x)

In [11]:
class Attention(nn.Module):
    def __init__(self, dim, heads = 8, dim_head = 64, dropout = 0.):
        super().__init__()
        inner_dim = dim_head *  heads
        self.heads = heads
        self.scale = dim ** -0.5

        self.to_qkv = nn.Linear(dim, inner_dim * 3, bias = False)
        self.to_out = nn.Sequential(
            nn.Linear(inner_dim, dim),
            nn.Dropout(dropout)
        )

    def forward(self, x, mask = None):
        b, n, _, h = *x.shape, self.heads
        qkv = self.to_qkv(x).chunk(3, dim = -1)

        q, k, v = map(lambda t: rearrange(t, 'b n (h d) -> b h n d', h = h), qkv)
        dots = torch.einsum('bhid,bhjd->bhij', q, k) * self.scale
        mask_value = -torch.finfo(dots.dtype).max
        #embed()
        if mask is not None:
            mask = F.pad(mask.flatten(1), (1, 0), value = True)
            assert mask.shape[-1] == dots.shape[-1], 'mask has incorrect dimensions'
            mask = mask[:, None, :] * mask[:, :, None]
            dots.masked_fill_(~mask, mask_value)
            del mask

        attn = dots.softmax(dim=-1)

        out = torch.einsum('bhij,bhjd->bhid', attn, v)
        out = rearrange(out, 'b h n d -> b n (h d)')
        out =  self.to_out(out)

        return out

In [12]:
class Transformer(nn.Module):
    def __init__(self, dim, depth, heads, dim_head, mlp_dim, dropout):
        super().__init__()
        self.layers = nn.ModuleList([])
        for _ in range(depth):
            self.layers.append(nn.ModuleList([
                Residual(PreNorm(dim, Attention(dim, heads = heads, dim_head = dim_head, dropout = dropout))),
                Residual(PreNorm(dim, FeedForward(dim, mlp_dim, dropout = dropout)))
            ]))
    def forward(self, x, mask = None):
        for attn, ff in self.layers:
            x = attn(x, mask = mask)
            #embed()
            x = ff(x)
        return x

In [13]:
class ViTs_face(nn.Module):
    def __init__(self, *, loss_type, GPU_ID, num_class, image_size, patch_size, ac_patch_size,
                         pad, dim, depth, heads, mlp_dim, pool = 'mean', channels = 3, dim_head = 64, dropout = 0., emb_dropout = 0.):
        super().__init__()
        assert image_size % patch_size == 0, 'Image dimensions must be divisible by the patch size.'
        num_patches = (image_size // patch_size) ** 2
        patch_dim = channels * ac_patch_size ** 2
        assert num_patches > MIN_NUM_PATCHES, f'your number of patches ({num_patches}) is way too small for attention to be effective (at least 16). Try decreasing your patch size'
        assert pool in {'cls', 'mean'}, 'pool type must be either cls (cls token) or mean (mean pooling)'

        self.patch_size = patch_size
        self.soft_split = nn.Unfold(kernel_size=(ac_patch_size, ac_patch_size), stride=(self.patch_size, self.patch_size), padding=(pad, pad))


        self.pos_embedding = nn.Parameter(torch.randn(1, num_patches + 1, dim))
        self.patch_to_embedding = nn.Linear(patch_dim, dim)
        self.cls_token = nn.Parameter(torch.randn(1, 1, dim))
        self.dropout = nn.Dropout(emb_dropout)

        self.transformer = Transformer(dim, depth, heads, dim_head, mlp_dim, dropout)

        self.pool = pool
        self.to_latent = nn.Identity()

        self.mlp_head = nn.Sequential(
            nn.LayerNorm(dim),
        )
        self.loss_type = loss_type
        self.GPU_ID = GPU_ID
        if self.loss_type == 'None':
            print("no loss for vit_face")
        else:
            if self.loss_type == 'Softmax':
                self.loss = Softmax(in_features=dim, out_features=num_class, device_id=self.GPU_ID)
            elif self.loss_type == 'CosFace':
                self.loss = CosFace(in_features=dim, out_features=num_class, device_id=self.GPU_ID)
            elif self.loss_type == 'ArcFace':
                self.loss = ArcFace(in_features=dim, out_features=num_class, device_id=self.GPU_ID)
            elif self.loss_type == 'SFace':
                self.loss = SFaceLoss(in_features=dim, out_features=num_class, device_id=self.GPU_ID)

    def forward(self, img, label= None , mask = None):
        p = self.patch_size
        x = self.soft_split(img).transpose(1, 2)
        x = self.patch_to_embedding(x)
        b, n, _ = x.shape

        cls_tokens = repeat(self.cls_token, '() n d -> b n d', b = b)
        x = torch.cat((cls_tokens, x), dim=1)
        x += self.pos_embedding[:, :(n + 1)]
        x = self.dropout(x)
        x = self.transformer(x, mask)

        y = x[:, 0]
        z = x[:, 1:].mean(dim = 1)

        y = self.to_latent(y)
        emb_y = self.mlp_head(y)
        z = self.to_latent(z)
        emb_z = self.mlp_head(z)
        emb = torch.cat((emb_y, emb_z), dim=1)
        if label is not None:
            x = self.loss(emb, label)
            return x, emb
        else:
            return emb

In [14]:
class ViT_plus(nn.Module):
    def __init__(self):
        super(ViT_plus, self).__init__()
        
        self.fc1 = nn.Linear(in_features=1024, out_features=1024)
        self.fc2 = nn.Linear(in_features=1024, out_features=2)
        
    def forward(self, x):
        x = self.fc1(x)
        x_cosface = x
        x_classification = self.fc2(x)
        
        return x_cosface, x_classification

In [15]:
model = ViTs_face(
            loss_type='CosFace',
            GPU_ID=[device],
            num_class=93431,
            image_size=112,
            patch_size=8,
            ac_patch_size=12,
            pad=4,
            dim=512,
            depth=20,
            heads=8,
            mlp_dim=2048,
            dropout=0.1,
            emb_dropout=0.1
        ).to(device)
model.load_state_dict(
    torch.load("../Backbone_VITs_Epoch_2_Batch_12000_Time_2021-03-17-04-05_checkpoint.pth", map_location=device)
)

self.device_id [device(type='cuda', index=2)]


<All keys matched successfully>

In [16]:
for param in model.parameters():
    param.requires_grad = False

In [17]:
embeds = {}
model.eval()

with torch.no_grad():
    for img, _, file in train_data:
        img = img.to(device)
        embeds[file] = model(torch.unsqueeze(img, 0))

    for img, _, file in val_data:
        img = img.to(device)
        embeds[file] = model(torch.unsqueeze(img, 0))

In [18]:
best_accu = 0.0
def objective(trial):
    model_xtr = ViT_plus().to(device)
    
    lr = trial.suggest_float("learning_rate", 1e-5, 1e-1, log=True)
    wd = trial.suggest_float('weight_decay', 1e-4, 1e-2, log=True)
    eps = trial.suggest_float("epsilon", 1e-9, 1e-7, log=True)
    optimizer = opt.AdamW(model_xtr.parameters(), lr=lr, eps=eps, weight_decay=wd)
    
    criterion = nn.CrossEntropyLoss()
    
    batch_size = trial.suggest_int('batch_size', 50, 300)
    num_epochs = trial.suggest_int('epochs', 10, 100)
    
    print("Learning rate: "+ str(lr))
    print("Weight decay: "+ str(wd))
    print("Epsilon: "+ str(eps))
    print("Batch size: "+ str(batch_size))
    print("Number of epochs: "+ str(num_epochs))
    
    for epoch in tqdm(range(num_epochs), desc="Epochs"):
        train_loader = DataLoader(train_data, batch_size=batch_size, shuffle=True, num_workers=4)
        val_loader = DataLoader(val_data, batch_size=batch_size, shuffle=False, num_workers=4)
        
        # training loop
        running_loss = []
        running_accu = []
        
        model_xtr.train()
        for img, label, file in tqdm(train_loader, desc="Training", leave=False):
            img, label = img.to(device), label.to(device)

            x = file_to_embed(embeds, file)
            
            optimizer.zero_grad()
            _, output = model_xtr(x)
            
            pred = torch.argmax(output, 1)
            accuracy = torch.eq(pred, label).sum() / len(img)

            loss = criterion(output, label)
            loss.backward()
            optimizer.step()

            running_accu.append(accuracy.cpu().detach().numpy())
            running_loss.append(loss.cpu().detach().numpy())
        print("Epoch: {}/{} - Loss: {:.4f} - Accuracy: {:.4f}".format(epoch+1, num_epochs, np.mean(running_loss), np.mean(running_accu)))
        
        # validation loop
        val_loss = []
        val_accu = []

        model_xtr.eval()
        with torch.no_grad():
            for img, label, file in tqdm(val_loader):
                img, label = img.to(device), label.to(device)
                
                x = file_to_embed(embeds, file)
                
                _, output = model_xtr(x)
                
                pred = torch.argmax(output, 1)
                accuracy = torch.eq(pred, label).sum() / len(img)
                
                loss = criterion(output, label)
                
                val_accu.append(accuracy.cpu().detach().numpy())
                val_loss.append(loss.cpu().detach().numpy())
        val_accu = np.mean(val_accu)
        val_loss = np.mean(val_loss)
        print("Val Loss: {:.4f} - Val Accuracy: {:.4f}".format(val_loss, val_accu))
        
        trial.report(val_accu, epoch)
        if trial.should_prune():
            raise optuna.exceptions.TrialPruned()
    
    global best_accu
    if val_accu > best_accu:
        best_accu = val_accu
        print("Saving best model...")
        torch.save(model_xtr.state_dict(), "../vit_12-8_mean.pt")
            
    return val_accu

In [19]:
study = optuna.create_study(direction='maximize',
                            study_name='vit-12-8-mean-study',
                            storage='sqlite:///study8.db',
                            load_if_exists=True)
study.optimize(objective, n_trials=10)

pruned_trials = study.get_trials(deepcopy=False, states=[TrialState.PRUNED])
complete_trials = study.get_trials(deepcopy=False, states=[TrialState.COMPLETE])

# Display the study statistics
print("\nStudy statistics: ")
print("  Number of finished trials: ", len(study.trials))
print("  Number of pruned trials: ", len(pruned_trials))
print("  Number of complete trials: ", len(complete_trials))

[32m[I 2023-12-11 22:58:47,455][0m A new study created in RDB with name: vit-12-8-mean-study[0m


Learning rate: 0.05870926873283856
Weight decay: 0.0001579889011773346
Epsilon: 1.6867250271368622e-08
Batch size: 282
Number of epochs: 72


Epochs:   0%|          | 0/72 [00:00<?, ?it/s]
Training:   0%|          | 0/50 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/50 [00:01<01:19,  1.61s/it][A
Training:   8%|▊         | 4/50 [00:01<00:15,  2.98it/s][A
Training:  12%|█▏        | 6/50 [00:02<00:19,  2.24it/s][A
Training:  18%|█▊        | 9/50 [00:04<00:17,  2.33it/s][A
Training:  24%|██▍       | 12/50 [00:04<00:10,  3.68it/s][A
Training:  28%|██▊       | 14/50 [00:05<00:12,  2.88it/s][A
Training:  34%|███▍      | 17/50 [00:06<00:12,  2.72it/s][A
Training:  40%|████      | 20/50 [00:06<00:07,  3.91it/s][A
Training:  44%|████▍     | 22/50 [00:07<00:09,  3.07it/s][A
Training:  50%|█████     | 25/50 [00:09<00:08,  2.79it/s][A
Training:  56%|█████▌    | 28/50 [00:09<00:05,  3.97it/s][A
Training:  60%|██████    | 30/50 [00:10<00:06,  3.13it/s][A
Training:  66%|██████▌   | 33/50 [00:11<00:05,  2.99it/s][A
Training:  70%|███████   | 35/50 [00:11<00:03,  3.77it/s][A
Training:  74%|███████▍  | 37/50 [00:12<00:04,  2.9

Epoch: 1/72 - Loss: 156.3585 - Accuracy: 0.7573



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:08,  1.49s/it][A
 57%|█████▋    | 4/7 [00:01<00:00,  3.18it/s][A
100%|██████████| 7/7 [00:02<00:00,  2.54it/s][A
Epochs:   1%|▏         | 1/72 [00:18<22:02, 18.63s/it]

Val Loss: 5.3191 - Val Accuracy: 0.8567



Training:   0%|          | 0/50 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/50 [00:01<01:11,  1.45s/it][A
Training:   4%|▍         | 2/50 [00:01<00:33,  1.45it/s][A
Training:  10%|█         | 5/50 [00:02<00:20,  2.25it/s][A
Training:  12%|█▏        | 6/50 [00:02<00:16,  2.74it/s][A
Training:  16%|█▌        | 8/50 [00:02<00:10,  4.18it/s][A
Training:  18%|█▊        | 9/50 [00:03<00:16,  2.54it/s][A
Training:  20%|██        | 10/50 [00:03<00:13,  3.04it/s][A
Training:  22%|██▏       | 11/50 [00:04<00:12,  3.21it/s][A
Training:  26%|██▌       | 13/50 [00:05<00:12,  2.89it/s][A
Training:  28%|██▊       | 14/50 [00:05<00:11,  3.09it/s][A
Training:  30%|███       | 15/50 [00:05<00:10,  3.43it/s][A
Training:  34%|███▍      | 17/50 [00:06<00:10,  3.25it/s][A
Training:  36%|███▌      | 18/50 [00:06<00:10,  3.02it/s][A
Training:  38%|███▊      | 19/50 [00:06<00:08,  3.55it/s][A
Training:  42%|████▏     | 21/50 [00:07<00:08,  3.26it/s][A
Training:  44%|████▍     | 22/50 [00:0

Epoch: 2/72 - Loss: 7.0225 - Accuracy: 0.9172



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:09,  1.56s/it][A
100%|██████████| 7/7 [00:02<00:00,  2.59it/s][A
Epochs:   3%|▎         | 2/72 [00:36<21:25, 18.36s/it]

Val Loss: 1.0901 - Val Accuracy: 0.9406



Training:   0%|          | 0/50 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/50 [00:01<01:13,  1.50s/it][A
Training:   8%|▊         | 4/50 [00:01<00:14,  3.13it/s][A
Training:  12%|█▏        | 6/50 [00:02<00:18,  2.39it/s][A
Training:  18%|█▊        | 9/50 [00:03<00:16,  2.50it/s][A
Training:  22%|██▏       | 11/50 [00:03<00:11,  3.43it/s][A
Training:  26%|██▌       | 13/50 [00:05<00:14,  2.55it/s][A
Training:  34%|███▍      | 17/50 [00:06<00:12,  2.74it/s][A
Training:  42%|████▏     | 21/50 [00:07<00:09,  2.92it/s][A
Training:  50%|█████     | 25/50 [00:08<00:08,  3.12it/s][A
Training:  56%|█████▌    | 28/50 [00:09<00:05,  4.14it/s][A
Training:  60%|██████    | 30/50 [00:10<00:06,  3.26it/s][A
Training:  66%|██████▌   | 33/50 [00:11<00:05,  3.32it/s][A
Training:  70%|███████   | 35/50 [00:11<00:04,  3.73it/s][A
Training:  74%|███████▍  | 37/50 [00:12<00:03,  3.35it/s][A
Training:  76%|███████▌  | 38/50 [00:12<00:03,  3.49it/s][A
Training:  78%|███████▊  | 39/50 [00

Epoch: 3/72 - Loss: 2.2083 - Accuracy: 0.9307



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:09,  1.59s/it][A
100%|██████████| 7/7 [00:02<00:00,  2.57it/s][A
Epochs:   4%|▍         | 3/72 [00:55<21:03, 18.32s/it]

Val Loss: 0.6312 - Val Accuracy: 0.8842



Training:   0%|          | 0/50 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/50 [00:01<01:18,  1.60s/it][A
Training:  10%|█         | 5/50 [00:02<00:22,  2.00it/s][A
Training:  16%|█▌        | 8/50 [00:02<00:11,  3.57it/s][A
Training:  20%|██        | 10/50 [00:04<00:14,  2.69it/s][A
Training:  26%|██▌       | 13/50 [00:05<00:14,  2.62it/s][A
Training:  30%|███       | 15/50 [00:05<00:10,  3.42it/s][A
Training:  34%|███▍      | 17/50 [00:06<00:12,  2.72it/s][A
Training:  40%|████      | 20/50 [00:06<00:07,  4.09it/s][A
Training:  44%|████▍     | 22/50 [00:07<00:09,  3.08it/s][A
Training:  50%|█████     | 25/50 [00:08<00:08,  2.87it/s][A
Training:  56%|█████▌    | 28/50 [00:09<00:05,  4.11it/s][A
Training:  60%|██████    | 30/50 [00:10<00:06,  3.15it/s][A
Training:  66%|██████▌   | 33/50 [00:11<00:05,  3.10it/s][A
Training:  74%|███████▍  | 37/50 [00:12<00:03,  3.30it/s][A
Training:  80%|████████  | 40/50 [00:12<00:02,  4.46it/s][A
Training:  84%|████████▍ | 42/50 [0

Epoch: 4/72 - Loss: 1.2334 - Accuracy: 0.9312



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:09,  1.55s/it][A
100%|██████████| 7/7 [00:02<00:00,  2.51it/s][A
Epochs:   6%|▌         | 4/72 [01:13<20:47, 18.34s/it]

Val Loss: 3.9059 - Val Accuracy: 0.9291



Training:   0%|          | 0/50 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/50 [00:01<01:17,  1.58s/it][A
Training:   6%|▌         | 3/50 [00:01<00:21,  2.23it/s][A
Training:  10%|█         | 5/50 [00:02<00:21,  2.06it/s][A
Training:  14%|█▍        | 7/50 [00:02<00:13,  3.28it/s][A
Training:  18%|█▊        | 9/50 [00:04<00:16,  2.44it/s][A
Training:  24%|██▍       | 12/50 [00:04<00:09,  4.14it/s][A
Training:  28%|██▊       | 14/50 [00:05<00:12,  2.97it/s][A
Training:  32%|███▏      | 16/50 [00:05<00:08,  3.95it/s][A
Training:  36%|███▌      | 18/50 [00:06<00:10,  2.96it/s][A
Training:  38%|███▊      | 19/50 [00:06<00:10,  3.09it/s][A
Training:  42%|████▏     | 21/50 [00:07<00:10,  2.76it/s][A
Training:  46%|████▌     | 23/50 [00:07<00:07,  3.49it/s][A
Training:  50%|█████     | 25/50 [00:08<00:09,  2.76it/s][A
Training:  54%|█████▍    | 27/50 [00:09<00:06,  3.63it/s][A
Training:  58%|█████▊    | 29/50 [00:10<00:07,  2.75it/s][A
Training:  66%|██████▌   | 33/50 [00:

Epoch: 5/72 - Loss: 2.3472 - Accuracy: 0.9374



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:09,  1.51s/it][A
100%|██████████| 7/7 [00:02<00:00,  2.59it/s][A
Epochs:   7%|▋         | 5/72 [01:32<20:34, 18.43s/it]

Val Loss: 5.5239 - Val Accuracy: 0.9472



Training:   0%|          | 0/50 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/50 [00:01<01:16,  1.56s/it][A
Training:   4%|▍         | 2/50 [00:01<00:35,  1.35it/s][A
Training:  10%|█         | 5/50 [00:02<00:20,  2.23it/s][A
Training:  12%|█▏        | 6/50 [00:02<00:17,  2.56it/s][A
Training:  18%|█▊        | 9/50 [00:03<00:14,  2.84it/s][A
Training:  20%|██        | 10/50 [00:04<00:12,  3.08it/s][A
Training:  26%|██▌       | 13/50 [00:05<00:11,  3.17it/s][A
Training:  28%|██▊       | 14/50 [00:05<00:10,  3.29it/s][A
Training:  30%|███       | 15/50 [00:05<00:09,  3.72it/s][A
Training:  34%|███▍      | 17/50 [00:06<00:10,  3.10it/s][A
Training:  36%|███▌      | 18/50 [00:06<00:10,  2.98it/s][A
Training:  42%|████▏     | 21/50 [00:07<00:09,  3.16it/s][A
Training:  44%|████▍     | 22/50 [00:07<00:09,  3.04it/s][A
Training:  50%|█████     | 25/50 [00:08<00:07,  3.24it/s][A
Training:  52%|█████▏    | 26/50 [00:09<00:07,  3.29it/s][A
Training:  54%|█████▍    | 27/50 [00:

Epoch: 6/72 - Loss: 3.3760 - Accuracy: 0.9416



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:09,  1.55s/it][A
100%|██████████| 7/7 [00:02<00:00,  2.57it/s][A
Epochs:   8%|▊         | 6/72 [01:50<20:15, 18.41s/it]

Val Loss: 0.8413 - Val Accuracy: 0.9477



Training:   0%|          | 0/50 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/50 [00:01<01:16,  1.57s/it][A
Training:   6%|▌         | 3/50 [00:01<00:21,  2.23it/s][A
Training:  10%|█         | 5/50 [00:02<00:23,  1.94it/s][A
Training:  16%|█▌        | 8/50 [00:02<00:11,  3.78it/s][A
Training:  20%|██        | 10/50 [00:04<00:14,  2.76it/s][A
Training:  26%|██▌       | 13/50 [00:05<00:13,  2.68it/s][A
Training:  30%|███       | 15/50 [00:05<00:10,  3.48it/s][A
Training:  34%|███▍      | 17/50 [00:06<00:11,  2.80it/s][A
Training:  36%|███▌      | 18/50 [00:06<00:10,  3.14it/s][A
Training:  40%|████      | 20/50 [00:06<00:07,  4.20it/s][A
Training:  42%|████▏     | 21/50 [00:07<00:10,  2.72it/s][A
Training:  44%|████▍     | 22/50 [00:07<00:08,  3.15it/s][A
Training:  46%|████▌     | 23/50 [00:07<00:07,  3.70it/s][A
Training:  50%|█████     | 25/50 [00:08<00:08,  2.88it/s][A
Training:  52%|█████▏    | 26/50 [00:08<00:07,  3.35it/s][A
Training:  56%|█████▌    | 28/50 [00

Epoch: 7/72 - Loss: 0.7673 - Accuracy: 0.9448



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:09,  1.53s/it][A
100%|██████████| 7/7 [00:02<00:00,  2.61it/s][A
Epochs:  10%|▉         | 7/72 [02:08<19:56, 18.41s/it]

Val Loss: 0.6551 - Val Accuracy: 0.9509



Training:   0%|          | 0/50 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/50 [00:01<01:18,  1.60s/it][A
Training:   8%|▊         | 4/50 [00:01<00:15,  3.01it/s][A
Training:  12%|█▏        | 6/50 [00:02<00:19,  2.29it/s][A
Training:  18%|█▊        | 9/50 [00:04<00:17,  2.33it/s][A
Training:  22%|██▏       | 11/50 [00:04<00:12,  3.22it/s][A
Training:  26%|██▌       | 13/50 [00:05<00:14,  2.54it/s][A
Training:  34%|███▍      | 17/50 [00:06<00:11,  2.75it/s][A
Training:  40%|████      | 20/50 [00:06<00:07,  3.93it/s][A
Training:  44%|████▍     | 22/50 [00:07<00:09,  3.07it/s][A
Training:  50%|█████     | 25/50 [00:09<00:08,  2.81it/s][A
Training:  56%|█████▌    | 28/50 [00:09<00:05,  3.98it/s][A
Training:  60%|██████    | 30/50 [00:10<00:06,  3.17it/s][A
Training:  66%|██████▌   | 33/50 [00:11<00:05,  3.04it/s][A
Training:  74%|███████▍  | 37/50 [00:12<00:04,  3.20it/s][A
Training:  80%|████████  | 40/50 [00:12<00:02,  4.32it/s][A
Training:  84%|████████▍ | 42/50 [00

Epoch: 8/72 - Loss: 1.4368 - Accuracy: 0.9454



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:09,  1.53s/it][A
100%|██████████| 7/7 [00:02<00:00,  2.64it/s][A
Epochs:  11%|█         | 8/72 [02:27<19:41, 18.46s/it]

Val Loss: 0.8310 - Val Accuracy: 0.9519



Training:   0%|          | 0/50 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/50 [00:01<01:17,  1.59s/it][A
Training:   8%|▊         | 4/50 [00:01<00:15,  3.00it/s][A
Training:  12%|█▏        | 6/50 [00:02<00:18,  2.33it/s][A
Training:  18%|█▊        | 9/50 [00:04<00:16,  2.43it/s][A
Training:  22%|██▏       | 11/50 [00:04<00:11,  3.34it/s][A
Training:  26%|██▌       | 13/50 [00:05<00:14,  2.57it/s][A
Training:  34%|███▍      | 17/50 [00:06<00:11,  2.81it/s][A
Training:  40%|████      | 20/50 [00:06<00:07,  4.02it/s][A
Training:  44%|████▍     | 22/50 [00:07<00:08,  3.17it/s][A
Training:  50%|█████     | 25/50 [00:08<00:08,  2.83it/s][A
Training:  58%|█████▊    | 29/50 [00:10<00:07,  2.98it/s][A
Training:  66%|██████▌   | 33/50 [00:11<00:05,  3.25it/s][A
Training:  74%|███████▍  | 37/50 [00:12<00:03,  3.29it/s][A
Training:  82%|████████▏ | 41/50 [00:13<00:02,  3.47it/s][A
Training:  90%|█████████ | 45/50 [00:14<00:01,  3.52it/s][A
Training:  96%|█████████▌| 48/50 [00

Epoch: 9/72 - Loss: 3.1267 - Accuracy: 0.9388



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:09,  1.56s/it][A
100%|██████████| 7/7 [00:02<00:00,  2.53it/s][A
Epochs:  12%|█▎        | 9/72 [02:46<19:26, 18.52s/it]

Val Loss: 1.4402 - Val Accuracy: 0.9435



Training:   0%|          | 0/50 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/50 [00:01<01:17,  1.58s/it][A
Training:   8%|▊         | 4/50 [00:01<00:15,  3.04it/s][A
Training:  12%|█▏        | 6/50 [00:02<00:18,  2.38it/s][A
Training:  16%|█▌        | 8/50 [00:02<00:11,  3.57it/s][A
Training:  20%|██        | 10/50 [00:03<00:14,  2.69it/s][A
Training:  24%|██▍       | 12/50 [00:04<00:10,  3.70it/s][A
Training:  28%|██▊       | 14/50 [00:05<00:12,  2.85it/s][A
Training:  30%|███       | 15/50 [00:05<00:10,  3.26it/s][A
Training:  34%|███▍      | 17/50 [00:06<00:12,  2.62it/s][A
Training:  38%|███▊      | 19/50 [00:06<00:08,  3.66it/s][A
Training:  40%|████      | 20/50 [00:06<00:07,  3.97it/s][A
Training:  42%|████▏     | 21/50 [00:07<00:11,  2.51it/s][A
Training:  46%|████▌     | 23/50 [00:07<00:07,  3.76it/s][A
Training:  50%|█████     | 25/50 [00:08<00:09,  2.77it/s][A
Training:  54%|█████▍    | 27/50 [00:08<00:06,  3.70it/s][A
Training:  58%|█████▊    | 29/50 [00

Epoch: 10/72 - Loss: 0.6241 - Accuracy: 0.9448



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:09,  1.58s/it][A
100%|██████████| 7/7 [00:02<00:00,  2.53it/s][A
Epochs:  14%|█▍        | 10/72 [03:04<19:03, 18.45s/it]

Val Loss: 0.5767 - Val Accuracy: 0.9477



Training:   0%|          | 0/50 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/50 [00:01<01:12,  1.48s/it][A
Training:   4%|▍         | 2/50 [00:01<00:33,  1.41it/s][A
Training:  10%|█         | 5/50 [00:02<00:20,  2.18it/s][A
Training:  12%|█▏        | 6/50 [00:02<00:16,  2.64it/s][A
Training:  16%|█▌        | 8/50 [00:02<00:10,  4.10it/s][A
Training:  18%|█▊        | 9/50 [00:03<00:16,  2.51it/s][A
Training:  22%|██▏       | 11/50 [00:04<00:10,  3.80it/s][A
Training:  26%|██▌       | 13/50 [00:05<00:14,  2.64it/s][A
Training:  34%|███▍      | 17/50 [00:06<00:10,  3.03it/s][A
Training:  40%|████      | 20/50 [00:06<00:06,  4.41it/s][A
Training:  44%|████▍     | 22/50 [00:07<00:08,  3.13it/s][A
Training:  48%|████▊     | 24/50 [00:07<00:06,  4.03it/s][A
Training:  52%|█████▏    | 26/50 [00:08<00:08,  2.98it/s][A
Training:  58%|█████▊    | 29/50 [00:09<00:07,  2.92it/s][A
Training:  60%|██████    | 30/50 [00:10<00:06,  3.18it/s][A
Training:  66%|██████▌   | 33/50 [00:1

Epoch: 11/72 - Loss: 0.2199 - Accuracy: 0.9537



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:09,  1.50s/it][A
 57%|█████▋    | 4/7 [00:01<00:00,  3.18it/s][A
100%|██████████| 7/7 [00:02<00:00,  2.63it/s][A
Epochs:  15%|█▌        | 11/72 [03:22<18:43, 18.43s/it]

Val Loss: 0.3397 - Val Accuracy: 0.9477



Training:   0%|          | 0/50 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/50 [00:01<01:16,  1.56s/it][A
Training:   8%|▊         | 4/50 [00:01<00:14,  3.09it/s][A
Training:  12%|█▏        | 6/50 [00:02<00:18,  2.35it/s][A
Training:  14%|█▍        | 7/50 [00:02<00:15,  2.85it/s][A
Training:  18%|█▊        | 9/50 [00:04<00:18,  2.26it/s][A
Training:  24%|██▍       | 12/50 [00:04<00:09,  3.92it/s][A
Training:  28%|██▊       | 14/50 [00:05<00:12,  2.82it/s][A
Training:  34%|███▍      | 17/50 [00:06<00:12,  2.64it/s][A
Training:  40%|████      | 20/50 [00:06<00:07,  3.89it/s][A
Training:  44%|████▍     | 22/50 [00:07<00:09,  3.01it/s][A
Training:  50%|█████     | 25/50 [00:08<00:08,  2.87it/s][A
Training:  54%|█████▍    | 27/50 [00:09<00:06,  3.65it/s][A
Training:  58%|█████▊    | 29/50 [00:10<00:07,  2.85it/s][A
Training:  64%|██████▍   | 32/50 [00:10<00:04,  4.16it/s][A
Training:  68%|██████▊   | 34/50 [00:11<00:04,  3.39it/s][A
Training:  74%|███████▍  | 37/50 [00:

Epoch: 12/72 - Loss: 0.2134 - Accuracy: 0.9565



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:09,  1.63s/it][A
 57%|█████▋    | 4/7 [00:01<00:01,  2.95it/s][A
100%|██████████| 7/7 [00:02<00:00,  2.56it/s][A
Epochs:  17%|█▋        | 12/72 [03:41<18:26, 18.45s/it]

Val Loss: 0.2602 - Val Accuracy: 0.9453



Training:   0%|          | 0/50 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/50 [00:01<01:14,  1.53s/it][A
Training:   8%|▊         | 4/50 [00:01<00:15,  3.01it/s][A
Training:  12%|█▏        | 6/50 [00:02<00:19,  2.29it/s][A
Training:  18%|█▊        | 9/50 [00:03<00:16,  2.42it/s][A
Training:  24%|██▍       | 12/50 [00:04<00:09,  3.85it/s][A
Training:  28%|██▊       | 14/50 [00:05<00:11,  3.01it/s][A
Training:  32%|███▏      | 16/50 [00:05<00:08,  3.81it/s][A
Training:  34%|███▍      | 17/50 [00:06<00:12,  2.63it/s][A
Training:  38%|███▊      | 19/50 [00:06<00:08,  3.61it/s][A
Training:  40%|████      | 20/50 [00:06<00:07,  3.79it/s][A
Training:  42%|████▏     | 21/50 [00:07<00:11,  2.54it/s][A
Training:  48%|████▊     | 24/50 [00:07<00:06,  3.89it/s][A
Training:  50%|█████     | 25/50 [00:08<00:09,  2.77it/s][A
Training:  54%|█████▍    | 27/50 [00:08<00:06,  3.80it/s][A
Training:  56%|█████▌    | 28/50 [00:09<00:05,  3.75it/s][A
Training:  58%|█████▊    | 29/50 [00

Epoch: 13/72 - Loss: 0.2767 - Accuracy: 0.9552



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:08,  1.44s/it][A
 43%|████▎     | 3/7 [00:01<00:01,  2.38it/s][A
 71%|███████▏  | 5/7 [00:02<00:00,  2.19it/s][A
100%|██████████| 7/7 [00:02<00:00,  2.59it/s][A
Epochs:  18%|█▊        | 13/72 [03:59<18:04, 18.38s/it]

Val Loss: 0.4653 - Val Accuracy: 0.9485



Training:   0%|          | 0/50 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/50 [00:01<01:12,  1.48s/it][A
Training:   4%|▍         | 2/50 [00:01<00:32,  1.45it/s][A
Training:  10%|█         | 5/50 [00:02<00:20,  2.22it/s][A
Training:  12%|█▏        | 6/50 [00:02<00:16,  2.62it/s][A
Training:  18%|█▊        | 9/50 [00:03<00:15,  2.69it/s][A
Training:  20%|██        | 10/50 [00:04<00:13,  3.06it/s][A
Training:  26%|██▌       | 13/50 [00:05<00:12,  3.02it/s][A
Training:  28%|██▊       | 14/50 [00:05<00:10,  3.30it/s][A
Training:  34%|███▍      | 17/50 [00:06<00:10,  3.14it/s][A
Training:  36%|███▌      | 18/50 [00:06<00:09,  3.33it/s][A
Training:  40%|████      | 20/50 [00:06<00:06,  4.59it/s][A
Training:  42%|████▏     | 21/50 [00:07<00:09,  2.95it/s][A
Training:  44%|████▍     | 22/50 [00:07<00:09,  3.11it/s][A
Training:  50%|█████     | 25/50 [00:08<00:08,  3.05it/s][A
Training:  52%|█████▏    | 26/50 [00:08<00:07,  3.33it/s][A
Training:  58%|█████▊    | 29/50 [00:

Epoch: 14/72 - Loss: 0.1711 - Accuracy: 0.9599



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:09,  1.52s/it][A
100%|██████████| 7/7 [00:02<00:00,  2.60it/s][A
Epochs:  19%|█▉        | 14/72 [04:17<17:45, 18.38s/it]

Val Loss: 0.2593 - Val Accuracy: 0.9450



Training:   0%|          | 0/50 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/50 [00:01<01:17,  1.58s/it][A
Training:   8%|▊         | 4/50 [00:01<00:15,  3.05it/s][A
Training:  12%|█▏        | 6/50 [00:02<00:18,  2.40it/s][A
Training:  14%|█▍        | 7/50 [00:02<00:14,  2.90it/s][A
Training:  18%|█▊        | 9/50 [00:03<00:16,  2.44it/s][A
Training:  22%|██▏       | 11/50 [00:03<00:10,  3.58it/s][A
Training:  26%|██▌       | 13/50 [00:05<00:13,  2.66it/s][A
Training:  30%|███       | 15/50 [00:05<00:09,  3.69it/s][A
Training:  34%|███▍      | 17/50 [00:06<00:11,  2.81it/s][A
Training:  36%|███▌      | 18/50 [00:06<00:10,  3.17it/s][A
Training:  42%|████▏     | 21/50 [00:07<00:10,  2.85it/s][A
Training:  50%|█████     | 25/50 [00:08<00:08,  3.09it/s][A
Training:  54%|█████▍    | 27/50 [00:08<00:05,  3.88it/s][A
Training:  58%|█████▊    | 29/50 [00:10<00:07,  2.95it/s][A
Training:  62%|██████▏   | 31/50 [00:10<00:05,  3.77it/s][A
Training:  66%|██████▌   | 33/50 [00:

Epoch: 15/72 - Loss: 0.1205 - Accuracy: 0.9637



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:09,  1.53s/it][A
 57%|█████▋    | 4/7 [00:01<00:01,  2.80it/s][A
100%|██████████| 7/7 [00:02<00:00,  2.56it/s][A
Epochs:  21%|██        | 15/72 [04:36<17:30, 18.43s/it]

Val Loss: 0.2109 - Val Accuracy: 0.9259



Training:   0%|          | 0/50 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/50 [00:01<01:13,  1.50s/it][A
Training:   6%|▌         | 3/50 [00:01<00:20,  2.34it/s][A
Training:  10%|█         | 5/50 [00:02<00:22,  2.02it/s][A
Training:  12%|█▏        | 6/50 [00:02<00:17,  2.57it/s][A
Training:  18%|█▊        | 9/50 [00:03<00:15,  2.73it/s][A
Training:  20%|██        | 10/50 [00:04<00:12,  3.11it/s][A
Training:  26%|██▌       | 13/50 [00:05<00:12,  2.97it/s][A
Training:  30%|███       | 15/50 [00:05<00:08,  3.94it/s][A
Training:  34%|███▍      | 17/50 [00:06<00:11,  2.86it/s][A
Training:  40%|████      | 20/50 [00:06<00:06,  4.32it/s][A
Training:  44%|████▍     | 22/50 [00:07<00:08,  3.16it/s][A
Training:  48%|████▊     | 24/50 [00:07<00:06,  4.03it/s][A
Training:  50%|█████     | 25/50 [00:08<00:09,  2.65it/s][A
Training:  54%|█████▍    | 27/50 [00:08<00:06,  3.65it/s][A
Training:  58%|█████▊    | 29/50 [00:09<00:07,  2.80it/s][A
Training:  62%|██████▏   | 31/50 [00:

Epoch: 16/72 - Loss: 0.1487 - Accuracy: 0.9598



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:09,  1.51s/it][A
 57%|█████▋    | 4/7 [00:01<00:00,  3.18it/s][A
100%|██████████| 7/7 [00:02<00:00,  2.54it/s][A
Epochs:  22%|██▏       | 16/72 [04:54<17:12, 18.43s/it]

Val Loss: 0.3491 - Val Accuracy: 0.9392



Training:   0%|          | 0/50 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/50 [00:01<01:11,  1.47s/it][A
Training:   8%|▊         | 4/50 [00:01<00:14,  3.24it/s][A
Training:  12%|█▏        | 6/50 [00:02<00:18,  2.36it/s][A
Training:  18%|█▊        | 9/50 [00:03<00:15,  2.61it/s][A
Training:  20%|██        | 10/50 [00:03<00:13,  2.86it/s][A
Training:  26%|██▌       | 13/50 [00:05<00:13,  2.84it/s][A
Training:  28%|██▊       | 14/50 [00:05<00:11,  3.16it/s][A
Training:  32%|███▏      | 16/50 [00:05<00:07,  4.31it/s][A
Training:  34%|███▍      | 17/50 [00:06<00:12,  2.71it/s][A
Training:  36%|███▌      | 18/50 [00:06<00:10,  3.15it/s][A
Training:  40%|████      | 20/50 [00:06<00:06,  4.59it/s][A
Training:  44%|████▍     | 22/50 [00:07<00:09,  2.99it/s][A
Training:  48%|████▊     | 24/50 [00:07<00:06,  4.17it/s][A
Training:  52%|█████▏    | 26/50 [00:08<00:08,  2.81it/s][A
Training:  58%|█████▊    | 29/50 [00:09<00:07,  2.83it/s][A
Training:  60%|██████    | 30/50 [00

Epoch: 17/72 - Loss: 0.2209 - Accuracy: 0.9601



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:09,  1.57s/it][A
 57%|█████▋    | 4/7 [00:01<00:00,  3.08it/s][A
100%|██████████| 7/7 [00:02<00:00,  2.52it/s][A
Epochs:  24%|██▎       | 17/72 [05:13<16:54, 18.45s/it]

Val Loss: 0.3103 - Val Accuracy: 0.9414



Training:   0%|          | 0/50 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/50 [00:01<01:15,  1.55s/it][A
Training:   6%|▌         | 3/50 [00:01<00:21,  2.24it/s][A
Training:  10%|█         | 5/50 [00:02<00:23,  1.95it/s][A
Training:  18%|█▊        | 9/50 [00:04<00:15,  2.60it/s][A
Training:  24%|██▍       | 12/50 [00:04<00:09,  4.03it/s][A
Training:  28%|██▊       | 14/50 [00:05<00:12,  2.92it/s][A
Training:  34%|███▍      | 17/50 [00:06<00:11,  2.94it/s][A
Training:  36%|███▌      | 18/50 [00:06<00:10,  3.09it/s][A
Training:  42%|████▏     | 21/50 [00:07<00:09,  3.08it/s][A
Training:  44%|████▍     | 22/50 [00:07<00:08,  3.29it/s][A
Training:  50%|█████     | 25/50 [00:08<00:07,  3.13it/s][A
Training:  52%|█████▏    | 26/50 [00:08<00:07,  3.38it/s][A
Training:  58%|█████▊    | 29/50 [00:09<00:06,  3.15it/s][A
Training:  60%|██████    | 30/50 [00:10<00:05,  3.40it/s][A
Training:  66%|██████▌   | 33/50 [00:11<00:05,  3.35it/s][A
Training:  68%|██████▊   | 34/50 [00

Epoch: 18/72 - Loss: 0.1700 - Accuracy: 0.9603



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:09,  1.56s/it][A
 57%|█████▋    | 4/7 [00:01<00:00,  3.08it/s][A
100%|██████████| 7/7 [00:02<00:00,  2.54it/s][A
Epochs:  25%|██▌       | 18/72 [05:31<16:33, 18.40s/it]

Val Loss: 1.0960 - Val Accuracy: 0.9515



Training:   0%|          | 0/50 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/50 [00:01<01:09,  1.43s/it][A
Training:   4%|▍         | 2/50 [00:01<00:33,  1.42it/s][A
Training:  10%|█         | 5/50 [00:02<00:19,  2.34it/s][A
Training:  12%|█▏        | 6/50 [00:02<00:16,  2.74it/s][A
Training:  18%|█▊        | 9/50 [00:03<00:14,  2.77it/s][A
Training:  20%|██        | 10/50 [00:04<00:12,  3.10it/s][A
Training:  26%|██▌       | 13/50 [00:05<00:12,  3.04it/s][A
Training:  28%|██▊       | 14/50 [00:05<00:10,  3.27it/s][A
Training:  32%|███▏      | 16/50 [00:05<00:07,  4.56it/s][A
Training:  34%|███▍      | 17/50 [00:06<00:11,  2.82it/s][A
Training:  36%|███▌      | 18/50 [00:06<00:10,  3.14it/s][A
Training:  42%|████▏     | 21/50 [00:07<00:10,  2.89it/s][A
Training:  46%|████▌     | 23/50 [00:07<00:06,  3.91it/s][A
Training:  50%|█████     | 25/50 [00:08<00:08,  2.93it/s][A
Training:  52%|█████▏    | 26/50 [00:08<00:07,  3.30it/s][A
Training:  56%|█████▌    | 28/50 [00:

Epoch: 19/72 - Loss: 0.7883 - Accuracy: 0.9494



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:09,  1.54s/it][A
 57%|█████▋    | 4/7 [00:01<00:00,  3.13it/s][A
100%|██████████| 7/7 [00:02<00:00,  2.55it/s][A
Epochs:  26%|██▋       | 19/72 [05:50<16:17, 18.44s/it]

Val Loss: 0.4058 - Val Accuracy: 0.9483



Training:   0%|          | 0/50 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/50 [00:01<01:17,  1.58s/it][A
Training:   6%|▌         | 3/50 [00:01<00:22,  2.11it/s][A
Training:  10%|█         | 5/50 [00:02<00:21,  2.06it/s][A
Training:  12%|█▏        | 6/50 [00:02<00:17,  2.53it/s][A
Training:  18%|█▊        | 9/50 [00:04<00:15,  2.63it/s][A
Training:  20%|██        | 10/50 [00:04<00:13,  2.95it/s][A
Training:  26%|██▌       | 13/50 [00:05<00:13,  2.82it/s][A
Training:  28%|██▊       | 14/50 [00:05<00:11,  3.15it/s][A
Training:  34%|███▍      | 17/50 [00:06<00:10,  3.09it/s][A
Training:  36%|███▌      | 18/50 [00:06<00:09,  3.25it/s][A
Training:  42%|████▏     | 21/50 [00:07<00:09,  3.05it/s][A
Training:  44%|████▍     | 22/50 [00:07<00:08,  3.42it/s][A
Training:  48%|████▊     | 24/50 [00:07<00:05,  4.62it/s][A
Training:  50%|█████     | 25/50 [00:08<00:09,  2.76it/s][A
Training:  52%|█████▏    | 26/50 [00:09<00:07,  3.24it/s][A
Training:  58%|█████▊    | 29/50 [00:

Epoch: 20/72 - Loss: 0.2373 - Accuracy: 0.9549



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:08,  1.50s/it][A
 43%|████▎     | 3/7 [00:01<00:01,  2.33it/s][A
100%|██████████| 7/7 [00:02<00:00,  2.67it/s][A
Epochs:  28%|██▊       | 20/72 [06:08<15:55, 18.38s/it]

Val Loss: 0.2889 - Val Accuracy: 0.9470



Training:   0%|          | 0/50 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/50 [00:01<01:15,  1.53s/it][A
Training:   8%|▊         | 4/50 [00:01<00:15,  3.03it/s][A
Training:  12%|█▏        | 6/50 [00:02<00:18,  2.43it/s][A
Training:  14%|█▍        | 7/50 [00:02<00:14,  2.92it/s][A
Training:  18%|█▊        | 9/50 [00:03<00:17,  2.40it/s][A
Training:  22%|██▏       | 11/50 [00:04<00:11,  3.48it/s][A
Training:  24%|██▍       | 12/50 [00:04<00:09,  4.00it/s][A
Training:  26%|██▌       | 13/50 [00:05<00:15,  2.45it/s][A
Training:  28%|██▊       | 14/50 [00:05<00:12,  2.93it/s][A
Training:  32%|███▏      | 16/50 [00:05<00:07,  4.32it/s][A
Training:  34%|███▍      | 17/50 [00:06<00:12,  2.55it/s][A
Training:  36%|███▌      | 18/50 [00:06<00:10,  3.11it/s][A
Training:  40%|████      | 20/50 [00:06<00:06,  4.29it/s][A
Training:  42%|████▏     | 21/50 [00:07<00:11,  2.54it/s][A
Training:  46%|████▌     | 23/50 [00:07<00:07,  3.81it/s][A
Training:  48%|████▊     | 24/50 [00:

Epoch: 21/72 - Loss: 0.2839 - Accuracy: 0.9547



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:09,  1.53s/it][A
100%|██████████| 7/7 [00:02<00:00,  2.61it/s][A
Epochs:  29%|██▉       | 21/72 [06:26<15:32, 18.28s/it]

Val Loss: 0.4215 - Val Accuracy: 0.9458



Training:   0%|          | 0/50 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/50 [00:01<01:13,  1.51s/it][A
Training:  10%|█         | 5/50 [00:02<00:21,  2.07it/s][A
Training:  14%|█▍        | 7/50 [00:02<00:13,  3.13it/s][A
Training:  18%|█▊        | 9/50 [00:03<00:16,  2.43it/s][A
Training:  22%|██▏       | 11/50 [00:04<00:11,  3.43it/s][A
Training:  26%|██▌       | 13/50 [00:05<00:14,  2.54it/s][A
Training:  30%|███       | 15/50 [00:05<00:09,  3.50it/s][A
Training:  34%|███▍      | 17/50 [00:06<00:11,  2.75it/s][A
Training:  40%|████      | 20/50 [00:06<00:07,  4.28it/s][A
Training:  44%|████▍     | 22/50 [00:07<00:09,  2.96it/s][A
Training:  50%|█████     | 25/50 [00:09<00:08,  2.79it/s][A
Training:  56%|█████▌    | 28/50 [00:09<00:05,  4.00it/s][A
Training:  60%|██████    | 30/50 [00:10<00:06,  3.02it/s][A
Training:  66%|██████▌   | 33/50 [00:11<00:06,  2.80it/s][A
Training:  74%|███████▍  | 37/50 [00:12<00:04,  3.06it/s][A
Training:  82%|████████▏ | 41/50 [00

Epoch: 22/72 - Loss: 0.2637 - Accuracy: 0.9567



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:08,  1.45s/it][A
 29%|██▊       | 2/7 [00:01<00:03,  1.49it/s][A
 57%|█████▋    | 4/7 [00:01<00:00,  3.44it/s][A
100%|██████████| 7/7 [00:02<00:00,  2.57it/s][A
Epochs:  31%|███       | 22/72 [06:45<15:21, 18.44s/it]

Val Loss: 0.6113 - Val Accuracy: 0.9473



Training:   0%|          | 0/50 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/50 [00:01<01:16,  1.57s/it][A
Training:  10%|█         | 5/50 [00:02<00:22,  2.04it/s][A
Training:  18%|█▊        | 9/50 [00:03<00:15,  2.60it/s][A
Training:  24%|██▍       | 12/50 [00:04<00:09,  3.89it/s][A
Training:  28%|██▊       | 14/50 [00:05<00:12,  2.95it/s][A
Training:  34%|███▍      | 17/50 [00:06<00:11,  2.80it/s][A
Training:  42%|████▏     | 21/50 [00:07<00:09,  2.99it/s][A
Training:  48%|████▊     | 24/50 [00:07<00:06,  4.06it/s][A
Training:  52%|█████▏    | 26/50 [00:08<00:07,  3.15it/s][A
Training:  58%|█████▊    | 29/50 [00:10<00:07,  2.90it/s][A
Training:  66%|██████▌   | 33/50 [00:11<00:05,  3.11it/s][A
Training:  74%|███████▍  | 37/50 [00:12<00:03,  3.26it/s][A
Training:  80%|████████  | 40/50 [00:12<00:02,  4.31it/s][A
Training:  84%|████████▍ | 42/50 [00:13<00:02,  3.45it/s][A
Training:  90%|█████████ | 45/50 [00:14<00:01,  3.27it/s][A
Training:  98%|█████████▊| 49/50 [0

Epoch: 23/72 - Loss: 0.2822 - Accuracy: 0.9572



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:08,  1.43s/it][A
 43%|████▎     | 3/7 [00:01<00:01,  2.35it/s][A
100%|██████████| 7/7 [00:02<00:00,  2.62it/s][A
Epochs:  32%|███▏      | 23/72 [07:03<15:01, 18.39s/it]

Val Loss: 0.5254 - Val Accuracy: 0.9394



Training:   0%|          | 0/50 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/50 [00:01<01:18,  1.60s/it][A
Training:   6%|▌         | 3/50 [00:01<00:21,  2.19it/s][A
Training:  10%|█         | 5/50 [00:02<00:21,  2.06it/s][A
Training:  14%|█▍        | 7/50 [00:02<00:14,  3.06it/s][A
Training:  18%|█▊        | 9/50 [00:04<00:16,  2.51it/s][A
Training:  22%|██▏       | 11/50 [00:04<00:11,  3.52it/s][A
Training:  26%|██▌       | 13/50 [00:05<00:13,  2.72it/s][A
Training:  30%|███       | 15/50 [00:05<00:09,  3.54it/s][A
Training:  34%|███▍      | 17/50 [00:06<00:11,  3.00it/s][A
Training:  38%|███▊      | 19/50 [00:06<00:08,  3.68it/s][A
Training:  42%|████▏     | 21/50 [00:07<00:09,  3.07it/s][A
Training:  46%|████▌     | 23/50 [00:07<00:07,  3.54it/s][A
Training:  50%|█████     | 25/50 [00:08<00:07,  3.18it/s][A
Training:  52%|█████▏    | 26/50 [00:08<00:06,  3.55it/s][A
Training:  54%|█████▍    | 27/50 [00:09<00:06,  3.41it/s][A
Training:  58%|█████▊    | 29/50 [00:

Epoch: 24/72 - Loss: 0.2646 - Accuracy: 0.9577



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:09,  1.58s/it][A
 57%|█████▋    | 4/7 [00:01<00:00,  3.04it/s][A
100%|██████████| 7/7 [00:02<00:00,  2.44it/s][A
Epochs:  33%|███▎      | 24/72 [07:22<14:49, 18.54s/it]

Val Loss: 0.2755 - Val Accuracy: 0.9517



Training:   0%|          | 0/50 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/50 [00:01<01:15,  1.53s/it][A
Training:   8%|▊         | 4/50 [00:01<00:14,  3.12it/s][A
Training:  12%|█▏        | 6/50 [00:02<00:19,  2.24it/s][A
Training:  18%|█▊        | 9/50 [00:03<00:16,  2.42it/s][A
Training:  26%|██▌       | 13/50 [00:05<00:13,  2.76it/s][A
Training:  32%|███▏      | 16/50 [00:05<00:08,  3.89it/s][A
Training:  36%|███▌      | 18/50 [00:06<00:10,  3.13it/s][A
Training:  38%|███▊      | 19/50 [00:06<00:09,  3.39it/s][A
Training:  42%|████▏     | 21/50 [00:07<00:10,  2.64it/s][A
Training:  46%|████▌     | 23/50 [00:07<00:07,  3.55it/s][A
Training:  50%|█████     | 25/50 [00:08<00:09,  2.75it/s][A
Training:  56%|█████▌    | 28/50 [00:09<00:05,  4.16it/s][A
Training:  60%|██████    | 30/50 [00:10<00:06,  3.10it/s][A
Training:  66%|██████▌   | 33/50 [00:11<00:05,  2.88it/s][A
Training:  74%|███████▍  | 37/50 [00:12<00:04,  2.98it/s][A
Training:  82%|████████▏ | 41/50 [00

Epoch: 25/72 - Loss: 0.2183 - Accuracy: 0.9579



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:09,  1.59s/it][A
 57%|█████▋    | 4/7 [00:01<00:00,  3.01it/s][A
100%|██████████| 7/7 [00:02<00:00,  2.50it/s][A
Epochs:  35%|███▍      | 25/72 [07:41<14:38, 18.69s/it]

Val Loss: 0.2613 - Val Accuracy: 0.9473



Training:   0%|          | 0/50 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/50 [00:01<01:20,  1.64s/it][A
Training:   8%|▊         | 4/50 [00:01<00:15,  2.94it/s][A
Training:  12%|█▏        | 6/50 [00:02<00:20,  2.17it/s][A
Training:  18%|█▊        | 9/50 [00:04<00:17,  2.39it/s][A
Training:  24%|██▍       | 12/50 [00:04<00:10,  3.77it/s][A
Training:  28%|██▊       | 14/50 [00:05<00:12,  2.95it/s][A
Training:  34%|███▍      | 17/50 [00:06<00:12,  2.66it/s][A
Training:  38%|███▊      | 19/50 [00:06<00:09,  3.42it/s][A
Training:  42%|████▏     | 21/50 [00:07<00:10,  2.79it/s][A
Training:  50%|█████     | 25/50 [00:09<00:08,  2.94it/s][A
Training:  58%|█████▊    | 29/50 [00:10<00:06,  3.18it/s][A
Training:  64%|██████▍   | 32/50 [00:10<00:04,  4.30it/s][A
Training:  68%|██████▊   | 34/50 [00:11<00:04,  3.37it/s][A
Training:  74%|███████▍  | 37/50 [00:12<00:04,  3.09it/s][A
Training:  80%|████████  | 40/50 [00:12<00:02,  4.23it/s][A
Training:  84%|████████▍ | 42/50 [00

Epoch: 26/72 - Loss: 0.3437 - Accuracy: 0.9551



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:09,  1.60s/it][A
100%|██████████| 7/7 [00:02<00:00,  2.52it/s][A
Epochs:  36%|███▌      | 26/72 [08:00<14:22, 18.75s/it]

Val Loss: 0.5451 - Val Accuracy: 0.9492



Training:   0%|          | 0/50 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/50 [00:01<01:15,  1.55s/it][A
Training:   6%|▌         | 3/50 [00:01<00:20,  2.26it/s][A
Training:  10%|█         | 5/50 [00:02<00:22,  2.00it/s][A
Training:  18%|█▊        | 9/50 [00:04<00:16,  2.49it/s][A
Training:  26%|██▌       | 13/50 [00:05<00:13,  2.81it/s][A
Training:  32%|███▏      | 16/50 [00:05<00:08,  3.97it/s][A
Training:  36%|███▌      | 18/50 [00:06<00:10,  3.00it/s][A
Training:  42%|████▏     | 21/50 [00:07<00:10,  2.84it/s][A
Training:  48%|████▊     | 24/50 [00:07<00:06,  3.99it/s][A
Training:  52%|█████▏    | 26/50 [00:09<00:08,  2.95it/s][A
Training:  56%|█████▌    | 28/50 [00:09<00:05,  3.73it/s][A
Training:  60%|██████    | 30/50 [00:10<00:06,  3.04it/s][A
Training:  66%|██████▌   | 33/50 [00:11<00:05,  2.90it/s][A
Training:  74%|███████▍  | 37/50 [00:12<00:04,  3.22it/s][A
Training:  82%|████████▏ | 41/50 [00:13<00:02,  3.30it/s][A
Training:  86%|████████▌ | 43/50 [00

Epoch: 27/72 - Loss: 0.4580 - Accuracy: 0.9529



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:08,  1.43s/it][A
 43%|████▎     | 3/7 [00:01<00:01,  2.43it/s][A
100%|██████████| 7/7 [00:02<00:00,  2.60it/s][A
Epochs:  38%|███▊      | 27/72 [08:19<14:05, 18.80s/it]

Val Loss: 0.4771 - Val Accuracy: 0.9320



Training:   0%|          | 0/50 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/50 [00:01<01:13,  1.50s/it][A
Training:   6%|▌         | 3/50 [00:01<00:20,  2.32it/s][A
Training:  10%|█         | 5/50 [00:02<00:21,  2.12it/s][A
Training:  14%|█▍        | 7/50 [00:02<00:12,  3.37it/s][A
Training:  18%|█▊        | 9/50 [00:03<00:15,  2.57it/s][A
Training:  22%|██▏       | 11/50 [00:03<00:10,  3.59it/s][A
Training:  26%|██▌       | 13/50 [00:05<00:13,  2.79it/s][A
Training:  30%|███       | 15/50 [00:05<00:09,  3.68it/s][A
Training:  34%|███▍      | 17/50 [00:06<00:11,  2.83it/s][A
Training:  36%|███▌      | 18/50 [00:06<00:10,  3.05it/s][A
Training:  42%|████▏     | 21/50 [00:07<00:09,  3.01it/s][A
Training:  44%|████▍     | 22/50 [00:07<00:08,  3.11it/s][A
Training:  50%|█████     | 25/50 [00:08<00:07,  3.16it/s][A
Training:  52%|█████▏    | 26/50 [00:08<00:07,  3.39it/s][A
Training:  58%|█████▊    | 29/50 [00:09<00:06,  3.43it/s][A
Training:  60%|██████    | 30/50 [00:

Epoch: 28/72 - Loss: 0.4625 - Accuracy: 0.9533



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:08,  1.49s/it][A
 43%|████▎     | 3/7 [00:01<00:01,  2.26it/s][A
100%|██████████| 7/7 [00:02<00:00,  2.61it/s][A
Epochs:  39%|███▉      | 28/72 [08:37<13:42, 18.70s/it]

Val Loss: 0.5435 - Val Accuracy: 0.9526



Training:   0%|          | 0/50 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/50 [00:01<01:18,  1.60s/it][A
Training:   6%|▌         | 3/50 [00:01<00:22,  2.13it/s][A
Training:  10%|█         | 5/50 [00:02<00:22,  2.04it/s][A
Training:  12%|█▏        | 6/50 [00:02<00:17,  2.58it/s][A
Training:  16%|█▌        | 8/50 [00:03<00:10,  3.98it/s][A
Training:  18%|█▊        | 9/50 [00:03<00:16,  2.46it/s][A
Training:  20%|██        | 10/50 [00:04<00:14,  2.83it/s][A
Training:  26%|██▌       | 13/50 [00:05<00:13,  2.81it/s][A
Training:  28%|██▊       | 14/50 [00:05<00:11,  3.10it/s][A
Training:  34%|███▍      | 17/50 [00:06<00:11,  2.91it/s][A
Training:  42%|████▏     | 21/50 [00:07<00:09,  3.04it/s][A
Training:  50%|█████     | 25/50 [00:08<00:07,  3.19it/s][A
Training:  58%|█████▊    | 29/50 [00:10<00:06,  3.34it/s][A
Training:  64%|██████▍   | 32/50 [00:10<00:04,  4.40it/s][A
Training:  66%|██████▌   | 33/50 [00:11<00:05,  3.10it/s][A
Training:  74%|███████▍  | 37/50 [00:1

Epoch: 29/72 - Loss: 0.4635 - Accuracy: 0.9551



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:09,  1.57s/it][A
100%|██████████| 7/7 [00:02<00:00,  2.56it/s][A
Epochs:  40%|████      | 29/72 [08:56<13:22, 18.66s/it]

Val Loss: 0.7164 - Val Accuracy: 0.9448



Training:   0%|          | 0/50 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/50 [00:01<01:14,  1.51s/it][A
Training:   6%|▌         | 3/50 [00:01<00:20,  2.27it/s][A
Training:  10%|█         | 5/50 [00:02<00:21,  2.08it/s][A
Training:  12%|█▏        | 6/50 [00:02<00:17,  2.56it/s][A
Training:  18%|█▊        | 9/50 [00:03<00:14,  2.74it/s][A
Training:  20%|██        | 10/50 [00:04<00:13,  3.06it/s][A
Training:  24%|██▍       | 12/50 [00:04<00:08,  4.37it/s][A
Training:  26%|██▌       | 13/50 [00:05<00:13,  2.77it/s][A
Training:  28%|██▊       | 14/50 [00:05<00:11,  3.04it/s][A
Training:  34%|███▍      | 17/50 [00:06<00:11,  2.91it/s][A
Training:  36%|███▌      | 18/50 [00:06<00:10,  3.18it/s][A
Training:  42%|████▏     | 21/50 [00:07<00:09,  2.97it/s][A
Training:  48%|████▊     | 24/50 [00:07<00:05,  4.55it/s][A
Training:  52%|█████▏    | 26/50 [00:08<00:07,  3.18it/s][A
Training:  58%|█████▊    | 29/50 [00:09<00:06,  3.17it/s][A
Training:  60%|██████    | 30/50 [00:

Epoch: 30/72 - Loss: 0.5864 - Accuracy: 0.9507



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:08,  1.46s/it][A
 57%|█████▋    | 4/7 [00:01<00:00,  3.23it/s][A
100%|██████████| 7/7 [00:02<00:00,  2.64it/s][A
Epochs:  42%|████▏     | 30/72 [09:14<13:00, 18.58s/it]

Val Loss: 1.0365 - Val Accuracy: 0.9477



Training:   0%|          | 0/50 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/50 [00:01<01:09,  1.41s/it][A
Training:   4%|▍         | 2/50 [00:01<00:31,  1.50it/s][A
Training:   8%|▊         | 4/50 [00:01<00:13,  3.48it/s][A
Training:  10%|█         | 5/50 [00:02<00:21,  2.06it/s][A
Training:  12%|█▏        | 6/50 [00:02<00:17,  2.57it/s][A
Training:  18%|█▊        | 9/50 [00:03<00:14,  2.84it/s][A
Training:  20%|██        | 10/50 [00:04<00:13,  3.01it/s][A
Training:  26%|██▌       | 13/50 [00:05<00:12,  3.00it/s][A
Training:  28%|██▊       | 14/50 [00:05<00:10,  3.35it/s][A
Training:  34%|███▍      | 17/50 [00:06<00:10,  3.08it/s][A
Training:  38%|███▊      | 19/50 [00:06<00:07,  3.94it/s][A
Training:  42%|████▏     | 21/50 [00:07<00:09,  3.08it/s][A
Training:  44%|████▍     | 22/50 [00:07<00:08,  3.28it/s][A
Training:  50%|█████     | 25/50 [00:08<00:07,  3.22it/s][A
Training:  52%|█████▏    | 26/50 [00:08<00:06,  3.52it/s][A
Training:  58%|█████▊    | 29/50 [00:0

Epoch: 31/72 - Loss: 0.8380 - Accuracy: 0.9491



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:08,  1.45s/it][A
 29%|██▊       | 2/7 [00:01<00:03,  1.44it/s][A
 71%|███████▏  | 5/7 [00:02<00:00,  2.42it/s][A
100%|██████████| 7/7 [00:02<00:00,  2.53it/s][A
Epochs:  43%|████▎     | 31/72 [09:33<12:39, 18.53s/it]

Val Loss: 0.9756 - Val Accuracy: 0.9519



Training:   0%|          | 0/50 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/50 [00:01<01:16,  1.56s/it][A
Training:  10%|█         | 5/50 [00:02<00:22,  2.02it/s][A
Training:  14%|█▍        | 7/50 [00:02<00:14,  3.04it/s][A
Training:  18%|█▊        | 9/50 [00:04<00:17,  2.37it/s][A
Training:  26%|██▌       | 13/50 [00:05<00:13,  2.80it/s][A
Training:  34%|███▍      | 17/50 [00:06<00:11,  2.95it/s][A
Training:  42%|████▏     | 21/50 [00:07<00:09,  3.01it/s][A
Training:  48%|████▊     | 24/50 [00:07<00:06,  4.03it/s][A
Training:  52%|█████▏    | 26/50 [00:08<00:07,  3.27it/s][A
Training:  58%|█████▊    | 29/50 [00:09<00:06,  3.20it/s][A
Training:  64%|██████▍   | 32/50 [00:10<00:04,  4.36it/s][A
Training:  68%|██████▊   | 34/50 [00:11<00:04,  3.23it/s][A
Training:  72%|███████▏  | 36/50 [00:11<00:03,  4.03it/s][A
Training:  76%|███████▌  | 38/50 [00:12<00:04,  2.91it/s][A
Training:  82%|████████▏ | 41/50 [00:13<00:03,  2.76it/s][A
Training:  90%|█████████ | 45/50 [00

Epoch: 32/72 - Loss: 1.2219 - Accuracy: 0.9479



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:08,  1.49s/it][A
 43%|████▎     | 3/7 [00:01<00:01,  2.33it/s][A
 71%|███████▏  | 5/7 [00:02<00:00,  2.28it/s][A
100%|██████████| 7/7 [00:02<00:00,  2.61it/s][A
Epochs:  44%|████▍     | 32/72 [09:51<12:24, 18.61s/it]

Val Loss: 3.9217 - Val Accuracy: 0.8876



Training:   0%|          | 0/50 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/50 [00:01<01:13,  1.50s/it][A
Training:   8%|▊         | 4/50 [00:01<00:14,  3.20it/s][A
Training:  12%|█▏        | 6/50 [00:02<00:18,  2.43it/s][A
Training:  14%|█▍        | 7/50 [00:02<00:14,  2.93it/s][A
Training:  18%|█▊        | 9/50 [00:03<00:17,  2.30it/s][A
Training:  20%|██        | 10/50 [00:04<00:14,  2.74it/s][A
Training:  26%|██▌       | 13/50 [00:05<00:14,  2.61it/s][A
Training:  30%|███       | 15/50 [00:05<00:09,  3.59it/s][A
Training:  34%|███▍      | 17/50 [00:06<00:12,  2.66it/s][A
Training:  36%|███▌      | 18/50 [00:06<00:10,  3.06it/s][A
Training:  42%|████▏     | 21/50 [00:07<00:10,  2.85it/s][A
Training:  46%|████▌     | 23/50 [00:07<00:07,  3.73it/s][A
Training:  50%|█████     | 25/50 [00:08<00:08,  2.92it/s][A
Training:  52%|█████▏    | 26/50 [00:09<00:07,  3.20it/s][A
Training:  58%|█████▊    | 29/50 [00:10<00:06,  3.25it/s][A
Training:  60%|██████    | 30/50 [00:

Epoch: 33/72 - Loss: 3.6943 - Accuracy: 0.9325



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:08,  1.45s/it][A
 43%|████▎     | 3/7 [00:01<00:01,  2.39it/s][A
 71%|███████▏  | 5/7 [00:02<00:00,  2.23it/s][A
100%|██████████| 7/7 [00:02<00:00,  2.60it/s][A
Epochs:  46%|████▌     | 33/72 [10:10<12:09, 18.71s/it]

Val Loss: 4.6260 - Val Accuracy: 0.9418



Training:   0%|          | 0/50 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/50 [00:01<01:13,  1.51s/it][A
Training:   8%|▊         | 4/50 [00:01<00:14,  3.18it/s][A
Training:  12%|█▏        | 6/50 [00:02<00:18,  2.35it/s][A
Training:  18%|█▊        | 9/50 [00:03<00:16,  2.42it/s][A
Training:  22%|██▏       | 11/50 [00:04<00:11,  3.32it/s][A
Training:  26%|██▌       | 13/50 [00:05<00:14,  2.57it/s][A
Training:  32%|███▏      | 16/50 [00:05<00:08,  3.94it/s][A
Training:  36%|███▌      | 18/50 [00:06<00:11,  2.87it/s][A
Training:  42%|████▏     | 21/50 [00:07<00:10,  2.83it/s][A
Training:  48%|████▊     | 24/50 [00:07<00:06,  3.75it/s][A
Training:  50%|█████     | 25/50 [00:08<00:08,  2.88it/s][A
Training:  56%|█████▌    | 28/50 [00:09<00:05,  3.74it/s][A
Training:  58%|█████▊    | 29/50 [00:10<00:07,  2.63it/s][A
Training:  64%|██████▍   | 32/50 [00:10<00:04,  3.76it/s][A
Training:  66%|██████▌   | 33/50 [00:11<00:06,  2.66it/s][A
Training:  72%|███████▏  | 36/50 [00

Epoch: 34/72 - Loss: 6.2484 - Accuracy: 0.9308



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:09,  1.58s/it][A
100%|██████████| 7/7 [00:02<00:00,  2.55it/s][A
Epochs:  47%|████▋     | 34/72 [10:29<11:52, 18.75s/it]

Val Loss: 21.9197 - Val Accuracy: 0.8889



Training:   0%|          | 0/50 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/50 [00:01<01:16,  1.57s/it][A
Training:   8%|▊         | 4/50 [00:01<00:15,  3.07it/s][A
Training:  12%|█▏        | 6/50 [00:02<00:18,  2.41it/s][A
Training:  18%|█▊        | 9/50 [00:03<00:16,  2.54it/s][A
Training:  20%|██        | 10/50 [00:03<00:13,  2.91it/s][A
Training:  26%|██▌       | 13/50 [00:05<00:13,  2.76it/s][A
Training:  32%|███▏      | 16/50 [00:05<00:08,  4.23it/s][A
Training:  36%|███▌      | 18/50 [00:06<00:11,  2.89it/s][A
Training:  42%|████▏     | 21/50 [00:07<00:10,  2.78it/s][A
Training:  48%|████▊     | 24/50 [00:07<00:06,  4.04it/s][A
Training:  52%|█████▏    | 26/50 [00:08<00:07,  3.07it/s][A
Training:  58%|█████▊    | 29/50 [00:09<00:06,  3.19it/s][A
Training:  66%|██████▌   | 33/50 [00:10<00:04,  3.54it/s][A
Training:  74%|███████▍  | 37/50 [00:11<00:03,  3.93it/s][A
Training:  82%|████████▏ | 41/50 [00:12<00:02,  4.02it/s][A
Training:  90%|█████████ | 45/50 [00

Epoch: 35/72 - Loss: 10.0947 - Accuracy: 0.9302



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:07,  1.27s/it][A
100%|██████████| 7/7 [00:02<00:00,  3.15it/s][A
Epochs:  49%|████▊     | 35/72 [10:46<11:09, 18.10s/it]

Val Loss: 15.7007 - Val Accuracy: 0.9343



Training:   0%|          | 0/50 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/50 [00:01<01:00,  1.23s/it][A
Training:   6%|▌         | 3/50 [00:01<00:16,  2.78it/s][A
Training:  10%|█         | 5/50 [00:02<00:18,  2.42it/s][A
Training:  12%|█▏        | 6/50 [00:02<00:14,  3.00it/s][A
Training:  18%|█▊        | 9/50 [00:03<00:14,  2.86it/s][A
Training:  20%|██        | 10/50 [00:03<00:11,  3.34it/s][A
Training:  26%|██▌       | 13/50 [00:04<00:12,  2.96it/s][A
Training:  28%|██▊       | 14/50 [00:04<00:11,  3.10it/s][A
Training:  32%|███▏      | 16/50 [00:05<00:07,  4.27it/s][A
Training:  34%|███▍      | 17/50 [00:05<00:11,  2.96it/s][A
Training:  36%|███▌      | 18/50 [00:06<00:10,  3.05it/s][A
Training:  40%|████      | 20/50 [00:06<00:07,  3.92it/s][A
Training:  42%|████▏     | 21/50 [00:07<00:12,  2.37it/s][A
Training:  44%|████▍     | 22/50 [00:07<00:10,  2.59it/s][A
Training:  48%|████▊     | 24/50 [00:08<00:07,  3.25it/s][A
Training:  50%|█████     | 25/50 [00:

Epoch: 36/72 - Loss: 47.1315 - Accuracy: 0.9179



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:09,  1.64s/it][A
 57%|█████▋    | 4/7 [00:01<00:01,  2.95it/s][A
100%|██████████| 7/7 [00:02<00:00,  2.37it/s][A
Epochs:  50%|█████     | 36/72 [11:05<11:03, 18.42s/it]

Val Loss: 145.1499 - Val Accuracy: 0.8204



Training:   0%|          | 0/50 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/50 [00:01<01:15,  1.54s/it][A
Training:   6%|▌         | 3/50 [00:01<00:21,  2.20it/s][A
Training:  10%|█         | 5/50 [00:02<00:22,  2.01it/s][A
Training:  14%|█▍        | 7/50 [00:02<00:14,  3.07it/s][A
Training:  18%|█▊        | 9/50 [00:04<00:16,  2.43it/s][A
Training:  22%|██▏       | 11/50 [00:04<00:11,  3.37it/s][A
Training:  26%|██▌       | 13/50 [00:05<00:14,  2.52it/s][A
Training:  30%|███       | 15/50 [00:05<00:10,  3.33it/s][A
Training:  34%|███▍      | 17/50 [00:06<00:12,  2.57it/s][A
Training:  36%|███▌      | 18/50 [00:06<00:10,  2.98it/s][A
Training:  38%|███▊      | 19/50 [00:07<00:11,  2.66it/s][A
Training:  42%|████▏     | 21/50 [00:08<00:10,  2.70it/s][A
Training:  46%|████▌     | 23/50 [00:08<00:10,  2.67it/s][A
Training:  50%|█████     | 25/50 [00:09<00:07,  3.13it/s][A
Training:  52%|█████▏    | 26/50 [00:09<00:07,  3.40it/s][A
Training:  54%|█████▍    | 27/50 [00:

Epoch: 37/72 - Loss: 105.0187 - Accuracy: 0.9234



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:10,  1.68s/it][A
100%|██████████| 7/7 [00:02<00:00,  2.41it/s][A
Epochs:  51%|█████▏    | 37/72 [11:25<11:00, 18.88s/it]

Val Loss: 47.3466 - Val Accuracy: 0.9369



Training:   0%|          | 0/50 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/50 [00:01<01:20,  1.64s/it][A
Training:   6%|▌         | 3/50 [00:01<00:22,  2.12it/s][A
Training:  10%|█         | 5/50 [00:02<00:21,  2.09it/s][A
Training:  14%|█▍        | 7/50 [00:02<00:13,  3.11it/s][A
Training:  18%|█▊        | 9/50 [00:03<00:15,  2.61it/s][A
Training:  20%|██        | 10/50 [00:04<00:13,  3.01it/s][A
Training:  22%|██▏       | 11/50 [00:04<00:11,  3.40it/s][A
Training:  26%|██▌       | 13/50 [00:05<00:14,  2.58it/s][A
Training:  30%|███       | 15/50 [00:05<00:10,  3.43it/s][A
Training:  34%|███▍      | 17/50 [00:07<00:15,  2.10it/s][A
Training:  38%|███▊      | 19/50 [00:07<00:10,  2.91it/s][A
Training:  42%|████▏     | 21/50 [00:08<00:12,  2.29it/s][A
Training:  46%|████▌     | 23/50 [00:08<00:08,  3.14it/s][A
Training:  50%|█████     | 25/50 [00:09<00:10,  2.46it/s][A
Training:  54%|█████▍    | 27/50 [00:10<00:06,  3.36it/s][A
Training:  58%|█████▊    | 29/50 [00:

Epoch: 38/72 - Loss: 28.0178 - Accuracy: 0.9482



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:09,  1.61s/it][A
 57%|█████▋    | 4/7 [00:01<00:00,  3.00it/s][A
100%|██████████| 7/7 [00:02<00:00,  2.44it/s][A
Epochs:  53%|█████▎    | 38/72 [11:45<10:57, 19.35s/it]

Val Loss: 24.3871 - Val Accuracy: 0.9458



Training:   0%|          | 0/50 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/50 [00:01<01:13,  1.51s/it][A
Training:   8%|▊         | 4/50 [00:01<00:14,  3.16it/s][A
Training:  12%|█▏        | 6/50 [00:02<00:19,  2.29it/s][A
Training:  16%|█▌        | 8/50 [00:02<00:12,  3.43it/s][A
Training:  20%|██        | 10/50 [00:04<00:15,  2.55it/s][A
Training:  26%|██▌       | 13/50 [00:05<00:14,  2.55it/s][A
Training:  28%|██▊       | 14/50 [00:05<00:12,  2.86it/s][A
Training:  32%|███▏      | 16/50 [00:05<00:09,  3.60it/s][A
Training:  34%|███▍      | 17/50 [00:06<00:15,  2.19it/s][A
Training:  36%|███▌      | 18/50 [00:07<00:13,  2.35it/s][A
Training:  42%|████▏     | 21/50 [00:08<00:11,  2.58it/s][A
Training:  44%|████▍     | 22/50 [00:08<00:09,  2.83it/s][A
Training:  50%|█████     | 25/50 [00:09<00:09,  2.75it/s][A
Training:  56%|█████▌    | 28/50 [00:09<00:05,  4.13it/s][A
Training:  58%|█████▊    | 29/50 [00:10<00:07,  2.83it/s][A
Training:  62%|██████▏   | 31/50 [00

Epoch: 39/72 - Loss: 19.9798 - Accuracy: 0.9495



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:09,  1.64s/it][A
 57%|█████▋    | 4/7 [00:01<00:01,  2.92it/s][A
100%|██████████| 7/7 [00:02<00:00,  2.48it/s][A
Epochs:  54%|█████▍    | 39/72 [12:05<10:44, 19.54s/it]

Val Loss: 36.3004 - Val Accuracy: 0.9473



Training:   0%|          | 0/50 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/50 [00:01<01:15,  1.54s/it][A
Training:   6%|▌         | 3/50 [00:01<00:20,  2.25it/s][A
Training:  10%|█         | 5/50 [00:03<00:25,  1.75it/s][A
Training:  16%|█▌        | 8/50 [00:03<00:12,  3.41it/s][A
Training:  20%|██        | 10/50 [00:04<00:16,  2.38it/s][A
Training:  26%|██▌       | 13/50 [00:05<00:15,  2.37it/s][A
Training:  30%|███       | 15/50 [00:05<00:11,  3.14it/s][A
Training:  34%|███▍      | 17/50 [00:07<00:14,  2.27it/s][A
Training:  38%|███▊      | 19/50 [00:07<00:10,  3.02it/s][A
Training:  42%|████▏     | 21/50 [00:08<00:11,  2.49it/s][A
Training:  48%|████▊     | 24/50 [00:08<00:06,  3.84it/s][A
Training:  52%|█████▏    | 26/50 [00:10<00:08,  2.71it/s][A
Training:  58%|█████▊    | 29/50 [00:11<00:07,  2.67it/s][A
Training:  66%|██████▌   | 33/50 [00:12<00:05,  2.98it/s][A
Training:  68%|██████▊   | 34/50 [00:12<00:04,  3.28it/s][A
Training:  72%|███████▏  | 36/50 [00

Epoch: 40/72 - Loss: 22.3198 - Accuracy: 0.9514



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:10,  1.74s/it][A
 43%|████▎     | 3/7 [00:01<00:01,  2.01it/s][A
100%|██████████| 7/7 [00:02<00:00,  2.43it/s][A
Epochs:  56%|█████▌    | 40/72 [12:26<10:32, 19.78s/it]

Val Loss: 24.9736 - Val Accuracy: 0.9335



Training:   0%|          | 0/50 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/50 [00:01<01:19,  1.62s/it][A
Training:   6%|▌         | 3/50 [00:01<00:22,  2.12it/s][A
Training:  10%|█         | 5/50 [00:02<00:23,  1.89it/s][A
Training:  14%|█▍        | 7/50 [00:03<00:15,  2.71it/s][A
Training:  18%|█▊        | 9/50 [00:04<00:18,  2.28it/s][A
Training:  22%|██▏       | 11/50 [00:04<00:12,  3.03it/s][A
Training:  26%|██▌       | 13/50 [00:05<00:14,  2.55it/s][A
Training:  30%|███       | 15/50 [00:05<00:11,  3.16it/s][A
Training:  34%|███▍      | 17/50 [00:07<00:14,  2.24it/s][A
Training:  38%|███▊      | 19/50 [00:07<00:10,  3.05it/s][A
Training:  42%|████▏     | 21/50 [00:08<00:11,  2.49it/s][A
Training:  46%|████▌     | 23/50 [00:08<00:08,  3.30it/s][A
Training:  50%|█████     | 25/50 [00:09<00:09,  2.60it/s][A
Training:  58%|█████▊    | 29/50 [00:10<00:06,  3.07it/s][A
Training:  62%|██████▏   | 31/50 [00:11<00:04,  3.86it/s][A
Training:  66%|██████▌   | 33/50 [00:

Epoch: 41/72 - Loss: 14.6078 - Accuracy: 0.9537



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:09,  1.59s/it][A
100%|██████████| 7/7 [00:02<00:00,  2.50it/s][A
Epochs:  57%|█████▋    | 41/72 [12:46<10:16, 19.87s/it]

Val Loss: 18.1131 - Val Accuracy: 0.9468



Training:   0%|          | 0/50 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/50 [00:01<01:22,  1.68s/it][A
Training:   6%|▌         | 3/50 [00:01<00:23,  1.98it/s][A
Training:  10%|█         | 5/50 [00:03<00:24,  1.85it/s][A
Training:  14%|█▍        | 7/50 [00:03<00:14,  2.94it/s][A
Training:  18%|█▊        | 9/50 [00:04<00:18,  2.21it/s][A
Training:  24%|██▍       | 12/50 [00:04<00:10,  3.76it/s][A
Training:  28%|██▊       | 14/50 [00:05<00:13,  2.58it/s][A
Training:  30%|███       | 15/50 [00:06<00:13,  2.64it/s][A
Training:  32%|███▏      | 16/50 [00:06<00:11,  2.97it/s][A
Training:  34%|███▍      | 17/50 [00:07<00:17,  1.94it/s][A
Training:  38%|███▊      | 19/50 [00:07<00:10,  2.94it/s][A
Training:  40%|████      | 20/50 [00:07<00:08,  3.42it/s][A
Training:  42%|████▏     | 21/50 [00:08<00:14,  2.04it/s][A
Training:  46%|████▌     | 23/50 [00:09<00:08,  3.17it/s][A
Training:  48%|████▊     | 24/50 [00:09<00:07,  3.61it/s][A
Training:  50%|█████     | 25/50 [00:

Epoch: 42/72 - Loss: 13.1866 - Accuracy: 0.9537



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:09,  1.51s/it][A
 29%|██▊       | 2/7 [00:01<00:03,  1.43it/s][A
100%|██████████| 7/7 [00:02<00:00,  2.47it/s][A
Epochs:  58%|█████▊    | 42/72 [13:06<10:03, 20.12s/it]

Val Loss: 22.6789 - Val Accuracy: 0.9514



Training:   0%|          | 0/50 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/50 [00:01<01:24,  1.73s/it][A
Training:   6%|▌         | 3/50 [00:01<00:23,  2.03it/s][A
Training:  10%|█         | 5/50 [00:03<00:25,  1.76it/s][A
Training:  16%|█▌        | 8/50 [00:03<00:12,  3.31it/s][A
Training:  20%|██        | 10/50 [00:04<00:15,  2.56it/s][A
Training:  24%|██▍       | 12/50 [00:04<00:11,  3.30it/s][A
Training:  26%|██▌       | 13/50 [00:06<00:19,  1.87it/s][A
Training:  30%|███       | 15/50 [00:06<00:12,  2.72it/s][A
Training:  34%|███▍      | 17/50 [00:07<00:15,  2.16it/s][A
Training:  38%|███▊      | 19/50 [00:07<00:10,  2.97it/s][A
Training:  42%|████▏     | 21/50 [00:08<00:12,  2.39it/s][A
Training:  50%|█████     | 25/50 [00:10<00:09,  2.72it/s][A
Training:  54%|█████▍    | 27/50 [00:10<00:06,  3.44it/s][A
Training:  58%|█████▊    | 29/50 [00:11<00:07,  2.80it/s][A
Training:  62%|██████▏   | 31/50 [00:11<00:05,  3.47it/s][A
Training:  66%|██████▌   | 33/50 [00

Epoch: 43/72 - Loss: 13.1625 - Accuracy: 0.9550



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:10,  1.69s/it][A
 43%|████▎     | 3/7 [00:01<00:01,  2.01it/s][A
100%|██████████| 7/7 [00:03<00:00,  2.31it/s][A
Epochs:  60%|█████▉    | 43/72 [13:27<09:49, 20.32s/it]

Val Loss: 18.5947 - Val Accuracy: 0.9462



Training:   0%|          | 0/50 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/50 [00:01<01:22,  1.69s/it][A
Training:   6%|▌         | 3/50 [00:01<00:23,  2.00it/s][A
Training:  10%|█         | 5/50 [00:02<00:23,  1.91it/s][A
Training:  12%|█▏        | 6/50 [00:03<00:18,  2.32it/s][A
Training:  18%|█▊        | 9/50 [00:04<00:16,  2.48it/s][A
Training:  20%|██        | 10/50 [00:04<00:15,  2.60it/s][A
Training:  24%|██▍       | 12/50 [00:04<00:10,  3.75it/s][A
Training:  26%|██▌       | 13/50 [00:05<00:17,  2.11it/s][A
Training:  28%|██▊       | 14/50 [00:06<00:15,  2.35it/s][A
Training:  30%|███       | 15/50 [00:06<00:12,  2.83it/s][A
Training:  34%|███▍      | 17/50 [00:07<00:14,  2.32it/s][A
Training:  38%|███▊      | 19/50 [00:07<00:10,  3.03it/s][A
Training:  42%|████▏     | 21/50 [00:08<00:11,  2.58it/s][A
Training:  44%|████▍     | 22/50 [00:08<00:09,  3.01it/s][A
Training:  46%|████▌     | 23/50 [00:09<00:07,  3.39it/s][A
Training:  50%|█████     | 25/50 [00:

Epoch: 44/72 - Loss: 12.2041 - Accuracy: 0.9577



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:10,  1.72s/it][A
 43%|████▎     | 3/7 [00:01<00:01,  2.06it/s][A
100%|██████████| 7/7 [00:03<00:00,  2.28it/s][A
Epochs:  61%|██████    | 44/72 [13:47<09:28, 20.30s/it]

Val Loss: 17.5157 - Val Accuracy: 0.9495



Training:   0%|          | 0/50 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/50 [00:01<01:21,  1.66s/it][A
Training:   8%|▊         | 4/50 [00:01<00:15,  2.90it/s][A
Training:  12%|█▏        | 6/50 [00:03<00:21,  2.03it/s][A
Training:  18%|█▊        | 9/50 [00:04<00:20,  2.05it/s][A
Training:  20%|██        | 10/50 [00:04<00:17,  2.32it/s][A
Training:  26%|██▌       | 13/50 [00:05<00:15,  2.45it/s][A
Training:  28%|██▊       | 14/50 [00:06<00:13,  2.70it/s][A
Training:  34%|███▍      | 17/50 [00:07<00:12,  2.69it/s][A
Training:  36%|███▌      | 18/50 [00:07<00:11,  2.71it/s][A
Training:  42%|████▏     | 21/50 [00:08<00:10,  2.84it/s][A
Training:  44%|████▍     | 22/50 [00:08<00:09,  2.85it/s][A
Training:  48%|████▊     | 24/50 [00:09<00:06,  3.86it/s][A
Training:  50%|█████     | 25/50 [00:09<00:09,  2.75it/s][A
Training:  52%|█████▏    | 26/50 [00:10<00:07,  3.00it/s][A
Training:  56%|█████▌    | 28/50 [00:10<00:05,  4.32it/s][A
Training:  58%|█████▊    | 29/50 [00

Epoch: 45/72 - Loss: 10.0461 - Accuracy: 0.9564



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:09,  1.63s/it][A
 43%|████▎     | 3/7 [00:01<00:01,  2.13it/s][A
100%|██████████| 7/7 [00:03<00:00,  2.30it/s][A
Epochs:  62%|██████▎   | 45/72 [14:08<09:07, 20.26s/it]

Val Loss: 14.2681 - Val Accuracy: 0.9500



Training:   0%|          | 0/50 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/50 [00:01<01:18,  1.61s/it][A
Training:   4%|▍         | 2/50 [00:01<00:37,  1.30it/s][A
Training:  10%|█         | 5/50 [00:02<00:21,  2.06it/s][A
Training:  12%|█▏        | 6/50 [00:03<00:17,  2.45it/s][A
Training:  18%|█▊        | 9/50 [00:04<00:18,  2.18it/s][A
Training:  22%|██▏       | 11/50 [00:04<00:12,  3.01it/s][A
Training:  26%|██▌       | 13/50 [00:05<00:15,  2.41it/s][A
Training:  30%|███       | 15/50 [00:06<00:11,  3.15it/s][A
Training:  34%|███▍      | 17/50 [00:07<00:12,  2.57it/s][A
Training:  38%|███▊      | 19/50 [00:07<00:09,  3.23it/s][A
Training:  40%|████      | 20/50 [00:07<00:08,  3.56it/s][A
Training:  42%|████▏     | 21/50 [00:08<00:12,  2.40it/s][A
Training:  46%|████▌     | 23/50 [00:08<00:08,  3.29it/s][A
Training:  48%|████▊     | 24/50 [00:08<00:07,  3.70it/s][A
Training:  50%|█████     | 25/50 [00:09<00:10,  2.46it/s][A
Training:  54%|█████▍    | 27/50 [00:

Epoch: 46/72 - Loss: 10.3805 - Accuracy: 0.9562



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:10,  1.78s/it][A
100%|██████████| 7/7 [00:03<00:00,  2.11it/s][A
Epochs:  64%|██████▍   | 46/72 [14:28<08:50, 20.41s/it]

Val Loss: 17.5694 - Val Accuracy: 0.9350



Training:   0%|          | 0/50 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/50 [00:01<01:28,  1.80s/it][A
Training:   8%|▊         | 4/50 [00:01<00:17,  2.68it/s][A
Training:  12%|█▏        | 6/50 [00:03<00:26,  1.69it/s][A
Training:  16%|█▌        | 8/50 [00:03<00:16,  2.58it/s][A
Training:  20%|██        | 10/50 [00:05<00:19,  2.10it/s][A
Training:  24%|██▍       | 12/50 [00:05<00:12,  2.96it/s][A
Training:  28%|██▊       | 14/50 [00:06<00:15,  2.40it/s][A
Training:  34%|███▍      | 17/50 [00:07<00:13,  2.48it/s][A
Training:  38%|███▊      | 19/50 [00:07<00:09,  3.27it/s][A
Training:  42%|████▏     | 21/50 [00:08<00:11,  2.58it/s][A
Training:  50%|█████     | 25/50 [00:10<00:08,  2.86it/s][A
Training:  54%|█████▍    | 27/50 [00:10<00:06,  3.57it/s][A
Training:  58%|█████▊    | 29/50 [00:11<00:06,  3.02it/s][A
Training:  62%|██████▏   | 31/50 [00:11<00:04,  3.89it/s][A
Training:  66%|██████▌   | 33/50 [00:12<00:05,  3.08it/s][A
Training:  68%|██████▊   | 34/50 [00

Epoch: 47/72 - Loss: 8.1764 - Accuracy: 0.9586



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:09,  1.65s/it][A
 43%|████▎     | 3/7 [00:01<00:01,  2.14it/s][A
100%|██████████| 7/7 [00:03<00:00,  2.17it/s][A
Epochs:  65%|██████▌   | 47/72 [14:49<08:29, 20.39s/it]

Val Loss: 14.2962 - Val Accuracy: 0.9394



Training:   0%|          | 0/50 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/50 [00:01<01:21,  1.67s/it][A
Training:   6%|▌         | 3/50 [00:01<00:23,  2.03it/s][A
Training:  10%|█         | 5/50 [00:03<00:30,  1.48it/s][A
Training:  14%|█▍        | 7/50 [00:03<00:17,  2.40it/s][A
Training:  18%|█▊        | 9/50 [00:04<00:19,  2.10it/s][A
Training:  22%|██▏       | 11/50 [00:04<00:13,  2.96it/s][A
Training:  26%|██▌       | 13/50 [00:06<00:15,  2.33it/s][A
Training:  32%|███▏      | 16/50 [00:06<00:09,  3.76it/s][A
Training:  36%|███▌      | 18/50 [00:07<00:11,  2.68it/s][A
Training:  42%|████▏     | 21/50 [00:08<00:11,  2.53it/s][A
Training:  48%|████▊     | 24/50 [00:09<00:07,  3.70it/s][A
Training:  52%|█████▏    | 26/50 [00:10<00:07,  3.01it/s][A
Training:  58%|█████▊    | 29/50 [00:11<00:07,  2.74it/s][A
Training:  64%|██████▍   | 32/50 [00:11<00:04,  3.84it/s][A
Training:  68%|██████▊   | 34/50 [00:12<00:05,  3.18it/s][A
Training:  74%|███████▍  | 37/50 [00:

Epoch: 48/72 - Loss: 10.4519 - Accuracy: 0.9583



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:11,  1.90s/it][A
 43%|████▎     | 3/7 [00:02<00:02,  1.89it/s][A
 71%|███████▏  | 5/7 [00:03<00:01,  1.91it/s][A
100%|██████████| 7/7 [00:03<00:00,  2.14it/s][A
Epochs:  67%|██████▋   | 48/72 [15:09<08:12, 20.50s/it]

Val Loss: 17.7513 - Val Accuracy: 0.9462



Training:   0%|          | 0/50 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/50 [00:02<01:38,  2.02s/it][A
Training:   6%|▌         | 3/50 [00:02<00:26,  1.76it/s][A
Training:  10%|█         | 5/50 [00:03<00:26,  1.69it/s][A
Training:  16%|█▌        | 8/50 [00:03<00:14,  2.99it/s][A
Training:  18%|█▊        | 9/50 [00:04<00:19,  2.07it/s][A
Training:  22%|██▏       | 11/50 [00:04<00:13,  2.94it/s][A
Training:  26%|██▌       | 13/50 [00:06<00:15,  2.36it/s][A
Training:  28%|██▊       | 14/50 [00:06<00:13,  2.76it/s][A
Training:  32%|███▏      | 16/50 [00:06<00:09,  3.77it/s][A
Training:  34%|███▍      | 17/50 [00:07<00:13,  2.38it/s][A
Training:  38%|███▊      | 19/50 [00:07<00:09,  3.41it/s][A
Training:  40%|████      | 20/50 [00:07<00:07,  3.94it/s][A
Training:  42%|████▏     | 21/50 [00:08<00:11,  2.49it/s][A
Training:  46%|████▌     | 23/50 [00:08<00:07,  3.76it/s][A
Training:  50%|█████     | 25/50 [00:09<00:08,  2.95it/s][A
Training:  52%|█████▏    | 26/50 [00:

Epoch: 49/72 - Loss: 10.3928 - Accuracy: 0.9571



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:11,  1.99s/it][A
 57%|█████▋    | 4/7 [00:02<00:01,  2.41it/s][A
100%|██████████| 7/7 [00:03<00:00,  2.06it/s][A
Epochs:  68%|██████▊   | 49/72 [15:30<07:51, 20.49s/it]

Val Loss: 20.2823 - Val Accuracy: 0.9392



Training:   0%|          | 0/50 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/50 [00:02<01:42,  2.09s/it][A
Training:   4%|▍         | 2/50 [00:02<00:44,  1.07it/s][A
Training:   8%|▊         | 4/50 [00:02<00:17,  2.62it/s][A
Training:  12%|█▏        | 6/50 [00:03<00:21,  2.07it/s][A
Training:  18%|█▊        | 9/50 [00:04<00:16,  2.41it/s][A
Training:  20%|██        | 10/50 [00:04<00:14,  2.73it/s][A
Training:  24%|██▍       | 12/50 [00:04<00:09,  3.91it/s][A
Training:  26%|██▌       | 13/50 [00:06<00:16,  2.27it/s][A
Training:  28%|██▊       | 14/50 [00:06<00:13,  2.73it/s][A
Training:  32%|███▏      | 16/50 [00:06<00:08,  4.05it/s][A
Training:  36%|███▌      | 18/50 [00:07<00:12,  2.66it/s][A
Training:  42%|████▏     | 21/50 [00:08<00:10,  2.65it/s][A
Training:  50%|█████     | 25/50 [00:09<00:08,  2.94it/s][A
Training:  54%|█████▍    | 27/50 [00:09<00:06,  3.69it/s][A
Training:  58%|█████▊    | 29/50 [00:10<00:07,  2.91it/s][A
Training:  64%|██████▍   | 32/50 [00:

Epoch: 50/72 - Loss: 13.1076 - Accuracy: 0.9574



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:02<00:12,  2.11s/it][A
100%|██████████| 7/7 [00:03<00:00,  2.02it/s][A
Epochs:  69%|██████▉   | 50/72 [15:51<07:33, 20.62s/it]

Val Loss: 19.3820 - Val Accuracy: 0.9384



Training:   0%|          | 0/50 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/50 [00:02<01:44,  2.14s/it][A
Training:   6%|▌         | 3/50 [00:02<00:28,  1.65it/s][A
Training:  10%|█         | 5/50 [00:03<00:26,  1.71it/s][A
Training:  14%|█▍        | 7/50 [00:03<00:15,  2.76it/s][A
Training:  18%|█▊        | 9/50 [00:04<00:19,  2.11it/s][A
Training:  24%|██▍       | 12/50 [00:04<00:10,  3.58it/s][A
Training:  28%|██▊       | 14/50 [00:06<00:13,  2.65it/s][A
Training:  34%|███▍      | 17/50 [00:07<00:12,  2.60it/s][A
Training:  38%|███▊      | 19/50 [00:07<00:09,  3.37it/s][A
Training:  42%|████▏     | 21/50 [00:08<00:10,  2.85it/s][A
Training:  50%|█████     | 25/50 [00:09<00:07,  3.19it/s][A
Training:  54%|█████▍    | 27/50 [00:09<00:05,  3.90it/s][A
Training:  58%|█████▊    | 29/50 [00:10<00:06,  3.08it/s][A
Training:  60%|██████    | 30/50 [00:10<00:05,  3.37it/s][A
Training:  64%|██████▍   | 32/50 [00:11<00:04,  3.89it/s][A
Training:  66%|██████▌   | 33/50 [00:

Epoch: 51/72 - Loss: 11.7207 - Accuracy: 0.9579



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:11,  1.93s/it][A
 43%|████▎     | 3/7 [00:02<00:02,  1.85it/s][A
100%|██████████| 7/7 [00:03<00:00,  2.07it/s][A
Epochs:  71%|███████   | 51/72 [16:12<07:14, 20.69s/it]

Val Loss: 16.7245 - Val Accuracy: 0.9534



Training:   0%|          | 0/50 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/50 [00:02<01:43,  2.11s/it][A
Training:   6%|▌         | 3/50 [00:02<00:27,  1.70it/s][A
Training:  10%|█         | 5/50 [00:03<00:28,  1.59it/s][A
Training:  14%|█▍        | 7/50 [00:03<00:16,  2.59it/s][A
Training:  18%|█▊        | 9/50 [00:04<00:19,  2.06it/s][A
Training:  22%|██▏       | 11/50 [00:05<00:13,  2.98it/s][A
Training:  26%|██▌       | 13/50 [00:06<00:15,  2.34it/s][A
Training:  32%|███▏      | 16/50 [00:06<00:08,  3.79it/s][A
Training:  36%|███▌      | 18/50 [00:07<00:10,  2.93it/s][A
Training:  40%|████      | 20/50 [00:07<00:07,  3.88it/s][A
Training:  44%|████▍     | 22/50 [00:08<00:09,  2.95it/s][A
Training:  50%|█████     | 25/50 [00:09<00:08,  2.86it/s][A
Training:  54%|█████▍    | 27/50 [00:09<00:06,  3.62it/s][A
Training:  58%|█████▊    | 29/50 [00:11<00:07,  2.80it/s][A
Training:  64%|██████▍   | 32/50 [00:11<00:04,  4.16it/s][A
Training:  68%|██████▊   | 34/50 [00:

Epoch: 52/72 - Loss: 11.3344 - Accuracy: 0.9603



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:02<00:12,  2.03s/it][A
100%|██████████| 7/7 [00:03<00:00,  2.08it/s][A
Epochs:  72%|███████▏  | 52/72 [16:33<06:55, 20.78s/it]

Val Loss: 20.8172 - Val Accuracy: 0.9396



Training:   0%|          | 0/50 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/50 [00:02<01:48,  2.21s/it][A
Training:   8%|▊         | 4/50 [00:02<00:20,  2.25it/s][A
Training:  12%|█▏        | 6/50 [00:03<00:23,  1.88it/s][A
Training:  16%|█▌        | 8/50 [00:03<00:14,  2.88it/s][A
Training:  20%|██        | 10/50 [00:04<00:17,  2.25it/s][A
Training:  26%|██▌       | 13/50 [00:06<00:15,  2.39it/s][A
Training:  30%|███       | 15/50 [00:06<00:11,  3.13it/s][A
Training:  34%|███▍      | 17/50 [00:07<00:12,  2.60it/s][A
Training:  42%|████▏     | 21/50 [00:08<00:09,  2.92it/s][A
Training:  48%|████▊     | 24/50 [00:08<00:06,  4.07it/s][A
Training:  52%|█████▏    | 26/50 [00:09<00:08,  2.91it/s][A
Training:  58%|█████▊    | 29/50 [00:11<00:07,  2.79it/s][A
Training:  64%|██████▍   | 32/50 [00:11<00:04,  3.94it/s][A
Training:  68%|██████▊   | 34/50 [00:12<00:05,  2.88it/s][A
Training:  74%|███████▍  | 37/50 [00:13<00:04,  2.67it/s][A
Training:  80%|████████  | 40/50 [00

Epoch: 53/72 - Loss: 12.0061 - Accuracy: 0.9571



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:11,  1.87s/it][A
 29%|██▊       | 2/7 [00:02<00:04,  1.06it/s][A
 71%|███████▏  | 5/7 [00:03<00:00,  2.06it/s][A
100%|██████████| 7/7 [00:03<00:00,  2.05it/s][A
Epochs:  74%|███████▎  | 53/72 [16:54<06:36, 20.86s/it]

Val Loss: 16.2246 - Val Accuracy: 0.9446



Training:   0%|          | 0/50 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/50 [00:02<01:39,  2.03s/it][A
Training:   6%|▌         | 3/50 [00:02<00:27,  1.72it/s][A
Training:  10%|█         | 5/50 [00:03<00:24,  1.81it/s][A
Training:  16%|█▌        | 8/50 [00:03<00:11,  3.56it/s][A
Training:  20%|██        | 10/50 [00:04<00:15,  2.63it/s][A
Training:  26%|██▌       | 13/50 [00:05<00:14,  2.57it/s][A
Training:  30%|███       | 15/50 [00:05<00:10,  3.37it/s][A
Training:  34%|███▍      | 17/50 [00:06<00:11,  2.81it/s][A
Training:  38%|███▊      | 19/50 [00:06<00:08,  3.67it/s][A
Training:  42%|████▏     | 21/50 [00:08<00:10,  2.71it/s][A
Training:  46%|████▌     | 23/50 [00:08<00:08,  3.37it/s][A
Training:  50%|█████     | 25/50 [00:09<00:08,  2.83it/s][A
Training:  54%|█████▍    | 27/50 [00:09<00:06,  3.65it/s][A
Training:  58%|█████▊    | 29/50 [00:10<00:07,  2.78it/s][A
Training:  62%|██████▏   | 31/50 [00:10<00:05,  3.65it/s][A
Training:  66%|██████▌   | 33/50 [00

Epoch: 54/72 - Loss: 10.6971 - Accuracy: 0.9605



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:02<00:12,  2.03s/it][A
 29%|██▊       | 2/7 [00:02<00:04,  1.02it/s][A
 57%|█████▋    | 4/7 [00:02<00:01,  2.52it/s][A
100%|██████████| 7/7 [00:03<00:00,  2.04it/s][A
Epochs:  75%|███████▌  | 54/72 [17:14<06:14, 20.81s/it]

Val Loss: 20.3545 - Val Accuracy: 0.9387



Training:   0%|          | 0/50 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/50 [00:01<01:34,  1.93s/it][A
Training:   8%|▊         | 4/50 [00:02<00:18,  2.55it/s][A
Training:  12%|█▏        | 6/50 [00:03<00:21,  2.06it/s][A
Training:  18%|█▊        | 9/50 [00:04<00:18,  2.18it/s][A
Training:  26%|██▌       | 13/50 [00:05<00:14,  2.60it/s][A
Training:  34%|███▍      | 17/50 [00:07<00:11,  2.80it/s][A
Training:  42%|████▏     | 21/50 [00:08<00:09,  2.95it/s][A
Training:  50%|█████     | 25/50 [00:09<00:08,  3.07it/s][A
Training:  54%|█████▍    | 27/50 [00:09<00:06,  3.67it/s][A
Training:  58%|█████▊    | 29/50 [00:10<00:07,  2.94it/s][A
Training:  64%|██████▍   | 32/50 [00:10<00:04,  4.08it/s][A
Training:  68%|██████▊   | 34/50 [00:12<00:05,  3.04it/s][A
Training:  72%|███████▏  | 36/50 [00:12<00:03,  3.70it/s][A
Training:  74%|███████▍  | 37/50 [00:13<00:05,  2.50it/s][A
Training:  80%|████████  | 40/50 [00:13<00:02,  3.81it/s][A
Training:  84%|████████▍ | 42/50 [00

Epoch: 55/72 - Loss: 10.1172 - Accuracy: 0.9582



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:02<00:12,  2.03s/it][A
 57%|█████▋    | 4/7 [00:02<00:01,  2.42it/s][A
100%|██████████| 7/7 [00:03<00:00,  2.12it/s][A
Epochs:  76%|███████▋  | 55/72 [17:35<05:52, 20.75s/it]

Val Loss: 19.6137 - Val Accuracy: 0.9482



Training:   0%|          | 0/50 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/50 [00:01<01:28,  1.81s/it][A
Training:   6%|▌         | 3/50 [00:01<00:23,  1.97it/s][A
Training:  10%|█         | 5/50 [00:03<00:24,  1.84it/s][A
Training:  14%|█▍        | 7/50 [00:03<00:14,  2.99it/s][A
Training:  18%|█▊        | 9/50 [00:04<00:17,  2.38it/s][A
Training:  24%|██▍       | 12/50 [00:04<00:09,  3.87it/s][A
Training:  28%|██▊       | 14/50 [00:05<00:12,  2.86it/s][A
Training:  32%|███▏      | 16/50 [00:05<00:08,  3.84it/s][A
Training:  36%|███▌      | 18/50 [00:06<00:11,  2.79it/s][A
Training:  42%|████▏     | 21/50 [00:07<00:10,  2.78it/s][A
Training:  46%|████▌     | 23/50 [00:08<00:07,  3.60it/s][A
Training:  50%|█████     | 25/50 [00:09<00:09,  2.75it/s][A
Training:  54%|█████▍    | 27/50 [00:09<00:06,  3.64it/s][A
Training:  58%|█████▊    | 29/50 [00:10<00:07,  2.64it/s][A
Training:  62%|██████▏   | 31/50 [00:10<00:05,  3.53it/s][A
Training:  66%|██████▌   | 33/50 [00:

Epoch: 56/72 - Loss: 13.8496 - Accuracy: 0.9587



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:10,  1.74s/it][A
 57%|█████▋    | 4/7 [00:01<00:01,  2.78it/s][A
100%|██████████| 7/7 [00:02<00:00,  2.42it/s][A
Epochs:  78%|███████▊  | 56/72 [17:55<05:29, 20.57s/it]

Val Loss: 18.0903 - Val Accuracy: 0.9561



Training:   0%|          | 0/50 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/50 [00:01<01:25,  1.75s/it][A
Training:  10%|█         | 5/50 [00:03<00:25,  1.77it/s][A
Training:  14%|█▍        | 7/50 [00:03<00:16,  2.68it/s][A
Training:  18%|█▊        | 9/50 [00:04<00:17,  2.28it/s][A
Training:  26%|██▌       | 13/50 [00:05<00:14,  2.53it/s][A
Training:  32%|███▏      | 16/50 [00:05<00:09,  3.64it/s][A
Training:  34%|███▍      | 17/50 [00:07<00:13,  2.54it/s][A
Training:  40%|████      | 20/50 [00:07<00:07,  3.87it/s][A
Training:  44%|████▍     | 22/50 [00:08<00:09,  2.87it/s][A
Training:  48%|████▊     | 24/50 [00:08<00:07,  3.67it/s][A
Training:  52%|█████▏    | 26/50 [00:09<00:08,  2.88it/s][A
Training:  58%|█████▊    | 29/50 [00:10<00:07,  2.70it/s][A
Training:  62%|██████▏   | 31/50 [00:10<00:05,  3.47it/s][A
Training:  66%|██████▌   | 33/50 [00:12<00:06,  2.72it/s][A
Training:  72%|███████▏  | 36/50 [00:12<00:03,  4.04it/s][A
Training:  76%|███████▌  | 38/50 [00

Epoch: 57/72 - Loss: 13.6154 - Accuracy: 0.9594



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:09,  1.66s/it][A
100%|██████████| 7/7 [00:02<00:00,  2.48it/s][A
Epochs:  79%|███████▉  | 57/72 [18:15<05:06, 20.42s/it]

Val Loss: 29.0808 - Val Accuracy: 0.9357



Training:   0%|          | 0/50 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/50 [00:01<01:16,  1.57s/it][A
Training:   4%|▍         | 2/50 [00:01<00:35,  1.35it/s][A
Training:  10%|█         | 5/50 [00:02<00:22,  2.01it/s][A
Training:  12%|█▏        | 6/50 [00:03<00:18,  2.41it/s][A
Training:  18%|█▊        | 9/50 [00:04<00:15,  2.71it/s][A
Training:  20%|██        | 10/50 [00:04<00:13,  2.95it/s][A
Training:  26%|██▌       | 13/50 [00:05<00:12,  2.99it/s][A
Training:  28%|██▊       | 14/50 [00:05<00:12,  2.94it/s][A
Training:  34%|███▍      | 17/50 [00:06<00:10,  3.01it/s][A
Training:  36%|███▌      | 18/50 [00:06<00:10,  3.11it/s][A
Training:  40%|████      | 20/50 [00:07<00:07,  4.21it/s][A
Training:  42%|████▏     | 21/50 [00:07<00:09,  3.15it/s][A
Training:  44%|████▍     | 22/50 [00:08<00:09,  2.80it/s][A
Training:  50%|█████     | 25/50 [00:08<00:07,  3.33it/s][A
Training:  52%|█████▏    | 26/50 [00:09<00:07,  3.09it/s][A
Training:  58%|█████▊    | 29/50 [00:

Epoch: 58/72 - Loss: 15.6727 - Accuracy: 0.9568



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:09,  1.64s/it][A
100%|██████████| 7/7 [00:02<00:00,  2.45it/s][A
Epochs:  81%|████████  | 58/72 [18:35<04:42, 20.21s/it]

Val Loss: 25.9431 - Val Accuracy: 0.9458



Training:   0%|          | 0/50 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/50 [00:01<01:21,  1.67s/it][A
Training:   4%|▍         | 2/50 [00:01<00:35,  1.33it/s][A
Training:   8%|▊         | 4/50 [00:01<00:15,  2.99it/s][A
Training:  10%|█         | 5/50 [00:03<00:24,  1.80it/s][A
Training:  16%|█▌        | 8/50 [00:03<00:10,  3.86it/s][A
Training:  20%|██        | 10/50 [00:04<00:15,  2.65it/s][A
Training:  26%|██▌       | 13/50 [00:05<00:14,  2.58it/s][A
Training:  30%|███       | 15/50 [00:05<00:10,  3.40it/s][A
Training:  34%|███▍      | 17/50 [00:06<00:12,  2.58it/s][A
Training:  42%|████▏     | 21/50 [00:08<00:10,  2.84it/s][A
Training:  46%|████▌     | 23/50 [00:08<00:07,  3.57it/s][A
Training:  50%|█████     | 25/50 [00:09<00:08,  2.80it/s][A
Training:  54%|█████▍    | 27/50 [00:09<00:06,  3.63it/s][A
Training:  58%|█████▊    | 29/50 [00:10<00:07,  2.63it/s][A
Training:  62%|██████▏   | 31/50 [00:10<00:05,  3.48it/s][A
Training:  66%|██████▌   | 33/50 [00:

Epoch: 59/72 - Loss: 16.3338 - Accuracy: 0.9571



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:08,  1.47s/it][A
 57%|█████▋    | 4/7 [00:01<00:00,  3.05it/s][A
100%|██████████| 7/7 [00:02<00:00,  2.62it/s][A
Epochs:  82%|████████▏ | 59/72 [18:55<04:21, 20.11s/it]

Val Loss: 21.9447 - Val Accuracy: 0.9519



Training:   0%|          | 0/50 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/50 [00:01<01:18,  1.61s/it][A
Training:   4%|▍         | 2/50 [00:01<00:36,  1.33it/s][A
Training:  10%|█         | 5/50 [00:02<00:20,  2.16it/s][A
Training:  12%|█▏        | 6/50 [00:03<00:18,  2.43it/s][A
Training:  18%|█▊        | 9/50 [00:04<00:15,  2.72it/s][A
Training:  20%|██        | 10/50 [00:04<00:13,  3.08it/s][A
Training:  26%|██▌       | 13/50 [00:05<00:13,  2.81it/s][A
Training:  30%|███       | 15/50 [00:05<00:09,  3.75it/s][A
Training:  34%|███▍      | 17/50 [00:06<00:11,  2.82it/s][A
Training:  40%|████      | 20/50 [00:06<00:07,  4.25it/s][A
Training:  42%|████▏     | 21/50 [00:07<00:10,  2.80it/s][A
Training:  44%|████▍     | 22/50 [00:07<00:08,  3.22it/s][A
Training:  50%|█████     | 25/50 [00:09<00:08,  2.93it/s][A
Training:  52%|█████▏    | 26/50 [00:09<00:07,  3.04it/s][A
Training:  56%|█████▌    | 28/50 [00:09<00:05,  4.22it/s][A
Training:  58%|█████▊    | 29/50 [00:

Epoch: 60/72 - Loss: 14.9397 - Accuracy: 0.9601



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:09,  1.56s/it][A
 43%|████▎     | 3/7 [00:01<00:01,  2.25it/s][A
100%|██████████| 7/7 [00:02<00:00,  2.39it/s][A
Epochs:  83%|████████▎ | 60/72 [19:15<04:00, 20.03s/it]

Val Loss: 30.5868 - Val Accuracy: 0.9389



Training:   0%|          | 0/50 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/50 [00:01<01:28,  1.80s/it][A
Training:   4%|▍         | 2/50 [00:01<00:38,  1.23it/s][A
Training:  10%|█         | 5/50 [00:03<00:23,  1.89it/s][A
Training:  14%|█▍        | 7/50 [00:03<00:14,  2.96it/s][A
Training:  18%|█▊        | 9/50 [00:04<00:16,  2.56it/s][A
Training:  24%|██▍       | 12/50 [00:04<00:09,  4.21it/s][A
Training:  28%|██▊       | 14/50 [00:05<00:12,  2.95it/s][A
Training:  32%|███▏      | 16/50 [00:05<00:08,  3.94it/s][A
Training:  36%|███▌      | 18/50 [00:06<00:11,  2.77it/s][A
Training:  42%|████▏     | 21/50 [00:07<00:10,  2.85it/s][A
Training:  44%|████▍     | 22/50 [00:08<00:09,  3.09it/s][A
Training:  48%|████▊     | 24/50 [00:08<00:06,  4.10it/s][A
Training:  50%|█████     | 25/50 [00:09<00:09,  2.52it/s][A
Training:  54%|█████▍    | 27/50 [00:09<00:06,  3.53it/s][A
Training:  58%|█████▊    | 29/50 [00:10<00:08,  2.61it/s][A
Training:  62%|██████▏   | 31/50 [00:

Epoch: 61/72 - Loss: 15.1886 - Accuracy: 0.9584



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:09,  1.66s/it][A
 57%|█████▋    | 4/7 [00:01<00:01,  2.93it/s][A
100%|██████████| 7/7 [00:02<00:00,  2.38it/s][A
Epochs:  85%|████████▍ | 61/72 [19:35<03:40, 20.02s/it]

Val Loss: 24.2349 - Val Accuracy: 0.9494



Training:   0%|          | 0/50 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/50 [00:01<01:24,  1.72s/it][A
Training:  10%|█         | 5/50 [00:02<00:23,  1.94it/s][A
Training:  12%|█▏        | 6/50 [00:03<00:18,  2.39it/s][A
Training:  16%|█▌        | 8/50 [00:03<00:11,  3.64it/s][A
Training:  20%|██        | 10/50 [00:04<00:14,  2.71it/s][A
Training:  22%|██▏       | 11/50 [00:04<00:12,  3.14it/s][A
Training:  26%|██▌       | 13/50 [00:05<00:14,  2.47it/s][A
Training:  30%|███       | 15/50 [00:05<00:10,  3.48it/s][A
Training:  34%|███▍      | 17/50 [00:06<00:12,  2.69it/s][A
Training:  38%|███▊      | 19/50 [00:06<00:08,  3.63it/s][A
Training:  42%|████▏     | 21/50 [00:07<00:10,  2.77it/s][A
Training:  46%|████▌     | 23/50 [00:08<00:07,  3.77it/s][A
Training:  50%|█████     | 25/50 [00:09<00:09,  2.66it/s][A
Training:  54%|█████▍    | 27/50 [00:09<00:06,  3.62it/s][A
Training:  58%|█████▊    | 29/50 [00:10<00:08,  2.53it/s][A
Training:  64%|██████▍   | 32/50 [00

Epoch: 62/72 - Loss: 19.0970 - Accuracy: 0.9558



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:09,  1.52s/it][A
 29%|██▊       | 2/7 [00:01<00:03,  1.36it/s][A
 71%|███████▏  | 5/7 [00:02<00:00,  2.29it/s][A
100%|██████████| 7/7 [00:02<00:00,  2.38it/s][A
Epochs:  86%|████████▌ | 62/72 [19:55<03:19, 19.98s/it]

Val Loss: 28.2342 - Val Accuracy: 0.9529



Training:   0%|          | 0/50 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/50 [00:01<01:21,  1.66s/it][A
Training:   6%|▌         | 3/50 [00:01<00:22,  2.08it/s][A
Training:  10%|█         | 5/50 [00:02<00:23,  1.92it/s][A
Training:  14%|█▍        | 7/50 [00:03<00:14,  3.07it/s][A
Training:  18%|█▊        | 9/50 [00:03<00:15,  2.61it/s][A
Training:  20%|██        | 10/50 [00:04<00:14,  2.80it/s][A
Training:  24%|██▍       | 12/50 [00:04<00:09,  4.01it/s][A
Training:  26%|██▌       | 13/50 [00:05<00:13,  2.84it/s][A
Training:  28%|██▊       | 14/50 [00:05<00:12,  2.96it/s][A
Training:  32%|███▏      | 16/50 [00:05<00:07,  4.36it/s][A
Training:  34%|███▍      | 17/50 [00:06<00:10,  3.03it/s][A
Training:  36%|███▌      | 18/50 [00:06<00:09,  3.24it/s][A
Training:  42%|████▏     | 21/50 [00:07<00:07,  3.70it/s][A
Training:  44%|████▍     | 22/50 [00:07<00:07,  3.55it/s][A
Training:  50%|█████     | 25/50 [00:08<00:07,  3.55it/s][A
Training:  52%|█████▏    | 26/50 [00:

Epoch: 63/72 - Loss: 17.4330 - Accuracy: 0.9582



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:09,  1.61s/it][A
 57%|█████▋    | 4/7 [00:01<00:01,  2.96it/s][A
100%|██████████| 7/7 [00:02<00:00,  2.57it/s][A
Epochs:  88%|████████▊ | 63/72 [20:13<02:54, 19.38s/it]

Val Loss: 26.3291 - Val Accuracy: 0.9349



Training:   0%|          | 0/50 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/50 [00:01<01:19,  1.62s/it][A
Training:   8%|▊         | 4/50 [00:01<00:15,  2.98it/s][A
Training:  12%|█▏        | 6/50 [00:02<00:19,  2.28it/s][A
Training:  18%|█▊        | 9/50 [00:04<00:16,  2.42it/s][A
Training:  26%|██▌       | 13/50 [00:05<00:12,  2.90it/s][A
Training:  34%|███▍      | 17/50 [00:06<00:10,  3.09it/s][A
Training:  42%|████▏     | 21/50 [00:07<00:08,  3.35it/s][A
Training:  50%|█████     | 25/50 [00:08<00:07,  3.35it/s][A
Training:  58%|█████▊    | 29/50 [00:09<00:06,  3.32it/s][A
Training:  64%|██████▍   | 32/50 [00:09<00:04,  4.31it/s][A
Training:  68%|██████▊   | 34/50 [00:10<00:04,  3.34it/s][A
Training:  74%|███████▍  | 37/50 [00:12<00:04,  3.17it/s][A
Training:  80%|████████  | 40/50 [00:12<00:02,  4.29it/s][A
Training:  84%|████████▍ | 42/50 [00:13<00:02,  3.28it/s][A
Training:  90%|█████████ | 45/50 [00:14<00:01,  3.16it/s][A
Training:  96%|█████████▌| 48/50 [00

Epoch: 64/72 - Loss: 23.6954 - Accuracy: 0.9536



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:09,  1.58s/it][A
 71%|███████▏  | 5/7 [00:02<00:00,  2.20it/s][A
100%|██████████| 7/7 [00:02<00:00,  2.50it/s][A
Epochs:  89%|████████▉ | 64/72 [20:31<02:32, 19.05s/it]

Val Loss: 37.5711 - Val Accuracy: 0.9529



Training:   0%|          | 0/50 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/50 [00:01<01:17,  1.59s/it][A
Training:   6%|▌         | 3/50 [00:01<00:21,  2.22it/s][A
Training:  10%|█         | 5/50 [00:02<00:24,  1.83it/s][A
Training:  16%|█▌        | 8/50 [00:03<00:11,  3.56it/s][A
Training:  20%|██        | 10/50 [00:04<00:15,  2.57it/s][A
Training:  26%|██▌       | 13/50 [00:05<00:13,  2.70it/s][A
Training:  28%|██▊       | 14/50 [00:05<00:12,  2.96it/s][A
Training:  34%|███▍      | 17/50 [00:06<00:10,  3.11it/s][A
Training:  36%|███▌      | 18/50 [00:06<00:09,  3.38it/s][A
Training:  42%|████▏     | 21/50 [00:07<00:08,  3.22it/s][A
Training:  44%|████▍     | 22/50 [00:07<00:07,  3.56it/s][A
Training:  48%|████▊     | 24/50 [00:07<00:05,  4.75it/s][A
Training:  50%|█████     | 25/50 [00:08<00:09,  2.69it/s][A
Training:  58%|█████▊    | 29/50 [00:10<00:07,  2.90it/s][A
Training:  64%|██████▍   | 32/50 [00:10<00:04,  4.24it/s][A
Training:  68%|██████▊   | 34/50 [00

Epoch: 65/72 - Loss: 21.0230 - Accuracy: 0.9584



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:09,  1.52s/it][A
 43%|████▎     | 3/7 [00:01<00:01,  2.31it/s][A
100%|██████████| 7/7 [00:02<00:00,  2.62it/s][A
Epochs:  90%|█████████ | 65/72 [20:50<02:12, 18.94s/it]

Val Loss: 31.8692 - Val Accuracy: 0.9473



Training:   0%|          | 0/50 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/50 [00:01<01:13,  1.50s/it][A
Training:  10%|█         | 5/50 [00:02<00:22,  2.05it/s][A
Training:  18%|█▊        | 9/50 [00:03<00:15,  2.70it/s][A
Training:  22%|██▏       | 11/50 [00:03<00:11,  3.52it/s][A
Training:  26%|██▌       | 13/50 [00:05<00:13,  2.67it/s][A
Training:  34%|███▍      | 17/50 [00:06<00:10,  3.10it/s][A
Training:  36%|███▌      | 18/50 [00:06<00:09,  3.40it/s][A
Training:  42%|████▏     | 21/50 [00:07<00:09,  3.10it/s][A
Training:  48%|████▊     | 24/50 [00:07<00:05,  4.46it/s][A
Training:  52%|█████▏    | 26/50 [00:08<00:07,  3.29it/s][A
Training:  56%|█████▌    | 28/50 [00:08<00:05,  4.20it/s][A
Training:  60%|██████    | 30/50 [00:09<00:06,  3.01it/s][A
Training:  66%|██████▌   | 33/50 [00:11<00:05,  2.92it/s][A
Training:  74%|███████▍  | 37/50 [00:12<00:04,  3.03it/s][A
Training:  82%|████████▏ | 41/50 [00:13<00:02,  3.13it/s][A
Training:  88%|████████▊ | 44/50 [0

Epoch: 66/72 - Loss: 20.4407 - Accuracy: 0.9585



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:09,  1.50s/it][A
 57%|█████▋    | 4/7 [00:01<00:00,  3.17it/s][A
100%|██████████| 7/7 [00:02<00:00,  2.64it/s][A
Epochs:  92%|█████████▏| 66/72 [21:08<01:53, 18.84s/it]

Val Loss: 31.2941 - Val Accuracy: 0.9485



Training:   0%|          | 0/50 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/50 [00:01<01:18,  1.60s/it][A
Training:   6%|▌         | 3/50 [00:01<00:21,  2.17it/s][A
Training:  10%|█         | 5/50 [00:02<00:23,  1.94it/s][A
Training:  14%|█▍        | 7/50 [00:02<00:13,  3.10it/s][A
Training:  18%|█▊        | 9/50 [00:04<00:16,  2.47it/s][A
Training:  24%|██▍       | 12/50 [00:04<00:09,  4.13it/s][A
Training:  28%|██▊       | 14/50 [00:05<00:11,  3.06it/s][A
Training:  34%|███▍      | 17/50 [00:06<00:10,  3.07it/s][A
Training:  42%|████▏     | 21/50 [00:07<00:09,  3.17it/s][A
Training:  46%|████▌     | 23/50 [00:07<00:06,  3.94it/s][A
Training:  50%|█████     | 25/50 [00:08<00:08,  2.97it/s][A
Training:  56%|█████▌    | 28/50 [00:08<00:05,  4.32it/s][A
Training:  60%|██████    | 30/50 [00:09<00:06,  3.15it/s][A
Training:  66%|██████▌   | 33/50 [00:11<00:05,  2.92it/s][A
Training:  72%|███████▏  | 36/50 [00:11<00:03,  4.10it/s][A
Training:  76%|███████▌  | 38/50 [00:

Epoch: 67/72 - Loss: 22.5914 - Accuracy: 0.9559



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:08,  1.47s/it][A
100%|██████████| 7/7 [00:02<00:00,  2.65it/s][A
Epochs:  93%|█████████▎| 67/72 [21:27<01:33, 18.72s/it]

Val Loss: 44.9633 - Val Accuracy: 0.9325



Training:   0%|          | 0/50 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/50 [00:01<01:15,  1.55s/it][A
Training:   8%|▊         | 4/50 [00:01<00:15,  3.03it/s][A
Training:  12%|█▏        | 6/50 [00:02<00:17,  2.46it/s][A
Training:  18%|█▊        | 9/50 [00:03<00:15,  2.62it/s][A
Training:  24%|██▍       | 12/50 [00:03<00:09,  4.14it/s][A
Training:  28%|██▊       | 14/50 [00:04<00:11,  3.06it/s][A
Training:  34%|███▍      | 17/50 [00:05<00:10,  3.05it/s][A
Training:  38%|███▊      | 19/50 [00:06<00:08,  3.85it/s][A
Training:  42%|████▏     | 21/50 [00:07<00:09,  2.94it/s][A
Training:  46%|████▌     | 23/50 [00:07<00:07,  3.83it/s][A
Training:  50%|█████     | 25/50 [00:08<00:08,  2.91it/s][A
Training:  54%|█████▍    | 27/50 [00:08<00:06,  3.79it/s][A
Training:  58%|█████▊    | 29/50 [00:09<00:06,  3.02it/s][A
Training:  62%|██████▏   | 31/50 [00:09<00:05,  3.63it/s][A
Training:  66%|██████▌   | 33/50 [00:10<00:05,  3.07it/s][A
Training:  70%|███████   | 35/50 [00

Epoch: 68/72 - Loss: 28.7282 - Accuracy: 0.9528



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:08,  1.45s/it][A
 43%|████▎     | 3/7 [00:01<00:01,  2.36it/s][A
100%|██████████| 7/7 [00:02<00:00,  2.59it/s][A
Epochs:  94%|█████████▍| 68/72 [21:45<01:14, 18.51s/it]

Val Loss: 44.7110 - Val Accuracy: 0.9487



Training:   0%|          | 0/50 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/50 [00:01<01:14,  1.52s/it][A
Training:   6%|▌         | 3/50 [00:01<00:20,  2.32it/s][A
Training:  10%|█         | 5/50 [00:02<00:22,  2.04it/s][A
Training:  14%|█▍        | 7/50 [00:02<00:13,  3.27it/s][A
Training:  18%|█▊        | 9/50 [00:03<00:16,  2.54it/s][A
Training:  22%|██▏       | 11/50 [00:04<00:10,  3.64it/s][A
Training:  26%|██▌       | 13/50 [00:05<00:13,  2.82it/s][A
Training:  30%|███       | 15/50 [00:05<00:09,  3.88it/s][A
Training:  34%|███▍      | 17/50 [00:06<00:11,  3.00it/s][A
Training:  36%|███▌      | 18/50 [00:06<00:09,  3.24it/s][A
Training:  40%|████      | 20/50 [00:06<00:06,  4.46it/s][A
Training:  44%|████▍     | 22/50 [00:07<00:09,  3.05it/s][A
Training:  50%|█████     | 25/50 [00:08<00:08,  2.94it/s][A
Training:  52%|█████▏    | 26/50 [00:08<00:07,  3.30it/s][A
Training:  58%|█████▊    | 29/50 [00:09<00:07,  2.98it/s][A
Training:  60%|██████    | 30/50 [00:

Epoch: 69/72 - Loss: 32.3011 - Accuracy: 0.9574



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:09,  1.55s/it][A
 29%|██▊       | 2/7 [00:01<00:03,  1.39it/s][A
 71%|███████▏  | 5/7 [00:02<00:00,  2.39it/s][A
100%|██████████| 7/7 [00:02<00:00,  2.47it/s][A
Epochs:  96%|█████████▌| 69/72 [22:03<00:55, 18.56s/it]

Val Loss: 52.9010 - Val Accuracy: 0.9494



Training:   0%|          | 0/50 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/50 [00:01<01:14,  1.52s/it][A
Training:   8%|▊         | 4/50 [00:01<00:14,  3.16it/s][A
Training:  12%|█▏        | 6/50 [00:02<00:18,  2.41it/s][A
Training:  18%|█▊        | 9/50 [00:03<00:16,  2.56it/s][A
Training:  20%|██        | 10/50 [00:03<00:13,  2.95it/s][A
Training:  26%|██▌       | 13/50 [00:04<00:12,  2.94it/s][A
Training:  30%|███       | 15/50 [00:05<00:08,  3.90it/s][A
Training:  34%|███▍      | 17/50 [00:06<00:11,  2.89it/s][A
Training:  36%|███▌      | 18/50 [00:06<00:09,  3.23it/s][A
Training:  42%|████▏     | 21/50 [00:07<00:09,  3.15it/s][A
Training:  44%|████▍     | 22/50 [00:07<00:08,  3.35it/s][A
Training:  50%|█████     | 25/50 [00:08<00:07,  3.21it/s][A
Training:  52%|█████▏    | 26/50 [00:08<00:07,  3.40it/s][A
Training:  58%|█████▊    | 29/50 [00:09<00:06,  3.30it/s][A
Training:  60%|██████    | 30/50 [00:09<00:05,  3.52it/s][A
Training:  66%|██████▌   | 33/50 [00

Epoch: 70/72 - Loss: 25.6876 - Accuracy: 0.9578



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:09,  1.54s/it][A
100%|██████████| 7/7 [00:02<00:00,  2.50it/s][A
Epochs:  97%|█████████▋| 70/72 [22:22<00:37, 18.52s/it]

Val Loss: 37.2443 - Val Accuracy: 0.9436



Training:   0%|          | 0/50 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/50 [00:01<01:11,  1.47s/it][A
Training:  10%|█         | 5/50 [00:02<00:21,  2.08it/s][A
Training:  14%|█▍        | 7/50 [00:02<00:14,  3.07it/s][A
Training:  18%|█▊        | 9/50 [00:03<00:15,  2.72it/s][A
Training:  26%|██▌       | 13/50 [00:04<00:11,  3.12it/s][A
Training:  28%|██▊       | 14/50 [00:04<00:10,  3.48it/s][A
Training:  32%|███▏      | 16/50 [00:05<00:07,  4.58it/s][A
Training:  34%|███▍      | 17/50 [00:06<00:11,  2.77it/s][A
Training:  36%|███▌      | 18/50 [00:06<00:10,  3.10it/s][A
Training:  42%|████▏     | 21/50 [00:07<00:09,  2.96it/s][A
Training:  44%|████▍     | 22/50 [00:07<00:08,  3.31it/s][A
Training:  48%|████▊     | 24/50 [00:07<00:05,  4.60it/s][A
Training:  50%|█████     | 25/50 [00:08<00:08,  2.89it/s][A
Training:  52%|█████▏    | 26/50 [00:08<00:07,  3.25it/s][A
Training:  58%|█████▊    | 29/50 [00:09<00:06,  3.25it/s][A
Training:  60%|██████    | 30/50 [00

Epoch: 71/72 - Loss: 23.9052 - Accuracy: 0.9595



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:09,  1.52s/it][A
100%|██████████| 7/7 [00:02<00:00,  2.58it/s][A
Epochs:  99%|█████████▊| 71/72 [22:40<00:18, 18.44s/it]

Val Loss: 35.9335 - Val Accuracy: 0.9477



Training:   0%|          | 0/50 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/50 [00:01<01:06,  1.37s/it][A
Training:   6%|▌         | 3/50 [00:01<00:18,  2.52it/s][A
Training:  10%|█         | 5/50 [00:02<00:21,  2.11it/s][A
Training:  14%|█▍        | 7/50 [00:02<00:12,  3.36it/s][A
Training:  18%|█▊        | 9/50 [00:03<00:14,  2.77it/s][A
Training:  24%|██▍       | 12/50 [00:03<00:08,  4.65it/s][A
Training:  28%|██▊       | 14/50 [00:04<00:11,  3.15it/s][A
Training:  32%|███▏      | 16/50 [00:04<00:08,  4.17it/s][A
Training:  36%|███▌      | 18/50 [00:06<00:10,  3.05it/s][A
Training:  40%|████      | 20/50 [00:06<00:07,  4.08it/s][A
Training:  44%|████▍     | 22/50 [00:07<00:09,  3.01it/s][A
Training:  48%|████▊     | 24/50 [00:07<00:06,  3.95it/s][A
Training:  52%|█████▏    | 26/50 [00:08<00:07,  3.12it/s][A
Training:  56%|█████▌    | 28/50 [00:08<00:05,  4.05it/s][A
Training:  58%|█████▊    | 29/50 [00:09<00:07,  2.63it/s][A
Training:  62%|██████▏   | 31/50 [00:

Epoch: 72/72 - Loss: 25.0053 - Accuracy: 0.9607



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:01<00:09,  1.53s/it][A
 43%|████▎     | 3/7 [00:01<00:01,  2.30it/s][A
100%|██████████| 7/7 [00:02<00:00,  2.60it/s][A
Epochs: 100%|██████████| 72/72 [22:59<00:00, 19.16s/it]


Val Loss: 33.7485 - Val Accuracy: 0.9487
Saving best model...


[32m[I 2023-12-11 23:21:47,220][0m Trial 0 finished with value: 0.9486914873123169 and parameters: {'learning_rate': 0.05870926873283856, 'weight_decay': 0.0001579889011773346, 'epsilon': 1.6867250271368622e-08, 'batch_size': 282, 'epochs': 72}. Best is trial 0 with value: 0.9486914873123169.[0m


Learning rate: 0.0008919924301837155
Weight decay: 0.00010220890304481278
Epsilon: 2.3380831337579294e-09
Batch size: 78
Number of epochs: 55


Epochs:   0%|          | 0/55 [00:00<?, ?it/s]
Training:   0%|          | 0/180 [00:00<?, ?it/s][A
Training:   1%|          | 1/180 [00:00<01:27,  2.05it/s][A
Training:   3%|▎         | 5/180 [00:00<00:23,  7.54it/s][A
Training:   5%|▌         | 9/180 [00:01<00:18,  9.24it/s][A
Training:   7%|▋         | 13/180 [00:01<00:15, 10.75it/s][A
Training:   8%|▊         | 15/180 [00:01<00:13, 11.92it/s][A
Training:   9%|▉         | 17/180 [00:01<00:14, 10.88it/s][A
Training:  11%|█         | 19/180 [00:01<00:13, 11.62it/s][A
Training:  12%|█▏        | 21/180 [00:02<00:13, 11.48it/s][A
Training:  13%|█▎        | 23/180 [00:02<00:13, 11.28it/s][A
Training:  14%|█▍        | 25/180 [00:02<00:13, 11.85it/s][A
Training:  15%|█▌        | 27/180 [00:02<00:13, 11.63it/s][A
Training:  17%|█▋        | 30/180 [00:02<00:10, 13.88it/s][A
Training:  18%|█▊        | 32/180 [00:02<00:11, 13.22it/s][A
Training:  19%|█▉        | 34/180 [00:03<00:10, 13.38it/s][A
Training:  20%|██        | 36/180 [

Epoch: 1/55 - Loss: 0.2032 - Accuracy: 0.9238



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:12,  1.71it/s][A
 22%|██▏       | 5/23 [00:00<00:02,  6.93it/s][A
 30%|███       | 7/23 [00:00<00:01,  9.15it/s][A
 39%|███▉      | 9/23 [00:01<00:01,  8.34it/s][A
 57%|█████▋    | 13/23 [00:01<00:01,  9.85it/s][A
 74%|███████▍  | 17/23 [00:01<00:00, 10.69it/s][A
100%|██████████| 23/23 [00:02<00:00,  9.87it/s][A
Epochs:   2%|▏         | 1/55 [00:17<16:03, 17.85s/it]

Val Loss: 0.1223 - Val Accuracy: 0.9544



Training:   0%|          | 0/180 [00:00<?, ?it/s][A
Training:   1%|          | 1/180 [00:00<01:39,  1.80it/s][A
Training:   3%|▎         | 5/180 [00:00<00:26,  6.65it/s][A
Training:   5%|▌         | 9/180 [00:01<00:18,  9.42it/s][A
Training:   7%|▋         | 13/180 [00:01<00:15, 10.65it/s][A
Training:   9%|▉         | 17/180 [00:01<00:15, 10.81it/s][A
Training:  12%|█▏        | 21/180 [00:02<00:14, 10.69it/s][A
Training:  14%|█▍        | 25/180 [00:02<00:14, 11.02it/s][A
Training:  16%|█▌        | 29/180 [00:02<00:13, 11.45it/s][A
Training:  18%|█▊        | 33/180 [00:03<00:12, 11.80it/s][A
Training:  21%|██        | 37/180 [00:03<00:11, 12.01it/s][A
Training:  23%|██▎       | 41/180 [00:03<00:11, 12.55it/s][A
Training:  25%|██▌       | 45/180 [00:04<00:10, 12.80it/s][A
Training:  27%|██▋       | 49/180 [00:04<00:10, 12.33it/s][A
Training:  29%|██▉       | 53/180 [00:04<00:10, 12.30it/s][A
Training:  32%|███▏      | 57/180 [00:05<00:09, 12.36it/s][A
Training:  34%|███▍

Epoch: 2/55 - Loss: 0.1273 - Accuracy: 0.9553



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:14,  1.53it/s][A
 22%|██▏       | 5/23 [00:00<00:02,  6.26it/s][A
 39%|███▉      | 9/23 [00:01<00:01,  8.44it/s][A
 57%|█████▋    | 13/23 [00:01<00:01,  9.64it/s][A
 74%|███████▍  | 17/23 [00:01<00:00, 10.58it/s][A
100%|██████████| 23/23 [00:02<00:00,  9.67it/s][A
Epochs:   4%|▎         | 2/55 [00:35<15:42, 17.77s/it]

Val Loss: 0.1510 - Val Accuracy: 0.9504



Training:   0%|          | 0/180 [00:00<?, ?it/s][A
Training:   1%|          | 1/180 [00:00<01:51,  1.61it/s][A
Training:   3%|▎         | 5/180 [00:00<00:27,  6.27it/s][A
Training:   5%|▌         | 9/180 [00:01<00:20,  8.42it/s][A
Training:   7%|▋         | 13/180 [00:01<00:16, 10.42it/s][A
Training:   9%|▉         | 17/180 [00:01<00:14, 11.23it/s][A
Training:  12%|█▏        | 21/180 [00:02<00:14, 11.36it/s][A
Training:  13%|█▎        | 24/180 [00:02<00:11, 13.56it/s][A
Training:  14%|█▍        | 26/180 [00:02<00:13, 11.69it/s][A
Training:  16%|█▌        | 29/180 [00:02<00:12, 11.64it/s][A
Training:  17%|█▋        | 31/180 [00:02<00:11, 12.84it/s][A
Training:  18%|█▊        | 33/180 [00:03<00:12, 11.34it/s][A
Training:  20%|██        | 36/180 [00:03<00:11, 13.01it/s][A
Training:  21%|██        | 38/180 [00:03<00:11, 12.10it/s][A
Training:  23%|██▎       | 41/180 [00:03<00:11, 11.77it/s][A
Training:  24%|██▍       | 44/180 [00:03<00:09, 14.51it/s][A
Training:  26%|██▌ 

Epoch: 3/55 - Loss: 0.1143 - Accuracy: 0.9567



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:11,  1.96it/s][A
 22%|██▏       | 5/23 [00:00<00:02,  6.36it/s][A
 35%|███▍      | 8/23 [00:00<00:01, 10.09it/s][A
 43%|████▎     | 10/23 [00:01<00:01,  9.21it/s][A
 57%|█████▋    | 13/23 [00:01<00:01,  9.30it/s][A
 70%|██████▉   | 16/23 [00:01<00:00, 11.64it/s][A
 78%|███████▊  | 18/23 [00:01<00:00, 11.03it/s][A
 87%|████████▋ | 20/23 [00:02<00:00, 11.57it/s][A
100%|██████████| 23/23 [00:02<00:00,  9.92it/s][A
Epochs:   5%|▌         | 3/55 [00:53<15:20, 17.69s/it]

Val Loss: 0.1089 - Val Accuracy: 0.9602



Training:   0%|          | 0/180 [00:00<?, ?it/s][A
Training:   1%|          | 1/180 [00:00<01:48,  1.65it/s][A
Training:   3%|▎         | 5/180 [00:00<00:27,  6.47it/s][A
Training:   5%|▌         | 9/180 [00:01<00:19,  8.70it/s][A
Training:   7%|▋         | 13/180 [00:01<00:16, 10.20it/s][A
Training:   9%|▉         | 17/180 [00:01<00:15, 10.70it/s][A
Training:  12%|█▏        | 21/180 [00:02<00:13, 11.44it/s][A
Training:  14%|█▍        | 25/180 [00:02<00:14, 11.00it/s][A
Training:  16%|█▌        | 29/180 [00:02<00:13, 11.38it/s][A
Training:  18%|█▊        | 33/180 [00:03<00:12, 11.33it/s][A
Training:  21%|██        | 37/180 [00:03<00:12, 11.34it/s][A
Training:  23%|██▎       | 41/180 [00:03<00:12, 11.45it/s][A
Training:  25%|██▌       | 45/180 [00:04<00:11, 12.17it/s][A
Training:  27%|██▋       | 48/180 [00:04<00:09, 13.96it/s][A
Training:  28%|██▊       | 50/180 [00:04<00:10, 12.11it/s][A
Training:  29%|██▉       | 53/180 [00:04<00:10, 12.01it/s][A
Training:  32%|███▏

Epoch: 4/55 - Loss: 0.1063 - Accuracy: 0.9616



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:10,  2.03it/s][A
 22%|██▏       | 5/23 [00:00<00:02,  7.24it/s][A
 30%|███       | 7/23 [00:00<00:01,  9.26it/s][A
 39%|███▉      | 9/23 [00:01<00:01,  8.77it/s][A
 57%|█████▋    | 13/23 [00:01<00:01,  9.83it/s][A
 74%|███████▍  | 17/23 [00:01<00:00, 10.76it/s][A
100%|██████████| 23/23 [00:02<00:00, 10.04it/s][A
Epochs:   7%|▋         | 4/55 [01:10<15:03, 17.71s/it]

Val Loss: 0.1071 - Val Accuracy: 0.9552



Training:   0%|          | 0/180 [00:00<?, ?it/s][A
Training:   1%|          | 1/180 [00:00<01:42,  1.75it/s][A
Training:   3%|▎         | 5/180 [00:00<00:27,  6.45it/s][A
Training:   5%|▌         | 9/180 [00:01<00:20,  8.35it/s][A
Training:   7%|▋         | 13/180 [00:01<00:18,  9.07it/s][A
Training:   9%|▉         | 17/180 [00:01<00:16, 10.10it/s][A
Training:  12%|█▏        | 21/180 [00:02<00:15, 10.49it/s][A
Training:  14%|█▍        | 25/180 [00:02<00:13, 11.30it/s][A
Training:  16%|█▌        | 29/180 [00:02<00:12, 12.19it/s][A
Training:  18%|█▊        | 33/180 [00:03<00:12, 11.83it/s][A
Training:  21%|██        | 37/180 [00:03<00:11, 12.01it/s][A
Training:  23%|██▎       | 41/180 [00:03<00:11, 12.13it/s][A
Training:  25%|██▌       | 45/180 [00:04<00:11, 12.08it/s][A
Training:  27%|██▋       | 49/180 [00:04<00:10, 12.36it/s][A
Training:  29%|██▉       | 53/180 [00:04<00:10, 12.66it/s][A
Training:  32%|███▏      | 57/180 [00:05<00:09, 13.44it/s][A
Training:  34%|███▍

Epoch: 5/55 - Loss: 0.1069 - Accuracy: 0.9600



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:12,  1.69it/s][A
 22%|██▏       | 5/23 [00:00<00:02,  6.26it/s][A
 39%|███▉      | 9/23 [00:01<00:01,  8.36it/s][A
 57%|█████▋    | 13/23 [00:01<00:01,  9.95it/s][A
 70%|██████▉   | 16/23 [00:01<00:00, 12.62it/s][A
 78%|███████▊  | 18/23 [00:01<00:00, 10.70it/s][A
 91%|█████████▏| 21/23 [00:02<00:00, 11.57it/s][A
100%|██████████| 23/23 [00:02<00:00,  9.63it/s][A
Epochs:   9%|▉         | 5/55 [01:28<14:46, 17.72s/it]

Val Loss: 0.1114 - Val Accuracy: 0.9569



Training:   0%|          | 0/180 [00:00<?, ?it/s][A
Training:   1%|          | 1/180 [00:00<01:52,  1.59it/s][A
Training:   3%|▎         | 5/180 [00:00<00:29,  6.01it/s][A
Training:   5%|▌         | 9/180 [00:01<00:20,  8.24it/s][A
Training:   7%|▋         | 13/180 [00:01<00:17,  9.37it/s][A
Training:   9%|▉         | 17/180 [00:02<00:16,  9.91it/s][A
Training:  12%|█▏        | 21/180 [00:02<00:15, 10.57it/s][A
Training:  14%|█▍        | 25/180 [00:02<00:14, 10.70it/s][A
Training:  16%|█▌        | 29/180 [00:02<00:12, 11.73it/s][A
Training:  18%|█▊        | 33/180 [00:03<00:12, 11.79it/s][A
Training:  21%|██        | 37/180 [00:03<00:12, 11.81it/s][A
Training:  23%|██▎       | 41/180 [00:04<00:12, 11.54it/s][A
Training:  25%|██▌       | 45/180 [00:04<00:11, 11.29it/s][A
Training:  27%|██▋       | 49/180 [00:04<00:11, 11.38it/s][A
Training:  29%|██▉       | 53/180 [00:05<00:10, 12.07it/s][A
Training:  32%|███▏      | 57/180 [00:05<00:09, 13.21it/s][A
Training:  34%|███▍

Epoch: 6/55 - Loss: 0.1000 - Accuracy: 0.9630



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:12,  1.81it/s][A
 22%|██▏       | 5/23 [00:00<00:02,  6.49it/s][A
 39%|███▉      | 9/23 [00:01<00:01,  8.45it/s][A
 57%|█████▋    | 13/23 [00:01<00:01,  9.79it/s][A
 74%|███████▍  | 17/23 [00:01<00:00, 10.83it/s][A
100%|██████████| 23/23 [00:02<00:00,  9.91it/s][A
Epochs:  11%|█         | 6/55 [01:46<14:28, 17.72s/it]

Val Loss: 0.1096 - Val Accuracy: 0.9570



Training:   0%|          | 0/180 [00:00<?, ?it/s][A
Training:   1%|          | 1/180 [00:00<01:37,  1.83it/s][A
Training:   3%|▎         | 5/180 [00:00<00:26,  6.60it/s][A
Training:   5%|▌         | 9/180 [00:01<00:20,  8.38it/s][A
Training:   7%|▋         | 13/180 [00:01<00:17,  9.64it/s][A
Training:   9%|▉         | 17/180 [00:01<00:15, 10.21it/s][A
Training:  12%|█▏        | 21/180 [00:02<00:14, 10.83it/s][A
Training:  14%|█▍        | 25/180 [00:02<00:13, 11.22it/s][A
Training:  16%|█▌        | 29/180 [00:02<00:12, 11.79it/s][A
Training:  18%|█▊        | 33/180 [00:03<00:12, 12.19it/s][A
Training:  21%|██        | 37/180 [00:03<00:11, 12.76it/s][A
Training:  23%|██▎       | 41/180 [00:03<00:11, 12.60it/s][A
Training:  25%|██▌       | 45/180 [00:04<00:11, 12.04it/s][A
Training:  27%|██▋       | 49/180 [00:04<00:10, 12.05it/s][A
Training:  29%|██▉       | 53/180 [00:04<00:10, 12.00it/s][A
Training:  32%|███▏      | 57/180 [00:05<00:10, 12.11it/s][A
Training:  34%|███▍

Epoch: 7/55 - Loss: 0.0984 - Accuracy: 0.9630



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:13,  1.66it/s][A
 22%|██▏       | 5/23 [00:00<00:02,  6.39it/s][A
 39%|███▉      | 9/23 [00:01<00:01,  8.20it/s][A
 57%|█████▋    | 13/23 [00:01<00:01,  9.51it/s][A
 74%|███████▍  | 17/23 [00:01<00:00, 10.52it/s][A
 91%|█████████▏| 21/23 [00:02<00:00, 11.53it/s][A
100%|██████████| 23/23 [00:02<00:00,  9.50it/s][A
Epochs:  13%|█▎        | 7/55 [02:03<14:07, 17.66s/it]

Val Loss: 0.1203 - Val Accuracy: 0.9678



Training:   0%|          | 0/180 [00:00<?, ?it/s][A
Training:   1%|          | 1/180 [00:00<01:25,  2.08it/s][A
Training:   2%|▏         | 4/180 [00:00<00:20,  8.43it/s][A
Training:   3%|▎         | 6/180 [00:00<00:22,  7.76it/s][A
Training:   5%|▌         | 9/180 [00:01<00:18,  9.17it/s][A
Training:   6%|▌         | 11/180 [00:01<00:15, 10.83it/s][A
Training:   7%|▋         | 13/180 [00:01<00:17,  9.79it/s][A
Training:   9%|▉         | 16/180 [00:01<00:12, 13.18it/s][A
Training:  10%|█         | 18/180 [00:01<00:15, 10.25it/s][A
Training:  12%|█▏        | 21/180 [00:02<00:15,  9.97it/s][A
Training:  14%|█▍        | 25/180 [00:02<00:15, 10.29it/s][A
Training:  16%|█▌        | 29/180 [00:02<00:13, 10.88it/s][A
Training:  18%|█▊        | 33/180 [00:03<00:13, 11.21it/s][A
Training:  19%|█▉        | 35/180 [00:03<00:12, 12.01it/s][A
Training:  21%|██        | 37/180 [00:03<00:12, 11.17it/s][A
Training:  23%|██▎       | 41/180 [00:03<00:11, 12.12it/s][A
Training:  24%|██▍  

Epoch: 8/55 - Loss: 0.0959 - Accuracy: 0.9651



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:12,  1.80it/s][A
 22%|██▏       | 5/23 [00:00<00:02,  6.18it/s][A
 39%|███▉      | 9/23 [00:01<00:01,  8.45it/s][A
 57%|█████▋    | 13/23 [00:01<00:01,  9.88it/s][A
 74%|███████▍  | 17/23 [00:01<00:00, 10.70it/s][A
100%|██████████| 23/23 [00:02<00:00,  9.90it/s][A
Epochs:  15%|█▍        | 8/55 [02:21<13:49, 17.65s/it]

Val Loss: 0.1234 - Val Accuracy: 0.9541



Training:   0%|          | 0/180 [00:00<?, ?it/s][A
Training:   1%|          | 1/180 [00:00<01:35,  1.87it/s][A
Training:   1%|          | 2/180 [00:00<00:52,  3.38it/s][A
Training:   3%|▎         | 5/180 [00:00<00:23,  7.51it/s][A
Training:   3%|▎         | 6/180 [00:00<00:22,  7.83it/s][A
Training:   5%|▌         | 9/180 [00:01<00:18,  9.45it/s][A
Training:   7%|▋         | 13/180 [00:01<00:15, 10.62it/s][A
Training:   9%|▉         | 17/180 [00:01<00:15, 10.47it/s][A
Training:  12%|█▏        | 21/180 [00:02<00:15, 10.16it/s][A
Training:  14%|█▍        | 25/180 [00:02<00:14, 10.93it/s][A
Training:  16%|█▌        | 29/180 [00:02<00:12, 11.66it/s][A
Training:  18%|█▊        | 33/180 [00:03<00:12, 11.76it/s][A
Training:  21%|██        | 37/180 [00:03<00:12, 11.88it/s][A
Training:  23%|██▎       | 41/180 [00:03<00:11, 11.72it/s][A
Training:  25%|██▌       | 45/180 [00:04<00:11, 11.69it/s][A
Training:  27%|██▋       | 49/180 [00:04<00:11, 11.80it/s][A
Training:  29%|██▉   

Epoch: 9/55 - Loss: 0.0918 - Accuracy: 0.9644



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:13,  1.67it/s][A
 22%|██▏       | 5/23 [00:00<00:02,  6.18it/s][A
 39%|███▉      | 9/23 [00:01<00:01,  8.36it/s][A
 57%|█████▋    | 13/23 [00:01<00:01,  9.26it/s][A
 74%|███████▍  | 17/23 [00:02<00:00,  9.81it/s][A
100%|██████████| 23/23 [00:02<00:00,  9.39it/s][A
Epochs:  16%|█▋        | 9/55 [02:39<13:32, 17.66s/it]

Val Loss: 0.1101 - Val Accuracy: 0.9613



Training:   0%|          | 0/180 [00:00<?, ?it/s][A
Training:   1%|          | 1/180 [00:00<01:38,  1.81it/s][A
Training:   3%|▎         | 5/180 [00:00<00:26,  6.57it/s][A
Training:   5%|▌         | 9/180 [00:01<00:21,  8.00it/s][A
Training:   7%|▋         | 13/180 [00:01<00:17,  9.67it/s][A
Training:   9%|▉         | 17/180 [00:01<00:15, 10.76it/s][A
Training:  11%|█         | 20/180 [00:02<00:12, 12.99it/s][A
Training:  12%|█▏        | 22/180 [00:02<00:15, 10.39it/s][A
Training:  14%|█▍        | 25/180 [00:02<00:15, 10.07it/s][A
Training:  16%|█▌        | 29/180 [00:02<00:13, 10.81it/s][A
Training:  18%|█▊        | 33/180 [00:03<00:12, 11.38it/s][A
Training:  21%|██        | 37/180 [00:03<00:12, 11.69it/s][A
Training:  23%|██▎       | 41/180 [00:03<00:11, 11.98it/s][A
Training:  24%|██▍       | 43/180 [00:04<00:10, 12.76it/s][A
Training:  25%|██▌       | 45/180 [00:04<00:11, 11.56it/s][A
Training:  26%|██▌       | 47/180 [00:04<00:10, 12.53it/s][A
Training:  27%|██▋ 

Epoch: 10/55 - Loss: 0.0925 - Accuracy: 0.9649



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:11,  1.94it/s][A
 22%|██▏       | 5/23 [00:00<00:02,  6.63it/s][A
 39%|███▉      | 9/23 [00:01<00:01,  9.12it/s][A
 57%|█████▋    | 13/23 [00:01<00:00, 10.12it/s][A
 74%|███████▍  | 17/23 [00:01<00:00, 10.89it/s][A
 83%|████████▎ | 19/23 [00:01<00:00, 11.53it/s][A
100%|██████████| 23/23 [00:02<00:00, 10.14it/s][A
Epochs:  18%|█▊        | 10/55 [02:56<13:10, 17.58s/it]

Val Loss: 0.1320 - Val Accuracy: 0.9569



Training:   0%|          | 0/180 [00:00<?, ?it/s][A
Training:   1%|          | 1/180 [00:00<01:37,  1.83it/s][A
Training:   3%|▎         | 5/180 [00:00<00:28,  6.22it/s][A
Training:   5%|▌         | 9/180 [00:01<00:21,  7.92it/s][A
Training:   7%|▋         | 13/180 [00:01<00:17,  9.34it/s][A
Training:   9%|▉         | 17/180 [00:01<00:16, 10.12it/s][A
Training:  12%|█▏        | 21/180 [00:02<00:15, 10.41it/s][A
Training:  14%|█▍        | 25/180 [00:02<00:13, 11.10it/s][A
Training:  16%|█▌        | 29/180 [00:02<00:13, 11.43it/s][A
Training:  18%|█▊        | 32/180 [00:03<00:10, 13.48it/s][A
Training:  19%|█▉        | 34/180 [00:03<00:13, 10.75it/s][A
Training:  21%|██        | 37/180 [00:03<00:12, 11.31it/s][A
Training:  22%|██▏       | 39/180 [00:03<00:11, 12.05it/s][A
Training:  23%|██▎       | 41/180 [00:04<00:12, 11.30it/s][A
Training:  24%|██▍       | 43/180 [00:04<00:11, 11.82it/s][A
Training:  25%|██▌       | 45/180 [00:04<00:11, 12.14it/s][A
Training:  26%|██▌ 

Epoch: 11/55 - Loss: 0.0973 - Accuracy: 0.9640



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:11,  1.96it/s][A
 22%|██▏       | 5/23 [00:00<00:02,  6.98it/s][A
 39%|███▉      | 9/23 [00:01<00:01,  8.74it/s][A
 52%|█████▏    | 12/23 [00:01<00:00, 11.77it/s][A
 61%|██████    | 14/23 [00:01<00:00, 10.86it/s][A
 70%|██████▉   | 16/23 [00:01<00:00, 12.02it/s][A
 78%|███████▊  | 18/23 [00:01<00:00, 11.23it/s][A
 87%|████████▋ | 20/23 [00:01<00:00, 12.74it/s][A
100%|██████████| 23/23 [00:02<00:00, 10.25it/s][A
Epochs:  20%|██        | 11/55 [03:14<12:54, 17.61s/it]

Val Loss: 0.1136 - Val Accuracy: 0.9563



Training:   0%|          | 0/180 [00:00<?, ?it/s][A
Training:   1%|          | 1/180 [00:00<01:41,  1.76it/s][A
Training:   3%|▎         | 5/180 [00:00<00:27,  6.30it/s][A
Training:   4%|▍         | 7/180 [00:01<00:20,  8.46it/s][A
Training:   5%|▌         | 9/180 [00:01<00:19,  8.57it/s][A
Training:   7%|▋         | 12/180 [00:01<00:13, 12.29it/s][A
Training:   8%|▊         | 14/180 [00:01<00:15, 10.38it/s][A
Training:   9%|▉         | 16/180 [00:01<00:13, 12.08it/s][A
Training:  10%|█         | 18/180 [00:01<00:15, 10.36it/s][A
Training:  12%|█▏        | 21/180 [00:02<00:15, 10.38it/s][A
Training:  13%|█▎        | 23/180 [00:02<00:13, 11.27it/s][A
Training:  14%|█▍        | 25/180 [00:02<00:15, 10.08it/s][A
Training:  15%|█▌        | 27/180 [00:02<00:13, 11.62it/s][A
Training:  16%|█▌        | 29/180 [00:02<00:13, 10.83it/s][A
Training:  17%|█▋        | 31/180 [00:03<00:12, 12.27it/s][A
Training:  18%|█▊        | 33/180 [00:03<00:13, 10.85it/s][A
Training:  19%|█▉   

Epoch: 12/55 - Loss: 0.0903 - Accuracy: 0.9653



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:11,  1.90it/s][A
 17%|█▋        | 4/23 [00:00<00:02,  7.63it/s][A
 26%|██▌       | 6/23 [00:00<00:02,  7.73it/s][A
 39%|███▉      | 9/23 [00:01<00:01,  8.07it/s][A
 57%|█████▋    | 13/23 [00:01<00:01,  9.51it/s][A
 74%|███████▍  | 17/23 [00:01<00:00, 10.51it/s][A
100%|██████████| 23/23 [00:02<00:00, 10.06it/s][A
Epochs:  22%|██▏       | 12/55 [03:31<12:35, 17.57s/it]

Val Loss: 0.1035 - Val Accuracy: 0.9636



Training:   0%|          | 0/180 [00:00<?, ?it/s][A
Training:   1%|          | 1/180 [00:00<01:42,  1.75it/s][A
Training:   3%|▎         | 5/180 [00:00<00:28,  6.22it/s][A
Training:   5%|▌         | 9/180 [00:01<00:20,  8.30it/s][A
Training:   7%|▋         | 13/180 [00:01<00:17,  9.53it/s][A
Training:   9%|▉         | 17/180 [00:01<00:15, 10.28it/s][A
Training:  12%|█▏        | 21/180 [00:02<00:14, 10.62it/s][A
Training:  14%|█▍        | 25/180 [00:02<00:14, 10.37it/s][A
Training:  16%|█▌        | 29/180 [00:03<00:14, 10.68it/s][A
Training:  18%|█▊        | 33/180 [00:03<00:13, 11.02it/s][A
Training:  21%|██        | 37/180 [00:03<00:12, 11.14it/s][A
Training:  23%|██▎       | 41/180 [00:04<00:12, 11.58it/s][A
Training:  25%|██▌       | 45/180 [00:04<00:11, 11.87it/s][A
Training:  27%|██▋       | 49/180 [00:04<00:11, 11.78it/s][A
Training:  29%|██▉       | 53/180 [00:05<00:11, 11.42it/s][A
Training:  32%|███▏      | 57/180 [00:05<00:10, 12.04it/s][A
Training:  34%|███▍

Epoch: 13/55 - Loss: 0.0868 - Accuracy: 0.9674



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:11,  1.98it/s][A
 17%|█▋        | 4/23 [00:00<00:02,  7.72it/s][A
 26%|██▌       | 6/23 [00:00<00:02,  7.38it/s][A
 39%|███▉      | 9/23 [00:01<00:01,  8.07it/s][A
 57%|█████▋    | 13/23 [00:01<00:01,  9.72it/s][A
 74%|███████▍  | 17/23 [00:01<00:00, 10.25it/s][A
100%|██████████| 23/23 [00:02<00:00,  9.91it/s][A
Epochs:  24%|██▎       | 13/55 [03:49<12:15, 17.51s/it]

Val Loss: 0.1238 - Val Accuracy: 0.9559



Training:   0%|          | 0/180 [00:00<?, ?it/s][A
Training:   1%|          | 1/180 [00:00<01:36,  1.85it/s][A
Training:   2%|▏         | 4/180 [00:00<00:23,  7.47it/s][A
Training:   3%|▎         | 6/180 [00:00<00:23,  7.49it/s][A
Training:   5%|▌         | 9/180 [00:01<00:20,  8.46it/s][A
Training:   7%|▋         | 13/180 [00:01<00:16, 10.07it/s][A
Training:   9%|▉         | 17/180 [00:01<00:15, 10.53it/s][A
Training:  11%|█         | 19/180 [00:02<00:13, 11.76it/s][A
Training:  12%|█▏        | 21/180 [00:02<00:14, 10.86it/s][A
Training:  14%|█▍        | 25/180 [00:02<00:13, 11.47it/s][A
Training:  16%|█▌        | 28/180 [00:02<00:10, 13.99it/s][A
Training:  17%|█▋        | 30/180 [00:02<00:13, 10.80it/s][A
Training:  18%|█▊        | 33/180 [00:03<00:12, 11.71it/s][A
Training:  19%|█▉        | 35/180 [00:03<00:12, 11.93it/s][A
Training:  21%|██        | 37/180 [00:03<00:12, 11.23it/s][A
Training:  22%|██▏       | 39/180 [00:03<00:11, 12.53it/s][A
Training:  23%|██▎  

Epoch: 14/55 - Loss: 0.0842 - Accuracy: 0.9692



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:12,  1.70it/s][A
 22%|██▏       | 5/23 [00:00<00:02,  6.09it/s][A
 39%|███▉      | 9/23 [00:01<00:01,  8.08it/s][A
 57%|█████▋    | 13/23 [00:01<00:01,  9.60it/s][A
 70%|██████▉   | 16/23 [00:01<00:00, 12.22it/s][A
 78%|███████▊  | 18/23 [00:02<00:00, 10.13it/s][A
100%|██████████| 23/23 [00:02<00:00,  9.51it/s][A
Epochs:  25%|██▌       | 14/55 [04:06<11:56, 17.48s/it]

Val Loss: 0.1186 - Val Accuracy: 0.9636



Training:   0%|          | 0/180 [00:00<?, ?it/s][A
Training:   1%|          | 1/180 [00:00<01:33,  1.92it/s][A
Training:   3%|▎         | 5/180 [00:00<00:26,  6.73it/s][A
Training:   5%|▌         | 9/180 [00:01<00:20,  8.42it/s][A
Training:   7%|▋         | 13/180 [00:01<00:17,  9.43it/s][A
Training:   9%|▉         | 17/180 [00:01<00:15, 10.20it/s][A
Training:  12%|█▏        | 21/180 [00:02<00:15, 10.42it/s][A
Training:  14%|█▍        | 25/180 [00:02<00:14, 10.68it/s][A
Training:  16%|█▌        | 29/180 [00:02<00:13, 11.32it/s][A
Training:  18%|█▊        | 33/180 [00:03<00:13, 11.27it/s][A
Training:  21%|██        | 37/180 [00:03<00:12, 11.18it/s][A
Training:  23%|██▎       | 41/180 [00:04<00:12, 11.00it/s][A
Training:  25%|██▌       | 45/180 [00:04<00:12, 11.17it/s][A
Training:  27%|██▋       | 49/180 [00:04<00:11, 11.35it/s][A
Training:  29%|██▉       | 53/180 [00:05<00:11, 11.36it/s][A
Training:  32%|███▏      | 57/180 [00:05<00:10, 11.51it/s][A
Training:  34%|███▍

Epoch: 15/55 - Loss: 0.0864 - Accuracy: 0.9685



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:11,  1.98it/s][A
 17%|█▋        | 4/23 [00:00<00:02,  7.85it/s][A
 26%|██▌       | 6/23 [00:00<00:02,  7.28it/s][A
 39%|███▉      | 9/23 [00:01<00:01,  8.38it/s][A
 57%|█████▋    | 13/23 [00:01<00:00, 10.04it/s][A
 70%|██████▉   | 16/23 [00:01<00:00, 12.66it/s][A
 78%|███████▊  | 18/23 [00:01<00:00,  9.94it/s][A
100%|██████████| 23/23 [00:02<00:00,  9.67it/s][A
Epochs:  27%|██▋       | 15/55 [04:24<11:40, 17.51s/it]

Val Loss: 0.1253 - Val Accuracy: 0.9558



Training:   0%|          | 0/180 [00:00<?, ?it/s][A
Training:   1%|          | 1/180 [00:00<01:39,  1.80it/s][A
Training:   3%|▎         | 5/180 [00:00<00:25,  6.73it/s][A
Training:   5%|▌         | 9/180 [00:01<00:19,  8.80it/s][A
Training:   7%|▋         | 12/180 [00:01<00:14, 11.84it/s][A
Training:   8%|▊         | 14/180 [00:01<00:15, 10.40it/s][A
Training:   9%|▉         | 17/180 [00:01<00:17,  9.44it/s][A
Training:  12%|█▏        | 21/180 [00:02<00:15, 10.27it/s][A
Training:  14%|█▍        | 25/180 [00:02<00:13, 11.10it/s][A
Training:  16%|█▌        | 29/180 [00:02<00:12, 11.90it/s][A
Training:  18%|█▊        | 33/180 [00:03<00:13, 11.29it/s][A
Training:  21%|██        | 37/180 [00:03<00:12, 11.82it/s][A
Training:  22%|██▏       | 39/180 [00:03<00:11, 12.41it/s][A
Training:  23%|██▎       | 41/180 [00:03<00:11, 11.91it/s][A
Training:  24%|██▍       | 43/180 [00:04<00:10, 12.81it/s][A
Training:  25%|██▌       | 45/180 [00:04<00:11, 12.00it/s][A
Training:  26%|██▌ 

Epoch: 16/55 - Loss: 0.0866 - Accuracy: 0.9668



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:12,  1.75it/s][A
 22%|██▏       | 5/23 [00:00<00:02,  6.42it/s][A
 39%|███▉      | 9/23 [00:01<00:01,  8.59it/s][A
 57%|█████▋    | 13/23 [00:01<00:01,  9.61it/s][A
 74%|███████▍  | 17/23 [00:01<00:00, 10.40it/s][A
100%|██████████| 23/23 [00:02<00:00,  9.93it/s][A
Epochs:  29%|██▉       | 16/55 [04:41<11:23, 17.52s/it]

Val Loss: 0.1182 - Val Accuracy: 0.9602



Training:   0%|          | 0/180 [00:00<?, ?it/s][A
Training:   1%|          | 1/180 [00:00<01:39,  1.81it/s][A
Training:   2%|▏         | 4/180 [00:00<00:23,  7.51it/s][A
Training:   3%|▎         | 6/180 [00:00<00:23,  7.50it/s][A
Training:   5%|▌         | 9/180 [00:01<00:20,  8.17it/s][A
Training:   7%|▋         | 13/180 [00:01<00:18,  9.24it/s][A
Training:   9%|▉         | 17/180 [00:01<00:16, 10.17it/s][A
Training:  12%|█▏        | 21/180 [00:02<00:14, 10.93it/s][A
Training:  14%|█▍        | 25/180 [00:02<00:13, 11.17it/s][A
Training:  16%|█▌        | 29/180 [00:02<00:13, 11.50it/s][A
Training:  18%|█▊        | 33/180 [00:03<00:13, 11.14it/s][A
Training:  21%|██        | 37/180 [00:03<00:12, 11.26it/s][A
Training:  23%|██▎       | 41/180 [00:04<00:12, 11.36it/s][A
Training:  25%|██▌       | 45/180 [00:04<00:11, 11.65it/s][A
Training:  27%|██▋       | 49/180 [00:04<00:11, 11.89it/s][A
Training:  29%|██▉       | 53/180 [00:05<00:10, 12.03it/s][A
Training:  32%|███▏ 

Epoch: 17/55 - Loss: 0.0846 - Accuracy: 0.9687



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:12,  1.75it/s][A
 22%|██▏       | 5/23 [00:00<00:02,  6.12it/s][A
 39%|███▉      | 9/23 [00:01<00:01,  8.20it/s][A
 57%|█████▋    | 13/23 [00:01<00:01,  9.26it/s][A
 74%|███████▍  | 17/23 [00:01<00:00, 10.25it/s][A
100%|██████████| 23/23 [00:02<00:00,  9.58it/s][A
Epochs:  31%|███       | 17/55 [04:59<11:05, 17.51s/it]

Val Loss: 0.1328 - Val Accuracy: 0.9513



Training:   0%|          | 0/180 [00:00<?, ?it/s][A
Training:   1%|          | 1/180 [00:00<01:41,  1.76it/s][A
Training:   3%|▎         | 5/180 [00:00<00:28,  6.21it/s][A
Training:   5%|▌         | 9/180 [00:01<00:20,  8.34it/s][A
Training:   7%|▋         | 13/180 [00:01<00:18,  9.23it/s][A
Training:   9%|▉         | 17/180 [00:01<00:15, 10.23it/s][A
Training:  12%|█▏        | 21/180 [00:02<00:15, 10.46it/s][A
Training:  14%|█▍        | 25/180 [00:02<00:13, 11.08it/s][A
Training:  16%|█▌        | 29/180 [00:02<00:13, 11.27it/s][A
Training:  18%|█▊        | 33/180 [00:03<00:13, 11.25it/s][A
Training:  21%|██        | 37/180 [00:03<00:12, 11.16it/s][A
Training:  23%|██▎       | 41/180 [00:04<00:11, 11.96it/s][A
Training:  25%|██▌       | 45/180 [00:04<00:11, 11.94it/s][A
Training:  27%|██▋       | 49/180 [00:04<00:10, 11.95it/s][A
Training:  29%|██▉       | 53/180 [00:04<00:10, 12.36it/s][A
Training:  32%|███▏      | 57/180 [00:05<00:09, 12.57it/s][A
Training:  33%|███▎

Epoch: 18/55 - Loss: 0.0872 - Accuracy: 0.9679



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:11,  1.96it/s][A
 22%|██▏       | 5/23 [00:00<00:02,  6.70it/s][A
 39%|███▉      | 9/23 [00:01<00:01,  8.73it/s][A
 48%|████▊     | 11/23 [00:01<00:01, 10.30it/s][A
 57%|█████▋    | 13/23 [00:01<00:01,  8.86it/s][A
 74%|███████▍  | 17/23 [00:01<00:00, 10.29it/s][A
100%|██████████| 23/23 [00:02<00:00,  9.86it/s][A
Epochs:  33%|███▎      | 18/55 [05:16<10:49, 17.56s/it]

Val Loss: 0.1169 - Val Accuracy: 0.9624



Training:   0%|          | 0/180 [00:00<?, ?it/s][A
Training:   1%|          | 1/180 [00:00<01:36,  1.85it/s][A
Training:   2%|▏         | 4/180 [00:00<00:23,  7.43it/s][A
Training:   3%|▎         | 6/180 [00:00<00:22,  7.89it/s][A
Training:   4%|▍         | 8/180 [00:01<00:18,  9.23it/s][A
Training:   6%|▌         | 10/180 [00:01<00:18,  9.35it/s][A
Training:   7%|▋         | 12/180 [00:01<00:16, 10.14it/s][A
Training:   8%|▊         | 14/180 [00:01<00:15, 10.48it/s][A
Training:   9%|▉         | 16/180 [00:01<00:15, 10.69it/s][A
Training:  10%|█         | 18/180 [00:01<00:13, 11.59it/s][A
Training:  11%|█         | 20/180 [00:02<00:14, 11.32it/s][A
Training:  12%|█▏        | 22/180 [00:02<00:13, 11.42it/s][A
Training:  13%|█▎        | 24/180 [00:02<00:12, 12.54it/s][A
Training:  14%|█▍        | 26/180 [00:02<00:14, 10.80it/s][A
Training:  16%|█▌        | 28/180 [00:02<00:12, 12.41it/s][A
Training:  17%|█▋        | 30/180 [00:02<00:12, 11.78it/s][A
Training:  18%|█▊   

Epoch: 19/55 - Loss: 0.0844 - Accuracy: 0.9684



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:11,  1.96it/s][A
 22%|██▏       | 5/23 [00:00<00:02,  7.01it/s][A
 35%|███▍      | 8/23 [00:00<00:01, 10.92it/s][A
 43%|████▎     | 10/23 [00:01<00:01,  9.29it/s][A
 57%|█████▋    | 13/23 [00:01<00:01,  9.32it/s][A
 74%|███████▍  | 17/23 [00:01<00:00,  9.97it/s][A
100%|██████████| 23/23 [00:02<00:00, 10.04it/s][A
Epochs:  35%|███▍      | 19/55 [05:34<10:31, 17.55s/it]

Val Loss: 0.1160 - Val Accuracy: 0.9574



Training:   0%|          | 0/180 [00:00<?, ?it/s][A
Training:   1%|          | 1/180 [00:00<01:40,  1.79it/s][A
Training:   3%|▎         | 5/180 [00:00<00:26,  6.53it/s][A
Training:   5%|▌         | 9/180 [00:01<00:19,  8.89it/s][A
Training:   7%|▋         | 12/180 [00:01<00:14, 11.88it/s][A
Training:   8%|▊         | 14/180 [00:01<00:16,  9.85it/s][A
Training:   9%|▉         | 17/180 [00:01<00:17,  9.55it/s][A
Training:  11%|█         | 20/180 [00:02<00:12, 12.34it/s][A
Training:  12%|█▏        | 22/180 [00:02<00:15, 10.37it/s][A
Training:  14%|█▍        | 25/180 [00:02<00:14, 10.35it/s][A
Training:  16%|█▌        | 29/180 [00:02<00:13, 11.09it/s][A
Training:  18%|█▊        | 33/180 [00:03<00:13, 11.14it/s][A
Training:  21%|██        | 37/180 [00:03<00:13, 10.74it/s][A
Training:  23%|██▎       | 41/180 [00:04<00:12, 11.48it/s][A
Training:  25%|██▌       | 45/180 [00:04<00:11, 11.56it/s][A
Training:  27%|██▋       | 49/180 [00:04<00:11, 11.61it/s][A
Training:  29%|██▉ 

Epoch: 20/55 - Loss: 0.0853 - Accuracy: 0.9690



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:11,  1.86it/s][A
 22%|██▏       | 5/23 [00:00<00:02,  6.60it/s][A
 39%|███▉      | 9/23 [00:01<00:01,  8.19it/s][A
 57%|█████▋    | 13/23 [00:01<00:01,  8.96it/s][A
 74%|███████▍  | 17/23 [00:01<00:00,  9.87it/s][A
100%|██████████| 23/23 [00:02<00:00,  9.62it/s][A
Epochs:  36%|███▋      | 20/55 [05:51<10:15, 17.58s/it]

Val Loss: 0.1109 - Val Accuracy: 0.9558



Training:   0%|          | 0/180 [00:00<?, ?it/s][A
Training:   1%|          | 1/180 [00:00<01:39,  1.80it/s][A
Training:   3%|▎         | 5/180 [00:00<00:25,  6.75it/s][A
Training:   5%|▌         | 9/180 [00:01<00:19,  8.74it/s][A
Training:   7%|▋         | 13/180 [00:01<00:16,  9.83it/s][A
Training:   9%|▉         | 17/180 [00:01<00:15, 10.50it/s][A
Training:  12%|█▏        | 21/180 [00:02<00:14, 11.09it/s][A
Training:  14%|█▍        | 25/180 [00:02<00:14, 11.04it/s][A
Training:  16%|█▌        | 29/180 [00:02<00:13, 10.98it/s][A
Training:  18%|█▊        | 33/180 [00:03<00:12, 11.49it/s][A
Training:  21%|██        | 37/180 [00:03<00:12, 11.43it/s][A
Training:  23%|██▎       | 41/180 [00:03<00:12, 11.14it/s][A
Training:  25%|██▌       | 45/180 [00:04<00:11, 11.66it/s][A
Training:  27%|██▋       | 49/180 [00:04<00:11, 11.84it/s][A
Training:  29%|██▉       | 53/180 [00:04<00:11, 11.54it/s][A
Training:  32%|███▏      | 57/180 [00:05<00:10, 11.90it/s][A
Training:  34%|███▍

Epoch: 21/55 - Loss: 0.0800 - Accuracy: 0.9709



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:11,  1.88it/s][A
 22%|██▏       | 5/23 [00:00<00:02,  6.72it/s][A
 39%|███▉      | 9/23 [00:01<00:01,  8.64it/s][A
 57%|█████▋    | 13/23 [00:01<00:01,  9.46it/s][A
 74%|███████▍  | 17/23 [00:01<00:00, 10.41it/s][A
100%|██████████| 23/23 [00:02<00:00, 10.00it/s][A
Epochs:  38%|███▊      | 21/55 [06:09<09:56, 17.55s/it]

Val Loss: 0.1159 - Val Accuracy: 0.9591



Training:   0%|          | 0/180 [00:00<?, ?it/s][A
Training:   1%|          | 1/180 [00:00<01:39,  1.80it/s][A
Training:   3%|▎         | 5/180 [00:00<00:26,  6.63it/s][A
Training:   5%|▌         | 9/180 [00:01<00:20,  8.38it/s][A
Training:   7%|▋         | 13/180 [00:01<00:18,  9.27it/s][A
Training:   9%|▉         | 17/180 [00:01<00:16, 10.11it/s][A
Training:  12%|█▏        | 21/180 [00:02<00:15, 10.55it/s][A
Training:  14%|█▍        | 25/180 [00:02<00:13, 11.22it/s][A
Training:  16%|█▌        | 29/180 [00:02<00:13, 11.57it/s][A
Training:  18%|█▊        | 33/180 [00:03<00:12, 11.55it/s][A
Training:  21%|██        | 37/180 [00:03<00:12, 11.20it/s][A
Training:  23%|██▎       | 41/180 [00:04<00:12, 11.39it/s][A
Training:  24%|██▍       | 44/180 [00:04<00:10, 13.44it/s][A
Training:  26%|██▌       | 46/180 [00:04<00:11, 11.44it/s][A
Training:  27%|██▋       | 49/180 [00:04<00:12, 10.90it/s][A
Training:  29%|██▉       | 53/180 [00:05<00:11, 11.21it/s][A
Training:  32%|███▏

Epoch: 22/55 - Loss: 0.0871 - Accuracy: 0.9673



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:11,  1.91it/s][A
 22%|██▏       | 5/23 [00:00<00:02,  7.29it/s][A
 35%|███▍      | 8/23 [00:00<00:01, 11.27it/s][A
 43%|████▎     | 10/23 [00:01<00:01,  9.23it/s][A
 57%|█████▋    | 13/23 [00:01<00:01,  9.57it/s][A
 70%|██████▉   | 16/23 [00:01<00:00, 12.60it/s][A
 78%|███████▊  | 18/23 [00:01<00:00,  9.90it/s][A
100%|██████████| 23/23 [00:02<00:00,  9.88it/s][A
Epochs:  40%|████      | 22/55 [06:27<09:40, 17.59s/it]

Val Loss: 0.1223 - Val Accuracy: 0.9602



Training:   0%|          | 0/180 [00:00<?, ?it/s][A
Training:   1%|          | 1/180 [00:00<01:44,  1.71it/s][A
Training:   3%|▎         | 5/180 [00:00<00:26,  6.62it/s][A
Training:   5%|▌         | 9/180 [00:01<00:19,  8.66it/s][A
Training:   7%|▋         | 13/180 [00:01<00:18,  9.19it/s][A
Training:   9%|▉         | 17/180 [00:01<00:16,  9.90it/s][A
Training:  12%|█▏        | 21/180 [00:02<00:15, 10.48it/s][A
Training:  14%|█▍        | 25/180 [00:02<00:14, 10.95it/s][A
Training:  16%|█▌        | 29/180 [00:02<00:13, 11.50it/s][A
Training:  18%|█▊        | 33/180 [00:03<00:12, 11.54it/s][A
Training:  21%|██        | 37/180 [00:03<00:13, 10.83it/s][A
Training:  23%|██▎       | 41/180 [00:04<00:12, 11.39it/s][A
Training:  25%|██▌       | 45/180 [00:04<00:11, 11.71it/s][A
Training:  27%|██▋       | 49/180 [00:04<00:11, 11.13it/s][A
Training:  29%|██▉       | 53/180 [00:05<00:11, 11.48it/s][A
Training:  32%|███▏      | 57/180 [00:05<00:10, 11.73it/s][A
Training:  34%|███▍

Epoch: 23/55 - Loss: 0.0861 - Accuracy: 0.9674



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:10,  2.06it/s][A
 22%|██▏       | 5/23 [00:00<00:02,  7.55it/s][A
 39%|███▉      | 9/23 [00:01<00:01,  9.73it/s][A
 57%|█████▋    | 13/23 [00:01<00:00, 10.74it/s][A
 74%|███████▍  | 17/23 [00:01<00:00, 10.68it/s][A
100%|██████████| 23/23 [00:02<00:00, 10.71it/s][A
Epochs:  42%|████▏     | 23/55 [06:44<09:22, 17.57s/it]

Val Loss: 0.1138 - Val Accuracy: 0.9608



Training:   0%|          | 0/180 [00:00<?, ?it/s][A
Training:   1%|          | 1/180 [00:00<01:47,  1.66it/s][A
Training:   3%|▎         | 5/180 [00:00<00:27,  6.29it/s][A
Training:   5%|▌         | 9/180 [00:01<00:19,  8.59it/s][A
Training:   7%|▋         | 13/180 [00:01<00:17,  9.30it/s][A
Training:   9%|▉         | 17/180 [00:01<00:16, 10.17it/s][A
Training:  12%|█▏        | 21/180 [00:02<00:14, 10.65it/s][A
Training:  14%|█▍        | 25/180 [00:02<00:14, 10.97it/s][A
Training:  16%|█▌        | 29/180 [00:02<00:13, 11.24it/s][A
Training:  18%|█▊        | 33/180 [00:03<00:12, 11.39it/s][A
Training:  21%|██        | 37/180 [00:03<00:12, 11.75it/s][A
Training:  23%|██▎       | 41/180 [00:04<00:12, 11.38it/s][A
Training:  25%|██▌       | 45/180 [00:04<00:11, 11.41it/s][A
Training:  27%|██▋       | 49/180 [00:04<00:11, 11.77it/s][A
Training:  29%|██▉       | 53/180 [00:05<00:10, 11.61it/s][A
Training:  32%|███▏      | 57/180 [00:05<00:10, 11.80it/s][A
Training:  34%|███▍

Epoch: 24/55 - Loss: 0.0799 - Accuracy: 0.9701



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:11,  1.90it/s][A
 22%|██▏       | 5/23 [00:00<00:02,  6.89it/s][A
 39%|███▉      | 9/23 [00:01<00:01,  9.60it/s][A
 57%|█████▋    | 13/23 [00:01<00:00, 11.26it/s][A
 74%|███████▍  | 17/23 [00:01<00:00, 11.87it/s][A
100%|██████████| 23/23 [00:02<00:00, 11.20it/s][A
Epochs:  44%|████▎     | 24/55 [07:02<09:04, 17.55s/it]

Val Loss: 0.1210 - Val Accuracy: 0.9591



Training:   0%|          | 0/180 [00:00<?, ?it/s][A
Training:   1%|          | 1/180 [00:00<01:39,  1.79it/s][A
Training:   3%|▎         | 5/180 [00:00<00:26,  6.51it/s][A
Training:   5%|▌         | 9/180 [00:01<00:20,  8.18it/s][A
Training:   7%|▋         | 13/180 [00:01<00:17,  9.52it/s][A
Training:   9%|▉         | 17/180 [00:01<00:15, 10.23it/s][A
Training:  12%|█▏        | 21/180 [00:02<00:14, 10.84it/s][A
Training:  14%|█▍        | 25/180 [00:02<00:14, 11.05it/s][A
Training:  16%|█▌        | 29/180 [00:02<00:13, 11.48it/s][A
Training:  18%|█▊        | 33/180 [00:03<00:12, 11.84it/s][A
Training:  21%|██        | 37/180 [00:03<00:11, 11.92it/s][A
Training:  23%|██▎       | 41/180 [00:03<00:11, 12.00it/s][A
Training:  25%|██▌       | 45/180 [00:04<00:10, 12.30it/s][A
Training:  27%|██▋       | 49/180 [00:04<00:10, 12.30it/s][A
Training:  29%|██▉       | 53/180 [00:04<00:10, 12.32it/s][A
Training:  32%|███▏      | 57/180 [00:05<00:10, 11.82it/s][A
Training:  34%|███▍

Epoch: 25/55 - Loss: 0.0807 - Accuracy: 0.9704



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:11,  1.98it/s][A
 22%|██▏       | 5/23 [00:00<00:02,  6.78it/s][A
 39%|███▉      | 9/23 [00:01<00:01,  8.75it/s][A
 57%|█████▋    | 13/23 [00:01<00:01,  9.78it/s][A
 74%|███████▍  | 17/23 [00:01<00:00, 11.09it/s][A
100%|██████████| 23/23 [00:02<00:00, 10.63it/s][A
Epochs:  45%|████▌     | 25/55 [07:19<08:45, 17.52s/it]

Val Loss: 0.1281 - Val Accuracy: 0.9546



Training:   0%|          | 0/180 [00:00<?, ?it/s][A
Training:   1%|          | 1/180 [00:00<01:27,  2.05it/s][A
Training:   3%|▎         | 5/180 [00:00<00:23,  7.30it/s][A
Training:   5%|▌         | 9/180 [00:01<00:19,  8.86it/s][A
Training:   7%|▋         | 13/180 [00:01<00:16, 10.22it/s][A
Training:   9%|▉         | 17/180 [00:01<00:15, 10.56it/s][A
Training:  11%|█         | 20/180 [00:01<00:12, 12.47it/s][A
Training:  12%|█▏        | 22/180 [00:02<00:14, 10.89it/s][A
Training:  14%|█▍        | 25/180 [00:02<00:14, 10.56it/s][A
Training:  16%|█▌        | 29/180 [00:02<00:13, 10.84it/s][A
Training:  18%|█▊        | 33/180 [00:03<00:13, 11.24it/s][A
Training:  21%|██        | 37/180 [00:03<00:12, 11.37it/s][A
Training:  23%|██▎       | 41/180 [00:03<00:12, 11.41it/s][A
Training:  25%|██▌       | 45/180 [00:04<00:12, 11.13it/s][A
Training:  27%|██▋       | 49/180 [00:04<00:11, 11.02it/s][A
Training:  29%|██▉       | 53/180 [00:05<00:11, 11.27it/s][A
Training:  32%|███▏

Epoch: 26/55 - Loss: 0.0824 - Accuracy: 0.9715



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:11,  1.99it/s][A
 22%|██▏       | 5/23 [00:00<00:02,  7.74it/s][A
 30%|███       | 7/23 [00:00<00:01,  9.60it/s][A
 39%|███▉      | 9/23 [00:01<00:01,  9.98it/s][A
 48%|████▊     | 11/23 [00:01<00:01, 11.43it/s][A
 57%|█████▋    | 13/23 [00:01<00:00, 10.84it/s][A
 65%|██████▌   | 15/23 [00:01<00:00, 11.36it/s][A
 74%|███████▍  | 17/23 [00:01<00:00, 11.88it/s][A
 83%|████████▎ | 19/23 [00:01<00:00, 11.78it/s][A
100%|██████████| 23/23 [00:02<00:00, 10.77it/s][A
Epochs:  47%|████▋     | 26/55 [07:37<08:28, 17.52s/it]

Val Loss: 0.1155 - Val Accuracy: 0.9574



Training:   0%|          | 0/180 [00:00<?, ?it/s][A
Training:   1%|          | 1/180 [00:00<01:30,  1.97it/s][A
Training:   3%|▎         | 5/180 [00:00<00:24,  7.13it/s][A
Training:   5%|▌         | 9/180 [00:01<00:18,  9.06it/s][A
Training:   7%|▋         | 13/180 [00:01<00:16, 10.03it/s][A
Training:   9%|▉         | 17/180 [00:01<00:15, 10.50it/s][A
Training:  12%|█▏        | 21/180 [00:02<00:15, 10.49it/s][A
Training:  14%|█▍        | 25/180 [00:02<00:14, 10.79it/s][A
Training:  16%|█▌        | 29/180 [00:02<00:14, 10.52it/s][A
Training:  18%|█▊        | 33/180 [00:03<00:13, 10.71it/s][A
Training:  21%|██        | 37/180 [00:03<00:13, 10.89it/s][A
Training:  23%|██▎       | 41/180 [00:04<00:12, 11.01it/s][A
Training:  25%|██▌       | 45/180 [00:04<00:12, 11.05it/s][A
Training:  27%|██▋       | 49/180 [00:04<00:12, 10.80it/s][A
Training:  29%|██▉       | 53/180 [00:05<00:11, 11.23it/s][A
Training:  32%|███▏      | 57/180 [00:05<00:10, 11.35it/s][A
Training:  34%|███▍

Epoch: 27/55 - Loss: 0.0777 - Accuracy: 0.9707



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:11,  1.90it/s][A
 22%|██▏       | 5/23 [00:00<00:02,  6.73it/s][A
 39%|███▉      | 9/23 [00:01<00:01,  9.32it/s][A
 57%|█████▋    | 13/23 [00:01<00:01,  9.92it/s][A
 74%|███████▍  | 17/23 [00:01<00:00, 10.77it/s][A
100%|██████████| 23/23 [00:02<00:00, 10.22it/s][A
Epochs:  49%|████▉     | 27/55 [07:54<08:12, 17.59s/it]

Val Loss: 0.1256 - Val Accuracy: 0.9546



Training:   0%|          | 0/180 [00:00<?, ?it/s][A
Training:   1%|          | 1/180 [00:00<01:30,  1.97it/s][A
Training:   3%|▎         | 5/180 [00:00<00:24,  7.20it/s][A
Training:   5%|▌         | 9/180 [00:01<00:16, 10.08it/s][A
Training:   7%|▋         | 13/180 [00:01<00:15, 10.97it/s][A
Training:   9%|▉         | 17/180 [00:01<00:13, 11.70it/s][A
Training:  11%|█         | 19/180 [00:01<00:12, 12.61it/s][A
Training:  12%|█▏        | 21/180 [00:02<00:13, 11.37it/s][A
Training:  13%|█▎        | 23/180 [00:02<00:13, 11.49it/s][A
Training:  14%|█▍        | 25/180 [00:02<00:13, 11.52it/s][A
Training:  15%|█▌        | 27/180 [00:02<00:13, 11.15it/s][A
Training:  16%|█▌        | 29/180 [00:02<00:12, 11.93it/s][A
Training:  17%|█▋        | 31/180 [00:02<00:13, 10.95it/s][A
Training:  18%|█▊        | 33/180 [00:03<00:12, 11.97it/s][A
Training:  19%|█▉        | 35/180 [00:03<00:13, 11.15it/s][A
Training:  21%|██        | 37/180 [00:03<00:11, 12.54it/s][A
Training:  22%|██▏ 

Epoch: 28/55 - Loss: 0.0817 - Accuracy: 0.9707



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:12,  1.78it/s][A
 22%|██▏       | 5/23 [00:00<00:02,  6.83it/s][A
 35%|███▍      | 8/23 [00:00<00:01, 10.20it/s][A
 43%|████▎     | 10/23 [00:01<00:01, 10.92it/s][A
 52%|█████▏    | 12/23 [00:01<00:00, 11.81it/s][A
 61%|██████    | 14/23 [00:01<00:00, 11.75it/s][A
 70%|██████▉   | 16/23 [00:01<00:00, 11.59it/s][A
 78%|███████▊  | 18/23 [00:01<00:00, 12.24it/s][A
 87%|████████▋ | 20/23 [00:01<00:00, 12.05it/s][A
100%|██████████| 23/23 [00:02<00:00, 10.34it/s][A
Epochs:  51%|█████     | 28/55 [08:12<07:55, 17.62s/it]

Val Loss: 0.1193 - Val Accuracy: 0.9624



Training:   0%|          | 0/180 [00:00<?, ?it/s][A
Training:   1%|          | 1/180 [00:00<01:40,  1.78it/s][A
Training:   3%|▎         | 5/180 [00:00<00:25,  6.75it/s][A
Training:   5%|▌         | 9/180 [00:01<00:18,  9.21it/s][A
Training:   7%|▋         | 13/180 [00:01<00:15, 10.63it/s][A
Training:   9%|▉         | 17/180 [00:01<00:14, 11.51it/s][A
Training:  12%|█▏        | 21/180 [00:02<00:13, 11.70it/s][A
Training:  14%|█▍        | 25/180 [00:02<00:13, 11.43it/s][A
Training:  16%|█▌        | 29/180 [00:02<00:13, 11.58it/s][A
Training:  18%|█▊        | 33/180 [00:03<00:12, 11.74it/s][A
Training:  21%|██        | 37/180 [00:03<00:12, 11.31it/s][A
Training:  23%|██▎       | 41/180 [00:03<00:12, 11.47it/s][A
Training:  25%|██▌       | 45/180 [00:04<00:11, 11.54it/s][A
Training:  27%|██▋       | 49/180 [00:04<00:11, 11.89it/s][A
Training:  29%|██▉       | 53/180 [00:04<00:10, 11.73it/s][A
Training:  32%|███▏      | 57/180 [00:05<00:10, 11.41it/s][A
Training:  34%|███▍

Epoch: 29/55 - Loss: 0.0769 - Accuracy: 0.9717



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:12,  1.76it/s][A
 22%|██▏       | 5/23 [00:00<00:02,  6.25it/s][A
 39%|███▉      | 9/23 [00:01<00:01,  8.75it/s][A
 57%|█████▋    | 13/23 [00:01<00:00, 10.07it/s][A
 74%|███████▍  | 17/23 [00:01<00:00, 11.64it/s][A
100%|██████████| 23/23 [00:02<00:00, 10.75it/s][A
Epochs:  53%|█████▎    | 29/55 [08:30<07:36, 17.56s/it]

Val Loss: 0.1285 - Val Accuracy: 0.9585



Training:   0%|          | 0/180 [00:00<?, ?it/s][A
Training:   1%|          | 1/180 [00:00<01:39,  1.80it/s][A
Training:   3%|▎         | 5/180 [00:00<00:25,  6.76it/s][A
Training:   5%|▌         | 9/180 [00:01<00:18,  9.16it/s][A
Training:   6%|▌         | 11/180 [00:01<00:15, 10.59it/s][A
Training:   7%|▋         | 13/180 [00:01<00:16, 10.24it/s][A
Training:   8%|▊         | 15/180 [00:01<00:14, 11.36it/s][A
Training:   9%|▉         | 17/180 [00:01<00:14, 11.03it/s][A
Training:  11%|█         | 19/180 [00:01<00:12, 12.61it/s][A
Training:  12%|█▏        | 21/180 [00:02<00:13, 11.47it/s][A
Training:  13%|█▎        | 23/180 [00:02<00:11, 13.13it/s][A
Training:  14%|█▍        | 25/180 [00:02<00:12, 12.45it/s][A
Training:  15%|█▌        | 27/180 [00:02<00:11, 13.64it/s][A
Training:  16%|█▌        | 29/180 [00:02<00:11, 12.78it/s][A
Training:  18%|█▊        | 33/180 [00:03<00:11, 13.16it/s][A
Training:  21%|██        | 37/180 [00:03<00:11, 12.79it/s][A
Training:  23%|██▎ 

Epoch: 30/55 - Loss: 0.0812 - Accuracy: 0.9697



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:10,  2.02it/s][A
 22%|██▏       | 5/23 [00:00<00:02,  6.85it/s][A
 39%|███▉      | 9/23 [00:01<00:01,  9.00it/s][A
 57%|█████▋    | 13/23 [00:01<00:00, 10.38it/s][A
 70%|██████▉   | 16/23 [00:01<00:00, 12.39it/s][A
 78%|███████▊  | 18/23 [00:01<00:00, 11.29it/s][A
100%|██████████| 23/23 [00:02<00:00, 10.11it/s][A
Epochs:  55%|█████▍    | 30/55 [08:47<07:19, 17.56s/it]

Val Loss: 0.1292 - Val Accuracy: 0.9570



Training:   0%|          | 0/180 [00:00<?, ?it/s][A
Training:   1%|          | 1/180 [00:00<01:37,  1.84it/s][A
Training:   3%|▎         | 5/180 [00:00<00:26,  6.65it/s][A
Training:   5%|▌         | 9/180 [00:01<00:19,  8.84it/s][A
Training:   7%|▋         | 13/180 [00:01<00:16,  9.85it/s][A
Training:   9%|▉         | 17/180 [00:01<00:15, 10.52it/s][A
Training:  12%|█▏        | 21/180 [00:02<00:14, 10.87it/s][A
Training:  14%|█▍        | 25/180 [00:02<00:13, 11.78it/s][A
Training:  16%|█▌        | 29/180 [00:02<00:12, 12.20it/s][A
Training:  18%|█▊        | 33/180 [00:03<00:11, 12.81it/s][A
Training:  21%|██        | 37/180 [00:03<00:10, 13.21it/s][A
Training:  23%|██▎       | 41/180 [00:03<00:10, 13.45it/s][A
Training:  24%|██▍       | 44/180 [00:03<00:08, 15.32it/s][A
Training:  26%|██▌       | 46/180 [00:04<00:10, 12.80it/s][A
Training:  27%|██▋       | 49/180 [00:04<00:11, 11.80it/s][A
Training:  29%|██▉       | 52/180 [00:04<00:09, 13.68it/s][A
Training:  30%|███ 

Epoch: 31/55 - Loss: 0.0780 - Accuracy: 0.9719



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:13,  1.64it/s][A
 22%|██▏       | 5/23 [00:00<00:02,  6.09it/s][A
 39%|███▉      | 9/23 [00:01<00:01,  8.35it/s][A
 57%|█████▋    | 13/23 [00:01<00:01,  9.56it/s][A
 74%|███████▍  | 17/23 [00:01<00:00, 10.19it/s][A
100%|██████████| 23/23 [00:02<00:00,  9.80it/s][A
Epochs:  56%|█████▋    | 31/55 [09:05<07:01, 17.57s/it]

Val Loss: 0.1366 - Val Accuracy: 0.9519



Training:   0%|          | 0/180 [00:00<?, ?it/s][A
Training:   1%|          | 1/180 [00:00<01:43,  1.73it/s][A
Training:   3%|▎         | 5/180 [00:00<00:24,  7.17it/s][A
Training:   5%|▌         | 9/180 [00:01<00:17,  9.57it/s][A
Training:   7%|▋         | 13/180 [00:01<00:15, 10.68it/s][A
Training:   8%|▊         | 15/180 [00:01<00:13, 11.80it/s][A
Training:   9%|▉         | 17/180 [00:01<00:14, 11.09it/s][A
Training:  12%|█▏        | 21/180 [00:02<00:13, 11.48it/s][A
Training:  13%|█▎        | 23/180 [00:02<00:13, 11.86it/s][A
Training:  14%|█▍        | 25/180 [00:02<00:13, 11.45it/s][A
Training:  15%|█▌        | 27/180 [00:02<00:12, 11.90it/s][A
Training:  16%|█▌        | 29/180 [00:02<00:13, 11.10it/s][A
Training:  18%|█▊        | 33/180 [00:03<00:12, 11.71it/s][A
Training:  21%|██        | 37/180 [00:03<00:11, 12.38it/s][A
Training:  23%|██▎       | 41/180 [00:03<00:10, 13.02it/s][A
Training:  25%|██▌       | 45/180 [00:03<00:09, 14.01it/s][A
Training:  26%|██▌ 

Epoch: 32/55 - Loss: 0.0752 - Accuracy: 0.9727



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:12,  1.77it/s][A
 22%|██▏       | 5/23 [00:00<00:02,  6.34it/s][A
 39%|███▉      | 9/23 [00:01<00:01,  8.17it/s][A
 52%|█████▏    | 12/23 [00:01<00:01, 10.99it/s][A
 61%|██████    | 14/23 [00:01<00:00,  9.50it/s][A
 74%|███████▍  | 17/23 [00:01<00:00,  9.92it/s][A
100%|██████████| 23/23 [00:02<00:00,  9.50it/s][A
Epochs:  58%|█████▊    | 32/55 [09:22<06:45, 17.62s/it]

Val Loss: 0.1221 - Val Accuracy: 0.9608



Training:   0%|          | 0/180 [00:00<?, ?it/s][A
Training:   1%|          | 1/180 [00:00<01:41,  1.77it/s][A
Training:   3%|▎         | 5/180 [00:00<00:27,  6.40it/s][A
Training:   5%|▌         | 9/180 [00:01<00:19,  8.56it/s][A
Training:   7%|▋         | 13/180 [00:01<00:16, 10.39it/s][A
Training:   9%|▉         | 17/180 [00:01<00:14, 11.00it/s][A
Training:  12%|█▏        | 21/180 [00:02<00:13, 11.91it/s][A
Training:  14%|█▍        | 25/180 [00:02<00:13, 11.81it/s][A
Training:  16%|█▌        | 29/180 [00:02<00:12, 12.31it/s][A
Training:  18%|█▊        | 32/180 [00:02<00:10, 14.45it/s][A
Training:  19%|█▉        | 34/180 [00:03<00:11, 12.29it/s][A
Training:  21%|██        | 37/180 [00:03<00:12, 11.78it/s][A
Training:  23%|██▎       | 41/180 [00:03<00:11, 12.61it/s][A
Training:  25%|██▌       | 45/180 [00:03<00:10, 12.93it/s][A
Training:  27%|██▋       | 49/180 [00:04<00:09, 13.21it/s][A
Training:  29%|██▉       | 53/180 [00:04<00:09, 13.00it/s][A
Training:  31%|███ 

Epoch: 33/55 - Loss: 0.0730 - Accuracy: 0.9737



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:12,  1.70it/s][A
 22%|██▏       | 5/23 [00:00<00:02,  6.25it/s][A
 39%|███▉      | 9/23 [00:01<00:01,  8.80it/s][A
 57%|█████▋    | 13/23 [00:01<00:01,  9.86it/s][A
 74%|███████▍  | 17/23 [00:01<00:00, 10.52it/s][A
100%|██████████| 23/23 [00:02<00:00, 10.16it/s][A
Epochs:  60%|██████    | 33/55 [09:40<06:26, 17.58s/it]

Val Loss: 0.1146 - Val Accuracy: 0.9624



Training:   0%|          | 0/180 [00:00<?, ?it/s][A
Training:   1%|          | 1/180 [00:00<01:41,  1.76it/s][A
Training:   3%|▎         | 5/180 [00:00<00:25,  6.77it/s][A
Training:   5%|▌         | 9/180 [00:01<00:19,  8.82it/s][A
Training:   7%|▋         | 13/180 [00:01<00:16,  9.83it/s][A
Training:   9%|▉         | 17/180 [00:01<00:15, 10.44it/s][A
Training:  12%|█▏        | 21/180 [00:02<00:13, 11.51it/s][A
Training:  14%|█▍        | 25/180 [00:02<00:13, 11.55it/s][A
Training:  16%|█▌        | 29/180 [00:02<00:13, 11.53it/s][A
Training:  18%|█▊        | 33/180 [00:03<00:12, 11.63it/s][A
Training:  21%|██        | 37/180 [00:03<00:12, 11.37it/s][A
Training:  23%|██▎       | 41/180 [00:03<00:11, 11.73it/s][A
Training:  25%|██▌       | 45/180 [00:04<00:11, 12.16it/s][A
Training:  27%|██▋       | 49/180 [00:04<00:10, 12.21it/s][A
Training:  29%|██▉       | 53/180 [00:04<00:10, 12.51it/s][A
Training:  32%|███▏      | 57/180 [00:05<00:09, 12.86it/s][A
Training:  34%|███▍

Epoch: 34/55 - Loss: 0.0777 - Accuracy: 0.9707



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:12,  1.72it/s][A
 22%|██▏       | 5/23 [00:00<00:02,  6.73it/s][A
 39%|███▉      | 9/23 [00:01<00:01,  9.00it/s][A
 48%|████▊     | 11/23 [00:01<00:01, 10.61it/s][A
 57%|█████▋    | 13/23 [00:01<00:01,  9.90it/s][A
 65%|██████▌   | 15/23 [00:01<00:00, 11.25it/s][A
 74%|███████▍  | 17/23 [00:01<00:00, 11.09it/s][A
 83%|████████▎ | 19/23 [00:02<00:00, 11.45it/s][A
 91%|█████████▏| 21/23 [00:02<00:00, 11.80it/s][A
100%|██████████| 23/23 [00:02<00:00,  9.81it/s][A
Epochs:  62%|██████▏   | 34/55 [09:57<06:09, 17.58s/it]

Val Loss: 0.1339 - Val Accuracy: 0.9591



Training:   0%|          | 0/180 [00:00<?, ?it/s][A
Training:   1%|          | 1/180 [00:00<01:40,  1.79it/s][A
Training:   3%|▎         | 5/180 [00:00<00:26,  6.70it/s][A
Training:   5%|▌         | 9/180 [00:01<00:19,  8.92it/s][A
Training:   6%|▌         | 11/180 [00:01<00:16, 10.05it/s][A
Training:   7%|▋         | 13/180 [00:01<00:17,  9.47it/s][A
Training:   9%|▉         | 16/180 [00:01<00:12, 12.68it/s][A
Training:  10%|█         | 18/180 [00:01<00:14, 11.43it/s][A
Training:  11%|█         | 20/180 [00:02<00:12, 12.85it/s][A
Training:  12%|█▏        | 22/180 [00:02<00:14, 11.25it/s][A
Training:  14%|█▍        | 25/180 [00:02<00:13, 11.08it/s][A
Training:  16%|█▌        | 28/180 [00:02<00:10, 13.98it/s][A
Training:  17%|█▋        | 30/180 [00:02<00:12, 12.31it/s][A
Training:  18%|█▊        | 33/180 [00:03<00:12, 12.04it/s][A
Training:  20%|██        | 36/180 [00:03<00:10, 13.94it/s][A
Training:  21%|██        | 38/180 [00:03<00:12, 11.78it/s][A
Training:  22%|██▏ 

Epoch: 35/55 - Loss: 0.0751 - Accuracy: 0.9714



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:12,  1.81it/s][A
 22%|██▏       | 5/23 [00:00<00:02,  6.83it/s][A
 35%|███▍      | 8/23 [00:00<00:01, 10.65it/s][A
 43%|████▎     | 10/23 [00:01<00:01,  9.08it/s][A
 57%|█████▋    | 13/23 [00:01<00:01,  9.73it/s][A
 65%|██████▌   | 15/23 [00:01<00:00, 11.34it/s][A
 74%|███████▍  | 17/23 [00:01<00:00, 10.77it/s][A
 87%|████████▋ | 20/23 [00:01<00:00, 12.96it/s][A
100%|██████████| 23/23 [00:02<00:00,  9.96it/s][A
Epochs:  64%|██████▎   | 35/55 [10:15<05:51, 17.57s/it]

Val Loss: 0.1273 - Val Accuracy: 0.9585



Training:   0%|          | 0/180 [00:00<?, ?it/s][A
Training:   1%|          | 1/180 [00:00<01:55,  1.56it/s][A
Training:   3%|▎         | 5/180 [00:00<00:28,  6.05it/s][A
Training:   5%|▌         | 9/180 [00:01<00:20,  8.38it/s][A
Training:   7%|▋         | 13/180 [00:01<00:17,  9.60it/s][A
Training:   9%|▉         | 17/180 [00:01<00:15, 10.64it/s][A
Training:  12%|█▏        | 21/180 [00:02<00:14, 11.21it/s][A
Training:  14%|█▍        | 25/180 [00:02<00:14, 10.95it/s][A
Training:  16%|█▌        | 29/180 [00:02<00:13, 11.49it/s][A
Training:  18%|█▊        | 32/180 [00:03<00:10, 13.66it/s][A
Training:  19%|█▉        | 34/180 [00:03<00:11, 12.21it/s][A
Training:  21%|██        | 37/180 [00:03<00:11, 11.95it/s][A
Training:  23%|██▎       | 41/180 [00:03<00:11, 12.55it/s][A
Training:  25%|██▌       | 45/180 [00:04<00:10, 12.55it/s][A
Training:  27%|██▋       | 49/180 [00:04<00:10, 12.87it/s][A
Training:  28%|██▊       | 51/180 [00:04<00:09, 13.45it/s][A
Training:  29%|██▉ 

Epoch: 36/55 - Loss: 0.0760 - Accuracy: 0.9711



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:11,  1.84it/s][A
 22%|██▏       | 5/23 [00:00<00:02,  6.70it/s][A
 39%|███▉      | 9/23 [00:01<00:01,  9.01it/s][A
 57%|█████▋    | 13/23 [00:01<00:01,  9.84it/s][A
 74%|███████▍  | 17/23 [00:01<00:00, 10.73it/s][A
100%|██████████| 23/23 [00:02<00:00, 10.31it/s][A
Epochs:  65%|██████▌   | 36/55 [10:33<05:33, 17.57s/it]

Val Loss: 0.1173 - Val Accuracy: 0.9597



Training:   0%|          | 0/180 [00:00<?, ?it/s][A
Training:   1%|          | 1/180 [00:00<01:36,  1.86it/s][A
Training:   3%|▎         | 5/180 [00:00<00:26,  6.61it/s][A
Training:   5%|▌         | 9/180 [00:01<00:19,  8.81it/s][A
Training:   7%|▋         | 13/180 [00:01<00:17,  9.41it/s][A
Training:   9%|▉         | 17/180 [00:01<00:15, 10.28it/s][A
Training:  12%|█▏        | 21/180 [00:02<00:14, 10.74it/s][A
Training:  14%|█▍        | 25/180 [00:02<00:14, 10.61it/s][A
Training:  16%|█▌        | 29/180 [00:02<00:13, 10.92it/s][A
Training:  18%|█▊        | 33/180 [00:03<00:12, 11.38it/s][A
Training:  21%|██        | 37/180 [00:03<00:12, 11.60it/s][A
Training:  23%|██▎       | 41/180 [00:03<00:11, 11.92it/s][A
Training:  25%|██▌       | 45/180 [00:04<00:10, 12.51it/s][A
Training:  27%|██▋       | 48/180 [00:04<00:09, 14.60it/s][A
Training:  28%|██▊       | 50/180 [00:04<00:10, 12.23it/s][A
Training:  29%|██▉       | 53/180 [00:04<00:11, 11.33it/s][A
Training:  32%|███▏

Epoch: 37/55 - Loss: 0.0779 - Accuracy: 0.9722



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:12,  1.73it/s][A
 22%|██▏       | 5/23 [00:00<00:02,  6.53it/s][A
 39%|███▉      | 9/23 [00:01<00:01,  8.84it/s][A
 57%|█████▋    | 13/23 [00:01<00:00, 10.05it/s][A
 74%|███████▍  | 17/23 [00:01<00:00, 10.38it/s][A
100%|██████████| 23/23 [00:02<00:00, 10.12it/s][A
Epochs:  67%|██████▋   | 37/55 [10:50<05:16, 17.60s/it]

Val Loss: 0.1247 - Val Accuracy: 0.9558



Training:   0%|          | 0/180 [00:00<?, ?it/s][A
Training:   1%|          | 1/180 [00:00<01:48,  1.65it/s][A
Training:   3%|▎         | 5/180 [00:00<00:27,  6.39it/s][A
Training:   5%|▌         | 9/180 [00:01<00:19,  8.80it/s][A
Training:   7%|▋         | 13/180 [00:01<00:16, 10.19it/s][A
Training:   9%|▉         | 17/180 [00:01<00:16, 10.01it/s][A
Training:  12%|█▏        | 21/180 [00:02<00:15, 10.50it/s][A
Training:  14%|█▍        | 25/180 [00:02<00:14, 10.72it/s][A
Training:  16%|█▌        | 29/180 [00:02<00:13, 11.11it/s][A
Training:  18%|█▊        | 33/180 [00:03<00:13, 11.25it/s][A
Training:  21%|██        | 37/180 [00:03<00:11, 11.94it/s][A
Training:  23%|██▎       | 41/180 [00:03<00:11, 12.28it/s][A
Training:  24%|██▍       | 43/180 [00:04<00:10, 12.96it/s][A
Training:  25%|██▌       | 45/180 [00:04<00:11, 12.11it/s][A
Training:  27%|██▋       | 49/180 [00:04<00:10, 12.78it/s][A
Training:  29%|██▉       | 53/180 [00:04<00:10, 11.99it/s][A
Training:  32%|███▏

Epoch: 38/55 - Loss: 0.0755 - Accuracy: 0.9722



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:09,  2.21it/s][A
 22%|██▏       | 5/23 [00:00<00:02,  7.41it/s][A
 39%|███▉      | 9/23 [00:01<00:01,  9.07it/s][A
 57%|█████▋    | 13/23 [00:01<00:00, 10.07it/s][A
 74%|███████▍  | 17/23 [00:01<00:00, 11.18it/s][A
 87%|████████▋ | 20/23 [00:01<00:00, 13.52it/s][A
100%|██████████| 23/23 [00:02<00:00,  9.98it/s][A
Epochs:  69%|██████▉   | 38/55 [11:08<04:59, 17.63s/it]

Val Loss: 0.1375 - Val Accuracy: 0.9563



Training:   0%|          | 0/180 [00:00<?, ?it/s][A
Training:   1%|          | 1/180 [00:00<01:45,  1.70it/s][A
Training:   3%|▎         | 5/180 [00:00<00:28,  6.25it/s][A
Training:   5%|▌         | 9/180 [00:01<00:19,  8.61it/s][A
Training:   7%|▋         | 13/180 [00:01<00:16, 10.32it/s][A
Training:   9%|▉         | 17/180 [00:01<00:15, 10.44it/s][A
Training:  12%|█▏        | 21/180 [00:02<00:14, 10.80it/s][A
Training:  14%|█▍        | 25/180 [00:02<00:13, 11.09it/s][A
Training:  16%|█▌        | 29/180 [00:02<00:13, 11.30it/s][A
Training:  18%|█▊        | 33/180 [00:03<00:13, 11.20it/s][A
Training:  21%|██        | 37/180 [00:03<00:12, 11.71it/s][A
Training:  23%|██▎       | 41/180 [00:03<00:11, 11.94it/s][A
Training:  25%|██▌       | 45/180 [00:04<00:10, 12.31it/s][A
Training:  27%|██▋       | 49/180 [00:04<00:10, 12.41it/s][A
Training:  29%|██▉       | 52/180 [00:04<00:08, 14.24it/s][A
Training:  30%|███       | 54/180 [00:04<00:10, 11.95it/s][A
Training:  32%|███▏

Epoch: 39/55 - Loss: 0.0750 - Accuracy: 0.9719



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:11,  1.98it/s][A
 22%|██▏       | 5/23 [00:00<00:02,  7.24it/s][A
 39%|███▉      | 9/23 [00:01<00:01,  9.50it/s][A
 57%|█████▋    | 13/23 [00:01<00:00, 10.47it/s][A
 74%|███████▍  | 17/23 [00:01<00:00, 10.88it/s][A
100%|██████████| 23/23 [00:02<00:00, 10.45it/s][A
Epochs:  71%|███████   | 39/55 [11:26<04:41, 17.60s/it]

Val Loss: 0.1205 - Val Accuracy: 0.9632



Training:   0%|          | 0/180 [00:00<?, ?it/s][A
Training:   1%|          | 1/180 [00:00<01:56,  1.54it/s][A
Training:   3%|▎         | 5/180 [00:00<00:27,  6.45it/s][A
Training:   5%|▌         | 9/180 [00:01<00:20,  8.47it/s][A
Training:   7%|▋         | 13/180 [00:01<00:17,  9.60it/s][A
Training:   9%|▉         | 17/180 [00:01<00:15, 10.43it/s][A
Training:  12%|█▏        | 21/180 [00:02<00:15, 10.39it/s][A
Training:  14%|█▍        | 25/180 [00:02<00:14, 11.01it/s][A
Training:  16%|█▌        | 29/180 [00:03<00:13, 10.95it/s][A
Training:  18%|█▊        | 33/180 [00:03<00:13, 11.00it/s][A
Training:  21%|██        | 37/180 [00:03<00:12, 11.48it/s][A
Training:  23%|██▎       | 41/180 [00:04<00:12, 11.55it/s][A
Training:  25%|██▌       | 45/180 [00:04<00:11, 11.88it/s][A
Training:  27%|██▋       | 49/180 [00:04<00:11, 11.27it/s][A
Training:  29%|██▉       | 53/180 [00:05<00:11, 11.33it/s][A
Training:  32%|███▏      | 57/180 [00:05<00:10, 11.76it/s][A
Training:  34%|███▍

Epoch: 40/55 - Loss: 0.0705 - Accuracy: 0.9731



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:10,  2.05it/s][A
 22%|██▏       | 5/23 [00:00<00:02,  6.79it/s][A
 39%|███▉      | 9/23 [00:01<00:01,  9.62it/s][A
 57%|█████▋    | 13/23 [00:01<00:00, 10.64it/s][A
 70%|██████▉   | 16/23 [00:01<00:00, 13.08it/s][A
 78%|███████▊  | 18/23 [00:01<00:00, 11.39it/s][A
100%|██████████| 23/23 [00:02<00:00, 10.50it/s][A
Epochs:  73%|███████▎  | 40/55 [11:43<04:24, 17.61s/it]

Val Loss: 0.1354 - Val Accuracy: 0.9613



Training:   0%|          | 0/180 [00:00<?, ?it/s][A
Training:   1%|          | 1/180 [00:00<01:51,  1.61it/s][A
Training:   3%|▎         | 5/180 [00:00<00:28,  6.21it/s][A
Training:   5%|▌         | 9/180 [00:01<00:20,  8.33it/s][A
Training:   7%|▋         | 13/180 [00:01<00:16,  9.90it/s][A
Training:   9%|▉         | 17/180 [00:01<00:15, 10.50it/s][A
Training:  12%|█▏        | 21/180 [00:02<00:14, 10.89it/s][A
Training:  14%|█▍        | 25/180 [00:02<00:13, 11.48it/s][A
Training:  16%|█▌        | 29/180 [00:02<00:12, 11.65it/s][A
Training:  18%|█▊        | 33/180 [00:03<00:12, 11.40it/s][A
Training:  21%|██        | 37/180 [00:03<00:12, 11.55it/s][A
Training:  23%|██▎       | 41/180 [00:03<00:11, 11.74it/s][A
Training:  25%|██▌       | 45/180 [00:04<00:11, 11.62it/s][A
Training:  27%|██▋       | 49/180 [00:04<00:11, 11.25it/s][A
Training:  29%|██▉       | 53/180 [00:05<00:11, 11.04it/s][A
Training:  32%|███▏      | 57/180 [00:05<00:10, 11.57it/s][A
Training:  34%|███▍

Epoch: 41/55 - Loss: 0.0741 - Accuracy: 0.9716



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:11,  1.95it/s][A
 22%|██▏       | 5/23 [00:00<00:02,  6.98it/s][A
 39%|███▉      | 9/23 [00:01<00:01,  8.65it/s][A
 57%|█████▋    | 13/23 [00:01<00:00, 10.08it/s][A
 74%|███████▍  | 17/23 [00:01<00:00, 10.58it/s][A
100%|██████████| 23/23 [00:02<00:00, 10.38it/s][A
Epochs:  75%|███████▍  | 41/55 [12:01<04:06, 17.59s/it]

Val Loss: 0.1287 - Val Accuracy: 0.9558



Training:   0%|          | 0/180 [00:00<?, ?it/s][A
Training:   1%|          | 1/180 [00:00<01:49,  1.64it/s][A
Training:   3%|▎         | 5/180 [00:00<00:28,  6.23it/s][A
Training:   5%|▌         | 9/180 [00:01<00:20,  8.33it/s][A
Training:   7%|▋         | 13/180 [00:01<00:17,  9.57it/s][A
Training:   9%|▉         | 17/180 [00:01<00:15, 10.46it/s][A
Training:  12%|█▏        | 21/180 [00:02<00:14, 11.06it/s][A
Training:  14%|█▍        | 25/180 [00:02<00:14, 10.97it/s][A
Training:  16%|█▌        | 29/180 [00:03<00:14, 10.63it/s][A
Training:  18%|█▊        | 33/180 [00:03<00:13, 10.83it/s][A
Training:  21%|██        | 37/180 [00:03<00:12, 11.36it/s][A
Training:  23%|██▎       | 41/180 [00:04<00:11, 11.75it/s][A
Training:  25%|██▌       | 45/180 [00:04<00:11, 11.92it/s][A
Training:  27%|██▋       | 49/180 [00:04<00:10, 12.29it/s][A
Training:  29%|██▉       | 53/180 [00:04<00:10, 12.38it/s][A
Training:  32%|███▏      | 57/180 [00:05<00:10, 12.01it/s][A
Training:  34%|███▍

Epoch: 42/55 - Loss: 0.0770 - Accuracy: 0.9707



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:11,  1.97it/s][A
 22%|██▏       | 5/23 [00:00<00:02,  7.29it/s][A
 39%|███▉      | 9/23 [00:01<00:01,  9.54it/s][A
 57%|█████▋    | 13/23 [00:01<00:00, 10.97it/s][A
 70%|██████▉   | 16/23 [00:01<00:00, 13.31it/s][A
 78%|███████▊  | 18/23 [00:01<00:00, 11.67it/s][A
 87%|████████▋ | 20/23 [00:01<00:00, 12.40it/s][A
100%|██████████| 23/23 [00:02<00:00, 10.68it/s][A
Epochs:  76%|███████▋  | 42/55 [12:18<03:47, 17.53s/it]

Val Loss: 0.1285 - Val Accuracy: 0.9609



Training:   0%|          | 0/180 [00:00<?, ?it/s][A
Training:   1%|          | 1/180 [00:00<01:40,  1.78it/s][A
Training:   3%|▎         | 5/180 [00:00<00:27,  6.34it/s][A
Training:   5%|▌         | 9/180 [00:01<00:20,  8.39it/s][A
Training:   7%|▋         | 13/180 [00:01<00:16,  9.98it/s][A
Training:   9%|▉         | 17/180 [00:01<00:15, 10.69it/s][A
Training:  11%|█         | 19/180 [00:01<00:13, 11.88it/s][A
Training:  12%|█▏        | 21/180 [00:02<00:14, 10.61it/s][A
Training:  14%|█▍        | 25/180 [00:02<00:13, 11.13it/s][A
Training:  16%|█▌        | 29/180 [00:02<00:13, 11.20it/s][A
Training:  18%|█▊        | 33/180 [00:03<00:13, 10.55it/s][A
Training:  21%|██        | 37/180 [00:03<00:12, 11.11it/s][A
Training:  23%|██▎       | 41/180 [00:03<00:12, 11.54it/s][A
Training:  25%|██▌       | 45/180 [00:04<00:11, 11.46it/s][A
Training:  27%|██▋       | 49/180 [00:04<00:11, 11.54it/s][A
Training:  29%|██▉       | 53/180 [00:05<00:10, 11.86it/s][A
Training:  32%|███▏

Epoch: 43/55 - Loss: 0.0732 - Accuracy: 0.9719



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:13,  1.61it/s][A
 22%|██▏       | 5/23 [00:00<00:02,  6.46it/s][A
 39%|███▉      | 9/23 [00:01<00:01,  9.19it/s][A
 57%|█████▋    | 13/23 [00:01<00:00, 10.16it/s][A
 74%|███████▍  | 17/23 [00:01<00:00, 11.45it/s][A
100%|██████████| 23/23 [00:02<00:00, 10.64it/s][A
Epochs:  78%|███████▊  | 43/55 [12:35<03:29, 17.49s/it]

Val Loss: 0.1227 - Val Accuracy: 0.9597



Training:   0%|          | 0/180 [00:00<?, ?it/s][A
Training:   1%|          | 1/180 [00:00<01:33,  1.90it/s][A
Training:   2%|▏         | 3/180 [00:00<00:31,  5.68it/s][A
Training:   3%|▎         | 5/180 [00:00<00:23,  7.58it/s][A
Training:   4%|▍         | 7/180 [00:00<00:17,  9.74it/s][A
Training:   5%|▌         | 9/180 [00:01<00:18,  9.42it/s][A
Training:   6%|▌         | 11/180 [00:01<00:15, 11.13it/s][A
Training:   7%|▋         | 13/180 [00:01<00:16, 10.00it/s][A
Training:   9%|▉         | 16/180 [00:01<00:12, 13.34it/s][A
Training:  10%|█         | 18/180 [00:01<00:14, 10.83it/s][A
Training:  12%|█▏        | 21/180 [00:02<00:15, 10.30it/s][A
Training:  14%|█▍        | 25/180 [00:02<00:13, 11.36it/s][A
Training:  16%|█▌        | 29/180 [00:02<00:12, 11.85it/s][A
Training:  18%|█▊        | 32/180 [00:02<00:10, 14.32it/s][A
Training:  19%|█▉        | 34/180 [00:03<00:13, 11.12it/s][A
Training:  21%|██        | 37/180 [00:03<00:12, 11.15it/s][A
Training:  22%|██▏   

Epoch: 44/55 - Loss: 0.0745 - Accuracy: 0.9716



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:10,  2.01it/s][A
 17%|█▋        | 4/23 [00:00<00:02,  7.25it/s][A
 26%|██▌       | 6/23 [00:00<00:02,  8.14it/s][A
 39%|███▉      | 9/23 [00:01<00:01,  9.00it/s][A
 52%|█████▏    | 12/23 [00:01<00:00, 12.48it/s][A
 61%|██████    | 14/23 [00:01<00:00, 10.99it/s][A
 74%|███████▍  | 17/23 [00:01<00:00, 10.83it/s][A
100%|██████████| 23/23 [00:02<00:00, 10.87it/s][A
Epochs:  80%|████████  | 44/55 [12:53<03:11, 17.45s/it]

Val Loss: 0.1315 - Val Accuracy: 0.9641



Training:   0%|          | 0/180 [00:00<?, ?it/s][A
Training:   1%|          | 1/180 [00:00<01:43,  1.73it/s][A
Training:   3%|▎         | 5/180 [00:00<00:25,  6.74it/s][A
Training:   5%|▌         | 9/180 [00:01<00:19,  8.78it/s][A
Training:   7%|▋         | 13/180 [00:01<00:17,  9.42it/s][A
Training:   9%|▉         | 17/180 [00:01<00:16, 10.14it/s][A
Training:  12%|█▏        | 21/180 [00:02<00:14, 10.86it/s][A
Training:  14%|█▍        | 25/180 [00:02<00:14, 10.59it/s][A
Training:  16%|█▌        | 29/180 [00:02<00:13, 11.23it/s][A
Training:  18%|█▊        | 33/180 [00:03<00:12, 11.44it/s][A
Training:  21%|██        | 37/180 [00:03<00:12, 11.55it/s][A
Training:  22%|██▏       | 40/180 [00:03<00:10, 13.46it/s][A
Training:  23%|██▎       | 42/180 [00:04<00:12, 11.43it/s][A
Training:  25%|██▌       | 45/180 [00:04<00:12, 10.98it/s][A
Training:  27%|██▋       | 49/180 [00:04<00:11, 11.32it/s][A
Training:  29%|██▉       | 53/180 [00:05<00:11, 11.31it/s][A
Training:  32%|███▏

Epoch: 45/55 - Loss: 0.0693 - Accuracy: 0.9739



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:10,  2.15it/s][A
 17%|█▋        | 4/23 [00:00<00:02,  8.63it/s][A
 26%|██▌       | 6/23 [00:00<00:02,  7.89it/s][A
 39%|███▉      | 9/23 [00:01<00:01,  9.17it/s][A
 57%|█████▋    | 13/23 [00:01<00:00, 10.67it/s][A
 74%|███████▍  | 17/23 [00:01<00:00, 11.63it/s][A
 83%|████████▎ | 19/23 [00:01<00:00, 12.26it/s][A
100%|██████████| 23/23 [00:02<00:00, 10.59it/s][A
Epochs:  82%|████████▏ | 45/55 [13:10<02:54, 17.47s/it]

Val Loss: 0.1309 - Val Accuracy: 0.9570



Training:   0%|          | 0/180 [00:00<?, ?it/s][A
Training:   1%|          | 1/180 [00:00<01:26,  2.07it/s][A
Training:   2%|▏         | 3/180 [00:00<00:29,  5.94it/s][A
Training:   3%|▎         | 5/180 [00:00<00:24,  7.15it/s][A
Training:   4%|▍         | 8/180 [00:00<00:15, 10.99it/s][A
Training:   6%|▌         | 10/180 [00:01<00:16, 10.48it/s][A
Training:   7%|▋         | 12/180 [00:01<00:14, 11.38it/s][A
Training:   8%|▊         | 14/180 [00:01<00:16, 10.13it/s][A
Training:   9%|▉         | 17/180 [00:01<00:17,  9.25it/s][A
Training:  12%|█▏        | 21/180 [00:02<00:15, 10.36it/s][A
Training:  14%|█▍        | 25/180 [00:02<00:13, 11.71it/s][A
Training:  16%|█▌        | 28/180 [00:02<00:10, 14.16it/s][A
Training:  17%|█▋        | 30/180 [00:02<00:12, 11.76it/s][A
Training:  18%|█▊        | 33/180 [00:03<00:13, 10.97it/s][A
Training:  19%|█▉        | 35/180 [00:03<00:11, 12.25it/s][A
Training:  21%|██        | 37/180 [00:03<00:12, 11.10it/s][A
Training:  22%|██▏  

Epoch: 46/55 - Loss: 0.0736 - Accuracy: 0.9741



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:13,  1.68it/s][A
 22%|██▏       | 5/23 [00:00<00:02,  6.67it/s][A
 39%|███▉      | 9/23 [00:01<00:01,  9.15it/s][A
 52%|█████▏    | 12/23 [00:01<00:00, 11.90it/s][A
 61%|██████    | 14/23 [00:01<00:00, 10.21it/s][A
 74%|███████▍  | 17/23 [00:01<00:00, 10.38it/s][A
 87%|████████▋ | 20/23 [00:01<00:00, 13.23it/s][A
100%|██████████| 23/23 [00:02<00:00, 10.45it/s][A
Epochs:  84%|████████▎ | 46/55 [13:28<02:37, 17.48s/it]

Val Loss: 0.1163 - Val Accuracy: 0.9652



Training:   0%|          | 0/180 [00:00<?, ?it/s][A
Training:   1%|          | 1/180 [00:00<01:36,  1.85it/s][A
Training:   2%|▏         | 4/180 [00:00<00:23,  7.48it/s][A
Training:   3%|▎         | 6/180 [00:00<00:22,  7.83it/s][A
Training:   5%|▌         | 9/180 [00:01<00:20,  8.30it/s][A
Training:   7%|▋         | 13/180 [00:01<00:18,  8.91it/s][A
Training:   9%|▉         | 17/180 [00:02<00:17,  9.28it/s][A
Training:  12%|█▏        | 21/180 [00:02<00:15, 10.39it/s][A
Training:  14%|█▍        | 25/180 [00:02<00:14, 10.62it/s][A
Training:  16%|█▌        | 29/180 [00:03<00:14, 10.72it/s][A
Training:  18%|█▊        | 33/180 [00:03<00:13, 11.09it/s][A
Training:  21%|██        | 37/180 [00:03<00:12, 11.60it/s][A
Training:  23%|██▎       | 41/180 [00:04<00:12, 11.57it/s][A
Training:  24%|██▍       | 44/180 [00:04<00:10, 13.55it/s][A
Training:  26%|██▌       | 46/180 [00:04<00:11, 11.90it/s][A
Training:  27%|██▋       | 49/180 [00:04<00:11, 11.56it/s][A
Training:  29%|██▉  

Epoch: 47/55 - Loss: 0.0750 - Accuracy: 0.9726



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:11,  1.93it/s][A
 22%|██▏       | 5/23 [00:00<00:02,  6.75it/s][A
 39%|███▉      | 9/23 [00:01<00:01,  8.95it/s][A
 57%|█████▋    | 13/23 [00:01<00:00, 10.07it/s][A
 74%|███████▍  | 17/23 [00:01<00:00, 11.29it/s][A
100%|██████████| 23/23 [00:02<00:00, 10.63it/s][A
Epochs:  85%|████████▌ | 47/55 [13:45<02:19, 17.50s/it]

Val Loss: 0.1176 - Val Accuracy: 0.9652



Training:   0%|          | 0/180 [00:00<?, ?it/s][A
Training:   1%|          | 1/180 [00:00<01:42,  1.75it/s][A
Training:   3%|▎         | 5/180 [00:00<00:26,  6.73it/s][A
Training:   5%|▌         | 9/180 [00:01<00:19,  8.59it/s][A
Training:   7%|▋         | 13/180 [00:01<00:17,  9.75it/s][A
Training:   9%|▉         | 17/180 [00:01<00:15, 10.58it/s][A
Training:  12%|█▏        | 21/180 [00:02<00:15, 10.52it/s][A
Training:  14%|█▍        | 25/180 [00:02<00:14, 11.07it/s][A
Training:  16%|█▌        | 29/180 [00:02<00:14, 10.76it/s][A
Training:  18%|█▊        | 33/180 [00:03<00:13, 11.21it/s][A
Training:  21%|██        | 37/180 [00:03<00:12, 11.49it/s][A
Training:  23%|██▎       | 41/180 [00:03<00:11, 11.76it/s][A
Training:  25%|██▌       | 45/180 [00:04<00:11, 11.54it/s][A
Training:  27%|██▋       | 49/180 [00:04<00:11, 11.30it/s][A
Training:  29%|██▉       | 53/180 [00:05<00:10, 11.59it/s][A
Training:  32%|███▏      | 57/180 [00:05<00:10, 11.73it/s][A
Training:  34%|███▍

Epoch: 48/55 - Loss: 0.0728 - Accuracy: 0.9730



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:12,  1.80it/s][A
 22%|██▏       | 5/23 [00:00<00:02,  6.74it/s][A
 39%|███▉      | 9/23 [00:01<00:01,  8.88it/s][A
 57%|█████▋    | 13/23 [00:01<00:01,  9.83it/s][A
 74%|███████▍  | 17/23 [00:01<00:00, 11.04it/s][A
100%|██████████| 23/23 [00:02<00:00, 10.38it/s][A
Epochs:  87%|████████▋ | 48/55 [14:03<02:02, 17.56s/it]

Val Loss: 0.1405 - Val Accuracy: 0.9608



Training:   0%|          | 0/180 [00:00<?, ?it/s][A
Training:   1%|          | 1/180 [00:00<01:32,  1.93it/s][A
Training:   3%|▎         | 5/180 [00:00<00:25,  6.83it/s][A
Training:   5%|▌         | 9/180 [00:01<00:18,  9.01it/s][A
Training:   7%|▋         | 13/180 [00:01<00:16,  9.96it/s][A
Training:   9%|▉         | 17/180 [00:01<00:16, 10.06it/s][A
Training:  12%|█▏        | 21/180 [00:02<00:15, 10.51it/s][A
Training:  14%|█▍        | 25/180 [00:02<00:14, 10.91it/s][A
Training:  16%|█▌        | 28/180 [00:02<00:11, 13.05it/s][A
Training:  17%|█▋        | 30/180 [00:02<00:12, 11.69it/s][A
Training:  18%|█▊        | 33/180 [00:03<00:13, 10.83it/s][A
Training:  21%|██        | 37/180 [00:03<00:13, 10.86it/s][A
Training:  23%|██▎       | 41/180 [00:03<00:12, 11.43it/s][A
Training:  24%|██▍       | 43/180 [00:04<00:11, 12.22it/s][A
Training:  25%|██▌       | 45/180 [00:04<00:12, 11.06it/s][A
Training:  27%|██▋       | 49/180 [00:04<00:11, 11.87it/s][A
Training:  28%|██▊ 

Epoch: 49/55 - Loss: 0.0746 - Accuracy: 0.9722



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:13,  1.64it/s][A
 22%|██▏       | 5/23 [00:00<00:02,  6.45it/s][A
 39%|███▉      | 9/23 [00:01<00:01,  9.05it/s][A
 57%|█████▋    | 13/23 [00:01<00:00, 10.28it/s][A
 74%|███████▍  | 17/23 [00:01<00:00, 10.80it/s][A
100%|██████████| 23/23 [00:02<00:00, 10.49it/s][A
Epochs:  89%|████████▉ | 49/55 [14:21<01:45, 17.60s/it]

Val Loss: 0.1432 - Val Accuracy: 0.9591



Training:   0%|          | 0/180 [00:00<?, ?it/s][A
Training:   1%|          | 1/180 [00:00<01:28,  2.02it/s][A
Training:   2%|▏         | 4/180 [00:00<00:21,  8.22it/s][A
Training:   3%|▎         | 6/180 [00:00<00:21,  8.04it/s][A
Training:   5%|▌         | 9/180 [00:01<00:19,  8.76it/s][A
Training:   7%|▋         | 13/180 [00:01<00:17,  9.82it/s][A
Training:   9%|▉         | 17/180 [00:01<00:15, 10.21it/s][A
Training:  12%|█▏        | 21/180 [00:02<00:14, 10.67it/s][A
Training:  14%|█▍        | 25/180 [00:02<00:13, 11.38it/s][A
Training:  16%|█▌        | 29/180 [00:02<00:13, 11.42it/s][A
Training:  18%|█▊        | 32/180 [00:02<00:10, 13.58it/s][A
Training:  19%|█▉        | 34/180 [00:03<00:12, 11.83it/s][A
Training:  21%|██        | 37/180 [00:03<00:12, 11.14it/s][A
Training:  23%|██▎       | 41/180 [00:03<00:11, 11.66it/s][A
Training:  24%|██▍       | 44/180 [00:03<00:09, 13.92it/s][A
Training:  26%|██▌       | 46/180 [00:04<00:11, 11.56it/s][A
Training:  27%|██▋  

Epoch: 50/55 - Loss: 0.0694 - Accuracy: 0.9741



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:10,  2.06it/s][A
 22%|██▏       | 5/23 [00:00<00:02,  6.88it/s][A
 39%|███▉      | 9/23 [00:01<00:01,  8.77it/s][A
 57%|█████▋    | 13/23 [00:01<00:01,  9.96it/s][A
 74%|███████▍  | 17/23 [00:01<00:00, 10.86it/s][A
100%|██████████| 23/23 [00:02<00:00, 10.61it/s][A
Epochs:  91%|█████████ | 50/55 [14:38<01:27, 17.57s/it]

Val Loss: 0.1140 - Val Accuracy: 0.9608



Training:   0%|          | 0/180 [00:00<?, ?it/s][A
Training:   1%|          | 1/180 [00:00<01:32,  1.94it/s][A
Training:   3%|▎         | 5/180 [00:00<00:24,  7.27it/s][A
Training:   4%|▍         | 8/180 [00:00<00:15, 11.22it/s][A
Training:   6%|▌         | 10/180 [00:01<00:18,  9.31it/s][A
Training:   7%|▋         | 13/180 [00:01<00:17,  9.73it/s][A
Training:   9%|▉         | 17/180 [00:01<00:15, 10.71it/s][A
Training:  12%|█▏        | 21/180 [00:02<00:15, 10.37it/s][A
Training:  14%|█▍        | 25/180 [00:02<00:14, 10.83it/s][A
Training:  16%|█▌        | 29/180 [00:02<00:13, 11.31it/s][A
Training:  17%|█▋        | 31/180 [00:02<00:12, 12.29it/s][A
Training:  18%|█▊        | 33/180 [00:03<00:12, 11.34it/s][A
Training:  20%|██        | 36/180 [00:03<00:10, 13.99it/s][A
Training:  21%|██        | 38/180 [00:03<00:13, 10.68it/s][A
Training:  23%|██▎       | 41/180 [00:03<00:12, 11.06it/s][A
Training:  25%|██▌       | 45/180 [00:04<00:12, 11.03it/s][A
Training:  26%|██▌ 

Epoch: 51/55 - Loss: 0.0739 - Accuracy: 0.9723



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:10,  2.09it/s][A
 22%|██▏       | 5/23 [00:00<00:02,  8.07it/s][A
 35%|███▍      | 8/23 [00:00<00:01, 10.98it/s][A
 43%|████▎     | 10/23 [00:01<00:01, 10.56it/s][A
 52%|█████▏    | 12/23 [00:01<00:00, 11.63it/s][A
 61%|██████    | 14/23 [00:01<00:00, 11.02it/s][A
 70%|██████▉   | 16/23 [00:01<00:00, 11.56it/s][A
 78%|███████▊  | 18/23 [00:01<00:00, 10.94it/s][A
100%|██████████| 23/23 [00:02<00:00, 10.72it/s][A
Epochs:  93%|█████████▎| 51/55 [14:56<01:10, 17.58s/it]

Val Loss: 0.1205 - Val Accuracy: 0.9613



Training:   0%|          | 0/180 [00:00<?, ?it/s][A
Training:   1%|          | 1/180 [00:00<01:30,  1.97it/s][A
Training:   3%|▎         | 5/180 [00:00<00:21,  8.12it/s][A
Training:   5%|▌         | 9/180 [00:01<00:17, 10.05it/s][A
Training:   6%|▌         | 11/180 [00:01<00:14, 11.35it/s][A
Training:   7%|▋         | 13/180 [00:01<00:15, 10.67it/s][A
Training:   8%|▊         | 15/180 [00:01<00:14, 11.53it/s][A
Training:   9%|▉         | 17/180 [00:01<00:15, 10.62it/s][A
Training:  11%|█         | 19/180 [00:01<00:13, 12.29it/s][A
Training:  12%|█▏        | 21/180 [00:02<00:14, 10.86it/s][A
Training:  13%|█▎        | 23/180 [00:02<00:13, 11.63it/s][A
Training:  14%|█▍        | 25/180 [00:02<00:13, 11.09it/s][A
Training:  15%|█▌        | 27/180 [00:02<00:12, 11.96it/s][A
Training:  16%|█▌        | 29/180 [00:02<00:13, 10.87it/s][A
Training:  17%|█▋        | 31/180 [00:02<00:12, 12.07it/s][A
Training:  18%|█▊        | 33/180 [00:03<00:13, 11.05it/s][A
Training:  20%|██  

Epoch: 52/55 - Loss: 0.0696 - Accuracy: 0.9738



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:10,  2.11it/s][A
 22%|██▏       | 5/23 [00:00<00:02,  8.06it/s][A
 39%|███▉      | 9/23 [00:01<00:01, 10.59it/s][A
 48%|████▊     | 11/23 [00:01<00:00, 12.03it/s][A
 57%|█████▋    | 13/23 [00:01<00:00, 11.05it/s][A
 65%|██████▌   | 15/23 [00:01<00:00, 12.27it/s][A
 74%|███████▍  | 17/23 [00:01<00:00, 10.83it/s][A
100%|██████████| 23/23 [00:02<00:00, 10.86it/s][A
Epochs:  95%|█████████▍| 52/55 [15:13<00:52, 17.57s/it]

Val Loss: 0.1191 - Val Accuracy: 0.9608



Training:   0%|          | 0/180 [00:00<?, ?it/s][A
Training:   1%|          | 1/180 [00:00<01:30,  1.97it/s][A
Training:   3%|▎         | 5/180 [00:00<00:23,  7.33it/s][A
Training:   5%|▌         | 9/180 [00:01<00:17,  9.96it/s][A
Training:   7%|▋         | 13/180 [00:01<00:15, 10.87it/s][A
Training:   9%|▉         | 17/180 [00:01<00:15, 10.53it/s][A
Training:  12%|█▏        | 21/180 [00:02<00:13, 11.68it/s][A
Training:  14%|█▍        | 25/180 [00:02<00:13, 11.22it/s][A
Training:  16%|█▌        | 29/180 [00:02<00:13, 11.41it/s][A
Training:  18%|█▊        | 33/180 [00:03<00:12, 11.69it/s][A
Training:  21%|██        | 37/180 [00:03<00:12, 11.69it/s][A
Training:  23%|██▎       | 41/180 [00:03<00:11, 11.60it/s][A
Training:  25%|██▌       | 45/180 [00:04<00:11, 11.76it/s][A
Training:  27%|██▋       | 49/180 [00:04<00:11, 11.49it/s][A
Training:  29%|██▉       | 53/180 [00:04<00:10, 11.71it/s][A
Training:  32%|███▏      | 57/180 [00:05<00:10, 11.45it/s][A
Training:  34%|███▍

Epoch: 53/55 - Loss: 0.0697 - Accuracy: 0.9744



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:10,  2.17it/s][A
 22%|██▏       | 5/23 [00:00<00:02,  8.48it/s][A
 39%|███▉      | 9/23 [00:00<00:01, 11.12it/s][A
 48%|████▊     | 11/23 [00:01<00:00, 12.14it/s][A
 57%|█████▋    | 13/23 [00:01<00:00, 12.39it/s][A
 65%|██████▌   | 15/23 [00:01<00:00, 12.07it/s][A
 74%|███████▍  | 17/23 [00:01<00:00, 12.25it/s][A
 83%|████████▎ | 19/23 [00:01<00:00, 11.84it/s][A
100%|██████████| 23/23 [00:02<00:00, 11.07it/s][A
Epochs:  96%|█████████▋| 53/55 [15:31<00:35, 17.57s/it]

Val Loss: 0.1253 - Val Accuracy: 0.9563



Training:   0%|          | 0/180 [00:00<?, ?it/s][A
Training:   1%|          | 1/180 [00:00<01:34,  1.89it/s][A
Training:   3%|▎         | 5/180 [00:00<00:25,  6.97it/s][A
Training:   5%|▌         | 9/180 [00:01<00:18,  9.48it/s][A
Training:   7%|▋         | 13/180 [00:01<00:15, 10.82it/s][A
Training:   9%|▉         | 17/180 [00:01<00:14, 11.58it/s][A
Training:  11%|█         | 19/180 [00:01<00:13, 12.38it/s][A
Training:  12%|█▏        | 21/180 [00:02<00:13, 11.64it/s][A
Training:  13%|█▎        | 23/180 [00:02<00:13, 11.57it/s][A
Training:  14%|█▍        | 25/180 [00:02<00:13, 11.32it/s][A
Training:  15%|█▌        | 27/180 [00:02<00:13, 11.49it/s][A
Training:  16%|█▌        | 29/180 [00:02<00:12, 11.73it/s][A
Training:  17%|█▋        | 31/180 [00:02<00:12, 11.60it/s][A
Training:  18%|█▊        | 33/180 [00:03<00:12, 11.66it/s][A
Training:  19%|█▉        | 35/180 [00:03<00:12, 11.40it/s][A
Training:  21%|██        | 37/180 [00:03<00:12, 11.82it/s][A
Training:  22%|██▏ 

Epoch: 54/55 - Loss: 0.0767 - Accuracy: 0.9715



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:10,  2.02it/s][A
 22%|██▏       | 5/23 [00:00<00:02,  7.93it/s][A
 39%|███▉      | 9/23 [00:00<00:01, 10.98it/s][A
 57%|█████▋    | 13/23 [00:01<00:00, 12.18it/s][A
 74%|███████▍  | 17/23 [00:01<00:00, 12.39it/s][A
100%|██████████| 23/23 [00:01<00:00, 11.73it/s][A
Epochs:  98%|█████████▊| 54/55 [15:49<00:17, 17.58s/it]

Val Loss: 0.1237 - Val Accuracy: 0.9563



Training:   0%|          | 0/180 [00:00<?, ?it/s][A
Training:   1%|          | 1/180 [00:00<01:35,  1.87it/s][A
Training:   3%|▎         | 5/180 [00:00<00:25,  6.93it/s][A
Training:   5%|▌         | 9/180 [00:01<00:17,  9.50it/s][A
Training:   7%|▋         | 13/180 [00:01<00:15, 10.92it/s][A
Training:   9%|▉         | 17/180 [00:01<00:14, 11.12it/s][A
Training:  12%|█▏        | 21/180 [00:02<00:14, 11.01it/s][A
Training:  14%|█▍        | 25/180 [00:02<00:14, 11.01it/s][A
Training:  16%|█▌        | 29/180 [00:02<00:13, 11.07it/s][A
Training:  18%|█▊        | 33/180 [00:03<00:12, 11.62it/s][A
Training:  21%|██        | 37/180 [00:03<00:12, 11.64it/s][A
Training:  23%|██▎       | 41/180 [00:03<00:11, 11.98it/s][A
Training:  25%|██▌       | 45/180 [00:04<00:11, 12.21it/s][A
Training:  27%|██▋       | 49/180 [00:04<00:10, 12.14it/s][A
Training:  29%|██▉       | 53/180 [00:04<00:10, 11.98it/s][A
Training:  32%|███▏      | 57/180 [00:05<00:10, 11.80it/s][A
Training:  34%|███▍

Epoch: 55/55 - Loss: 0.0709 - Accuracy: 0.9729



  0%|          | 0/23 [00:00<?, ?it/s][A
  4%|▍         | 1/23 [00:00<00:11,  1.88it/s][A
 22%|██▏       | 5/23 [00:00<00:02,  6.50it/s][A
 39%|███▉      | 9/23 [00:01<00:01,  8.91it/s][A
 57%|█████▋    | 13/23 [00:01<00:00, 10.72it/s][A
 74%|███████▍  | 17/23 [00:01<00:00, 11.63it/s][A
100%|██████████| 23/23 [00:02<00:00, 10.98it/s][A
Epochs: 100%|██████████| 55/55 [16:06<00:00, 17.57s/it]
[32m[I 2023-12-11 23:37:54,142][0m Trial 1 finished with value: 0.9624417424201965 and parameters: {'learning_rate': 0.0008919924301837155, 'weight_decay': 0.00010220890304481278, 'epsilon': 2.3380831337579294e-09, 'batch_size': 78, 'epochs': 55}. Best is trial 1 with value: 0.9624417424201965.[0m


Val Loss: 0.1337 - Val Accuracy: 0.9624
Saving best model...
Learning rate: 0.00010173550281282758
Weight decay: 0.008588437544705844
Epsilon: 3.762780786582391e-09
Batch size: 249
Number of epochs: 40


Epochs:   0%|          | 0/40 [00:00<?, ?it/s]
Training:   0%|          | 0/57 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/57 [00:01<01:11,  1.27s/it][A
Training:   7%|▋         | 4/57 [00:01<00:14,  3.64it/s][A
Training:  11%|█         | 6/57 [00:02<00:18,  2.70it/s][A
Training:  16%|█▌        | 9/57 [00:03<00:16,  2.87it/s][A
Training:  19%|█▉        | 11/57 [00:03<00:12,  3.81it/s][A
Training:  23%|██▎       | 13/57 [00:04<00:14,  3.09it/s][A
Training:  28%|██▊       | 16/57 [00:04<00:08,  4.79it/s][A
Training:  32%|███▏      | 18/57 [00:05<00:11,  3.53it/s][A
Training:  37%|███▋      | 21/57 [00:06<00:11,  3.19it/s][A
Training:  42%|████▏     | 24/57 [00:06<00:07,  4.56it/s][A
Training:  46%|████▌     | 26/57 [00:07<00:08,  3.52it/s][A
Training:  49%|████▉     | 28/57 [00:07<00:06,  4.43it/s][A
Training:  53%|█████▎    | 30/57 [00:08<00:07,  3.43it/s][A
Training:  56%|█████▌    | 32/57 [00:08<00:05,  4.29it/s][A
Training:  58%|█████▊    | 33/57 [00:09<00:07,  3.0

Epoch: 1/40 - Loss: 0.3315 - Accuracy: 0.8800



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:08,  1.24s/it][A
100%|██████████| 8/8 [00:02<00:00,  3.73it/s][A
Epochs:   2%|▎         | 1/40 [00:17<11:26, 17.61s/it]

Val Loss: 0.1609 - Val Accuracy: 0.9533



Training:   0%|          | 0/57 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/57 [00:01<01:10,  1.25s/it][A
Training:   9%|▉         | 5/57 [00:02<00:21,  2.41it/s][A
Training:  14%|█▍        | 8/57 [00:02<00:11,  4.18it/s][A
Training:  18%|█▊        | 10/57 [00:03<00:14,  3.22it/s][A
Training:  23%|██▎       | 13/57 [00:04<00:14,  3.00it/s][A
Training:  30%|██▉       | 17/57 [00:05<00:12,  3.31it/s][A
Training:  37%|███▋      | 21/57 [00:06<00:10,  3.46it/s][A
Training:  40%|████      | 23/57 [00:06<00:08,  4.19it/s][A
Training:  44%|████▍     | 25/57 [00:07<00:09,  3.35it/s][A
Training:  51%|█████     | 29/57 [00:08<00:08,  3.47it/s][A
Training:  58%|█████▊    | 33/57 [00:09<00:06,  3.54it/s][A
Training:  61%|██████▏   | 35/57 [00:10<00:05,  4.21it/s][A
Training:  65%|██████▍   | 37/57 [00:11<00:05,  3.34it/s][A
Training:  68%|██████▊   | 39/57 [00:11<00:04,  4.17it/s][A
Training:  72%|███████▏  | 41/57 [00:12<00:04,  3.26it/s][A
Training:  75%|███████▌  | 43/57 [0

Epoch: 2/40 - Loss: 0.1552 - Accuracy: 0.9503



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:09,  1.37s/it][A
 50%|█████     | 4/8 [00:01<00:01,  3.50it/s][A
100%|██████████| 8/8 [00:02<00:00,  3.53it/s][A
Epochs:   5%|▌         | 2/40 [00:35<11:09, 17.61s/it]

Val Loss: 0.1176 - Val Accuracy: 0.9654



Training:   0%|          | 0/57 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/57 [00:01<01:02,  1.12s/it][A
Training:   9%|▉         | 5/57 [00:02<00:20,  2.54it/s][A
Training:  12%|█▏        | 7/57 [00:02<00:13,  3.78it/s][A
Training:  16%|█▌        | 9/57 [00:03<00:16,  2.90it/s][A
Training:  23%|██▎       | 13/57 [00:04<00:13,  3.28it/s][A
Training:  28%|██▊       | 16/57 [00:04<00:08,  4.72it/s][A
Training:  32%|███▏      | 18/57 [00:05<00:10,  3.57it/s][A
Training:  35%|███▌      | 20/57 [00:05<00:08,  4.44it/s][A
Training:  39%|███▊      | 22/57 [00:06<00:09,  3.55it/s][A
Training:  40%|████      | 23/57 [00:06<00:08,  3.96it/s][A
Training:  44%|████▍     | 25/57 [00:07<00:10,  3.11it/s][A
Training:  47%|████▋     | 27/57 [00:07<00:07,  3.92it/s][A
Training:  51%|█████     | 29/57 [00:08<00:08,  3.22it/s][A
Training:  54%|█████▍    | 31/57 [00:08<00:06,  4.01it/s][A
Training:  58%|█████▊    | 33/57 [00:09<00:07,  3.22it/s][A
Training:  61%|██████▏   | 35/57 [00

Epoch: 3/40 - Loss: 0.1276 - Accuracy: 0.9545



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:09,  1.32s/it][A
100%|██████████| 8/8 [00:02<00:00,  3.46it/s][A
Epochs:   8%|▊         | 3/40 [00:52<10:54, 17.68s/it]

Val Loss: 0.1038 - Val Accuracy: 0.9669



Training:   0%|          | 0/57 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/57 [00:01<01:04,  1.15s/it][A
Training:   9%|▉         | 5/57 [00:02<00:21,  2.46it/s][A
Training:  12%|█▏        | 7/57 [00:02<00:13,  3.67it/s][A
Training:  16%|█▌        | 9/57 [00:03<00:17,  2.82it/s][A
Training:  23%|██▎       | 13/57 [00:04<00:13,  3.22it/s][A
Training:  28%|██▊       | 16/57 [00:04<00:08,  4.66it/s][A
Training:  32%|███▏      | 18/57 [00:05<00:11,  3.49it/s][A
Training:  35%|███▌      | 20/57 [00:05<00:08,  4.43it/s][A
Training:  39%|███▊      | 22/57 [00:06<00:10,  3.39it/s][A
Training:  44%|████▍     | 25/57 [00:07<00:10,  3.18it/s][A
Training:  51%|█████     | 29/57 [00:08<00:08,  3.26it/s][A
Training:  58%|█████▊    | 33/57 [00:09<00:07,  3.42it/s][A
Training:  63%|██████▎   | 36/57 [00:10<00:04,  4.49it/s][A
Training:  67%|██████▋   | 38/57 [00:11<00:05,  3.56it/s][A
Training:  72%|███████▏  | 41/57 [00:12<00:04,  3.28it/s][A
Training:  79%|███████▉  | 45/57 [00

Epoch: 4/40 - Loss: 0.1141 - Accuracy: 0.9601



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:08,  1.23s/it][A
 50%|█████     | 4/8 [00:01<00:01,  3.72it/s][A
100%|██████████| 8/8 [00:02<00:00,  3.52it/s][A
Epochs:  10%|█         | 4/40 [01:10<10:38, 17.73s/it]

Val Loss: 0.0975 - Val Accuracy: 0.9639



Training:   0%|          | 0/57 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/57 [00:01<01:02,  1.12s/it][A
Training:   9%|▉         | 5/57 [00:02<00:21,  2.47it/s][A
Training:  14%|█▍        | 8/57 [00:02<00:11,  4.31it/s][A
Training:  18%|█▊        | 10/57 [00:03<00:14,  3.25it/s][A
Training:  23%|██▎       | 13/57 [00:04<00:14,  3.04it/s][A
Training:  30%|██▉       | 17/57 [00:05<00:12,  3.23it/s][A
Training:  37%|███▋      | 21/57 [00:06<00:10,  3.34it/s][A
Training:  44%|████▍     | 25/57 [00:07<00:09,  3.43it/s][A
Training:  51%|█████     | 29/57 [00:08<00:07,  3.57it/s][A
Training:  58%|█████▊    | 33/57 [00:09<00:06,  3.68it/s][A
Training:  65%|██████▍   | 37/57 [00:10<00:05,  3.64it/s][A
Training:  72%|███████▏  | 41/57 [00:12<00:04,  3.67it/s][A
Training:  79%|███████▉  | 45/57 [00:13<00:03,  3.67it/s][A
Training:  84%|████████▍ | 48/57 [00:13<00:01,  4.63it/s][A
Training:  86%|████████▌ | 49/57 [00:14<00:02,  3.48it/s][A
Training:  93%|█████████▎| 53/57 [0

Epoch: 5/40 - Loss: 0.1041 - Accuracy: 0.9619



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:08,  1.28s/it][A
100%|██████████| 8/8 [00:02<00:00,  3.37it/s][A
Epochs:  12%|█▎        | 5/40 [01:28<10:20, 17.73s/it]

Val Loss: 0.0938 - Val Accuracy: 0.9699



Training:   0%|          | 0/57 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/57 [00:01<01:09,  1.24s/it][A
Training:   9%|▉         | 5/57 [00:02<00:20,  2.58it/s][A
Training:  14%|█▍        | 8/57 [00:02<00:10,  4.55it/s][A
Training:  18%|█▊        | 10/57 [00:03<00:14,  3.16it/s][A
Training:  23%|██▎       | 13/57 [00:04<00:14,  3.01it/s][A
Training:  26%|██▋       | 15/57 [00:04<00:10,  3.84it/s][A
Training:  30%|██▉       | 17/57 [00:05<00:12,  3.17it/s][A
Training:  35%|███▌      | 20/57 [00:05<00:07,  4.69it/s][A
Training:  39%|███▊      | 22/57 [00:06<00:09,  3.56it/s][A
Training:  44%|████▍     | 25/57 [00:07<00:09,  3.34it/s][A
Training:  49%|████▉     | 28/57 [00:07<00:06,  4.78it/s][A
Training:  53%|█████▎    | 30/57 [00:08<00:07,  3.65it/s][A
Training:  56%|█████▌    | 32/57 [00:08<00:05,  4.55it/s][A
Training:  60%|█████▉    | 34/57 [00:09<00:06,  3.40it/s][A
Training:  65%|██████▍   | 37/57 [00:10<00:06,  3.15it/s][A
Training:  72%|███████▏  | 41/57 [0

Epoch: 6/40 - Loss: 0.0966 - Accuracy: 0.9660



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:08,  1.28s/it][A
 25%|██▌       | 2/8 [00:01<00:03,  1.68it/s][A
100%|██████████| 8/8 [00:02<00:00,  3.36it/s][A
Epochs:  15%|█▌        | 6/40 [01:46<10:00, 17.67s/it]

Val Loss: 0.0980 - Val Accuracy: 0.9684



Training:   0%|          | 0/57 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/57 [00:01<01:10,  1.27s/it][A
Training:   9%|▉         | 5/57 [00:02<00:19,  2.62it/s][A
Training:  12%|█▏        | 7/57 [00:02<00:12,  3.87it/s][A
Training:  16%|█▌        | 9/57 [00:03<00:15,  3.11it/s][A
Training:  18%|█▊        | 10/57 [00:03<00:13,  3.54it/s][A
Training:  23%|██▎       | 13/57 [00:04<00:12,  3.41it/s][A
Training:  25%|██▍       | 14/57 [00:04<00:11,  3.73it/s][A
Training:  30%|██▉       | 17/57 [00:05<00:11,  3.58it/s][A
Training:  32%|███▏      | 18/57 [00:05<00:09,  3.93it/s][A
Training:  37%|███▋      | 21/57 [00:06<00:09,  3.76it/s][A
Training:  39%|███▊      | 22/57 [00:06<00:09,  3.78it/s][A
Training:  44%|████▍     | 25/57 [00:07<00:08,  3.62it/s][A
Training:  47%|████▋     | 27/57 [00:07<00:06,  4.63it/s][A
Training:  49%|████▉     | 28/57 [00:07<00:05,  5.00it/s][A
Training:  51%|█████     | 29/57 [00:08<00:09,  2.98it/s][A
Training:  54%|█████▍    | 31/57 [00

Epoch: 7/40 - Loss: 0.0918 - Accuracy: 0.9662



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:09,  1.35s/it][A
100%|██████████| 8/8 [00:02<00:00,  3.39it/s][A
Epochs:  18%|█▊        | 7/40 [02:03<09:44, 17.71s/it]

Val Loss: 0.0894 - Val Accuracy: 0.9709



Training:   0%|          | 0/57 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/57 [00:01<01:19,  1.42s/it][A
Training:   9%|▉         | 5/57 [00:02<00:20,  2.52it/s][A
Training:  16%|█▌        | 9/57 [00:03<00:15,  3.09it/s][A
Training:  23%|██▎       | 13/57 [00:04<00:13,  3.31it/s][A
Training:  28%|██▊       | 16/57 [00:04<00:08,  4.59it/s][A
Training:  32%|███▏      | 18/57 [00:05<00:11,  3.54it/s][A
Training:  35%|███▌      | 20/57 [00:05<00:08,  4.45it/s][A
Training:  39%|███▊      | 22/57 [00:06<00:10,  3.35it/s][A
Training:  42%|████▏     | 24/57 [00:06<00:07,  4.34it/s][A
Training:  46%|████▌     | 26/57 [00:07<00:09,  3.32it/s][A
Training:  51%|█████     | 29/57 [00:08<00:08,  3.21it/s][A
Training:  54%|█████▍    | 31/57 [00:08<00:06,  4.09it/s][A
Training:  58%|█████▊    | 33/57 [00:09<00:07,  3.33it/s][A
Training:  60%|█████▉    | 34/57 [00:09<00:06,  3.59it/s][A
Training:  65%|██████▍   | 37/57 [00:10<00:05,  3.42it/s][A
Training:  67%|██████▋   | 38/57 [0

Epoch: 8/40 - Loss: 0.0929 - Accuracy: 0.9644



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:08,  1.25s/it][A
 38%|███▊      | 3/8 [00:01<00:01,  2.72it/s][A
 62%|██████▎   | 5/8 [00:02<00:01,  2.61it/s][A
100%|██████████| 8/8 [00:02<00:00,  3.37it/s][A
Epochs:  20%|██        | 8/40 [02:21<09:28, 17.78s/it]

Val Loss: 0.0886 - Val Accuracy: 0.9679



Training:   0%|          | 0/57 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/57 [00:01<01:16,  1.36s/it][A
Training:   9%|▉         | 5/57 [00:02<00:20,  2.54it/s][A
Training:  16%|█▌        | 9/57 [00:03<00:14,  3.30it/s][A
Training:  23%|██▎       | 13/57 [00:04<00:12,  3.41it/s][A
Training:  28%|██▊       | 16/57 [00:04<00:08,  4.75it/s][A
Training:  32%|███▏      | 18/57 [00:05<00:10,  3.56it/s][A
Training:  37%|███▋      | 21/57 [00:06<00:10,  3.40it/s][A
Training:  40%|████      | 23/57 [00:06<00:08,  4.16it/s][A
Training:  44%|████▍     | 25/57 [00:07<00:09,  3.40it/s][A
Training:  46%|████▌     | 26/57 [00:07<00:08,  3.78it/s][A
Training:  51%|█████     | 29/57 [00:08<00:07,  3.55it/s][A
Training:  53%|█████▎    | 30/57 [00:08<00:07,  3.76it/s][A
Training:  58%|█████▊    | 33/57 [00:09<00:06,  3.46it/s][A
Training:  61%|██████▏   | 35/57 [00:09<00:04,  4.47it/s][A
Training:  65%|██████▍   | 37/57 [00:10<00:05,  3.45it/s][A
Training:  67%|██████▋   | 38/57 [0

Epoch: 9/40 - Loss: 0.0861 - Accuracy: 0.9696



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:09,  1.29s/it][A
 50%|█████     | 4/8 [00:01<00:01,  3.63it/s][A
100%|██████████| 8/8 [00:02<00:00,  3.27it/s][A
Epochs:  22%|██▎       | 9/40 [02:39<09:09, 17.74s/it]

Val Loss: 0.0889 - Val Accuracy: 0.9654



Training:   0%|          | 0/57 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/57 [00:01<01:08,  1.22s/it][A
Training:   4%|▎         | 2/57 [00:01<00:30,  1.78it/s][A
Training:   9%|▉         | 5/57 [00:02<00:18,  2.74it/s][A
Training:  12%|█▏        | 7/57 [00:02<00:12,  3.91it/s][A
Training:  16%|█▌        | 9/57 [00:03<00:13,  3.52it/s][A
Training:  18%|█▊        | 10/57 [00:03<00:12,  3.77it/s][A
Training:  23%|██▎       | 13/57 [00:04<00:11,  3.81it/s][A
Training:  25%|██▍       | 14/57 [00:04<00:11,  3.67it/s][A
Training:  30%|██▉       | 17/57 [00:05<00:10,  3.94it/s][A
Training:  32%|███▏      | 18/57 [00:05<00:10,  3.61it/s][A
Training:  35%|███▌      | 20/57 [00:05<00:07,  4.92it/s][A
Training:  37%|███▋      | 21/57 [00:06<00:10,  3.51it/s][A
Training:  39%|███▊      | 22/57 [00:06<00:11,  3.16it/s][A
Training:  44%|████▍     | 25/57 [00:07<00:08,  3.89it/s][A
Training:  46%|████▌     | 26/57 [00:07<00:08,  3.47it/s][A
Training:  51%|█████     | 29/57 [00:

Epoch: 10/40 - Loss: 0.0830 - Accuracy: 0.9704



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:09,  1.38s/it][A
100%|██████████| 8/8 [00:02<00:00,  3.21it/s][A
Epochs:  25%|██▌       | 10/40 [02:57<08:52, 17.76s/it]

Val Loss: 0.0926 - Val Accuracy: 0.9669



Training:   0%|          | 0/57 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/57 [00:01<01:15,  1.34s/it][A
Training:   7%|▋         | 4/57 [00:01<00:15,  3.46it/s][A
Training:  11%|█         | 6/57 [00:02<00:18,  2.80it/s][A
Training:  14%|█▍        | 8/57 [00:02<00:11,  4.17it/s][A
Training:  18%|█▊        | 10/57 [00:03<00:13,  3.43it/s][A
Training:  23%|██▎       | 13/57 [00:04<00:13,  3.29it/s][A
Training:  28%|██▊       | 16/57 [00:04<00:08,  4.96it/s][A
Training:  32%|███▏      | 18/57 [00:05<00:11,  3.47it/s][A
Training:  37%|███▋      | 21/57 [00:06<00:11,  3.22it/s][A
Training:  42%|████▏     | 24/57 [00:06<00:07,  4.58it/s][A
Training:  46%|████▌     | 26/57 [00:07<00:08,  3.57it/s][A
Training:  51%|█████     | 29/57 [00:08<00:08,  3.30it/s][A
Training:  58%|█████▊    | 33/57 [00:09<00:06,  3.51it/s][A
Training:  61%|██████▏   | 35/57 [00:09<00:05,  4.18it/s][A
Training:  65%|██████▍   | 37/57 [00:10<00:05,  3.42it/s][A
Training:  68%|██████▊   | 39/57 [00

Epoch: 11/40 - Loss: 0.0803 - Accuracy: 0.9707



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:09,  1.36s/it][A
100%|██████████| 8/8 [00:02<00:00,  3.29it/s][A
Epochs:  28%|██▊       | 11/40 [03:14<08:33, 17.71s/it]

Val Loss: 0.0861 - Val Accuracy: 0.9674



Training:   0%|          | 0/57 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/57 [00:01<01:11,  1.28s/it][A
Training:   5%|▌         | 3/57 [00:01<00:20,  2.68it/s][A
Training:   9%|▉         | 5/57 [00:02<00:20,  2.58it/s][A
Training:  14%|█▍        | 8/57 [00:02<00:10,  4.72it/s][A
Training:  18%|█▊        | 10/57 [00:03<00:12,  3.62it/s][A
Training:  21%|██        | 12/57 [00:03<00:09,  4.88it/s][A
Training:  25%|██▍       | 14/57 [00:04<00:11,  3.81it/s][A
Training:  28%|██▊       | 16/57 [00:04<00:08,  4.71it/s][A
Training:  30%|██▉       | 17/57 [00:04<00:12,  3.29it/s][A
Training:  33%|███▎      | 19/57 [00:05<00:08,  4.33it/s][A
Training:  37%|███▋      | 21/57 [00:06<00:10,  3.30it/s][A
Training:  40%|████      | 23/57 [00:06<00:08,  4.06it/s][A
Training:  44%|████▍     | 25/57 [00:07<00:09,  3.35it/s][A
Training:  47%|████▋     | 27/57 [00:07<00:07,  3.94it/s][A
Training:  51%|█████     | 29/57 [00:08<00:08,  3.32it/s][A
Training:  54%|█████▍    | 31/57 [00

Epoch: 12/40 - Loss: 0.0798 - Accuracy: 0.9709



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:09,  1.36s/it][A
 50%|█████     | 4/8 [00:01<00:01,  3.45it/s][A
100%|██████████| 8/8 [00:02<00:00,  3.17it/s][A
Epochs:  30%|███       | 12/40 [03:32<08:14, 17.67s/it]

Val Loss: 0.0862 - Val Accuracy: 0.9679



Training:   0%|          | 0/57 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/57 [00:01<01:09,  1.24s/it][A
Training:   7%|▋         | 4/57 [00:01<00:14,  3.66it/s][A
Training:  11%|█         | 6/57 [00:02<00:17,  2.85it/s][A
Training:  16%|█▌        | 9/57 [00:03<00:16,  2.93it/s][A
Training:  21%|██        | 12/57 [00:03<00:10,  4.46it/s][A
Training:  25%|██▍       | 14/57 [00:04<00:12,  3.52it/s][A
Training:  30%|██▉       | 17/57 [00:05<00:11,  3.47it/s][A
Training:  33%|███▎      | 19/57 [00:05<00:08,  4.39it/s][A
Training:  37%|███▋      | 21/57 [00:06<00:10,  3.46it/s][A
Training:  40%|████      | 23/57 [00:06<00:07,  4.26it/s][A
Training:  44%|████▍     | 25/57 [00:07<00:09,  3.39it/s][A
Training:  47%|████▋     | 27/57 [00:07<00:07,  4.20it/s][A
Training:  51%|█████     | 29/57 [00:08<00:08,  3.31it/s][A
Training:  54%|█████▍    | 31/57 [00:08<00:06,  4.10it/s][A
Training:  58%|█████▊    | 33/57 [00:09<00:07,  3.37it/s][A
Training:  61%|██████▏   | 35/57 [00

Epoch: 13/40 - Loss: 0.0774 - Accuracy: 0.9716



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:09,  1.35s/it][A
 50%|█████     | 4/8 [00:01<00:01,  3.48it/s][A
 75%|███████▌  | 6/8 [00:02<00:00,  2.82it/s][A
100%|██████████| 8/8 [00:02<00:00,  3.16it/s][A
Epochs:  32%|███▎      | 13/40 [03:50<07:57, 17.68s/it]

Val Loss: 0.0882 - Val Accuracy: 0.9664



Training:   0%|          | 0/57 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/57 [00:01<01:15,  1.35s/it][A
Training:   7%|▋         | 4/57 [00:01<00:15,  3.53it/s][A
Training:  11%|█         | 6/57 [00:02<00:18,  2.78it/s][A
Training:  16%|█▌        | 9/57 [00:03<00:16,  2.93it/s][A
Training:  19%|█▉        | 11/57 [00:03<00:11,  3.95it/s][A
Training:  23%|██▎       | 13/57 [00:04<00:13,  3.33it/s][A
Training:  28%|██▊       | 16/57 [00:04<00:08,  4.95it/s][A
Training:  32%|███▏      | 18/57 [00:05<00:09,  3.94it/s][A
Training:  35%|███▌      | 20/57 [00:05<00:07,  4.98it/s][A
Training:  39%|███▊      | 22/57 [00:06<00:09,  3.55it/s][A
Training:  44%|████▍     | 25/57 [00:07<00:10,  3.19it/s][A
Training:  49%|████▉     | 28/57 [00:07<00:06,  4.61it/s][A
Training:  53%|█████▎    | 30/57 [00:08<00:07,  3.40it/s][A
Training:  58%|█████▊    | 33/57 [00:09<00:07,  3.30it/s][A
Training:  61%|██████▏   | 35/57 [00:09<00:05,  4.16it/s][A
Training:  65%|██████▍   | 37/57 [00

Epoch: 14/40 - Loss: 0.0768 - Accuracy: 0.9706



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:09,  1.33s/it][A
 38%|███▊      | 3/8 [00:01<00:01,  2.60it/s][A
 62%|██████▎   | 5/8 [00:02<00:01,  2.40it/s][A
100%|██████████| 8/8 [00:02<00:00,  3.15it/s][A
Epochs:  35%|███▌      | 14/40 [04:07<07:39, 17.67s/it]

Val Loss: 0.0893 - Val Accuracy: 0.9659



Training:   0%|          | 0/57 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/57 [00:01<01:14,  1.33s/it][A
Training:   4%|▎         | 2/57 [00:01<00:34,  1.62it/s][A
Training:   9%|▉         | 5/57 [00:02<00:21,  2.47it/s][A
Training:  16%|█▌        | 9/57 [00:03<00:14,  3.20it/s][A
Training:  19%|█▉        | 11/57 [00:03<00:10,  4.24it/s][A
Training:  23%|██▎       | 13/57 [00:04<00:13,  3.16it/s][A
Training:  28%|██▊       | 16/57 [00:04<00:08,  4.81it/s][A
Training:  32%|███▏      | 18/57 [00:05<00:10,  3.76it/s][A
Training:  37%|███▋      | 21/57 [00:06<00:10,  3.42it/s][A
Training:  44%|████▍     | 25/57 [00:07<00:08,  3.56it/s][A
Training:  47%|████▋     | 27/57 [00:07<00:06,  4.30it/s][A
Training:  51%|█████     | 29/57 [00:08<00:08,  3.44it/s][A
Training:  54%|█████▍    | 31/57 [00:08<00:05,  4.35it/s][A
Training:  58%|█████▊    | 33/57 [00:09<00:07,  3.38it/s][A
Training:  63%|██████▎   | 36/57 [00:09<00:04,  4.89it/s][A
Training:  67%|██████▋   | 38/57 [00

Epoch: 15/40 - Loss: 0.0815 - Accuracy: 0.9700



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:08,  1.29s/it][A
 25%|██▌       | 2/8 [00:01<00:03,  1.65it/s][A
 50%|█████     | 4/8 [00:01<00:01,  3.88it/s][A
100%|██████████| 8/8 [00:02<00:00,  3.22it/s][A
Epochs:  38%|███▊      | 15/40 [04:25<07:22, 17.71s/it]

Val Loss: 0.1048 - Val Accuracy: 0.9578



Training:   0%|          | 0/57 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/57 [00:01<01:17,  1.38s/it][A
Training:   5%|▌         | 3/57 [00:01<00:21,  2.53it/s][A
Training:   9%|▉         | 5/57 [00:02<00:22,  2.35it/s][A
Training:  16%|█▌        | 9/57 [00:03<00:15,  3.08it/s][A
Training:  21%|██        | 12/57 [00:03<00:09,  4.67it/s][A
Training:  25%|██▍       | 14/57 [00:04<00:11,  3.65it/s][A
Training:  30%|██▉       | 17/57 [00:05<00:11,  3.56it/s][A
Training:  33%|███▎      | 19/57 [00:05<00:08,  4.34it/s][A
Training:  37%|███▋      | 21/57 [00:06<00:09,  3.65it/s][A
Training:  42%|████▏     | 24/57 [00:06<00:06,  5.29it/s][A
Training:  46%|████▌     | 26/57 [00:07<00:07,  3.91it/s][A
Training:  49%|████▉     | 28/57 [00:07<00:05,  4.92it/s][A
Training:  53%|█████▎    | 30/57 [00:08<00:07,  3.56it/s][A
Training:  58%|█████▊    | 33/57 [00:09<00:07,  3.27it/s][A
Training:  65%|██████▍   | 37/57 [00:10<00:06,  3.32it/s][A
Training:  72%|███████▏  | 41/57 [00

Epoch: 16/40 - Loss: 0.0777 - Accuracy: 0.9693



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:09,  1.38s/it][A
 62%|██████▎   | 5/8 [00:02<00:01,  2.41it/s][A
100%|██████████| 8/8 [00:02<00:00,  3.16it/s][A
Epochs:  40%|████      | 16/40 [04:43<07:03, 17.67s/it]

Val Loss: 0.0873 - Val Accuracy: 0.9659



Training:   0%|          | 0/57 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/57 [00:01<01:16,  1.37s/it][A
Training:   7%|▋         | 4/57 [00:01<00:15,  3.42it/s][A
Training:  11%|█         | 6/57 [00:02<00:19,  2.66it/s][A
Training:  16%|█▌        | 9/57 [00:03<00:17,  2.69it/s][A
Training:  19%|█▉        | 11/57 [00:03<00:12,  3.60it/s][A
Training:  23%|██▎       | 13/57 [00:04<00:13,  3.17it/s][A
Training:  30%|██▉       | 17/57 [00:05<00:10,  3.65it/s][A
Training:  33%|███▎      | 19/57 [00:05<00:08,  4.57it/s][A
Training:  37%|███▋      | 21/57 [00:06<00:10,  3.51it/s][A
Training:  42%|████▏     | 24/57 [00:06<00:06,  5.15it/s][A
Training:  46%|████▌     | 26/57 [00:07<00:07,  4.06it/s][A
Training:  51%|█████     | 29/57 [00:08<00:07,  3.62it/s][A
Training:  54%|█████▍    | 31/57 [00:08<00:05,  4.46it/s][A
Training:  58%|█████▊    | 33/57 [00:09<00:06,  3.52it/s][A
Training:  63%|██████▎   | 36/57 [00:09<00:04,  5.11it/s][A
Training:  67%|██████▋   | 38/57 [00

Epoch: 17/40 - Loss: 0.0741 - Accuracy: 0.9727



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:08,  1.28s/it][A
 62%|██████▎   | 5/8 [00:02<00:01,  2.49it/s][A
100%|██████████| 8/8 [00:02<00:00,  3.25it/s][A
Epochs:  42%|████▎     | 17/40 [05:00<06:44, 17.60s/it]

Val Loss: 0.0878 - Val Accuracy: 0.9669



Training:   0%|          | 0/57 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/57 [00:01<01:11,  1.28s/it][A
Training:   4%|▎         | 2/57 [00:01<00:33,  1.63it/s][A
Training:   9%|▉         | 5/57 [00:02<00:20,  2.52it/s][A
Training:  11%|█         | 6/57 [00:02<00:16,  3.04it/s][A
Training:  16%|█▌        | 9/57 [00:03<00:14,  3.38it/s][A
Training:  18%|█▊        | 10/57 [00:03<00:14,  3.26it/s][A
Training:  23%|██▎       | 13/57 [00:04<00:12,  3.62it/s][A
Training:  25%|██▍       | 14/57 [00:04<00:12,  3.44it/s][A
Training:  30%|██▉       | 17/57 [00:05<00:10,  4.00it/s][A
Training:  32%|███▏      | 18/57 [00:05<00:10,  3.86it/s][A
Training:  37%|███▋      | 21/57 [00:06<00:09,  3.87it/s][A
Training:  39%|███▊      | 22/57 [00:06<00:08,  3.92it/s][A
Training:  42%|████▏     | 24/57 [00:06<00:06,  5.27it/s][A
Training:  44%|████▍     | 25/57 [00:07<00:09,  3.55it/s][A
Training:  46%|████▌     | 26/57 [00:07<00:08,  3.68it/s][A
Training:  51%|█████     | 29/57 [00:

Epoch: 18/40 - Loss: 0.0715 - Accuracy: 0.9738



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:09,  1.34s/it][A
 62%|██████▎   | 5/8 [00:02<00:01,  2.47it/s][A
100%|██████████| 8/8 [00:02<00:00,  3.17it/s][A
Epochs:  45%|████▌     | 18/40 [05:18<06:28, 17.66s/it]

Val Loss: 0.0881 - Val Accuracy: 0.9664



Training:   0%|          | 0/57 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/57 [00:01<01:13,  1.31s/it][A
Training:   7%|▋         | 4/57 [00:01<00:14,  3.62it/s][A
Training:  11%|█         | 6/57 [00:02<00:18,  2.76it/s][A
Training:  16%|█▌        | 9/57 [00:03<00:16,  2.99it/s][A
Training:  18%|█▊        | 10/57 [00:03<00:14,  3.35it/s][A
Training:  23%|██▎       | 13/57 [00:04<00:13,  3.28it/s][A
Training:  25%|██▍       | 14/57 [00:04<00:12,  3.55it/s][A
Training:  30%|██▉       | 17/57 [00:05<00:11,  3.58it/s][A
Training:  32%|███▏      | 18/57 [00:05<00:09,  3.92it/s][A
Training:  37%|███▋      | 21/57 [00:06<00:09,  3.64it/s][A
Training:  39%|███▊      | 22/57 [00:06<00:08,  4.07it/s][A
Training:  42%|████▏     | 24/57 [00:06<00:06,  5.44it/s][A
Training:  46%|████▌     | 26/57 [00:07<00:08,  3.56it/s][A
Training:  51%|█████     | 29/57 [00:08<00:07,  3.64it/s][A
Training:  53%|█████▎    | 30/57 [00:08<00:06,  3.98it/s][A
Training:  58%|█████▊    | 33/57 [00

Epoch: 19/40 - Loss: 0.0711 - Accuracy: 0.9734



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:08,  1.27s/it][A
 38%|███▊      | 3/8 [00:01<00:01,  2.55it/s][A
 62%|██████▎   | 5/8 [00:02<00:01,  2.44it/s][A
100%|██████████| 8/8 [00:02<00:00,  3.07it/s][A
Epochs:  48%|████▊     | 19/40 [05:36<06:10, 17.65s/it]

Val Loss: 0.0901 - Val Accuracy: 0.9654



Training:   0%|          | 0/57 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/57 [00:01<01:18,  1.41s/it][A
Training:   9%|▉         | 5/57 [00:02<00:22,  2.33it/s][A
Training:  12%|█▏        | 7/57 [00:02<00:14,  3.45it/s][A
Training:  16%|█▌        | 9/57 [00:03<00:17,  2.72it/s][A
Training:  19%|█▉        | 11/57 [00:03<00:12,  3.81it/s][A
Training:  23%|██▎       | 13/57 [00:04<00:14,  3.04it/s][A
Training:  28%|██▊       | 16/57 [00:04<00:08,  4.78it/s][A
Training:  32%|███▏      | 18/57 [00:05<00:11,  3.39it/s][A
Training:  37%|███▋      | 21/57 [00:06<00:11,  3.25it/s][A
Training:  42%|████▏     | 24/57 [00:06<00:07,  4.69it/s][A
Training:  46%|████▌     | 26/57 [00:07<00:08,  3.76it/s][A
Training:  49%|████▉     | 28/57 [00:07<00:06,  4.70it/s][A
Training:  53%|█████▎    | 30/57 [00:08<00:07,  3.52it/s][A
Training:  56%|█████▌    | 32/57 [00:08<00:05,  4.52it/s][A
Training:  60%|█████▉    | 34/57 [00:09<00:06,  3.34it/s][A
Training:  65%|██████▍   | 37/57 [00

Epoch: 20/40 - Loss: 0.0707 - Accuracy: 0.9739



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:08,  1.24s/it][A
 50%|█████     | 4/8 [00:01<00:01,  3.39it/s][A
100%|██████████| 8/8 [00:02<00:00,  3.33it/s][A
Epochs:  50%|█████     | 20/40 [05:53<05:54, 17.73s/it]

Val Loss: 0.0873 - Val Accuracy: 0.9654



Training:   0%|          | 0/57 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/57 [00:01<01:20,  1.44s/it][A
Training:   5%|▌         | 3/57 [00:01<00:22,  2.39it/s][A
Training:   9%|▉         | 5/57 [00:02<00:23,  2.21it/s][A
Training:  14%|█▍        | 8/57 [00:02<00:12,  3.95it/s][A
Training:  16%|█▌        | 9/57 [00:03<00:19,  2.43it/s][A
Training:  21%|██        | 12/57 [00:03<00:10,  4.20it/s][A
Training:  25%|██▍       | 14/57 [00:04<00:13,  3.23it/s][A
Training:  28%|██▊       | 16/57 [00:04<00:09,  4.31it/s][A
Training:  32%|███▏      | 18/57 [00:05<00:12,  3.23it/s][A
Training:  35%|███▌      | 20/57 [00:06<00:08,  4.25it/s][A
Training:  39%|███▊      | 22/57 [00:06<00:10,  3.30it/s][A
Training:  44%|████▍     | 25/57 [00:07<00:09,  3.37it/s][A
Training:  46%|████▌     | 26/57 [00:07<00:08,  3.75it/s][A
Training:  49%|████▉     | 28/57 [00:08<00:06,  4.68it/s][A
Training:  51%|█████     | 29/57 [00:08<00:08,  3.14it/s][A
Training:  56%|█████▌    | 32/57 [00:

Epoch: 21/40 - Loss: 0.0708 - Accuracy: 0.9719



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:09,  1.37s/it][A
 38%|███▊      | 3/8 [00:01<00:02,  2.49it/s][A
 62%|██████▎   | 5/8 [00:02<00:01,  2.38it/s][A
100%|██████████| 8/8 [00:02<00:00,  3.14it/s][A
Epochs:  52%|█████▎    | 21/40 [06:12<05:39, 17.89s/it]

Val Loss: 0.0865 - Val Accuracy: 0.9674



Training:   0%|          | 0/57 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/57 [00:01<01:19,  1.42s/it][A
Training:   7%|▋         | 4/57 [00:01<00:16,  3.29it/s][A
Training:  11%|█         | 6/57 [00:02<00:19,  2.62it/s][A
Training:  16%|█▌        | 9/57 [00:03<00:17,  2.79it/s][A
Training:  19%|█▉        | 11/57 [00:03<00:12,  3.64it/s][A
Training:  23%|██▎       | 13/57 [00:04<00:13,  3.16it/s][A
Training:  26%|██▋       | 15/57 [00:04<00:10,  4.03it/s][A
Training:  30%|██▉       | 17/57 [00:05<00:12,  3.21it/s][A
Training:  33%|███▎      | 19/57 [00:05<00:09,  4.06it/s][A
Training:  37%|███▋      | 21/57 [00:06<00:10,  3.33it/s][A
Training:  40%|████      | 23/57 [00:06<00:08,  4.08it/s][A
Training:  44%|████▍     | 25/57 [00:07<00:09,  3.47it/s][A
Training:  47%|████▋     | 27/57 [00:07<00:07,  4.20it/s][A
Training:  51%|█████     | 29/57 [00:08<00:08,  3.49it/s][A
Training:  54%|█████▍    | 31/57 [00:08<00:05,  4.34it/s][A
Training:  58%|█████▊    | 33/57 [00

Epoch: 22/40 - Loss: 0.0689 - Accuracy: 0.9739



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:09,  1.31s/it][A
 38%|███▊      | 3/8 [00:01<00:01,  2.61it/s][A
100%|██████████| 8/8 [00:02<00:00,  3.25it/s][A
Epochs:  55%|█████▌    | 22/40 [06:30<05:22, 17.91s/it]

Val Loss: 0.0902 - Val Accuracy: 0.9664



Training:   0%|          | 0/57 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/57 [00:01<01:20,  1.44s/it][A
Training:   5%|▌         | 3/57 [00:01<00:22,  2.43it/s][A
Training:   9%|▉         | 5/57 [00:02<00:22,  2.31it/s][A
Training:  12%|█▏        | 7/57 [00:02<00:13,  3.66it/s][A
Training:  16%|█▌        | 9/57 [00:03<00:17,  2.73it/s][A
Training:  21%|██        | 12/57 [00:03<00:09,  4.54it/s][A
Training:  25%|██▍       | 14/57 [00:04<00:12,  3.48it/s][A
Training:  30%|██▉       | 17/57 [00:05<00:12,  3.21it/s][A
Training:  37%|███▋      | 21/57 [00:06<00:10,  3.40it/s][A
Training:  42%|████▏     | 24/57 [00:06<00:07,  4.70it/s][A
Training:  46%|████▌     | 26/57 [00:07<00:08,  3.74it/s][A
Training:  49%|████▉     | 28/57 [00:07<00:06,  4.62it/s][A
Training:  53%|█████▎    | 30/57 [00:08<00:07,  3.56it/s][A
Training:  56%|█████▌    | 32/57 [00:08<00:05,  4.58it/s][A
Training:  60%|█████▉    | 34/57 [00:09<00:06,  3.41it/s][A
Training:  65%|██████▍   | 37/57 [00:

Epoch: 23/40 - Loss: 0.0693 - Accuracy: 0.9726



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:08,  1.27s/it][A
 38%|███▊      | 3/8 [00:01<00:01,  2.62it/s][A
 62%|██████▎   | 5/8 [00:02<00:01,  2.48it/s][A
100%|██████████| 8/8 [00:02<00:00,  3.24it/s][A
Epochs:  57%|█████▊    | 23/40 [06:48<05:04, 17.92s/it]

Val Loss: 0.0871 - Val Accuracy: 0.9674



Training:   0%|          | 0/57 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/57 [00:01<01:20,  1.44s/it][A
Training:   9%|▉         | 5/57 [00:02<00:21,  2.41it/s][A
Training:  11%|█         | 6/57 [00:02<00:17,  2.84it/s][A
Training:  16%|█▌        | 9/57 [00:03<00:15,  3.02it/s][A
Training:  18%|█▊        | 10/57 [00:03<00:13,  3.41it/s][A
Training:  23%|██▎       | 13/57 [00:04<00:12,  3.47it/s][A
Training:  25%|██▍       | 14/57 [00:04<00:11,  3.73it/s][A
Training:  30%|██▉       | 17/57 [00:05<00:10,  3.68it/s][A
Training:  32%|███▏      | 18/57 [00:05<00:10,  3.82it/s][A
Training:  37%|███▋      | 21/57 [00:06<00:09,  3.62it/s][A
Training:  39%|███▊      | 22/57 [00:06<00:09,  3.81it/s][A
Training:  44%|████▍     | 25/57 [00:07<00:08,  3.67it/s][A
Training:  46%|████▌     | 26/57 [00:07<00:08,  3.84it/s][A
Training:  51%|█████     | 29/57 [00:08<00:07,  3.87it/s][A
Training:  53%|█████▎    | 30/57 [00:08<00:06,  3.88it/s][A
Training:  56%|█████▌    | 32/57 [00

Epoch: 24/40 - Loss: 0.0710 - Accuracy: 0.9744



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:09,  1.38s/it][A
 50%|█████     | 4/8 [00:01<00:01,  3.28it/s][A
100%|██████████| 8/8 [00:02<00:00,  3.23it/s][A
Epochs:  60%|██████    | 24/40 [07:06<04:47, 17.94s/it]

Val Loss: 0.0893 - Val Accuracy: 0.9659



Training:   0%|          | 0/57 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/57 [00:01<01:19,  1.42s/it][A
Training:   7%|▋         | 4/57 [00:01<00:16,  3.28it/s][A
Training:  11%|█         | 6/57 [00:02<00:19,  2.58it/s][A
Training:  14%|█▍        | 8/57 [00:02<00:12,  3.82it/s][A
Training:  18%|█▊        | 10/57 [00:03<00:16,  2.89it/s][A
Training:  21%|██        | 12/57 [00:03<00:11,  4.00it/s][A
Training:  25%|██▍       | 14/57 [00:04<00:13,  3.29it/s][A
Training:  28%|██▊       | 16/57 [00:04<00:09,  4.34it/s][A
Training:  32%|███▏      | 18/57 [00:05<00:12,  3.17it/s][A
Training:  37%|███▋      | 21/57 [00:06<00:11,  3.15it/s][A
Training:  42%|████▏     | 24/57 [00:06<00:07,  4.34it/s][A
Training:  44%|████▍     | 25/57 [00:07<00:09,  3.25it/s][A
Training:  47%|████▋     | 27/57 [00:07<00:06,  4.32it/s][A
Training:  51%|█████     | 29/57 [00:08<00:08,  3.23it/s][A
Training:  56%|█████▌    | 32/57 [00:09<00:05,  4.44it/s][A
Training:  58%|█████▊    | 33/57 [00

Epoch: 25/40 - Loss: 0.0679 - Accuracy: 0.9740



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:09,  1.38s/it][A
100%|██████████| 8/8 [00:02<00:00,  3.25it/s][A
Epochs:  62%|██████▎   | 25/40 [07:24<04:29, 17.99s/it]

Val Loss: 0.0885 - Val Accuracy: 0.9659



Training:   0%|          | 0/57 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/57 [00:01<01:16,  1.36s/it][A
Training:   7%|▋         | 4/57 [00:01<00:15,  3.51it/s][A
Training:  11%|█         | 6/57 [00:02<00:19,  2.63it/s][A
Training:  16%|█▌        | 9/57 [00:03<00:17,  2.69it/s][A
Training:  21%|██        | 12/57 [00:03<00:10,  4.27it/s][A
Training:  25%|██▍       | 14/57 [00:04<00:13,  3.24it/s][A
Training:  30%|██▉       | 17/57 [00:05<00:12,  3.17it/s][A
Training:  33%|███▎      | 19/57 [00:05<00:09,  4.03it/s][A
Training:  37%|███▋      | 21/57 [00:06<00:11,  3.26it/s][A
Training:  40%|████      | 23/57 [00:06<00:08,  4.23it/s][A
Training:  44%|████▍     | 25/57 [00:07<00:09,  3.35it/s][A
Training:  49%|████▉     | 28/57 [00:07<00:05,  5.03it/s][A
Training:  53%|█████▎    | 30/57 [00:08<00:07,  3.62it/s][A
Training:  58%|█████▊    | 33/57 [00:09<00:07,  3.32it/s][A
Training:  65%|██████▍   | 37/57 [00:10<00:05,  3.59it/s][A
Training:  68%|██████▊   | 39/57 [00

Epoch: 26/40 - Loss: 0.0664 - Accuracy: 0.9744



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:09,  1.34s/it][A
100%|██████████| 8/8 [00:02<00:00,  3.19it/s][A
Epochs:  65%|██████▌   | 26/40 [07:42<04:11, 17.96s/it]

Val Loss: 0.0914 - Val Accuracy: 0.9644



Training:   0%|          | 0/57 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/57 [00:01<01:14,  1.33s/it][A
Training:   4%|▎         | 2/57 [00:01<00:34,  1.59it/s][A
Training:   9%|▉         | 5/57 [00:02<00:20,  2.59it/s][A
Training:  14%|█▍        | 8/57 [00:02<00:10,  4.75it/s][A
Training:  18%|█▊        | 10/57 [00:03<00:14,  3.16it/s][A
Training:  21%|██        | 12/57 [00:03<00:10,  4.18it/s][A
Training:  25%|██▍       | 14/57 [00:04<00:13,  3.24it/s][A
Training:  30%|██▉       | 17/57 [00:05<00:12,  3.30it/s][A
Training:  32%|███▏      | 18/57 [00:05<00:10,  3.58it/s][A
Training:  35%|███▌      | 20/57 [00:05<00:08,  4.62it/s][A
Training:  37%|███▋      | 21/57 [00:06<00:11,  3.14it/s][A
Training:  40%|████      | 23/57 [00:06<00:07,  4.28it/s][A
Training:  44%|████▍     | 25/57 [00:07<00:09,  3.34it/s][A
Training:  46%|████▌     | 26/57 [00:07<00:08,  3.70it/s][A
Training:  49%|████▉     | 28/57 [00:07<00:05,  5.17it/s][A
Training:  53%|█████▎    | 30/57 [00

Epoch: 27/40 - Loss: 0.0657 - Accuracy: 0.9753



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:09,  1.41s/it][A
100%|██████████| 8/8 [00:02<00:00,  3.14it/s][A
Epochs:  68%|██████▊   | 27/40 [08:00<03:54, 18.01s/it]

Val Loss: 0.0899 - Val Accuracy: 0.9679



Training:   0%|          | 0/57 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/57 [00:01<01:15,  1.35s/it][A
Training:   7%|▋         | 4/57 [00:01<00:15,  3.43it/s][A
Training:  11%|█         | 6/57 [00:02<00:18,  2.74it/s][A
Training:  16%|█▌        | 9/57 [00:03<00:17,  2.74it/s][A
Training:  21%|██        | 12/57 [00:03<00:10,  4.27it/s][A
Training:  25%|██▍       | 14/57 [00:04<00:12,  3.31it/s][A
Training:  30%|██▉       | 17/57 [00:05<00:12,  3.10it/s][A
Training:  35%|███▌      | 20/57 [00:05<00:08,  4.46it/s][A
Training:  39%|███▊      | 22/57 [00:06<00:09,  3.51it/s][A
Training:  42%|████▏     | 24/57 [00:06<00:07,  4.48it/s][A
Training:  46%|████▌     | 26/57 [00:07<00:09,  3.40it/s][A
Training:  51%|█████     | 29/57 [00:08<00:08,  3.24it/s][A
Training:  54%|█████▍    | 31/57 [00:08<00:06,  4.13it/s][A
Training:  58%|█████▊    | 33/57 [00:09<00:07,  3.29it/s][A
Training:  61%|██████▏   | 35/57 [00:09<00:05,  4.27it/s][A
Training:  65%|██████▍   | 37/57 [00

Epoch: 28/40 - Loss: 0.0648 - Accuracy: 0.9763



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:09,  1.39s/it][A
 50%|█████     | 4/8 [00:01<00:01,  3.44it/s][A
100%|██████████| 8/8 [00:02<00:00,  3.25it/s][A
Epochs:  70%|███████   | 28/40 [08:18<03:36, 18.05s/it]

Val Loss: 0.0873 - Val Accuracy: 0.9684



Training:   0%|          | 0/57 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/57 [00:01<01:20,  1.44s/it][A
Training:   7%|▋         | 4/57 [00:01<00:17,  3.10it/s][A
Training:  11%|█         | 6/57 [00:02<00:18,  2.75it/s][A
Training:  16%|█▌        | 9/57 [00:03<00:17,  2.78it/s][A
Training:  19%|█▉        | 11/57 [00:03<00:12,  3.75it/s][A
Training:  23%|██▎       | 13/57 [00:04<00:14,  3.08it/s][A
Training:  25%|██▍       | 14/57 [00:04<00:12,  3.42it/s][A
Training:  28%|██▊       | 16/57 [00:04<00:08,  4.67it/s][A
Training:  30%|██▉       | 17/57 [00:05<00:13,  3.03it/s][A
Training:  32%|███▏      | 18/57 [00:05<00:11,  3.25it/s][A
Training:  37%|███▋      | 21/57 [00:06<00:11,  3.17it/s][A
Training:  40%|████      | 23/57 [00:06<00:07,  4.26it/s][A
Training:  44%|████▍     | 25/57 [00:07<00:09,  3.32it/s][A
Training:  51%|█████     | 29/57 [00:08<00:07,  3.57it/s][A
Training:  54%|█████▍    | 31/57 [00:09<00:05,  4.44it/s][A
Training:  58%|█████▊    | 33/57 [00

Epoch: 29/40 - Loss: 0.0655 - Accuracy: 0.9748



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:09,  1.42s/it][A
100%|██████████| 8/8 [00:02<00:00,  3.16it/s][A
Epochs:  72%|███████▎  | 29/40 [08:36<03:19, 18.10s/it]

Val Loss: 0.0877 - Val Accuracy: 0.9659



Training:   0%|          | 0/57 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/57 [00:01<01:15,  1.34s/it][A
Training:   9%|▉         | 5/57 [00:02<00:22,  2.35it/s][A
Training:  14%|█▍        | 8/57 [00:02<00:11,  4.18it/s][A
Training:  18%|█▊        | 10/57 [00:03<00:15,  3.04it/s][A
Training:  23%|██▎       | 13/57 [00:04<00:14,  3.07it/s][A
Training:  28%|██▊       | 16/57 [00:04<00:09,  4.53it/s][A
Training:  32%|███▏      | 18/57 [00:05<00:11,  3.41it/s][A
Training:  37%|███▋      | 21/57 [00:06<00:11,  3.25it/s][A
Training:  39%|███▊      | 22/57 [00:06<00:09,  3.55it/s][A
Training:  42%|████▏     | 24/57 [00:06<00:07,  4.65it/s][A
Training:  46%|████▌     | 26/57 [00:07<00:08,  3.49it/s][A
Training:  51%|█████     | 29/57 [00:08<00:08,  3.47it/s][A
Training:  53%|█████▎    | 30/57 [00:08<00:07,  3.59it/s][A
Training:  56%|█████▌    | 32/57 [00:09<00:05,  4.76it/s][A
Training:  58%|█████▊    | 33/57 [00:09<00:07,  3.25it/s][A
Training:  60%|█████▉    | 34/57 [0

Epoch: 30/40 - Loss: 0.0648 - Accuracy: 0.9759



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:09,  1.33s/it][A
100%|██████████| 8/8 [00:02<00:00,  3.32it/s][A
Epochs:  75%|███████▌  | 30/40 [08:54<03:00, 18.01s/it]

Val Loss: 0.0892 - Val Accuracy: 0.9689



Training:   0%|          | 0/57 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/57 [00:01<01:21,  1.45s/it][A
Training:   7%|▋         | 4/57 [00:01<00:16,  3.19it/s][A
Training:  11%|█         | 6/57 [00:02<00:18,  2.72it/s][A
Training:  14%|█▍        | 8/57 [00:02<00:12,  4.01it/s][A
Training:  18%|█▊        | 10/57 [00:03<00:15,  3.02it/s][A
Training:  19%|█▉        | 11/57 [00:03<00:13,  3.48it/s][A
Training:  23%|██▎       | 13/57 [00:04<00:15,  2.91it/s][A
Training:  28%|██▊       | 16/57 [00:04<00:08,  4.78it/s][A
Training:  32%|███▏      | 18/57 [00:05<00:11,  3.35it/s][A
Training:  35%|███▌      | 20/57 [00:05<00:08,  4.39it/s][A
Training:  39%|███▊      | 22/57 [00:06<00:11,  3.17it/s][A
Training:  44%|████▍     | 25/57 [00:07<00:10,  3.08it/s][A
Training:  51%|█████     | 29/57 [00:08<00:08,  3.48it/s][A
Training:  54%|█████▍    | 31/57 [00:08<00:06,  4.24it/s][A
Training:  58%|█████▊    | 33/57 [00:09<00:07,  3.37it/s][A
Training:  63%|██████▎   | 36/57 [00

Epoch: 31/40 - Loss: 0.0654 - Accuracy: 0.9753



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:09,  1.30s/it][A
 38%|███▊      | 3/8 [00:01<00:01,  2.57it/s][A
100%|██████████| 8/8 [00:02<00:00,  3.22it/s][A
Epochs:  78%|███████▊  | 31/40 [09:12<02:42, 18.03s/it]

Val Loss: 0.1042 - Val Accuracy: 0.9649



Training:   0%|          | 0/57 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/57 [00:01<01:20,  1.44s/it][A
Training:   5%|▌         | 3/57 [00:01<00:22,  2.37it/s][A
Training:   9%|▉         | 5/57 [00:02<00:22,  2.29it/s][A
Training:  16%|█▌        | 9/57 [00:03<00:16,  2.99it/s][A
Training:  19%|█▉        | 11/57 [00:03<00:11,  3.97it/s][A
Training:  23%|██▎       | 13/57 [00:04<00:14,  3.12it/s][A
Training:  30%|██▉       | 17/57 [00:05<00:11,  3.37it/s][A
Training:  33%|███▎      | 19/57 [00:05<00:08,  4.23it/s][A
Training:  37%|███▋      | 21/57 [00:06<00:10,  3.42it/s][A
Training:  42%|████▏     | 24/57 [00:06<00:06,  4.95it/s][A
Training:  46%|████▌     | 26/57 [00:07<00:08,  3.70it/s][A
Training:  51%|█████     | 29/57 [00:08<00:08,  3.40it/s][A
Training:  58%|█████▊    | 33/57 [00:09<00:06,  3.50it/s][A
Training:  63%|██████▎   | 36/57 [00:09<00:04,  4.72it/s][A
Training:  67%|██████▋   | 38/57 [00:10<00:04,  3.83it/s][A
Training:  72%|███████▏  | 41/57 [00

Epoch: 32/40 - Loss: 0.0710 - Accuracy: 0.9726



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:09,  1.41s/it][A
 50%|█████     | 4/8 [00:01<00:01,  3.37it/s][A
100%|██████████| 8/8 [00:02<00:00,  3.12it/s][A
Epochs:  80%|████████  | 32/40 [09:30<02:23, 18.00s/it]

Val Loss: 0.1309 - Val Accuracy: 0.9598



Training:   0%|          | 0/57 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/57 [00:01<01:20,  1.43s/it][A
Training:   9%|▉         | 5/57 [00:02<00:21,  2.41it/s][A
Training:  14%|█▍        | 8/57 [00:02<00:11,  4.28it/s][A
Training:  18%|█▊        | 10/57 [00:03<00:14,  3.15it/s][A
Training:  23%|██▎       | 13/57 [00:04<00:14,  3.02it/s][A
Training:  28%|██▊       | 16/57 [00:04<00:09,  4.47it/s][A
Training:  32%|███▏      | 18/57 [00:05<00:11,  3.47it/s][A
Training:  37%|███▋      | 21/57 [00:06<00:11,  3.20it/s][A
Training:  40%|████      | 23/57 [00:06<00:08,  4.06it/s][A
Training:  44%|████▍     | 25/57 [00:07<00:09,  3.28it/s][A
Training:  49%|████▉     | 28/57 [00:07<00:06,  4.70it/s][A
Training:  53%|█████▎    | 30/57 [00:08<00:07,  3.60it/s][A
Training:  58%|█████▊    | 33/57 [00:09<00:07,  3.28it/s][A
Training:  63%|██████▎   | 36/57 [00:09<00:04,  4.60it/s][A
Training:  67%|██████▋   | 38/57 [00:10<00:05,  3.76it/s][A
Training:  70%|███████   | 40/57 [0

Epoch: 33/40 - Loss: 0.0649 - Accuracy: 0.9753



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:09,  1.41s/it][A
 38%|███▊      | 3/8 [00:01<00:02,  2.39it/s][A
100%|██████████| 8/8 [00:02<00:00,  3.14it/s][A
Epochs:  82%|████████▎ | 33/40 [09:48<02:05, 17.97s/it]

Val Loss: 0.0901 - Val Accuracy: 0.9679



Training:   0%|          | 0/57 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/57 [00:01<01:21,  1.45s/it][A
Training:   7%|▋         | 4/57 [00:01<00:16,  3.25it/s][A
Training:  11%|█         | 6/57 [00:02<00:18,  2.70it/s][A
Training:  14%|█▍        | 8/57 [00:02<00:12,  4.03it/s][A
Training:  18%|█▊        | 10/57 [00:03<00:15,  2.98it/s][A
Training:  21%|██        | 12/57 [00:03<00:10,  4.11it/s][A
Training:  25%|██▍       | 14/57 [00:04<00:13,  3.18it/s][A
Training:  30%|██▉       | 17/57 [00:05<00:12,  3.17it/s][A
Training:  35%|███▌      | 20/57 [00:05<00:07,  4.66it/s][A
Training:  39%|███▊      | 22/57 [00:06<00:09,  3.59it/s][A
Training:  42%|████▏     | 24/57 [00:06<00:07,  4.38it/s][A
Training:  44%|████▍     | 25/57 [00:07<00:10,  3.01it/s][A
Training:  47%|████▋     | 27/57 [00:07<00:07,  4.04it/s][A
Training:  51%|█████     | 29/57 [00:08<00:08,  3.31it/s][A
Training:  54%|█████▍    | 31/57 [00:08<00:05,  4.37it/s][A
Training:  56%|█████▌    | 32/57 [00

Epoch: 34/40 - Loss: 0.0632 - Accuracy: 0.9765



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:09,  1.36s/it][A
 38%|███▊      | 3/8 [00:01<00:01,  2.51it/s][A
100%|██████████| 8/8 [00:02<00:00,  3.17it/s][A
Epochs:  85%|████████▌ | 34/40 [10:06<01:47, 17.94s/it]

Val Loss: 0.0920 - Val Accuracy: 0.9679



Training:   0%|          | 0/57 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/57 [00:01<01:26,  1.55s/it][A
Training:   9%|▉         | 5/57 [00:02<00:22,  2.27it/s][A
Training:  16%|█▌        | 9/57 [00:03<00:16,  2.83it/s][A
Training:  21%|██        | 12/57 [00:03<00:10,  4.25it/s][A
Training:  25%|██▍       | 14/57 [00:04<00:13,  3.28it/s][A
Training:  30%|██▉       | 17/57 [00:05<00:13,  3.02it/s][A
Training:  37%|███▋      | 21/57 [00:07<00:11,  3.24it/s][A
Training:  42%|████▏     | 24/57 [00:07<00:07,  4.42it/s][A
Training:  46%|████▌     | 26/57 [00:08<00:09,  3.43it/s][A
Training:  49%|████▉     | 28/57 [00:08<00:06,  4.21it/s][A
Training:  53%|█████▎    | 30/57 [00:09<00:07,  3.40it/s][A
Training:  58%|█████▊    | 33/57 [00:10<00:07,  3.29it/s][A
Training:  65%|██████▍   | 37/57 [00:11<00:05,  3.49it/s][A
Training:  70%|███████   | 40/57 [00:11<00:03,  4.75it/s][A
Training:  74%|███████▎  | 42/57 [00:12<00:04,  3.65it/s][A
Training:  79%|███████▉  | 45/57 [0

Epoch: 35/40 - Loss: 0.0628 - Accuracy: 0.9754



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:09,  1.37s/it][A
 50%|█████     | 4/8 [00:01<00:01,  3.13it/s][A
 62%|██████▎   | 5/8 [00:02<00:01,  2.24it/s][A
100%|██████████| 8/8 [00:02<00:00,  3.08it/s][A
Epochs:  88%|████████▊ | 35/40 [10:24<01:30, 18.08s/it]

Val Loss: 0.0965 - Val Accuracy: 0.9664



Training:   0%|          | 0/57 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/57 [00:01<01:18,  1.40s/it][A
Training:   7%|▋         | 4/57 [00:01<00:16,  3.30it/s][A
Training:  11%|█         | 6/57 [00:02<00:19,  2.66it/s][A
Training:  16%|█▌        | 9/57 [00:03<00:17,  2.75it/s][A
Training:  21%|██        | 12/57 [00:03<00:10,  4.32it/s][A
Training:  25%|██▍       | 14/57 [00:04<00:12,  3.32it/s][A
Training:  30%|██▉       | 17/57 [00:05<00:12,  3.15it/s][A
Training:  33%|███▎      | 19/57 [00:05<00:09,  4.04it/s][A
Training:  37%|███▋      | 21/57 [00:06<00:11,  3.08it/s][A
Training:  42%|████▏     | 24/57 [00:06<00:07,  4.58it/s][A
Training:  46%|████▌     | 26/57 [00:07<00:09,  3.35it/s][A
Training:  51%|█████     | 29/57 [00:09<00:08,  3.20it/s][A
Training:  56%|█████▌    | 32/57 [00:09<00:05,  4.50it/s][A
Training:  60%|█████▉    | 34/57 [00:10<00:06,  3.52it/s][A
Training:  65%|██████▍   | 37/57 [00:11<00:06,  3.32it/s][A
Training:  72%|███████▏  | 41/57 [00

Epoch: 36/40 - Loss: 0.0644 - Accuracy: 0.9753



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:09,  1.36s/it][A
100%|██████████| 8/8 [00:02<00:00,  3.20it/s][A
Epochs:  90%|█████████ | 36/40 [10:42<01:12, 18.08s/it]

Val Loss: 0.0933 - Val Accuracy: 0.9684



Training:   0%|          | 0/57 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/57 [00:01<01:16,  1.36s/it][A
Training:   7%|▋         | 4/57 [00:01<00:15,  3.52it/s][A
Training:  11%|█         | 6/57 [00:02<00:18,  2.71it/s][A
Training:  16%|█▌        | 9/57 [00:03<00:17,  2.69it/s][A
Training:  19%|█▉        | 11/57 [00:03<00:12,  3.59it/s][A
Training:  23%|██▎       | 13/57 [00:04<00:14,  3.08it/s][A
Training:  28%|██▊       | 16/57 [00:04<00:08,  4.78it/s][A
Training:  32%|███▏      | 18/57 [00:05<00:11,  3.55it/s][A
Training:  37%|███▋      | 21/57 [00:06<00:10,  3.31it/s][A
Training:  42%|████▏     | 24/57 [00:06<00:06,  4.74it/s][A
Training:  46%|████▌     | 26/57 [00:07<00:08,  3.65it/s][A
Training:  49%|████▉     | 28/57 [00:07<00:06,  4.64it/s][A
Training:  53%|█████▎    | 30/57 [00:08<00:07,  3.62it/s][A
Training:  58%|█████▊    | 33/57 [00:09<00:07,  3.30it/s][A
Training:  61%|██████▏   | 35/57 [00:09<00:05,  4.10it/s][A
Training:  65%|██████▍   | 37/57 [00

Epoch: 37/40 - Loss: 0.0641 - Accuracy: 0.9750



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:09,  1.39s/it][A
100%|██████████| 8/8 [00:02<00:00,  3.09it/s][A
Epochs:  92%|█████████▎| 37/40 [11:00<00:54, 18.05s/it]

Val Loss: 0.0911 - Val Accuracy: 0.9674



Training:   0%|          | 0/57 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/57 [00:01<01:17,  1.39s/it][A
Training:   4%|▎         | 2/57 [00:01<00:34,  1.58it/s][A
Training:   9%|▉         | 5/57 [00:02<00:20,  2.53it/s][A
Training:  14%|█▍        | 8/57 [00:02<00:10,  4.61it/s][A
Training:  18%|█▊        | 10/57 [00:03<00:14,  3.34it/s][A
Training:  23%|██▎       | 13/57 [00:04<00:13,  3.23it/s][A
Training:  26%|██▋       | 15/57 [00:04<00:10,  4.19it/s][A
Training:  30%|██▉       | 17/57 [00:05<00:12,  3.26it/s][A
Training:  33%|███▎      | 19/57 [00:05<00:09,  4.20it/s][A
Training:  37%|███▋      | 21/57 [00:06<00:11,  3.21it/s][A
Training:  42%|████▏     | 24/57 [00:06<00:06,  4.80it/s][A
Training:  46%|████▌     | 26/57 [00:07<00:08,  3.50it/s][A
Training:  51%|█████     | 29/57 [00:08<00:08,  3.32it/s][A
Training:  54%|█████▍    | 31/57 [00:08<00:06,  4.22it/s][A
Training:  58%|█████▊    | 33/57 [00:09<00:07,  3.42it/s][A
Training:  61%|██████▏   | 35/57 [00

Epoch: 38/40 - Loss: 0.0625 - Accuracy: 0.9757



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:08,  1.26s/it][A
 38%|███▊      | 3/8 [00:01<00:01,  2.50it/s][A
 62%|██████▎   | 5/8 [00:02<00:01,  2.44it/s][A
100%|██████████| 8/8 [00:02<00:00,  3.25it/s][A
Epochs:  95%|█████████▌| 38/40 [11:18<00:35, 17.99s/it]

Val Loss: 0.1046 - Val Accuracy: 0.9639



Training:   0%|          | 0/57 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/57 [00:01<01:16,  1.37s/it][A
Training:   9%|▉         | 5/57 [00:02<00:21,  2.46it/s][A
Training:  14%|█▍        | 8/57 [00:02<00:11,  4.13it/s][A
Training:  16%|█▌        | 9/57 [00:03<00:17,  2.72it/s][A
Training:  19%|█▉        | 11/57 [00:03<00:12,  3.76it/s][A
Training:  21%|██        | 12/57 [00:03<00:10,  4.27it/s][A
Training:  23%|██▎       | 13/57 [00:04<00:15,  2.83it/s][A
Training:  26%|██▋       | 15/57 [00:04<00:10,  4.07it/s][A
Training:  28%|██▊       | 16/57 [00:04<00:08,  4.62it/s][A
Training:  30%|██▉       | 17/57 [00:05<00:14,  2.69it/s][A
Training:  35%|███▌      | 20/57 [00:05<00:08,  4.48it/s][A
Training:  37%|███▋      | 21/57 [00:06<00:12,  2.87it/s][A
Training:  42%|████▏     | 24/57 [00:06<00:07,  4.33it/s][A
Training:  44%|████▍     | 25/57 [00:07<00:10,  3.10it/s][A
Training:  47%|████▋     | 27/57 [00:07<00:07,  4.22it/s][A
Training:  49%|████▉     | 28/57 [00

Epoch: 39/40 - Loss: 0.0617 - Accuracy: 0.9773



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:10,  1.43s/it][A
100%|██████████| 8/8 [00:02<00:00,  3.10it/s][A
Epochs:  98%|█████████▊| 39/40 [11:36<00:18, 18.03s/it]

Val Loss: 0.0908 - Val Accuracy: 0.9689



Training:   0%|          | 0/57 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/57 [00:01<01:22,  1.48s/it][A
Training:   5%|▌         | 3/57 [00:01<00:23,  2.34it/s][A
Training:   9%|▉         | 5/57 [00:02<00:21,  2.38it/s][A
Training:  14%|█▍        | 8/57 [00:02<00:10,  4.48it/s][A
Training:  18%|█▊        | 10/57 [00:03<00:14,  3.15it/s][A
Training:  23%|██▎       | 13/57 [00:04<00:13,  3.22it/s][A
Training:  25%|██▍       | 14/57 [00:04<00:11,  3.59it/s][A
Training:  30%|██▉       | 17/57 [00:05<00:11,  3.44it/s][A
Training:  33%|███▎      | 19/57 [00:05<00:08,  4.40it/s][A
Training:  37%|███▋      | 21/57 [00:06<00:10,  3.32it/s][A
Training:  40%|████      | 23/57 [00:06<00:07,  4.32it/s][A
Training:  42%|████▏     | 24/57 [00:06<00:06,  4.75it/s][A
Training:  44%|████▍     | 25/57 [00:07<00:10,  2.99it/s][A
Training:  46%|████▌     | 26/57 [00:07<00:08,  3.52it/s][A
Training:  49%|████▉     | 28/57 [00:07<00:05,  5.01it/s][A
Training:  51%|█████     | 29/57 [00

Epoch: 40/40 - Loss: 0.0614 - Accuracy: 0.9776



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:09,  1.33s/it][A
 38%|███▊      | 3/8 [00:01<00:01,  2.60it/s][A
 62%|██████▎   | 5/8 [00:02<00:01,  2.47it/s][A
100%|██████████| 8/8 [00:02<00:00,  3.23it/s][A
Epochs: 100%|██████████| 40/40 [11:54<00:00, 17.86s/it]
[32m[I 2023-12-11 23:49:49,115][0m Trial 2 finished with value: 0.9673694372177124 and parameters: {'learning_rate': 0.00010173550281282758, 'weight_decay': 0.008588437544705844, 'epsilon': 3.762780786582391e-09, 'batch_size': 249, 'epochs': 40}. Best is trial 2 with value: 0.9673694372177124.[0m


Val Loss: 0.0958 - Val Accuracy: 0.9674
Saving best model...
Learning rate: 0.003494281053007625
Weight decay: 0.0001149692699183165
Epsilon: 9.569821680316825e-09
Batch size: 98
Number of epochs: 48


Epochs:   0%|          | 0/48 [00:00<?, ?it/s]
Training:   0%|          | 0/143 [00:00<?, ?it/s][A
Training:   1%|          | 1/143 [00:00<01:40,  1.41it/s][A
Training:   3%|▎         | 5/143 [00:01<00:26,  5.12it/s][A
Training:   6%|▋         | 9/143 [00:01<00:18,  7.19it/s][A
Training:   9%|▉         | 13/143 [00:01<00:15,  8.21it/s][A
Training:  12%|█▏        | 17/143 [00:02<00:15,  7.98it/s][A
Training:  14%|█▍        | 20/143 [00:02<00:12, 10.10it/s][A
Training:  15%|█▌        | 22/143 [00:02<00:14,  8.52it/s][A
Training:  17%|█▋        | 25/143 [00:03<00:14,  8.32it/s][A
Training:  20%|██        | 29/143 [00:03<00:13,  8.77it/s][A
Training:  23%|██▎       | 33/143 [00:04<00:11,  9.22it/s][A
Training:  26%|██▌       | 37/143 [00:04<00:11,  9.42it/s][A
Training:  28%|██▊       | 40/143 [00:04<00:09, 11.41it/s][A
Training:  29%|██▉       | 42/143 [00:04<00:10,  9.36it/s][A
Training:  31%|███▏      | 45/143 [00:05<00:10,  8.91it/s][A
Training:  34%|███▍      | 49/143 [

Epoch: 1/48 - Loss: 0.4409 - Accuracy: 0.8953



  0%|          | 0/18 [00:00<?, ?it/s][A
  6%|▌         | 1/18 [00:00<00:12,  1.40it/s][A
 28%|██▊       | 5/18 [00:01<00:02,  5.17it/s][A
 50%|█████     | 9/18 [00:01<00:01,  6.99it/s][A
 56%|█████▌    | 10/18 [00:01<00:01,  7.30it/s][A
 72%|███████▏  | 13/18 [00:01<00:00,  7.90it/s][A
 83%|████████▎ | 15/18 [00:02<00:00,  9.47it/s][A
100%|██████████| 18/18 [00:02<00:00,  7.37it/s][A
Epochs:   2%|▏         | 1/48 [00:18<14:25, 18.42s/it]

Val Loss: 0.1325 - Val Accuracy: 0.9569



Training:   0%|          | 0/143 [00:00<?, ?it/s][A
Training:   1%|          | 1/143 [00:00<01:37,  1.46it/s][A
Training:   3%|▎         | 5/143 [00:01<00:26,  5.22it/s][A
Training:   6%|▋         | 9/143 [00:01<00:19,  6.84it/s][A
Training:   9%|▉         | 13/143 [00:01<00:16,  8.11it/s][A
Training:  12%|█▏        | 17/143 [00:02<00:15,  8.24it/s][A
Training:  15%|█▍        | 21/143 [00:02<00:14,  8.52it/s][A
Training:  17%|█▋        | 25/143 [00:03<00:13,  8.47it/s][A
Training:  20%|██        | 29/143 [00:03<00:13,  8.67it/s][A
Training:  23%|██▎       | 33/143 [00:04<00:12,  9.04it/s][A
Training:  26%|██▌       | 37/143 [00:04<00:11,  9.57it/s][A
Training:  29%|██▊       | 41/143 [00:04<00:10, 10.16it/s][A
Training:  31%|███       | 44/143 [00:04<00:08, 11.87it/s][A
Training:  32%|███▏      | 46/143 [00:05<00:10,  9.58it/s][A
Training:  34%|███▍      | 49/143 [00:05<00:10,  8.83it/s][A
Training:  36%|███▋      | 52/143 [00:05<00:08, 10.24it/s][A
Training:  38%|███▊

Epoch: 2/48 - Loss: 0.1346 - Accuracy: 0.9509



  0%|          | 0/18 [00:00<?, ?it/s][A
  6%|▌         | 1/18 [00:00<00:11,  1.50it/s][A
 28%|██▊       | 5/18 [00:01<00:02,  5.36it/s][A
 44%|████▍     | 8/18 [00:01<00:01,  8.80it/s][A
 56%|█████▌    | 10/18 [00:01<00:01,  7.76it/s][A
 67%|██████▋   | 12/18 [00:01<00:00,  9.06it/s][A
 78%|███████▊  | 14/18 [00:01<00:00,  8.17it/s][A
 89%|████████▉ | 16/18 [00:02<00:00,  8.86it/s][A
100%|██████████| 18/18 [00:02<00:00,  7.54it/s][A
Epochs:   4%|▍         | 2/48 [00:36<14:02, 18.31s/it]

Val Loss: 0.1423 - Val Accuracy: 0.9428



Training:   0%|          | 0/143 [00:00<?, ?it/s][A
Training:   1%|          | 1/143 [00:00<01:32,  1.54it/s][A
Training:   1%|▏         | 2/143 [00:00<00:47,  2.98it/s][A
Training:   3%|▎         | 5/143 [00:01<00:24,  5.63it/s][A
Training:   6%|▌         | 8/143 [00:01<00:14,  9.07it/s][A
Training:   7%|▋         | 10/143 [00:01<00:18,  7.38it/s][A
Training:   9%|▉         | 13/143 [00:01<00:16,  7.97it/s][A
Training:  12%|█▏        | 17/143 [00:02<00:13,  9.06it/s][A
Training:  13%|█▎        | 19/143 [00:02<00:12, 10.29it/s][A
Training:  15%|█▍        | 21/143 [00:02<00:13,  9.11it/s][A
Training:  16%|█▌        | 23/143 [00:02<00:11, 10.53it/s][A
Training:  17%|█▋        | 25/143 [00:03<00:14,  8.25it/s][A
Training:  20%|█▉        | 28/143 [00:03<00:11, 10.35it/s][A
Training:  21%|██        | 30/143 [00:03<00:12,  8.91it/s][A
Training:  22%|██▏       | 32/143 [00:03<00:10, 10.18it/s][A
Training:  24%|██▍       | 34/143 [00:04<00:13,  8.37it/s][A
Training:  25%|██▌  

Epoch: 3/48 - Loss: 0.1227 - Accuracy: 0.9554



  0%|          | 0/18 [00:00<?, ?it/s][A
  6%|▌         | 1/18 [00:00<00:12,  1.39it/s][A
 28%|██▊       | 5/18 [00:01<00:02,  5.01it/s][A
 50%|█████     | 9/18 [00:01<00:01,  6.91it/s][A
 72%|███████▏  | 13/18 [00:02<00:00,  7.68it/s][A
100%|██████████| 18/18 [00:02<00:00,  7.22it/s][A
Epochs:   6%|▋         | 3/48 [00:54<13:43, 18.30s/it]

Val Loss: 0.1319 - Val Accuracy: 0.9537



Training:   0%|          | 0/143 [00:00<?, ?it/s][A
Training:   1%|          | 1/143 [00:00<01:46,  1.34it/s][A
Training:   3%|▎         | 5/143 [00:01<00:27,  4.94it/s][A
Training:   6%|▋         | 9/143 [00:01<00:20,  6.61it/s][A
Training:   9%|▉         | 13/143 [00:02<00:16,  7.74it/s][A
Training:  12%|█▏        | 17/143 [00:02<00:15,  8.32it/s][A
Training:  15%|█▍        | 21/143 [00:02<00:14,  8.65it/s][A
Training:  17%|█▋        | 25/143 [00:03<00:13,  8.72it/s][A
Training:  20%|██        | 29/143 [00:03<00:12,  9.08it/s][A
Training:  23%|██▎       | 33/143 [00:04<00:11,  9.43it/s][A
Training:  26%|██▌       | 37/143 [00:04<00:11,  9.60it/s][A
Training:  27%|██▋       | 39/143 [00:04<00:10, 10.29it/s][A
Training:  29%|██▊       | 41/143 [00:04<00:11,  8.83it/s][A
Training:  31%|███▏      | 45/143 [00:05<00:10,  9.01it/s][A
Training:  33%|███▎      | 47/143 [00:05<00:09, 10.13it/s][A
Training:  34%|███▍      | 49/143 [00:05<00:11,  8.32it/s][A
Training:  37%|███▋

Epoch: 4/48 - Loss: 0.1193 - Accuracy: 0.9573



  0%|          | 0/18 [00:00<?, ?it/s][A
  6%|▌         | 1/18 [00:00<00:10,  1.56it/s][A
 28%|██▊       | 5/18 [00:01<00:02,  5.13it/s][A
 50%|█████     | 9/18 [00:01<00:01,  6.96it/s][A
 72%|███████▏  | 13/18 [00:01<00:00,  7.69it/s][A
100%|██████████| 18/18 [00:02<00:00,  7.31it/s][A
Epochs:   8%|▊         | 4/48 [01:13<13:27, 18.35s/it]

Val Loss: 0.1163 - Val Accuracy: 0.9644



Training:   0%|          | 0/143 [00:00<?, ?it/s][A
Training:   1%|          | 1/143 [00:00<01:40,  1.42it/s][A
Training:   3%|▎         | 5/143 [00:01<00:28,  4.90it/s][A
Training:   6%|▋         | 9/143 [00:01<00:20,  6.48it/s][A
Training:   9%|▉         | 13/143 [00:02<00:17,  7.54it/s][A
Training:  12%|█▏        | 17/143 [00:02<00:15,  8.22it/s][A
Training:  15%|█▍        | 21/143 [00:02<00:14,  8.68it/s][A
Training:  17%|█▋        | 25/143 [00:03<00:13,  8.90it/s][A
Training:  20%|██        | 29/143 [00:03<00:12,  9.29it/s][A
Training:  23%|██▎       | 33/143 [00:04<00:12,  9.07it/s][A
Training:  26%|██▌       | 37/143 [00:04<00:11,  9.15it/s][A
Training:  29%|██▊       | 41/143 [00:04<00:10,  9.48it/s][A
Training:  31%|███▏      | 45/143 [00:05<00:10,  9.52it/s][A
Training:  34%|███▍      | 49/143 [00:05<00:09,  9.55it/s][A
Training:  37%|███▋      | 53/143 [00:06<00:09,  9.30it/s][A
Training:  40%|███▉      | 57/143 [00:06<00:09,  9.05it/s][A
Training:  43%|████

Epoch: 5/48 - Loss: 0.1241 - Accuracy: 0.9553



  0%|          | 0/18 [00:00<?, ?it/s][A
  6%|▌         | 1/18 [00:00<00:11,  1.48it/s][A
 28%|██▊       | 5/18 [00:01<00:02,  5.32it/s][A
 50%|█████     | 9/18 [00:01<00:01,  6.80it/s][A
 72%|███████▏  | 13/18 [00:01<00:00,  7.84it/s][A
100%|██████████| 18/18 [00:02<00:00,  7.39it/s][A
Epochs:  10%|█         | 5/48 [01:31<13:06, 18.28s/it]

Val Loss: 0.1433 - Val Accuracy: 0.9534



Training:   0%|          | 0/143 [00:00<?, ?it/s][A
Training:   1%|          | 1/143 [00:00<01:34,  1.50it/s][A
Training:   3%|▎         | 5/143 [00:01<00:26,  5.23it/s][A
Training:   5%|▍         | 7/143 [00:01<00:19,  7.11it/s][A
Training:   6%|▋         | 9/143 [00:01<00:19,  6.93it/s][A
Training:   9%|▉         | 13/143 [00:01<00:15,  8.34it/s][A
Training:  12%|█▏        | 17/143 [00:02<00:14,  8.56it/s][A
Training:  15%|█▍        | 21/143 [00:02<00:13,  8.99it/s][A
Training:  17%|█▋        | 25/143 [00:03<00:13,  8.97it/s][A
Training:  20%|█▉        | 28/143 [00:03<00:10, 10.69it/s][A
Training:  21%|██        | 30/143 [00:03<00:12,  9.11it/s][A
Training:  23%|██▎       | 33/143 [00:04<00:12,  8.67it/s][A
Training:  26%|██▌       | 37/143 [00:04<00:11,  9.25it/s][A
Training:  29%|██▊       | 41/143 [00:04<00:10,  9.80it/s][A
Training:  30%|███       | 43/143 [00:04<00:09, 10.37it/s][A
Training:  31%|███▏      | 45/143 [00:05<00:10,  9.39it/s][A
Training:  33%|███▎ 

Epoch: 6/48 - Loss: 0.1247 - Accuracy: 0.9561



  0%|          | 0/18 [00:00<?, ?it/s][A
  6%|▌         | 1/18 [00:00<00:11,  1.50it/s][A
 22%|██▏       | 4/18 [00:00<00:02,  6.44it/s][A
 33%|███▎      | 6/18 [00:01<00:01,  6.46it/s][A
 50%|█████     | 9/18 [00:01<00:01,  6.80it/s][A
 67%|██████▋   | 12/18 [00:01<00:00,  9.91it/s][A
 78%|███████▊  | 14/18 [00:01<00:00,  8.10it/s][A
100%|██████████| 18/18 [00:02<00:00,  7.52it/s][A
Epochs:  12%|█▎        | 6/48 [01:49<12:46, 18.26s/it]

Val Loss: 0.1270 - Val Accuracy: 0.9467



Training:   0%|          | 0/143 [00:00<?, ?it/s][A
Training:   1%|          | 1/143 [00:00<01:37,  1.45it/s][A
Training:   3%|▎         | 5/143 [00:01<00:26,  5.15it/s][A
Training:   6%|▋         | 9/143 [00:01<00:20,  6.68it/s][A
Training:   9%|▉         | 13/143 [00:02<00:17,  7.55it/s][A
Training:  12%|█▏        | 17/143 [00:02<00:15,  8.09it/s][A
Training:  15%|█▍        | 21/143 [00:02<00:14,  8.45it/s][A
Training:  17%|█▋        | 25/143 [00:03<00:13,  8.61it/s][A
Training:  20%|██        | 29/143 [00:03<00:12,  8.96it/s][A
Training:  23%|██▎       | 33/143 [00:04<00:11,  9.52it/s][A
Training:  26%|██▌       | 37/143 [00:04<00:10,  9.74it/s][A
Training:  29%|██▊       | 41/143 [00:04<00:10,  9.70it/s][A
Training:  31%|███▏      | 45/143 [00:05<00:10,  9.61it/s][A
Training:  34%|███▎      | 48/143 [00:05<00:08, 11.50it/s][A
Training:  35%|███▍      | 50/143 [00:05<00:09,  9.82it/s][A
Training:  36%|███▋      | 52/143 [00:05<00:08, 10.59it/s][A
Training:  38%|███▊

Epoch: 7/48 - Loss: 0.1492 - Accuracy: 0.9519



  0%|          | 0/18 [00:00<?, ?it/s][A
  6%|▌         | 1/18 [00:00<00:11,  1.49it/s][A
 28%|██▊       | 5/18 [00:01<00:02,  5.52it/s][A
 39%|███▉      | 7/18 [00:01<00:01,  7.59it/s][A
 50%|█████     | 9/18 [00:01<00:01,  7.02it/s][A
 67%|██████▋   | 12/18 [00:01<00:00,  9.76it/s][A
 78%|███████▊  | 14/18 [00:01<00:00,  8.73it/s][A
 89%|████████▉ | 16/18 [00:02<00:00,  9.69it/s][A
100%|██████████| 18/18 [00:02<00:00,  7.66it/s][A
Epochs:  15%|█▍        | 7/48 [02:07<12:28, 18.26s/it]

Val Loss: 0.2045 - Val Accuracy: 0.9473



Training:   0%|          | 0/143 [00:00<?, ?it/s][A
Training:   1%|          | 1/143 [00:00<01:35,  1.49it/s][A
Training:   3%|▎         | 5/143 [00:01<00:26,  5.27it/s][A
Training:   5%|▍         | 7/143 [00:01<00:18,  7.21it/s][A
Training:   6%|▋         | 9/143 [00:01<00:19,  6.77it/s][A
Training:   9%|▉         | 13/143 [00:01<00:16,  7.78it/s][A
Training:  10%|█         | 15/143 [00:02<00:14,  9.06it/s][A
Training:  12%|█▏        | 17/143 [00:02<00:16,  7.71it/s][A
Training:  13%|█▎        | 18/143 [00:02<00:16,  7.79it/s][A
Training:  15%|█▍        | 21/143 [00:02<00:14,  8.58it/s][A
Training:  15%|█▌        | 22/143 [00:03<00:14,  8.33it/s][A
Training:  17%|█▋        | 25/143 [00:03<00:13,  8.59it/s][A
Training:  19%|█▉        | 27/143 [00:03<00:11, 10.01it/s][A
Training:  20%|██        | 29/143 [00:03<00:12,  9.19it/s][A
Training:  22%|██▏       | 31/143 [00:03<00:10, 10.88it/s][A
Training:  23%|██▎       | 33/143 [00:04<00:11,  9.51it/s][A
Training:  26%|██▌  

Epoch: 8/48 - Loss: 0.1561 - Accuracy: 0.9521



  0%|          | 0/18 [00:00<?, ?it/s][A
  6%|▌         | 1/18 [00:00<00:11,  1.49it/s][A
 28%|██▊       | 5/18 [00:01<00:02,  5.00it/s][A
 50%|█████     | 9/18 [00:01<00:01,  6.60it/s][A
 72%|███████▏  | 13/18 [00:02<00:00,  7.45it/s][A
100%|██████████| 18/18 [00:02<00:00,  7.12it/s][A
Epochs:  17%|█▋        | 8/48 [02:26<12:11, 18.29s/it]

Val Loss: 0.1804 - Val Accuracy: 0.9330



Training:   0%|          | 0/143 [00:00<?, ?it/s][A
Training:   1%|          | 1/143 [00:00<01:40,  1.42it/s][A
Training:   3%|▎         | 5/143 [00:01<00:25,  5.41it/s][A
Training:   6%|▋         | 9/143 [00:01<00:18,  7.29it/s][A
Training:   8%|▊         | 11/143 [00:01<00:14,  8.87it/s][A
Training:   9%|▉         | 13/143 [00:01<00:15,  8.26it/s][A
Training:  10%|█         | 15/143 [00:01<00:12,  9.88it/s][A
Training:  12%|█▏        | 17/143 [00:02<00:13,  9.10it/s][A
Training:  14%|█▍        | 20/143 [00:02<00:10, 11.20it/s][A
Training:  15%|█▌        | 22/143 [00:02<00:12,  9.45it/s][A
Training:  17%|█▋        | 24/143 [00:02<00:10, 10.91it/s][A
Training:  18%|█▊        | 26/143 [00:03<00:13,  8.98it/s][A
Training:  20%|█▉        | 28/143 [00:03<00:11, 10.05it/s][A
Training:  21%|██        | 30/143 [00:03<00:13,  8.39it/s][A
Training:  23%|██▎       | 33/143 [00:03<00:13,  8.27it/s][A
Training:  25%|██▌       | 36/143 [00:04<00:09, 11.04it/s][A
Training:  27%|██▋ 

Epoch: 9/48 - Loss: 0.1943 - Accuracy: 0.9475



  0%|          | 0/18 [00:00<?, ?it/s][A
  6%|▌         | 1/18 [00:00<00:10,  1.57it/s][A
 22%|██▏       | 4/18 [00:00<00:02,  6.70it/s][A
 33%|███▎      | 6/18 [00:01<00:02,  5.67it/s][A
 50%|█████     | 9/18 [00:01<00:01,  6.88it/s][A
 61%|██████    | 11/18 [00:01<00:00,  8.60it/s][A
 72%|███████▏  | 13/18 [00:01<00:00,  7.65it/s][A
 89%|████████▉ | 16/18 [00:02<00:00, 10.64it/s][A
100%|██████████| 18/18 [00:02<00:00,  7.50it/s][A
Epochs:  19%|█▉        | 9/48 [02:44<11:48, 18.18s/it]

Val Loss: 0.2245 - Val Accuracy: 0.9486



Training:   0%|          | 0/143 [00:00<?, ?it/s][A
Training:   1%|          | 1/143 [00:00<01:27,  1.62it/s][A
Training:   3%|▎         | 4/143 [00:00<00:20,  6.70it/s][A
Training:   4%|▍         | 6/143 [00:01<00:23,  5.81it/s][A
Training:   6%|▋         | 9/143 [00:01<00:18,  7.16it/s][A
Training:   8%|▊         | 11/143 [00:01<00:14,  8.92it/s][A
Training:   9%|▉         | 13/143 [00:01<00:15,  8.26it/s][A
Training:  10%|█         | 15/143 [00:01<00:12, 10.05it/s][A
Training:  12%|█▏        | 17/143 [00:02<00:14,  8.85it/s][A
Training:  13%|█▎        | 19/143 [00:02<00:12, 10.26it/s][A
Training:  15%|█▍        | 21/143 [00:02<00:13,  8.88it/s][A
Training:  16%|█▌        | 23/143 [00:02<00:11, 10.46it/s][A
Training:  17%|█▋        | 25/143 [00:03<00:13,  8.45it/s][A
Training:  20%|█▉        | 28/143 [00:03<00:10, 11.30it/s][A
Training:  21%|██        | 30/143 [00:03<00:13,  8.42it/s][A
Training:  23%|██▎       | 33/143 [00:03<00:13,  8.33it/s][A
Training:  26%|██▌  

Epoch: 10/48 - Loss: 0.1883 - Accuracy: 0.9503



  0%|          | 0/18 [00:00<?, ?it/s][A
  6%|▌         | 1/18 [00:00<00:11,  1.47it/s][A
 28%|██▊       | 5/18 [00:01<00:02,  5.48it/s][A
 39%|███▉      | 7/18 [00:01<00:01,  7.49it/s][A
 50%|█████     | 9/18 [00:01<00:01,  6.70it/s][A
 67%|██████▋   | 12/18 [00:01<00:00,  9.24it/s][A
 78%|███████▊  | 14/18 [00:01<00:00,  8.78it/s][A
 89%|████████▉ | 16/18 [00:02<00:00,  9.68it/s][A
100%|██████████| 18/18 [00:02<00:00,  7.51it/s][A
Epochs:  21%|██        | 10/48 [03:02<11:29, 18.13s/it]

Val Loss: 0.1449 - Val Accuracy: 0.9559



Training:   0%|          | 0/143 [00:00<?, ?it/s][A
Training:   1%|          | 1/143 [00:00<01:43,  1.38it/s][A
Training:   3%|▎         | 4/143 [00:00<00:22,  6.08it/s][A
Training:   4%|▍         | 6/143 [00:01<00:23,  5.89it/s][A
Training:   6%|▋         | 9/143 [00:01<00:20,  6.57it/s][A
Training:   9%|▉         | 13/143 [00:02<00:17,  7.46it/s][A
Training:  12%|█▏        | 17/143 [00:02<00:14,  8.48it/s][A
Training:  15%|█▍        | 21/143 [00:02<00:14,  8.57it/s][A
Training:  17%|█▋        | 25/143 [00:03<00:13,  8.83it/s][A
Training:  20%|█▉        | 28/143 [00:03<00:10, 10.66it/s][A
Training:  21%|██        | 30/143 [00:03<00:11,  9.85it/s][A
Training:  22%|██▏       | 32/143 [00:03<00:10, 10.64it/s][A
Training:  24%|██▍       | 34/143 [00:04<00:11,  9.28it/s][A
Training:  25%|██▌       | 36/143 [00:04<00:10, 10.53it/s][A
Training:  27%|██▋       | 38/143 [00:04<00:11,  9.34it/s][A
Training:  28%|██▊       | 40/143 [00:04<00:09, 10.83it/s][A
Training:  29%|██▉  

Epoch: 11/48 - Loss: 0.1725 - Accuracy: 0.9534



  0%|          | 0/18 [00:00<?, ?it/s][A
  6%|▌         | 1/18 [00:00<00:10,  1.65it/s][A
 28%|██▊       | 5/18 [00:01<00:02,  5.35it/s][A
 50%|█████     | 9/18 [00:01<00:01,  6.90it/s][A
 67%|██████▋   | 12/18 [00:01<00:00,  9.65it/s][A
 78%|███████▊  | 14/18 [00:02<00:00,  7.79it/s][A
100%|██████████| 18/18 [00:02<00:00,  7.29it/s][A
Epochs:  23%|██▎       | 11/48 [03:20<11:10, 18.12s/it]

Val Loss: 0.2051 - Val Accuracy: 0.9518



Training:   0%|          | 0/143 [00:00<?, ?it/s][A
Training:   1%|          | 1/143 [00:00<01:43,  1.37it/s][A
Training:   3%|▎         | 5/143 [00:01<00:27,  5.03it/s][A
Training:   6%|▋         | 9/143 [00:01<00:20,  6.57it/s][A
Training:   9%|▉         | 13/143 [00:02<00:17,  7.37it/s][A
Training:  12%|█▏        | 17/143 [00:02<00:14,  8.45it/s][A
Training:  15%|█▍        | 21/143 [00:02<00:14,  8.59it/s][A
Training:  17%|█▋        | 25/143 [00:03<00:13,  8.86it/s][A
Training:  20%|██        | 29/143 [00:03<00:12,  8.97it/s][A
Training:  22%|██▏       | 32/143 [00:03<00:10, 10.91it/s][A
Training:  24%|██▍       | 34/143 [00:04<00:11,  9.08it/s][A
Training:  26%|██▌       | 37/143 [00:04<00:12,  8.53it/s][A
Training:  29%|██▊       | 41/143 [00:05<00:11,  8.88it/s][A
Training:  31%|███▏      | 45/143 [00:05<00:11,  8.84it/s][A
Training:  34%|███▍      | 49/143 [00:06<00:11,  8.41it/s][A
Training:  37%|███▋      | 53/143 [00:06<00:10,  8.76it/s][A
Training:  40%|███▉

Epoch: 12/48 - Loss: 0.2177 - Accuracy: 0.9502



  0%|          | 0/18 [00:00<?, ?it/s][A
  6%|▌         | 1/18 [00:00<00:11,  1.46it/s][A
 28%|██▊       | 5/18 [00:01<00:02,  5.34it/s][A
 50%|█████     | 9/18 [00:01<00:01,  6.90it/s][A
 72%|███████▏  | 13/18 [00:01<00:00,  7.82it/s][A
100%|██████████| 18/18 [00:02<00:00,  7.46it/s][A
Epochs:  25%|██▌       | 12/48 [03:38<10:52, 18.13s/it]

Val Loss: 0.1894 - Val Accuracy: 0.9513



Training:   0%|          | 0/143 [00:00<?, ?it/s][A
Training:   1%|          | 1/143 [00:00<01:35,  1.49it/s][A
Training:   3%|▎         | 4/143 [00:00<00:21,  6.43it/s][A
Training:   4%|▍         | 6/143 [00:01<00:22,  6.05it/s][A
Training:   6%|▋         | 9/143 [00:01<00:20,  6.63it/s][A
Training:   8%|▊         | 11/143 [00:01<00:15,  8.37it/s][A
Training:   9%|▉         | 13/143 [00:02<00:17,  7.23it/s][A
Training:  12%|█▏        | 17/143 [00:02<00:15,  8.30it/s][A
Training:  15%|█▍        | 21/143 [00:02<00:14,  8.32it/s][A
Training:  17%|█▋        | 25/143 [00:03<00:13,  8.67it/s][A
Training:  20%|██        | 29/143 [00:03<00:12,  8.88it/s][A
Training:  23%|██▎       | 33/143 [00:04<00:12,  9.11it/s][A
Training:  26%|██▌       | 37/143 [00:04<00:11,  9.11it/s][A
Training:  29%|██▊       | 41/143 [00:04<00:10,  9.67it/s][A
Training:  31%|███▏      | 45/143 [00:05<00:10,  9.61it/s][A
Training:  34%|███▍      | 49/143 [00:05<00:09,  9.57it/s][A
Training:  37%|███▋ 

Epoch: 13/48 - Loss: 0.2444 - Accuracy: 0.9492



  0%|          | 0/18 [00:00<?, ?it/s][A
  6%|▌         | 1/18 [00:00<00:10,  1.64it/s][A
 22%|██▏       | 4/18 [00:00<00:02,  6.61it/s][A
 33%|███▎      | 6/18 [00:01<00:01,  6.33it/s][A
 50%|█████     | 9/18 [00:01<00:01,  6.64it/s][A
 72%|███████▏  | 13/18 [00:01<00:00,  8.05it/s][A
 89%|████████▉ | 16/18 [00:02<00:00, 10.69it/s][A
100%|██████████| 18/18 [00:02<00:00,  7.57it/s][A
Epochs:  27%|██▋       | 13/48 [03:56<10:33, 18.11s/it]

Val Loss: 0.2919 - Val Accuracy: 0.9616



Training:   0%|          | 0/143 [00:00<?, ?it/s][A
Training:   1%|          | 1/143 [00:00<01:42,  1.38it/s][A
Training:   3%|▎         | 5/143 [00:01<00:26,  5.16it/s][A
Training:   6%|▋         | 9/143 [00:01<00:19,  6.86it/s][A
Training:   9%|▉         | 13/143 [00:01<00:15,  8.23it/s][A
Training:  12%|█▏        | 17/143 [00:02<00:14,  8.86it/s][A
Training:  15%|█▍        | 21/143 [00:02<00:13,  9.00it/s][A
Training:  17%|█▋        | 25/143 [00:03<00:13,  9.01it/s][A
Training:  20%|██        | 29/143 [00:03<00:12,  9.32it/s][A
Training:  23%|██▎       | 33/143 [00:04<00:12,  9.05it/s][A
Training:  26%|██▌       | 37/143 [00:04<00:11,  9.36it/s][A
Training:  29%|██▊       | 41/143 [00:04<00:10,  9.54it/s][A
Training:  31%|███▏      | 45/143 [00:05<00:10,  9.42it/s][A
Training:  34%|███▍      | 49/143 [00:05<00:10,  9.24it/s][A
Training:  37%|███▋      | 53/143 [00:06<00:09,  9.35it/s][A
Training:  39%|███▉      | 56/143 [00:06<00:07, 10.98it/s][A
Training:  41%|████

Epoch: 14/48 - Loss: 0.2162 - Accuracy: 0.9538



  0%|          | 0/18 [00:00<?, ?it/s][A
  6%|▌         | 1/18 [00:00<00:10,  1.60it/s][A
 28%|██▊       | 5/18 [00:01<00:02,  5.69it/s][A
 44%|████▍     | 8/18 [00:01<00:01,  8.90it/s][A
 56%|█████▌    | 10/18 [00:01<00:01,  7.75it/s][A
 67%|██████▋   | 12/18 [00:01<00:00,  9.18it/s][A
 78%|███████▊  | 14/18 [00:01<00:00,  8.19it/s][A
 89%|████████▉ | 16/18 [00:02<00:00,  9.23it/s][A
100%|██████████| 18/18 [00:02<00:00,  7.59it/s][A
Epochs:  29%|██▉       | 14/48 [04:14<10:16, 18.13s/it]

Val Loss: 0.1710 - Val Accuracy: 0.9571



Training:   0%|          | 0/143 [00:00<?, ?it/s][A
Training:   1%|          | 1/143 [00:00<01:23,  1.69it/s][A
Training:   1%|▏         | 2/143 [00:00<00:42,  3.29it/s][A
Training:   3%|▎         | 5/143 [00:01<00:23,  5.90it/s][A
Training:   5%|▍         | 7/143 [00:01<00:17,  7.68it/s][A
Training:   6%|▋         | 9/143 [00:01<00:18,  7.31it/s][A
Training:   8%|▊         | 11/143 [00:01<00:14,  9.27it/s][A
Training:   9%|▉         | 13/143 [00:01<00:15,  8.44it/s][A
Training:  10%|█         | 15/143 [00:01<00:12, 10.20it/s][A
Training:  12%|█▏        | 17/143 [00:02<00:15,  8.26it/s][A
Training:  13%|█▎        | 19/143 [00:02<00:12, 10.05it/s][A
Training:  15%|█▍        | 21/143 [00:02<00:14,  8.36it/s][A
Training:  16%|█▌        | 23/143 [00:02<00:12,  9.94it/s][A
Training:  17%|█▋        | 25/143 [00:03<00:14,  8.05it/s][A
Training:  20%|██        | 29/143 [00:03<00:13,  8.64it/s][A
Training:  22%|██▏       | 31/143 [00:03<00:11,  9.85it/s][A
Training:  23%|██▎   

Epoch: 15/48 - Loss: 0.1936 - Accuracy: 0.9579



  0%|          | 0/18 [00:00<?, ?it/s][A
  6%|▌         | 1/18 [00:00<00:11,  1.44it/s][A
 28%|██▊       | 5/18 [00:01<00:02,  4.76it/s][A
 50%|█████     | 9/18 [00:01<00:01,  6.66it/s][A
 72%|███████▏  | 13/18 [00:02<00:00,  7.55it/s][A
100%|██████████| 18/18 [00:02<00:00,  7.13it/s][A
Epochs:  31%|███▏      | 15/48 [04:33<10:00, 18.19s/it]

Val Loss: 0.2487 - Val Accuracy: 0.9467



Training:   0%|          | 0/143 [00:00<?, ?it/s][A
Training:   1%|          | 1/143 [00:00<01:35,  1.49it/s][A
Training:   3%|▎         | 5/143 [00:01<00:25,  5.31it/s][A
Training:   6%|▋         | 9/143 [00:01<00:18,  7.27it/s][A
Training:   9%|▉         | 13/143 [00:01<00:16,  8.03it/s][A
Training:  12%|█▏        | 17/143 [00:02<00:14,  8.44it/s][A
Training:  15%|█▍        | 21/143 [00:02<00:14,  8.24it/s][A
Training:  17%|█▋        | 25/143 [00:03<00:13,  8.63it/s][A
Training:  20%|██        | 29/143 [00:03<00:13,  8.61it/s][A
Training:  23%|██▎       | 33/143 [00:04<00:11,  9.23it/s][A
Training:  26%|██▌       | 37/143 [00:04<00:11,  9.25it/s][A
Training:  29%|██▊       | 41/143 [00:05<00:11,  8.88it/s][A
Training:  31%|███       | 44/143 [00:05<00:09, 10.74it/s][A
Training:  32%|███▏      | 46/143 [00:05<00:10,  8.92it/s][A
Training:  34%|███▍      | 49/143 [00:05<00:10,  8.76it/s][A
Training:  37%|███▋      | 53/143 [00:06<00:09,  9.19it/s][A
Training:  40%|███▉

Epoch: 16/48 - Loss: 0.2435 - Accuracy: 0.9497



  0%|          | 0/18 [00:00<?, ?it/s][A
  6%|▌         | 1/18 [00:00<00:11,  1.50it/s][A
 28%|██▊       | 5/18 [00:01<00:02,  5.58it/s][A
 44%|████▍     | 8/18 [00:01<00:01,  9.02it/s][A
 56%|█████▌    | 10/18 [00:01<00:01,  7.90it/s][A
 67%|██████▋   | 12/18 [00:01<00:00,  9.39it/s][A
 78%|███████▊  | 14/18 [00:01<00:00,  8.37it/s][A
 89%|████████▉ | 16/18 [00:01<00:00, 10.16it/s][A
100%|██████████| 18/18 [00:02<00:00,  7.71it/s][A
Epochs:  33%|███▎      | 16/48 [04:51<09:42, 18.22s/it]

Val Loss: 0.6428 - Val Accuracy: 0.9341



Training:   0%|          | 0/143 [00:00<?, ?it/s][A
Training:   1%|          | 1/143 [00:00<01:33,  1.52it/s][A
Training:   3%|▎         | 4/143 [00:00<00:21,  6.40it/s][A
Training:   4%|▍         | 6/143 [00:01<00:20,  6.55it/s][A
Training:   6%|▋         | 9/143 [00:01<00:17,  7.65it/s][A
Training:   8%|▊         | 11/143 [00:01<00:14,  9.30it/s][A
Training:   9%|▉         | 13/143 [00:01<00:16,  7.88it/s][A
Training:  11%|█         | 16/143 [00:02<00:12, 10.07it/s][A
Training:  13%|█▎        | 18/143 [00:02<00:14,  8.76it/s][A
Training:  14%|█▍        | 20/143 [00:02<00:11, 10.34it/s][A
Training:  15%|█▌        | 22/143 [00:02<00:14,  8.47it/s][A
Training:  17%|█▋        | 24/143 [00:02<00:12,  9.75it/s][A
Training:  18%|█▊        | 26/143 [00:03<00:13,  8.89it/s][A
Training:  20%|█▉        | 28/143 [00:03<00:11,  9.74it/s][A
Training:  21%|██        | 30/143 [00:03<00:12,  9.28it/s][A
Training:  22%|██▏       | 32/143 [00:03<00:10, 10.35it/s][A
Training:  24%|██▍  

Epoch: 17/48 - Loss: 0.2703 - Accuracy: 0.9516



  0%|          | 0/18 [00:00<?, ?it/s][A
  6%|▌         | 1/18 [00:00<00:10,  1.56it/s][A
 22%|██▏       | 4/18 [00:00<00:02,  6.61it/s][A
 33%|███▎      | 6/18 [00:01<00:01,  6.56it/s][A
 50%|█████     | 9/18 [00:01<00:01,  6.88it/s][A
 67%|██████▋   | 12/18 [00:01<00:00,  9.35it/s][A
 78%|███████▊  | 14/18 [00:01<00:00,  8.27it/s][A
 89%|████████▉ | 16/18 [00:02<00:00,  9.46it/s][A
100%|██████████| 18/18 [00:02<00:00,  7.44it/s][A
Epochs:  35%|███▌      | 17/48 [05:09<09:22, 18.16s/it]

Val Loss: 0.2403 - Val Accuracy: 0.9565



Training:   0%|          | 0/143 [00:00<?, ?it/s][A
Training:   1%|          | 1/143 [00:00<01:41,  1.40it/s][A
Training:   3%|▎         | 5/143 [00:01<00:27,  5.11it/s][A
Training:   6%|▋         | 9/143 [00:01<00:19,  6.95it/s][A
Training:   9%|▉         | 13/143 [00:01<00:16,  8.01it/s][A
Training:  12%|█▏        | 17/143 [00:02<00:14,  8.53it/s][A
Training:  15%|█▍        | 21/143 [00:02<00:14,  8.54it/s][A
Training:  17%|█▋        | 25/143 [00:03<00:13,  9.07it/s][A
Training:  20%|██        | 29/143 [00:03<00:12,  9.29it/s][A
Training:  23%|██▎       | 33/143 [00:04<00:11,  9.44it/s][A
Training:  26%|██▌       | 37/143 [00:04<00:10,  9.95it/s][A
Training:  27%|██▋       | 39/143 [00:04<00:09, 10.86it/s][A
Training:  29%|██▊       | 41/143 [00:04<00:10,  9.45it/s][A
Training:  30%|███       | 43/143 [00:04<00:09, 10.36it/s][A
Training:  31%|███▏      | 45/143 [00:05<00:11,  8.88it/s][A
Training:  33%|███▎      | 47/143 [00:05<00:09, 10.29it/s][A
Training:  34%|███▍

Epoch: 18/48 - Loss: 0.2171 - Accuracy: 0.9574



  0%|          | 0/18 [00:00<?, ?it/s][A
  6%|▌         | 1/18 [00:00<00:11,  1.54it/s][A
 28%|██▊       | 5/18 [00:01<00:02,  5.37it/s][A
 50%|█████     | 9/18 [00:01<00:01,  7.09it/s][A
 67%|██████▋   | 12/18 [00:01<00:00,  9.83it/s][A
 78%|███████▊  | 14/18 [00:01<00:00,  8.54it/s][A
 89%|████████▉ | 16/18 [00:02<00:00, 10.01it/s][A
100%|██████████| 18/18 [00:02<00:00,  7.73it/s][A
Epochs:  38%|███▊      | 18/48 [05:27<09:04, 18.15s/it]

Val Loss: 0.3540 - Val Accuracy: 0.9518



Training:   0%|          | 0/143 [00:00<?, ?it/s][A
Training:   1%|          | 1/143 [00:00<01:42,  1.38it/s][A
Training:   3%|▎         | 5/143 [00:01<00:26,  5.16it/s][A
Training:   6%|▋         | 9/143 [00:01<00:19,  6.92it/s][A
Training:   9%|▉         | 13/143 [00:01<00:16,  7.86it/s][A
Training:  12%|█▏        | 17/143 [00:02<00:15,  8.18it/s][A
Training:  15%|█▍        | 21/143 [00:02<00:14,  8.66it/s][A
Training:  17%|█▋        | 25/143 [00:03<00:13,  8.74it/s][A
Training:  19%|█▉        | 27/143 [00:03<00:12,  9.64it/s][A
Training:  20%|██        | 29/143 [00:03<00:12,  8.89it/s][A
Training:  22%|██▏       | 32/143 [00:03<00:09, 11.42it/s][A
Training:  24%|██▍       | 34/143 [00:04<00:11,  9.90it/s][A
Training:  26%|██▌       | 37/143 [00:04<00:11,  9.02it/s][A
Training:  27%|██▋       | 39/143 [00:04<00:10, 10.32it/s][A
Training:  29%|██▊       | 41/143 [00:04<00:11,  8.61it/s][A
Training:  31%|███       | 44/143 [00:05<00:08, 11.33it/s][A
Training:  32%|███▏

Epoch: 19/48 - Loss: 0.2115 - Accuracy: 0.9557



  0%|          | 0/18 [00:00<?, ?it/s][A
  6%|▌         | 1/18 [00:00<00:10,  1.56it/s][A
 22%|██▏       | 4/18 [00:00<00:02,  6.63it/s][A
 33%|███▎      | 6/18 [00:01<00:01,  6.36it/s][A
 44%|████▍     | 8/18 [00:01<00:01,  8.32it/s][A
 56%|█████▌    | 10/18 [00:01<00:01,  7.52it/s][A
 67%|██████▋   | 12/18 [00:01<00:00,  9.31it/s][A
 78%|███████▊  | 14/18 [00:01<00:00,  7.97it/s][A
100%|██████████| 18/18 [00:02<00:00,  7.53it/s][A
Epochs:  40%|███▉      | 19/48 [05:45<08:46, 18.16s/it]

Val Loss: 0.2745 - Val Accuracy: 0.9508



Training:   0%|          | 0/143 [00:00<?, ?it/s][A
Training:   1%|          | 1/143 [00:00<01:34,  1.50it/s][A
Training:   3%|▎         | 4/143 [00:00<00:21,  6.48it/s][A
Training:   4%|▍         | 6/143 [00:01<00:21,  6.47it/s][A
Training:   6%|▋         | 9/143 [00:01<00:17,  7.55it/s][A
Training:   9%|▉         | 13/143 [00:01<00:15,  8.67it/s][A
Training:  11%|█         | 16/143 [00:01<00:11, 11.22it/s][A
Training:  13%|█▎        | 18/143 [00:02<00:14,  8.55it/s][A
Training:  15%|█▍        | 21/143 [00:02<00:14,  8.67it/s][A
Training:  16%|█▌        | 23/143 [00:02<00:12,  9.92it/s][A
Training:  17%|█▋        | 25/143 [00:03<00:13,  8.62it/s][A
Training:  19%|█▉        | 27/143 [00:03<00:13,  8.91it/s][A
Training:  20%|██        | 29/143 [00:03<00:12,  9.00it/s][A
Training:  22%|██▏       | 31/143 [00:03<00:11,  9.90it/s][A
Training:  23%|██▎       | 33/143 [00:03<00:11,  9.95it/s][A
Training:  24%|██▍       | 35/143 [00:04<00:09, 10.84it/s][A
Training:  26%|██▌  

Epoch: 20/48 - Loss: 0.2376 - Accuracy: 0.9551



  0%|          | 0/18 [00:00<?, ?it/s][A
  6%|▌         | 1/18 [00:00<00:11,  1.42it/s][A
 28%|██▊       | 5/18 [00:01<00:02,  5.02it/s][A
 50%|█████     | 9/18 [00:01<00:01,  6.56it/s][A
 72%|███████▏  | 13/18 [00:02<00:00,  7.74it/s][A
100%|██████████| 18/18 [00:02<00:00,  7.31it/s][A
Epochs:  42%|████▏     | 20/48 [06:03<08:27, 18.12s/it]

Val Loss: 0.3536 - Val Accuracy: 0.9549



Training:   0%|          | 0/143 [00:00<?, ?it/s][A
Training:   1%|          | 1/143 [00:00<01:29,  1.58it/s][A
Training:   2%|▏         | 3/143 [00:00<00:29,  4.74it/s][A
Training:   3%|▎         | 5/143 [00:01<00:24,  5.59it/s][A
Training:   6%|▌         | 8/143 [00:01<00:14,  9.55it/s][A
Training:   7%|▋         | 10/143 [00:01<00:15,  8.35it/s][A
Training:   9%|▉         | 13/143 [00:01<00:16,  8.01it/s][A
Training:  10%|█         | 15/143 [00:02<00:14,  8.99it/s][A
Training:  12%|█▏        | 17/143 [00:02<00:14,  8.77it/s][A
Training:  13%|█▎        | 19/143 [00:02<00:13,  9.27it/s][A
Training:  15%|█▍        | 21/143 [00:02<00:13,  8.93it/s][A
Training:  16%|█▌        | 23/143 [00:02<00:12,  9.55it/s][A
Training:  17%|█▋        | 25/143 [00:03<00:13,  8.66it/s][A
Training:  19%|█▉        | 27/143 [00:03<00:12,  9.36it/s][A
Training:  20%|██        | 29/143 [00:03<00:12,  9.16it/s][A
Training:  22%|██▏       | 31/143 [00:03<00:11,  9.72it/s][A
Training:  23%|██▎  

Epoch: 21/48 - Loss: 0.2183 - Accuracy: 0.9579



  0%|          | 0/18 [00:00<?, ?it/s][A
  6%|▌         | 1/18 [00:00<00:11,  1.44it/s][A
 28%|██▊       | 5/18 [00:01<00:02,  5.23it/s][A
 44%|████▍     | 8/18 [00:01<00:01,  8.48it/s][A
 56%|█████▌    | 10/18 [00:01<00:01,  7.12it/s][A
 72%|███████▏  | 13/18 [00:02<00:00,  7.19it/s][A
 78%|███████▊  | 14/18 [00:02<00:00,  7.38it/s][A
100%|██████████| 18/18 [00:02<00:00,  7.21it/s][A
Epochs:  44%|████▍     | 21/48 [06:22<08:11, 18.19s/it]

Val Loss: 0.3446 - Val Accuracy: 0.9467



Training:   0%|          | 0/143 [00:00<?, ?it/s][A
Training:   1%|          | 1/143 [00:00<01:34,  1.51it/s][A
Training:   3%|▎         | 5/143 [00:00<00:22,  6.08it/s][A
Training:   6%|▋         | 9/143 [00:01<00:16,  8.00it/s][A
Training:   7%|▋         | 10/143 [00:01<00:16,  8.21it/s][A
Training:   9%|▉         | 13/143 [00:01<00:14,  8.69it/s][A
Training:  10%|▉         | 14/143 [00:01<00:15,  8.26it/s][A
Training:  12%|█▏        | 17/143 [00:02<00:13,  9.50it/s][A
Training:  13%|█▎        | 18/143 [00:02<00:15,  7.96it/s][A
Training:  15%|█▍        | 21/143 [00:02<00:12,  9.64it/s][A
Training:  15%|█▌        | 22/143 [00:02<00:14,  8.29it/s][A
Training:  17%|█▋        | 25/143 [00:03<00:12,  9.71it/s][A
Training:  18%|█▊        | 26/143 [00:03<00:14,  8.03it/s][A
Training:  20%|██        | 29/143 [00:03<00:10, 10.58it/s][A
Training:  22%|██▏       | 31/143 [00:03<00:11,  9.84it/s][A
Training:  23%|██▎       | 33/143 [00:03<00:11,  9.97it/s][A
Training:  24%|██▍ 

Epoch: 22/48 - Loss: 0.2217 - Accuracy: 0.9573



  0%|          | 0/18 [00:00<?, ?it/s][A
  6%|▌         | 1/18 [00:00<00:09,  1.72it/s][A
 11%|█         | 2/18 [00:00<00:04,  3.23it/s][A
 28%|██▊       | 5/18 [00:01<00:02,  6.00it/s][A
 33%|███▎      | 6/18 [00:01<00:01,  6.58it/s][A
 50%|█████     | 9/18 [00:01<00:01,  7.54it/s][A
 67%|██████▋   | 12/18 [00:01<00:00, 10.89it/s][A
 78%|███████▊  | 14/18 [00:02<00:00,  7.62it/s][A
100%|██████████| 18/18 [00:02<00:00,  7.27it/s][A
Epochs:  46%|████▌     | 22/48 [06:40<07:53, 18.20s/it]

Val Loss: 0.1739 - Val Accuracy: 0.9592



Training:   0%|          | 0/143 [00:00<?, ?it/s][A
Training:   1%|          | 1/143 [00:00<01:30,  1.57it/s][A
Training:   3%|▎         | 4/143 [00:00<00:20,  6.76it/s][A
Training:   4%|▍         | 6/143 [00:01<00:21,  6.23it/s][A
Training:   6%|▋         | 9/143 [00:01<00:18,  7.13it/s][A
Training:   8%|▊         | 12/143 [00:01<00:12, 10.33it/s][A
Training:  10%|▉         | 14/143 [00:01<00:15,  8.31it/s][A
Training:  12%|█▏        | 17/143 [00:02<00:15,  8.18it/s][A
Training:  14%|█▍        | 20/143 [00:02<00:11, 10.90it/s][A
Training:  15%|█▌        | 22/143 [00:02<00:13,  9.04it/s][A
Training:  17%|█▋        | 25/143 [00:03<00:14,  8.41it/s][A
Training:  20%|██        | 29/143 [00:03<00:12,  9.05it/s][A
Training:  22%|██▏       | 32/143 [00:03<00:09, 11.25it/s][A
Training:  24%|██▍       | 34/143 [00:03<00:11,  9.66it/s][A
Training:  26%|██▌       | 37/143 [00:04<00:11,  9.34it/s][A
Training:  27%|██▋       | 39/143 [00:04<00:10, 10.24it/s][A
Training:  29%|██▊  

Epoch: 23/48 - Loss: 0.1930 - Accuracy: 0.9598



  0%|          | 0/18 [00:00<?, ?it/s][A
  6%|▌         | 1/18 [00:00<00:10,  1.62it/s][A
 28%|██▊       | 5/18 [00:01<00:02,  5.43it/s][A
 50%|█████     | 9/18 [00:01<00:01,  7.19it/s][A
 67%|██████▋   | 12/18 [00:01<00:00,  9.62it/s][A
 78%|███████▊  | 14/18 [00:01<00:00,  8.37it/s][A
 89%|████████▉ | 16/18 [00:02<00:00,  9.58it/s][A
100%|██████████| 18/18 [00:02<00:00,  7.61it/s][A
Epochs:  48%|████▊     | 23/48 [06:58<07:32, 18.08s/it]

Val Loss: 0.2714 - Val Accuracy: 0.9541



Training:   0%|          | 0/143 [00:00<?, ?it/s][A
Training:   1%|          | 1/143 [00:00<01:32,  1.54it/s][A
Training:   3%|▎         | 5/143 [00:01<00:25,  5.41it/s][A
Training:   6%|▋         | 9/143 [00:01<00:18,  7.12it/s][A
Training:   9%|▉         | 13/143 [00:01<00:16,  7.85it/s][A
Training:  12%|█▏        | 17/143 [00:02<00:14,  8.41it/s][A
Training:  15%|█▍        | 21/143 [00:02<00:14,  8.59it/s][A
Training:  17%|█▋        | 24/143 [00:02<00:11, 10.51it/s][A
Training:  18%|█▊        | 26/143 [00:03<00:13,  8.87it/s][A
Training:  20%|██        | 29/143 [00:03<00:13,  8.59it/s][A
Training:  23%|██▎       | 33/143 [00:04<00:12,  9.09it/s][A
Training:  26%|██▌       | 37/143 [00:04<00:11,  9.37it/s][A
Training:  29%|██▊       | 41/143 [00:04<00:11,  9.11it/s][A
Training:  31%|███▏      | 45/143 [00:05<00:10,  9.20it/s][A
Training:  34%|███▍      | 49/143 [00:05<00:10,  8.95it/s][A
Training:  37%|███▋      | 53/143 [00:06<00:09,  9.09it/s][A
Training:  40%|███▉

Epoch: 24/48 - Loss: 0.2255 - Accuracy: 0.9598



  0%|          | 0/18 [00:00<?, ?it/s][A
  6%|▌         | 1/18 [00:00<00:11,  1.46it/s][A
 28%|██▊       | 5/18 [00:01<00:02,  5.01it/s][A
 50%|█████     | 9/18 [00:01<00:01,  6.73it/s][A
 72%|███████▏  | 13/18 [00:02<00:00,  7.67it/s][A
100%|██████████| 18/18 [00:02<00:00,  7.32it/s][A
Epochs:  50%|█████     | 24/48 [07:16<07:15, 18.13s/it]

Val Loss: 0.4080 - Val Accuracy: 0.9377



Training:   0%|          | 0/143 [00:00<?, ?it/s][A
Training:   1%|          | 1/143 [00:00<01:31,  1.55it/s][A
Training:   3%|▎         | 5/143 [00:00<00:23,  5.95it/s][A
Training:   6%|▋         | 9/143 [00:01<00:16,  8.34it/s][A
Training:   8%|▊         | 12/143 [00:01<00:11, 11.19it/s][A
Training:  10%|▉         | 14/143 [00:01<00:14,  8.94it/s][A
Training:  12%|█▏        | 17/143 [00:02<00:15,  8.03it/s][A
Training:  15%|█▍        | 21/143 [00:02<00:14,  8.59it/s][A
Training:  17%|█▋        | 24/143 [00:02<00:11, 10.65it/s][A
Training:  18%|█▊        | 26/143 [00:03<00:13,  8.94it/s][A
Training:  20%|██        | 29/143 [00:03<00:13,  8.64it/s][A
Training:  22%|██▏       | 32/143 [00:03<00:10, 10.90it/s][A
Training:  24%|██▍       | 34/143 [00:03<00:11,  9.83it/s][A
Training:  25%|██▌       | 36/143 [00:03<00:09, 11.17it/s][A
Training:  27%|██▋       | 38/143 [00:04<00:11,  9.34it/s][A
Training:  28%|██▊       | 40/143 [00:04<00:09, 10.39it/s][A
Training:  29%|██▉ 

Epoch: 25/48 - Loss: 0.2436 - Accuracy: 0.9572



  0%|          | 0/18 [00:00<?, ?it/s][A
  6%|▌         | 1/18 [00:00<00:11,  1.43it/s][A
 28%|██▊       | 5/18 [00:01<00:02,  5.04it/s][A
 50%|█████     | 9/18 [00:01<00:01,  6.75it/s][A
 72%|███████▏  | 13/18 [00:01<00:00,  7.69it/s][A
100%|██████████| 18/18 [00:02<00:00,  7.32it/s][A
Epochs:  52%|█████▏    | 25/48 [07:34<06:56, 18.11s/it]

Val Loss: 0.2492 - Val Accuracy: 0.9574



Training:   0%|          | 0/143 [00:00<?, ?it/s][A
Training:   1%|          | 1/143 [00:00<01:32,  1.54it/s][A
Training:   3%|▎         | 5/143 [00:01<00:25,  5.33it/s][A
Training:   6%|▋         | 9/143 [00:01<00:17,  7.63it/s][A
Training:   9%|▉         | 13/143 [00:01<00:16,  8.08it/s][A
Training:  12%|█▏        | 17/143 [00:02<00:14,  8.47it/s][A
Training:  15%|█▍        | 21/143 [00:02<00:14,  8.71it/s][A
Training:  17%|█▋        | 24/143 [00:02<00:11, 10.82it/s][A
Training:  18%|█▊        | 26/143 [00:03<00:13,  8.92it/s][A
Training:  20%|██        | 29/143 [00:03<00:12,  9.27it/s][A
Training:  22%|██▏       | 31/143 [00:03<00:11,  9.88it/s][A
Training:  23%|██▎       | 33/143 [00:03<00:11,  9.76it/s][A
Training:  24%|██▍       | 35/143 [00:04<00:10,  9.85it/s][A
Training:  26%|██▌       | 37/143 [00:04<00:10,  9.91it/s][A
Training:  27%|██▋       | 39/143 [00:04<00:11,  9.42it/s][A
Training:  29%|██▊       | 41/143 [00:04<00:10,  9.49it/s][A
Training:  29%|██▉ 

Epoch: 26/48 - Loss: 0.2467 - Accuracy: 0.9562



  0%|          | 0/18 [00:00<?, ?it/s][A
  6%|▌         | 1/18 [00:00<00:11,  1.52it/s][A
 28%|██▊       | 5/18 [00:01<00:02,  5.37it/s][A
 44%|████▍     | 8/18 [00:01<00:01,  8.04it/s][A
 56%|█████▌    | 10/18 [00:01<00:01,  7.99it/s][A
 67%|██████▋   | 12/18 [00:01<00:00,  9.12it/s][A
 78%|███████▊  | 14/18 [00:01<00:00,  8.52it/s][A
 89%|████████▉ | 16/18 [00:02<00:00,  9.16it/s][A
100%|██████████| 18/18 [00:02<00:00,  7.62it/s][A
Epochs:  54%|█████▍    | 26/48 [07:52<06:38, 18.11s/it]

Val Loss: 0.2436 - Val Accuracy: 0.9616



Training:   0%|          | 0/143 [00:00<?, ?it/s][A
Training:   1%|          | 1/143 [00:00<01:28,  1.60it/s][A
Training:   3%|▎         | 5/143 [00:00<00:23,  5.91it/s][A
Training:   6%|▋         | 9/143 [00:01<00:16,  7.96it/s][A
Training:   8%|▊         | 12/143 [00:01<00:12, 10.91it/s][A
Training:  10%|▉         | 14/143 [00:01<00:13,  9.25it/s][A
Training:  11%|█         | 16/143 [00:01<00:12,  9.89it/s][A
Training:  13%|█▎        | 18/143 [00:02<00:14,  8.82it/s][A
Training:  14%|█▍        | 20/143 [00:02<00:12,  9.70it/s][A
Training:  15%|█▌        | 22/143 [00:02<00:13,  8.85it/s][A
Training:  17%|█▋        | 24/143 [00:02<00:12,  9.37it/s][A
Training:  18%|█▊        | 26/143 [00:03<00:13,  8.96it/s][A
Training:  19%|█▉        | 27/143 [00:03<00:13,  8.52it/s][A
Training:  20%|██        | 29/143 [00:03<00:13,  8.73it/s][A
Training:  22%|██▏       | 31/143 [00:03<00:12,  8.92it/s][A
Training:  23%|██▎       | 33/143 [00:03<00:11,  9.82it/s][A
Training:  24%|██▍ 

Epoch: 27/48 - Loss: 0.2283 - Accuracy: 0.9599



  0%|          | 0/18 [00:00<?, ?it/s][A
  6%|▌         | 1/18 [00:00<00:11,  1.44it/s][A
 28%|██▊       | 5/18 [00:01<00:02,  5.49it/s][A
 50%|█████     | 9/18 [00:01<00:01,  7.30it/s][A
 72%|███████▏  | 13/18 [00:01<00:00,  7.71it/s][A
100%|██████████| 18/18 [00:02<00:00,  7.56it/s][A
Epochs:  56%|█████▋    | 27/48 [08:10<06:19, 18.09s/it]

Val Loss: 0.3251 - Val Accuracy: 0.9508



Training:   0%|          | 0/143 [00:00<?, ?it/s][A
Training:   1%|          | 1/143 [00:00<01:36,  1.48it/s][A
Training:   3%|▎         | 5/143 [00:01<00:25,  5.44it/s][A
Training:   6%|▋         | 9/143 [00:01<00:18,  7.22it/s][A
Training:   9%|▉         | 13/143 [00:01<00:16,  7.96it/s][A
Training:  12%|█▏        | 17/143 [00:02<00:15,  8.09it/s][A
Training:  15%|█▍        | 21/143 [00:02<00:14,  8.37it/s][A
Training:  17%|█▋        | 25/143 [00:03<00:13,  8.58it/s][A
Training:  20%|██        | 29/143 [00:03<00:13,  8.58it/s][A
Training:  23%|██▎       | 33/143 [00:04<00:12,  9.05it/s][A
Training:  26%|██▌       | 37/143 [00:04<00:11,  9.51it/s][A
Training:  29%|██▊       | 41/143 [00:04<00:11,  9.18it/s][A
Training:  31%|███▏      | 45/143 [00:05<00:10,  9.24it/s][A
Training:  34%|███▍      | 49/143 [00:05<00:10,  9.23it/s][A
Training:  37%|███▋      | 53/143 [00:06<00:09,  9.13it/s][A
Training:  40%|███▉      | 57/143 [00:06<00:09,  9.35it/s][A
Training:  43%|████

Epoch: 28/48 - Loss: 0.2048 - Accuracy: 0.9620



  0%|          | 0/18 [00:00<?, ?it/s][A
  6%|▌         | 1/18 [00:00<00:10,  1.67it/s][A
 28%|██▊       | 5/18 [00:01<00:02,  5.59it/s][A
 50%|█████     | 9/18 [00:01<00:01,  7.22it/s][A
 67%|██████▋   | 12/18 [00:01<00:00,  9.83it/s][A
 78%|███████▊  | 14/18 [00:01<00:00,  7.94it/s][A
100%|██████████| 18/18 [00:02<00:00,  7.66it/s][A
Epochs:  58%|█████▊    | 28/48 [08:28<06:02, 18.11s/it]

Val Loss: 0.2704 - Val Accuracy: 0.9513



Training:   0%|          | 0/143 [00:00<?, ?it/s][A
Training:   1%|          | 1/143 [00:00<01:34,  1.50it/s][A
Training:   3%|▎         | 5/143 [00:01<00:25,  5.35it/s][A
Training:   6%|▋         | 9/143 [00:01<00:18,  7.14it/s][A
Training:   9%|▉         | 13/143 [00:01<00:16,  7.88it/s][A
Training:  12%|█▏        | 17/143 [00:02<00:14,  8.73it/s][A
Training:  13%|█▎        | 19/143 [00:02<00:12,  9.74it/s][A
Training:  15%|█▍        | 21/143 [00:02<00:13,  8.99it/s][A
Training:  16%|█▌        | 23/143 [00:02<00:12,  9.76it/s][A
Training:  17%|█▋        | 25/143 [00:03<00:13,  8.69it/s][A
Training:  19%|█▉        | 27/143 [00:03<00:11,  9.70it/s][A
Training:  20%|██        | 29/143 [00:03<00:13,  8.68it/s][A
Training:  22%|██▏       | 31/143 [00:03<00:11,  9.91it/s][A
Training:  23%|██▎       | 33/143 [00:03<00:11,  9.37it/s][A
Training:  24%|██▍       | 35/143 [00:04<00:10, 10.45it/s][A
Training:  26%|██▌       | 37/143 [00:04<00:11,  8.85it/s][A
Training:  27%|██▋ 

Epoch: 29/48 - Loss: 0.2456 - Accuracy: 0.9590



  0%|          | 0/18 [00:00<?, ?it/s][A
  6%|▌         | 1/18 [00:00<00:11,  1.54it/s][A
 22%|██▏       | 4/18 [00:00<00:02,  6.17it/s][A
 33%|███▎      | 6/18 [00:01<00:01,  6.24it/s][A
 50%|█████     | 9/18 [00:01<00:01,  6.87it/s][A
 67%|██████▋   | 12/18 [00:01<00:00,  9.62it/s][A
 78%|███████▊  | 14/18 [00:01<00:00,  8.04it/s][A
100%|██████████| 18/18 [00:02<00:00,  7.43it/s][A
Epochs:  60%|██████    | 29/48 [08:46<05:44, 18.13s/it]

Val Loss: 0.2965 - Val Accuracy: 0.9501



Training:   0%|          | 0/143 [00:00<?, ?it/s][A
Training:   1%|          | 1/143 [00:00<01:32,  1.53it/s][A
Training:   2%|▏         | 3/143 [00:00<00:29,  4.72it/s][A
Training:   3%|▎         | 5/143 [00:01<00:23,  5.94it/s][A
Training:   5%|▍         | 7/143 [00:01<00:17,  7.82it/s][A
Training:   6%|▋         | 9/143 [00:01<00:16,  8.02it/s][A
Training:   8%|▊         | 11/143 [00:01<00:14,  8.95it/s][A
Training:   9%|▉         | 13/143 [00:01<00:15,  8.44it/s][A
Training:  10%|█         | 15/143 [00:02<00:13,  9.45it/s][A
Training:  12%|█▏        | 17/143 [00:02<00:14,  8.83it/s][A
Training:  13%|█▎        | 19/143 [00:02<00:12,  9.58it/s][A
Training:  15%|█▍        | 21/143 [00:02<00:13,  8.96it/s][A
Training:  15%|█▌        | 22/143 [00:02<00:13,  8.93it/s][A
Training:  17%|█▋        | 25/143 [00:03<00:13,  8.70it/s][A
Training:  19%|█▉        | 27/143 [00:03<00:11, 10.19it/s][A
Training:  20%|██        | 29/143 [00:03<00:13,  8.44it/s][A
Training:  23%|██▎   

Epoch: 30/48 - Loss: 0.2258 - Accuracy: 0.9591



  0%|          | 0/18 [00:00<?, ?it/s][A
  6%|▌         | 1/18 [00:00<00:11,  1.55it/s][A
 28%|██▊       | 5/18 [00:01<00:02,  5.21it/s][A
 50%|█████     | 9/18 [00:01<00:01,  6.88it/s][A
 72%|███████▏  | 13/18 [00:01<00:00,  7.74it/s][A
100%|██████████| 18/18 [00:02<00:00,  7.32it/s][A
Epochs:  62%|██████▎   | 30/48 [09:05<05:27, 18.18s/it]

Val Loss: 0.4139 - Val Accuracy: 0.9547



Training:   0%|          | 0/143 [00:00<?, ?it/s][A
Training:   1%|          | 1/143 [00:00<01:25,  1.67it/s][A
Training:   3%|▎         | 5/143 [00:00<00:21,  6.31it/s][A
Training:   6%|▌         | 8/143 [00:01<00:13,  9.89it/s][A
Training:   7%|▋         | 10/143 [00:01<00:17,  7.57it/s][A
Training:   9%|▉         | 13/143 [00:01<00:17,  7.31it/s][A
Training:  12%|█▏        | 17/143 [00:02<00:15,  8.11it/s][A
Training:  14%|█▍        | 20/143 [00:02<00:11, 10.29it/s][A
Training:  15%|█▌        | 22/143 [00:02<00:13,  9.09it/s][A
Training:  17%|█▋        | 25/143 [00:03<00:13,  8.68it/s][A
Training:  20%|██        | 29/143 [00:03<00:12,  9.26it/s][A
Training:  22%|██▏       | 32/143 [00:03<00:09, 11.28it/s][A
Training:  24%|██▍       | 34/143 [00:03<00:11,  9.74it/s][A
Training:  25%|██▌       | 36/143 [00:04<00:10, 10.54it/s][A
Training:  27%|██▋       | 38/143 [00:04<00:11,  8.75it/s][A
Training:  29%|██▊       | 41/143 [00:04<00:12,  8.19it/s][A
Training:  31%|███▏

Epoch: 31/48 - Loss: 0.1980 - Accuracy: 0.9621



  0%|          | 0/18 [00:00<?, ?it/s][A
  6%|▌         | 1/18 [00:00<00:10,  1.60it/s][A
 28%|██▊       | 5/18 [00:00<00:02,  5.90it/s][A
 33%|███▎      | 6/18 [00:01<00:01,  6.42it/s][A
 50%|█████     | 9/18 [00:01<00:01,  7.55it/s][A
 56%|█████▌    | 10/18 [00:01<00:01,  7.90it/s][A
 72%|███████▏  | 13/18 [00:01<00:00,  8.34it/s][A
 78%|███████▊  | 14/18 [00:01<00:00,  8.49it/s][A
100%|██████████| 18/18 [00:02<00:00,  7.68it/s][A
Epochs:  65%|██████▍   | 31/48 [09:23<05:08, 18.14s/it]

Val Loss: 0.4865 - Val Accuracy: 0.9500



Training:   0%|          | 0/143 [00:00<?, ?it/s][A
Training:   1%|          | 1/143 [00:00<01:21,  1.73it/s][A
Training:   3%|▎         | 5/143 [00:01<00:25,  5.46it/s][A
Training:   6%|▋         | 9/143 [00:01<00:18,  7.06it/s][A
Training:   9%|▉         | 13/143 [00:01<00:16,  7.76it/s][A
Training:  12%|█▏        | 17/143 [00:02<00:14,  8.46it/s][A
Training:  15%|█▍        | 21/143 [00:02<00:14,  8.66it/s][A
Training:  17%|█▋        | 25/143 [00:03<00:12,  9.09it/s][A
Training:  20%|██        | 29/143 [00:03<00:12,  9.43it/s][A
Training:  23%|██▎       | 33/143 [00:03<00:11,  9.47it/s][A
Training:  26%|██▌       | 37/143 [00:04<00:11,  9.01it/s][A
Training:  28%|██▊       | 40/143 [00:04<00:09, 10.80it/s][A
Training:  29%|██▉       | 42/143 [00:04<00:10,  9.75it/s][A
Training:  31%|███▏      | 45/143 [00:05<00:10,  9.12it/s][A
Training:  34%|███▍      | 49/143 [00:05<00:10,  9.11it/s][A
Training:  37%|███▋      | 53/143 [00:06<00:09,  9.40it/s][A
Training:  40%|███▉

Epoch: 32/48 - Loss: 0.2200 - Accuracy: 0.9616



  0%|          | 0/18 [00:00<?, ?it/s][A
  6%|▌         | 1/18 [00:00<00:12,  1.32it/s][A
 28%|██▊       | 5/18 [00:01<00:02,  5.08it/s][A
 50%|█████     | 9/18 [00:01<00:01,  6.43it/s][A
 72%|███████▏  | 13/18 [00:02<00:00,  7.50it/s][A
100%|██████████| 18/18 [00:02<00:00,  7.19it/s][A
Epochs:  67%|██████▋   | 32/48 [09:41<04:50, 18.17s/it]

Val Loss: 0.3675 - Val Accuracy: 0.9588



Training:   0%|          | 0/143 [00:00<?, ?it/s][A
Training:   1%|          | 1/143 [00:00<01:29,  1.58it/s][A
Training:   3%|▎         | 5/143 [00:01<00:24,  5.68it/s][A
Training:   6%|▌         | 8/143 [00:01<00:14,  9.10it/s][A
Training:   7%|▋         | 10/143 [00:01<00:17,  7.55it/s][A
Training:   9%|▉         | 13/143 [00:01<00:17,  7.48it/s][A
Training:  12%|█▏        | 17/143 [00:02<00:15,  8.15it/s][A
Training:  15%|█▍        | 21/143 [00:02<00:13,  8.97it/s][A
Training:  17%|█▋        | 25/143 [00:03<00:12,  9.41it/s][A
Training:  20%|██        | 29/143 [00:03<00:12,  9.27it/s][A
Training:  23%|██▎       | 33/143 [00:03<00:11,  9.27it/s][A
Training:  25%|██▌       | 36/143 [00:04<00:09, 11.01it/s][A
Training:  27%|██▋       | 38/143 [00:04<00:11,  9.36it/s][A
Training:  29%|██▊       | 41/143 [00:04<00:11,  8.73it/s][A
Training:  31%|███▏      | 45/143 [00:05<00:10,  9.22it/s][A
Training:  33%|███▎      | 47/143 [00:05<00:09, 10.06it/s][A
Training:  34%|███▍

Epoch: 33/48 - Loss: 0.2436 - Accuracy: 0.9597



  0%|          | 0/18 [00:00<?, ?it/s][A
  6%|▌         | 1/18 [00:00<00:10,  1.62it/s][A
 28%|██▊       | 5/18 [00:01<00:02,  5.22it/s][A
 50%|█████     | 9/18 [00:01<00:01,  6.71it/s][A
 72%|███████▏  | 13/18 [00:01<00:00,  7.53it/s][A
100%|██████████| 18/18 [00:02<00:00,  7.44it/s][A
Epochs:  69%|██████▉   | 33/48 [09:59<04:33, 18.20s/it]

Val Loss: 0.3357 - Val Accuracy: 0.9598



Training:   0%|          | 0/143 [00:00<?, ?it/s][A
Training:   1%|          | 1/143 [00:00<01:25,  1.67it/s][A
Training:   2%|▏         | 3/143 [00:00<00:28,  4.91it/s][A
Training:   3%|▎         | 5/143 [00:01<00:24,  5.68it/s][A
Training:   4%|▍         | 6/143 [00:01<00:21,  6.24it/s][A
Training:   6%|▋         | 9/143 [00:01<00:18,  7.33it/s][A
Training:   9%|▉         | 13/143 [00:01<00:15,  8.15it/s][A
Training:  11%|█         | 16/143 [00:02<00:11, 10.77it/s][A
Training:  13%|█▎        | 18/143 [00:02<00:15,  8.20it/s][A
Training:  15%|█▍        | 21/143 [00:02<00:15,  7.93it/s][A
Training:  17%|█▋        | 25/143 [00:03<00:13,  8.60it/s][A
Training:  20%|██        | 29/143 [00:03<00:13,  8.76it/s][A
Training:  23%|██▎       | 33/143 [00:04<00:12,  8.98it/s][A
Training:  26%|██▌       | 37/143 [00:04<00:11,  9.01it/s][A
Training:  29%|██▊       | 41/143 [00:05<00:11,  8.74it/s][A
Training:  31%|███▏      | 45/143 [00:05<00:10,  8.94it/s][A
Training:  34%|███▍  

Epoch: 34/48 - Loss: 0.2153 - Accuracy: 0.9603



  0%|          | 0/18 [00:00<?, ?it/s][A
  6%|▌         | 1/18 [00:00<00:11,  1.49it/s][A
 28%|██▊       | 5/18 [00:01<00:02,  5.17it/s][A
 50%|█████     | 9/18 [00:01<00:01,  6.72it/s][A
 72%|███████▏  | 13/18 [00:02<00:00,  7.43it/s][A
100%|██████████| 18/18 [00:02<00:00,  7.30it/s][A
Epochs:  71%|███████   | 34/48 [10:18<04:15, 18.23s/it]

Val Loss: 0.3595 - Val Accuracy: 0.9449



Training:   0%|          | 0/143 [00:00<?, ?it/s][A
Training:   1%|          | 1/143 [00:00<01:25,  1.67it/s][A
Training:   3%|▎         | 5/143 [00:01<00:24,  5.54it/s][A
Training:   6%|▋         | 9/143 [00:01<00:19,  6.94it/s][A
Training:   9%|▉         | 13/143 [00:01<00:17,  7.59it/s][A
Training:  12%|█▏        | 17/143 [00:02<00:15,  8.03it/s][A
Training:  15%|█▍        | 21/143 [00:02<00:14,  8.55it/s][A
Training:  17%|█▋        | 25/143 [00:03<00:12,  9.21it/s][A
Training:  20%|██        | 29/143 [00:03<00:12,  9.39it/s][A
Training:  23%|██▎       | 33/143 [00:04<00:11,  9.49it/s][A
Training:  26%|██▌       | 37/143 [00:04<00:11,  9.39it/s][A
Training:  29%|██▊       | 41/143 [00:04<00:10,  9.36it/s][A
Training:  31%|███▏      | 45/143 [00:05<00:10,  9.13it/s][A
Training:  34%|███▍      | 49/143 [00:05<00:10,  9.25it/s][A
Training:  37%|███▋      | 53/143 [00:06<00:09,  9.27it/s][A
Training:  40%|███▉      | 57/143 [00:06<00:09,  9.35it/s][A
Training:  43%|████

Epoch: 35/48 - Loss: 0.2704 - Accuracy: 0.9583



  0%|          | 0/18 [00:00<?, ?it/s][A
  6%|▌         | 1/18 [00:00<00:10,  1.60it/s][A
 28%|██▊       | 5/18 [00:01<00:02,  5.25it/s][A
 50%|█████     | 9/18 [00:01<00:01,  7.04it/s][A
 72%|███████▏  | 13/18 [00:01<00:00,  7.68it/s][A
100%|██████████| 18/18 [00:02<00:00,  7.47it/s][A
Epochs:  73%|███████▎  | 35/48 [10:36<03:57, 18.24s/it]

Val Loss: 0.4076 - Val Accuracy: 0.9453



Training:   0%|          | 0/143 [00:00<?, ?it/s][A
Training:   1%|          | 1/143 [00:00<01:23,  1.71it/s][A
Training:   3%|▎         | 4/143 [00:00<00:20,  6.78it/s][A
Training:   4%|▍         | 6/143 [00:01<00:20,  6.56it/s][A
Training:   6%|▋         | 9/143 [00:01<00:17,  7.54it/s][A
Training:   8%|▊         | 11/143 [00:01<00:14,  9.31it/s][A
Training:   9%|▉         | 13/143 [00:01<00:17,  7.60it/s][A
Training:  12%|█▏        | 17/143 [00:02<00:15,  8.29it/s][A
Training:  15%|█▍        | 21/143 [00:02<00:13,  8.89it/s][A
Training:  17%|█▋        | 25/143 [00:03<00:12,  9.70it/s][A
Training:  19%|█▉        | 27/143 [00:03<00:10, 10.75it/s][A
Training:  20%|██        | 29/143 [00:03<00:11,  9.65it/s][A
Training:  22%|██▏       | 31/143 [00:03<00:10, 10.78it/s][A
Training:  23%|██▎       | 33/143 [00:03<00:12,  8.91it/s][A
Training:  24%|██▍       | 35/143 [00:04<00:11,  9.59it/s][A
Training:  26%|██▌       | 37/143 [00:04<00:12,  8.39it/s][A
Training:  27%|██▋  

Epoch: 36/48 - Loss: 0.2749 - Accuracy: 0.9604



  0%|          | 0/18 [00:00<?, ?it/s][A
  6%|▌         | 1/18 [00:00<00:11,  1.48it/s][A
 22%|██▏       | 4/18 [00:00<00:02,  6.34it/s][A
 33%|███▎      | 6/18 [00:01<00:02,  5.86it/s][A
 50%|█████     | 9/18 [00:01<00:01,  6.56it/s][A
 67%|██████▋   | 12/18 [00:01<00:00,  9.25it/s][A
 78%|███████▊  | 14/18 [00:01<00:00,  8.74it/s][A
 89%|████████▉ | 16/18 [00:02<00:00, 10.11it/s][A
100%|██████████| 18/18 [00:02<00:00,  7.61it/s][A
Epochs:  75%|███████▌  | 36/48 [10:54<03:39, 18.28s/it]

Val Loss: 0.3477 - Val Accuracy: 0.9491



Training:   0%|          | 0/143 [00:00<?, ?it/s][A
Training:   1%|          | 1/143 [00:00<01:27,  1.62it/s][A
Training:   3%|▎         | 5/143 [00:01<00:26,  5.21it/s][A
Training:   6%|▋         | 9/143 [00:01<00:18,  7.13it/s][A
Training:   8%|▊         | 11/143 [00:01<00:15,  8.66it/s][A
Training:   9%|▉         | 13/143 [00:01<00:16,  7.86it/s][A
Training:  10%|█         | 15/143 [00:02<00:14,  9.04it/s][A
Training:  12%|█▏        | 17/143 [00:02<00:14,  8.42it/s][A
Training:  13%|█▎        | 19/143 [00:02<00:13,  9.03it/s][A
Training:  15%|█▍        | 21/143 [00:02<00:13,  9.19it/s][A
Training:  16%|█▌        | 23/143 [00:02<00:11, 10.12it/s][A
Training:  17%|█▋        | 25/143 [00:03<00:12,  9.75it/s][A
Training:  19%|█▉        | 27/143 [00:03<00:12,  9.44it/s][A
Training:  20%|██        | 29/143 [00:03<00:11,  9.58it/s][A
Training:  21%|██        | 30/143 [00:03<00:13,  8.07it/s][A
Training:  23%|██▎       | 33/143 [00:03<00:11,  9.64it/s][A
Training:  24%|██▍ 

Epoch: 37/48 - Loss: 0.2583 - Accuracy: 0.9579



  0%|          | 0/18 [00:00<?, ?it/s][A
  6%|▌         | 1/18 [00:00<00:12,  1.41it/s][A
 28%|██▊       | 5/18 [00:01<00:02,  4.93it/s][A
 50%|█████     | 9/18 [00:01<00:01,  6.90it/s][A
 72%|███████▏  | 13/18 [00:02<00:00,  7.60it/s][A
100%|██████████| 18/18 [00:02<00:00,  7.31it/s][A
Epochs:  77%|███████▋  | 37/48 [11:13<03:21, 18.29s/it]

Val Loss: 0.2550 - Val Accuracy: 0.9583



Training:   0%|          | 0/143 [00:00<?, ?it/s][A
Training:   1%|          | 1/143 [00:00<01:27,  1.63it/s][A
Training:   3%|▎         | 4/143 [00:00<00:19,  6.97it/s][A
Training:   4%|▍         | 6/143 [00:01<00:21,  6.39it/s][A
Training:   6%|▋         | 9/143 [00:01<00:19,  6.95it/s][A
Training:   9%|▉         | 13/143 [00:01<00:16,  7.83it/s][A
Training:  12%|█▏        | 17/143 [00:02<00:14,  8.69it/s][A
Training:  15%|█▍        | 21/143 [00:02<00:13,  9.20it/s][A
Training:  17%|█▋        | 25/143 [00:03<00:12,  9.47it/s][A
Training:  20%|██        | 29/143 [00:03<00:11,  9.57it/s][A
Training:  23%|██▎       | 33/143 [00:03<00:11,  9.70it/s][A
Training:  24%|██▍       | 35/143 [00:04<00:10, 10.47it/s][A
Training:  26%|██▌       | 37/143 [00:04<00:11,  9.55it/s][A
Training:  27%|██▋       | 39/143 [00:04<00:10, 10.11it/s][A
Training:  29%|██▊       | 41/143 [00:04<00:10,  9.34it/s][A
Training:  30%|███       | 43/143 [00:04<00:09, 10.27it/s][A
Training:  31%|███▏ 

Epoch: 38/48 - Loss: 0.2175 - Accuracy: 0.9625



  0%|          | 0/18 [00:00<?, ?it/s][A
  6%|▌         | 1/18 [00:00<00:12,  1.40it/s][A
 28%|██▊       | 5/18 [00:01<00:02,  4.93it/s][A
 50%|█████     | 9/18 [00:01<00:01,  6.67it/s][A
 72%|███████▏  | 13/18 [00:02<00:00,  7.53it/s][A
100%|██████████| 18/18 [00:02<00:00,  7.35it/s][A
Epochs:  79%|███████▉  | 38/48 [11:31<03:02, 18.21s/it]

Val Loss: 0.3847 - Val Accuracy: 0.9542



Training:   0%|          | 0/143 [00:00<?, ?it/s][A
Training:   1%|          | 1/143 [00:00<01:24,  1.68it/s][A
Training:   3%|▎         | 5/143 [00:00<00:23,  5.76it/s][A
Training:   6%|▋         | 9/143 [00:01<00:17,  7.47it/s][A
Training:   8%|▊         | 11/143 [00:01<00:14,  8.98it/s][A
Training:   9%|▉         | 13/143 [00:01<00:16,  7.84it/s][A
Training:  11%|█         | 16/143 [00:01<00:11, 10.76it/s][A
Training:  13%|█▎        | 18/143 [00:02<00:14,  8.47it/s][A
Training:  15%|█▍        | 21/143 [00:02<00:14,  8.20it/s][A
Training:  17%|█▋        | 25/143 [00:03<00:12,  9.19it/s][A
Training:  20%|██        | 29/143 [00:03<00:12,  9.19it/s][A
Training:  23%|██▎       | 33/143 [00:03<00:11,  9.26it/s][A
Training:  26%|██▌       | 37/143 [00:04<00:11,  9.06it/s][A
Training:  29%|██▊       | 41/143 [00:04<00:11,  9.25it/s][A
Training:  31%|███▏      | 45/143 [00:05<00:10,  9.41it/s][A
Training:  34%|███▍      | 49/143 [00:05<00:10,  9.35it/s][A
Training:  37%|███▋

Epoch: 39/48 - Loss: 0.2212 - Accuracy: 0.9636



  0%|          | 0/18 [00:00<?, ?it/s][A
  6%|▌         | 1/18 [00:00<00:10,  1.55it/s][A
 28%|██▊       | 5/18 [00:01<00:02,  5.38it/s][A
 50%|█████     | 9/18 [00:01<00:01,  7.14it/s][A
 67%|██████▋   | 12/18 [00:01<00:00,  9.78it/s][A
 78%|███████▊  | 14/18 [00:01<00:00,  7.82it/s][A
100%|██████████| 18/18 [00:02<00:00,  7.67it/s][A
Epochs:  81%|████████▏ | 39/48 [11:49<02:43, 18.17s/it]

Val Loss: 0.3026 - Val Accuracy: 0.9371



Training:   0%|          | 0/143 [00:00<?, ?it/s][A
Training:   1%|          | 1/143 [00:00<01:24,  1.69it/s][A
Training:   3%|▎         | 5/143 [00:00<00:23,  5.91it/s][A
Training:   6%|▌         | 8/143 [00:01<00:14,  9.39it/s][A
Training:   7%|▋         | 10/143 [00:01<00:17,  7.63it/s][A
Training:   8%|▊         | 12/143 [00:01<00:13,  9.40it/s][A
Training:  10%|▉         | 14/143 [00:01<00:16,  7.60it/s][A
Training:  12%|█▏        | 17/143 [00:02<00:17,  7.27it/s][A
Training:  15%|█▍        | 21/143 [00:02<00:14,  8.18it/s][A
Training:  17%|█▋        | 25/143 [00:03<00:13,  8.91it/s][A
Training:  20%|██        | 29/143 [00:03<00:12,  9.12it/s][A
Training:  23%|██▎       | 33/143 [00:04<00:12,  9.01it/s][A
Training:  26%|██▌       | 37/143 [00:04<00:11,  9.23it/s][A
Training:  29%|██▊       | 41/143 [00:04<00:11,  9.12it/s][A
Training:  31%|███▏      | 45/143 [00:05<00:10,  9.26it/s][A
Training:  34%|███▍      | 49/143 [00:05<00:09,  9.44it/s][A
Training:  37%|███▋

Epoch: 40/48 - Loss: 0.2423 - Accuracy: 0.9613



  0%|          | 0/18 [00:00<?, ?it/s][A
  6%|▌         | 1/18 [00:00<00:11,  1.51it/s][A
 28%|██▊       | 5/18 [00:01<00:02,  5.16it/s][A
 50%|█████     | 9/18 [00:01<00:01,  6.52it/s][A
 72%|███████▏  | 13/18 [00:02<00:00,  7.34it/s][A
100%|██████████| 18/18 [00:02<00:00,  7.21it/s][A
Epochs:  83%|████████▎ | 40/48 [12:07<02:26, 18.27s/it]

Val Loss: 0.5462 - Val Accuracy: 0.9541



Training:   0%|          | 0/143 [00:00<?, ?it/s][A
Training:   1%|          | 1/143 [00:00<01:43,  1.38it/s][A
Training:   3%|▎         | 5/143 [00:01<00:27,  5.02it/s][A
Training:   6%|▌         | 8/143 [00:01<00:16,  8.20it/s][A
Training:   7%|▋         | 10/143 [00:01<00:17,  7.46it/s][A
Training:   9%|▉         | 13/143 [00:02<00:17,  7.32it/s][A
Training:  12%|█▏        | 17/143 [00:02<00:15,  8.21it/s][A
Training:  15%|█▍        | 21/143 [00:02<00:13,  9.23it/s][A
Training:  17%|█▋        | 25/143 [00:03<00:12,  9.21it/s][A
Training:  20%|█▉        | 28/143 [00:03<00:10, 11.04it/s][A
Training:  21%|██        | 30/143 [00:03<00:12,  9.03it/s][A
Training:  23%|██▎       | 33/143 [00:04<00:11,  9.38it/s][A
Training:  24%|██▍       | 35/143 [00:04<00:11,  9.65it/s][A
Training:  26%|██▌       | 37/143 [00:04<00:11,  9.63it/s][A
Training:  27%|██▋       | 39/143 [00:04<00:11,  9.09it/s][A
Training:  29%|██▊       | 41/143 [00:04<00:10,  9.57it/s][A
Training:  30%|███ 

Epoch: 41/48 - Loss: 0.2242 - Accuracy: 0.9609



  0%|          | 0/18 [00:00<?, ?it/s][A
  6%|▌         | 1/18 [00:00<00:11,  1.42it/s][A
 28%|██▊       | 5/18 [00:01<00:02,  5.07it/s][A
 50%|█████     | 9/18 [00:01<00:01,  6.40it/s][A
 72%|███████▏  | 13/18 [00:02<00:00,  7.25it/s][A
100%|██████████| 18/18 [00:02<00:00,  7.25it/s][A
Epochs:  85%|████████▌ | 41/48 [12:25<02:07, 18.28s/it]

Val Loss: 0.2418 - Val Accuracy: 0.9574



Training:   0%|          | 0/143 [00:00<?, ?it/s][A
Training:   1%|          | 1/143 [00:00<01:27,  1.61it/s][A
Training:   3%|▎         | 5/143 [00:01<00:25,  5.50it/s][A
Training:   6%|▋         | 9/143 [00:01<00:18,  7.07it/s][A
Training:   9%|▉         | 13/143 [00:01<00:17,  7.59it/s][A
Training:  12%|█▏        | 17/143 [00:02<00:15,  8.19it/s][A
Training:  15%|█▍        | 21/143 [00:02<00:13,  9.02it/s][A
Training:  17%|█▋        | 25/143 [00:03<00:12,  9.52it/s][A
Training:  20%|██        | 29/143 [00:03<00:11,  9.61it/s][A
Training:  22%|██▏       | 32/143 [00:03<00:10, 10.62it/s][A
Training:  24%|██▍       | 34/143 [00:03<00:10, 10.12it/s][A
Training:  25%|██▌       | 36/143 [00:04<00:10, 10.41it/s][A
Training:  27%|██▋       | 38/143 [00:04<00:11,  9.40it/s][A
Training:  28%|██▊       | 40/143 [00:04<00:10,  9.99it/s][A
Training:  29%|██▉       | 42/143 [00:04<00:11,  8.59it/s][A
Training:  31%|███       | 44/143 [00:05<00:10,  9.85it/s][A
Training:  32%|███▏

Epoch: 42/48 - Loss: 0.2284 - Accuracy: 0.9621



  0%|          | 0/18 [00:00<?, ?it/s][A
  6%|▌         | 1/18 [00:00<00:11,  1.48it/s][A
 28%|██▊       | 5/18 [00:01<00:02,  5.49it/s][A
 50%|█████     | 9/18 [00:01<00:01,  7.02it/s][A
 72%|███████▏  | 13/18 [00:01<00:00,  7.81it/s][A
100%|██████████| 18/18 [00:02<00:00,  7.61it/s][A
Epochs:  88%|████████▊ | 42/48 [12:43<01:48, 18.15s/it]

Val Loss: 0.3312 - Val Accuracy: 0.9603



Training:   0%|          | 0/143 [00:00<?, ?it/s][A
Training:   1%|          | 1/143 [00:00<01:27,  1.62it/s][A
Training:   3%|▎         | 5/143 [00:01<00:26,  5.27it/s][A
Training:   6%|▋         | 9/143 [00:01<00:19,  6.96it/s][A
Training:   9%|▉         | 13/143 [00:01<00:16,  7.73it/s][A
Training:  12%|█▏        | 17/143 [00:02<00:15,  8.09it/s][A
Training:  15%|█▍        | 21/143 [00:02<00:14,  8.71it/s][A
Training:  17%|█▋        | 25/143 [00:03<00:12,  9.44it/s][A
Training:  20%|█▉        | 28/143 [00:03<00:10, 11.43it/s][A
Training:  21%|██        | 30/143 [00:03<00:12,  9.23it/s][A
Training:  23%|██▎       | 33/143 [00:04<00:12,  8.83it/s][A
Training:  26%|██▌       | 37/143 [00:04<00:11,  8.92it/s][A
Training:  29%|██▊       | 41/143 [00:04<00:11,  9.01it/s][A
Training:  31%|███▏      | 45/143 [00:05<00:10,  9.60it/s][A
Training:  34%|███▍      | 49/143 [00:05<00:09,  9.80it/s][A
Training:  37%|███▋      | 53/143 [00:06<00:09,  9.71it/s][A
Training:  40%|███▉

Epoch: 43/48 - Loss: 0.2426 - Accuracy: 0.9624



  0%|          | 0/18 [00:00<?, ?it/s][A
  6%|▌         | 1/18 [00:00<00:11,  1.49it/s][A
 28%|██▊       | 5/18 [00:01<00:02,  5.15it/s][A
 50%|█████     | 9/18 [00:01<00:01,  6.76it/s][A
 72%|███████▏  | 13/18 [00:01<00:00,  7.78it/s][A
 78%|███████▊  | 14/18 [00:02<00:00,  7.97it/s][A
100%|██████████| 18/18 [00:02<00:00,  7.41it/s][A
Epochs:  90%|████████▉ | 43/48 [13:01<01:30, 18.15s/it]

Val Loss: 0.2466 - Val Accuracy: 0.9626



Training:   0%|          | 0/143 [00:00<?, ?it/s][A
Training:   1%|          | 1/143 [00:00<01:17,  1.84it/s][A
Training:   3%|▎         | 5/143 [00:00<00:24,  5.67it/s][A
Training:   6%|▌         | 8/143 [00:01<00:14,  9.21it/s][A
Training:   7%|▋         | 10/143 [00:01<00:18,  7.34it/s][A
Training:   9%|▉         | 13/143 [00:01<00:17,  7.51it/s][A
Training:  10%|█         | 15/143 [00:01<00:14,  9.04it/s][A
Training:  12%|█▏        | 17/143 [00:02<00:16,  7.81it/s][A
Training:  14%|█▍        | 20/143 [00:02<00:11, 10.76it/s][A
Training:  15%|█▌        | 22/143 [00:02<00:14,  8.55it/s][A
Training:  17%|█▋        | 25/143 [00:03<00:13,  8.80it/s][A
Training:  20%|██        | 29/143 [00:03<00:13,  8.73it/s][A
Training:  23%|██▎       | 33/143 [00:04<00:12,  8.78it/s][A
Training:  26%|██▌       | 37/143 [00:04<00:11,  9.30it/s][A
Training:  29%|██▊       | 41/143 [00:04<00:11,  9.24it/s][A
Training:  31%|███       | 44/143 [00:04<00:08, 11.10it/s][A
Training:  32%|███▏

Epoch: 44/48 - Loss: 0.2208 - Accuracy: 0.9628



  0%|          | 0/18 [00:00<?, ?it/s][A
  6%|▌         | 1/18 [00:00<00:11,  1.46it/s][A
 28%|██▊       | 5/18 [00:01<00:02,  5.25it/s][A
 50%|█████     | 9/18 [00:01<00:01,  6.93it/s][A
 72%|███████▏  | 13/18 [00:02<00:00,  7.46it/s][A
100%|██████████| 18/18 [00:02<00:00,  7.29it/s][A
Epochs:  92%|█████████▏| 44/48 [13:19<01:12, 18.10s/it]

Val Loss: 0.4099 - Val Accuracy: 0.9422



Training:   0%|          | 0/143 [00:00<?, ?it/s][A
Training:   1%|          | 1/143 [00:00<01:22,  1.72it/s][A
Training:   3%|▎         | 5/143 [00:01<00:24,  5.55it/s][A
Training:   6%|▋         | 9/143 [00:01<00:19,  6.87it/s][A
Training:   9%|▉         | 13/143 [00:01<00:16,  7.79it/s][A
Training:  12%|█▏        | 17/143 [00:02<00:15,  8.32it/s][A
Training:  15%|█▍        | 21/143 [00:02<00:14,  8.70it/s][A
Training:  17%|█▋        | 25/143 [00:03<00:12,  9.30it/s][A
Training:  20%|██        | 29/143 [00:03<00:11,  9.62it/s][A
Training:  23%|██▎       | 33/143 [00:04<00:12,  9.00it/s][A
Training:  26%|██▌       | 37/143 [00:04<00:11,  9.11it/s][A
Training:  29%|██▊       | 41/143 [00:04<00:11,  9.01it/s][A
Training:  31%|███▏      | 45/143 [00:05<00:10,  9.36it/s][A
Training:  34%|███▍      | 49/143 [00:05<00:10,  9.26it/s][A
Training:  37%|███▋      | 53/143 [00:06<00:09,  9.77it/s][A
Training:  40%|███▉      | 57/143 [00:06<00:08,  9.94it/s][A
Training:  42%|████

Epoch: 45/48 - Loss: 0.2413 - Accuracy: 0.9635



  0%|          | 0/18 [00:00<?, ?it/s][A
  6%|▌         | 1/18 [00:00<00:10,  1.60it/s][A
 28%|██▊       | 5/18 [00:01<00:02,  5.43it/s][A
 50%|█████     | 9/18 [00:01<00:01,  6.64it/s][A
 72%|███████▏  | 13/18 [00:02<00:00,  7.44it/s][A
100%|██████████| 18/18 [00:02<00:00,  7.35it/s][A
Epochs:  94%|█████████▍| 45/48 [13:37<00:54, 18.06s/it]

Val Loss: 0.4293 - Val Accuracy: 0.9462



Training:   0%|          | 0/143 [00:00<?, ?it/s][A
Training:   1%|          | 1/143 [00:00<01:24,  1.68it/s][A
Training:   3%|▎         | 5/143 [00:00<00:23,  5.85it/s][A
Training:   6%|▋         | 9/143 [00:01<00:18,  7.11it/s][A
Training:   9%|▉         | 13/143 [00:01<00:17,  7.64it/s][A
Training:  12%|█▏        | 17/143 [00:02<00:15,  8.12it/s][A
Training:  15%|█▍        | 21/143 [00:02<00:13,  8.75it/s][A
Training:  17%|█▋        | 25/143 [00:03<00:12,  9.12it/s][A
Training:  20%|█▉        | 28/143 [00:03<00:10, 10.96it/s][A
Training:  21%|██        | 30/143 [00:03<00:11,  9.57it/s][A
Training:  23%|██▎       | 33/143 [00:04<00:12,  8.75it/s][A
Training:  26%|██▌       | 37/143 [00:04<00:11,  9.13it/s][A
Training:  29%|██▊       | 41/143 [00:04<00:10,  9.35it/s][A
Training:  31%|███▏      | 45/143 [00:05<00:10,  9.29it/s][A
Training:  34%|███▍      | 49/143 [00:05<00:10,  8.93it/s][A
Training:  37%|███▋      | 53/143 [00:06<00:09,  9.20it/s][A
Training:  40%|███▉

Epoch: 46/48 - Loss: 0.2550 - Accuracy: 0.9621



  0%|          | 0/18 [00:00<?, ?it/s][A
  6%|▌         | 1/18 [00:00<00:11,  1.49it/s][A
 28%|██▊       | 5/18 [00:01<00:02,  5.20it/s][A
 44%|████▍     | 8/18 [00:01<00:01,  8.31it/s][A
 56%|█████▌    | 10/18 [00:01<00:01,  7.38it/s][A
 67%|██████▋   | 12/18 [00:01<00:00,  9.15it/s][A
 78%|███████▊  | 14/18 [00:01<00:00,  7.95it/s][A
100%|██████████| 18/18 [00:02<00:00,  7.44it/s][A
Epochs:  96%|█████████▌| 46/48 [13:56<00:36, 18.11s/it]

Val Loss: 0.3929 - Val Accuracy: 0.9547



Training:   0%|          | 0/143 [00:00<?, ?it/s][A
Training:   1%|          | 1/143 [00:00<01:24,  1.68it/s][A
Training:   2%|▏         | 3/143 [00:00<00:29,  4.72it/s][A
Training:   3%|▎         | 5/143 [00:00<00:22,  6.22it/s][A
Training:   5%|▍         | 7/143 [00:01<00:17,  7.59it/s][A
Training:   6%|▋         | 9/143 [00:01<00:18,  7.26it/s][A
Training:   8%|▊         | 11/143 [00:01<00:15,  8.54it/s][A
Training:   9%|▉         | 13/143 [00:01<00:15,  8.61it/s][A
Training:  10%|█         | 15/143 [00:02<00:13,  9.60it/s][A
Training:  12%|█▏        | 17/143 [00:02<00:14,  8.91it/s][A
Training:  13%|█▎        | 19/143 [00:02<00:13,  9.28it/s][A
Training:  15%|█▍        | 21/143 [00:02<00:12, 10.03it/s][A
Training:  16%|█▌        | 23/143 [00:02<00:12,  9.65it/s][A
Training:  17%|█▋        | 25/143 [00:03<00:11,  9.99it/s][A
Training:  19%|█▉        | 27/143 [00:03<00:12,  9.64it/s][A
Training:  20%|██        | 29/143 [00:03<00:11, 10.29it/s][A
Training:  22%|██▏   

Epoch: 47/48 - Loss: 0.2510 - Accuracy: 0.9623



  0%|          | 0/18 [00:00<?, ?it/s][A
  6%|▌         | 1/18 [00:00<00:12,  1.36it/s][A
 28%|██▊       | 5/18 [00:01<00:02,  4.96it/s][A
 44%|████▍     | 8/18 [00:01<00:01,  8.19it/s][A
 56%|█████▌    | 10/18 [00:01<00:01,  7.15it/s][A
 72%|███████▏  | 13/18 [00:02<00:00,  7.25it/s][A
100%|██████████| 18/18 [00:02<00:00,  7.32it/s][A
Epochs:  98%|█████████▊| 47/48 [14:14<00:18, 18.18s/it]

Val Loss: 0.4144 - Val Accuracy: 0.9518



Training:   0%|          | 0/143 [00:00<?, ?it/s][A
Training:   1%|          | 1/143 [00:00<01:32,  1.53it/s][A
Training:   3%|▎         | 5/143 [00:01<00:26,  5.28it/s][A
Training:   6%|▋         | 9/143 [00:01<00:18,  7.19it/s][A
Training:   8%|▊         | 12/143 [00:01<00:14,  9.29it/s][A
Training:  10%|▉         | 14/143 [00:01<00:16,  8.00it/s][A
Training:  11%|█         | 16/143 [00:02<00:14,  9.07it/s][A
Training:  13%|█▎        | 18/143 [00:02<00:15,  8.07it/s][A
Training:  15%|█▍        | 21/143 [00:02<00:14,  8.53it/s][A
Training:  16%|█▌        | 23/143 [00:02<00:12,  9.95it/s][A
Training:  17%|█▋        | 25/143 [00:03<00:13,  8.53it/s][A
Training:  20%|█▉        | 28/143 [00:03<00:11,  9.87it/s][A
Training:  21%|██        | 30/143 [00:03<00:13,  8.50it/s][A
Training:  23%|██▎       | 33/143 [00:04<00:11,  9.21it/s][A
Training:  24%|██▍       | 35/143 [00:04<00:10,  9.92it/s][A
Training:  26%|██▌       | 37/143 [00:04<00:11,  9.40it/s][A
Training:  27%|██▋ 

Epoch: 48/48 - Loss: 0.2206 - Accuracy: 0.9649



  0%|          | 0/18 [00:00<?, ?it/s][A
  6%|▌         | 1/18 [00:00<00:11,  1.54it/s][A
 28%|██▊       | 5/18 [00:01<00:02,  5.04it/s][A
 50%|█████     | 9/18 [00:01<00:01,  6.52it/s][A
 72%|███████▏  | 13/18 [00:02<00:00,  7.49it/s][A
100%|██████████| 18/18 [00:02<00:00,  7.31it/s][A
Epochs: 100%|██████████| 48/48 [14:32<00:00, 18.19s/it]
[32m[I 2023-12-12 00:04:22,557][0m Trial 3 finished with value: 0.9541031718254089 and parameters: {'learning_rate': 0.003494281053007625, 'weight_decay': 0.0001149692699183165, 'epsilon': 9.569821680316825e-09, 'batch_size': 98, 'epochs': 48}. Best is trial 2 with value: 0.9673694372177124.[0m


Val Loss: 0.3561 - Val Accuracy: 0.9541
Learning rate: 0.008903291501466909
Weight decay: 0.0005440025295771077
Epsilon: 7.786125083908577e-08
Batch size: 241
Number of epochs: 27


Epochs:   0%|          | 0/27 [00:00<?, ?it/s]
Training:   0%|          | 0/58 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/58 [00:01<01:24,  1.48s/it][A
Training:   5%|▌         | 3/58 [00:01<00:23,  2.36it/s][A
Training:   9%|▊         | 5/58 [00:02<00:22,  2.34it/s][A
Training:  14%|█▍        | 8/58 [00:02<00:11,  4.46it/s][A
Training:  17%|█▋        | 10/58 [00:03<00:15,  3.08it/s][A
Training:  22%|██▏       | 13/58 [00:04<00:14,  3.18it/s][A
Training:  26%|██▌       | 15/58 [00:04<00:10,  4.12it/s][A
Training:  29%|██▉       | 17/58 [00:05<00:12,  3.21it/s][A
Training:  34%|███▍      | 20/58 [00:05<00:07,  4.81it/s][A
Training:  38%|███▊      | 22/58 [00:06<00:09,  3.66it/s][A
Training:  43%|████▎     | 25/58 [00:07<00:09,  3.40it/s][A
Training:  47%|████▋     | 27/58 [00:07<00:07,  4.31it/s][A
Training:  50%|█████     | 29/58 [00:08<00:08,  3.40it/s][A
Training:  57%|█████▋    | 33/58 [00:09<00:07,  3.55it/s][A
Training:  60%|██████    | 35/58 [00:09<00:05,  4.4

Epoch: 1/27 - Loss: 1.9349 - Accuracy: 0.8507



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:09,  1.31s/it][A
 50%|█████     | 4/8 [00:01<00:01,  3.45it/s][A
100%|██████████| 8/8 [00:02<00:00,  3.39it/s][A
Epochs:   4%|▎         | 1/27 [00:18<07:56, 18.31s/it]

Val Loss: 0.1762 - Val Accuracy: 0.9431



Training:   0%|          | 0/58 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/58 [00:01<01:14,  1.30s/it][A
Training:   9%|▊         | 5/58 [00:02<00:21,  2.50it/s][A
Training:  12%|█▏        | 7/58 [00:02<00:13,  3.68it/s][A
Training:  16%|█▌        | 9/58 [00:03<00:16,  2.92it/s][A
Training:  22%|██▏       | 13/58 [00:04<00:12,  3.58it/s][A
Training:  26%|██▌       | 15/58 [00:04<00:09,  4.47it/s][A
Training:  29%|██▉       | 17/58 [00:05<00:12,  3.42it/s][A
Training:  34%|███▍      | 20/58 [00:05<00:07,  4.95it/s][A
Training:  38%|███▊      | 22/58 [00:06<00:09,  3.77it/s][A
Training:  43%|████▎     | 25/58 [00:07<00:09,  3.47it/s][A
Training:  45%|████▍     | 26/58 [00:07<00:08,  3.81it/s][A
Training:  50%|█████     | 29/58 [00:08<00:08,  3.58it/s][A
Training:  52%|█████▏    | 30/58 [00:08<00:07,  3.88it/s][A
Training:  57%|█████▋    | 33/58 [00:09<00:07,  3.45it/s][A
Training:  62%|██████▏   | 36/58 [00:09<00:04,  4.99it/s][A
Training:  66%|██████▌   | 38/58 [00

Epoch: 2/27 - Loss: 0.1314 - Accuracy: 0.9526



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:08,  1.23s/it][A
100%|██████████| 8/8 [00:02<00:00,  3.43it/s][A
Epochs:   7%|▋         | 2/27 [00:36<07:38, 18.32s/it]

Val Loss: 0.1400 - Val Accuracy: 0.9525



Training:   0%|          | 0/58 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/58 [00:01<01:12,  1.28s/it][A
Training:   9%|▊         | 5/58 [00:02<00:21,  2.46it/s][A
Training:  12%|█▏        | 7/58 [00:02<00:13,  3.66it/s][A
Training:  16%|█▌        | 9/58 [00:03<00:15,  3.08it/s][A
Training:  21%|██        | 12/58 [00:03<00:09,  4.93it/s][A
Training:  24%|██▍       | 14/58 [00:04<00:12,  3.47it/s][A
Training:  28%|██▊       | 16/58 [00:04<00:09,  4.55it/s][A
Training:  31%|███       | 18/58 [00:05<00:11,  3.42it/s][A
Training:  36%|███▌      | 21/58 [00:06<00:11,  3.19it/s][A
Training:  41%|████▏     | 24/58 [00:06<00:07,  4.60it/s][A
Training:  45%|████▍     | 26/58 [00:07<00:08,  3.62it/s][A
Training:  50%|█████     | 29/58 [00:08<00:08,  3.39it/s][A
Training:  57%|█████▋    | 33/58 [00:09<00:07,  3.55it/s][A
Training:  62%|██████▏   | 36/58 [00:09<00:04,  4.79it/s][A
Training:  66%|██████▌   | 38/58 [00:10<00:05,  3.73it/s][A
Training:  71%|███████   | 41/58 [00

Epoch: 3/27 - Loss: 0.1164 - Accuracy: 0.9564



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:08,  1.20s/it][A
 50%|█████     | 4/8 [00:01<00:01,  3.76it/s][A
100%|██████████| 8/8 [00:02<00:00,  3.36it/s][A
Epochs:  11%|█         | 3/27 [00:54<07:19, 18.30s/it]

Val Loss: 0.1417 - Val Accuracy: 0.9557



Training:   0%|          | 0/58 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/58 [00:01<01:17,  1.35s/it][A
Training:   7%|▋         | 4/58 [00:01<00:15,  3.52it/s][A
Training:  10%|█         | 6/58 [00:02<00:19,  2.70it/s][A
Training:  16%|█▌        | 9/58 [00:03<00:16,  2.98it/s][A
Training:  21%|██        | 12/58 [00:03<00:09,  4.71it/s][A
Training:  24%|██▍       | 14/58 [00:04<00:13,  3.29it/s][A
Training:  28%|██▊       | 16/58 [00:04<00:09,  4.28it/s][A
Training:  31%|███       | 18/58 [00:05<00:12,  3.22it/s][A
Training:  36%|███▌      | 21/58 [00:06<00:11,  3.14it/s][A
Training:  43%|████▎     | 25/58 [00:07<00:09,  3.44it/s][A
Training:  48%|████▊     | 28/58 [00:07<00:06,  4.74it/s][A
Training:  52%|█████▏    | 30/58 [00:08<00:07,  3.61it/s][A
Training:  57%|█████▋    | 33/58 [00:09<00:07,  3.47it/s][A
Training:  64%|██████▍   | 37/58 [00:10<00:05,  3.67it/s][A
Training:  69%|██████▉   | 40/58 [00:10<00:03,  4.91it/s][A
Training:  72%|███████▏  | 42/58 [00

Epoch: 4/27 - Loss: 0.1108 - Accuracy: 0.9579



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:08,  1.19s/it][A
 38%|███▊      | 3/8 [00:01<00:01,  2.82it/s][A
100%|██████████| 8/8 [00:02<00:00,  3.44it/s][A
Epochs:  15%|█▍        | 4/27 [01:13<07:01, 18.31s/it]

Val Loss: 0.1389 - Val Accuracy: 0.9478



Training:   0%|          | 0/58 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/58 [00:01<01:07,  1.19s/it][A
Training:   3%|▎         | 2/58 [00:01<00:31,  1.77it/s][A
Training:   9%|▊         | 5/58 [00:02<00:19,  2.74it/s][A
Training:  14%|█▍        | 8/58 [00:02<00:09,  5.04it/s][A
Training:  17%|█▋        | 10/58 [00:03<00:14,  3.37it/s][A
Training:  22%|██▏       | 13/58 [00:04<00:13,  3.22it/s][A
Training:  29%|██▉       | 17/58 [00:05<00:11,  3.54it/s][A
Training:  34%|███▍      | 20/58 [00:05<00:07,  4.93it/s][A
Training:  38%|███▊      | 22/58 [00:06<00:09,  3.76it/s][A
Training:  40%|███▉      | 23/58 [00:06<00:08,  4.13it/s][A
Training:  43%|████▎     | 25/58 [00:07<00:10,  3.13it/s][A
Training:  48%|████▊     | 28/58 [00:07<00:06,  4.68it/s][A
Training:  52%|█████▏    | 30/58 [00:08<00:07,  3.50it/s][A
Training:  57%|█████▋    | 33/58 [00:09<00:07,  3.33it/s][A
Training:  62%|██████▏   | 36/58 [00:09<00:04,  4.71it/s][A
Training:  66%|██████▌   | 38/58 [00

Epoch: 5/27 - Loss: 0.1083 - Accuracy: 0.9608



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:09,  1.30s/it][A
 50%|█████     | 4/8 [00:01<00:01,  3.55it/s][A
100%|██████████| 8/8 [00:02<00:00,  3.40it/s][A
Epochs:  19%|█▊        | 5/27 [01:31<06:41, 18.26s/it]

Val Loss: 0.1241 - Val Accuracy: 0.9572



Training:   0%|          | 0/58 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/58 [00:01<01:12,  1.26s/it][A
Training:   7%|▋         | 4/58 [00:01<00:14,  3.65it/s][A
Training:  10%|█         | 6/58 [00:02<00:18,  2.87it/s][A
Training:  16%|█▌        | 9/58 [00:03<00:17,  2.85it/s][A
Training:  21%|██        | 12/58 [00:03<00:10,  4.47it/s][A
Training:  24%|██▍       | 14/58 [00:04<00:12,  3.58it/s][A
Training:  28%|██▊       | 16/58 [00:04<00:09,  4.66it/s][A
Training:  31%|███       | 18/58 [00:05<00:11,  3.37it/s][A
Training:  34%|███▍      | 20/58 [00:05<00:08,  4.35it/s][A
Training:  38%|███▊      | 22/58 [00:06<00:10,  3.50it/s][A
Training:  43%|████▎     | 25/58 [00:07<00:10,  3.13it/s][A
Training:  48%|████▊     | 28/58 [00:07<00:06,  4.52it/s][A
Training:  52%|█████▏    | 30/58 [00:08<00:08,  3.49it/s][A
Training:  55%|█████▌    | 32/58 [00:08<00:05,  4.43it/s][A
Training:  59%|█████▊    | 34/58 [00:09<00:07,  3.36it/s][A
Training:  62%|██████▏   | 36/58 [00

Epoch: 6/27 - Loss: 0.1063 - Accuracy: 0.9616



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:08,  1.19s/it][A
 38%|███▊      | 3/8 [00:01<00:01,  2.81it/s][A
100%|██████████| 8/8 [00:02<00:00,  3.54it/s][A
Epochs:  22%|██▏       | 6/27 [01:49<06:22, 18.21s/it]

Val Loss: 0.1279 - Val Accuracy: 0.9546



Training:   0%|          | 0/58 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/58 [00:01<01:10,  1.24s/it][A
Training:   9%|▊         | 5/58 [00:02<00:21,  2.43it/s][A
Training:  12%|█▏        | 7/58 [00:02<00:14,  3.56it/s][A
Training:  16%|█▌        | 9/58 [00:03<00:16,  2.94it/s][A
Training:  22%|██▏       | 13/58 [00:04<00:13,  3.43it/s][A
Training:  29%|██▉       | 17/58 [00:05<00:11,  3.44it/s][A
Training:  36%|███▌      | 21/58 [00:06<00:10,  3.61it/s][A
Training:  41%|████▏     | 24/58 [00:06<00:07,  4.77it/s][A
Training:  45%|████▍     | 26/58 [00:07<00:08,  3.77it/s][A
Training:  50%|█████     | 29/58 [00:08<00:08,  3.47it/s][A
Training:  57%|█████▋    | 33/58 [00:09<00:06,  3.67it/s][A
Training:  62%|██████▏   | 36/58 [00:09<00:04,  4.89it/s][A
Training:  66%|██████▌   | 38/58 [00:10<00:05,  3.92it/s][A
Training:  69%|██████▉   | 40/58 [00:10<00:03,  4.64it/s][A
Training:  72%|███████▏  | 42/58 [00:11<00:04,  3.61it/s][A
Training:  78%|███████▊  | 45/58 [00

Epoch: 7/27 - Loss: 0.1014 - Accuracy: 0.9620



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:09,  1.35s/it][A
100%|██████████| 8/8 [00:02<00:00,  3.25it/s][A
Epochs:  26%|██▌       | 7/27 [02:07<06:03, 18.19s/it]

Val Loss: 0.1213 - Val Accuracy: 0.9567



Training:   0%|          | 0/58 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/58 [00:01<01:07,  1.18s/it][A
Training:   5%|▌         | 3/58 [00:01<00:18,  2.90it/s][A
Training:   9%|▊         | 5/58 [00:02<00:21,  2.45it/s][A
Training:  12%|█▏        | 7/58 [00:02<00:13,  3.86it/s][A
Training:  16%|█▌        | 9/58 [00:03<00:16,  3.01it/s][A
Training:  19%|█▉        | 11/58 [00:03<00:10,  4.28it/s][A
Training:  22%|██▏       | 13/58 [00:04<00:14,  3.19it/s][A
Training:  28%|██▊       | 16/58 [00:04<00:08,  4.83it/s][A
Training:  31%|███       | 18/58 [00:05<00:11,  3.39it/s][A
Training:  36%|███▌      | 21/58 [00:06<00:11,  3.21it/s][A
Training:  43%|████▎     | 25/58 [00:07<00:09,  3.43it/s][A
Training:  48%|████▊     | 28/58 [00:07<00:06,  4.68it/s][A
Training:  52%|█████▏    | 30/58 [00:08<00:07,  3.70it/s][A
Training:  55%|█████▌    | 32/58 [00:08<00:05,  4.57it/s][A
Training:  59%|█████▊    | 34/58 [00:09<00:06,  3.62it/s][A
Training:  62%|██████▏   | 36/58 [00:

Epoch: 8/27 - Loss: 0.1054 - Accuracy: 0.9614



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:09,  1.38s/it][A
 38%|███▊      | 3/8 [00:01<00:02,  2.48it/s][A
 62%|██████▎   | 5/8 [00:02<00:01,  2.60it/s][A
100%|██████████| 8/8 [00:02<00:00,  3.31it/s][A
Epochs:  30%|██▉       | 8/27 [02:25<05:45, 18.19s/it]

Val Loss: 0.1255 - Val Accuracy: 0.9588



Training:   0%|          | 0/58 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/58 [00:01<01:12,  1.27s/it][A
Training:   3%|▎         | 2/58 [00:01<00:33,  1.66it/s][A
Training:   9%|▊         | 5/58 [00:02<00:20,  2.60it/s][A
Training:  12%|█▏        | 7/58 [00:02<00:12,  3.92it/s][A
Training:  16%|█▌        | 9/58 [00:03<00:15,  3.21it/s][A
Training:  17%|█▋        | 10/58 [00:03<00:13,  3.63it/s][A
Training:  22%|██▏       | 13/58 [00:04<00:12,  3.47it/s][A
Training:  24%|██▍       | 14/58 [00:04<00:11,  3.76it/s][A
Training:  29%|██▉       | 17/58 [00:05<00:11,  3.62it/s][A
Training:  31%|███       | 18/58 [00:05<00:10,  3.76it/s][A
Training:  36%|███▌      | 21/58 [00:06<00:09,  3.79it/s][A
Training:  38%|███▊      | 22/58 [00:06<00:09,  3.85it/s][A
Training:  43%|████▎     | 25/58 [00:07<00:08,  3.84it/s][A
Training:  45%|████▍     | 26/58 [00:07<00:08,  3.83it/s][A
Training:  50%|█████     | 29/58 [00:08<00:07,  3.75it/s][A
Training:  52%|█████▏    | 30/58 [00:

Epoch: 9/27 - Loss: 0.1051 - Accuracy: 0.9621



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:09,  1.33s/it][A
 50%|█████     | 4/8 [00:01<00:01,  3.56it/s][A
100%|██████████| 8/8 [00:02<00:00,  3.38it/s][A
Epochs:  33%|███▎      | 9/27 [02:44<05:27, 18.18s/it]

Val Loss: 0.1490 - Val Accuracy: 0.9577



Training:   0%|          | 0/58 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/58 [00:01<01:14,  1.31s/it][A
Training:   5%|▌         | 3/58 [00:01<00:21,  2.62it/s][A
Training:   9%|▊         | 5/58 [00:02<00:21,  2.47it/s][A
Training:  12%|█▏        | 7/58 [00:02<00:13,  3.82it/s][A
Training:  16%|█▌        | 9/58 [00:03<00:16,  3.02it/s][A
Training:  19%|█▉        | 11/58 [00:03<00:11,  4.14it/s][A
Training:  22%|██▏       | 13/58 [00:04<00:13,  3.26it/s][A
Training:  26%|██▌       | 15/58 [00:04<00:10,  4.09it/s][A
Training:  29%|██▉       | 17/58 [00:05<00:11,  3.47it/s][A
Training:  33%|███▎      | 19/58 [00:05<00:09,  4.23it/s][A
Training:  36%|███▌      | 21/58 [00:06<00:10,  3.39it/s][A
Training:  40%|███▉      | 23/58 [00:06<00:08,  4.33it/s][A
Training:  43%|████▎     | 25/58 [00:07<00:09,  3.51it/s][A
Training:  47%|████▋     | 27/58 [00:07<00:07,  4.26it/s][A
Training:  50%|█████     | 29/58 [00:08<00:08,  3.56it/s][A
Training:  53%|█████▎    | 31/58 [00:

Epoch: 10/27 - Loss: 0.1150 - Accuracy: 0.9586



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:09,  1.30s/it][A
 50%|█████     | 4/8 [00:01<00:01,  3.63it/s][A
100%|██████████| 8/8 [00:02<00:00,  3.50it/s][A
Epochs:  37%|███▋      | 10/27 [03:02<05:08, 18.13s/it]

Val Loss: 0.1316 - Val Accuracy: 0.9488



Training:   0%|          | 0/58 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/58 [00:01<01:12,  1.28s/it][A
Training:   5%|▌         | 3/58 [00:01<00:21,  2.54it/s][A
Training:   9%|▊         | 5/58 [00:02<00:22,  2.41it/s][A
Training:  14%|█▍        | 8/58 [00:02<00:10,  4.55it/s][A
Training:  17%|█▋        | 10/58 [00:03<00:13,  3.45it/s][A
Training:  21%|██        | 12/58 [00:03<00:09,  4.66it/s][A
Training:  24%|██▍       | 14/58 [00:04<00:12,  3.50it/s][A
Training:  26%|██▌       | 15/58 [00:04<00:10,  3.97it/s][A
Training:  29%|██▉       | 17/58 [00:05<00:12,  3.29it/s][A
Training:  31%|███       | 18/58 [00:05<00:10,  3.78it/s][A
Training:  33%|███▎      | 19/58 [00:05<00:09,  4.14it/s][A
Training:  34%|███▍      | 20/58 [00:05<00:08,  4.48it/s][A
Training:  36%|███▌      | 21/58 [00:06<00:11,  3.20it/s][A
Training:  38%|███▊      | 22/58 [00:06<00:09,  3.65it/s][A
Training:  40%|███▉      | 23/58 [00:06<00:08,  4.29it/s][A
Training:  41%|████▏     | 24/58 [00

Epoch: 11/27 - Loss: 0.1083 - Accuracy: 0.9621



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:08,  1.25s/it][A
 50%|█████     | 4/8 [00:01<00:01,  3.61it/s][A
100%|██████████| 8/8 [00:02<00:00,  3.53it/s][A
Epochs:  41%|████      | 11/27 [03:20<04:49, 18.12s/it]

Val Loss: 0.1440 - Val Accuracy: 0.9577



Training:   0%|          | 0/58 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/58 [00:01<01:20,  1.41s/it][A
Training:   9%|▊         | 5/58 [00:02<00:22,  2.34it/s][A
Training:  14%|█▍        | 8/58 [00:02<00:12,  4.03it/s][A
Training:  17%|█▋        | 10/58 [00:03<00:14,  3.28it/s][A
Training:  22%|██▏       | 13/58 [00:04<00:14,  3.10it/s][A
Training:  28%|██▊       | 16/58 [00:04<00:09,  4.51it/s][A
Training:  31%|███       | 18/58 [00:05<00:11,  3.56it/s][A
Training:  36%|███▌      | 21/58 [00:06<00:10,  3.42it/s][A
Training:  41%|████▏     | 24/58 [00:06<00:07,  4.85it/s][A
Training:  45%|████▍     | 26/58 [00:07<00:08,  3.62it/s][A
Training:  48%|████▊     | 28/58 [00:07<00:06,  4.57it/s][A
Training:  52%|█████▏    | 30/58 [00:08<00:08,  3.48it/s][A
Training:  57%|█████▋    | 33/58 [00:09<00:07,  3.19it/s][A
Training:  64%|██████▍   | 37/58 [00:10<00:06,  3.36it/s][A
Training:  67%|██████▋   | 39/58 [00:10<00:04,  4.14it/s][A
Training:  71%|███████   | 41/58 [0

Epoch: 12/27 - Loss: 0.1038 - Accuracy: 0.9622



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:09,  1.29s/it][A
100%|██████████| 8/8 [00:02<00:00,  3.51it/s][A
Epochs:  44%|████▍     | 12/27 [03:38<04:32, 18.16s/it]

Val Loss: 0.1341 - Val Accuracy: 0.9567



Training:   0%|          | 0/58 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/58 [00:01<01:13,  1.30s/it][A
Training:   9%|▊         | 5/58 [00:02<00:21,  2.47it/s][A
Training:  16%|█▌        | 9/58 [00:03<00:16,  3.06it/s][A
Training:  21%|██        | 12/58 [00:03<00:10,  4.55it/s][A
Training:  24%|██▍       | 14/58 [00:04<00:13,  3.30it/s][A
Training:  29%|██▉       | 17/58 [00:05<00:13,  3.10it/s][A
Training:  33%|███▎      | 19/58 [00:05<00:09,  3.93it/s][A
Training:  36%|███▌      | 21/58 [00:06<00:11,  3.27it/s][A
Training:  43%|████▎     | 25/58 [00:07<00:09,  3.53it/s][A
Training:  47%|████▋     | 27/58 [00:07<00:07,  4.36it/s][A
Training:  50%|█████     | 29/58 [00:08<00:08,  3.51it/s][A
Training:  53%|█████▎    | 31/58 [00:08<00:06,  4.39it/s][A
Training:  57%|█████▋    | 33/58 [00:09<00:07,  3.51it/s][A
Training:  59%|█████▊    | 34/58 [00:09<00:06,  3.89it/s][A
Training:  64%|██████▍   | 37/58 [00:10<00:05,  3.55it/s][A
Training:  66%|██████▌   | 38/58 [0

Epoch: 13/27 - Loss: 0.1025 - Accuracy: 0.9619



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:08,  1.20s/it][A
100%|██████████| 8/8 [00:02<00:00,  3.61it/s][A
Epochs:  48%|████▊     | 13/27 [03:56<04:14, 18.17s/it]

Val Loss: 0.1378 - Val Accuracy: 0.9577



Training:   0%|          | 0/58 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/58 [00:01<01:11,  1.25s/it][A
Training:   9%|▊         | 5/58 [00:02<00:21,  2.41it/s][A
Training:  14%|█▍        | 8/58 [00:02<00:11,  4.29it/s][A
Training:  17%|█▋        | 10/58 [00:03<00:14,  3.23it/s][A
Training:  22%|██▏       | 13/58 [00:04<00:14,  3.12it/s][A
Training:  29%|██▉       | 17/58 [00:05<00:12,  3.40it/s][A
Training:  36%|███▌      | 21/58 [00:06<00:10,  3.53it/s][A
Training:  40%|███▉      | 23/58 [00:06<00:08,  4.28it/s][A
Training:  43%|████▎     | 25/58 [00:07<00:09,  3.54it/s][A
Training:  48%|████▊     | 28/58 [00:07<00:06,  4.99it/s][A
Training:  52%|█████▏    | 30/58 [00:08<00:07,  3.81it/s][A
Training:  57%|█████▋    | 33/58 [00:09<00:07,  3.42it/s][A
Training:  62%|██████▏   | 36/58 [00:09<00:04,  4.77it/s][A
Training:  66%|██████▌   | 38/58 [00:10<00:05,  3.63it/s][A
Training:  71%|███████   | 41/58 [00:11<00:04,  3.41it/s][A
Training:  76%|███████▌  | 44/58 [0

Epoch: 14/27 - Loss: 0.1113 - Accuracy: 0.9613



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:08,  1.22s/it][A
100%|██████████| 8/8 [00:02<00:00,  3.49it/s][A
Epochs:  52%|█████▏    | 14/27 [04:14<03:55, 18.13s/it]

Val Loss: 0.1627 - Val Accuracy: 0.9471



Training:   0%|          | 0/58 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/58 [00:01<01:03,  1.11s/it][A
Training:   3%|▎         | 2/58 [00:01<00:29,  1.92it/s][A
Training:   7%|▋         | 4/58 [00:01<00:12,  4.38it/s][A
Training:  10%|█         | 6/58 [00:02<00:16,  3.10it/s][A
Training:  14%|█▍        | 8/58 [00:02<00:10,  4.56it/s][A
Training:  17%|█▋        | 10/58 [00:03<00:14,  3.26it/s][A
Training:  22%|██▏       | 13/58 [00:04<00:13,  3.33it/s][A
Training:  24%|██▍       | 14/58 [00:04<00:11,  3.72it/s][A
Training:  28%|██▊       | 16/58 [00:04<00:08,  4.98it/s][A
Training:  29%|██▉       | 17/58 [00:05<00:13,  3.08it/s][A
Training:  33%|███▎      | 19/58 [00:05<00:08,  4.36it/s][A
Training:  36%|███▌      | 21/58 [00:06<00:11,  3.29it/s][A
Training:  41%|████▏     | 24/58 [00:06<00:06,  5.10it/s][A
Training:  45%|████▍     | 26/58 [00:07<00:08,  3.58it/s][A
Training:  50%|█████     | 29/58 [00:08<00:08,  3.40it/s][A
Training:  53%|█████▎    | 31/58 [00:

Epoch: 15/27 - Loss: 0.1458 - Accuracy: 0.9543



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:07,  1.05s/it][A
 38%|███▊      | 3/8 [00:01<00:01,  3.12it/s][A
 62%|██████▎   | 5/8 [00:02<00:01,  2.67it/s][A
100%|██████████| 8/8 [00:02<00:00,  3.53it/s][A
Epochs:  56%|█████▌    | 15/27 [04:32<03:36, 18.04s/it]

Val Loss: 0.1944 - Val Accuracy: 0.9531



Training:   0%|          | 0/58 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/58 [00:01<01:04,  1.13s/it][A
Training:   5%|▌         | 3/58 [00:01<00:18,  2.94it/s][A
Training:   9%|▊         | 5/58 [00:02<00:20,  2.56it/s][A
Training:  12%|█▏        | 7/58 [00:02<00:12,  4.00it/s][A
Training:  16%|█▌        | 9/58 [00:03<00:15,  3.09it/s][A
Training:  17%|█▋        | 10/58 [00:03<00:13,  3.43it/s][A
Training:  22%|██▏       | 13/58 [00:04<00:13,  3.43it/s][A
Training:  24%|██▍       | 14/58 [00:04<00:12,  3.56it/s][A
Training:  29%|██▉       | 17/58 [00:05<00:11,  3.63it/s][A
Training:  31%|███       | 18/58 [00:05<00:10,  3.82it/s][A
Training:  36%|███▌      | 21/58 [00:06<00:09,  3.72it/s][A
Training:  38%|███▊      | 22/58 [00:06<00:09,  3.84it/s][A
Training:  43%|████▎     | 25/58 [00:07<00:08,  3.71it/s][A
Training:  45%|████▍     | 26/58 [00:07<00:08,  3.86it/s][A
Training:  48%|████▊     | 28/58 [00:07<00:05,  5.12it/s][A
Training:  50%|█████     | 29/58 [00:

Epoch: 16/27 - Loss: 0.2138 - Accuracy: 0.9461



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:07,  1.09s/it][A
100%|██████████| 8/8 [00:02<00:00,  3.56it/s][A
Epochs:  59%|█████▉    | 16/27 [04:50<03:17, 17.97s/it]

Val Loss: 0.2196 - Val Accuracy: 0.9493



Training:   0%|          | 0/58 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/58 [00:01<01:10,  1.23s/it][A
Training:   9%|▊         | 5/58 [00:02<00:22,  2.41it/s][A
Training:  16%|█▌        | 9/58 [00:03<00:16,  3.05it/s][A
Training:  22%|██▏       | 13/58 [00:04<00:13,  3.29it/s][A
Training:  29%|██▉       | 17/58 [00:05<00:11,  3.44it/s][A
Training:  36%|███▌      | 21/58 [00:06<00:10,  3.52it/s][A
Training:  41%|████▏     | 24/58 [00:06<00:07,  4.58it/s][A
Training:  43%|████▎     | 25/58 [00:07<00:09,  3.51it/s][A
Training:  50%|█████     | 29/58 [00:08<00:07,  3.70it/s][A
Training:  57%|█████▋    | 33/58 [00:09<00:06,  3.81it/s][A
Training:  64%|██████▍   | 37/58 [00:10<00:05,  3.91it/s][A
Training:  67%|██████▋   | 39/58 [00:10<00:04,  4.64it/s][A
Training:  71%|███████   | 41/58 [00:11<00:04,  3.62it/s][A
Training:  76%|███████▌  | 44/58 [00:11<00:02,  4.98it/s][A
Training:  79%|███████▉  | 46/58 [00:12<00:03,  3.86it/s][A
Training:  84%|████████▍ | 49/58 [0

Epoch: 17/27 - Loss: 0.1643 - Accuracy: 0.9510



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:07,  1.12s/it][A
100%|██████████| 8/8 [00:02<00:00,  3.60it/s][A
Epochs:  63%|██████▎   | 17/27 [05:07<02:58, 17.88s/it]

Val Loss: 0.2356 - Val Accuracy: 0.9526



Training:   0%|          | 0/58 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/58 [00:01<01:09,  1.23s/it][A
Training:   7%|▋         | 4/58 [00:01<00:14,  3.83it/s][A
Training:  10%|█         | 6/58 [00:02<00:18,  2.86it/s][A
Training:  16%|█▌        | 9/58 [00:03<00:16,  2.96it/s][A
Training:  21%|██        | 12/58 [00:03<00:09,  4.62it/s][A
Training:  24%|██▍       | 14/58 [00:04<00:12,  3.59it/s][A
Training:  29%|██▉       | 17/58 [00:05<00:11,  3.42it/s][A
Training:  33%|███▎      | 19/58 [00:05<00:09,  4.32it/s][A
Training:  36%|███▌      | 21/58 [00:06<00:10,  3.50it/s][A
Training:  40%|███▉      | 23/58 [00:06<00:07,  4.51it/s][A
Training:  43%|████▎     | 25/58 [00:07<00:09,  3.39it/s][A
Training:  47%|████▋     | 27/58 [00:07<00:07,  4.39it/s][A
Training:  50%|█████     | 29/58 [00:08<00:08,  3.42it/s][A
Training:  52%|█████▏    | 30/58 [00:08<00:07,  3.83it/s][A
Training:  55%|█████▌    | 32/58 [00:08<00:04,  5.21it/s][A
Training:  59%|█████▊    | 34/58 [00

Epoch: 18/27 - Loss: 0.1627 - Accuracy: 0.9565



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:07,  1.10s/it][A
100%|██████████| 8/8 [00:02<00:00,  3.64it/s][A
Epochs:  67%|██████▋   | 18/27 [05:25<02:40, 17.79s/it]

Val Loss: 0.2779 - Val Accuracy: 0.9291



Training:   0%|          | 0/58 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/58 [00:01<01:11,  1.25s/it][A
Training:   9%|▊         | 5/58 [00:02<00:21,  2.44it/s][A
Training:  12%|█▏        | 7/58 [00:02<00:14,  3.61it/s][A
Training:  16%|█▌        | 9/58 [00:03<00:17,  2.77it/s][A
Training:  19%|█▉        | 11/58 [00:03<00:12,  3.89it/s][A
Training:  22%|██▏       | 13/58 [00:04<00:14,  3.10it/s][A
Training:  28%|██▊       | 16/58 [00:04<00:08,  4.78it/s][A
Training:  31%|███       | 18/58 [00:05<00:11,  3.51it/s][A
Training:  36%|███▌      | 21/58 [00:06<00:11,  3.29it/s][A
Training:  41%|████▏     | 24/58 [00:06<00:07,  4.74it/s][A
Training:  45%|████▍     | 26/58 [00:07<00:09,  3.55it/s][A
Training:  50%|█████     | 29/58 [00:08<00:08,  3.41it/s][A
Training:  57%|█████▋    | 33/58 [00:09<00:06,  3.67it/s][A
Training:  62%|██████▏   | 36/58 [00:09<00:04,  4.98it/s][A
Training:  66%|██████▌   | 38/58 [00:10<00:05,  3.63it/s][A
Training:  71%|███████   | 41/58 [00

Epoch: 19/27 - Loss: 0.1547 - Accuracy: 0.9560



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:07,  1.12s/it][A
100%|██████████| 8/8 [00:02<00:00,  3.50it/s][A
Epochs:  70%|███████   | 19/27 [05:43<02:22, 17.85s/it]

Val Loss: 0.2543 - Val Accuracy: 0.9468



Training:   0%|          | 0/58 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/58 [00:01<01:08,  1.20s/it][A
Training:   9%|▊         | 5/58 [00:02<00:19,  2.65it/s][A
Training:  14%|█▍        | 8/58 [00:02<00:10,  4.58it/s][A
Training:  17%|█▋        | 10/58 [00:03<00:14,  3.33it/s][A
Training:  21%|██        | 12/58 [00:03<00:10,  4.47it/s][A
Training:  24%|██▍       | 14/58 [00:04<00:13,  3.26it/s][A
Training:  29%|██▉       | 17/58 [00:05<00:12,  3.24it/s][A
Training:  34%|███▍      | 20/58 [00:05<00:08,  4.63it/s][A
Training:  38%|███▊      | 22/58 [00:06<00:10,  3.57it/s][A
Training:  41%|████▏     | 24/58 [00:06<00:07,  4.42it/s][A
Training:  43%|████▎     | 25/58 [00:07<00:10,  3.07it/s][A
Training:  47%|████▋     | 27/58 [00:07<00:07,  4.17it/s][A
Training:  50%|█████     | 29/58 [00:08<00:09,  3.21it/s][A
Training:  53%|█████▎    | 31/58 [00:08<00:06,  4.15it/s][A
Training:  55%|█████▌    | 32/58 [00:08<00:05,  4.49it/s][A
Training:  57%|█████▋    | 33/58 [0

Epoch: 20/27 - Loss: 0.1774 - Accuracy: 0.9530



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:08,  1.18s/it][A
100%|██████████| 8/8 [00:02<00:00,  3.64it/s][A
Epochs:  74%|███████▍  | 20/27 [06:01<02:04, 17.84s/it]

Val Loss: 0.2655 - Val Accuracy: 0.9417



Training:   0%|          | 0/58 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/58 [00:01<01:05,  1.14s/it][A
Training:   3%|▎         | 2/58 [00:01<00:30,  1.81it/s][A
Training:   7%|▋         | 4/58 [00:01<00:12,  4.17it/s][A
Training:  10%|█         | 6/58 [00:02<00:16,  3.15it/s][A
Training:  14%|█▍        | 8/58 [00:02<00:10,  4.68it/s][A
Training:  17%|█▋        | 10/58 [00:03<00:14,  3.41it/s][A
Training:  21%|██        | 12/58 [00:03<00:10,  4.50it/s][A
Training:  22%|██▏       | 13/58 [00:04<00:14,  3.08it/s][A
Training:  24%|██▍       | 14/58 [00:04<00:12,  3.49it/s][A
Training:  28%|██▊       | 16/58 [00:04<00:08,  5.06it/s][A
Training:  31%|███       | 18/58 [00:05<00:11,  3.47it/s][A
Training:  34%|███▍      | 20/58 [00:05<00:07,  4.81it/s][A
Training:  38%|███▊      | 22/58 [00:06<00:10,  3.39it/s][A
Training:  41%|████▏     | 24/58 [00:06<00:07,  4.45it/s][A
Training:  45%|████▍     | 26/58 [00:07<00:09,  3.53it/s][A
Training:  47%|████▋     | 27/58 [00:

Epoch: 21/27 - Loss: 0.1806 - Accuracy: 0.9551



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:08,  1.24s/it][A
100%|██████████| 8/8 [00:02<00:00,  3.66it/s][A
Epochs:  78%|███████▊  | 21/27 [06:18<01:46, 17.77s/it]

Val Loss: 0.3972 - Val Accuracy: 0.9342



Training:   0%|          | 0/58 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/58 [00:01<01:16,  1.35s/it][A
Training:   9%|▊         | 5/58 [00:02<00:20,  2.53it/s][A
Training:  14%|█▍        | 8/58 [00:02<00:11,  4.46it/s][A
Training:  17%|█▋        | 10/58 [00:03<00:14,  3.26it/s][A
Training:  22%|██▏       | 13/58 [00:04<00:15,  2.98it/s][A
Training:  28%|██▊       | 16/58 [00:04<00:09,  4.34it/s][A
Training:  31%|███       | 18/58 [00:05<00:11,  3.47it/s][A
Training:  36%|███▌      | 21/58 [00:06<00:11,  3.27it/s][A
Training:  43%|████▎     | 25/58 [00:07<00:09,  3.49it/s][A
Training:  50%|█████     | 29/58 [00:08<00:08,  3.61it/s][A
Training:  53%|█████▎    | 31/58 [00:08<00:06,  4.32it/s][A
Training:  57%|█████▋    | 33/58 [00:09<00:07,  3.55it/s][A
Training:  64%|██████▍   | 37/58 [00:10<00:05,  3.66it/s][A
Training:  71%|███████   | 41/58 [00:11<00:04,  3.84it/s][A
Training:  76%|███████▌  | 44/58 [00:11<00:02,  5.07it/s][A
Training:  79%|███████▉  | 46/58 [0

Epoch: 22/27 - Loss: 0.2480 - Accuracy: 0.9506



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:08,  1.24s/it][A
100%|██████████| 8/8 [00:02<00:00,  3.70it/s][A
Epochs:  81%|████████▏ | 22/27 [06:36<01:28, 17.76s/it]

Val Loss: 0.2272 - Val Accuracy: 0.9526



Training:   0%|          | 0/58 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/58 [00:01<01:13,  1.29s/it][A
Training:   5%|▌         | 3/58 [00:01<00:20,  2.68it/s][A
Training:   9%|▊         | 5/58 [00:02<00:21,  2.49it/s][A
Training:  10%|█         | 6/58 [00:02<00:16,  3.07it/s][A
Training:  16%|█▌        | 9/58 [00:03<00:14,  3.36it/s][A
Training:  17%|█▋        | 10/58 [00:03<00:13,  3.66it/s][A
Training:  22%|██▏       | 13/58 [00:04<00:13,  3.38it/s][A
Training:  26%|██▌       | 15/58 [00:04<00:09,  4.47it/s][A
Training:  29%|██▉       | 17/58 [00:05<00:11,  3.44it/s][A
Training:  31%|███       | 18/58 [00:05<00:10,  3.89it/s][A
Training:  36%|███▌      | 21/58 [00:06<00:10,  3.58it/s][A
Training:  38%|███▊      | 22/58 [00:06<00:09,  3.84it/s][A
Training:  43%|████▎     | 25/58 [00:07<00:09,  3.52it/s][A
Training:  47%|████▋     | 27/58 [00:07<00:06,  4.60it/s][A
Training:  50%|█████     | 29/58 [00:08<00:08,  3.51it/s][A
Training:  52%|█████▏    | 30/58 [00:

Epoch: 23/27 - Loss: 0.2786 - Accuracy: 0.9493



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:08,  1.22s/it][A
 38%|███▊      | 3/8 [00:01<00:01,  2.79it/s][A
100%|██████████| 8/8 [00:02<00:00,  3.57it/s][A
Epochs:  85%|████████▌ | 23/27 [06:54<01:11, 17.76s/it]

Val Loss: 0.6086 - Val Accuracy: 0.9265



Training:   0%|          | 0/58 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/58 [00:01<01:12,  1.27s/it][A
Training:   5%|▌         | 3/58 [00:01<00:20,  2.66it/s][A
Training:   9%|▊         | 5/58 [00:02<00:21,  2.45it/s][A
Training:  12%|█▏        | 7/58 [00:02<00:13,  3.90it/s][A
Training:  16%|█▌        | 9/58 [00:03<00:16,  3.00it/s][A
Training:  19%|█▉        | 11/58 [00:03<00:11,  4.25it/s][A
Training:  22%|██▏       | 13/58 [00:04<00:14,  3.13it/s][A
Training:  26%|██▌       | 15/58 [00:04<00:10,  4.27it/s][A
Training:  29%|██▉       | 17/58 [00:05<00:13,  3.11it/s][A
Training:  36%|███▌      | 21/58 [00:06<00:10,  3.41it/s][A
Training:  40%|███▉      | 23/58 [00:06<00:08,  4.30it/s][A
Training:  43%|████▎     | 25/58 [00:07<00:09,  3.56it/s][A
Training:  50%|█████     | 29/58 [00:08<00:08,  3.58it/s][A
Training:  55%|█████▌    | 32/58 [00:08<00:05,  4.92it/s][A
Training:  59%|█████▊    | 34/58 [00:09<00:06,  3.66it/s][A
Training:  64%|██████▍   | 37/58 [00:

Epoch: 24/27 - Loss: 0.3004 - Accuracy: 0.9484



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:08,  1.28s/it][A
 50%|█████     | 4/8 [00:01<00:01,  3.68it/s][A
100%|██████████| 8/8 [00:02<00:00,  3.59it/s][A
Epochs:  89%|████████▉ | 24/27 [07:12<00:53, 17.84s/it]

Val Loss: 0.2322 - Val Accuracy: 0.9537



Training:   0%|          | 0/58 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/58 [00:01<01:14,  1.31s/it][A
Training:   7%|▋         | 4/58 [00:01<00:14,  3.64it/s][A
Training:  10%|█         | 6/58 [00:02<00:18,  2.78it/s][A
Training:  16%|█▌        | 9/58 [00:03<00:15,  3.07it/s][A
Training:  22%|██▏       | 13/58 [00:04<00:12,  3.52it/s][A
Training:  26%|██▌       | 15/58 [00:04<00:10,  4.25it/s][A
Training:  29%|██▉       | 17/58 [00:05<00:11,  3.53it/s][A
Training:  31%|███       | 18/58 [00:05<00:10,  3.92it/s][A
Training:  34%|███▍      | 20/58 [00:05<00:07,  5.00it/s][A
Training:  36%|███▌      | 21/58 [00:06<00:11,  3.33it/s][A
Training:  38%|███▊      | 22/58 [00:06<00:09,  3.76it/s][A
Training:  43%|████▎     | 25/58 [00:07<00:09,  3.60it/s][A
Training:  45%|████▍     | 26/58 [00:07<00:08,  3.94it/s][A
Training:  50%|█████     | 29/58 [00:08<00:08,  3.53it/s][A
Training:  55%|█████▌    | 32/58 [00:08<00:04,  5.32it/s][A
Training:  59%|█████▊    | 34/58 [00

Epoch: 25/27 - Loss: 0.2430 - Accuracy: 0.9541



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:08,  1.28s/it][A
 38%|███▊      | 3/8 [00:01<00:01,  2.55it/s][A
 62%|██████▎   | 5/8 [00:02<00:01,  2.66it/s][A
100%|██████████| 8/8 [00:02<00:00,  3.39it/s][A
Epochs:  93%|█████████▎| 25/27 [07:30<00:35, 17.86s/it]

Val Loss: 0.3262 - Val Accuracy: 0.9488



Training:   0%|          | 0/58 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/58 [00:01<01:09,  1.22s/it][A
Training:   3%|▎         | 2/58 [00:01<00:32,  1.73it/s][A
Training:   9%|▊         | 5/58 [00:02<00:19,  2.71it/s][A
Training:  10%|█         | 6/58 [00:02<00:16,  3.20it/s][A
Training:  16%|█▌        | 9/58 [00:03<00:13,  3.55it/s][A
Training:  17%|█▋        | 10/58 [00:03<00:12,  3.80it/s][A
Training:  22%|██▏       | 13/58 [00:04<00:12,  3.74it/s][A
Training:  24%|██▍       | 14/58 [00:04<00:10,  4.02it/s][A
Training:  28%|██▊       | 16/58 [00:04<00:07,  5.47it/s][A
Training:  29%|██▉       | 17/58 [00:05<00:12,  3.35it/s][A
Training:  31%|███       | 18/58 [00:05<00:10,  3.90it/s][A
Training:  36%|███▌      | 21/58 [00:06<00:10,  3.59it/s][A
Training:  38%|███▊      | 22/58 [00:06<00:08,  4.01it/s][A
Training:  43%|████▎     | 25/58 [00:07<00:09,  3.49it/s][A
Training:  48%|████▊     | 28/58 [00:07<00:05,  5.28it/s][A
Training:  52%|█████▏    | 30/58 [00:

Epoch: 26/27 - Loss: 0.4515 - Accuracy: 0.9467



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:09,  1.30s/it][A
 62%|██████▎   | 5/8 [00:02<00:01,  2.63it/s][A
100%|██████████| 8/8 [00:02<00:00,  3.42it/s][A
Epochs:  96%|█████████▋| 26/27 [07:48<00:17, 17.86s/it]

Val Loss: 0.5486 - Val Accuracy: 0.9326



Training:   0%|          | 0/58 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/58 [00:01<01:18,  1.38s/it][A
Training:   9%|▊         | 5/58 [00:02<00:22,  2.36it/s][A
Training:  16%|█▌        | 9/58 [00:03<00:15,  3.14it/s][A
Training:  21%|██        | 12/58 [00:03<00:09,  4.66it/s][A
Training:  24%|██▍       | 14/58 [00:04<00:13,  3.26it/s][A
Training:  28%|██▊       | 16/58 [00:04<00:10,  4.18it/s][A
Training:  31%|███       | 18/58 [00:05<00:11,  3.45it/s][A
Training:  36%|███▌      | 21/58 [00:06<00:11,  3.27it/s][A
Training:  40%|███▉      | 23/58 [00:06<00:08,  4.18it/s][A
Training:  43%|████▎     | 25/58 [00:07<00:09,  3.32it/s][A
Training:  50%|█████     | 29/58 [00:08<00:08,  3.58it/s][A
Training:  57%|█████▋    | 33/58 [00:09<00:06,  3.81it/s][A
Training:  62%|██████▏   | 36/58 [00:09<00:04,  5.00it/s][A
Training:  66%|██████▌   | 38/58 [00:10<00:05,  3.92it/s][A
Training:  71%|███████   | 41/58 [00:11<00:04,  3.72it/s][A
Training:  74%|███████▍  | 43/58 [0

Epoch: 27/27 - Loss: 1.1070 - Accuracy: 0.9339



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:09,  1.36s/it][A
 50%|█████     | 4/8 [00:01<00:01,  3.50it/s][A
100%|██████████| 8/8 [00:02<00:00,  3.35it/s][A
Epochs: 100%|██████████| 27/27 [08:06<00:00, 18.01s/it]
[32m[I 2023-12-12 00:12:29,151][0m Trial 4 finished with value: 0.9456557035446167 and parameters: {'learning_rate': 0.008903291501466909, 'weight_decay': 0.0005440025295771077, 'epsilon': 7.786125083908577e-08, 'batch_size': 241, 'epochs': 27}. Best is trial 2 with value: 0.9673694372177124.[0m


Val Loss: 1.0486 - Val Accuracy: 0.9457
Learning rate: 0.0009368984847459859
Weight decay: 0.00208747352992348
Epsilon: 1.6491425686354776e-08
Batch size: 163
Number of epochs: 98


Epochs:   0%|          | 0/98 [00:00<?, ?it/s]
Training:   0%|          | 0/86 [00:00<?, ?it/s][A
Training:   1%|          | 1/86 [00:00<01:23,  1.02it/s][A
Training:   6%|▌         | 5/86 [00:01<00:24,  3.29it/s][A
Training:  10%|█         | 9/86 [00:02<00:18,  4.26it/s][A
Training:  15%|█▌        | 13/86 [00:03<00:14,  5.13it/s][A
Training:  20%|█▉        | 17/86 [00:03<00:12,  5.33it/s][A
Training:  23%|██▎       | 20/86 [00:03<00:09,  6.93it/s][A
Training:  26%|██▌       | 22/86 [00:04<00:11,  5.52it/s][A
Training:  29%|██▉       | 25/86 [00:05<00:12,  5.01it/s][A
Training:  33%|███▎      | 28/86 [00:05<00:08,  6.73it/s][A
Training:  35%|███▍      | 30/86 [00:05<00:10,  5.37it/s][A
Training:  38%|███▊      | 33/86 [00:06<00:10,  4.91it/s][A
Training:  42%|████▏     | 36/86 [00:06<00:07,  6.69it/s][A
Training:  44%|████▍     | 38/86 [00:07<00:08,  5.46it/s][A
Training:  48%|████▊     | 41/86 [00:07<00:08,  5.34it/s][A
Training:  51%|█████     | 44/86 [00:08<00:05,  7.

Epoch: 1/98 - Loss: 0.2500 - Accuracy: 0.9029



  0%|          | 0/11 [00:00<?, ?it/s][A
  9%|▉         | 1/11 [00:00<00:09,  1.03it/s][A
 27%|██▋       | 3/11 [00:01<00:02,  3.42it/s][A
 45%|████▌     | 5/11 [00:01<00:01,  3.42it/s][A
100%|██████████| 11/11 [00:02<00:00,  4.68it/s][A
Epochs:   1%|          | 1/98 [00:18<29:09, 18.03s/it]

Val Loss: 0.1293 - Val Accuracy: 0.9537



Training:   0%|          | 0/86 [00:00<?, ?it/s][A
Training:   1%|          | 1/86 [00:00<01:17,  1.10it/s][A
Training:   6%|▌         | 5/86 [00:01<00:22,  3.64it/s][A
Training:   7%|▋         | 6/86 [00:01<00:18,  4.24it/s][A
Training:  10%|█         | 9/86 [00:02<00:16,  4.63it/s][A
Training:  14%|█▍        | 12/86 [00:02<00:10,  7.14it/s][A
Training:  16%|█▋        | 14/86 [00:02<00:12,  5.59it/s][A
Training:  20%|█▉        | 17/86 [00:03<00:12,  5.36it/s][A
Training:  21%|██        | 18/86 [00:03<00:11,  5.67it/s][A
Training:  24%|██▍       | 21/86 [00:04<00:12,  5.38it/s][A
Training:  26%|██▌       | 22/86 [00:04<00:11,  5.62it/s][A
Training:  29%|██▉       | 25/86 [00:04<00:11,  5.43it/s][A
Training:  31%|███▏      | 27/86 [00:05<00:08,  6.67it/s][A
Training:  34%|███▎      | 29/86 [00:05<00:10,  5.19it/s][A
Training:  37%|███▋      | 32/86 [00:05<00:07,  7.47it/s][A
Training:  40%|███▉      | 34/86 [00:06<00:09,  5.47it/s][A
Training:  43%|████▎     | 37/86 [00

Epoch: 2/98 - Loss: 0.1267 - Accuracy: 0.9529



  0%|          | 0/11 [00:00<?, ?it/s][A
  9%|▉         | 1/11 [00:00<00:09,  1.04it/s][A
 45%|████▌     | 5/11 [00:01<00:01,  3.30it/s][A
100%|██████████| 11/11 [00:02<00:00,  4.58it/s][A
Epochs:   2%|▏         | 2/98 [00:35<28:43, 17.95s/it]

Val Loss: 0.1267 - Val Accuracy: 0.9505



Training:   0%|          | 0/86 [00:00<?, ?it/s][A
Training:   1%|          | 1/86 [00:00<01:13,  1.15it/s][A
Training:   2%|▏         | 2/86 [00:00<00:35,  2.38it/s][A
Training:   6%|▌         | 5/86 [00:01<00:20,  3.90it/s][A
Training:   7%|▋         | 6/86 [00:01<00:18,  4.39it/s][A
Training:  10%|█         | 9/86 [00:02<00:15,  4.84it/s][A
Training:  13%|█▎        | 11/86 [00:02<00:11,  6.33it/s][A
Training:  15%|█▌        | 13/86 [00:02<00:13,  5.28it/s][A
Training:  17%|█▋        | 15/86 [00:02<00:10,  6.84it/s][A
Training:  20%|█▉        | 17/86 [00:03<00:13,  5.07it/s][A
Training:  21%|██        | 18/86 [00:03<00:12,  5.56it/s][A
Training:  24%|██▍       | 21/86 [00:04<00:12,  5.12it/s][A
Training:  28%|██▊       | 24/86 [00:04<00:08,  7.36it/s][A
Training:  30%|███       | 26/86 [00:05<00:10,  5.53it/s][A
Training:  34%|███▎      | 29/86 [00:05<00:11,  5.10it/s][A
Training:  38%|███▊      | 33/86 [00:06<00:09,  5.65it/s][A
Training:  43%|████▎     | 37/86 [00:

Epoch: 3/98 - Loss: 0.1121 - Accuracy: 0.9573



  0%|          | 0/11 [00:00<?, ?it/s][A
  9%|▉         | 1/11 [00:01<00:10,  1.00s/it][A
 45%|████▌     | 5/11 [00:01<00:01,  3.38it/s][A
 73%|███████▎  | 8/11 [00:01<00:00,  5.83it/s][A
100%|██████████| 11/11 [00:02<00:00,  4.59it/s][A
Epochs:   2%|▏         | 2/98 [00:53<43:00, 26.88s/it]
[32m[I 2023-12-12 00:13:23,210][0m Trial 5 pruned. [0m


Val Loss: 0.1201 - Val Accuracy: 0.9543
Learning rate: 0.0034193504484732735
Weight decay: 0.0017395839341624465
Epsilon: 4.952790310532769e-09
Batch size: 123
Number of epochs: 73


Epochs:   0%|          | 0/73 [00:00<?, ?it/s]
Training:   0%|          | 0/114 [00:00<?, ?it/s][A
Training:   1%|          | 1/114 [00:00<01:29,  1.26it/s][A
Training:   4%|▍         | 5/114 [00:01<00:25,  4.31it/s][A
Training:   8%|▊         | 9/114 [00:01<00:18,  5.53it/s][A
Training:  11%|█▏        | 13/114 [00:02<00:15,  6.49it/s][A
Training:  15%|█▍        | 17/114 [00:02<00:13,  6.99it/s][A
Training:  18%|█▊        | 21/114 [00:03<00:12,  7.23it/s][A
Training:  22%|██▏       | 25/114 [00:03<00:11,  7.45it/s][A
Training:  25%|██▌       | 29/114 [00:04<00:11,  7.34it/s][A
Training:  29%|██▉       | 33/114 [00:04<00:10,  7.43it/s][A
Training:  32%|███▏      | 37/114 [00:05<00:09,  7.71it/s][A
Training:  36%|███▌      | 41/114 [00:05<00:09,  7.85it/s][A
Training:  39%|███▉      | 45/114 [00:06<00:09,  7.55it/s][A
Training:  43%|████▎     | 49/114 [00:07<00:08,  7.54it/s][A
Training:  46%|████▋     | 53/114 [00:07<00:08,  7.40it/s][A
Training:  50%|█████     | 57/114 [

Epoch: 1/73 - Loss: 0.3056 - Accuracy: 0.9031



  0%|          | 0/15 [00:00<?, ?it/s][A
  7%|▋         | 1/15 [00:00<00:10,  1.31it/s][A
 33%|███▎      | 5/15 [00:01<00:02,  4.51it/s][A
 47%|████▋     | 7/15 [00:01<00:01,  6.37it/s][A
 60%|██████    | 9/15 [00:01<00:01,  5.95it/s][A
 67%|██████▋   | 10/15 [00:01<00:00,  6.35it/s][A
 87%|████████▋ | 13/15 [00:02<00:00,  7.70it/s][A
100%|██████████| 15/15 [00:02<00:00,  6.41it/s][A
Epochs:   1%|▏         | 1/73 [00:17<21:23, 17.82s/it]

Val Loss: 0.1386 - Val Accuracy: 0.9536



Training:   0%|          | 0/114 [00:00<?, ?it/s][A
Training:   1%|          | 1/114 [00:00<01:24,  1.33it/s][A
Training:   4%|▎         | 4/114 [00:00<00:18,  5.86it/s][A
Training:   5%|▌         | 6/114 [00:01<00:21,  5.09it/s][A
Training:   8%|▊         | 9/114 [00:01<00:20,  5.22it/s][A
Training:  11%|█▏        | 13/114 [00:02<00:16,  6.20it/s][A
Training:  15%|█▍        | 17/114 [00:02<00:14,  6.87it/s][A
Training:  18%|█▊        | 20/114 [00:02<00:10,  8.84it/s][A
Training:  19%|█▉        | 22/114 [00:03<00:12,  7.61it/s][A
Training:  22%|██▏       | 25/114 [00:03<00:12,  6.91it/s][A
Training:  25%|██▌       | 29/114 [00:04<00:11,  7.30it/s][A
Training:  29%|██▉       | 33/114 [00:04<00:10,  7.62it/s][A
Training:  32%|███▏      | 37/114 [00:05<00:10,  7.52it/s][A
Training:  36%|███▌      | 41/114 [00:05<00:09,  7.46it/s][A
Training:  39%|███▉      | 45/114 [00:06<00:09,  7.51it/s][A
Training:  43%|████▎     | 49/114 [00:06<00:08,  7.82it/s][A
Training:  46%|████▋

Epoch: 2/73 - Loss: 0.1273 - Accuracy: 0.9550



  0%|          | 0/15 [00:00<?, ?it/s][A
  7%|▋         | 1/15 [00:00<00:11,  1.22it/s][A
 33%|███▎      | 5/15 [00:01<00:02,  4.40it/s][A
 60%|██████    | 9/15 [00:01<00:01,  5.64it/s][A
100%|██████████| 15/15 [00:02<00:00,  6.28it/s][A
Epochs:   3%|▎         | 2/73 [00:35<21:11, 17.91s/it]

Val Loss: 0.1338 - Val Accuracy: 0.9536



Training:   0%|          | 0/114 [00:00<?, ?it/s][A
Training:   1%|          | 1/114 [00:00<01:16,  1.47it/s][A
Training:   4%|▎         | 4/114 [00:00<00:17,  6.17it/s][A
Training:   5%|▌         | 6/114 [00:01<00:21,  5.13it/s][A
Training:   8%|▊         | 9/114 [00:01<00:19,  5.47it/s][A
Training:  11%|█         | 12/114 [00:01<00:12,  8.12it/s][A
Training:  12%|█▏        | 14/114 [00:02<00:14,  6.78it/s][A
Training:  15%|█▍        | 17/114 [00:02<00:15,  6.46it/s][A
Training:  18%|█▊        | 21/114 [00:03<00:12,  7.39it/s][A
Training:  22%|██▏       | 25/114 [00:03<00:11,  7.67it/s][A
Training:  25%|██▌       | 29/114 [00:04<00:10,  8.06it/s][A
Training:  29%|██▉       | 33/114 [00:04<00:10,  8.05it/s][A
Training:  32%|███▏      | 36/114 [00:04<00:07,  9.91it/s][A
Training:  33%|███▎      | 38/114 [00:05<00:09,  8.03it/s][A
Training:  35%|███▌      | 40/114 [00:05<00:08,  9.20it/s][A
Training:  37%|███▋      | 42/114 [00:05<00:10,  7.19it/s][A
Training:  39%|███▉ 

Epoch: 3/73 - Loss: 0.1272 - Accuracy: 0.9530



  0%|          | 0/15 [00:00<?, ?it/s][A
  7%|▋         | 1/15 [00:00<00:11,  1.18it/s][A
 33%|███▎      | 5/15 [00:01<00:02,  4.55it/s][A
 53%|█████▎    | 8/15 [00:01<00:00,  7.36it/s][A
 67%|██████▋   | 10/15 [00:01<00:00,  6.09it/s][A
100%|██████████| 15/15 [00:02<00:00,  6.30it/s][A
Epochs:   3%|▎         | 2/73 [00:53<31:38, 26.74s/it]
[32m[I 2023-12-12 00:14:17,003][0m Trial 6 pruned. [0m


Val Loss: 0.1370 - Val Accuracy: 0.9492
Learning rate: 0.005341483543312573
Weight decay: 0.0007532182516513662
Epsilon: 1.4570935842064741e-08
Batch size: 167
Number of epochs: 96


Epochs:   0%|          | 0/96 [00:00<?, ?it/s]
Training:   0%|          | 0/84 [00:00<?, ?it/s][A
Training:   1%|          | 1/84 [00:00<01:15,  1.10it/s][A
Training:   6%|▌         | 5/84 [00:01<00:22,  3.57it/s][A
Training:  11%|█         | 9/84 [00:02<00:17,  4.26it/s][A
Training:  15%|█▌        | 13/84 [00:03<00:14,  4.89it/s][A
Training:  20%|██        | 17/84 [00:03<00:11,  5.59it/s][A
Training:  25%|██▌       | 21/84 [00:04<00:10,  5.80it/s][A
Training:  30%|██▉       | 25/84 [00:05<00:10,  5.62it/s][A
Training:  35%|███▍      | 29/84 [00:05<00:09,  5.62it/s][A
Training:  39%|███▉      | 33/84 [00:06<00:08,  5.82it/s][A
Training:  44%|████▍     | 37/84 [00:07<00:08,  5.64it/s][A
Training:  46%|████▋     | 39/84 [00:07<00:06,  6.43it/s][A
Training:  49%|████▉     | 41/84 [00:07<00:07,  5.39it/s][A
Training:  54%|█████▎    | 45/84 [00:08<00:07,  5.51it/s][A
Training:  57%|█████▋    | 48/84 [00:08<00:05,  7.16it/s][A
Training:  60%|█████▉    | 50/84 [00:09<00:06,  5.

Epoch: 1/96 - Loss: 0.5257 - Accuracy: 0.8786



  0%|          | 0/11 [00:00<?, ?it/s][A
  9%|▉         | 1/11 [00:00<00:09,  1.05it/s][A
 36%|███▋      | 4/11 [00:01<00:01,  4.78it/s][A
 55%|█████▍    | 6/11 [00:01<00:01,  3.85it/s][A
100%|██████████| 11/11 [00:02<00:00,  4.52it/s][A
Epochs:   1%|          | 1/96 [00:17<27:57, 17.65s/it]

Val Loss: 0.1440 - Val Accuracy: 0.9564



Training:   0%|          | 0/84 [00:00<?, ?it/s][A
Training:   1%|          | 1/84 [00:00<01:10,  1.17it/s][A
Training:   5%|▍         | 4/84 [00:00<00:15,  5.29it/s][A
Training:   7%|▋         | 6/84 [00:01<00:18,  4.29it/s][A
Training:  11%|█         | 9/84 [00:02<00:16,  4.55it/s][A
Training:  12%|█▏        | 10/84 [00:02<00:15,  4.80it/s][A
Training:  15%|█▌        | 13/84 [00:02<00:14,  4.85it/s][A
Training:  18%|█▊        | 15/84 [00:03<00:11,  6.13it/s][A
Training:  20%|██        | 17/84 [00:03<00:12,  5.34it/s][A
Training:  25%|██▌       | 21/84 [00:04<00:10,  5.76it/s][A
Training:  30%|██▉       | 25/84 [00:04<00:10,  5.75it/s][A
Training:  33%|███▎      | 28/84 [00:04<00:07,  7.46it/s][A
Training:  36%|███▌      | 30/84 [00:05<00:09,  5.83it/s][A
Training:  39%|███▉      | 33/84 [00:06<00:09,  5.50it/s][A
Training:  43%|████▎     | 36/84 [00:06<00:06,  7.33it/s][A
Training:  45%|████▌     | 38/84 [00:07<00:08,  5.40it/s][A
Training:  49%|████▉     | 41/84 [00

Epoch: 2/96 - Loss: 0.1384 - Accuracy: 0.9493



  0%|          | 0/11 [00:00<?, ?it/s][A
  9%|▉         | 1/11 [00:01<00:10,  1.04s/it][A
 45%|████▌     | 5/11 [00:01<00:01,  3.33it/s][A
100%|██████████| 11/11 [00:02<00:00,  4.41it/s][A
Epochs:   2%|▏         | 2/96 [00:35<27:28, 17.54s/it]

Val Loss: 0.1290 - Val Accuracy: 0.9570



Training:   0%|          | 0/84 [00:00<?, ?it/s][A
Training:   1%|          | 1/84 [00:00<01:16,  1.08it/s][A
Training:   6%|▌         | 5/84 [00:01<00:20,  3.87it/s][A
Training:  10%|▉         | 8/84 [00:01<00:11,  6.52it/s][A
Training:  12%|█▏        | 10/84 [00:02<00:14,  5.01it/s][A
Training:  14%|█▍        | 12/84 [00:02<00:11,  6.47it/s][A
Training:  17%|█▋        | 14/84 [00:02<00:13,  5.06it/s][A
Training:  20%|██        | 17/84 [00:03<00:13,  5.15it/s][A
Training:  21%|██▏       | 18/84 [00:03<00:11,  5.54it/s][A
Training:  25%|██▌       | 21/84 [00:04<00:11,  5.70it/s][A
Training:  26%|██▌       | 22/84 [00:04<00:10,  6.03it/s][A
Training:  30%|██▉       | 25/84 [00:04<00:09,  5.96it/s][A
Training:  31%|███       | 26/84 [00:04<00:10,  5.78it/s][A
Training:  35%|███▍      | 29/84 [00:05<00:09,  5.90it/s][A
Training:  36%|███▌      | 30/84 [00:05<00:09,  5.80it/s][A
Training:  39%|███▉      | 33/84 [00:06<00:08,  6.37it/s][A
Training:  40%|████      | 34/84 [0

Epoch: 3/96 - Loss: 0.1199 - Accuracy: 0.9560



  0%|          | 0/11 [00:00<?, ?it/s][A
  9%|▉         | 1/11 [00:01<00:10,  1.02s/it][A
 45%|████▌     | 5/11 [00:01<00:01,  3.38it/s][A
100%|██████████| 11/11 [00:02<00:00,  4.43it/s][A
Epochs:   3%|▎         | 3/96 [00:52<27:05, 17.48s/it]

Val Loss: 0.1271 - Val Accuracy: 0.9520



Training:   0%|          | 0/84 [00:00<?, ?it/s][A
Training:   1%|          | 1/84 [00:00<01:20,  1.04it/s][A
Training:   2%|▏         | 2/84 [00:01<00:38,  2.12it/s][A
Training:   6%|▌         | 5/84 [00:01<00:21,  3.73it/s][A
Training:   8%|▊         | 7/84 [00:01<00:13,  5.52it/s][A
Training:  11%|█         | 9/84 [00:02<00:15,  4.79it/s][A
Training:  15%|█▌        | 13/84 [00:02<00:13,  5.44it/s][A
Training:  20%|██        | 17/84 [00:03<00:11,  5.72it/s][A
Training:  25%|██▌       | 21/84 [00:04<00:10,  5.88it/s][A
Training:  30%|██▉       | 25/84 [00:04<00:09,  6.12it/s][A
Training:  33%|███▎      | 28/84 [00:04<00:07,  7.60it/s][A
Training:  36%|███▌      | 30/84 [00:05<00:08,  6.11it/s][A
Training:  39%|███▉      | 33/84 [00:06<00:08,  5.79it/s][A
Training:  44%|████▍     | 37/84 [00:06<00:08,  5.65it/s][A
Training:  45%|████▌     | 38/84 [00:06<00:07,  5.94it/s][A
Training:  49%|████▉     | 41/84 [00:07<00:07,  5.55it/s][A
Training:  52%|█████▏    | 44/84 [00:

Epoch: 4/96 - Loss: 0.1202 - Accuracy: 0.9560



  0%|          | 0/11 [00:00<?, ?it/s][A
  9%|▉         | 1/11 [00:01<00:09,  1.00it/s][A
 45%|████▌     | 5/11 [00:01<00:01,  3.21it/s][A
100%|██████████| 11/11 [00:02<00:00,  4.34it/s][A
Epochs:   4%|▍         | 4/96 [01:09<26:46, 17.46s/it]

Val Loss: 0.1238 - Val Accuracy: 0.9554



Training:   0%|          | 0/84 [00:00<?, ?it/s][A
Training:   1%|          | 1/84 [00:01<01:24,  1.02s/it][A
Training:   5%|▍         | 4/84 [00:01<00:17,  4.53it/s][A
Training:   7%|▋         | 6/84 [00:01<00:20,  3.82it/s][A
Training:  11%|█         | 9/84 [00:02<00:17,  4.18it/s][A
Training:  15%|█▌        | 13/84 [00:03<00:14,  5.07it/s][A
Training:  20%|██        | 17/84 [00:03<00:11,  5.79it/s][A
Training:  25%|██▌       | 21/84 [00:04<00:10,  6.03it/s][A
Training:  30%|██▉       | 25/84 [00:04<00:10,  5.85it/s][A
Training:  35%|███▍      | 29/84 [00:05<00:09,  5.98it/s][A
Training:  39%|███▉      | 33/84 [00:06<00:08,  6.22it/s][A
Training:  43%|████▎     | 36/84 [00:06<00:06,  7.72it/s][A
Training:  45%|████▌     | 38/84 [00:06<00:07,  6.28it/s][A
Training:  49%|████▉     | 41/84 [00:07<00:07,  5.42it/s][A
Training:  52%|█████▏    | 44/84 [00:07<00:05,  7.12it/s][A
Training:  55%|█████▍    | 46/84 [00:08<00:06,  5.74it/s][A
Training:  58%|█████▊    | 49/84 [00

Epoch: 5/96 - Loss: 0.1170 - Accuracy: 0.9566



  0%|          | 0/11 [00:00<?, ?it/s][A
  9%|▉         | 1/11 [00:00<00:08,  1.12it/s][A
 36%|███▋      | 4/11 [00:01<00:01,  4.88it/s][A
 55%|█████▍    | 6/11 [00:01<00:01,  3.97it/s][A
 73%|███████▎  | 8/11 [00:01<00:00,  5.56it/s][A
100%|██████████| 11/11 [00:02<00:00,  4.65it/s][A
Epochs:   5%|▌         | 5/96 [01:27<26:23, 17.40s/it]

Val Loss: 0.1539 - Val Accuracy: 0.9439



Training:   0%|          | 0/84 [00:00<?, ?it/s][A
Training:   1%|          | 1/84 [00:00<01:17,  1.07it/s][A
Training:   6%|▌         | 5/84 [00:01<00:22,  3.52it/s][A
Training:  10%|▉         | 8/84 [00:01<00:12,  5.92it/s][A
Training:  12%|█▏        | 10/84 [00:02<00:15,  4.72it/s][A
Training:  15%|█▌        | 13/84 [00:03<00:15,  4.67it/s][A
Training:  20%|██        | 17/84 [00:03<00:12,  5.33it/s][A
Training:  25%|██▌       | 21/84 [00:04<00:10,  5.86it/s][A
Training:  30%|██▉       | 25/84 [00:04<00:10,  5.74it/s][A
Training:  35%|███▍      | 29/84 [00:05<00:09,  5.60it/s][A
Training:  39%|███▉      | 33/84 [00:06<00:08,  5.97it/s][A
Training:  44%|████▍     | 37/84 [00:06<00:07,  6.13it/s][A
Training:  49%|████▉     | 41/84 [00:07<00:07,  5.75it/s][A
Training:  51%|█████     | 43/84 [00:07<00:06,  6.58it/s][A
Training:  54%|█████▎    | 45/84 [00:08<00:06,  5.68it/s][A
Training:  58%|█████▊    | 49/84 [00:08<00:06,  5.77it/s][A
Training:  63%|██████▎   | 53/84 [0

Epoch: 6/96 - Loss: 0.1315 - Accuracy: 0.9547



  0%|          | 0/11 [00:00<?, ?it/s][A
  9%|▉         | 1/11 [00:00<00:09,  1.08it/s][A
 45%|████▌     | 5/11 [00:01<00:01,  3.34it/s][A
100%|██████████| 11/11 [00:02<00:00,  4.42it/s][A
Epochs:   6%|▋         | 6/96 [01:44<26:04, 17.38s/it]

Val Loss: 0.1428 - Val Accuracy: 0.9489



Training:   0%|          | 0/84 [00:00<?, ?it/s][A
Training:   1%|          | 1/84 [00:01<01:27,  1.05s/it][A
Training:   6%|▌         | 5/84 [00:01<00:24,  3.23it/s][A
Training:  11%|█         | 9/84 [00:02<00:17,  4.17it/s][A
Training:  15%|█▌        | 13/84 [00:03<00:15,  4.71it/s][A
Training:  19%|█▉        | 16/84 [00:03<00:10,  6.41it/s][A
Training:  21%|██▏       | 18/84 [00:03<00:12,  5.09it/s][A
Training:  25%|██▌       | 21/84 [00:04<00:12,  5.08it/s][A
Training:  30%|██▉       | 25/84 [00:05<00:10,  5.68it/s][A
Training:  35%|███▍      | 29/84 [00:05<00:09,  5.73it/s][A
Training:  39%|███▉      | 33/84 [00:06<00:08,  5.85it/s][A
Training:  44%|████▍     | 37/84 [00:07<00:07,  6.07it/s][A
Training:  48%|████▊     | 40/84 [00:07<00:05,  7.64it/s][A
Training:  50%|█████     | 42/84 [00:07<00:06,  6.24it/s][A
Training:  54%|█████▎    | 45/84 [00:08<00:06,  5.65it/s][A
Training:  57%|█████▋    | 48/84 [00:08<00:04,  7.40it/s][A
Training:  60%|█████▉    | 50/84 [0

Epoch: 7/96 - Loss: 0.1239 - Accuracy: 0.9573



  0%|          | 0/11 [00:00<?, ?it/s][A
  9%|▉         | 1/11 [00:00<00:09,  1.05it/s][A
 45%|████▌     | 5/11 [00:01<00:01,  3.37it/s][A
100%|██████████| 11/11 [00:02<00:00,  4.47it/s][A
Epochs:   7%|▋         | 7/96 [02:01<25:45, 17.36s/it]

Val Loss: 0.1595 - Val Accuracy: 0.9410



Training:   0%|          | 0/84 [00:00<?, ?it/s][A
Training:   1%|          | 1/84 [00:00<01:18,  1.05it/s][A
Training:   5%|▍         | 4/84 [00:01<00:16,  4.74it/s][A
Training:   7%|▋         | 6/84 [00:01<00:19,  4.06it/s][A
Training:  10%|▉         | 8/84 [00:01<00:13,  5.75it/s][A
Training:  12%|█▏        | 10/84 [00:02<00:17,  4.34it/s][A
Training:  15%|█▌        | 13/84 [00:03<00:15,  4.54it/s][A
Training:  18%|█▊        | 15/84 [00:03<00:11,  5.76it/s][A
Training:  20%|██        | 17/84 [00:03<00:14,  4.75it/s][A
Training:  24%|██▍       | 20/84 [00:03<00:09,  6.61it/s][A
Training:  26%|██▌       | 22/84 [00:04<00:11,  5.26it/s][A
Training:  30%|██▉       | 25/84 [00:05<00:11,  5.32it/s][A
Training:  32%|███▏      | 27/84 [00:05<00:08,  6.51it/s][A
Training:  35%|███▍      | 29/84 [00:05<00:09,  5.57it/s][A
Training:  38%|███▊      | 32/84 [00:05<00:06,  7.94it/s][A
Training:  40%|████      | 34/84 [00:06<00:08,  5.66it/s][A
Training:  44%|████▍     | 37/84 [00

Epoch: 8/96 - Loss: 0.1349 - Accuracy: 0.9549



  0%|          | 0/11 [00:00<?, ?it/s][A
  9%|▉         | 1/11 [00:00<00:09,  1.07it/s][A
 45%|████▌     | 5/11 [00:01<00:01,  3.46it/s][A
100%|██████████| 11/11 [00:02<00:00,  4.61it/s][A
Epochs:   8%|▊         | 8/96 [02:19<25:23, 17.32s/it]

Val Loss: 0.1744 - Val Accuracy: 0.9456



Training:   0%|          | 0/84 [00:00<?, ?it/s][A
Training:   1%|          | 1/84 [00:01<01:27,  1.05s/it][A
Training:   6%|▌         | 5/84 [00:01<00:23,  3.34it/s][A
Training:  10%|▉         | 8/84 [00:01<00:13,  5.68it/s][A
Training:  12%|█▏        | 10/84 [00:02<00:16,  4.46it/s][A
Training:  15%|█▌        | 13/84 [00:03<00:17,  4.17it/s][A
Training:  20%|██        | 17/84 [00:04<00:14,  4.63it/s][A
Training:  24%|██▍       | 20/84 [00:04<00:10,  6.32it/s][A
Training:  26%|██▌       | 22/84 [00:04<00:11,  5.24it/s][A
Training:  30%|██▉       | 25/84 [00:05<00:11,  5.10it/s][A
Training:  35%|███▍      | 29/84 [00:05<00:09,  5.58it/s][A
Training:  39%|███▉      | 33/84 [00:06<00:08,  5.95it/s][A
Training:  42%|████▏     | 35/84 [00:06<00:07,  6.91it/s][A
Training:  44%|████▍     | 37/84 [00:07<00:08,  5.77it/s][A
Training:  49%|████▉     | 41/84 [00:07<00:07,  5.80it/s][A
Training:  54%|█████▎    | 45/84 [00:08<00:06,  5.89it/s][A
Training:  58%|█████▊    | 49/84 [0

Epoch: 9/96 - Loss: 0.1388 - Accuracy: 0.9559



  0%|          | 0/11 [00:00<?, ?it/s][A
  9%|▉         | 1/11 [00:00<00:09,  1.02it/s][A
 36%|███▋      | 4/11 [00:01<00:01,  4.43it/s][A
 55%|█████▍    | 6/11 [00:01<00:01,  3.80it/s][A
 73%|███████▎  | 8/11 [00:01<00:00,  5.32it/s][A
100%|██████████| 11/11 [00:02<00:00,  4.43it/s][A
Epochs:   8%|▊         | 8/96 [02:36<28:43, 19.59s/it]
[32m[I 2023-12-12 00:16:54,086][0m Trial 7 pruned. [0m


Val Loss: 0.1640 - Val Accuracy: 0.9489
Learning rate: 0.023311317528376157
Weight decay: 0.00116289474973586
Epsilon: 2.5173517380909117e-08
Batch size: 53
Number of epochs: 63


Epochs:   0%|          | 0/63 [00:00<?, ?it/s]
Training:   0%|          | 0/264 [00:00<?, ?it/s][A
Training:   0%|          | 1/264 [00:00<01:57,  2.25it/s][A
Training:   2%|▏         | 5/264 [00:00<00:29,  8.81it/s][A
Training:   3%|▎         | 9/264 [00:00<00:21, 11.82it/s][A
Training:   5%|▍         | 13/264 [00:01<00:18, 13.44it/s][A
Training:   6%|▋         | 17/264 [00:01<00:16, 14.87it/s][A
Training:   8%|▊         | 21/264 [00:01<00:16, 15.10it/s][A
Training:   9%|▉         | 25/264 [00:01<00:15, 14.97it/s][A
Training:  11%|█         | 29/264 [00:02<00:15, 15.37it/s][A
Training:  12%|█▎        | 33/264 [00:02<00:14, 15.42it/s][A
Training:  14%|█▍        | 37/264 [00:02<00:14, 15.47it/s][A
Training:  16%|█▌        | 41/264 [00:02<00:13, 16.51it/s][A
Training:  17%|█▋        | 45/264 [00:03<00:12, 17.33it/s][A
Training:  19%|█▊        | 49/264 [00:03<00:12, 17.57it/s][A
Training:  20%|██        | 53/264 [00:03<00:12, 17.57it/s][A
Training:  22%|██▏       | 57/264 [

Epoch: 1/63 - Loss: 5.7018 - Accuracy: 0.8801



  0%|          | 0/33 [00:00<?, ?it/s][A
  3%|▎         | 1/33 [00:00<00:14,  2.15it/s][A
 15%|█▌        | 5/33 [00:00<00:02,  9.38it/s][A
 24%|██▍       | 8/33 [00:00<00:01, 13.53it/s][A
 30%|███       | 10/33 [00:00<00:01, 13.74it/s][A
 39%|███▉      | 13/33 [00:01<00:01, 13.65it/s][A
 52%|█████▏    | 17/33 [00:01<00:01, 15.41it/s][A
 61%|██████    | 20/33 [00:01<00:00, 17.09it/s][A
 67%|██████▋   | 22/33 [00:01<00:00, 16.96it/s][A
 73%|███████▎  | 24/33 [00:01<00:00, 17.08it/s][A
 79%|███████▉  | 26/33 [00:01<00:00, 17.74it/s][A
 85%|████████▍ | 28/33 [00:01<00:00, 16.82it/s][A
 91%|█████████ | 30/33 [00:02<00:00, 17.32it/s][A
100%|██████████| 33/33 [00:02<00:00, 14.46it/s][A
Epochs:   0%|          | 0/63 [00:17<?, ?it/s]
[32m[I 2023-12-12 00:17:12,074][0m Trial 8 pruned. [0m


Val Loss: 1.2338 - Val Accuracy: 0.9404
Learning rate: 0.0010605960903737042
Weight decay: 0.0002773257856992925
Epsilon: 1.6352363585303134e-09
Batch size: 296
Number of epochs: 18


Epochs:   0%|          | 0/18 [00:00<?, ?it/s]
Training:   0%|          | 0/48 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/48 [00:01<01:15,  1.61s/it][A
Training:  10%|█         | 5/48 [00:02<00:21,  2.04it/s][A
Training:  12%|█▎        | 6/48 [00:02<00:17,  2.40it/s][A
Training:  19%|█▉        | 9/48 [00:03<00:14,  2.71it/s][A
Training:  21%|██        | 10/48 [00:04<00:12,  2.96it/s][A
Training:  27%|██▋       | 13/48 [00:05<00:11,  2.98it/s][A
Training:  29%|██▉       | 14/48 [00:05<00:10,  3.24it/s][A
Training:  35%|███▌      | 17/48 [00:06<00:09,  3.22it/s][A
Training:  38%|███▊      | 18/48 [00:06<00:08,  3.51it/s][A
Training:  44%|████▍     | 21/48 [00:07<00:08,  3.35it/s][A
Training:  46%|████▌     | 22/48 [00:07<00:07,  3.70it/s][A
Training:  52%|█████▏    | 25/48 [00:08<00:07,  3.18it/s][A
Training:  54%|█████▍    | 26/48 [00:08<00:06,  3.32it/s][A
Training:  60%|██████    | 29/48 [00:09<00:05,  3.36it/s][A
Training:  62%|██████▎   | 30/48 [00:09<00:04,  3.7

Epoch: 1/18 - Loss: 0.3759 - Accuracy: 0.8644



  0%|          | 0/6 [00:00<?, ?it/s][A
 17%|█▋        | 1/6 [00:01<00:07,  1.52s/it][A
100%|██████████| 6/6 [00:02<00:00,  2.22it/s][A
Epochs:   0%|          | 0/18 [00:17<?, ?it/s]
[32m[I 2023-12-12 00:17:30,298][0m Trial 9 pruned. [0m


Val Loss: 0.1416 - Val Accuracy: 0.9495

Study statistics: 
  Number of finished trials:  10
  Number of pruned trials:  5
  Number of complete trials:  5


In [20]:
print("Best trial:")
trial = study.best_trial

print("  Value: ", trial.value)

print("  Params: ")
for key, value in trial.params.items():
    print("    {}: {}".format(key, value))

Best trial:
  Value:  0.9673694372177124
  Params: 
    batch_size: 249
    epochs: 40
    epsilon: 3.762780786582391e-09
    learning_rate: 0.00010173550281282758
    weight_decay: 0.008588437544705844


In [None]:
# ViT 12-8 CrossEntropyLoss Mean

Best trial:
Value:  0.9673694372177124
Params: 
batch_size: 249
epochs: 40
epsilon: 3.762780786582391e-09
learning_rate: 0.00010173550281282758
weight_decay: 0.008588437544705844