In [1]:
import os
import random
import pandas as pd
import numpy as np
import mxnet as mx
import torch
import torch.nn as nn
import torch.nn.functional as F
import torch.optim as opt
from torch.utils.data import Dataset, DataLoader
from einops import rearrange, repeat
import optuna
from optuna.trial import TrialState
from tqdm import tqdm

In [2]:
def file_to_embed(embeds, file):
    emb = []
    for f in file:
        emb.append(embeds[f][0])
    return torch.stack(emb)

In [3]:
MIN_NUM_PATCHES = 16

In [4]:
device = torch.device("cuda:3" if torch.cuda.is_available() else "cpu")
device

device(type='cuda', index=3)

In [5]:
class AdienceDataset(Dataset):
    def __init__(self, annot_file, img_dir):
        self.img_lbls = pd.read_csv(annot_file, header=None)
        self.img_dir = img_dir
    
    def __len__(self):
        return len(self.img_lbls)
    
    def __getitem__(self, idx):
        img_file = self.img_lbls.iloc[idx, 0]
        img_path = os.path.join(self.img_dir, img_file)
        image = mx.image.imread(img_path)
        if image.shape[1] != 112:
            image = mx.image.resize_short(image, 112)
        image = mx.nd.transpose(image, axes=(2,0,1))
        image = torch.tensor(image.asnumpy()).type(torch.FloatTensor)
        label = self.img_lbls.iloc[idx, 1]

        return image, label, img_file

In [6]:
train_data = AdienceDataset("../train.csv", "../cropped_Adience/")
val_data = AdienceDataset("../val.csv", "../cropped_Adience/")

In [7]:
class CosFace(nn.Module):
    r"""Implement of CosFace (https://arxiv.org/pdf/1801.09414.pdf):
    Args:
        in_features: size of each input sample
        out_features: size of each output sample
        device_id: the ID of GPU where the model will be trained by model parallel.
                       if device_id=None, it will be trained on CPU without model parallel.
        s: norm of input feature
        m: margin
        cos(theta)-m
    """

    def __init__(self, in_features, out_features, device_id, s=64.0, m=0.35):
        super(CosFace, self).__init__()
        self.in_features = in_features
        self.out_features = out_features
        self.device_id = device_id
        self.s = s
        self.m = m
        print("self.device_id", self.device_id)
        self.weight = nn.Parameter(torch.FloatTensor(out_features, in_features))
        nn.init.xavier_uniform_(self.weight)

    def forward(self, input, label):
        # --------------------------- cos(theta) & phi(theta) ---------------------------

        if self.device_id == None:
            cosine = F.linear(F.normalize(input), F.normalize(self.weight))
        else:
            x = input
            sub_weights = torch.chunk(self.weight, len(self.device_id), dim=0)
            temp_x = x.cuda(self.device_id[0])
            weight = sub_weights[0].cuda(self.device_id[0])
            cosine = F.linear(F.normalize(temp_x), F.normalize(weight))
            for i in range(1, len(self.device_id)):
                temp_x = x.cuda(self.device_id[i])
                weight = sub_weights[i].cuda(self.device_id[i])
                cosine = torch.cat((cosine, F.linear(F.normalize(temp_x), F.normalize(weight)).cuda(self.device_id[0])),
                                   dim=1)
        phi = cosine - self.m
        # --------------------------- convert label to one-hot ---------------------------
        one_hot = torch.zeros(cosine.size())
        if self.device_id != None:
            one_hot = one_hot.cuda(self.device_id[0])
        # one_hot = one_hot.cuda() if cosine.is_cuda else one_hot

        one_hot.scatter_(1, label.view(-1, 1).long(), 1)
        # -------------torch.where(out_i = {x_i if condition_i else y_i) -------------
        output = (one_hot * phi) + (
                    (1.0 - one_hot) * cosine)  # you can use torch.where if your torch.__version__ is 0.4
        output *= self.s

        return output

    def __repr__(self):
        return self.__class__.__name__ + '(' \
               + 'in_features = ' + str(self.in_features) \
               + ', out_features = ' + str(self.out_features) \
               + ', s = ' + str(self.s) \
               + ', m = ' + str(self.m) + ')'

In [8]:
class Residual(nn.Module):
    def __init__(self, fn):
        super().__init__()
        self.fn = fn
    def forward(self, x, **kwargs):
        return self.fn(x, **kwargs) + x

In [9]:
class PreNorm(nn.Module):
    def __init__(self, dim, fn):
        super().__init__()
        self.norm = nn.LayerNorm(dim)
        self.fn = fn
    def forward(self, x, **kwargs):
        return self.fn(self.norm(x), **kwargs)

In [10]:
class FeedForward(nn.Module):
    def __init__(self, dim, hidden_dim, dropout = 0.):
        super().__init__()
        self.net = nn.Sequential(
            nn.Linear(dim, hidden_dim),
            nn.GELU(),
            nn.Dropout(dropout),
            nn.Linear(hidden_dim, dim),
            nn.Dropout(dropout)
        )
    def forward(self, x):
        return self.net(x)

In [11]:
class Attention(nn.Module):
    def __init__(self, dim, heads = 8, dim_head = 64, dropout = 0.):
        super().__init__()
        inner_dim = dim_head *  heads
        self.heads = heads
        self.scale = dim ** -0.5

        self.to_qkv = nn.Linear(dim, inner_dim * 3, bias = False)
        self.to_out = nn.Sequential(
            nn.Linear(inner_dim, dim),
            nn.Dropout(dropout)
        )

    def forward(self, x, mask = None):
        b, n, _, h = *x.shape, self.heads
        qkv = self.to_qkv(x).chunk(3, dim = -1)

        q, k, v = map(lambda t: rearrange(t, 'b n (h d) -> b h n d', h = h), qkv)
        dots = torch.einsum('bhid,bhjd->bhij', q, k) * self.scale
        mask_value = -torch.finfo(dots.dtype).max
        #embed()
        if mask is not None:
            mask = F.pad(mask.flatten(1), (1, 0), value = True)
            assert mask.shape[-1] == dots.shape[-1], 'mask has incorrect dimensions'
            mask = mask[:, None, :] * mask[:, :, None]
            dots.masked_fill_(~mask, mask_value)
            del mask

        attn = dots.softmax(dim=-1)

        out = torch.einsum('bhij,bhjd->bhid', attn, v)
        out = rearrange(out, 'b h n d -> b n (h d)')
        out =  self.to_out(out)

        return out

In [12]:
class Transformer(nn.Module):
    def __init__(self, dim, depth, heads, dim_head, mlp_dim, dropout):
        super().__init__()
        self.layers = nn.ModuleList([])
        for _ in range(depth):
            self.layers.append(nn.ModuleList([
                Residual(PreNorm(dim, Attention(dim, heads = heads, dim_head = dim_head, dropout = dropout))),
                Residual(PreNorm(dim, FeedForward(dim, mlp_dim, dropout = dropout)))
            ]))
    def forward(self, x, mask = None):
        for attn, ff in self.layers:
            x = attn(x, mask = mask)
            #embed()
            x = ff(x)
        return x

In [13]:
class ViTs_face(nn.Module):
    def __init__(self, *, loss_type, GPU_ID, num_class, image_size, patch_size, ac_patch_size,
                         pad, dim, depth, heads, mlp_dim, pool = 'mean', channels = 3, dim_head = 64, dropout = 0., emb_dropout = 0.):
        super().__init__()
        assert image_size % patch_size == 0, 'Image dimensions must be divisible by the patch size.'
        num_patches = (image_size // patch_size) ** 2
        patch_dim = channels * ac_patch_size ** 2
        assert num_patches > MIN_NUM_PATCHES, f'your number of patches ({num_patches}) is way too small for attention to be effective (at least 16). Try decreasing your patch size'
        assert pool in {'cls', 'mean'}, 'pool type must be either cls (cls token) or mean (mean pooling)'

        self.patch_size = patch_size
        self.soft_split = nn.Unfold(kernel_size=(ac_patch_size, ac_patch_size), stride=(self.patch_size, self.patch_size), padding=(pad, pad))


        self.pos_embedding = nn.Parameter(torch.randn(1, num_patches + 1, dim))
        self.patch_to_embedding = nn.Linear(patch_dim, dim)
        self.cls_token = nn.Parameter(torch.randn(1, 1, dim))
        self.dropout = nn.Dropout(emb_dropout)

        self.transformer = Transformer(dim, depth, heads, dim_head, mlp_dim, dropout)

        self.pool = pool
        self.to_latent = nn.Identity()

        self.mlp_head = nn.Sequential(
            nn.LayerNorm(dim),
        )
        self.loss_type = loss_type
        self.GPU_ID = GPU_ID
        if self.loss_type == 'None':
            print("no loss for vit_face")
        else:
            if self.loss_type == 'CosFace':
                self.loss = CosFace(in_features=dim, out_features=num_class, device_id=self.GPU_ID)

    def forward(self, img, label= None , mask = None):
        p = self.patch_size
        x = self.soft_split(img).transpose(1, 2)
        x = self.patch_to_embedding(x)
        b, n, _ = x.shape

        cls_tokens = repeat(self.cls_token, '() n d -> b n d', b = b)
        x = torch.cat((cls_tokens, x), dim=1)
        x += self.pos_embedding[:, :(n + 1)]
        x = self.dropout(x)
        x = self.transformer(x, mask)

        # y = x[:, 0]
        z = x[:, 1:].mean(dim = 1)

        # y = self.to_latent(y)
        # emb_y = self.mlp_head(y)
        z = self.to_latent(z)
        emb_z = self.mlp_head(z)
        # emb = torch.cat((emb_y, emb_z), dim=1)
        emb = emb_z
        if label is not None:
            x = self.loss(emb, label)
            return x, emb
        else:
            return emb

In [14]:
class ViT_plus(nn.Module):
    def __init__(self):
        super(ViT_plus, self).__init__()
        
        self.fc1 = nn.Linear(in_features=512, out_features=512)
        self.fc2 = nn.Linear(in_features=512, out_features=2)
        
    def forward(self, x):
        x = self.fc1(x)
        x_cosface = x
        x_classification = self.fc2(x)
        
        return x_cosface, x_classification

In [15]:
model = ViTs_face(
            loss_type='CosFace',
            GPU_ID=[device],
            num_class=93431,
            image_size=112,
            patch_size=8,
            ac_patch_size=12,
            pad=4,
            dim=512,
            depth=20,
            heads=8,
            mlp_dim=2048,
            dropout=0.1,
            emb_dropout=0.1
        ).to(device)
model.load_state_dict(
    torch.load("../Backbone_VITs_Epoch_2_Batch_12000_Time_2021-03-17-04-05_checkpoint.pth", map_location=device)
)

self.device_id [device(type='cuda', index=3)]


<All keys matched successfully>

In [16]:
for param in model.parameters():
    param.requires_grad = False

In [17]:
embeds = {}
model.eval()

with torch.no_grad():
    for img, label, file in train_data:
        img = img.to(device)
        embeds[file] = model(torch.unsqueeze(img, 0))

    for img, label, file in val_data:
        img = img.to(device)
        embeds[file] = model(torch.unsqueeze(img, 0))

In [18]:
best_accu = 0.0
def objective(trial):
    model_xtr = ViT_plus().to(device)
    
    lr = trial.suggest_float("learning_rate", 1e-5, 1e-1, log=True)
    wd = trial.suggest_float('weight_decay', 1e-4, 1e-2, log=True)
    eps = trial.suggest_float("epsilon", 1e-9, 1e-7, log=True)
    optimizer = opt.AdamW(model_xtr.parameters(), lr=lr, eps=eps, weight_decay=wd)
    
    criterion = nn.CrossEntropyLoss()
    
    batch_size = trial.suggest_int('batch_size', 50, 300)
    num_epochs = trial.suggest_int('epochs', 10, 100)
    
    print("Learning rate: "+ str(lr))
    print("Weight decay: "+ str(wd))
    print("Epsilon: "+ str(eps))
    print("Batch size: "+ str(batch_size))
    print("Number of epochs: "+ str(num_epochs))
    
    for epoch in tqdm(range(num_epochs), desc="Epochs"):
        train_loader = DataLoader(train_data, batch_size=batch_size, shuffle=True, num_workers=4)
        val_loader = DataLoader(val_data, batch_size=batch_size, shuffle=False, num_workers=4)
        
        # training loop
        running_loss = []
        running_accu = []
        
        model_xtr.train()
        for img, label, file in tqdm(train_loader, desc="Training", leave=False):
            img, label = img.to(device), label.to(device)

            x = file_to_embed(embeds, file)
            
            optimizer.zero_grad()
            embed, output = model_xtr(x)
            
            pred = torch.argmax(output, 1)
            accuracy = torch.eq(pred, label).sum() / len(img)

            loss = criterion(output, label)
            loss.backward()
            optimizer.step()

            running_accu.append(accuracy.cpu().detach().numpy())
            running_loss.append(loss.cpu().detach().numpy())
        print("Epoch: {}/{} - Loss: {:.4f} - Accuracy: {:.4f}".format(epoch+1, num_epochs, np.mean(running_loss), np.mean(running_accu)))
        
        # validation loop
        val_loss = []
        val_accu = []

        model_xtr.eval()
        with torch.no_grad():
            for img, label, file in tqdm(val_loader):
                img, label = img.to(device), label.to(device)
                
                x = file_to_embed(embeds, file)
                
                embed, output = model_xtr(x)
                
                pred = torch.argmax(output, 1)
                accuracy = torch.eq(pred, label).sum() / len(img)
                
                loss = criterion(output, label)
                
                val_accu.append(accuracy.cpu().detach().numpy())
                val_loss.append(loss.cpu().detach().numpy())
        val_accu = np.mean(val_accu)
        val_loss = np.mean(val_loss)
        print("Val Loss: {:.4f} - Val Accuracy: {:.4f}".format(val_loss, val_accu))
        
        trial.report(val_accu, epoch)
        if trial.should_prune():
            raise optuna.exceptions.TrialPruned()
    
    global best_accu
    if val_accu > best_accu:
        best_accu = val_accu
        print("Saving best model...")
        torch.save(model_xtr.state_dict(), "../vit_12-8_mean_only.pt")
            
    return val_accu

In [19]:
study = optuna.create_study(direction='maximize',
                            study_name='12-8-mean-only-vit-study',
                            storage='sqlite:///study3.db',
                            load_if_exists=True)
study.optimize(objective, n_trials=20)

pruned_trials = study.get_trials(deepcopy=False, states=[TrialState.PRUNED])
complete_trials = study.get_trials(deepcopy=False, states=[TrialState.COMPLETE])

# Display the study statistics
print("\nStudy statistics: ")
print("  Number of finished trials: ", len(study.trials))
print("  Number of pruned trials: ", len(pruned_trials))
print("  Number of complete trials: ", len(complete_trials))

[32m[I 2023-12-14 22:16:04,491][0m A new study created in RDB with name: 12-8-mean-only-vit-study[0m


Learning rate: 0.0033208789761545975
Weight decay: 0.002976249303166988
Epsilon: 8.228177962798885e-08
Batch size: 136
Number of epochs: 68


Epochs:   0%|          | 0/68 [00:00<?, ?it/s]
Training:   0%|          | 0/103 [00:00<?, ?it/s][A
Training:   1%|          | 1/103 [00:00<01:26,  1.18it/s][A
Training:   5%|▍         | 5/103 [00:01<00:23,  4.25it/s][A
Training:   9%|▊         | 9/103 [00:01<00:17,  5.38it/s][A
Training:  13%|█▎        | 13/103 [00:02<00:15,  5.90it/s][A
Training:  17%|█▋        | 17/103 [00:03<00:13,  6.26it/s][A
Training:  20%|██        | 21/103 [00:03<00:13,  6.24it/s][A
Training:  24%|██▍       | 25/103 [00:04<00:12,  6.29it/s][A
Training:  28%|██▊       | 29/103 [00:04<00:11,  6.61it/s][A
Training:  31%|███       | 32/103 [00:05<00:08,  8.24it/s][A
Training:  33%|███▎      | 34/103 [00:05<00:11,  6.10it/s][A
Training:  36%|███▌      | 37/103 [00:06<00:10,  6.04it/s][A
Training:  39%|███▉      | 40/103 [00:06<00:08,  7.82it/s][A
Training:  41%|████      | 42/103 [00:06<00:09,  6.75it/s][A
Training:  44%|████▎     | 45/103 [00:07<00:09,  5.94it/s][A
Training:  48%|████▊     | 49/103 [

Epoch: 1/68 - Loss: 0.4933 - Accuracy: 0.8117



  0%|          | 0/13 [00:00<?, ?it/s][A
  8%|▊         | 1/13 [00:01<00:15,  1.32s/it][A
 31%|███       | 4/13 [00:01<00:02,  3.49it/s][A
 46%|████▌     | 6/13 [00:02<00:02,  2.75it/s][A
 62%|██████▏   | 8/13 [00:02<00:01,  4.10it/s][A
 77%|███████▋  | 10/13 [00:03<00:01,  2.95it/s][A
100%|██████████| 13/13 [00:04<00:00,  3.02it/s][A
Epochs:   1%|▏         | 1/68 [00:22<25:15, 22.62s/it]

Val Loss: 0.2095 - Val Accuracy: 0.9162



Training:   0%|          | 0/103 [00:00<?, ?it/s][A
Training:   1%|          | 1/103 [00:01<02:27,  1.45s/it][A
Training:   3%|▎         | 3/103 [00:01<00:41,  2.42it/s][A
Training:   5%|▍         | 5/103 [00:02<00:40,  2.45it/s][A
Training:   6%|▌         | 6/103 [00:02<00:32,  3.00it/s][A
Training:   9%|▊         | 9/103 [00:03<00:29,  3.18it/s][A
Training:  11%|█         | 11/103 [00:03<00:21,  4.23it/s][A
Training:  13%|█▎        | 13/103 [00:04<00:25,  3.49it/s][A
Training:  14%|█▎        | 14/103 [00:04<00:24,  3.67it/s][A
Training:  17%|█▋        | 17/103 [00:05<00:21,  3.98it/s][A
Training:  17%|█▋        | 18/103 [00:05<00:21,  3.98it/s][A
Training:  19%|█▉        | 20/103 [00:05<00:16,  5.18it/s][A
Training:  20%|██        | 21/103 [00:06<00:23,  3.44it/s][A
Training:  21%|██▏       | 22/103 [00:06<00:21,  3.74it/s][A
Training:  24%|██▍       | 25/103 [00:07<00:20,  3.73it/s][A
Training:  25%|██▌       | 26/103 [00:07<00:19,  3.91it/s][A
Training:  27%|██▋   

Epoch: 2/68 - Loss: 0.2053 - Accuracy: 0.9106



  0%|          | 0/13 [00:00<?, ?it/s][A
  8%|▊         | 1/13 [00:01<00:14,  1.21s/it][A
 31%|███       | 4/13 [00:01<00:02,  3.82it/s][A
 46%|████▌     | 6/13 [00:02<00:02,  3.04it/s][A
 69%|██████▉   | 9/13 [00:03<00:01,  2.98it/s][A
100%|██████████| 13/13 [00:03<00:00,  3.26it/s][A
Epochs:   3%|▎         | 2/68 [00:53<29:56, 27.23s/it]

Val Loss: 0.1793 - Val Accuracy: 0.9197



Training:   0%|          | 0/103 [00:00<?, ?it/s][A
Training:   1%|          | 1/103 [00:01<02:07,  1.25s/it][A
Training:   2%|▏         | 2/103 [00:01<01:09,  1.45it/s][A
Training:   4%|▍         | 4/103 [00:01<00:30,  3.28it/s][A
Training:   5%|▍         | 5/103 [00:02<00:36,  2.71it/s][A
Training:   6%|▌         | 6/103 [00:02<00:37,  2.58it/s][A
Training:   8%|▊         | 8/103 [00:02<00:21,  4.32it/s][A
Training:   9%|▊         | 9/103 [00:03<00:30,  3.04it/s][A
Training:  10%|▉         | 10/103 [00:03<00:30,  3.02it/s][A
Training:  12%|█▏        | 12/103 [00:03<00:19,  4.56it/s][A
Training:  13%|█▎        | 13/103 [00:04<00:29,  3.03it/s][A
Training:  15%|█▍        | 15/103 [00:04<00:20,  4.40it/s][A
Training:  16%|█▌        | 16/103 [00:04<00:18,  4.82it/s][A
Training:  17%|█▋        | 17/103 [00:05<00:31,  2.70it/s][A
Training:  18%|█▊        | 19/103 [00:05<00:22,  3.70it/s][A
Training:  20%|██        | 21/103 [00:06<00:24,  3.35it/s][A
Training:  22%|██▏     

Epoch: 3/68 - Loss: 0.1781 - Accuracy: 0.9274



  0%|          | 0/13 [00:00<?, ?it/s][A
  8%|▊         | 1/13 [00:01<00:15,  1.28s/it][A
 38%|███▊      | 5/13 [00:02<00:03,  2.26it/s][A
 69%|██████▉   | 9/13 [00:03<00:01,  2.82it/s][A
100%|██████████| 13/13 [00:04<00:00,  2.93it/s][A
Epochs:   4%|▍         | 3/68 [01:22<30:38, 28.29s/it]

Val Loss: 0.1644 - Val Accuracy: 0.9325



Training:   0%|          | 0/103 [00:00<?, ?it/s][A
Training:   1%|          | 1/103 [00:01<02:15,  1.33s/it][A
Training:   2%|▏         | 2/103 [00:01<01:15,  1.34it/s][A
Training:   4%|▍         | 4/103 [00:01<00:31,  3.16it/s][A
Training:   5%|▍         | 5/103 [00:02<00:31,  3.13it/s][A
Training:   6%|▌         | 6/103 [00:02<00:39,  2.46it/s][A
Training:   8%|▊         | 8/103 [00:02<00:23,  3.96it/s][A
Training:   9%|▊         | 9/103 [00:03<00:23,  3.96it/s][A
Training:  10%|▉         | 10/103 [00:03<00:30,  3.05it/s][A
Training:  12%|█▏        | 12/103 [00:03<00:20,  4.54it/s][A
Training:  13%|█▎        | 13/103 [00:04<00:24,  3.69it/s][A
Training:  14%|█▎        | 14/103 [00:04<00:25,  3.53it/s][A
Training:  15%|█▍        | 15/103 [00:04<00:22,  3.96it/s][A
Training:  16%|█▌        | 16/103 [00:04<00:18,  4.71it/s][A
Training:  17%|█▋        | 17/103 [00:05<00:22,  3.84it/s][A
Training:  17%|█▋        | 18/103 [00:05<00:22,  3.72it/s][A
Training:  19%|█▉      

Epoch: 4/68 - Loss: 0.1748 - Accuracy: 0.9271



  0%|          | 0/13 [00:00<?, ?it/s][A
  8%|▊         | 1/13 [00:01<00:13,  1.09s/it][A
 15%|█▌        | 2/13 [00:01<00:06,  1.72it/s][A
 38%|███▊      | 5/13 [00:02<00:03,  2.29it/s][A
 54%|█████▍    | 7/13 [00:02<00:01,  3.49it/s][A
 69%|██████▉   | 9/13 [00:03<00:01,  3.05it/s][A
 85%|████████▍ | 11/13 [00:03<00:00,  4.28it/s][A
100%|██████████| 13/13 [00:04<00:00,  3.12it/s][A
Epochs:   6%|▌         | 4/68 [01:51<30:35, 28.67s/it]

Val Loss: 0.2054 - Val Accuracy: 0.9142



Training:   0%|          | 0/103 [00:00<?, ?it/s][A
Training:   1%|          | 1/103 [00:01<02:11,  1.29s/it][A
Training:   2%|▏         | 2/103 [00:01<01:05,  1.55it/s][A
Training:   3%|▎         | 3/103 [00:01<00:43,  2.29it/s][A
Training:   4%|▍         | 4/103 [00:01<00:30,  3.25it/s][A
Training:   5%|▍         | 5/103 [00:02<00:36,  2.66it/s][A
Training:   6%|▌         | 6/103 [00:02<00:35,  2.70it/s][A
Training:   7%|▋         | 7/103 [00:02<00:27,  3.50it/s][A
Training:   9%|▊         | 9/103 [00:03<00:27,  3.42it/s][A
Training:  10%|▉         | 10/103 [00:03<00:26,  3.53it/s][A
Training:  12%|█▏        | 12/103 [00:03<00:17,  5.34it/s][A
Training:  13%|█▎        | 13/103 [00:04<00:27,  3.22it/s][A
Training:  15%|█▍        | 15/103 [00:04<00:18,  4.66it/s][A
Training:  17%|█▋        | 17/103 [00:05<00:20,  4.10it/s][A
Training:  17%|█▋        | 18/103 [00:05<00:21,  3.90it/s][A
Training:  20%|██        | 21/103 [00:06<00:19,  4.14it/s][A
Training:  21%|██▏      

Epoch: 5/68 - Loss: 0.1667 - Accuracy: 0.9312



  0%|          | 0/13 [00:00<?, ?it/s][A
  8%|▊         | 1/13 [00:01<00:13,  1.13s/it][A
 15%|█▌        | 2/13 [00:01<00:06,  1.73it/s][A
 31%|███       | 4/13 [00:01<00:02,  3.96it/s][A
 38%|███▊      | 5/13 [00:02<00:02,  2.84it/s][A
 46%|████▌     | 6/13 [00:02<00:02,  3.16it/s][A
 62%|██████▏   | 8/13 [00:02<00:01,  4.95it/s][A
 69%|██████▉   | 9/13 [00:03<00:01,  3.07it/s][A
 77%|███████▋  | 10/13 [00:03<00:00,  3.13it/s][A
100%|██████████| 13/13 [00:03<00:00,  3.38it/s][A
Epochs:   7%|▋         | 5/68 [02:21<30:24, 28.96s/it]

Val Loss: 0.1703 - Val Accuracy: 0.9237



Training:   0%|          | 0/103 [00:00<?, ?it/s][A
Training:   1%|          | 1/103 [00:01<02:32,  1.49s/it][A
Training:   2%|▏         | 2/103 [00:01<01:09,  1.45it/s][A
Training:   4%|▍         | 4/103 [00:01<00:29,  3.33it/s][A
Training:   5%|▍         | 5/103 [00:02<00:37,  2.60it/s][A
Training:   6%|▌         | 6/103 [00:02<00:33,  2.89it/s][A
Training:   8%|▊         | 8/103 [00:02<00:19,  4.81it/s][A
Training:  10%|▉         | 10/103 [00:03<00:27,  3.41it/s][A
Training:  13%|█▎        | 13/103 [00:04<00:23,  3.76it/s][A
Training:  14%|█▎        | 14/103 [00:04<00:22,  3.92it/s][A
Training:  16%|█▌        | 16/103 [00:04<00:16,  5.39it/s][A
Training:  17%|█▋        | 18/103 [00:05<00:27,  3.11it/s][A
Training:  18%|█▊        | 19/103 [00:05<00:23,  3.51it/s][A
Training:  19%|█▉        | 20/103 [00:06<00:20,  3.96it/s][A
Training:  20%|██        | 21/103 [00:06<00:19,  4.21it/s][A
Training:  21%|██▏       | 22/103 [00:06<00:28,  2.86it/s][A
Training:  24%|██▍    

Epoch: 6/68 - Loss: 0.1624 - Accuracy: 0.9359



  0%|          | 0/13 [00:00<?, ?it/s][A
  8%|▊         | 1/13 [00:01<00:14,  1.20s/it][A
 38%|███▊      | 5/13 [00:02<00:03,  2.58it/s][A
 54%|█████▍    | 7/13 [00:02<00:01,  3.71it/s][A
 69%|██████▉   | 9/13 [00:03<00:01,  3.18it/s][A
 85%|████████▍ | 11/13 [00:03<00:00,  3.96it/s][A
100%|██████████| 13/13 [00:03<00:00,  3.30it/s][A
Epochs:   9%|▉         | 6/68 [02:50<30:08, 29.17s/it]

Val Loss: 0.1545 - Val Accuracy: 0.9303



Training:   0%|          | 0/103 [00:00<?, ?it/s][A
Training:   1%|          | 1/103 [00:01<02:20,  1.37s/it][A
Training:   3%|▎         | 3/103 [00:01<00:40,  2.47it/s][A
Training:   5%|▍         | 5/103 [00:02<00:40,  2.42it/s][A
Training:   7%|▋         | 7/103 [00:02<00:25,  3.74it/s][A
Training:   9%|▊         | 9/103 [00:03<00:31,  3.02it/s][A
Training:  11%|█         | 11/103 [00:03<00:22,  4.12it/s][A
Training:  13%|█▎        | 13/103 [00:04<00:27,  3.24it/s][A
Training:  15%|█▍        | 15/103 [00:04<00:20,  4.33it/s][A
Training:  17%|█▋        | 17/103 [00:05<00:24,  3.52it/s][A
Training:  18%|█▊        | 19/103 [00:05<00:18,  4.51it/s][A
Training:  20%|██        | 21/103 [00:06<00:22,  3.64it/s][A
Training:  23%|██▎       | 24/103 [00:06<00:14,  5.55it/s][A
Training:  25%|██▌       | 26/103 [00:07<00:20,  3.74it/s][A
Training:  26%|██▌       | 27/103 [00:07<00:18,  4.12it/s][A
Training:  28%|██▊       | 29/103 [00:08<00:22,  3.32it/s][A
Training:  30%|███   

Epoch: 7/68 - Loss: 0.1607 - Accuracy: 0.9355



  0%|          | 0/13 [00:00<?, ?it/s][A
  8%|▊         | 1/13 [00:01<00:12,  1.04s/it][A
 23%|██▎       | 3/13 [00:01<00:03,  3.26it/s][A
 38%|███▊      | 5/13 [00:01<00:02,  2.98it/s][A
 62%|██████▏   | 8/13 [00:01<00:00,  5.53it/s][A
 77%|███████▋  | 10/13 [00:02<00:00,  4.40it/s][A
100%|██████████| 13/13 [00:03<00:00,  4.15it/s][A
Epochs:  10%|█         | 7/68 [03:19<29:26, 28.96s/it]

Val Loss: 0.1842 - Val Accuracy: 0.9173



Training:   0%|          | 0/103 [00:00<?, ?it/s][A
Training:   1%|          | 1/103 [00:01<02:06,  1.24s/it][A
Training:   3%|▎         | 3/103 [00:01<00:36,  2.72it/s][A
Training:   5%|▍         | 5/103 [00:02<00:35,  2.75it/s][A
Training:   7%|▋         | 7/103 [00:02<00:22,  4.29it/s][A
Training:   9%|▊         | 9/103 [00:03<00:30,  3.04it/s][A
Training:  11%|█         | 11/103 [00:03<00:21,  4.25it/s][A
Training:  13%|█▎        | 13/103 [00:04<00:27,  3.29it/s][A
Training:  17%|█▋        | 17/103 [00:05<00:22,  3.90it/s][A
Training:  18%|█▊        | 19/103 [00:05<00:17,  4.90it/s][A
Training:  20%|██        | 21/103 [00:05<00:22,  3.72it/s][A
Training:  22%|██▏       | 23/103 [00:06<00:16,  4.73it/s][A
Training:  24%|██▍       | 25/103 [00:06<00:20,  3.82it/s][A
Training:  26%|██▌       | 27/103 [00:07<00:15,  4.93it/s][A
Training:  28%|██▊       | 29/103 [00:07<00:19,  3.84it/s][A
Training:  30%|███       | 31/103 [00:07<00:14,  5.01it/s][A
Training:  32%|███▏  

Epoch: 8/68 - Loss: 0.1541 - Accuracy: 0.9378



  0%|          | 0/13 [00:00<?, ?it/s][A
  8%|▊         | 1/13 [00:01<00:14,  1.20s/it][A
 38%|███▊      | 5/13 [00:02<00:02,  2.76it/s][A
 69%|██████▉   | 9/13 [00:02<00:01,  3.44it/s][A
100%|██████████| 13/13 [00:03<00:00,  3.53it/s][A
Epochs:  12%|█▏        | 8/68 [03:46<28:18, 28.31s/it]

Val Loss: 0.1555 - Val Accuracy: 0.9328



Training:   0%|          | 0/103 [00:00<?, ?it/s][A
Training:   1%|          | 1/103 [00:01<01:50,  1.09s/it][A
Training:   2%|▏         | 2/103 [00:01<00:58,  1.73it/s][A
Training:   5%|▍         | 5/103 [00:02<00:33,  2.91it/s][A
Training:   7%|▋         | 7/103 [00:02<00:22,  4.32it/s][A
Training:   8%|▊         | 8/103 [00:02<00:19,  4.84it/s][A
Training:   9%|▊         | 9/103 [00:02<00:29,  3.22it/s][A
Training:  10%|▉         | 10/103 [00:03<00:24,  3.82it/s][A
Training:  12%|█▏        | 12/103 [00:03<00:17,  5.25it/s][A
Training:  13%|█▎        | 13/103 [00:03<00:25,  3.55it/s][A
Training:  14%|█▎        | 14/103 [00:03<00:21,  4.07it/s][A
Training:  16%|█▌        | 16/103 [00:04<00:16,  5.21it/s][A
Training:  17%|█▋        | 17/103 [00:04<00:23,  3.66it/s][A
Training:  18%|█▊        | 19/103 [00:04<00:15,  5.40it/s][A
Training:  19%|█▉        | 20/103 [00:05<00:16,  5.01it/s][A
Training:  20%|██        | 21/103 [00:05<00:21,  3.83it/s][A
Training:  22%|██▏    

Epoch: 9/68 - Loss: 0.1607 - Accuracy: 0.9341



  0%|          | 0/13 [00:00<?, ?it/s][A
  8%|▊         | 1/13 [00:01<00:14,  1.25s/it][A
 38%|███▊      | 5/13 [00:02<00:03,  2.64it/s][A
 54%|█████▍    | 7/13 [00:02<00:01,  3.83it/s][A
 69%|██████▉   | 9/13 [00:03<00:01,  3.03it/s][A
100%|██████████| 13/13 [00:03<00:00,  3.39it/s][A
Epochs:  13%|█▎        | 9/68 [04:14<27:45, 28.23s/it]

Val Loss: 0.1650 - Val Accuracy: 0.9252



Training:   0%|          | 0/103 [00:00<?, ?it/s][A
Training:   1%|          | 1/103 [00:01<02:18,  1.36s/it][A
Training:   4%|▍         | 4/103 [00:01<00:38,  2.59it/s][A
Training:   5%|▍         | 5/103 [00:02<00:36,  2.71it/s][A
Training:   6%|▌         | 6/103 [00:02<00:30,  3.16it/s][A
Training:   8%|▊         | 8/103 [00:02<00:24,  3.90it/s][A
Training:   9%|▊         | 9/103 [00:03<00:29,  3.22it/s][A
Training:  11%|█         | 11/103 [00:03<00:20,  4.40it/s][A
Training:  12%|█▏        | 12/103 [00:03<00:22,  4.05it/s][A
Training:  13%|█▎        | 13/103 [00:04<00:25,  3.53it/s][A
Training:  14%|█▎        | 14/103 [00:04<00:22,  4.02it/s][A
Training:  16%|█▌        | 16/103 [00:04<00:22,  3.79it/s][A
Training:  17%|█▋        | 17/103 [00:05<00:23,  3.64it/s][A
Training:  18%|█▊        | 19/103 [00:05<00:16,  5.13it/s][A
Training:  19%|█▉        | 20/103 [00:06<00:26,  3.16it/s][A
Training:  20%|██        | 21/103 [00:06<00:22,  3.59it/s][A
Training:  22%|██▏    

Epoch: 10/68 - Loss: 0.1577 - Accuracy: 0.9355



  0%|          | 0/13 [00:00<?, ?it/s][A
  8%|▊         | 1/13 [00:01<00:13,  1.10s/it][A
 23%|██▎       | 3/13 [00:01<00:03,  3.10it/s][A
 38%|███▊      | 5/13 [00:01<00:02,  3.20it/s][A
 46%|████▌     | 6/13 [00:02<00:02,  3.35it/s][A
 62%|██████▏   | 8/13 [00:02<00:00,  5.23it/s][A
 77%|███████▋  | 10/13 [00:03<00:00,  3.42it/s][A
100%|██████████| 13/13 [00:03<00:00,  3.47it/s][A
Epochs:  15%|█▍        | 10/68 [04:44<27:41, 28.65s/it]

Val Loss: 0.2595 - Val Accuracy: 0.8926



Training:   0%|          | 0/103 [00:00<?, ?it/s][A
Training:   1%|          | 1/103 [00:01<02:15,  1.33s/it][A
Training:   4%|▍         | 4/103 [00:01<00:33,  2.94it/s][A
Training:   5%|▍         | 5/103 [00:02<00:46,  2.11it/s][A
Training:   7%|▋         | 7/103 [00:02<00:27,  3.43it/s][A
Training:   8%|▊         | 8/103 [00:02<00:25,  3.70it/s][A
Training:   9%|▊         | 9/103 [00:03<00:35,  2.67it/s][A
Training:  11%|█         | 11/103 [00:03<00:22,  4.06it/s][A
Training:  12%|█▏        | 12/103 [00:03<00:23,  3.95it/s][A
Training:  13%|█▎        | 13/103 [00:04<00:28,  3.11it/s][A
Training:  16%|█▌        | 16/103 [00:05<00:22,  3.90it/s][A
Training:  17%|█▋        | 17/103 [00:05<00:24,  3.52it/s][A
Training:  18%|█▊        | 19/103 [00:05<00:17,  4.70it/s][A
Training:  19%|█▉        | 20/103 [00:05<00:20,  4.14it/s][A
Training:  20%|██        | 21/103 [00:06<00:19,  4.11it/s][A
Training:  22%|██▏       | 23/103 [00:06<00:13,  5.87it/s][A
Training:  23%|██▎    

Epoch: 11/68 - Loss: 0.1526 - Accuracy: 0.9407



  0%|          | 0/13 [00:00<?, ?it/s][A
  8%|▊         | 1/13 [00:01<00:13,  1.09s/it][A
 15%|█▌        | 2/13 [00:01<00:05,  1.96it/s][A
 31%|███       | 4/13 [00:01<00:02,  3.72it/s][A
 38%|███▊      | 5/13 [00:01<00:02,  3.03it/s][A
 46%|████▌     | 6/13 [00:02<00:02,  3.15it/s][A
 62%|██████▏   | 8/13 [00:02<00:01,  4.98it/s][A
 69%|██████▉   | 9/13 [00:02<00:01,  3.79it/s][A
 77%|███████▋  | 10/13 [00:03<00:00,  3.95it/s][A
100%|██████████| 13/13 [00:03<00:00,  3.77it/s][A
Epochs:  16%|█▌        | 11/68 [05:12<27:18, 28.74s/it]

Val Loss: 0.1450 - Val Accuracy: 0.9394



Training:   0%|          | 0/103 [00:00<?, ?it/s][A
Training:   1%|          | 1/103 [00:01<02:12,  1.30s/it][A
Training:   3%|▎         | 3/103 [00:01<00:37,  2.64it/s][A
Training:   5%|▍         | 5/103 [00:02<00:41,  2.37it/s][A
Training:   7%|▋         | 7/103 [00:02<00:25,  3.70it/s][A
Training:   9%|▊         | 9/103 [00:03<00:30,  3.11it/s][A
Training:  11%|█         | 11/103 [00:03<00:21,  4.26it/s][A
Training:  13%|█▎        | 13/103 [00:04<00:24,  3.64it/s][A
Training:  14%|█▎        | 14/103 [00:04<00:21,  4.15it/s][A
Training:  15%|█▍        | 15/103 [00:04<00:19,  4.41it/s][A
Training:  17%|█▋        | 17/103 [00:05<00:26,  3.28it/s][A
Training:  18%|█▊        | 19/103 [00:05<00:18,  4.58it/s][A
Training:  19%|█▉        | 20/103 [00:05<00:17,  4.70it/s][A
Training:  20%|██        | 21/103 [00:06<00:28,  2.92it/s][A
Training:  23%|██▎       | 24/103 [00:06<00:16,  4.71it/s][A
Training:  24%|██▍       | 25/103 [00:07<00:25,  3.05it/s][A
Training:  25%|██▌   

Epoch: 12/68 - Loss: 0.1574 - Accuracy: 0.9360



  0%|          | 0/13 [00:00<?, ?it/s][A
  8%|▊         | 1/13 [00:01<00:16,  1.40s/it][A
 23%|██▎       | 3/13 [00:01<00:04,  2.44it/s][A
 38%|███▊      | 5/13 [00:02<00:02,  2.76it/s][A
 69%|██████▉   | 9/13 [00:03<00:01,  3.55it/s][A
 85%|████████▍ | 11/13 [00:03<00:00,  4.65it/s][A
100%|██████████| 13/13 [00:03<00:00,  3.43it/s][A
Epochs:  18%|█▊        | 12/68 [05:42<27:04, 29.00s/it]

Val Loss: 0.1897 - Val Accuracy: 0.9232



Training:   0%|          | 0/103 [00:00<?, ?it/s][A
Training:   1%|          | 1/103 [00:01<02:18,  1.36s/it][A
Training:   4%|▍         | 4/103 [00:01<00:28,  3.45it/s][A
Training:   6%|▌         | 6/103 [00:02<00:33,  2.89it/s][A
Training:   9%|▊         | 9/103 [00:03<00:35,  2.68it/s][A
Training:  11%|█         | 11/103 [00:03<00:25,  3.62it/s][A
Training:  13%|█▎        | 13/103 [00:04<00:29,  3.02it/s][A
Training:  15%|█▍        | 15/103 [00:04<00:21,  4.01it/s][A
Training:  17%|█▋        | 17/103 [00:05<00:24,  3.56it/s][A
Training:  19%|█▉        | 20/103 [00:05<00:15,  5.29it/s][A
Training:  21%|██▏       | 22/103 [00:06<00:22,  3.57it/s][A
Training:  24%|██▍       | 25/103 [00:07<00:21,  3.67it/s][A
Training:  26%|██▌       | 27/103 [00:07<00:17,  4.41it/s][A
Training:  27%|██▋       | 28/103 [00:07<00:16,  4.62it/s][A
Training:  28%|██▊       | 29/103 [00:08<00:23,  3.16it/s][A
Training:  30%|███       | 31/103 [00:08<00:16,  4.36it/s][A
Training:  31%|███  

Epoch: 13/68 - Loss: 0.1532 - Accuracy: 0.9377



  0%|          | 0/13 [00:00<?, ?it/s][A
  8%|▊         | 1/13 [00:01<00:12,  1.08s/it][A
 23%|██▎       | 3/13 [00:01<00:03,  3.07it/s][A
 38%|███▊      | 5/13 [00:01<00:02,  2.96it/s][A
 46%|████▌     | 6/13 [00:02<00:02,  3.40it/s][A
 62%|██████▏   | 8/13 [00:02<00:00,  5.27it/s][A
 77%|███████▋  | 10/13 [00:03<00:00,  3.52it/s][A
 85%|████████▍ | 11/13 [00:03<00:00,  4.04it/s][A
100%|██████████| 13/13 [00:03<00:00,  3.49it/s][A
Epochs:  19%|█▉        | 13/68 [06:12<26:50, 29.29s/it]

Val Loss: 0.1455 - Val Accuracy: 0.9434



Training:   0%|          | 0/103 [00:00<?, ?it/s][A
Training:   1%|          | 1/103 [00:01<02:04,  1.22s/it][A
Training:   4%|▍         | 4/103 [00:01<00:29,  3.32it/s][A
Training:   5%|▍         | 5/103 [00:02<00:37,  2.59it/s][A
Training:   8%|▊         | 8/103 [00:02<00:21,  4.40it/s][A
Training:   9%|▊         | 9/103 [00:03<00:30,  3.07it/s][A
Training:  12%|█▏        | 12/103 [00:03<00:18,  4.87it/s][A
Training:  13%|█▎        | 13/103 [00:03<00:26,  3.37it/s][A
Training:  15%|█▍        | 15/103 [00:04<00:18,  4.71it/s][A
Training:  17%|█▋        | 17/103 [00:04<00:23,  3.61it/s][A
Training:  18%|█▊        | 19/103 [00:05<00:17,  4.77it/s][A
Training:  20%|██        | 21/103 [00:05<00:23,  3.46it/s][A
Training:  23%|██▎       | 24/103 [00:06<00:18,  4.32it/s][A
Training:  24%|██▍       | 25/103 [00:06<00:22,  3.51it/s][A
Training:  27%|██▋       | 28/103 [00:07<00:16,  4.42it/s][A
Training:  28%|██▊       | 29/103 [00:07<00:20,  3.56it/s][A
Training:  31%|███   

Epoch: 14/68 - Loss: 0.1482 - Accuracy: 0.9395



  0%|          | 0/13 [00:00<?, ?it/s][A
  8%|▊         | 1/13 [00:01<00:18,  1.57s/it][A
 38%|███▊      | 5/13 [00:02<00:03,  2.60it/s][A
 62%|██████▏   | 8/13 [00:02<00:01,  4.57it/s][A
 77%|███████▋  | 10/13 [00:03<00:00,  3.53it/s][A
100%|██████████| 13/13 [00:04<00:00,  3.16it/s][A
Epochs:  21%|██        | 14/68 [06:42<26:27, 29.39s/it]

Val Loss: 0.1512 - Val Accuracy: 0.9340



Training:   0%|          | 0/103 [00:00<?, ?it/s][A
Training:   1%|          | 1/103 [00:01<02:23,  1.41s/it][A
Training:   3%|▎         | 3/103 [00:01<00:41,  2.39it/s][A
Training:   5%|▍         | 5/103 [00:02<00:41,  2.38it/s][A
Training:   7%|▋         | 7/103 [00:02<00:26,  3.59it/s][A
Training:   9%|▊         | 9/103 [00:03<00:30,  3.07it/s][A
Training:  11%|█         | 11/103 [00:03<00:21,  4.25it/s][A
Training:  12%|█▏        | 12/103 [00:03<00:19,  4.76it/s][A
Training:  13%|█▎        | 13/103 [00:04<00:30,  3.00it/s][A
Training:  15%|█▍        | 15/103 [00:04<00:20,  4.36it/s][A
Training:  17%|█▋        | 17/103 [00:05<00:28,  3.02it/s][A
Training:  18%|█▊        | 19/103 [00:05<00:20,  4.10it/s][A
Training:  20%|██        | 21/103 [00:06<00:25,  3.26it/s][A
Training:  22%|██▏       | 23/103 [00:06<00:18,  4.37it/s][A
Training:  24%|██▍       | 25/103 [00:07<00:22,  3.50it/s][A
Training:  26%|██▌       | 27/103 [00:07<00:16,  4.69it/s][A
Training:  28%|██▊   

Epoch: 15/68 - Loss: 0.1513 - Accuracy: 0.9397



  0%|          | 0/13 [00:00<?, ?it/s][A
  8%|▊         | 1/13 [00:01<00:16,  1.40s/it][A
 38%|███▊      | 5/13 [00:02<00:03,  2.46it/s][A
 54%|█████▍    | 7/13 [00:02<00:01,  3.61it/s][A
 69%|██████▉   | 9/13 [00:03<00:01,  3.34it/s][A
100%|██████████| 13/13 [00:03<00:00,  3.48it/s][A
Epochs:  22%|██▏       | 15/68 [07:11<26:02, 29.48s/it]

Val Loss: 0.1589 - Val Accuracy: 0.9382



Training:   0%|          | 0/103 [00:00<?, ?it/s][A
Training:   1%|          | 1/103 [00:01<01:56,  1.14s/it][A
Training:   3%|▎         | 3/103 [00:01<00:33,  2.99it/s][A
Training:   5%|▍         | 5/103 [00:02<00:38,  2.54it/s][A
Training:   7%|▋         | 7/103 [00:02<00:24,  3.93it/s][A
Training:   9%|▊         | 9/103 [00:03<00:31,  2.98it/s][A
Training:  11%|█         | 11/103 [00:03<00:22,  4.15it/s][A
Training:  13%|█▎        | 13/103 [00:04<00:26,  3.37it/s][A
Training:  15%|█▍        | 15/103 [00:04<00:19,  4.53it/s][A
Training:  17%|█▋        | 17/103 [00:04<00:20,  4.10it/s][A
Training:  19%|█▉        | 20/103 [00:04<00:13,  6.23it/s][A
Training:  21%|██▏       | 22/103 [00:05<00:19,  4.22it/s][A
Training:  24%|██▍       | 25/103 [00:06<00:20,  3.79it/s][A
Training:  26%|██▌       | 27/103 [00:07<00:17,  4.43it/s][A
Training:  28%|██▊       | 29/103 [00:07<00:19,  3.76it/s][A
Training:  30%|███       | 31/103 [00:08<00:16,  4.45it/s][A
Training:  32%|███▏  

Epoch: 16/68 - Loss: 0.1482 - Accuracy: 0.9383



  0%|          | 0/13 [00:00<?, ?it/s][A
  8%|▊         | 1/13 [00:01<00:14,  1.21s/it][A
 23%|██▎       | 3/13 [00:01<00:03,  2.72it/s][A
 38%|███▊      | 5/13 [00:02<00:03,  2.63it/s][A
 54%|█████▍    | 7/13 [00:02<00:01,  4.06it/s][A
 62%|██████▏   | 8/13 [00:02<00:01,  4.57it/s][A
 69%|██████▉   | 9/13 [00:03<00:01,  3.08it/s][A
 92%|█████████▏| 12/13 [00:03<00:00,  4.56it/s][A
100%|██████████| 13/13 [00:03<00:00,  3.47it/s][A
Epochs:  24%|██▎       | 16/68 [07:41<25:30, 29.44s/it]

Val Loss: 0.1435 - Val Accuracy: 0.9423



Training:   0%|          | 0/103 [00:00<?, ?it/s][A
Training:   1%|          | 1/103 [00:01<02:17,  1.35s/it][A
Training:   3%|▎         | 3/103 [00:01<00:38,  2.57it/s][A
Training:   5%|▍         | 5/103 [00:02<00:36,  2.66it/s][A
Training:   7%|▋         | 7/103 [00:02<00:23,  4.13it/s][A
Training:   9%|▊         | 9/103 [00:03<00:29,  3.21it/s][A
Training:  11%|█         | 11/103 [00:03<00:21,  4.38it/s][A
Training:  13%|█▎        | 13/103 [00:04<00:26,  3.42it/s][A
Training:  15%|█▍        | 15/103 [00:04<00:19,  4.56it/s][A
Training:  17%|█▋        | 17/103 [00:05<00:23,  3.66it/s][A
Training:  18%|█▊        | 19/103 [00:05<00:17,  4.80it/s][A
Training:  20%|██        | 21/103 [00:05<00:21,  3.85it/s][A
Training:  22%|██▏       | 23/103 [00:06<00:15,  5.04it/s][A
Training:  24%|██▍       | 25/103 [00:06<00:19,  4.02it/s][A
Training:  26%|██▌       | 27/103 [00:07<00:16,  4.68it/s][A
Training:  28%|██▊       | 29/103 [00:07<00:19,  3.82it/s][A
Training:  30%|███   

Epoch: 17/68 - Loss: 0.1601 - Accuracy: 0.9349



  0%|          | 0/13 [00:00<?, ?it/s][A
  8%|▊         | 1/13 [00:01<00:13,  1.14s/it][A
 38%|███▊      | 5/13 [00:02<00:03,  2.66it/s][A
 69%|██████▉   | 9/13 [00:03<00:01,  3.39it/s][A
100%|██████████| 13/13 [00:03<00:00,  3.46it/s][A
Epochs:  25%|██▌       | 17/68 [08:10<24:52, 29.26s/it]

Val Loss: 0.1866 - Val Accuracy: 0.9240



Training:   0%|          | 0/103 [00:00<?, ?it/s][A
Training:   1%|          | 1/103 [00:00<01:39,  1.02it/s][A
Training:   3%|▎         | 3/103 [00:01<00:33,  2.95it/s][A
Training:   5%|▍         | 5/103 [00:01<00:31,  3.11it/s][A
Training:   7%|▋         | 7/103 [00:02<00:22,  4.26it/s][A
Training:   9%|▊         | 9/103 [00:02<00:24,  3.83it/s][A
Training:  11%|█         | 11/103 [00:02<00:18,  4.97it/s][A
Training:  13%|█▎        | 13/103 [00:03<00:20,  4.44it/s][A
Training:  15%|█▍        | 15/103 [00:03<00:16,  5.32it/s][A
Training:  17%|█▋        | 17/103 [00:04<00:20,  4.20it/s][A
Training:  18%|█▊        | 19/103 [00:04<00:16,  5.16it/s][A
Training:  20%|██        | 21/103 [00:05<00:20,  4.01it/s][A
Training:  22%|██▏       | 23/103 [00:05<00:15,  5.09it/s][A
Training:  24%|██▍       | 25/103 [00:06<00:20,  3.76it/s][A
Training:  27%|██▋       | 28/103 [00:06<00:13,  5.61it/s][A
Training:  29%|██▉       | 30/103 [00:06<00:15,  4.74it/s][A
Training:  30%|███   

Epoch: 18/68 - Loss: 0.1466 - Accuracy: 0.9415



  0%|          | 0/13 [00:00<?, ?it/s][A
  8%|▊         | 1/13 [00:01<00:12,  1.03s/it][A
 15%|█▌        | 2/13 [00:01<00:06,  1.76it/s][A
 38%|███▊      | 5/13 [00:01<00:02,  3.74it/s][A
 46%|████▌     | 6/13 [00:01<00:01,  3.74it/s][A
 69%|██████▉   | 9/13 [00:02<00:00,  4.14it/s][A
 77%|███████▋  | 10/13 [00:02<00:00,  4.49it/s][A
100%|██████████| 13/13 [00:03<00:00,  3.76it/s][A
Epochs:  26%|██▋       | 18/68 [08:37<23:59, 28.79s/it]

Val Loss: 0.1410 - Val Accuracy: 0.9440



Training:   0%|          | 0/103 [00:00<?, ?it/s][A
Training:   1%|          | 1/103 [00:01<02:00,  1.18s/it][A
Training:   2%|▏         | 2/103 [00:01<00:59,  1.70it/s][A
Training:   5%|▍         | 5/103 [00:02<00:35,  2.76it/s][A
Training:   6%|▌         | 6/103 [00:02<00:28,  3.37it/s][A
Training:   8%|▊         | 8/103 [00:02<00:18,  5.07it/s][A
Training:   9%|▊         | 9/103 [00:03<00:29,  3.23it/s][A
Training:  12%|█▏        | 12/103 [00:03<00:16,  5.43it/s][A
Training:  14%|█▎        | 14/103 [00:04<00:23,  3.83it/s][A
Training:  17%|█▋        | 17/103 [00:04<00:23,  3.66it/s][A
Training:  18%|█▊        | 19/103 [00:05<00:17,  4.69it/s][A
Training:  20%|██        | 21/103 [00:05<00:21,  3.85it/s][A
Training:  22%|██▏       | 23/103 [00:05<00:16,  5.00it/s][A
Training:  24%|██▍       | 25/103 [00:06<00:19,  4.01it/s][A
Training:  28%|██▊       | 29/103 [00:07<00:16,  4.46it/s][A
Training:  30%|███       | 31/103 [00:07<00:13,  5.50it/s][A
Training:  32%|███▏   

Epoch: 19/68 - Loss: 0.1427 - Accuracy: 0.9433



  0%|          | 0/13 [00:00<?, ?it/s][A
  8%|▊         | 1/13 [00:01<00:13,  1.13s/it][A
 15%|█▌        | 2/13 [00:01<00:06,  1.77it/s][A
 38%|███▊      | 5/13 [00:01<00:02,  3.23it/s][A
 46%|████▌     | 6/13 [00:02<00:02,  3.35it/s][A
 62%|██████▏   | 8/13 [00:02<00:00,  5.14it/s][A
 69%|██████▉   | 9/13 [00:02<00:00,  4.09it/s][A
 77%|███████▋  | 10/13 [00:03<00:00,  3.58it/s][A
100%|██████████| 13/13 [00:03<00:00,  3.72it/s][A
Epochs:  28%|██▊       | 19/68 [09:05<23:10, 28.38s/it]

Val Loss: 0.1671 - Val Accuracy: 0.9348



Training:   0%|          | 0/103 [00:00<?, ?it/s][A
Training:   1%|          | 1/103 [00:01<01:49,  1.07s/it][A
Training:   3%|▎         | 3/103 [00:01<00:34,  2.92it/s][A
Training:   5%|▍         | 5/103 [00:01<00:30,  3.21it/s][A
Training:   7%|▋         | 7/103 [00:02<00:26,  3.65it/s][A
Training:   9%|▊         | 9/103 [00:02<00:25,  3.64it/s][A
Training:  10%|▉         | 10/103 [00:02<00:22,  4.08it/s][A
Training:  12%|█▏        | 12/103 [00:03<00:16,  5.61it/s][A
Training:  13%|█▎        | 13/103 [00:03<00:25,  3.58it/s][A
Training:  15%|█▍        | 15/103 [00:03<00:17,  5.16it/s][A
Training:  17%|█▋        | 17/103 [00:04<00:19,  4.37it/s][A
Training:  18%|█▊        | 19/103 [00:04<00:14,  5.68it/s][A
Training:  20%|██        | 21/103 [00:05<00:18,  4.41it/s][A
Training:  21%|██▏       | 22/103 [00:05<00:17,  4.73it/s][A
Training:  23%|██▎       | 24/103 [00:05<00:12,  6.32it/s][A
Training:  25%|██▌       | 26/103 [00:06<00:18,  4.24it/s][A
Training:  26%|██▌   

Epoch: 20/68 - Loss: 0.1523 - Accuracy: 0.9385



  0%|          | 0/13 [00:00<?, ?it/s][A
  8%|▊         | 1/13 [00:01<00:14,  1.20s/it][A
 15%|█▌        | 2/13 [00:01<00:06,  1.64it/s][A
 38%|███▊      | 5/13 [00:02<00:02,  2.89it/s][A
 62%|██████▏   | 8/13 [00:02<00:00,  5.19it/s][A
 77%|███████▋  | 10/13 [00:03<00:00,  3.64it/s][A
100%|██████████| 13/13 [00:03<00:00,  3.50it/s][A
Epochs:  29%|██▉       | 20/68 [09:32<22:29, 28.11s/it]

Val Loss: 0.1470 - Val Accuracy: 0.9360



Training:   0%|          | 0/103 [00:00<?, ?it/s][A
Training:   1%|          | 1/103 [00:01<02:27,  1.45s/it][A
Training:   3%|▎         | 3/103 [00:01<00:41,  2.39it/s][A
Training:   5%|▍         | 5/103 [00:02<00:37,  2.58it/s][A
Training:   8%|▊         | 8/103 [00:02<00:19,  4.86it/s][A
Training:  10%|▉         | 10/103 [00:03<00:24,  3.83it/s][A
Training:  13%|█▎        | 13/103 [00:03<00:22,  3.95it/s][A
Training:  16%|█▌        | 16/103 [00:04<00:16,  5.18it/s][A
Training:  17%|█▋        | 17/103 [00:04<00:22,  3.81it/s][A
Training:  19%|█▉        | 20/103 [00:05<00:16,  4.93it/s][A
Training:  20%|██        | 21/103 [00:05<00:19,  4.10it/s][A
Training:  22%|██▏       | 23/103 [00:05<00:14,  5.43it/s][A
Training:  23%|██▎       | 24/103 [00:05<00:15,  5.02it/s][A
Training:  24%|██▍       | 25/103 [00:06<00:18,  4.16it/s][A
Training:  26%|██▌       | 27/103 [00:06<00:13,  5.84it/s][A
Training:  28%|██▊       | 29/103 [00:07<00:18,  3.98it/s][A
Training:  30%|███  

Epoch: 21/68 - Loss: 0.1441 - Accuracy: 0.9428



  0%|          | 0/13 [00:00<?, ?it/s][A
  8%|▊         | 1/13 [00:01<00:14,  1.18s/it][A
 15%|█▌        | 2/13 [00:01<00:06,  1.82it/s][A
 31%|███       | 4/13 [00:01<00:02,  4.19it/s][A
 46%|████▌     | 6/13 [00:02<00:02,  3.38it/s][A
 69%|██████▉   | 9/13 [00:02<00:01,  3.43it/s][A
 77%|███████▋  | 10/13 [00:03<00:00,  3.86it/s][A
100%|██████████| 13/13 [00:03<00:00,  3.55it/s][A
Epochs:  31%|███       | 21/68 [10:00<21:51, 27.90s/it]

Val Loss: 0.2078 - Val Accuracy: 0.9170



Training:   0%|          | 0/103 [00:00<?, ?it/s][A
Training:   1%|          | 1/103 [00:01<02:10,  1.27s/it][A
Training:   2%|▏         | 2/103 [00:01<00:59,  1.69it/s][A
Training:   4%|▍         | 4/103 [00:01<00:26,  3.73it/s][A
Training:   5%|▍         | 5/103 [00:02<00:33,  2.94it/s][A
Training:   6%|▌         | 6/103 [00:02<00:28,  3.38it/s][A
Training:   8%|▊         | 8/103 [00:02<00:19,  4.82it/s][A
Training:   9%|▊         | 9/103 [00:02<00:25,  3.70it/s][A
Training:  10%|▉         | 10/103 [00:03<00:24,  3.84it/s][A
Training:  12%|█▏        | 12/103 [00:03<00:16,  5.44it/s][A
Training:  13%|█▎        | 13/103 [00:03<00:25,  3.47it/s][A
Training:  14%|█▎        | 14/103 [00:04<00:24,  3.58it/s][A
Training:  16%|█▌        | 16/103 [00:04<00:16,  5.22it/s][A
Training:  17%|█▋        | 17/103 [00:04<00:25,  3.37it/s][A
Training:  17%|█▋        | 18/103 [00:05<00:24,  3.44it/s][A
Training:  19%|█▉        | 20/103 [00:05<00:16,  5.10it/s][A
Training:  20%|██      

Epoch: 22/68 - Loss: 0.1506 - Accuracy: 0.9384



  0%|          | 0/13 [00:00<?, ?it/s][A
  8%|▊         | 1/13 [00:01<00:15,  1.25s/it][A
 15%|█▌        | 2/13 [00:01<00:06,  1.64it/s][A
 38%|███▊      | 5/13 [00:02<00:02,  2.76it/s][A
 54%|█████▍    | 7/13 [00:02<00:01,  4.22it/s][A
 69%|██████▉   | 9/13 [00:03<00:01,  3.57it/s][A
 77%|███████▋  | 10/13 [00:03<00:00,  3.81it/s][A
100%|██████████| 13/13 [00:03<00:00,  3.39it/s][A
Epochs:  32%|███▏      | 22/68 [10:27<21:23, 27.91s/it]

Val Loss: 0.1609 - Val Accuracy: 0.9295



Training:   0%|          | 0/103 [00:00<?, ?it/s][A
Training:   1%|          | 1/103 [00:01<01:59,  1.18s/it][A
Training:   2%|▏         | 2/103 [00:01<00:55,  1.82it/s][A
Training:   5%|▍         | 5/103 [00:02<00:34,  2.81it/s][A
Training:   7%|▋         | 7/103 [00:02<00:23,  4.14it/s][A
Training:   9%|▊         | 9/103 [00:03<00:29,  3.18it/s][A
Training:  11%|█         | 11/103 [00:03<00:20,  4.40it/s][A
Training:  13%|█▎        | 13/103 [00:04<00:26,  3.36it/s][A
Training:  16%|█▌        | 16/103 [00:04<00:16,  5.29it/s][A
Training:  17%|█▋        | 18/103 [00:05<00:21,  3.99it/s][A
Training:  19%|█▉        | 20/103 [00:05<00:16,  5.12it/s][A
Training:  21%|██▏       | 22/103 [00:05<00:18,  4.30it/s][A
Training:  23%|██▎       | 24/103 [00:05<00:14,  5.58it/s][A
Training:  25%|██▌       | 26/103 [00:06<00:19,  3.93it/s][A
Training:  27%|██▋       | 28/103 [00:06<00:14,  5.09it/s][A
Training:  29%|██▉       | 30/103 [00:07<00:18,  4.02it/s][A
Training:  32%|███▏  

Epoch: 23/68 - Loss: 0.1448 - Accuracy: 0.9419



  0%|          | 0/13 [00:00<?, ?it/s][A
  8%|▊         | 1/13 [00:01<00:14,  1.19s/it][A
 23%|██▎       | 3/13 [00:01<00:03,  2.79it/s][A
 38%|███▊      | 5/13 [00:02<00:03,  2.52it/s][A
 46%|████▌     | 6/13 [00:02<00:02,  2.74it/s][A
 69%|██████▉   | 9/13 [00:03<00:01,  3.34it/s][A
 77%|███████▋  | 10/13 [00:03<00:00,  3.49it/s][A
100%|██████████| 13/13 [00:04<00:00,  3.15it/s][A
Epochs:  34%|███▍      | 23/68 [10:55<20:45, 27.67s/it]

Val Loss: 0.1616 - Val Accuracy: 0.9369



Training:   0%|          | 0/103 [00:00<?, ?it/s][A
Training:   1%|          | 1/103 [00:01<02:35,  1.52s/it][A
Training:   4%|▍         | 4/103 [00:01<00:32,  3.03it/s][A
Training:   6%|▌         | 6/103 [00:02<00:38,  2.50it/s][A
Training:   9%|▊         | 9/103 [00:03<00:32,  2.88it/s][A
Training:  10%|▉         | 10/103 [00:03<00:28,  3.22it/s][A
Training:  13%|█▎        | 13/103 [00:04<00:26,  3.34it/s][A
Training:  15%|█▍        | 15/103 [00:04<00:20,  4.26it/s][A
Training:  17%|█▋        | 17/103 [00:05<00:24,  3.44it/s][A
Training:  18%|█▊        | 19/103 [00:05<00:18,  4.44it/s][A
Training:  20%|██        | 21/103 [00:06<00:22,  3.61it/s][A
Training:  22%|██▏       | 23/103 [00:06<00:18,  4.40it/s][A
Training:  24%|██▍       | 25/103 [00:07<00:20,  3.88it/s][A
Training:  26%|██▌       | 27/103 [00:07<00:16,  4.59it/s][A
Training:  28%|██▊       | 29/103 [00:08<00:19,  3.78it/s][A
Training:  30%|███       | 31/103 [00:08<00:15,  4.62it/s][A
Training:  32%|███▏ 

Epoch: 24/68 - Loss: 0.1497 - Accuracy: 0.9398



  0%|          | 0/13 [00:00<?, ?it/s][A
  8%|▊         | 1/13 [00:01<00:14,  1.24s/it][A
 15%|█▌        | 2/13 [00:01<00:07,  1.50it/s][A
 31%|███       | 4/13 [00:01<00:02,  3.54it/s][A
 38%|███▊      | 5/13 [00:02<00:02,  3.00it/s][A
 46%|████▌     | 6/13 [00:02<00:02,  3.40it/s][A
 62%|██████▏   | 8/13 [00:02<00:01,  4.99it/s][A
 69%|██████▉   | 9/13 [00:02<00:01,  3.55it/s][A
 85%|████████▍ | 11/13 [00:03<00:00,  4.85it/s][A
 92%|█████████▏| 12/13 [00:03<00:00,  5.28it/s][A
100%|██████████| 13/13 [00:03<00:00,  3.52it/s][A
Epochs:  35%|███▌      | 24/68 [11:25<20:55, 28.54s/it]

Val Loss: 0.1604 - Val Accuracy: 0.9370



Training:   0%|          | 0/103 [00:00<?, ?it/s][A
Training:   1%|          | 1/103 [00:01<02:29,  1.46s/it][A
Training:   2%|▏         | 2/103 [00:01<01:10,  1.44it/s][A
Training:   5%|▍         | 5/103 [00:02<00:35,  2.75it/s][A
Training:   6%|▌         | 6/103 [00:02<00:29,  3.24it/s][A
Training:   8%|▊         | 8/103 [00:02<00:19,  4.80it/s][A
Training:   9%|▊         | 9/103 [00:03<00:33,  2.80it/s][A
Training:  11%|█         | 11/103 [00:03<00:22,  4.17it/s][A
Training:  13%|█▎        | 13/103 [00:04<00:27,  3.21it/s][A
Training:  15%|█▍        | 15/103 [00:04<00:20,  4.31it/s][A
Training:  17%|█▋        | 17/103 [00:05<00:24,  3.45it/s][A
Training:  18%|█▊        | 19/103 [00:05<00:18,  4.56it/s][A
Training:  20%|██        | 21/103 [00:06<00:23,  3.43it/s][A
Training:  22%|██▏       | 23/103 [00:06<00:17,  4.60it/s][A
Training:  24%|██▍       | 25/103 [00:07<00:22,  3.45it/s][A
Training:  26%|██▌       | 27/103 [00:07<00:16,  4.50it/s][A
Training:  28%|██▊    

Epoch: 25/68 - Loss: 0.1471 - Accuracy: 0.9410



  0%|          | 0/13 [00:00<?, ?it/s][A
  8%|▊         | 1/13 [00:01<00:13,  1.16s/it][A
 23%|██▎       | 3/13 [00:01<00:03,  2.72it/s][A
 31%|███       | 4/13 [00:01<00:02,  3.59it/s][A
 38%|███▊      | 5/13 [00:02<00:03,  2.45it/s][A
 46%|████▌     | 6/13 [00:02<00:02,  2.86it/s][A
 62%|██████▏   | 8/13 [00:02<00:01,  4.41it/s][A
 69%|██████▉   | 9/13 [00:02<00:01,  3.55it/s][A
 77%|███████▋  | 10/13 [00:03<00:00,  3.25it/s][A
100%|██████████| 13/13 [00:03<00:00,  3.58it/s][A
Epochs:  37%|███▋      | 25/68 [11:54<20:27, 28.54s/it]

Val Loss: 0.1541 - Val Accuracy: 0.9315



Training:   0%|          | 0/103 [00:00<?, ?it/s][A
Training:   1%|          | 1/103 [00:01<02:21,  1.39s/it][A
Training:   4%|▍         | 4/103 [00:01<00:28,  3.44it/s][A
Training:   6%|▌         | 6/103 [00:02<00:37,  2.58it/s][A
Training:   8%|▊         | 8/103 [00:02<00:24,  3.81it/s][A
Training:  10%|▉         | 10/103 [00:03<00:29,  3.19it/s][A
Training:  12%|█▏        | 12/103 [00:03<00:21,  4.33it/s][A
Training:  14%|█▎        | 14/103 [00:04<00:24,  3.62it/s][A
Training:  17%|█▋        | 17/103 [00:05<00:22,  3.86it/s][A
Training:  17%|█▋        | 18/103 [00:05<00:22,  3.79it/s][A
Training:  19%|█▉        | 20/103 [00:05<00:16,  5.04it/s][A
Training:  20%|██        | 21/103 [00:05<00:21,  3.79it/s][A
Training:  21%|██▏       | 22/103 [00:06<00:24,  3.31it/s][A
Training:  24%|██▍       | 25/103 [00:06<00:18,  4.23it/s][A
Training:  25%|██▌       | 26/103 [00:07<00:19,  3.85it/s][A
Training:  28%|██▊       | 29/103 [00:08<00:19,  3.73it/s][A
Training:  29%|██▉  

Epoch: 26/68 - Loss: 0.1468 - Accuracy: 0.9427



  0%|          | 0/13 [00:00<?, ?it/s][A
  8%|▊         | 1/13 [00:01<00:16,  1.34s/it][A
 38%|███▊      | 5/13 [00:02<00:03,  2.47it/s][A
 54%|█████▍    | 7/13 [00:02<00:01,  3.66it/s][A
 69%|██████▉   | 9/13 [00:03<00:01,  2.90it/s][A
100%|██████████| 13/13 [00:04<00:00,  3.25it/s][A
Epochs:  38%|███▊      | 26/68 [12:23<20:02, 28.64s/it]

Val Loss: 0.1500 - Val Accuracy: 0.9389



Training:   0%|          | 0/103 [00:00<?, ?it/s][A
Training:   1%|          | 1/103 [00:01<02:34,  1.51s/it][A
Training:   2%|▏         | 2/103 [00:01<01:09,  1.44it/s][A
Training:   5%|▍         | 5/103 [00:02<00:38,  2.53it/s][A
Training:   7%|▋         | 7/103 [00:02<00:25,  3.75it/s][A
Training:   9%|▊         | 9/103 [00:03<00:27,  3.44it/s][A
Training:  10%|▉         | 10/103 [00:03<00:26,  3.51it/s][A
Training:  12%|█▏        | 12/103 [00:03<00:19,  4.77it/s][A
Training:  13%|█▎        | 13/103 [00:04<00:24,  3.71it/s][A
Training:  14%|█▎        | 14/103 [00:04<00:24,  3.64it/s][A
Training:  15%|█▍        | 15/103 [00:04<00:20,  4.31it/s][A
Training:  17%|█▋        | 17/103 [00:05<00:21,  3.93it/s][A
Training:  17%|█▋        | 18/103 [00:05<00:22,  3.78it/s][A
Training:  19%|█▉        | 20/103 [00:05<00:15,  5.35it/s][A
Training:  20%|██        | 21/103 [00:06<00:21,  3.88it/s][A
Training:  21%|██▏       | 22/103 [00:06<00:21,  3.78it/s][A
Training:  24%|██▍   

Epoch: 27/68 - Loss: 0.1438 - Accuracy: 0.9419



  0%|          | 0/13 [00:00<?, ?it/s][A
  8%|▊         | 1/13 [00:00<00:11,  1.01it/s][A
 15%|█▌        | 2/13 [00:01<00:06,  1.70it/s][A
 38%|███▊      | 5/13 [00:01<00:02,  3.29it/s][A
 46%|████▌     | 6/13 [00:02<00:02,  3.05it/s][A
 69%|██████▉   | 9/13 [00:02<00:00,  4.08it/s][A
 77%|███████▋  | 10/13 [00:03<00:00,  3.84it/s][A
100%|██████████| 13/13 [00:03<00:00,  3.71it/s][A
Epochs:  40%|███▉      | 27/68 [12:51<19:34, 28.65s/it]

Val Loss: 0.1970 - Val Accuracy: 0.9262



Training:   0%|          | 0/103 [00:00<?, ?it/s][A
Training:   1%|          | 1/103 [00:01<02:27,  1.45s/it][A
Training:   3%|▎         | 3/103 [00:01<00:42,  2.33it/s][A
Training:   5%|▍         | 5/103 [00:02<00:41,  2.34it/s][A
Training:   8%|▊         | 8/103 [00:02<00:21,  4.49it/s][A
Training:  10%|▉         | 10/103 [00:03<00:24,  3.75it/s][A
Training:  13%|█▎        | 13/103 [00:04<00:24,  3.67it/s][A
Training:  16%|█▌        | 16/103 [00:04<00:16,  5.31it/s][A
Training:  17%|█▋        | 18/103 [00:04<00:19,  4.36it/s][A
Training:  18%|█▊        | 19/103 [00:05<00:19,  4.30it/s][A
Training:  20%|██        | 21/103 [00:05<00:22,  3.60it/s][A
Training:  22%|██▏       | 23/103 [00:06<00:17,  4.62it/s][A
Training:  23%|██▎       | 24/103 [00:06<00:15,  5.11it/s][A
Training:  24%|██▍       | 25/103 [00:06<00:23,  3.30it/s][A
Training:  26%|██▌       | 27/103 [00:07<00:16,  4.57it/s][A
Training:  28%|██▊       | 29/103 [00:07<00:19,  3.81it/s][A
Training:  30%|███  

Epoch: 28/68 - Loss: 0.1423 - Accuracy: 0.9436



  0%|          | 0/13 [00:00<?, ?it/s][A
  8%|▊         | 1/13 [00:01<00:15,  1.29s/it][A
 31%|███       | 4/13 [00:01<00:02,  3.66it/s][A
 46%|████▌     | 6/13 [00:02<00:02,  2.70it/s][A
 69%|██████▉   | 9/13 [00:03<00:01,  3.08it/s][A
 77%|███████▋  | 10/13 [00:03<00:00,  3.30it/s][A
100%|██████████| 13/13 [00:04<00:00,  3.23it/s][A
Epochs:  41%|████      | 28/68 [13:20<19:08, 28.72s/it]

Val Loss: 0.1587 - Val Accuracy: 0.9326



Training:   0%|          | 0/103 [00:00<?, ?it/s][A
Training:   1%|          | 1/103 [00:01<02:15,  1.33s/it][A
Training:   3%|▎         | 3/103 [00:01<00:40,  2.48it/s][A
Training:   5%|▍         | 5/103 [00:02<00:43,  2.24it/s][A
Training:   7%|▋         | 7/103 [00:02<00:27,  3.49it/s][A
Training:   9%|▊         | 9/103 [00:03<00:33,  2.83it/s][A
Training:  11%|█         | 11/103 [00:03<00:23,  3.96it/s][A
Training:  13%|█▎        | 13/103 [00:04<00:26,  3.36it/s][A
Training:  16%|█▌        | 16/103 [00:04<00:16,  5.32it/s][A
Training:  17%|█▋        | 18/103 [00:05<00:22,  3.79it/s][A
Training:  19%|█▉        | 20/103 [00:05<00:16,  4.93it/s][A
Training:  21%|██▏       | 22/103 [00:06<00:21,  3.71it/s][A
Training:  24%|██▍       | 25/103 [00:07<00:21,  3.57it/s][A
Training:  26%|██▌       | 27/103 [00:07<00:16,  4.58it/s][A
Training:  28%|██▊       | 29/103 [00:08<00:20,  3.61it/s][A
Training:  31%|███       | 32/103 [00:08<00:13,  5.27it/s][A
Training:  33%|███▎  

Epoch: 29/68 - Loss: 0.1550 - Accuracy: 0.9369



  0%|          | 0/13 [00:00<?, ?it/s][A
  8%|▊         | 1/13 [00:01<00:13,  1.11s/it][A
 31%|███       | 4/13 [00:01<00:02,  4.09it/s][A
 46%|████▌     | 6/13 [00:02<00:02,  2.90it/s][A
 69%|██████▉   | 9/13 [00:02<00:01,  3.48it/s][A
 77%|███████▋  | 10/13 [00:03<00:00,  3.61it/s][A
100%|██████████| 13/13 [00:03<00:00,  3.59it/s][A
Epochs:  43%|████▎     | 29/68 [13:49<18:39, 28.70s/it]

Val Loss: 0.1415 - Val Accuracy: 0.9405



Training:   0%|          | 0/103 [00:00<?, ?it/s][A
Training:   1%|          | 1/103 [00:00<01:39,  1.02it/s][A
Training:   3%|▎         | 3/103 [00:01<00:29,  3.34it/s][A
Training:   5%|▍         | 5/103 [00:01<00:34,  2.82it/s][A
Training:   7%|▋         | 7/103 [00:02<00:22,  4.34it/s][A
Training:   9%|▊         | 9/103 [00:03<00:31,  3.02it/s][A
Training:  13%|█▎        | 13/103 [00:03<00:24,  3.70it/s][A
Training:  16%|█▌        | 16/103 [00:04<00:16,  5.28it/s][A
Training:  17%|█▋        | 18/103 [00:04<00:21,  3.87it/s][A
Training:  19%|█▉        | 20/103 [00:05<00:16,  4.92it/s][A
Training:  21%|██▏       | 22/103 [00:05<00:21,  3.83it/s][A
Training:  23%|██▎       | 24/103 [00:06<00:16,  4.87it/s][A
Training:  25%|██▌       | 26/103 [00:06<00:19,  3.95it/s][A
Training:  27%|██▋       | 28/103 [00:06<00:15,  4.99it/s][A
Training:  29%|██▉       | 30/103 [00:07<00:17,  4.10it/s][A
Training:  32%|███▏      | 33/103 [00:08<00:17,  4.10it/s][A
Training:  35%|███▍  

Epoch: 30/68 - Loss: 0.1433 - Accuracy: 0.9421



  0%|          | 0/13 [00:00<?, ?it/s][A
  8%|▊         | 1/13 [00:01<00:12,  1.07s/it][A
 23%|██▎       | 3/13 [00:01<00:04,  2.12it/s][A
 38%|███▊      | 5/13 [00:01<00:02,  3.16it/s][A
 54%|█████▍    | 7/13 [00:02<00:01,  3.30it/s][A
 69%|██████▉   | 9/13 [00:02<00:01,  3.68it/s][A
 85%|████████▍ | 11/13 [00:03<00:00,  4.18it/s][A
100%|██████████| 13/13 [00:03<00:00,  3.65it/s][A
Epochs:  44%|████▍     | 30/68 [14:16<17:51, 28.19s/it]

Val Loss: 0.1457 - Val Accuracy: 0.9366



Training:   0%|          | 0/103 [00:00<?, ?it/s][A
Training:   1%|          | 1/103 [00:01<02:02,  1.20s/it][A
Training:   3%|▎         | 3/103 [00:01<00:37,  2.68it/s][A
Training:   5%|▍         | 5/103 [00:01<00:32,  2.98it/s][A
Training:   6%|▌         | 6/103 [00:02<00:28,  3.43it/s][A
Training:   8%|▊         | 8/103 [00:02<00:18,  5.19it/s][A
Training:   9%|▊         | 9/103 [00:02<00:25,  3.62it/s][A
Training:  10%|▉         | 10/103 [00:03<00:28,  3.32it/s][A
Training:  12%|█▏        | 12/103 [00:03<00:18,  4.81it/s][A
Training:  13%|█▎        | 13/103 [00:03<00:21,  4.19it/s][A
Training:  14%|█▎        | 14/103 [00:04<00:26,  3.30it/s][A
Training:  16%|█▌        | 16/103 [00:04<00:17,  4.93it/s][A
Training:  17%|█▋        | 17/103 [00:04<00:21,  3.95it/s][A
Training:  17%|█▋        | 18/103 [00:05<00:24,  3.43it/s][A
Training:  20%|██        | 21/103 [00:05<00:20,  3.95it/s][A
Training:  21%|██▏       | 22/103 [00:05<00:18,  4.28it/s][A
Training:  22%|██▏    

Epoch: 31/68 - Loss: 0.1425 - Accuracy: 0.9450



  0%|          | 0/13 [00:00<?, ?it/s][A
  8%|▊         | 1/13 [00:01<00:14,  1.21s/it][A
 31%|███       | 4/13 [00:01<00:02,  3.80it/s][A
 46%|████▌     | 6/13 [00:02<00:02,  3.27it/s][A
 69%|██████▉   | 9/13 [00:02<00:01,  3.50it/s][A
 77%|███████▋  | 10/13 [00:02<00:00,  3.95it/s][A
100%|██████████| 13/13 [00:03<00:00,  3.59it/s][A
Epochs:  46%|████▌     | 31/68 [14:43<17:13, 27.93s/it]

Val Loss: 0.1619 - Val Accuracy: 0.9377



Training:   0%|          | 0/103 [00:00<?, ?it/s][A
Training:   1%|          | 1/103 [00:01<02:15,  1.32s/it][A
Training:   5%|▍         | 5/103 [00:02<00:38,  2.57it/s][A
Training:   7%|▋         | 7/103 [00:02<00:25,  3.70it/s][A
Training:   8%|▊         | 8/103 [00:02<00:22,  4.24it/s][A
Training:   9%|▊         | 9/103 [00:03<00:31,  2.95it/s][A
Training:  11%|█         | 11/103 [00:03<00:21,  4.32it/s][A
Training:  13%|█▎        | 13/103 [00:04<00:27,  3.33it/s][A
Training:  16%|█▌        | 16/103 [00:04<00:16,  5.26it/s][A
Training:  17%|█▋        | 18/103 [00:05<00:23,  3.66it/s][A
Training:  19%|█▉        | 20/103 [00:05<00:18,  4.58it/s][A
Training:  20%|██        | 21/103 [00:06<00:25,  3.23it/s][A
Training:  23%|██▎       | 24/103 [00:06<00:16,  4.84it/s][A
Training:  24%|██▍       | 25/103 [00:07<00:22,  3.52it/s][A
Training:  27%|██▋       | 28/103 [00:07<00:15,  4.85it/s][A
Training:  28%|██▊       | 29/103 [00:07<00:19,  3.83it/s][A
Training:  31%|███   

Epoch: 32/68 - Loss: 0.1425 - Accuracy: 0.9419



  0%|          | 0/13 [00:00<?, ?it/s][A
  8%|▊         | 1/13 [00:01<00:13,  1.12s/it][A
 23%|██▎       | 3/13 [00:01<00:03,  3.02it/s][A
 38%|███▊      | 5/13 [00:01<00:02,  3.08it/s][A
 69%|██████▉   | 9/13 [00:02<00:01,  3.79it/s][A
100%|██████████| 13/13 [00:03<00:00,  3.83it/s][A
Epochs:  47%|████▋     | 32/68 [15:10<16:34, 27.62s/it]

Val Loss: 0.1531 - Val Accuracy: 0.9378



Training:   0%|          | 0/103 [00:00<?, ?it/s][A
Training:   1%|          | 1/103 [00:01<02:02,  1.20s/it][A
Training:   3%|▎         | 3/103 [00:01<00:36,  2.74it/s][A
Training:   5%|▍         | 5/103 [00:02<00:36,  2.67it/s][A
Training:   7%|▋         | 7/103 [00:02<00:23,  4.14it/s][A
Training:   9%|▊         | 9/103 [00:03<00:27,  3.37it/s][A
Training:  12%|█▏        | 12/103 [00:03<00:16,  5.35it/s][A
Training:  14%|█▎        | 14/103 [00:04<00:23,  3.72it/s][A
Training:  15%|█▍        | 15/103 [00:04<00:21,  4.18it/s][A
Training:  16%|█▌        | 16/103 [00:04<00:18,  4.67it/s][A
Training:  17%|█▋        | 17/103 [00:04<00:24,  3.47it/s][A
Training:  18%|█▊        | 19/103 [00:04<00:16,  4.95it/s][A
Training:  20%|██        | 21/103 [00:05<00:23,  3.48it/s][A
Training:  22%|██▏       | 23/103 [00:05<00:17,  4.70it/s][A
Training:  24%|██▍       | 25/103 [00:06<00:21,  3.66it/s][A
Training:  26%|██▌       | 27/103 [00:06<00:15,  4.79it/s][A
Training:  28%|██▊   

Epoch: 33/68 - Loss: 0.1468 - Accuracy: 0.9432



  0%|          | 0/13 [00:00<?, ?it/s][A
  8%|▊         | 1/13 [00:01<00:14,  1.21s/it][A
 31%|███       | 4/13 [00:01<00:02,  3.73it/s][A
 46%|████▌     | 6/13 [00:01<00:01,  3.66it/s][A
 54%|█████▍    | 7/13 [00:02<00:01,  4.20it/s][A
 69%|██████▉   | 9/13 [00:02<00:01,  3.61it/s][A
 85%|████████▍ | 11/13 [00:02<00:00,  4.98it/s][A
100%|██████████| 13/13 [00:03<00:00,  3.75it/s][A
Epochs:  49%|████▊     | 33/68 [15:37<16:03, 27.53s/it]

Val Loss: 0.1499 - Val Accuracy: 0.9360



Training:   0%|          | 0/103 [00:00<?, ?it/s][A
Training:   1%|          | 1/103 [00:01<02:01,  1.19s/it][A
Training:   4%|▍         | 4/103 [00:01<00:26,  3.80it/s][A
Training:   6%|▌         | 6/103 [00:02<00:29,  3.31it/s][A
Training:   8%|▊         | 8/103 [00:02<00:21,  4.48it/s][A
Training:   9%|▊         | 9/103 [00:02<00:26,  3.49it/s][A
Training:  10%|▉         | 10/103 [00:02<00:25,  3.65it/s][A
Training:  11%|█         | 11/103 [00:03<00:21,  4.32it/s][A
Training:  12%|█▏        | 12/103 [00:03<00:18,  5.00it/s][A
Training:  13%|█▎        | 13/103 [00:03<00:22,  3.94it/s][A
Training:  14%|█▎        | 14/103 [00:03<00:25,  3.43it/s][A
Training:  16%|█▌        | 16/103 [00:04<00:16,  5.37it/s][A
Training:  17%|█▋        | 17/103 [00:04<00:19,  4.38it/s][A
Training:  17%|█▋        | 18/103 [00:04<00:22,  3.79it/s][A
Training:  18%|█▊        | 19/103 [00:04<00:19,  4.39it/s][A
Training:  20%|██        | 21/103 [00:05<00:15,  5.40it/s][A
Training:  21%|██▏   

Epoch: 34/68 - Loss: 0.1504 - Accuracy: 0.9398



  0%|          | 0/13 [00:00<?, ?it/s][A
  8%|▊         | 1/13 [00:01<00:12,  1.04s/it][A
 15%|█▌        | 2/13 [00:01<00:05,  1.96it/s][A
 31%|███       | 4/13 [00:01<00:02,  4.49it/s][A
 46%|████▌     | 6/13 [00:01<00:01,  3.55it/s][A
 69%|██████▉   | 9/13 [00:02<00:01,  3.32it/s][A
100%|██████████| 13/13 [00:03<00:00,  3.70it/s][A
Epochs:  50%|█████     | 34/68 [16:04<15:32, 27.42s/it]

Val Loss: 0.1523 - Val Accuracy: 0.9381



Training:   0%|          | 0/103 [00:00<?, ?it/s][A
Training:   1%|          | 1/103 [00:01<01:44,  1.02s/it][A
Training:   5%|▍         | 5/103 [00:01<00:33,  2.92it/s][A
Training:   7%|▋         | 7/103 [00:02<00:23,  4.12it/s][A
Training:   9%|▊         | 9/103 [00:02<00:26,  3.62it/s][A
Training:  11%|█         | 11/103 [00:02<00:18,  4.95it/s][A
Training:  13%|█▎        | 13/103 [00:03<00:22,  3.95it/s][A
Training:  15%|█▍        | 15/103 [00:03<00:17,  5.10it/s][A
Training:  17%|█▋        | 17/103 [00:04<00:20,  4.19it/s][A
Training:  17%|█▋        | 18/103 [00:04<00:18,  4.67it/s][A
Training:  19%|█▉        | 20/103 [00:04<00:13,  6.26it/s][A
Training:  21%|██▏       | 22/103 [00:05<00:16,  4.90it/s][A
Training:  22%|██▏       | 23/103 [00:05<00:15,  5.21it/s][A
Training:  23%|██▎       | 24/103 [00:05<00:18,  4.33it/s][A
Training:  24%|██▍       | 25/103 [00:06<00:20,  3.75it/s][A
Training:  26%|██▌       | 27/103 [00:06<00:14,  5.09it/s][A
Training:  27%|██▋  

Epoch: 35/68 - Loss: 0.1399 - Accuracy: 0.9451



  0%|          | 0/13 [00:00<?, ?it/s][A
  8%|▊         | 1/13 [00:01<00:15,  1.28s/it][A
 38%|███▊      | 5/13 [00:02<00:02,  2.74it/s][A
 54%|█████▍    | 7/13 [00:02<00:01,  4.01it/s][A
 69%|██████▉   | 9/13 [00:02<00:01,  3.51it/s][A
100%|██████████| 13/13 [00:03<00:00,  3.71it/s][A
Epochs:  51%|█████▏    | 35/68 [16:32<15:06, 27.46s/it]

Val Loss: 0.1420 - Val Accuracy: 0.9413



Training:   0%|          | 0/103 [00:00<?, ?it/s][A
Training:   1%|          | 1/103 [00:00<01:33,  1.09it/s][A
Training:   2%|▏         | 2/103 [00:01<00:46,  2.17it/s][A
Training:   4%|▍         | 4/103 [00:01<00:20,  4.75it/s][A
Training:   5%|▍         | 5/103 [00:01<00:28,  3.44it/s][A
Training:   6%|▌         | 6/103 [00:01<00:23,  4.15it/s][A
Training:   8%|▊         | 8/103 [00:01<00:14,  6.43it/s][A
Training:  10%|▉         | 10/103 [00:02<00:22,  4.14it/s][A
Training:  11%|█         | 11/103 [00:02<00:19,  4.74it/s][A
Training:  13%|█▎        | 13/103 [00:03<00:29,  3.03it/s][A
Training:  16%|█▌        | 16/103 [00:03<00:17,  5.00it/s][A
Training:  17%|█▋        | 18/103 [00:04<00:22,  3.76it/s][A
Training:  19%|█▉        | 20/103 [00:04<00:17,  4.86it/s][A
Training:  21%|██▏       | 22/103 [00:05<00:19,  4.09it/s][A
Training:  24%|██▍       | 25/103 [00:06<00:21,  3.71it/s][A
Training:  28%|██▊       | 29/103 [00:07<00:19,  3.78it/s][A
Training:  32%|███▏   

Epoch: 36/68 - Loss: 0.1409 - Accuracy: 0.9434



  0%|          | 0/13 [00:00<?, ?it/s][A
  8%|▊         | 1/13 [00:01<00:13,  1.11s/it][A
 38%|███▊      | 5/13 [00:01<00:02,  3.06it/s][A
 69%|██████▉   | 9/13 [00:02<00:01,  3.70it/s][A
 85%|████████▍ | 11/13 [00:02<00:00,  4.68it/s][A
100%|██████████| 13/13 [00:03<00:00,  3.82it/s][A
Epochs:  53%|█████▎    | 36/68 [17:00<14:41, 27.56s/it]

Val Loss: 0.1505 - Val Accuracy: 0.9369



Training:   0%|          | 0/103 [00:00<?, ?it/s][A
Training:   1%|          | 1/103 [00:01<01:55,  1.13s/it][A
Training:   4%|▍         | 4/103 [00:01<00:24,  4.02it/s][A
Training:   6%|▌         | 6/103 [00:02<00:30,  3.22it/s][A
Training:   8%|▊         | 8/103 [00:02<00:20,  4.74it/s][A
Training:  10%|▉         | 10/103 [00:03<00:26,  3.47it/s][A
Training:  13%|█▎        | 13/103 [00:03<00:26,  3.43it/s][A
Training:  15%|█▍        | 15/103 [00:04<00:19,  4.45it/s][A
Training:  17%|█▋        | 17/103 [00:04<00:23,  3.74it/s][A
Training:  20%|██        | 21/103 [00:05<00:18,  4.32it/s][A
Training:  23%|██▎       | 24/103 [00:05<00:13,  5.96it/s][A
Training:  25%|██▌       | 26/103 [00:06<00:16,  4.70it/s][A
Training:  27%|██▋       | 28/103 [00:06<00:13,  5.54it/s][A
Training:  29%|██▉       | 30/103 [00:07<00:16,  4.47it/s][A
Training:  30%|███       | 31/103 [00:07<00:15,  4.80it/s][A
Training:  32%|███▏      | 33/103 [00:08<00:17,  3.91it/s][A
Training:  34%|███▍ 

Epoch: 37/68 - Loss: 0.1429 - Accuracy: 0.9437



  0%|          | 0/13 [00:00<?, ?it/s][A
  8%|▊         | 1/13 [00:01<00:13,  1.15s/it][A
 31%|███       | 4/13 [00:01<00:02,  3.93it/s][A
 46%|████▌     | 6/13 [00:02<00:02,  3.20it/s][A
 69%|██████▉   | 9/13 [00:02<00:01,  3.30it/s][A
100%|██████████| 13/13 [00:03<00:00,  3.60it/s][A
Epochs:  54%|█████▍    | 37/68 [17:27<14:11, 27.47s/it]

Val Loss: 0.1848 - Val Accuracy: 0.9314



Training:   0%|          | 0/103 [00:00<?, ?it/s][A
Training:   1%|          | 1/103 [00:01<01:52,  1.10s/it][A
Training:   3%|▎         | 3/103 [00:01<00:32,  3.04it/s][A
Training:   5%|▍         | 5/103 [00:01<00:34,  2.85it/s][A
Training:   8%|▊         | 8/103 [00:02<00:17,  5.29it/s][A
Training:  10%|▉         | 10/103 [00:02<00:23,  3.94it/s][A
Training:  12%|█▏        | 12/103 [00:02<00:17,  5.15it/s][A
Training:  14%|█▎        | 14/103 [00:03<00:21,  4.20it/s][A
Training:  15%|█▍        | 15/103 [00:03<00:18,  4.65it/s][A
Training:  17%|█▋        | 17/103 [00:04<00:21,  3.99it/s][A
Training:  20%|██        | 21/103 [00:05<00:17,  4.61it/s][A
Training:  21%|██▏       | 22/103 [00:05<00:16,  4.97it/s][A
Training:  24%|██▍       | 25/103 [00:06<00:17,  4.53it/s][A
Training:  25%|██▌       | 26/103 [00:06<00:15,  4.82it/s][A
Training:  28%|██▊       | 29/103 [00:06<00:16,  4.54it/s][A
Training:  29%|██▉       | 30/103 [00:06<00:14,  4.92it/s][A
Training:  32%|███▏ 

Epoch: 38/68 - Loss: 0.1440 - Accuracy: 0.9426



  0%|          | 0/13 [00:00<?, ?it/s][A
  8%|▊         | 1/13 [00:01<00:15,  1.31s/it][A
 31%|███       | 4/13 [00:01<00:02,  3.23it/s][A
 38%|███▊      | 5/13 [00:02<00:03,  2.45it/s][A
 62%|██████▏   | 8/13 [00:02<00:01,  4.57it/s][A
 69%|██████▉   | 9/13 [00:03<00:01,  2.96it/s][A
100%|██████████| 13/13 [00:03<00:00,  3.50it/s][A
Epochs:  56%|█████▌    | 38/68 [17:54<13:38, 27.27s/it]

Val Loss: 0.1510 - Val Accuracy: 0.9388



Training:   0%|          | 0/103 [00:00<?, ?it/s][A
Training:   1%|          | 1/103 [00:01<02:05,  1.23s/it][A
Training:   3%|▎         | 3/103 [00:01<00:36,  2.74it/s][A
Training:   5%|▍         | 5/103 [00:02<00:36,  2.65it/s][A
Training:   9%|▊         | 9/103 [00:02<00:26,  3.57it/s][A
Training:  11%|█         | 11/103 [00:03<00:19,  4.67it/s][A
Training:  13%|█▎        | 13/103 [00:03<00:24,  3.70it/s][A
Training:  15%|█▍        | 15/103 [00:04<00:18,  4.83it/s][A
Training:  17%|█▋        | 17/103 [00:04<00:21,  4.03it/s][A
Training:  18%|█▊        | 19/103 [00:04<00:16,  4.96it/s][A
Training:  20%|██        | 21/103 [00:05<00:18,  4.48it/s][A
Training:  22%|██▏       | 23/103 [00:05<00:16,  4.95it/s][A
Training:  24%|██▍       | 25/103 [00:06<00:16,  4.73it/s][A
Training:  26%|██▌       | 27/103 [00:06<00:14,  5.13it/s][A
Training:  28%|██▊       | 29/103 [00:07<00:16,  4.55it/s][A
Training:  30%|███       | 31/103 [00:07<00:15,  4.70it/s][A
Training:  32%|███▏ 

Epoch: 39/68 - Loss: 0.1400 - Accuracy: 0.9445



  0%|          | 0/13 [00:00<?, ?it/s][A
  8%|▊         | 1/13 [00:01<00:14,  1.19s/it][A
 38%|███▊      | 5/13 [00:02<00:03,  2.65it/s][A
 54%|█████▍    | 7/13 [00:02<00:01,  3.81it/s][A
 62%|██████▏   | 8/13 [00:02<00:01,  4.34it/s][A
 69%|██████▉   | 9/13 [00:03<00:01,  3.11it/s][A
 85%|████████▍ | 11/13 [00:03<00:00,  4.68it/s][A
100%|██████████| 13/13 [00:03<00:00,  3.61it/s][A
Epochs:  57%|█████▋    | 39/68 [18:21<13:07, 27.17s/it]

Val Loss: 0.1627 - Val Accuracy: 0.9293



Training:   0%|          | 0/103 [00:00<?, ?it/s][A
Training:   1%|          | 1/103 [00:00<01:40,  1.02it/s][A
Training:   3%|▎         | 3/103 [00:01<00:29,  3.42it/s][A
Training:   5%|▍         | 5/103 [00:01<00:33,  2.89it/s][A
Training:   8%|▊         | 8/103 [00:01<00:17,  5.45it/s][A
Training:  10%|▉         | 10/103 [00:02<00:22,  4.18it/s][A
Training:  13%|█▎        | 13/103 [00:03<00:22,  4.06it/s][A
Training:  16%|█▌        | 16/103 [00:03<00:14,  5.87it/s][A
Training:  17%|█▋        | 18/103 [00:04<00:18,  4.58it/s][A
Training:  19%|█▉        | 20/103 [00:04<00:14,  5.64it/s][A
Training:  21%|██▏       | 22/103 [00:05<00:20,  4.05it/s][A
Training:  24%|██▍       | 25/103 [00:06<00:20,  3.79it/s][A
Training:  26%|██▌       | 27/103 [00:06<00:15,  4.80it/s][A
Training:  28%|██▊       | 29/103 [00:06<00:17,  4.16it/s][A
Training:  31%|███       | 32/103 [00:07<00:11,  6.05it/s][A
Training:  33%|███▎      | 34/103 [00:07<00:15,  4.44it/s][A
Training:  35%|███▍ 

Epoch: 40/68 - Loss: 0.1394 - Accuracy: 0.9442



  0%|          | 0/13 [00:00<?, ?it/s][A
  8%|▊         | 1/13 [00:01<00:16,  1.41s/it][A
 38%|███▊      | 5/13 [00:02<00:03,  2.65it/s][A
 62%|██████▏   | 8/13 [00:02<00:01,  4.56it/s][A
 77%|███████▋  | 10/13 [00:03<00:00,  3.74it/s][A
100%|██████████| 13/13 [00:03<00:00,  3.45it/s][A
Epochs:  59%|█████▉    | 40/68 [18:47<12:35, 26.99s/it]

Val Loss: 0.1570 - Val Accuracy: 0.9350



Training:   0%|          | 0/103 [00:00<?, ?it/s][A
Training:   1%|          | 1/103 [00:01<02:05,  1.23s/it][A
Training:   3%|▎         | 3/103 [00:01<00:37,  2.63it/s][A
Training:   5%|▍         | 5/103 [00:01<00:31,  3.10it/s][A
Training:   6%|▌         | 6/103 [00:02<00:29,  3.32it/s][A
Training:   8%|▊         | 8/103 [00:02<00:18,  5.05it/s][A
Training:   9%|▊         | 9/103 [00:02<00:25,  3.69it/s][A
Training:  10%|▉         | 10/103 [00:03<00:25,  3.62it/s][A
Training:  12%|█▏        | 12/103 [00:03<00:17,  5.25it/s][A
Training:  13%|█▎        | 13/103 [00:03<00:24,  3.65it/s][A
Training:  14%|█▎        | 14/103 [00:04<00:22,  3.89it/s][A
Training:  17%|█▋        | 17/103 [00:04<00:19,  4.36it/s][A
Training:  17%|█▋        | 18/103 [00:04<00:18,  4.49it/s][A
Training:  20%|██        | 21/103 [00:05<00:17,  4.81it/s][A
Training:  21%|██▏       | 22/103 [00:05<00:16,  5.02it/s][A
Training:  23%|██▎       | 24/103 [00:05<00:12,  6.45it/s][A
Training:  24%|██▍    

Epoch: 41/68 - Loss: 0.1470 - Accuracy: 0.9396



  0%|          | 0/13 [00:00<?, ?it/s][A
  8%|▊         | 1/13 [00:01<00:15,  1.26s/it][A
 23%|██▎       | 3/13 [00:01<00:03,  2.65it/s][A
 38%|███▊      | 5/13 [00:02<00:03,  2.47it/s][A
 62%|██████▏   | 8/13 [00:02<00:01,  4.59it/s][A
 77%|███████▋  | 10/13 [00:03<00:00,  3.91it/s][A
100%|██████████| 13/13 [00:03<00:00,  3.49it/s][A
Epochs:  60%|██████    | 41/68 [19:15<12:11, 27.08s/it]

Val Loss: 0.1592 - Val Accuracy: 0.9328



Training:   0%|          | 0/103 [00:00<?, ?it/s][A
Training:   1%|          | 1/103 [00:01<01:52,  1.10s/it][A
Training:   3%|▎         | 3/103 [00:01<00:33,  2.95it/s][A
Training:   5%|▍         | 5/103 [00:02<00:37,  2.64it/s][A
Training:   7%|▋         | 7/103 [00:02<00:24,  3.95it/s][A
Training:   9%|▊         | 9/103 [00:03<00:30,  3.13it/s][A
Training:  11%|█         | 11/103 [00:03<00:22,  4.13it/s][A
Training:  13%|█▎        | 13/103 [00:04<00:26,  3.40it/s][A
Training:  15%|█▍        | 15/103 [00:04<00:19,  4.50it/s][A
Training:  17%|█▋        | 17/103 [00:05<00:24,  3.44it/s][A
Training:  17%|█▋        | 18/103 [00:05<00:21,  3.87it/s][A
Training:  20%|██        | 21/103 [00:06<00:21,  3.78it/s][A
Training:  22%|██▏       | 23/103 [00:06<00:16,  4.75it/s][A
Training:  24%|██▍       | 25/103 [00:06<00:19,  4.07it/s][A
Training:  27%|██▋       | 28/103 [00:06<00:12,  6.10it/s][A
Training:  29%|██▉       | 30/103 [00:07<00:16,  4.35it/s][A
Training:  32%|███▏  

Epoch: 42/68 - Loss: 0.1416 - Accuracy: 0.9429



  0%|          | 0/13 [00:00<?, ?it/s][A
  8%|▊         | 1/13 [00:01<00:15,  1.26s/it][A
 15%|█▌        | 2/13 [00:01<00:07,  1.50it/s][A
 38%|███▊      | 5/13 [00:02<00:02,  3.10it/s][A
 46%|████▌     | 6/13 [00:02<00:02,  3.45it/s][A
 69%|██████▉   | 9/13 [00:02<00:01,  3.95it/s][A
 77%|███████▋  | 10/13 [00:03<00:00,  4.10it/s][A
100%|██████████| 13/13 [00:03<00:00,  3.51it/s][A
Epochs:  62%|██████▏   | 42/68 [19:42<11:47, 27.21s/it]

Val Loss: 0.1535 - Val Accuracy: 0.9416



Training:   0%|          | 0/103 [00:00<?, ?it/s][A
Training:   1%|          | 1/103 [00:01<02:19,  1.37s/it][A
Training:   3%|▎         | 3/103 [00:01<00:39,  2.52it/s][A
Training:   5%|▍         | 5/103 [00:02<00:38,  2.57it/s][A
Training:   7%|▋         | 7/103 [00:02<00:23,  4.01it/s][A
Training:   9%|▊         | 9/103 [00:03<00:26,  3.52it/s][A
Training:  12%|█▏        | 12/103 [00:03<00:16,  5.66it/s][A
Training:  14%|█▎        | 14/103 [00:04<00:22,  3.98it/s][A
Training:  17%|█▋        | 17/103 [00:04<00:23,  3.64it/s][A
Training:  20%|██        | 21/103 [00:05<00:19,  4.19it/s][A
Training:  23%|██▎       | 24/103 [00:05<00:14,  5.61it/s][A
Training:  25%|██▌       | 26/103 [00:06<00:18,  4.17it/s][A
Training:  27%|██▋       | 28/103 [00:06<00:14,  5.17it/s][A
Training:  29%|██▉       | 30/103 [00:07<00:16,  4.31it/s][A
Training:  32%|███▏      | 33/103 [00:08<00:17,  4.06it/s][A
Training:  34%|███▍      | 35/103 [00:08<00:13,  4.98it/s][A
Training:  36%|███▌  

Epoch: 43/68 - Loss: 0.1431 - Accuracy: 0.9424



  0%|          | 0/13 [00:00<?, ?it/s][A
  8%|▊         | 1/13 [00:01<00:13,  1.12s/it][A
 31%|███       | 4/13 [00:01<00:02,  4.17it/s][A
 46%|████▌     | 6/13 [00:02<00:02,  3.04it/s][A
 69%|██████▉   | 9/13 [00:02<00:01,  3.55it/s][A
 77%|███████▋  | 10/13 [00:03<00:00,  3.67it/s][A
100%|██████████| 13/13 [00:03<00:00,  3.66it/s][A
Epochs:  63%|██████▎   | 43/68 [20:09<11:20, 27.21s/it]

Val Loss: 0.1705 - Val Accuracy: 0.9317



Training:   0%|          | 0/103 [00:00<?, ?it/s][A
Training:   1%|          | 1/103 [00:01<02:02,  1.20s/it][A
Training:   5%|▍         | 5/103 [00:02<00:35,  2.80it/s][A
Training:   7%|▋         | 7/103 [00:02<00:23,  4.10it/s][A
Training:   9%|▊         | 9/103 [00:02<00:25,  3.73it/s][A
Training:  13%|█▎        | 13/103 [00:03<00:20,  4.40it/s][A
Training:  16%|█▌        | 16/103 [00:03<00:13,  6.23it/s][A
Training:  17%|█▋        | 18/103 [00:04<00:19,  4.40it/s][A
Training:  19%|█▉        | 20/103 [00:04<00:15,  5.53it/s][A
Training:  21%|██▏       | 22/103 [00:05<00:19,  4.09it/s][A
Training:  24%|██▍       | 25/103 [00:06<00:19,  3.95it/s][A
Training:  28%|██▊       | 29/103 [00:07<00:17,  4.26it/s][A
Training:  29%|██▉       | 30/103 [00:07<00:16,  4.38it/s][A
Training:  31%|███       | 32/103 [00:07<00:12,  5.51it/s][A
Training:  33%|███▎      | 34/103 [00:08<00:15,  4.35it/s][A
Training:  36%|███▌      | 37/103 [00:08<00:13,  5.01it/s][A
Training:  37%|███▋ 

Epoch: 44/68 - Loss: 0.1392 - Accuracy: 0.9452



  0%|          | 0/13 [00:00<?, ?it/s][A
  8%|▊         | 1/13 [00:01<00:14,  1.22s/it][A
 23%|██▎       | 3/13 [00:01<00:03,  2.82it/s][A
 38%|███▊      | 5/13 [00:02<00:02,  2.73it/s][A
 46%|████▌     | 6/13 [00:02<00:02,  3.05it/s][A
 69%|██████▉   | 9/13 [00:02<00:01,  3.74it/s][A
 77%|███████▋  | 10/13 [00:03<00:00,  3.71it/s][A
100%|██████████| 13/13 [00:03<00:00,  3.56it/s][A
Epochs:  65%|██████▍   | 44/68 [20:36<10:46, 26.94s/it]

Val Loss: 0.1541 - Val Accuracy: 0.9325



Training:   0%|          | 0/103 [00:00<?, ?it/s][A
Training:   1%|          | 1/103 [00:01<02:17,  1.35s/it][A
Training:   3%|▎         | 3/103 [00:01<00:39,  2.51it/s][A
Training:   5%|▍         | 5/103 [00:02<00:36,  2.68it/s][A
Training:   7%|▋         | 7/103 [00:02<00:26,  3.66it/s][A
Training:   9%|▊         | 9/103 [00:03<00:26,  3.56it/s][A
Training:  11%|█         | 11/103 [00:03<00:22,  4.09it/s][A
Training:  13%|█▎        | 13/103 [00:04<00:24,  3.66it/s][A
Training:  15%|█▍        | 15/103 [00:04<00:20,  4.29it/s][A
Training:  17%|█▋        | 17/103 [00:05<00:23,  3.72it/s][A
Training:  18%|█▊        | 19/103 [00:05<00:18,  4.46it/s][A
Training:  20%|██        | 21/103 [00:05<00:20,  4.05it/s][A
Training:  22%|██▏       | 23/103 [00:06<00:18,  4.41it/s][A
Training:  24%|██▍       | 25/103 [00:06<00:17,  4.56it/s][A
Training:  25%|██▌       | 26/103 [00:06<00:15,  4.99it/s][A
Training:  26%|██▌       | 27/103 [00:07<00:18,  4.18it/s][A
Training:  28%|██▊   

Epoch: 45/68 - Loss: 0.1409 - Accuracy: 0.9451



  0%|          | 0/13 [00:00<?, ?it/s][A
  8%|▊         | 1/13 [00:01<00:14,  1.18s/it][A
 38%|███▊      | 5/13 [00:01<00:02,  2.89it/s][A
 62%|██████▏   | 8/13 [00:02<00:01,  4.96it/s][A
 77%|███████▋  | 10/13 [00:02<00:00,  3.78it/s][A
 85%|████████▍ | 11/13 [00:03<00:00,  4.25it/s][A
100%|██████████| 13/13 [00:03<00:00,  3.55it/s][A
Epochs:  66%|██████▌   | 45/68 [21:03<10:22, 27.08s/it]

Val Loss: 0.1620 - Val Accuracy: 0.9354



Training:   0%|          | 0/103 [00:00<?, ?it/s][A
Training:   1%|          | 1/103 [00:01<02:19,  1.37s/it][A
Training:   3%|▎         | 3/103 [00:01<00:40,  2.46it/s][A
Training:   5%|▍         | 5/103 [00:02<00:37,  2.60it/s][A
Training:   7%|▋         | 7/103 [00:02<00:24,  4.00it/s][A
Training:   9%|▊         | 9/103 [00:03<00:32,  2.93it/s][A
Training:  11%|█         | 11/103 [00:03<00:22,  4.16it/s][A
Training:  13%|█▎        | 13/103 [00:04<00:28,  3.12it/s][A
Training:  17%|█▋        | 17/103 [00:05<00:22,  3.80it/s][A
Training:  18%|█▊        | 19/103 [00:05<00:17,  4.78it/s][A
Training:  20%|██        | 21/103 [00:06<00:21,  3.78it/s][A
Training:  23%|██▎       | 24/103 [00:06<00:14,  5.53it/s][A
Training:  25%|██▌       | 26/103 [00:07<00:18,  4.13it/s][A
Training:  27%|██▋       | 28/103 [00:07<00:14,  5.16it/s][A
Training:  29%|██▉       | 30/103 [00:08<00:18,  4.00it/s][A
Training:  32%|███▏      | 33/103 [00:08<00:18,  3.74it/s][A
Training:  36%|███▌  

Epoch: 46/68 - Loss: 0.1437 - Accuracy: 0.9427



  0%|          | 0/13 [00:00<?, ?it/s][A
  8%|▊         | 1/13 [00:01<00:12,  1.02s/it][A
 38%|███▊      | 5/13 [00:02<00:02,  2.72it/s][A
 54%|█████▍    | 7/13 [00:02<00:01,  4.00it/s][A
 69%|██████▉   | 9/13 [00:02<00:01,  3.37it/s][A
 85%|████████▍ | 11/13 [00:03<00:00,  4.63it/s][A
100%|██████████| 13/13 [00:03<00:00,  3.58it/s][A
Epochs:  68%|██████▊   | 46/68 [21:30<09:55, 27.06s/it]

Val Loss: 0.1656 - Val Accuracy: 0.9296



Training:   0%|          | 0/103 [00:00<?, ?it/s][A
Training:   1%|          | 1/103 [00:00<01:40,  1.02it/s][A
Training:   2%|▏         | 2/103 [00:01<01:01,  1.65it/s][A
Training:   5%|▍         | 5/103 [00:01<00:27,  3.52it/s][A
Training:   6%|▌         | 6/103 [00:02<00:31,  3.07it/s][A
Training:   8%|▊         | 8/103 [00:02<00:20,  4.63it/s][A
Training:   9%|▊         | 9/103 [00:02<00:24,  3.79it/s][A
Training:  10%|▉         | 10/103 [00:03<00:27,  3.33it/s][A
Training:  12%|█▏        | 12/103 [00:03<00:18,  4.98it/s][A
Training:  13%|█▎        | 13/103 [00:03<00:23,  3.79it/s][A
Training:  14%|█▎        | 14/103 [00:04<00:25,  3.48it/s][A
Training:  16%|█▌        | 16/103 [00:04<00:16,  5.16it/s][A
Training:  17%|█▋        | 17/103 [00:04<00:18,  4.59it/s][A
Training:  17%|█▋        | 18/103 [00:05<00:23,  3.67it/s][A
Training:  19%|█▉        | 20/103 [00:05<00:15,  5.35it/s][A
Training:  20%|██        | 21/103 [00:05<00:14,  5.82it/s][A
Training:  21%|██▏    

Epoch: 47/68 - Loss: 0.1483 - Accuracy: 0.9431



  0%|          | 0/13 [00:00<?, ?it/s][A
  8%|▊         | 1/13 [00:00<00:11,  1.01it/s][A
 15%|█▌        | 2/13 [00:01<00:05,  1.98it/s][A
 38%|███▊      | 5/13 [00:01<00:02,  3.26it/s][A
 46%|████▌     | 6/13 [00:02<00:02,  3.34it/s][A
 62%|██████▏   | 8/13 [00:02<00:01,  4.99it/s][A
 69%|██████▉   | 9/13 [00:02<00:01,  3.31it/s][A
 77%|███████▋  | 10/13 [00:03<00:00,  3.51it/s][A
100%|██████████| 13/13 [00:03<00:00,  3.54it/s][A
Epochs:  69%|██████▉   | 47/68 [21:57<09:25, 26.94s/it]

Val Loss: 0.1898 - Val Accuracy: 0.9298



Training:   0%|          | 0/103 [00:00<?, ?it/s][A
Training:   1%|          | 1/103 [00:00<01:31,  1.11it/s][A
Training:   2%|▏         | 2/103 [00:01<00:52,  1.92it/s][A
Training:   4%|▍         | 4/103 [00:01<00:25,  3.85it/s][A
Training:   5%|▍         | 5/103 [00:01<00:32,  3.06it/s][A
Training:   6%|▌         | 6/103 [00:02<00:28,  3.44it/s][A
Training:   8%|▊         | 8/103 [00:02<00:21,  4.34it/s][A
Training:   9%|▊         | 9/103 [00:02<00:27,  3.43it/s][A
Training:  10%|▉         | 10/103 [00:03<00:24,  3.87it/s][A
Training:  12%|█▏        | 12/103 [00:03<00:18,  4.86it/s][A
Training:  13%|█▎        | 13/103 [00:03<00:22,  3.99it/s][A
Training:  14%|█▎        | 14/103 [00:03<00:21,  4.20it/s][A
Training:  16%|█▌        | 16/103 [00:04<00:15,  5.60it/s][A
Training:  17%|█▋        | 17/103 [00:04<00:21,  4.07it/s][A
Training:  17%|█▋        | 18/103 [00:04<00:17,  4.77it/s][A
Training:  19%|█▉        | 20/103 [00:04<00:12,  6.44it/s][A
Training:  20%|██      

Epoch: 48/68 - Loss: 0.1497 - Accuracy: 0.9416



  0%|          | 0/13 [00:00<?, ?it/s][A
  8%|▊         | 1/13 [00:01<00:14,  1.20s/it][A
 23%|██▎       | 3/13 [00:01<00:03,  2.71it/s][A
 38%|███▊      | 5/13 [00:02<00:02,  2.70it/s][A
 54%|█████▍    | 7/13 [00:02<00:01,  4.16it/s][A
 69%|██████▉   | 9/13 [00:02<00:01,  3.51it/s][A
 85%|████████▍ | 11/13 [00:03<00:00,  4.86it/s][A
100%|██████████| 13/13 [00:03<00:00,  3.64it/s][A
Epochs:  71%|███████   | 48/68 [22:23<08:54, 26.74s/it]

Val Loss: 0.1584 - Val Accuracy: 0.9354



Training:   0%|          | 0/103 [00:00<?, ?it/s][A
Training:   1%|          | 1/103 [00:01<01:56,  1.15s/it][A
Training:   3%|▎         | 3/103 [00:01<00:36,  2.72it/s][A
Training:   5%|▍         | 5/103 [00:02<00:34,  2.85it/s][A
Training:   6%|▌         | 6/103 [00:02<00:34,  2.83it/s][A
Training:   9%|▊         | 9/103 [00:02<00:24,  3.78it/s][A
Training:  10%|▉         | 10/103 [00:03<00:26,  3.48it/s][A
Training:  13%|█▎        | 13/103 [00:03<00:19,  4.50it/s][A
Training:  14%|█▎        | 14/103 [00:04<00:22,  3.92it/s][A
Training:  16%|█▌        | 16/103 [00:04<00:16,  5.17it/s][A
Training:  17%|█▋        | 17/103 [00:04<00:22,  3.88it/s][A
Training:  17%|█▋        | 18/103 [00:05<00:21,  3.86it/s][A
Training:  19%|█▉        | 20/103 [00:05<00:14,  5.57it/s][A
Training:  20%|██        | 21/103 [00:05<00:22,  3.60it/s][A
Training:  21%|██▏       | 22/103 [00:06<00:21,  3.71it/s][A
Training:  24%|██▍       | 25/103 [00:06<00:17,  4.54it/s][A
Training:  25%|██▌   

Epoch: 49/68 - Loss: 0.1434 - Accuracy: 0.9441



  0%|          | 0/13 [00:00<?, ?it/s][A
  8%|▊         | 1/13 [00:01<00:13,  1.16s/it][A
 23%|██▎       | 3/13 [00:01<00:03,  2.89it/s][A
 38%|███▊      | 5/13 [00:01<00:02,  2.92it/s][A
 46%|████▌     | 6/13 [00:02<00:02,  3.06it/s][A
 62%|██████▏   | 8/13 [00:02<00:01,  4.80it/s][A
 77%|███████▋  | 10/13 [00:03<00:00,  3.37it/s][A
100%|██████████| 13/13 [00:03<00:00,  3.64it/s][A
Epochs:  72%|███████▏  | 49/68 [22:51<08:32, 26.98s/it]

Val Loss: 0.2204 - Val Accuracy: 0.9295



Training:   0%|          | 0/103 [00:00<?, ?it/s][A
Training:   1%|          | 1/103 [00:01<02:00,  1.18s/it][A
Training:   2%|▏         | 2/103 [00:01<01:00,  1.67it/s][A
Training:   5%|▍         | 5/103 [00:01<00:30,  3.17it/s][A
Training:   6%|▌         | 6/103 [00:02<00:29,  3.33it/s][A
Training:   7%|▋         | 7/103 [00:02<00:24,  3.90it/s][A
Training:   9%|▊         | 9/103 [00:02<00:24,  3.85it/s][A
Training:  10%|▉         | 10/103 [00:03<00:24,  3.75it/s][A
Training:  12%|█▏        | 12/103 [00:03<00:17,  5.26it/s][A
Training:  13%|█▎        | 13/103 [00:03<00:23,  3.83it/s][A
Training:  14%|█▎        | 14/103 [00:04<00:23,  3.84it/s][A
Training:  16%|█▌        | 16/103 [00:04<00:15,  5.52it/s][A
Training:  17%|█▋        | 17/103 [00:04<00:23,  3.63it/s][A
Training:  17%|█▋        | 18/103 [00:04<00:20,  4.08it/s][A
Training:  19%|█▉        | 20/103 [00:05<00:15,  5.21it/s][A
Training:  20%|██        | 21/103 [00:05<00:20,  3.91it/s][A
Training:  21%|██▏    

Epoch: 50/68 - Loss: 0.1412 - Accuracy: 0.9436



  0%|          | 0/13 [00:00<?, ?it/s][A
  8%|▊         | 1/13 [00:00<00:10,  1.09it/s][A
 31%|███       | 4/13 [00:01<00:01,  4.90it/s][A
 46%|████▌     | 6/13 [00:01<00:01,  3.52it/s][A
 62%|██████▏   | 8/13 [00:01<00:01,  4.88it/s][A
 77%|███████▋  | 10/13 [00:02<00:00,  3.26it/s][A
100%|██████████| 13/13 [00:03<00:00,  3.88it/s][A
Epochs:  74%|███████▎  | 50/68 [23:18<08:05, 26.96s/it]

Val Loss: 0.1647 - Val Accuracy: 0.9365



Training:   0%|          | 0/103 [00:00<?, ?it/s][A
Training:   1%|          | 1/103 [00:01<02:01,  1.19s/it][A
Training:   2%|▏         | 2/103 [00:01<01:00,  1.68it/s][A
Training:   5%|▍         | 5/103 [00:02<00:32,  3.04it/s][A
Training:   6%|▌         | 6/103 [00:02<00:31,  3.04it/s][A
Training:   9%|▊         | 9/103 [00:02<00:23,  4.07it/s][A
Training:  10%|▉         | 10/103 [00:03<00:24,  3.83it/s][A
Training:  12%|█▏        | 12/103 [00:03<00:17,  5.33it/s][A
Training:  13%|█▎        | 13/103 [00:03<00:23,  3.79it/s][A
Training:  14%|█▎        | 14/103 [00:04<00:26,  3.41it/s][A
Training:  17%|█▋        | 17/103 [00:04<00:20,  4.15it/s][A
Training:  17%|█▋        | 18/103 [00:05<00:22,  3.75it/s][A
Training:  19%|█▉        | 20/103 [00:05<00:16,  5.17it/s][A
Training:  20%|██        | 21/103 [00:05<00:18,  4.34it/s][A
Training:  21%|██▏       | 22/103 [00:06<00:20,  4.03it/s][A
Training:  24%|██▍       | 25/103 [00:06<00:17,  4.51it/s][A
Training:  25%|██▌   

Epoch: 51/68 - Loss: 0.1424 - Accuracy: 0.9438



  0%|          | 0/13 [00:00<?, ?it/s][A
  8%|▊         | 1/13 [00:01<00:16,  1.35s/it][A
 38%|███▊      | 5/13 [00:02<00:02,  2.75it/s][A
 54%|█████▍    | 7/13 [00:02<00:01,  4.08it/s][A
 69%|██████▉   | 9/13 [00:02<00:01,  3.69it/s][A
 85%|████████▍ | 11/13 [00:02<00:00,  5.03it/s][A
100%|██████████| 13/13 [00:03<00:00,  3.68it/s][A
Epochs:  75%|███████▌  | 51/68 [23:45<07:40, 27.08s/it]

Val Loss: 0.1918 - Val Accuracy: 0.9251



Training:   0%|          | 0/103 [00:00<?, ?it/s][A
Training:   1%|          | 1/103 [00:01<01:58,  1.16s/it][A
Training:   2%|▏         | 2/103 [00:01<00:56,  1.80it/s][A
Training:   3%|▎         | 3/103 [00:01<00:37,  2.68it/s][A
Training:   5%|▍         | 5/103 [00:02<00:34,  2.82it/s][A
Training:   7%|▋         | 7/103 [00:02<00:21,  4.50it/s][A
Training:   9%|▊         | 9/103 [00:02<00:26,  3.59it/s][A
Training:  11%|█         | 11/103 [00:03<00:18,  5.06it/s][A
Training:  13%|█▎        | 13/103 [00:03<00:23,  3.80it/s][A
Training:  14%|█▎        | 14/103 [00:03<00:20,  4.31it/s][A
Training:  17%|█▋        | 17/103 [00:04<00:22,  3.75it/s][A
Training:  19%|█▉        | 20/103 [00:05<00:14,  5.71it/s][A
Training:  21%|██▏       | 22/103 [00:05<00:19,  4.15it/s][A
Training:  24%|██▍       | 25/103 [00:06<00:20,  3.87it/s][A
Training:  28%|██▊       | 29/103 [00:07<00:16,  4.37it/s][A
Training:  31%|███       | 32/103 [00:07<00:12,  5.83it/s][A
Training:  33%|███▎   

Epoch: 52/68 - Loss: 0.1545 - Accuracy: 0.9373



  0%|          | 0/13 [00:00<?, ?it/s][A
  8%|▊         | 1/13 [00:01<00:13,  1.09s/it][A
 15%|█▌        | 2/13 [00:01<00:05,  1.89it/s][A
 38%|███▊      | 5/13 [00:01<00:02,  3.10it/s][A
 46%|████▌     | 6/13 [00:02<00:02,  3.39it/s][A
 69%|██████▉   | 9/13 [00:02<00:00,  4.10it/s][A
 77%|███████▋  | 10/13 [00:03<00:00,  3.75it/s][A
100%|██████████| 13/13 [00:03<00:00,  3.59it/s][A
Epochs:  76%|███████▋  | 52/68 [24:12<07:11, 26.98s/it]

Val Loss: 0.2035 - Val Accuracy: 0.9098



Training:   0%|          | 0/103 [00:00<?, ?it/s][A
Training:   1%|          | 1/103 [00:01<02:02,  1.21s/it][A
Training:   3%|▎         | 3/103 [00:01<00:35,  2.84it/s][A
Training:   5%|▍         | 5/103 [00:02<00:37,  2.62it/s][A
Training:   6%|▌         | 6/103 [00:02<00:30,  3.20it/s][A
Training:   8%|▊         | 8/103 [00:02<00:18,  5.02it/s][A
Training:  10%|▉         | 10/103 [00:02<00:22,  4.20it/s][A
Training:  12%|█▏        | 12/103 [00:03<00:16,  5.67it/s][A
Training:  14%|█▎        | 14/103 [00:03<00:21,  4.12it/s][A
Training:  16%|█▌        | 16/103 [00:03<00:16,  5.38it/s][A
Training:  17%|█▋        | 18/103 [00:04<00:22,  3.72it/s][A
Training:  20%|██        | 21/103 [00:05<00:23,  3.49it/s][A
Training:  23%|██▎       | 24/103 [00:05<00:15,  5.08it/s][A
Training:  25%|██▌       | 26/103 [00:06<00:18,  4.14it/s][A
Training:  28%|██▊       | 29/103 [00:07<00:18,  4.05it/s][A
Training:  29%|██▉       | 30/103 [00:07<00:17,  4.29it/s][A
Training:  32%|███▏  

Epoch: 53/68 - Loss: 0.1476 - Accuracy: 0.9418



  0%|          | 0/13 [00:00<?, ?it/s][A
  8%|▊         | 1/13 [00:01<00:15,  1.29s/it][A
 38%|███▊      | 5/13 [00:02<00:02,  2.70it/s][A
 69%|██████▉   | 9/13 [00:02<00:01,  3.51it/s][A
100%|██████████| 13/13 [00:03<00:00,  3.58it/s][A
Epochs:  78%|███████▊  | 53/68 [24:39<06:45, 27.03s/it]

Val Loss: 0.1590 - Val Accuracy: 0.9399



Training:   0%|          | 0/103 [00:00<?, ?it/s][A
Training:   1%|          | 1/103 [00:01<02:21,  1.39s/it][A
Training:   2%|▏         | 2/103 [00:01<01:08,  1.49it/s][A
Training:   4%|▍         | 4/103 [00:01<00:28,  3.47it/s][A
Training:   5%|▍         | 5/103 [00:02<00:36,  2.65it/s][A
Training:   6%|▌         | 6/103 [00:02<00:30,  3.14it/s][A
Training:   8%|▊         | 8/103 [00:02<00:19,  4.82it/s][A
Training:   9%|▊         | 9/103 [00:03<00:29,  3.16it/s][A
Training:  10%|▉         | 10/103 [00:03<00:24,  3.80it/s][A
Training:  12%|█▏        | 12/103 [00:03<00:16,  5.62it/s][A
Training:  13%|█▎        | 13/103 [00:04<00:25,  3.53it/s][A
Training:  14%|█▎        | 14/103 [00:04<00:21,  4.05it/s][A
Training:  17%|█▋        | 17/103 [00:05<00:21,  3.96it/s][A
Training:  17%|█▋        | 18/103 [00:05<00:19,  4.26it/s][A
Training:  20%|██        | 21/103 [00:05<00:19,  4.13it/s][A
Training:  21%|██▏       | 22/103 [00:06<00:19,  4.10it/s][A
Training:  23%|██▎     

Epoch: 54/68 - Loss: 0.1456 - Accuracy: 0.9422



  0%|          | 0/13 [00:00<?, ?it/s][A
  8%|▊         | 1/13 [00:01<00:15,  1.29s/it][A
 38%|███▊      | 5/13 [00:02<00:03,  2.59it/s][A
 62%|██████▏   | 8/13 [00:02<00:01,  4.52it/s][A
 77%|███████▋  | 10/13 [00:03<00:00,  3.29it/s][A
100%|██████████| 13/13 [00:03<00:00,  3.33it/s][A
Epochs:  79%|███████▉  | 54/68 [25:07<06:22, 27.29s/it]

Val Loss: 0.1999 - Val Accuracy: 0.9209



Training:   0%|          | 0/103 [00:00<?, ?it/s][A
Training:   1%|          | 1/103 [00:01<01:54,  1.12s/it][A
Training:   4%|▍         | 4/103 [00:01<00:24,  4.03it/s][A
Training:   6%|▌         | 6/103 [00:02<00:31,  3.05it/s][A
Training:   9%|▊         | 9/103 [00:03<00:29,  3.17it/s][A
Training:  12%|█▏        | 12/103 [00:03<00:18,  5.00it/s][A
Training:  14%|█▎        | 14/103 [00:03<00:22,  4.04it/s][A
Training:  16%|█▌        | 16/103 [00:04<00:18,  4.77it/s][A
Training:  17%|█▋        | 18/103 [00:04<00:19,  4.38it/s][A
Training:  18%|█▊        | 19/103 [00:04<00:18,  4.54it/s][A
Training:  20%|██        | 21/103 [00:05<00:19,  4.27it/s][A
Training:  22%|██▏       | 23/103 [00:05<00:15,  5.06it/s][A
Training:  23%|██▎       | 24/103 [00:05<00:14,  5.36it/s][A
Training:  24%|██▍       | 25/103 [00:06<00:19,  4.09it/s][A
Training:  26%|██▌       | 27/103 [00:06<00:15,  4.90it/s][A
Training:  28%|██▊       | 29/103 [00:07<00:19,  3.88it/s][A
Training:  30%|███  

Epoch: 55/68 - Loss: 0.1457 - Accuracy: 0.9411



  0%|          | 0/13 [00:00<?, ?it/s][A
  8%|▊         | 1/13 [00:01<00:13,  1.14s/it][A
 15%|█▌        | 2/13 [00:01<00:05,  1.87it/s][A
 23%|██▎       | 3/13 [00:01<00:03,  2.78it/s][A
 38%|███▊      | 5/13 [00:02<00:02,  3.07it/s][A
 46%|████▌     | 6/13 [00:02<00:01,  3.66it/s][A
 69%|██████▉   | 9/13 [00:02<00:01,  3.66it/s][A
 77%|███████▋  | 10/13 [00:03<00:00,  4.22it/s][A
100%|██████████| 13/13 [00:03<00:00,  3.48it/s][A
Epochs:  81%|████████  | 55/68 [25:34<05:55, 27.33s/it]

Val Loss: 0.1582 - Val Accuracy: 0.9383



Training:   0%|          | 0/103 [00:00<?, ?it/s][A
Training:   1%|          | 1/103 [00:01<01:48,  1.06s/it][A
Training:   2%|▏         | 2/103 [00:01<00:53,  1.89it/s][A
Training:   4%|▍         | 4/103 [00:01<00:23,  4.28it/s][A
Training:   6%|▌         | 6/103 [00:01<00:25,  3.75it/s][A
Training:   9%|▊         | 9/103 [00:02<00:25,  3.63it/s][A
Training:  11%|█         | 11/103 [00:02<00:19,  4.79it/s][A
Training:  13%|█▎        | 13/103 [00:03<00:25,  3.55it/s][A
Training:  15%|█▍        | 15/103 [00:03<00:18,  4.73it/s][A
Training:  17%|█▋        | 17/103 [00:04<00:21,  4.08it/s][A
Training:  17%|█▋        | 18/103 [00:04<00:20,  4.22it/s][A
Training:  20%|██        | 21/103 [00:05<00:17,  4.81it/s][A
Training:  21%|██▏       | 22/103 [00:05<00:16,  4.85it/s][A
Training:  24%|██▍       | 25/103 [00:06<00:15,  5.17it/s][A
Training:  25%|██▌       | 26/103 [00:06<00:15,  5.02it/s][A
Training:  28%|██▊       | 29/103 [00:06<00:13,  5.36it/s][A
Training:  29%|██▉   

Epoch: 56/68 - Loss: 0.1451 - Accuracy: 0.9430



  0%|          | 0/13 [00:00<?, ?it/s][A
  8%|▊         | 1/13 [00:01<00:15,  1.28s/it][A
 31%|███       | 4/13 [00:01<00:02,  3.62it/s][A
 46%|████▌     | 6/13 [00:02<00:02,  2.96it/s][A
 62%|██████▏   | 8/13 [00:02<00:01,  4.33it/s][A
 77%|███████▋  | 10/13 [00:03<00:00,  3.40it/s][A
100%|██████████| 13/13 [00:03<00:00,  3.55it/s][A
Epochs:  82%|████████▏ | 56/68 [26:01<05:26, 27.18s/it]

Val Loss: 0.1545 - Val Accuracy: 0.9390



Training:   0%|          | 0/103 [00:00<?, ?it/s][A
Training:   1%|          | 1/103 [00:01<02:08,  1.26s/it][A
Training:   5%|▍         | 5/103 [00:02<00:37,  2.64it/s][A
Training:   6%|▌         | 6/103 [00:02<00:31,  3.11it/s][A
Training:   8%|▊         | 8/103 [00:02<00:21,  4.49it/s][A
Training:   9%|▊         | 9/103 [00:02<00:27,  3.48it/s][A
Training:  10%|▉         | 10/103 [00:03<00:24,  3.85it/s][A
Training:  12%|█▏        | 12/103 [00:03<00:16,  5.59it/s][A
Training:  13%|█▎        | 13/103 [00:03<00:24,  3.64it/s][A
Training:  15%|█▍        | 15/103 [00:03<00:16,  5.30it/s][A
Training:  17%|█▋        | 17/103 [00:04<00:20,  4.29it/s][A
Training:  17%|█▋        | 18/103 [00:04<00:18,  4.64it/s][A
Training:  20%|██        | 21/103 [00:05<00:18,  4.52it/s][A
Training:  21%|██▏       | 22/103 [00:05<00:16,  5.00it/s][A
Training:  23%|██▎       | 24/103 [00:05<00:12,  6.54it/s][A
Training:  25%|██▌       | 26/103 [00:06<00:18,  4.07it/s][A
Training:  27%|██▋   

Epoch: 57/68 - Loss: 0.1380 - Accuracy: 0.9446



  0%|          | 0/13 [00:00<?, ?it/s][A
  8%|▊         | 1/13 [00:01<00:13,  1.11s/it][A
 23%|██▎       | 3/13 [00:01<00:03,  3.03it/s][A
 38%|███▊      | 5/13 [00:01<00:02,  2.82it/s][A
 46%|████▌     | 6/13 [00:02<00:02,  3.27it/s][A
 62%|██████▏   | 8/13 [00:02<00:00,  5.12it/s][A
 77%|███████▋  | 10/13 [00:03<00:00,  3.40it/s][A
100%|██████████| 13/13 [00:03<00:00,  3.54it/s][A
Epochs:  84%|████████▍ | 57/68 [26:28<04:57, 27.07s/it]

Val Loss: 0.1520 - Val Accuracy: 0.9346



Training:   0%|          | 0/103 [00:00<?, ?it/s][A
Training:   1%|          | 1/103 [00:01<01:57,  1.15s/it][A
Training:   2%|▏         | 2/103 [00:01<00:54,  1.85it/s][A
Training:   4%|▍         | 4/103 [00:01<00:23,  4.23it/s][A
Training:   6%|▌         | 6/103 [00:02<00:29,  3.34it/s][A
Training:   9%|▊         | 9/103 [00:02<00:27,  3.45it/s][A
Training:  11%|█         | 11/103 [00:03<00:19,  4.61it/s][A
Training:  13%|█▎        | 13/103 [00:03<00:25,  3.48it/s][A
Training:  15%|█▍        | 15/103 [00:04<00:19,  4.55it/s][A
Training:  17%|█▋        | 17/103 [00:04<00:23,  3.59it/s][A
Training:  18%|█▊        | 19/103 [00:05<00:17,  4.77it/s][A
Training:  20%|██        | 21/103 [00:05<00:21,  3.73it/s][A
Training:  22%|██▏       | 23/103 [00:05<00:16,  4.78it/s][A
Training:  24%|██▍       | 25/103 [00:06<00:19,  3.98it/s][A
Training:  27%|██▋       | 28/103 [00:06<00:12,  5.81it/s][A
Training:  29%|██▉       | 30/103 [00:07<00:14,  5.14it/s][A
Training:  30%|███   

Epoch: 58/68 - Loss: 0.1422 - Accuracy: 0.9420



  0%|          | 0/13 [00:00<?, ?it/s][A
  8%|▊         | 1/13 [00:01<00:16,  1.37s/it][A
 23%|██▎       | 3/13 [00:01<00:04,  2.48it/s][A
 31%|███       | 4/13 [00:01<00:02,  3.09it/s][A
 38%|███▊      | 5/13 [00:02<00:03,  2.24it/s][A
 46%|████▌     | 6/13 [00:02<00:02,  2.87it/s][A
 62%|██████▏   | 8/13 [00:02<00:01,  4.63it/s][A
 69%|██████▉   | 9/13 [00:03<00:01,  3.08it/s][A
 77%|███████▋  | 10/13 [00:03<00:00,  3.64it/s][A
100%|██████████| 13/13 [00:04<00:00,  3.22it/s][A
Epochs:  85%|████████▌ | 58/68 [26:56<04:35, 27.53s/it]

Val Loss: 0.1524 - Val Accuracy: 0.9347



Training:   0%|          | 0/103 [00:00<?, ?it/s][A
Training:   1%|          | 1/103 [00:01<02:29,  1.47s/it][A
Training:   5%|▍         | 5/103 [00:02<00:41,  2.38it/s][A
Training:   9%|▊         | 9/103 [00:03<00:30,  3.10it/s][A
Training:  11%|█         | 11/103 [00:03<00:22,  4.05it/s][A
Training:  13%|█▎        | 13/103 [00:04<00:25,  3.48it/s][A
Training:  17%|█▋        | 17/103 [00:05<00:21,  3.97it/s][A
Training:  18%|█▊        | 19/103 [00:05<00:17,  4.80it/s][A
Training:  20%|██        | 21/103 [00:06<00:20,  3.96it/s][A
Training:  22%|██▏       | 23/103 [00:06<00:16,  4.94it/s][A
Training:  24%|██▍       | 25/103 [00:06<00:20,  3.80it/s][A
Training:  26%|██▌       | 27/103 [00:07<00:15,  4.88it/s][A
Training:  28%|██▊       | 29/103 [00:07<00:18,  4.04it/s][A
Training:  29%|██▉       | 30/103 [00:07<00:16,  4.37it/s][A
Training:  32%|███▏      | 33/103 [00:08<00:16,  4.25it/s][A
Training:  33%|███▎      | 34/103 [00:08<00:15,  4.55it/s][A
Training:  35%|███▍

Epoch: 59/68 - Loss: 0.1470 - Accuracy: 0.9416



  0%|          | 0/13 [00:00<?, ?it/s][A
  8%|▊         | 1/13 [00:01<00:15,  1.30s/it][A
 15%|█▌        | 2/13 [00:01<00:06,  1.66it/s][A
 38%|███▊      | 5/13 [00:02<00:02,  2.95it/s][A
 46%|████▌     | 6/13 [00:02<00:02,  3.31it/s][A
 69%|██████▉   | 9/13 [00:03<00:01,  3.74it/s][A
 77%|███████▋  | 10/13 [00:03<00:00,  4.06it/s][A
 85%|████████▍ | 11/13 [00:03<00:00,  4.52it/s][A
100%|██████████| 13/13 [00:03<00:00,  3.35it/s][A
Epochs:  87%|████████▋ | 59/68 [27:24<04:07, 27.53s/it]

Val Loss: 0.1760 - Val Accuracy: 0.9323



Training:   0%|          | 0/103 [00:00<?, ?it/s][A
Training:   1%|          | 1/103 [00:01<02:11,  1.29s/it][A
Training:   4%|▍         | 4/103 [00:01<00:28,  3.51it/s][A
Training:   6%|▌         | 6/103 [00:02<00:32,  2.95it/s][A
Training:   9%|▊         | 9/103 [00:03<00:29,  3.23it/s][A
Training:  11%|█         | 11/103 [00:03<00:22,  4.02it/s][A
Training:  13%|█▎        | 13/103 [00:04<00:27,  3.33it/s][A
Training:  15%|█▍        | 15/103 [00:04<00:20,  4.26it/s][A
Training:  17%|█▋        | 17/103 [00:05<00:24,  3.57it/s][A
Training:  18%|█▊        | 19/103 [00:05<00:18,  4.48it/s][A
Training:  19%|█▉        | 20/103 [00:05<00:16,  4.93it/s][A
Training:  20%|██        | 21/103 [00:05<00:22,  3.59it/s][A
Training:  22%|██▏       | 23/103 [00:06<00:17,  4.55it/s][A
Training:  24%|██▍       | 25/103 [00:06<00:18,  4.13it/s][A
Training:  26%|██▌       | 27/103 [00:07<00:20,  3.70it/s][A
Training:  28%|██▊       | 29/103 [00:07<00:18,  3.96it/s][A
Training:  30%|███  

Epoch: 60/68 - Loss: 0.1419 - Accuracy: 0.9438



  0%|          | 0/13 [00:00<?, ?it/s][A
  8%|▊         | 1/13 [00:01<00:14,  1.18s/it][A
 23%|██▎       | 3/13 [00:01<00:03,  2.81it/s][A
 31%|███       | 4/13 [00:01<00:03,  2.97it/s][A
 38%|███▊      | 5/13 [00:02<00:03,  2.41it/s][A
 54%|█████▍    | 7/13 [00:02<00:01,  3.94it/s][A
 62%|██████▏   | 8/13 [00:02<00:01,  3.96it/s][A
 69%|██████▉   | 9/13 [00:03<00:01,  2.97it/s][A
 85%|████████▍ | 11/13 [00:03<00:00,  4.70it/s][A
 92%|█████████▏| 12/13 [00:03<00:00,  3.96it/s][A
100%|██████████| 13/13 [00:03<00:00,  3.34it/s][A
Epochs:  88%|████████▊ | 60/68 [27:52<03:41, 27.64s/it]

Val Loss: 0.1582 - Val Accuracy: 0.9354



Training:   0%|          | 0/103 [00:00<?, ?it/s][A
Training:   1%|          | 1/103 [00:01<02:28,  1.46s/it][A
Training:   3%|▎         | 3/103 [00:01<00:41,  2.40it/s][A
Training:   5%|▍         | 5/103 [00:02<00:44,  2.23it/s][A
Training:   7%|▋         | 7/103 [00:02<00:26,  3.57it/s][A
Training:   9%|▊         | 9/103 [00:03<00:30,  3.10it/s][A
Training:  11%|█         | 11/103 [00:03<00:21,  4.35it/s][A
Training:  13%|█▎        | 13/103 [00:04<00:28,  3.18it/s][A
Training:  17%|█▋        | 17/103 [00:05<00:24,  3.56it/s][A
Training:  20%|██        | 21/103 [00:06<00:20,  3.96it/s][A
Training:  23%|██▎       | 24/103 [00:06<00:14,  5.27it/s][A
Training:  25%|██▌       | 26/103 [00:07<00:17,  4.32it/s][A
Training:  27%|██▋       | 28/103 [00:07<00:14,  5.28it/s][A
Training:  29%|██▉       | 30/103 [00:08<00:17,  4.08it/s][A
Training:  32%|███▏      | 33/103 [00:09<00:19,  3.66it/s][A
Training:  35%|███▍      | 36/103 [00:09<00:12,  5.19it/s][A
Training:  37%|███▋  

Epoch: 61/68 - Loss: 0.1393 - Accuracy: 0.9448



  0%|          | 0/13 [00:00<?, ?it/s][A
  8%|▊         | 1/13 [00:01<00:13,  1.10s/it][A
 23%|██▎       | 3/13 [00:01<00:03,  3.06it/s][A
 38%|███▊      | 5/13 [00:02<00:02,  2.71it/s][A
 54%|█████▍    | 7/13 [00:02<00:01,  4.22it/s][A
 69%|██████▉   | 9/13 [00:02<00:01,  3.41it/s][A
100%|██████████| 13/13 [00:03<00:00,  3.48it/s][A
Epochs:  90%|████████▉ | 61/68 [28:19<03:12, 27.56s/it]

Val Loss: 0.1566 - Val Accuracy: 0.9371



Training:   0%|          | 0/103 [00:00<?, ?it/s][A
Training:   1%|          | 1/103 [00:01<02:07,  1.25s/it][A
Training:   5%|▍         | 5/103 [00:02<00:39,  2.48it/s][A
Training:   7%|▋         | 7/103 [00:02<00:26,  3.60it/s][A
Training:   9%|▊         | 9/103 [00:03<00:29,  3.18it/s][A
Training:  12%|█▏        | 12/103 [00:03<00:18,  4.97it/s][A
Training:  14%|█▎        | 14/103 [00:04<00:23,  3.80it/s][A
Training:  16%|█▌        | 16/103 [00:04<00:17,  4.88it/s][A
Training:  17%|█▋        | 18/103 [00:05<00:23,  3.67it/s][A
Training:  20%|██        | 21/103 [00:06<00:22,  3.63it/s][A
Training:  23%|██▎       | 24/103 [00:06<00:15,  5.14it/s][A
Training:  25%|██▌       | 26/103 [00:07<00:20,  3.73it/s][A
Training:  28%|██▊       | 29/103 [00:07<00:20,  3.68it/s][A
Training:  31%|███       | 32/103 [00:08<00:13,  5.10it/s][A
Training:  33%|███▎      | 34/103 [00:08<00:16,  4.11it/s][A
Training:  35%|███▍      | 36/103 [00:08<00:13,  5.13it/s][A
Training:  37%|███▋ 

Epoch: 62/68 - Loss: 0.1377 - Accuracy: 0.9458



  0%|          | 0/13 [00:00<?, ?it/s][A
  8%|▊         | 1/13 [00:01<00:16,  1.35s/it][A
 23%|██▎       | 3/13 [00:01<00:03,  2.58it/s][A
 38%|███▊      | 5/13 [00:02<00:03,  2.51it/s][A
 46%|████▌     | 6/13 [00:02<00:02,  3.10it/s][A
 54%|█████▍    | 7/13 [00:02<00:01,  3.61it/s][A
 69%|██████▉   | 9/13 [00:03<00:01,  3.23it/s][A
 77%|███████▋  | 10/13 [00:03<00:00,  3.65it/s][A
 85%|████████▍ | 11/13 [00:03<00:00,  4.35it/s][A
100%|██████████| 13/13 [00:04<00:00,  3.11it/s][A
Epochs:  91%|█████████ | 62/68 [28:48<02:46, 27.83s/it]

Val Loss: 0.1704 - Val Accuracy: 0.9338



Training:   0%|          | 0/103 [00:00<?, ?it/s][A
Training:   1%|          | 1/103 [00:01<02:16,  1.33s/it][A
Training:   2%|▏         | 2/103 [00:01<01:08,  1.47it/s][A
Training:   5%|▍         | 5/103 [00:02<00:39,  2.46it/s][A
Training:   6%|▌         | 6/103 [00:02<00:33,  2.92it/s][A
Training:   9%|▊         | 9/103 [00:03<00:25,  3.67it/s][A
Training:  10%|▉         | 10/103 [00:03<00:24,  3.86it/s][A
Training:  13%|█▎        | 13/103 [00:04<00:22,  4.02it/s][A
Training:  14%|█▎        | 14/103 [00:04<00:22,  4.03it/s][A
Training:  16%|█▌        | 16/103 [00:04<00:15,  5.44it/s][A
Training:  17%|█▋        | 17/103 [00:05<00:21,  4.03it/s][A
Training:  17%|█▋        | 18/103 [00:05<00:22,  3.82it/s][A
Training:  19%|█▉        | 20/103 [00:05<00:15,  5.36it/s][A
Training:  20%|██        | 21/103 [00:06<00:21,  3.84it/s][A
Training:  21%|██▏       | 22/103 [00:06<00:22,  3.61it/s][A
Training:  24%|██▍       | 25/103 [00:06<00:19,  4.06it/s][A
Training:  25%|██▌   

Epoch: 63/68 - Loss: 0.1523 - Accuracy: 0.9418



  0%|          | 0/13 [00:00<?, ?it/s][A
  8%|▊         | 1/13 [00:01<00:12,  1.06s/it][A
 31%|███       | 4/13 [00:01<00:02,  4.25it/s][A
 46%|████▌     | 6/13 [00:02<00:02,  3.09it/s][A
 62%|██████▏   | 8/13 [00:02<00:01,  4.50it/s][A
 77%|███████▋  | 10/13 [00:02<00:00,  3.73it/s][A
 92%|█████████▏| 12/13 [00:03<00:00,  4.79it/s][A
100%|██████████| 13/13 [00:03<00:00,  3.55it/s][A
Epochs:  93%|█████████▎| 63/68 [29:16<02:19, 27.89s/it]

Val Loss: 0.1598 - Val Accuracy: 0.9348



Training:   0%|          | 0/103 [00:00<?, ?it/s][A
Training:   1%|          | 1/103 [00:01<02:10,  1.28s/it][A
Training:   2%|▏         | 2/103 [00:01<00:59,  1.70it/s][A
Training:   4%|▍         | 4/103 [00:01<00:26,  3.67it/s][A
Training:   5%|▍         | 5/103 [00:02<00:40,  2.42it/s][A
Training:   7%|▋         | 7/103 [00:02<00:25,  3.83it/s][A
Training:   9%|▊         | 9/103 [00:03<00:33,  2.83it/s][A
Training:  10%|▉         | 10/103 [00:03<00:27,  3.37it/s][A
Training:  12%|█▏        | 12/103 [00:03<00:18,  4.92it/s][A
Training:  14%|█▎        | 14/103 [00:04<00:24,  3.63it/s][A
Training:  16%|█▌        | 16/103 [00:04<00:17,  4.99it/s][A
Training:  17%|█▋        | 18/103 [00:05<00:22,  3.70it/s][A
Training:  19%|█▉        | 20/103 [00:05<00:16,  4.92it/s][A
Training:  21%|██▏       | 22/103 [00:06<00:22,  3.63it/s][A
Training:  23%|██▎       | 24/103 [00:06<00:16,  4.85it/s][A
Training:  25%|██▌       | 26/103 [00:07<00:20,  3.69it/s][A
Training:  28%|██▊    

Epoch: 64/68 - Loss: 0.1375 - Accuracy: 0.9451



  0%|          | 0/13 [00:00<?, ?it/s][A
  8%|▊         | 1/13 [00:01<00:13,  1.16s/it][A
 23%|██▎       | 3/13 [00:01<00:03,  2.95it/s][A
 38%|███▊      | 5/13 [00:01<00:02,  3.25it/s][A
 62%|██████▏   | 8/13 [00:01<00:00,  5.96it/s][A
 77%|███████▋  | 10/13 [00:02<00:00,  4.40it/s][A
100%|██████████| 13/13 [00:03<00:00,  3.97it/s][A
Epochs:  94%|█████████▍| 64/68 [29:42<01:49, 27.44s/it]

Val Loss: 0.1571 - Val Accuracy: 0.9406



Training:   0%|          | 0/103 [00:00<?, ?it/s][A
Training:   1%|          | 1/103 [00:01<02:05,  1.23s/it][A
Training:   2%|▏         | 2/103 [00:01<00:57,  1.76it/s][A
Training:   4%|▍         | 4/103 [00:01<00:24,  4.09it/s][A
Training:   6%|▌         | 6/103 [00:02<00:27,  3.54it/s][A
Training:   8%|▊         | 8/103 [00:02<00:21,  4.49it/s][A
Training:   9%|▊         | 9/103 [00:02<00:27,  3.43it/s][A
Training:  11%|█         | 11/103 [00:03<00:19,  4.79it/s][A
Training:  12%|█▏        | 12/103 [00:03<00:19,  4.74it/s][A
Training:  13%|█▎        | 13/103 [00:03<00:26,  3.44it/s][A
Training:  15%|█▍        | 15/103 [00:03<00:18,  4.86it/s][A
Training:  16%|█▌        | 16/103 [00:04<00:18,  4.62it/s][A
Training:  17%|█▋        | 17/103 [00:04<00:26,  3.23it/s][A
Training:  18%|█▊        | 19/103 [00:04<00:17,  4.83it/s][A
Training:  20%|██        | 21/103 [00:05<00:21,  3.78it/s][A
Training:  21%|██▏       | 22/103 [00:05<00:19,  4.16it/s][A
Training:  24%|██▍    

Epoch: 65/68 - Loss: 0.1333 - Accuracy: 0.9492



  0%|          | 0/13 [00:00<?, ?it/s][A
  8%|▊         | 1/13 [00:01<00:13,  1.11s/it][A
 23%|██▎       | 3/13 [00:01<00:03,  2.95it/s][A
 38%|███▊      | 5/13 [00:01<00:02,  3.16it/s][A
 54%|█████▍    | 7/13 [00:02<00:01,  4.35it/s][A
 69%|██████▉   | 9/13 [00:02<00:01,  3.91it/s][A
 85%|████████▍ | 11/13 [00:02<00:00,  5.29it/s][A
100%|██████████| 13/13 [00:03<00:00,  3.85it/s][A
Epochs:  96%|█████████▌| 65/68 [30:10<01:22, 27.64s/it]

Val Loss: 0.1820 - Val Accuracy: 0.9304



Training:   0%|          | 0/103 [00:00<?, ?it/s][A
Training:   1%|          | 1/103 [00:01<01:57,  1.16s/it][A
Training:   4%|▍         | 4/103 [00:01<00:24,  4.00it/s][A
Training:   6%|▌         | 6/103 [00:02<00:33,  2.91it/s][A
Training:   9%|▊         | 9/103 [00:03<00:31,  2.99it/s][A
Training:  13%|█▎        | 13/103 [00:04<00:25,  3.56it/s][A
Training:  16%|█▌        | 16/103 [00:04<00:17,  5.03it/s][A
Training:  17%|█▋        | 18/103 [00:05<00:21,  3.87it/s][A
Training:  19%|█▉        | 20/103 [00:05<00:17,  4.81it/s][A
Training:  21%|██▏       | 22/103 [00:05<00:20,  3.99it/s][A
Training:  23%|██▎       | 24/103 [00:06<00:15,  5.08it/s][A
Training:  25%|██▌       | 26/103 [00:06<00:19,  3.94it/s][A
Training:  28%|██▊       | 29/103 [00:07<00:19,  3.82it/s][A
Training:  30%|███       | 31/103 [00:07<00:14,  4.80it/s][A
Training:  32%|███▏      | 33/103 [00:08<00:16,  4.14it/s][A
Training:  35%|███▍      | 36/103 [00:08<00:11,  5.90it/s][A
Training:  37%|███▋ 

Epoch: 66/68 - Loss: 0.1399 - Accuracy: 0.9440



  0%|          | 0/13 [00:00<?, ?it/s][A
  8%|▊         | 1/13 [00:01<00:14,  1.19s/it][A
 38%|███▊      | 5/13 [00:02<00:03,  2.54it/s][A
 62%|██████▏   | 8/13 [00:02<00:01,  4.47it/s][A
 77%|███████▋  | 10/13 [00:02<00:00,  3.91it/s][A
100%|██████████| 13/13 [00:03<00:00,  3.54it/s][A
Epochs:  97%|█████████▋| 66/68 [30:38<00:55, 27.73s/it]

Val Loss: 0.1502 - Val Accuracy: 0.9378



Training:   0%|          | 0/103 [00:00<?, ?it/s][A
Training:   1%|          | 1/103 [00:01<02:31,  1.49s/it][A
Training:   5%|▍         | 5/103 [00:02<00:39,  2.46it/s][A
Training:   6%|▌         | 6/103 [00:02<00:32,  2.98it/s][A
Training:   8%|▊         | 8/103 [00:02<00:22,  4.23it/s][A
Training:   9%|▊         | 9/103 [00:03<00:32,  2.87it/s][A
Training:  10%|▉         | 10/103 [00:03<00:27,  3.43it/s][A
Training:  12%|█▏        | 12/103 [00:03<00:17,  5.08it/s][A
Training:  14%|█▎        | 14/103 [00:04<00:24,  3.67it/s][A
Training:  16%|█▌        | 16/103 [00:04<00:17,  4.97it/s][A
Training:  17%|█▋        | 18/103 [00:05<00:24,  3.51it/s][A
Training:  20%|██        | 21/103 [00:06<00:22,  3.73it/s][A
Training:  22%|██▏       | 23/103 [00:06<00:16,  4.79it/s][A
Training:  24%|██▍       | 25/103 [00:07<00:19,  3.90it/s][A
Training:  25%|██▌       | 26/103 [00:07<00:17,  4.30it/s][A
Training:  28%|██▊       | 29/103 [00:07<00:16,  4.38it/s][A
Training:  29%|██▉   

Epoch: 67/68 - Loss: 0.1362 - Accuracy: 0.9467



  0%|          | 0/13 [00:00<?, ?it/s][A
  8%|▊         | 1/13 [00:01<00:13,  1.11s/it][A
 38%|███▊      | 5/13 [00:02<00:02,  2.74it/s][A
 54%|█████▍    | 7/13 [00:02<00:01,  4.00it/s][A
 69%|██████▉   | 9/13 [00:03<00:01,  3.24it/s][A
100%|██████████| 13/13 [00:03<00:00,  3.44it/s][A
Epochs:  99%|█████████▊| 67/68 [31:06<00:27, 27.70s/it]

Val Loss: 0.1578 - Val Accuracy: 0.9338



Training:   0%|          | 0/103 [00:00<?, ?it/s][A
Training:   1%|          | 1/103 [00:01<01:44,  1.03s/it][A
Training:   3%|▎         | 3/103 [00:01<00:32,  3.09it/s][A
Training:   5%|▍         | 5/103 [00:01<00:35,  2.74it/s][A
Training:   7%|▋         | 7/103 [00:02<00:23,  4.08it/s][A
Training:   9%|▊         | 9/103 [00:03<00:30,  3.12it/s][A
Training:  12%|█▏        | 12/103 [00:03<00:18,  4.99it/s][A
Training:  14%|█▎        | 14/103 [00:03<00:22,  3.89it/s][A
Training:  17%|█▋        | 17/103 [00:04<00:22,  3.90it/s][A
Training:  18%|█▊        | 19/103 [00:04<00:17,  4.79it/s][A
Training:  20%|██        | 21/103 [00:05<00:22,  3.65it/s][A
Training:  21%|██▏       | 22/103 [00:05<00:19,  4.07it/s][A
Training:  23%|██▎       | 24/103 [00:06<00:14,  5.43it/s][A
Training:  25%|██▌       | 26/103 [00:06<00:18,  4.11it/s][A
Training:  26%|██▌       | 27/103 [00:06<00:18,  4.20it/s][A
Training:  28%|██▊       | 29/103 [00:07<00:18,  3.96it/s][A
Training:  29%|██▉   

Epoch: 68/68 - Loss: 0.1419 - Accuracy: 0.9463



  0%|          | 0/13 [00:00<?, ?it/s][A
  8%|▊         | 1/13 [00:00<00:11,  1.06it/s][A
 23%|██▎       | 3/13 [00:01<00:02,  3.38it/s][A
 38%|███▊      | 5/13 [00:01<00:02,  3.45it/s][A
 46%|████▌     | 6/13 [00:01<00:01,  3.97it/s][A
 69%|██████▉   | 9/13 [00:02<00:00,  4.19it/s][A
 77%|███████▋  | 10/13 [00:02<00:00,  4.14it/s][A
100%|██████████| 13/13 [00:03<00:00,  4.12it/s][A
Epochs: 100%|██████████| 68/68 [31:33<00:00, 27.85s/it]


Val Loss: 0.1400 - Val Accuracy: 0.9405
Saving best model...


[32m[I 2023-12-14 22:47:38,779][0m Trial 0 finished with value: 0.9404857158660889 and parameters: {'learning_rate': 0.0033208789761545975, 'weight_decay': 0.002976249303166988, 'epsilon': 8.228177962798885e-08, 'batch_size': 136, 'epochs': 68}. Best is trial 0 with value: 0.9404857158660889.[0m


Learning rate: 0.0008620992852806465
Weight decay: 0.0007106239797227544
Epsilon: 8.116463668208938e-09
Batch size: 232
Number of epochs: 63


Epochs:   0%|          | 0/63 [00:00<?, ?it/s]
Training:   0%|          | 0/61 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/61 [00:01<01:44,  1.75s/it][A
Training:   3%|▎         | 2/61 [00:01<00:49,  1.18it/s][A
Training:   7%|▋         | 4/61 [00:02<00:20,  2.81it/s][A
Training:   8%|▊         | 5/61 [00:03<00:32,  1.74it/s][A
Training:  10%|▉         | 6/61 [00:03<00:28,  1.92it/s][A
Training:  13%|█▎        | 8/61 [00:03<00:16,  3.24it/s][A
Training:  15%|█▍        | 9/61 [00:05<00:31,  1.64it/s][A
Training:  16%|█▋        | 10/61 [00:05<00:30,  1.69it/s][A
Training:  20%|█▉        | 12/61 [00:05<00:17,  2.74it/s][A
Training:  21%|██▏       | 13/61 [00:06<00:21,  2.22it/s][A
Training:  23%|██▎       | 14/61 [00:07<00:24,  1.90it/s][A
Training:  25%|██▍       | 15/61 [00:07<00:19,  2.42it/s][A
Training:  28%|██▊       | 17/61 [00:08<00:16,  2.70it/s][A
Training:  30%|██▉       | 18/61 [00:08<00:20,  2.12it/s][A
Training:  33%|███▎      | 20/61 [00:08<00:12,  3.29it

Epoch: 1/63 - Loss: 0.4347 - Accuracy: 0.7973



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:02<00:14,  2.07s/it][A
 38%|███▊      | 3/8 [00:02<00:02,  1.73it/s][A
 62%|██████▎   | 5/8 [00:03<00:01,  1.62it/s][A
100%|██████████| 8/8 [00:03<00:00,  2.10it/s][A
Epochs:   2%|▏         | 1/63 [00:27<28:15, 27.34s/it]

Val Loss: 0.2681 - Val Accuracy: 0.8944



Training:   0%|          | 0/61 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/61 [00:01<01:43,  1.73s/it][A
Training:   3%|▎         | 2/61 [00:01<00:47,  1.24it/s][A
Training:   8%|▊         | 5/61 [00:03<00:27,  2.00it/s][A
Training:  11%|█▏        | 7/61 [00:03<00:17,  3.04it/s][A
Training:  15%|█▍        | 9/61 [00:04<00:27,  1.88it/s][A
Training:  16%|█▋        | 10/61 [00:05<00:22,  2.25it/s][A
Training:  18%|█▊        | 11/61 [00:05<00:18,  2.73it/s][A
Training:  21%|██▏       | 13/61 [00:06<00:21,  2.24it/s][A
Training:  23%|██▎       | 14/61 [00:06<00:20,  2.26it/s][A
Training:  26%|██▌       | 16/61 [00:06<00:13,  3.34it/s][A
Training:  28%|██▊       | 17/61 [00:07<00:19,  2.22it/s][A
Training:  30%|██▉       | 18/61 [00:08<00:17,  2.40it/s][A
Training:  31%|███       | 19/61 [00:08<00:14,  2.95it/s][A
Training:  34%|███▍      | 21/61 [00:09<00:16,  2.47it/s][A
Training:  36%|███▌      | 22/61 [00:09<00:15,  2.53it/s][A
Training:  39%|███▉      | 24/61 [00:

Epoch: 2/63 - Loss: 0.2254 - Accuracy: 0.9079



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:12,  1.83s/it][A
 38%|███▊      | 3/8 [00:01<00:02,  1.91it/s][A
 62%|██████▎   | 5/8 [00:03<00:02,  1.48it/s][A
100%|██████████| 8/8 [00:03<00:00,  2.08it/s][A
Epochs:   3%|▎         | 2/63 [00:54<27:56, 27.49s/it]

Val Loss: 0.1980 - Val Accuracy: 0.9170



Training:   0%|          | 0/61 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/61 [00:01<01:46,  1.78s/it][A
Training:   3%|▎         | 2/61 [00:01<00:48,  1.22it/s][A
Training:   7%|▋         | 4/61 [00:02<00:20,  2.77it/s][A
Training:   8%|▊         | 5/61 [00:03<00:38,  1.47it/s][A
Training:  10%|▉         | 6/61 [00:03<00:31,  1.76it/s][A
Training:  15%|█▍        | 9/61 [00:05<00:24,  2.12it/s][A
Training:  16%|█▋        | 10/61 [00:05<00:24,  2.08it/s][A
Training:  18%|█▊        | 11/61 [00:05<00:19,  2.53it/s][A
Training:  20%|█▉        | 12/61 [00:05<00:15,  3.09it/s][A
Training:  21%|██▏       | 13/61 [00:06<00:23,  2.07it/s][A
Training:  23%|██▎       | 14/61 [00:06<00:19,  2.40it/s][A
Training:  26%|██▌       | 16/61 [00:07<00:11,  3.84it/s][A
Training:  28%|██▊       | 17/61 [00:08<00:20,  2.11it/s][A
Training:  30%|██▉       | 18/61 [00:08<00:17,  2.45it/s][A
Training:  33%|███▎      | 20/61 [00:08<00:10,  3.78it/s][A
Training:  34%|███▍      | 21/61 [00:0

Epoch: 3/63 - Loss: 0.1869 - Accuracy: 0.9234



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:02<00:15,  2.28s/it][A
 25%|██▌       | 2/8 [00:02<00:05,  1.00it/s][A
 38%|███▊      | 3/8 [00:02<00:03,  1.59it/s][A
 62%|██████▎   | 5/8 [00:03<00:01,  1.78it/s][A
100%|██████████| 8/8 [00:03<00:00,  2.11it/s][A
Epochs:   5%|▍         | 3/63 [01:22<27:25, 27.43s/it]

Val Loss: 0.1777 - Val Accuracy: 0.9234



Training:   0%|          | 0/61 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/61 [00:02<02:36,  2.61s/it][A
Training:   5%|▍         | 3/61 [00:02<00:42,  1.35it/s][A
Training:   8%|▊         | 5/61 [00:04<00:37,  1.48it/s][A
Training:  11%|█▏        | 7/61 [00:04<00:22,  2.41it/s][A
Training:  15%|█▍        | 9/61 [00:05<00:26,  1.93it/s][A
Training:  18%|█▊        | 11/61 [00:05<00:17,  2.79it/s][A
Training:  21%|██▏       | 13/61 [00:07<00:24,  1.94it/s][A
Training:  23%|██▎       | 14/61 [00:07<00:20,  2.29it/s][A
Training:  25%|██▍       | 15/61 [00:07<00:16,  2.74it/s][A
Training:  26%|██▌       | 16/61 [00:07<00:14,  3.20it/s][A
Training:  28%|██▊       | 17/61 [00:08<00:23,  1.84it/s][A
Training:  30%|██▉       | 18/61 [00:08<00:18,  2.33it/s][A
Training:  34%|███▍      | 21/61 [00:10<00:18,  2.14it/s][A
Training:  41%|████      | 25/61 [00:12<00:15,  2.32it/s][A
Training:  44%|████▍     | 27/61 [00:12<00:11,  2.97it/s][A
Training:  48%|████▊     | 29/61 [00:

Epoch: 4/63 - Loss: 0.1706 - Accuracy: 0.9301



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:13,  1.97s/it][A
 25%|██▌       | 2/8 [00:02<00:05,  1.14it/s][A
 38%|███▊      | 3/8 [00:02<00:03,  1.59it/s][A
 62%|██████▎   | 5/8 [00:03<00:01,  1.71it/s][A
100%|██████████| 8/8 [00:03<00:00,  2.04it/s][A
Epochs:   6%|▋         | 4/63 [01:49<26:51, 27.31s/it]

Val Loss: 0.1625 - Val Accuracy: 0.9308



Training:   0%|          | 0/61 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/61 [00:01<01:58,  1.98s/it][A
Training:   5%|▍         | 3/61 [00:02<00:39,  1.45it/s][A
Training:   8%|▊         | 5/61 [00:03<00:33,  1.67it/s][A
Training:  10%|▉         | 6/61 [00:03<00:25,  2.14it/s][A
Training:  11%|█▏        | 7/61 [00:03<00:23,  2.32it/s][A
Training:  13%|█▎        | 8/61 [00:04<00:18,  2.93it/s][A
Training:  15%|█▍        | 9/61 [00:04<00:24,  2.11it/s][A
Training:  18%|█▊        | 11/61 [00:05<00:18,  2.74it/s][A
Training:  21%|██▏       | 13/61 [00:06<00:18,  2.55it/s][A
Training:  23%|██▎       | 14/61 [00:06<00:15,  3.02it/s][A
Training:  25%|██▍       | 15/61 [00:06<00:17,  2.63it/s][A
Training:  28%|██▊       | 17/61 [00:07<00:17,  2.56it/s][A
Training:  30%|██▉       | 18/61 [00:07<00:14,  3.02it/s][A
Training:  31%|███       | 19/61 [00:08<00:15,  2.78it/s][A
Training:  34%|███▍      | 21/61 [00:09<00:19,  2.09it/s][A
Training:  38%|███▊      | 23/61 [00:09

Epoch: 5/63 - Loss: 0.1677 - Accuracy: 0.9320



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:02<00:17,  2.54s/it][A
 50%|█████     | 4/8 [00:02<00:02,  1.89it/s][A
 62%|██████▎   | 5/8 [00:03<00:01,  1.52it/s][A
100%|██████████| 8/8 [00:04<00:00,  1.97it/s][A
Epochs:   8%|▊         | 5/63 [02:17<26:30, 27.41s/it]

Val Loss: 0.1689 - Val Accuracy: 0.9303



Training:   0%|          | 0/61 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/61 [00:02<02:28,  2.47s/it][A
Training:   5%|▍         | 3/61 [00:02<00:40,  1.43it/s][A
Training:   8%|▊         | 5/61 [00:04<00:38,  1.44it/s][A
Training:  11%|█▏        | 7/61 [00:04<00:23,  2.34it/s][A
Training:  15%|█▍        | 9/61 [00:05<00:27,  1.90it/s][A
Training:  18%|█▊        | 11/61 [00:05<00:18,  2.73it/s][A
Training:  21%|██▏       | 13/61 [00:07<00:22,  2.15it/s][A
Training:  23%|██▎       | 14/61 [00:07<00:18,  2.49it/s][A
Training:  25%|██▍       | 15/61 [00:07<00:15,  2.96it/s][A
Training:  26%|██▌       | 16/61 [00:07<00:12,  3.52it/s][A
Training:  28%|██▊       | 17/61 [00:08<00:23,  1.91it/s][A
Training:  31%|███       | 19/61 [00:08<00:14,  2.96it/s][A
Training:  34%|███▍      | 21/61 [00:09<00:17,  2.23it/s][A
Training:  39%|███▉      | 24/61 [00:10<00:09,  3.74it/s][A
Training:  43%|████▎     | 26/61 [00:11<00:14,  2.38it/s][A
Training:  48%|████▊     | 29/61 [00:

Epoch: 6/63 - Loss: 0.1610 - Accuracy: 0.9344



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:12,  1.81s/it][A
 25%|██▌       | 2/8 [00:02<00:05,  1.13it/s][A
 38%|███▊      | 3/8 [00:02<00:02,  1.86it/s][A
 62%|██████▎   | 5/8 [00:03<00:01,  1.87it/s][A
100%|██████████| 8/8 [00:03<00:00,  2.19it/s][A
Epochs:  10%|▉         | 6/63 [02:44<26:00, 27.38s/it]

Val Loss: 0.1594 - Val Accuracy: 0.9330



Training:   0%|          | 0/61 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/61 [00:01<01:58,  1.97s/it][A
Training:   3%|▎         | 2/61 [00:02<00:52,  1.13it/s][A
Training:   8%|▊         | 5/61 [00:03<00:32,  1.74it/s][A
Training:  15%|█▍        | 9/61 [00:05<00:24,  2.12it/s][A
Training:  16%|█▋        | 10/61 [00:05<00:21,  2.42it/s][A
Training:  20%|█▉        | 12/61 [00:05<00:14,  3.31it/s][A
Training:  21%|██▏       | 13/61 [00:06<00:23,  2.01it/s][A
Training:  25%|██▍       | 15/61 [00:06<00:15,  2.93it/s][A
Training:  28%|██▊       | 17/61 [00:07<00:18,  2.37it/s][A
Training:  33%|███▎      | 20/61 [00:08<00:10,  3.79it/s][A
Training:  36%|███▌      | 22/61 [00:09<00:14,  2.60it/s][A
Training:  39%|███▉      | 24/61 [00:09<00:10,  3.42it/s][A
Training:  43%|████▎     | 26/61 [00:11<00:15,  2.33it/s][A
Training:  46%|████▌     | 28/61 [00:11<00:10,  3.09it/s][A
Training:  48%|████▊     | 29/61 [00:12<00:15,  2.07it/s][A
Training:  49%|████▉     | 30/61 [00

Epoch: 7/63 - Loss: 0.1624 - Accuracy: 0.9330



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:02<00:16,  2.30s/it][A
 38%|███▊      | 3/8 [00:02<00:03,  1.57it/s][A
 62%|██████▎   | 5/8 [00:03<00:01,  1.63it/s][A
100%|██████████| 8/8 [00:03<00:00,  2.10it/s][A
Epochs:  11%|█         | 7/63 [03:11<25:24, 27.22s/it]

Val Loss: 0.1484 - Val Accuracy: 0.9361



Training:   0%|          | 0/61 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/61 [00:01<01:58,  1.98s/it][A
Training:   5%|▍         | 3/61 [00:02<00:32,  1.80it/s][A
Training:   8%|▊         | 5/61 [00:03<00:33,  1.69it/s][A
Training:  13%|█▎        | 8/61 [00:03<00:16,  3.20it/s][A
Training:  16%|█▋        | 10/61 [00:04<00:20,  2.43it/s][A
Training:  20%|█▉        | 12/61 [00:04<00:15,  3.19it/s][A
Training:  21%|██▏       | 13/61 [00:06<00:23,  2.04it/s][A
Training:  23%|██▎       | 14/61 [00:06<00:19,  2.45it/s][A
Training:  26%|██▌       | 16/61 [00:06<00:12,  3.49it/s][A
Training:  28%|██▊       | 17/61 [00:07<00:22,  1.94it/s][A
Training:  31%|███       | 19/61 [00:08<00:14,  2.81it/s][A
Training:  34%|███▍      | 21/61 [00:09<00:16,  2.38it/s][A
Training:  39%|███▉      | 24/61 [00:09<00:10,  3.67it/s][A
Training:  41%|████      | 25/61 [00:10<00:14,  2.51it/s][A
Training:  46%|████▌     | 28/61 [00:10<00:08,  4.06it/s][A
Training:  49%|████▉     | 30/61 [00

Epoch: 8/63 - Loss: 0.1521 - Accuracy: 0.9376



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:02<00:15,  2.22s/it][A
 38%|███▊      | 3/8 [00:02<00:03,  1.58it/s][A
 62%|██████▎   | 5/8 [00:03<00:01,  1.61it/s][A
100%|██████████| 8/8 [00:03<00:00,  2.11it/s][A
Epochs:  13%|█▎        | 8/63 [03:37<24:34, 26.81s/it]

Val Loss: 0.1506 - Val Accuracy: 0.9388



Training:   0%|          | 0/61 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/61 [00:01<01:40,  1.67s/it][A
Training:   3%|▎         | 2/61 [00:01<00:45,  1.31it/s][A
Training:   7%|▋         | 4/61 [00:01<00:18,  3.07it/s][A
Training:   8%|▊         | 5/61 [00:03<00:36,  1.53it/s][A
Training:  15%|█▍        | 9/61 [00:04<00:24,  2.10it/s][A
Training:  18%|█▊        | 11/61 [00:04<00:17,  2.84it/s][A
Training:  21%|██▏       | 13/61 [00:06<00:19,  2.44it/s][A
Training:  23%|██▎       | 14/61 [00:06<00:17,  2.74it/s][A
Training:  25%|██▍       | 15/61 [00:06<00:17,  2.60it/s][A
Training:  26%|██▌       | 16/61 [00:06<00:14,  3.09it/s][A
Training:  28%|██▊       | 17/61 [00:07<00:18,  2.32it/s][A
Training:  30%|██▉       | 18/61 [00:07<00:17,  2.52it/s][A
Training:  31%|███       | 19/61 [00:08<00:16,  2.56it/s][A
Training:  34%|███▍      | 21/61 [00:08<00:13,  2.92it/s][A
Training:  36%|███▌      | 22/61 [00:09<00:15,  2.53it/s][A
Training:  38%|███▊      | 23/61 [00:

Epoch: 9/63 - Loss: 0.1513 - Accuracy: 0.9387



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:13,  1.95s/it][A
 62%|██████▎   | 5/8 [00:03<00:01,  1.57it/s][A
100%|██████████| 8/8 [00:03<00:00,  2.12it/s][A
Epochs:  14%|█▍        | 9/63 [04:04<24:10, 26.86s/it]

Val Loss: 0.1607 - Val Accuracy: 0.9303



Training:   0%|          | 0/61 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/61 [00:02<01:59,  2.00s/it][A
Training:   3%|▎         | 2/61 [00:02<00:52,  1.13it/s][A
Training:   7%|▋         | 4/61 [00:02<00:21,  2.69it/s][A
Training:  10%|▉         | 6/61 [00:03<00:30,  1.82it/s][A
Training:  13%|█▎        | 8/61 [00:03<00:19,  2.75it/s][A
Training:  15%|█▍        | 9/61 [00:05<00:27,  1.88it/s][A
Training:  16%|█▋        | 10/61 [00:05<00:21,  2.33it/s][A
Training:  20%|█▉        | 12/61 [00:05<00:14,  3.27it/s][A
Training:  21%|██▏       | 13/61 [00:06<00:25,  1.87it/s][A
Training:  25%|██▍       | 15/61 [00:06<00:16,  2.84it/s][A
Training:  26%|██▌       | 16/61 [00:07<00:15,  2.90it/s][A
Training:  28%|██▊       | 17/61 [00:08<00:21,  2.04it/s][A
Training:  31%|███       | 19/61 [00:08<00:13,  3.19it/s][A
Training:  33%|███▎      | 20/61 [00:08<00:12,  3.23it/s][A
Training:  34%|███▍      | 21/61 [00:09<00:16,  2.39it/s][A
Training:  38%|███▊      | 23/61 [00:0

Epoch: 10/63 - Loss: 0.1526 - Accuracy: 0.9397



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:12,  1.78s/it][A
 25%|██▌       | 2/8 [00:02<00:05,  1.13it/s][A
 62%|██████▎   | 5/8 [00:03<00:01,  1.85it/s][A
100%|██████████| 8/8 [00:03<00:00,  2.18it/s][A
Epochs:  16%|█▌        | 10/63 [04:31<23:49, 26.97s/it]

Val Loss: 0.1580 - Val Accuracy: 0.9309



Training:   0%|          | 0/61 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/61 [00:01<01:42,  1.71s/it][A
Training:   3%|▎         | 2/61 [00:01<00:49,  1.20it/s][A
Training:   5%|▍         | 3/61 [00:02<00:33,  1.76it/s][A
Training:   8%|▊         | 5/61 [00:03<00:31,  1.76it/s][A
Training:  10%|▉         | 6/61 [00:03<00:24,  2.29it/s][A
Training:  11%|█▏        | 7/61 [00:03<00:19,  2.79it/s][A
Training:  15%|█▍        | 9/61 [00:04<00:24,  2.13it/s][A
Training:  18%|█▊        | 11/61 [00:05<00:20,  2.41it/s][A
Training:  21%|██▏       | 13/61 [00:06<00:20,  2.30it/s][A
Training:  25%|██▍       | 15/61 [00:07<00:19,  2.39it/s][A
Training:  28%|██▊       | 17/61 [00:08<00:18,  2.36it/s][A
Training:  31%|███       | 19/61 [00:08<00:16,  2.57it/s][A
Training:  34%|███▍      | 21/61 [00:09<00:15,  2.58it/s][A
Training:  38%|███▊      | 23/61 [00:10<00:14,  2.61it/s][A
Training:  39%|███▉      | 24/61 [00:10<00:12,  2.90it/s][A
Training:  41%|████      | 25/61 [00:11

Epoch: 11/63 - Loss: 0.1416 - Accuracy: 0.9434



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:13,  1.90s/it][A
 38%|███▊      | 3/8 [00:02<00:02,  1.84it/s][A
 62%|██████▎   | 5/8 [00:03<00:01,  1.79it/s][A
100%|██████████| 8/8 [00:03<00:00,  2.27it/s][A
Epochs:  17%|█▋        | 11/63 [04:58<23:30, 27.12s/it]

Val Loss: 0.1422 - Val Accuracy: 0.9442



Training:   0%|          | 0/61 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/61 [00:01<01:56,  1.95s/it][A
Training:   5%|▍         | 3/61 [00:02<00:32,  1.79it/s][A
Training:   7%|▋         | 4/61 [00:02<00:25,  2.25it/s][A
Training:   8%|▊         | 5/61 [00:03<00:37,  1.50it/s][A
Training:  10%|▉         | 6/61 [00:03<00:26,  2.05it/s][A
Training:  13%|█▎        | 8/61 [00:03<00:15,  3.32it/s][A
Training:  15%|█▍        | 9/61 [00:04<00:25,  2.01it/s][A
Training:  16%|█▋        | 10/61 [00:05<00:24,  2.11it/s][A
Training:  20%|█▉        | 12/61 [00:05<00:17,  2.87it/s][A
Training:  21%|██▏       | 13/61 [00:06<00:21,  2.24it/s][A
Training:  23%|██▎       | 14/61 [00:06<00:22,  2.10it/s][A
Training:  28%|██▊       | 17/61 [00:07<00:16,  2.61it/s][A
Training:  30%|██▉       | 18/61 [00:08<00:20,  2.11it/s][A
Training:  31%|███       | 19/61 [00:08<00:16,  2.55it/s][A
Training:  34%|███▍      | 21/61 [00:09<00:13,  2.99it/s][A
Training:  36%|███▌      | 22/61 [00:10

Epoch: 12/63 - Loss: 0.1428 - Accuracy: 0.9428



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:02<00:15,  2.20s/it][A
 38%|███▊      | 3/8 [00:02<00:03,  1.60it/s][A
 62%|██████▎   | 5/8 [00:03<00:02,  1.47it/s][A
100%|██████████| 8/8 [00:04<00:00,  1.97it/s][A
Epochs:  19%|█▉        | 12/63 [05:26<23:15, 27.37s/it]

Val Loss: 0.1395 - Val Accuracy: 0.9399



Training:   0%|          | 0/61 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/61 [00:01<01:47,  1.79s/it][A
Training:   5%|▍         | 3/61 [00:01<00:29,  1.98it/s][A
Training:   8%|▊         | 5/61 [00:03<00:32,  1.74it/s][A
Training:  11%|█▏        | 7/61 [00:03<00:19,  2.83it/s][A
Training:  15%|█▍        | 9/61 [00:04<00:25,  2.06it/s][A
Training:  20%|█▉        | 12/61 [00:05<00:16,  2.99it/s][A
Training:  21%|██▏       | 13/61 [00:06<00:21,  2.27it/s][A
Training:  23%|██▎       | 14/61 [00:06<00:17,  2.68it/s][A
Training:  26%|██▌       | 16/61 [00:06<00:14,  3.13it/s][A
Training:  28%|██▊       | 17/61 [00:07<00:20,  2.15it/s][A
Training:  31%|███       | 19/61 [00:07<00:13,  3.02it/s][A
Training:  33%|███▎      | 20/61 [00:08<00:13,  2.95it/s][A
Training:  34%|███▍      | 21/61 [00:09<00:18,  2.17it/s][A
Training:  38%|███▊      | 23/61 [00:09<00:11,  3.24it/s][A
Training:  39%|███▉      | 24/61 [00:09<00:13,  2.85it/s][A
Training:  41%|████      | 25/61 [00:

Epoch: 13/63 - Loss: 0.1421 - Accuracy: 0.9427



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:13,  1.90s/it][A
 25%|██▌       | 2/8 [00:02<00:05,  1.17it/s][A
 50%|█████     | 4/8 [00:02<00:01,  2.72it/s][A
 62%|██████▎   | 5/8 [00:03<00:01,  1.72it/s][A
 75%|███████▌  | 6/8 [00:03<00:00,  2.11it/s][A
100%|██████████| 8/8 [00:03<00:00,  2.18it/s][A
Epochs:  21%|██        | 13/63 [05:54<22:48, 27.38s/it]

Val Loss: 0.1491 - Val Accuracy: 0.9420



Training:   0%|          | 0/61 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/61 [00:01<01:54,  1.91s/it][A
Training:   3%|▎         | 2/61 [00:02<00:50,  1.18it/s][A
Training:   8%|▊         | 5/61 [00:03<00:34,  1.63it/s][A
Training:  11%|█▏        | 7/61 [00:03<00:21,  2.52it/s][A
Training:  15%|█▍        | 9/61 [00:05<00:27,  1.89it/s][A
Training:  18%|█▊        | 11/61 [00:05<00:18,  2.69it/s][A
Training:  21%|██▏       | 13/61 [00:06<00:22,  2.14it/s][A
Training:  25%|██▍       | 15/61 [00:06<00:15,  2.98it/s][A
Training:  28%|██▊       | 17/61 [00:08<00:18,  2.33it/s][A
Training:  31%|███       | 19/61 [00:08<00:13,  3.13it/s][A
Training:  34%|███▍      | 21/61 [00:09<00:18,  2.16it/s][A
Training:  38%|███▊      | 23/61 [00:09<00:13,  2.91it/s][A
Training:  41%|████      | 25/61 [00:11<00:15,  2.29it/s][A
Training:  48%|████▊     | 29/61 [00:12<00:12,  2.59it/s][A
Training:  51%|█████     | 31/61 [00:12<00:09,  3.21it/s][A
Training:  52%|█████▏    | 32/61 [00:

Epoch: 14/63 - Loss: 0.1441 - Accuracy: 0.9422



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:02<00:14,  2.10s/it][A
 38%|███▊      | 3/8 [00:02<00:02,  1.68it/s][A
 62%|██████▎   | 5/8 [00:03<00:02,  1.47it/s][A
100%|██████████| 8/8 [00:03<00:00,  2.00it/s][A
Epochs:  22%|██▏       | 14/63 [06:21<22:20, 27.36s/it]

Val Loss: 0.1444 - Val Accuracy: 0.9420



Training:   0%|          | 0/61 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/61 [00:01<01:56,  1.94s/it][A
Training:   3%|▎         | 2/61 [00:02<00:53,  1.11it/s][A
Training:   5%|▍         | 3/61 [00:02<00:33,  1.71it/s][A
Training:   8%|▊         | 5/61 [00:03<00:32,  1.75it/s][A
Training:  11%|█▏        | 7/61 [00:03<00:22,  2.36it/s][A
Training:  15%|█▍        | 9/61 [00:05<00:25,  2.05it/s][A
Training:  16%|█▋        | 10/61 [00:05<00:21,  2.42it/s][A
Training:  18%|█▊        | 11/61 [00:05<00:19,  2.50it/s][A
Training:  20%|█▉        | 12/61 [00:05<00:16,  3.02it/s][A
Training:  21%|██▏       | 13/61 [00:06<00:23,  2.07it/s][A
Training:  25%|██▍       | 15/61 [00:07<00:17,  2.58it/s][A
Training:  28%|██▊       | 17/61 [00:07<00:17,  2.51it/s][A
Training:  30%|██▉       | 18/61 [00:08<00:15,  2.78it/s][A
Training:  31%|███       | 19/61 [00:08<00:15,  2.74it/s][A
Training:  34%|███▍      | 21/61 [00:09<00:15,  2.50it/s][A
Training:  36%|███▌      | 22/61 [00:0

Epoch: 15/63 - Loss: 0.1419 - Accuracy: 0.9434



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:11,  1.70s/it][A
 25%|██▌       | 2/8 [00:02<00:05,  1.11it/s][A
 50%|█████     | 4/8 [00:02<00:01,  2.70it/s][A
 62%|██████▎   | 5/8 [00:03<00:02,  1.44it/s][A
100%|██████████| 8/8 [00:03<00:00,  2.06it/s][A
Epochs:  24%|██▍       | 15/63 [06:49<21:57, 27.45s/it]

Val Loss: 0.1457 - Val Accuracy: 0.9425



Training:   0%|          | 0/61 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/61 [00:02<02:00,  2.00s/it][A
Training:   7%|▋         | 4/61 [00:02<00:24,  2.37it/s][A
Training:  10%|▉         | 6/61 [00:03<00:34,  1.60it/s][A
Training:  13%|█▎        | 8/61 [00:04<00:22,  2.40it/s][A
Training:  15%|█▍        | 9/61 [00:05<00:29,  1.76it/s][A
Training:  16%|█▋        | 10/61 [00:05<00:25,  1.99it/s][A
Training:  21%|██▏       | 13/61 [00:06<00:21,  2.19it/s][A
Training:  23%|██▎       | 14/61 [00:07<00:19,  2.39it/s][A
Training:  26%|██▌       | 16/61 [00:07<00:13,  3.39it/s][A
Training:  28%|██▊       | 17/61 [00:08<00:22,  1.98it/s][A
Training:  31%|███       | 19/61 [00:08<00:14,  2.89it/s][A
Training:  34%|███▍      | 21/61 [00:09<00:16,  2.42it/s][A
Training:  38%|███▊      | 23/61 [00:09<00:11,  3.29it/s][A
Training:  41%|████      | 25/61 [00:11<00:15,  2.29it/s][A
Training:  43%|████▎     | 26/61 [00:11<00:13,  2.66it/s][A
Training:  44%|████▍     | 27/61 [00:

Epoch: 16/63 - Loss: 0.1467 - Accuracy: 0.9419



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:13,  1.87s/it][A
 38%|███▊      | 3/8 [00:02<00:02,  1.85it/s][A
 50%|█████     | 4/8 [00:02<00:01,  2.56it/s][A
100%|██████████| 8/8 [00:03<00:00,  2.24it/s][A
Epochs:  25%|██▌       | 16/63 [07:16<21:30, 27.46s/it]

Val Loss: 0.1465 - Val Accuracy: 0.9393



Training:   0%|          | 0/61 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/61 [00:01<01:51,  1.86s/it][A
Training:   7%|▋         | 4/61 [00:02<00:22,  2.56it/s][A
Training:  10%|▉         | 6/61 [00:03<00:34,  1.61it/s][A
Training:  13%|█▎        | 8/61 [00:03<00:21,  2.48it/s][A
Training:  16%|█▋        | 10/61 [00:05<00:25,  1.97it/s][A
Training:  21%|██▏       | 13/61 [00:06<00:23,  2.07it/s][A
Training:  25%|██▍       | 15/61 [00:06<00:16,  2.78it/s][A
Training:  28%|██▊       | 17/61 [00:07<00:17,  2.47it/s][A
Training:  30%|██▉       | 18/61 [00:08<00:15,  2.71it/s][A
Training:  34%|███▍      | 21/61 [00:09<00:15,  2.65it/s][A
Training:  36%|███▌      | 22/61 [00:09<00:13,  2.87it/s][A
Training:  39%|███▉      | 24/61 [00:09<00:09,  3.80it/s][A
Training:  41%|████      | 25/61 [00:10<00:15,  2.33it/s][A
Training:  43%|████▎     | 26/61 [00:10<00:13,  2.64it/s][A
Training:  44%|████▍     | 27/61 [00:11<00:11,  3.01it/s][A
Training:  48%|████▊     | 29/61 [00

Epoch: 17/63 - Loss: 0.1442 - Accuracy: 0.9427



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:11,  1.69s/it][A
 25%|██▌       | 2/8 [00:01<00:05,  1.17it/s][A
 62%|██████▎   | 5/8 [00:03<00:01,  1.80it/s][A
100%|██████████| 8/8 [00:03<00:00,  2.26it/s][A
Epochs:  27%|██▋       | 17/63 [07:44<21:04, 27.49s/it]

Val Loss: 0.1600 - Val Accuracy: 0.9314



Training:   0%|          | 0/61 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/61 [00:02<02:10,  2.17s/it][A
Training:   8%|▊         | 5/61 [00:03<00:35,  1.56it/s][A
Training:  11%|█▏        | 7/61 [00:03<00:23,  2.34it/s][A
Training:  15%|█▍        | 9/61 [00:05<00:27,  1.87it/s][A
Training:  16%|█▋        | 10/61 [00:05<00:22,  2.23it/s][A
Training:  18%|█▊        | 11/61 [00:05<00:18,  2.69it/s][A
Training:  21%|██▏       | 13/61 [00:06<00:22,  2.18it/s][A
Training:  23%|██▎       | 14/61 [00:06<00:18,  2.60it/s][A
Training:  26%|██▌       | 16/61 [00:06<00:11,  3.87it/s][A
Training:  30%|██▉       | 18/61 [00:08<00:16,  2.61it/s][A
Training:  33%|███▎      | 20/61 [00:08<00:11,  3.53it/s][A
Training:  34%|███▍      | 21/61 [00:09<00:20,  1.95it/s][A
Training:  38%|███▊      | 23/61 [00:09<00:13,  2.79it/s][A
Training:  41%|████      | 25/61 [00:11<00:17,  2.07it/s][A
Training:  43%|████▎     | 26/61 [00:11<00:14,  2.42it/s][A
Training:  48%|████▊     | 29/61 [00

Epoch: 18/63 - Loss: 0.1457 - Accuracy: 0.9418



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:12,  1.77s/it][A
 25%|██▌       | 2/8 [00:01<00:04,  1.24it/s][A
 50%|█████     | 4/8 [00:02<00:01,  2.98it/s][A
100%|██████████| 8/8 [00:03<00:00,  2.17it/s][A
Epochs:  29%|██▊       | 18/63 [08:12<20:43, 27.63s/it]

Val Loss: 0.1701 - Val Accuracy: 0.9298



Training:   0%|          | 0/61 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/61 [00:02<02:01,  2.03s/it][A
Training:   5%|▍         | 3/61 [00:02<00:34,  1.69it/s][A
Training:   8%|▊         | 5/61 [00:03<00:36,  1.54it/s][A
Training:  11%|█▏        | 7/61 [00:03<00:21,  2.47it/s][A
Training:  15%|█▍        | 9/61 [00:05<00:26,  2.00it/s][A
Training:  18%|█▊        | 11/61 [00:05<00:18,  2.76it/s][A
Training:  20%|█▉        | 12/61 [00:05<00:15,  3.17it/s][A
Training:  21%|██▏       | 13/61 [00:06<00:26,  1.85it/s][A
Training:  23%|██▎       | 14/61 [00:06<00:20,  2.28it/s][A
Training:  26%|██▌       | 16/61 [00:06<00:12,  3.49it/s][A
Training:  28%|██▊       | 17/61 [00:08<00:23,  1.87it/s][A
Training:  31%|███       | 19/61 [00:08<00:14,  2.83it/s][A
Training:  34%|███▍      | 21/61 [00:09<00:17,  2.27it/s][A
Training:  38%|███▊      | 23/61 [00:09<00:11,  3.24it/s][A
Training:  41%|████      | 25/61 [00:11<00:16,  2.12it/s][A
Training:  44%|████▍     | 27/61 [00:

Epoch: 19/63 - Loss: 0.1398 - Accuracy: 0.9435



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:12,  1.76s/it][A
 38%|███▊      | 3/8 [00:01<00:02,  1.98it/s][A
 62%|██████▎   | 5/8 [00:03<00:01,  1.77it/s][A
100%|██████████| 8/8 [00:03<00:00,  2.35it/s][A
Epochs:  30%|███       | 19/63 [08:39<20:12, 27.56s/it]

Val Loss: 0.1577 - Val Accuracy: 0.9357



Training:   0%|          | 0/61 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/61 [00:02<02:02,  2.04s/it][A
Training:   3%|▎         | 2/61 [00:02<00:55,  1.07it/s][A
Training:   8%|▊         | 5/61 [00:03<00:35,  1.57it/s][A
Training:  11%|█▏        | 7/61 [00:03<00:22,  2.45it/s][A
Training:  15%|█▍        | 9/61 [00:05<00:27,  1.90it/s][A
Training:  20%|█▉        | 12/61 [00:05<00:15,  3.18it/s][A
Training:  23%|██▎       | 14/61 [00:07<00:21,  2.23it/s][A
Training:  28%|██▊       | 17/61 [00:08<00:20,  2.20it/s][A
Training:  31%|███       | 19/61 [00:08<00:14,  2.89it/s][A
Training:  34%|███▍      | 21/61 [00:09<00:18,  2.22it/s][A
Training:  41%|████      | 25/61 [00:11<00:14,  2.46it/s][A
Training:  46%|████▌     | 28/61 [00:11<00:09,  3.35it/s][A
Training:  48%|████▊     | 29/61 [00:12<00:13,  2.41it/s][A
Training:  52%|█████▏    | 32/61 [00:12<00:08,  3.44it/s][A
Training:  54%|█████▍    | 33/61 [00:14<00:12,  2.33it/s][A
Training:  56%|█████▌    | 34/61 [00:

Epoch: 20/63 - Loss: 0.1441 - Accuracy: 0.9430



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:12,  1.72s/it][A
 50%|█████     | 4/8 [00:01<00:01,  2.81it/s][A
100%|██████████| 8/8 [00:03<00:00,  2.28it/s][A
Epochs:  32%|███▏      | 20/63 [09:06<19:41, 27.48s/it]

Val Loss: 0.1719 - Val Accuracy: 0.9297



Training:   0%|          | 0/61 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/61 [00:01<01:46,  1.78s/it][A
Training:   3%|▎         | 2/61 [00:02<00:55,  1.05it/s][A
Training:   5%|▍         | 3/61 [00:02<00:32,  1.77it/s][A
Training:   8%|▊         | 5/61 [00:03<00:30,  1.85it/s][A
Training:  10%|▉         | 6/61 [00:03<00:29,  1.85it/s][A
Training:  13%|█▎        | 8/61 [00:04<00:18,  2.90it/s][A
Training:  15%|█▍        | 9/61 [00:04<00:24,  2.10it/s][A
Training:  16%|█▋        | 10/61 [00:05<00:25,  2.02it/s][A
Training:  20%|█▉        | 12/61 [00:05<00:15,  3.19it/s][A
Training:  21%|██▏       | 13/61 [00:06<00:21,  2.28it/s][A
Training:  23%|██▎       | 14/61 [00:07<00:23,  2.02it/s][A
Training:  26%|██▌       | 16/61 [00:07<00:14,  3.18it/s][A
Training:  28%|██▊       | 17/61 [00:07<00:17,  2.55it/s][A
Training:  30%|██▉       | 18/61 [00:08<00:17,  2.50it/s][A
Training:  34%|███▍      | 21/61 [00:09<00:14,  2.78it/s][A
Training:  36%|███▌      | 22/61 [00:09

Epoch: 21/63 - Loss: 0.1481 - Accuracy: 0.9400



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:12,  1.79s/it][A
 25%|██▌       | 2/8 [00:01<00:04,  1.24it/s][A
 50%|█████     | 4/8 [00:02<00:01,  2.87it/s][A
 62%|██████▎   | 5/8 [00:03<00:01,  1.71it/s][A
100%|██████████| 8/8 [00:03<00:00,  2.40it/s][A
Epochs:  33%|███▎      | 21/63 [09:34<19:16, 27.53s/it]

Val Loss: 0.1673 - Val Accuracy: 0.9345



Training:   0%|          | 0/61 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/61 [00:01<01:54,  1.92s/it][A
Training:   5%|▍         | 3/61 [00:02<00:32,  1.78it/s][A
Training:   7%|▋         | 4/61 [00:02<00:24,  2.37it/s][A
Training:   8%|▊         | 5/61 [00:03<00:42,  1.31it/s][A
Training:  11%|█▏        | 7/61 [00:03<00:23,  2.34it/s][A
Training:  15%|█▍        | 9/61 [00:05<00:27,  1.89it/s][A
Training:  20%|█▉        | 12/61 [00:05<00:14,  3.35it/s][A
Training:  23%|██▎       | 14/61 [00:06<00:19,  2.43it/s][A
Training:  26%|██▌       | 16/61 [00:06<00:14,  3.14it/s][A
Training:  28%|██▊       | 17/61 [00:07<00:19,  2.21it/s][A
Training:  31%|███       | 19/61 [00:08<00:13,  3.11it/s][A
Training:  33%|███▎      | 20/61 [00:08<00:13,  3.14it/s][A
Training:  34%|███▍      | 21/61 [00:09<00:18,  2.11it/s][A
Training:  38%|███▊      | 23/61 [00:09<00:12,  3.13it/s][A
Training:  39%|███▉      | 24/61 [00:09<00:11,  3.19it/s][A
Training:  41%|████      | 25/61 [00:1

Epoch: 22/63 - Loss: 0.1427 - Accuracy: 0.9431



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:13,  1.90s/it][A
 38%|███▊      | 3/8 [00:02<00:02,  1.89it/s][A
 62%|██████▎   | 5/8 [00:03<00:01,  1.59it/s][A
100%|██████████| 8/8 [00:03<00:00,  2.17it/s][A
Epochs:  35%|███▍      | 22/63 [10:02<18:52, 27.61s/it]

Val Loss: 0.1509 - Val Accuracy: 0.9357



Training:   0%|          | 0/61 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/61 [00:02<01:59,  2.00s/it][A
Training:   5%|▍         | 3/61 [00:02<00:33,  1.73it/s][A
Training:   7%|▋         | 4/61 [00:02<00:23,  2.41it/s][A
Training:   8%|▊         | 5/61 [00:03<00:37,  1.50it/s][A
Training:  10%|▉         | 6/61 [00:03<00:29,  1.86it/s][A
Training:  11%|█▏        | 7/61 [00:03<00:21,  2.48it/s][A
Training:  15%|█▍        | 9/61 [00:05<00:25,  2.03it/s][A
Training:  16%|█▋        | 10/61 [00:05<00:22,  2.25it/s][A
Training:  18%|█▊        | 11/61 [00:05<00:19,  2.53it/s][A
Training:  20%|█▉        | 12/61 [00:05<00:15,  3.12it/s][A
Training:  21%|██▏       | 13/61 [00:06<00:20,  2.31it/s][A
Training:  23%|██▎       | 14/61 [00:06<00:16,  2.79it/s][A
Training:  25%|██▍       | 15/61 [00:07<00:18,  2.54it/s][A
Training:  28%|██▊       | 17/61 [00:07<00:16,  2.68it/s][A
Training:  30%|██▉       | 18/61 [00:08<00:16,  2.55it/s][A
Training:  31%|███       | 19/61 [00:08

Epoch: 23/63 - Loss: 0.1369 - Accuracy: 0.9471



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:02<00:14,  2.02s/it][A
 38%|███▊      | 3/8 [00:02<00:02,  1.75it/s][A
 62%|██████▎   | 5/8 [00:03<00:01,  1.66it/s][A
100%|██████████| 8/8 [00:03<00:00,  2.20it/s][A
Epochs:  37%|███▋      | 23/63 [10:30<18:31, 27.79s/it]

Val Loss: 0.1395 - Val Accuracy: 0.9441



Training:   0%|          | 0/61 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/61 [00:02<02:04,  2.07s/it][A
Training:   5%|▍         | 3/61 [00:02<00:33,  1.73it/s][A
Training:   8%|▊         | 5/61 [00:03<00:39,  1.43it/s][A
Training:  11%|█▏        | 7/61 [00:03<00:23,  2.28it/s][A
Training:  15%|█▍        | 9/61 [00:05<00:28,  1.79it/s][A
Training:  18%|█▊        | 11/61 [00:05<00:19,  2.61it/s][A
Training:  20%|█▉        | 12/61 [00:05<00:16,  3.01it/s][A
Training:  21%|██▏       | 13/61 [00:07<00:28,  1.71it/s][A
Training:  25%|██▍       | 15/61 [00:07<00:17,  2.59it/s][A
Training:  28%|██▊       | 17/61 [00:08<00:21,  2.06it/s][A
Training:  31%|███       | 19/61 [00:08<00:14,  2.95it/s][A
Training:  34%|███▍      | 21/61 [00:10<00:17,  2.29it/s][A
Training:  38%|███▊      | 23/61 [00:10<00:11,  3.18it/s][A
Training:  41%|████      | 25/61 [00:11<00:15,  2.28it/s][A
Training:  44%|████▍     | 27/61 [00:11<00:11,  2.98it/s][A
Training:  46%|████▌     | 28/61 [00:

Epoch: 24/63 - Loss: 0.1339 - Accuracy: 0.9466



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:12,  1.82s/it][A
 25%|██▌       | 2/8 [00:01<00:04,  1.23it/s][A
 50%|█████     | 4/8 [00:02<00:01,  2.93it/s][A
 75%|███████▌  | 6/8 [00:03<00:01,  1.93it/s][A
100%|██████████| 8/8 [00:03<00:00,  2.16it/s][A
Epochs:  38%|███▊      | 24/63 [10:59<18:23, 28.29s/it]

Val Loss: 0.1517 - Val Accuracy: 0.9356



Training:   0%|          | 0/61 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/61 [00:01<01:43,  1.73s/it][A
Training:   3%|▎         | 2/61 [00:01<00:50,  1.17it/s][A
Training:   8%|▊         | 5/61 [00:03<00:34,  1.65it/s][A
Training:  10%|▉         | 6/61 [00:03<00:28,  1.92it/s][A
Training:  13%|█▎        | 8/61 [00:03<00:17,  2.98it/s][A
Training:  15%|█▍        | 9/61 [00:05<00:26,  1.96it/s][A
Training:  16%|█▋        | 10/61 [00:05<00:23,  2.17it/s][A
Training:  20%|█▉        | 12/61 [00:05<00:14,  3.41it/s][A
Training:  21%|██▏       | 13/61 [00:06<00:22,  2.09it/s][A
Training:  23%|██▎       | 14/61 [00:06<00:20,  2.26it/s][A
Training:  25%|██▍       | 15/61 [00:07<00:16,  2.76it/s][A
Training:  26%|██▌       | 16/61 [00:07<00:13,  3.41it/s][A
Training:  28%|██▊       | 17/61 [00:08<00:26,  1.64it/s][A
Training:  30%|██▉       | 18/61 [00:08<00:21,  1.97it/s][A
Training:  31%|███       | 19/61 [00:08<00:16,  2.56it/s][A
Training:  34%|███▍      | 21/61 [00:1

Epoch: 25/63 - Loss: 0.1366 - Accuracy: 0.9453



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:13,  1.92s/it][A
 38%|███▊      | 3/8 [00:02<00:02,  1.77it/s][A
 50%|█████     | 4/8 [00:02<00:01,  2.43it/s][A
 62%|██████▎   | 5/8 [00:03<00:02,  1.36it/s][A
100%|██████████| 8/8 [00:03<00:00,  2.10it/s][A
Epochs:  40%|███▉      | 25/63 [11:28<18:03, 28.51s/it]

Val Loss: 0.1661 - Val Accuracy: 0.9277



Training:   0%|          | 0/61 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/61 [00:01<01:47,  1.79s/it][A
Training:   3%|▎         | 2/61 [00:01<00:49,  1.19it/s][A
Training:   7%|▋         | 4/61 [00:02<00:20,  2.83it/s][A
Training:   8%|▊         | 5/61 [00:03<00:37,  1.50it/s][A
Training:  10%|▉         | 6/61 [00:03<00:28,  1.90it/s][A
Training:  13%|█▎        | 8/61 [00:03<00:17,  3.09it/s][A
Training:  15%|█▍        | 9/61 [00:05<00:28,  1.80it/s][A
Training:  16%|█▋        | 10/61 [00:05<00:22,  2.29it/s][A
Training:  20%|█▉        | 12/61 [00:05<00:13,  3.62it/s][A
Training:  21%|██▏       | 13/61 [00:06<00:25,  1.89it/s][A
Training:  23%|██▎       | 14/61 [00:06<00:20,  2.32it/s][A
Training:  28%|██▊       | 17/61 [00:08<00:18,  2.34it/s][A
Training:  30%|██▉       | 18/61 [00:08<00:15,  2.70it/s][A
Training:  31%|███       | 19/61 [00:08<00:13,  3.05it/s][A
Training:  34%|███▍      | 21/61 [00:09<00:16,  2.48it/s][A
Training:  36%|███▌      | 22/61 [00:09

Epoch: 26/63 - Loss: 0.1428 - Accuracy: 0.9424



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:12,  1.84s/it][A
 38%|███▊      | 3/8 [00:01<00:02,  1.91it/s][A
 62%|██████▎   | 5/8 [00:03<00:01,  1.58it/s][A
100%|██████████| 8/8 [00:03<00:00,  2.21it/s][A
Epochs:  41%|████▏     | 26/63 [11:56<17:23, 28.20s/it]

Val Loss: 0.1492 - Val Accuracy: 0.9346



Training:   0%|          | 0/61 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/61 [00:01<01:44,  1.74s/it][A
Training:   5%|▍         | 3/61 [00:01<00:30,  1.93it/s][A
Training:   8%|▊         | 5/61 [00:03<00:36,  1.54it/s][A
Training:  11%|█▏        | 7/61 [00:03<00:21,  2.50it/s][A
Training:  15%|█▍        | 9/61 [00:04<00:25,  2.08it/s][A
Training:  18%|█▊        | 11/61 [00:04<00:16,  3.00it/s][A
Training:  21%|██▏       | 13/61 [00:06<00:21,  2.26it/s][A
Training:  25%|██▍       | 15/61 [00:06<00:15,  3.04it/s][A
Training:  28%|██▊       | 17/61 [00:07<00:16,  2.64it/s][A
Training:  30%|██▉       | 18/61 [00:07<00:14,  2.90it/s][A
Training:  31%|███       | 19/61 [00:07<00:13,  3.10it/s][A
Training:  34%|███▍      | 21/61 [00:08<00:15,  2.50it/s][A
Training:  36%|███▌      | 22/61 [00:09<00:13,  2.85it/s][A
Training:  38%|███▊      | 23/61 [00:09<00:15,  2.50it/s][A
Training:  41%|████      | 25/61 [00:10<00:14,  2.53it/s][A
Training:  44%|████▍     | 27/61 [00:

Epoch: 27/63 - Loss: 0.1395 - Accuracy: 0.9438



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:12,  1.75s/it][A
 38%|███▊      | 3/8 [00:01<00:02,  1.99it/s][A
 62%|██████▎   | 5/8 [00:03<00:01,  1.65it/s][A
100%|██████████| 8/8 [00:03<00:00,  2.28it/s][A
Epochs:  43%|████▎     | 27/63 [12:23<16:43, 27.87s/it]

Val Loss: 0.1542 - Val Accuracy: 0.9362



Training:   0%|          | 0/61 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/61 [00:01<01:38,  1.65s/it][A
Training:   3%|▎         | 2/61 [00:01<00:44,  1.33it/s][A
Training:   7%|▋         | 4/61 [00:01<00:18,  3.04it/s][A
Training:   8%|▊         | 5/61 [00:03<00:34,  1.62it/s][A
Training:  10%|▉         | 6/61 [00:03<00:26,  2.05it/s][A
Training:  13%|█▎        | 8/61 [00:03<00:15,  3.48it/s][A
Training:  15%|█▍        | 9/61 [00:04<00:26,  1.99it/s][A
Training:  16%|█▋        | 10/61 [00:05<00:24,  2.08it/s][A
Training:  21%|██▏       | 13/61 [00:05<00:17,  2.77it/s][A
Training:  23%|██▎       | 14/61 [00:06<00:19,  2.44it/s][A
Training:  26%|██▌       | 16/61 [00:06<00:13,  3.43it/s][A
Training:  28%|██▊       | 17/61 [00:07<00:17,  2.46it/s][A
Training:  30%|██▉       | 18/61 [00:08<00:19,  2.26it/s][A
Training:  33%|███▎      | 20/61 [00:08<00:12,  3.38it/s][A
Training:  34%|███▍      | 21/61 [00:09<00:18,  2.19it/s][A
Training:  36%|███▌      | 22/61 [00:09

Epoch: 28/63 - Loss: 0.1349 - Accuracy: 0.9482



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:10,  1.54s/it][A
 62%|██████▎   | 5/8 [00:02<00:01,  2.02it/s][A
 75%|███████▌  | 6/8 [00:02<00:00,  2.40it/s][A
100%|██████████| 8/8 [00:03<00:00,  2.55it/s][A
Epochs:  44%|████▍     | 28/63 [12:50<16:06, 27.63s/it]

Val Loss: 0.1394 - Val Accuracy: 0.9393



Training:   0%|          | 0/61 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/61 [00:01<01:33,  1.57s/it][A
Training:   3%|▎         | 2/61 [00:01<00:43,  1.36it/s][A
Training:   7%|▋         | 4/61 [00:01<00:17,  3.21it/s][A
Training:   8%|▊         | 5/61 [00:03<00:34,  1.64it/s][A
Training:  13%|█▎        | 8/61 [00:03<00:15,  3.52it/s][A
Training:  16%|█▋        | 10/61 [00:04<00:23,  2.22it/s][A
Training:  20%|█▉        | 12/61 [00:04<00:15,  3.13it/s][A
Training:  23%|██▎       | 14/61 [00:06<00:19,  2.41it/s][A
Training:  26%|██▌       | 16/61 [00:06<00:13,  3.25it/s][A
Training:  30%|██▉       | 18/61 [00:07<00:18,  2.33it/s][A
Training:  34%|███▍      | 21/61 [00:08<00:17,  2.30it/s][A
Training:  38%|███▊      | 23/61 [00:09<00:12,  2.99it/s][A
Training:  39%|███▉      | 24/61 [00:09<00:11,  3.33it/s][A
Training:  41%|████      | 25/61 [00:10<00:17,  2.04it/s][A
Training:  46%|████▌     | 28/61 [00:10<00:09,  3.48it/s][A
Training:  49%|████▉     | 30/61 [00:

Epoch: 29/63 - Loss: 0.1349 - Accuracy: 0.9467



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:12,  1.78s/it][A
 38%|███▊      | 3/8 [00:01<00:02,  1.97it/s][A
 62%|██████▎   | 5/8 [00:03<00:01,  1.80it/s][A
 75%|███████▌  | 6/8 [00:03<00:00,  2.20it/s][A
100%|██████████| 8/8 [00:03<00:00,  2.24it/s][A
Epochs:  46%|████▌     | 29/63 [13:17<15:36, 27.54s/it]

Val Loss: 0.1411 - Val Accuracy: 0.9437



Training:   0%|          | 0/61 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/61 [00:01<01:47,  1.80s/it][A
Training:   5%|▍         | 3/61 [00:01<00:30,  1.93it/s][A
Training:   8%|▊         | 5/61 [00:03<00:34,  1.61it/s][A
Training:  11%|█▏        | 7/61 [00:03<00:20,  2.63it/s][A
Training:  15%|█▍        | 9/61 [00:04<00:25,  2.03it/s][A
Training:  18%|█▊        | 11/61 [00:04<00:17,  2.88it/s][A
Training:  21%|██▏       | 13/61 [00:06<00:21,  2.26it/s][A
Training:  26%|██▌       | 16/61 [00:06<00:12,  3.60it/s][A
Training:  30%|██▉       | 18/61 [00:07<00:16,  2.65it/s][A
Training:  31%|███       | 19/61 [00:07<00:14,  2.84it/s][A
Training:  34%|███▍      | 21/61 [00:08<00:15,  2.55it/s][A
Training:  36%|███▌      | 22/61 [00:09<00:14,  2.64it/s][A
Training:  38%|███▊      | 23/61 [00:09<00:12,  3.04it/s][A
Training:  41%|████      | 25/61 [00:10<00:13,  2.59it/s][A
Training:  43%|████▎     | 26/61 [00:10<00:14,  2.43it/s][A
Training:  44%|████▍     | 27/61 [00:

Epoch: 30/63 - Loss: 0.1335 - Accuracy: 0.9479



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:12,  1.85s/it][A
 38%|███▊      | 3/8 [00:01<00:02,  1.92it/s][A
 62%|██████▎   | 5/8 [00:03<00:01,  1.80it/s][A
100%|██████████| 8/8 [00:03<00:00,  2.37it/s][A
Epochs:  48%|████▊     | 30/63 [13:44<15:03, 27.36s/it]

Val Loss: 0.1454 - Val Accuracy: 0.9421



Training:   0%|          | 0/61 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/61 [00:02<02:02,  2.05s/it][A
Training:   5%|▍         | 3/61 [00:02<00:33,  1.74it/s][A
Training:   8%|▊         | 5/61 [00:03<00:34,  1.61it/s][A
Training:  11%|█▏        | 7/61 [00:03<00:21,  2.54it/s][A
Training:  13%|█▎        | 8/61 [00:03<00:17,  2.99it/s][A
Training:  15%|█▍        | 9/61 [00:04<00:27,  1.89it/s][A
Training:  18%|█▊        | 11/61 [00:05<00:17,  2.93it/s][A
Training:  21%|██▏       | 13/61 [00:06<00:21,  2.22it/s][A
Training:  25%|██▍       | 15/61 [00:06<00:14,  3.15it/s][A
Training:  28%|██▊       | 17/61 [00:07<00:18,  2.43it/s][A
Training:  30%|██▉       | 18/61 [00:07<00:15,  2.84it/s][A
Training:  31%|███       | 19/61 [00:07<00:12,  3.30it/s][A
Training:  34%|███▍      | 21/61 [00:09<00:17,  2.33it/s][A
Training:  38%|███▊      | 23/61 [00:09<00:12,  3.13it/s][A
Training:  41%|████      | 25/61 [00:10<00:15,  2.32it/s][A
Training:  44%|████▍     | 27/61 [00:1

Epoch: 31/63 - Loss: 0.1320 - Accuracy: 0.9465



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:12,  1.74s/it][A
 25%|██▌       | 2/8 [00:02<00:05,  1.10it/s][A
 62%|██████▎   | 5/8 [00:03<00:01,  1.88it/s][A
100%|██████████| 8/8 [00:03<00:00,  2.30it/s][A
Epochs:  49%|████▉     | 31/63 [14:12<14:38, 27.46s/it]

Val Loss: 0.1528 - Val Accuracy: 0.9372



Training:   0%|          | 0/61 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/61 [00:02<02:01,  2.03s/it][A
Training:   8%|▊         | 5/61 [00:03<00:32,  1.72it/s][A
Training:  13%|█▎        | 8/61 [00:03<00:17,  3.09it/s][A
Training:  16%|█▋        | 10/61 [00:04<00:22,  2.28it/s][A
Training:  18%|█▊        | 11/61 [00:04<00:18,  2.65it/s][A
Training:  21%|██▏       | 13/61 [00:06<00:21,  2.23it/s][A
Training:  23%|██▎       | 14/61 [00:06<00:17,  2.62it/s][A
Training:  25%|██▍       | 15/61 [00:06<00:15,  3.06it/s][A
Training:  28%|██▊       | 17/61 [00:07<00:21,  2.05it/s][A
Training:  31%|███       | 19/61 [00:07<00:14,  2.94it/s][A
Training:  34%|███▍      | 21/61 [00:09<00:17,  2.35it/s][A
Training:  38%|███▊      | 23/61 [00:09<00:11,  3.21it/s][A
Training:  41%|████      | 25/61 [00:10<00:15,  2.36it/s][A
Training:  44%|████▍     | 27/61 [00:10<00:10,  3.19it/s][A
Training:  46%|████▌     | 28/61 [00:10<00:09,  3.61it/s][A
Training:  48%|████▊     | 29/61 [0

Epoch: 32/63 - Loss: 0.1372 - Accuracy: 0.9441



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:13,  1.91s/it][A
 38%|███▊      | 3/8 [00:02<00:02,  1.73it/s][A
100%|██████████| 8/8 [00:03<00:00,  2.30it/s][A
Epochs:  51%|█████     | 32/63 [14:39<14:04, 27.24s/it]

Val Loss: 0.1417 - Val Accuracy: 0.9410



Training:   0%|          | 0/61 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/61 [00:01<01:28,  1.48s/it][A
Training:   5%|▍         | 3/61 [00:01<00:24,  2.37it/s][A
Training:   8%|▊         | 5/61 [00:02<00:31,  1.78it/s][A
Training:  10%|▉         | 6/61 [00:03<00:24,  2.27it/s][A
Training:  13%|█▎        | 8/61 [00:03<00:15,  3.46it/s][A
Training:  15%|█▍        | 9/61 [00:04<00:25,  2.08it/s][A
Training:  18%|█▊        | 11/61 [00:04<00:15,  3.18it/s][A
Training:  21%|██▏       | 13/61 [00:05<00:21,  2.20it/s][A
Training:  25%|██▍       | 15/61 [00:06<00:14,  3.10it/s][A
Training:  28%|██▊       | 17/61 [00:07<00:19,  2.21it/s][A
Training:  30%|██▉       | 18/61 [00:07<00:16,  2.57it/s][A
Training:  31%|███       | 19/61 [00:07<00:13,  3.04it/s][A
Training:  34%|███▍      | 21/61 [00:09<00:19,  2.01it/s][A
Training:  39%|███▉      | 24/61 [00:09<00:11,  3.33it/s][A
Training:  41%|████      | 25/61 [00:10<00:18,  1.98it/s][A
Training:  44%|████▍     | 27/61 [00:1

Epoch: 33/63 - Loss: 0.1318 - Accuracy: 0.9478



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:13,  1.95s/it][A
 38%|███▊      | 3/8 [00:02<00:02,  1.78it/s][A
 50%|█████     | 4/8 [00:02<00:01,  2.47it/s][A
 62%|██████▎   | 5/8 [00:03<00:01,  1.60it/s][A
100%|██████████| 8/8 [00:03<00:00,  2.22it/s][A
Epochs:  52%|█████▏    | 33/63 [15:06<13:33, 27.13s/it]

Val Loss: 0.1485 - Val Accuracy: 0.9400



Training:   0%|          | 0/61 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/61 [00:02<02:02,  2.05s/it][A
Training:   5%|▍         | 3/61 [00:02<00:34,  1.70it/s][A
Training:   8%|▊         | 5/61 [00:03<00:34,  1.62it/s][A
Training:  11%|█▏        | 7/61 [00:03<00:20,  2.62it/s][A
Training:  15%|█▍        | 9/61 [00:04<00:23,  2.17it/s][A
Training:  18%|█▊        | 11/61 [00:04<00:15,  3.16it/s][A
Training:  21%|██▏       | 13/61 [00:06<00:21,  2.27it/s][A
Training:  25%|██▍       | 15/61 [00:06<00:14,  3.13it/s][A
Training:  28%|██▊       | 17/61 [00:07<00:19,  2.24it/s][A
Training:  33%|███▎      | 20/61 [00:08<00:11,  3.48it/s][A
Training:  36%|███▌      | 22/61 [00:09<00:14,  2.64it/s][A
Training:  41%|████      | 25/61 [00:10<00:15,  2.39it/s][A
Training:  43%|████▎     | 26/61 [00:10<00:12,  2.70it/s][A
Training:  46%|████▌     | 28/61 [00:10<00:09,  3.56it/s][A
Training:  48%|████▊     | 29/61 [00:12<00:14,  2.23it/s][A
Training:  51%|█████     | 31/61 [00:

Epoch: 34/63 - Loss: 0.1307 - Accuracy: 0.9475



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:13,  1.87s/it][A
 25%|██▌       | 2/8 [00:01<00:04,  1.21it/s][A
 50%|█████     | 4/8 [00:02<00:01,  2.87it/s][A
100%|██████████| 8/8 [00:03<00:00,  2.21it/s][A
Epochs:  54%|█████▍    | 34/63 [15:32<13:03, 27.03s/it]

Val Loss: 0.1417 - Val Accuracy: 0.9442



Training:   0%|          | 0/61 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/61 [00:01<01:48,  1.80s/it][A
Training:   3%|▎         | 2/61 [00:01<00:47,  1.23it/s][A
Training:   7%|▋         | 4/61 [00:02<00:19,  2.88it/s][A
Training:   8%|▊         | 5/61 [00:03<00:37,  1.51it/s][A
Training:  11%|█▏        | 7/61 [00:03<00:20,  2.66it/s][A
Training:  15%|█▍        | 9/61 [00:04<00:24,  2.09it/s][A
Training:  16%|█▋        | 10/61 [00:04<00:20,  2.46it/s][A
Training:  18%|█▊        | 11/61 [00:05<00:16,  3.00it/s][A
Training:  21%|██▏       | 13/61 [00:06<00:19,  2.42it/s][A
Training:  23%|██▎       | 14/61 [00:06<00:16,  2.87it/s][A
Training:  28%|██▊       | 17/61 [00:07<00:16,  2.74it/s][A
Training:  30%|██▉       | 18/61 [00:07<00:14,  2.97it/s][A
Training:  31%|███       | 19/61 [00:07<00:12,  3.30it/s][A
Training:  34%|███▍      | 21/61 [00:08<00:14,  2.68it/s][A
Training:  36%|███▌      | 22/61 [00:08<00:12,  3.04it/s][A
Training:  38%|███▊      | 23/61 [00:0

Epoch: 35/63 - Loss: 0.1369 - Accuracy: 0.9455



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:13,  1.98s/it][A
 38%|███▊      | 3/8 [00:02<00:02,  1.79it/s][A
100%|██████████| 8/8 [00:03<00:00,  2.19it/s][A
Epochs:  56%|█████▌    | 35/63 [15:59<12:36, 27.01s/it]

Val Loss: 0.1731 - Val Accuracy: 0.9346



Training:   0%|          | 0/61 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/61 [00:02<02:03,  2.06s/it][A
Training:   8%|▊         | 5/61 [00:03<00:34,  1.63it/s][A
Training:  15%|█▍        | 9/61 [00:05<00:25,  2.07it/s][A
Training:  18%|█▊        | 11/61 [00:05<00:18,  2.70it/s][A
Training:  21%|██▏       | 13/61 [00:06<00:19,  2.44it/s][A
Training:  26%|██▌       | 16/61 [00:06<00:12,  3.74it/s][A
Training:  30%|██▉       | 18/61 [00:07<00:17,  2.41it/s][A
Training:  33%|███▎      | 20/61 [00:08<00:13,  3.13it/s][A
Training:  36%|███▌      | 22/61 [00:09<00:16,  2.36it/s][A
Training:  39%|███▉      | 24/61 [00:09<00:11,  3.15it/s][A
Training:  43%|████▎     | 26/61 [00:11<00:15,  2.30it/s][A
Training:  44%|████▍     | 27/61 [00:11<00:12,  2.62it/s][A
Training:  48%|████▊     | 29/61 [00:12<00:14,  2.20it/s][A
Training:  51%|█████     | 31/61 [00:12<00:10,  3.00it/s][A
Training:  54%|█████▍    | 33/61 [00:13<00:12,  2.28it/s][A
Training:  57%|█████▋    | 35/61 [0

Epoch: 36/63 - Loss: 0.1315 - Accuracy: 0.9486



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:12,  1.73s/it][A
 25%|██▌       | 2/8 [00:01<00:04,  1.29it/s][A
 38%|███▊      | 3/8 [00:02<00:02,  1.79it/s][A
 62%|██████▎   | 5/8 [00:03<00:01,  1.79it/s][A
100%|██████████| 8/8 [00:03<00:00,  2.19it/s][A
Epochs:  57%|█████▋    | 36/63 [16:27<12:15, 27.26s/it]

Val Loss: 0.1421 - Val Accuracy: 0.9388



Training:   0%|          | 0/61 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/61 [00:01<01:58,  1.98s/it][A
Training:   5%|▍         | 3/61 [00:02<00:32,  1.81it/s][A
Training:   8%|▊         | 5/61 [00:03<00:32,  1.72it/s][A
Training:  11%|█▏        | 7/61 [00:03<00:19,  2.80it/s][A
Training:  15%|█▍        | 9/61 [00:04<00:24,  2.15it/s][A
Training:  16%|█▋        | 10/61 [00:04<00:19,  2.55it/s][A
Training:  20%|█▉        | 12/61 [00:04<00:13,  3.72it/s][A
Training:  23%|██▎       | 14/61 [00:05<00:16,  2.85it/s][A
Training:  26%|██▌       | 16/61 [00:06<00:11,  3.97it/s][A
Training:  30%|██▉       | 18/61 [00:07<00:16,  2.57it/s][A
Training:  33%|███▎      | 20/61 [00:07<00:12,  3.26it/s][A
Training:  34%|███▍      | 21/61 [00:08<00:17,  2.29it/s][A
Training:  36%|███▌      | 22/61 [00:09<00:16,  2.36it/s][A
Training:  39%|███▉      | 24/61 [00:09<00:11,  3.26it/s][A
Training:  41%|████      | 25/61 [00:10<00:15,  2.35it/s][A
Training:  43%|████▎     | 26/61 [00:

Epoch: 37/63 - Loss: 0.1325 - Accuracy: 0.9465



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:13,  1.87s/it][A
 25%|██▌       | 2/8 [00:02<00:05,  1.10it/s][A
 62%|██████▎   | 5/8 [00:03<00:01,  1.84it/s][A
100%|██████████| 8/8 [00:03<00:00,  2.12it/s][A
Epochs:  59%|█████▊    | 37/63 [16:54<11:45, 27.14s/it]

Val Loss: 0.1401 - Val Accuracy: 0.9420



Training:   0%|          | 0/61 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/61 [00:01<01:46,  1.78s/it][A
Training:   5%|▍         | 3/61 [00:01<00:29,  1.96it/s][A
Training:   8%|▊         | 5/61 [00:03<00:30,  1.83it/s][A
Training:  10%|▉         | 6/61 [00:03<00:25,  2.15it/s][A
Training:  11%|█▏        | 7/61 [00:03<00:20,  2.63it/s][A
Training:  15%|█▍        | 9/61 [00:04<00:24,  2.14it/s][A
Training:  16%|█▋        | 10/61 [00:04<00:21,  2.42it/s][A
Training:  18%|█▊        | 11/61 [00:04<00:16,  2.97it/s][A
Training:  21%|██▏       | 13/61 [00:05<00:19,  2.47it/s][A
Training:  23%|██▎       | 14/61 [00:06<00:16,  2.78it/s][A
Training:  26%|██▌       | 16/61 [00:06<00:10,  4.13it/s][A
Training:  28%|██▊       | 17/61 [00:07<00:18,  2.36it/s][A
Training:  30%|██▉       | 18/61 [00:07<00:15,  2.75it/s][A
Training:  31%|███       | 19/61 [00:07<00:12,  3.31it/s][A
Training:  33%|███▎      | 20/61 [00:07<00:11,  3.46it/s][A
Training:  34%|███▍      | 21/61 [00:0

Epoch: 38/63 - Loss: 0.1385 - Accuracy: 0.9438



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:12,  1.74s/it][A
 25%|██▌       | 2/8 [00:01<00:04,  1.25it/s][A
 62%|██████▎   | 5/8 [00:03<00:01,  1.78it/s][A
100%|██████████| 8/8 [00:03<00:00,  2.27it/s][A
Epochs:  60%|██████    | 38/63 [17:21<11:19, 27.19s/it]

Val Loss: 0.1469 - Val Accuracy: 0.9383



Training:   0%|          | 0/61 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/61 [00:01<01:50,  1.84s/it][A
Training:   7%|▋         | 4/61 [00:02<00:23,  2.46it/s][A
Training:   8%|▊         | 5/61 [00:03<00:36,  1.53it/s][A
Training:  11%|█▏        | 7/61 [00:03<00:21,  2.57it/s][A
Training:  15%|█▍        | 9/61 [00:04<00:25,  2.01it/s][A
Training:  20%|█▉        | 12/61 [00:04<00:14,  3.34it/s][A
Training:  23%|██▎       | 14/61 [00:06<00:18,  2.49it/s][A
Training:  26%|██▌       | 16/61 [00:06<00:13,  3.32it/s][A
Training:  28%|██▊       | 17/61 [00:07<00:19,  2.28it/s][A
Training:  30%|██▉       | 18/61 [00:07<00:18,  2.38it/s][A
Training:  33%|███▎      | 20/61 [00:07<00:11,  3.43it/s][A
Training:  34%|███▍      | 21/61 [00:09<00:18,  2.21it/s][A
Training:  36%|███▌      | 22/61 [00:09<00:15,  2.44it/s][A
Training:  41%|████      | 25/61 [00:10<00:15,  2.29it/s][A
Training:  44%|████▍     | 27/61 [00:10<00:10,  3.14it/s][A
Training:  48%|████▊     | 29/61 [00:

Epoch: 39/63 - Loss: 0.1331 - Accuracy: 0.9491



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:12,  1.76s/it][A
 50%|█████     | 4/8 [00:01<00:01,  2.63it/s][A
 75%|███████▌  | 6/8 [00:03<00:00,  2.12it/s][A
100%|██████████| 8/8 [00:03<00:00,  2.36it/s][A
Epochs:  62%|██████▏   | 39/63 [17:49<10:53, 27.22s/it]

Val Loss: 0.1428 - Val Accuracy: 0.9400



Training:   0%|          | 0/61 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/61 [00:02<02:04,  2.08s/it][A
Training:   8%|▊         | 5/61 [00:03<00:35,  1.57it/s][A
Training:  11%|█▏        | 7/61 [00:03<00:23,  2.28it/s][A
Training:  15%|█▍        | 9/61 [00:05<00:25,  2.00it/s][A
Training:  18%|█▊        | 11/61 [00:05<00:17,  2.82it/s][A
Training:  21%|██▏       | 13/61 [00:06<00:20,  2.36it/s][A
Training:  25%|██▍       | 15/61 [00:06<00:14,  3.25it/s][A
Training:  28%|██▊       | 17/61 [00:07<00:18,  2.36it/s][A
Training:  33%|███▎      | 20/61 [00:08<00:11,  3.60it/s][A
Training:  36%|███▌      | 22/61 [00:09<00:14,  2.65it/s][A
Training:  41%|████      | 25/61 [00:10<00:14,  2.47it/s][A
Training:  44%|████▍     | 27/61 [00:10<00:10,  3.17it/s][A
Training:  48%|████▊     | 29/61 [00:12<00:12,  2.48it/s][A
Training:  51%|█████     | 31/61 [00:12<00:09,  3.24it/s][A
Training:  52%|█████▏    | 32/61 [00:12<00:08,  3.25it/s][A
Training:  54%|█████▍    | 33/61 [00

Epoch: 40/63 - Loss: 0.1314 - Accuracy: 0.9483



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:13,  1.97s/it][A
 38%|███▊      | 3/8 [00:02<00:02,  1.78it/s][A
 62%|██████▎   | 5/8 [00:03<00:01,  1.64it/s][A
100%|██████████| 8/8 [00:03<00:00,  2.10it/s][A
Epochs:  63%|██████▎   | 40/63 [18:16<10:24, 27.16s/it]

Val Loss: 0.1457 - Val Accuracy: 0.9308



Training:   0%|          | 0/61 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/61 [00:01<01:52,  1.88s/it][A
Training:   3%|▎         | 2/61 [00:02<00:51,  1.15it/s][A
Training:   7%|▋         | 4/61 [00:02<00:20,  2.76it/s][A
Training:   8%|▊         | 5/61 [00:03<00:37,  1.49it/s][A
Training:  11%|█▏        | 7/61 [00:03<00:21,  2.55it/s][A
Training:  15%|█▍        | 9/61 [00:05<00:26,  1.99it/s][A
Training:  21%|██▏       | 13/61 [00:06<00:18,  2.53it/s][A
Training:  23%|██▎       | 14/61 [00:06<00:17,  2.76it/s][A
Training:  26%|██▌       | 16/61 [00:06<00:12,  3.65it/s][A
Training:  28%|██▊       | 17/61 [00:07<00:17,  2.49it/s][A
Training:  30%|██▉       | 18/61 [00:07<00:17,  2.49it/s][A
Training:  33%|███▎      | 20/61 [00:08<00:11,  3.61it/s][A
Training:  34%|███▍      | 21/61 [00:08<00:15,  2.50it/s][A
Training:  36%|███▌      | 22/61 [00:09<00:15,  2.49it/s][A
Training:  39%|███▉      | 24/61 [00:09<00:10,  3.68it/s][A
Training:  41%|████      | 25/61 [00:1

Epoch: 41/63 - Loss: 0.1351 - Accuracy: 0.9472



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:02<00:14,  2.06s/it][A
 38%|███▊      | 3/8 [00:02<00:02,  1.70it/s][A
 62%|██████▎   | 5/8 [00:03<00:01,  1.60it/s][A
100%|██████████| 8/8 [00:03<00:00,  2.15it/s][A
Epochs:  65%|██████▌   | 41/63 [18:43<09:57, 27.17s/it]

Val Loss: 0.1684 - Val Accuracy: 0.9292



Training:   0%|          | 0/61 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/61 [00:01<01:56,  1.94s/it][A
Training:   3%|▎         | 2/61 [00:02<00:53,  1.10it/s][A
Training:   7%|▋         | 4/61 [00:02<00:22,  2.57it/s][A
Training:   8%|▊         | 5/61 [00:03<00:35,  1.59it/s][A
Training:  10%|▉         | 6/61 [00:03<00:29,  1.90it/s][A
Training:  13%|█▎        | 8/61 [00:03<00:16,  3.21it/s][A
Training:  15%|█▍        | 9/61 [00:04<00:21,  2.42it/s][A
Training:  16%|█▋        | 10/61 [00:05<00:21,  2.40it/s][A
Training:  20%|█▉        | 12/61 [00:05<00:13,  3.74it/s][A
Training:  21%|██▏       | 13/61 [00:05<00:18,  2.54it/s][A
Training:  23%|██▎       | 14/61 [00:06<00:21,  2.21it/s][A
Training:  26%|██▌       | 16/61 [00:06<00:13,  3.44it/s][A
Training:  28%|██▊       | 17/61 [00:07<00:19,  2.27it/s][A
Training:  30%|██▉       | 18/61 [00:07<00:16,  2.59it/s][A
Training:  34%|███▍      | 21/61 [00:09<00:15,  2.62it/s][A
Training:  36%|███▌      | 22/61 [00:09

Epoch: 42/63 - Loss: 0.1306 - Accuracy: 0.9470



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:12,  1.79s/it][A
 25%|██▌       | 2/8 [00:01<00:04,  1.23it/s][A
 50%|█████     | 4/8 [00:02<00:01,  2.95it/s][A
100%|██████████| 8/8 [00:03<00:00,  2.20it/s][A
Epochs:  67%|██████▋   | 42/63 [19:11<09:33, 27.33s/it]

Val Loss: 0.1380 - Val Accuracy: 0.9421



Training:   0%|          | 0/61 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/61 [00:01<01:52,  1.88s/it][A
Training:   3%|▎         | 2/61 [00:02<00:54,  1.07it/s][A
Training:   5%|▍         | 3/61 [00:02<00:32,  1.80it/s][A
Training:   8%|▊         | 5/61 [00:03<00:33,  1.69it/s][A
Training:  11%|█▏        | 7/61 [00:03<00:20,  2.60it/s][A
Training:  15%|█▍        | 9/61 [00:04<00:21,  2.46it/s][A
Training:  16%|█▋        | 10/61 [00:04<00:17,  2.91it/s][A
Training:  18%|█▊        | 11/61 [00:04<00:15,  3.20it/s][A
Training:  20%|█▉        | 12/61 [00:05<00:12,  3.86it/s][A
Training:  21%|██▏       | 13/61 [00:06<00:22,  2.10it/s][A
Training:  23%|██▎       | 14/61 [00:06<00:19,  2.46it/s][A
Training:  25%|██▍       | 15/61 [00:06<00:17,  2.63it/s][A
Training:  28%|██▊       | 17/61 [00:07<00:18,  2.41it/s][A
Training:  30%|██▉       | 18/61 [00:07<00:15,  2.81it/s][A
Training:  31%|███       | 19/61 [00:07<00:13,  3.20it/s][A
Training:  34%|███▍      | 21/61 [00:0

Epoch: 43/63 - Loss: 0.1302 - Accuracy: 0.9488



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:13,  1.94s/it][A
 25%|██▌       | 2/8 [00:02<00:05,  1.06it/s][A
 62%|██████▎   | 5/8 [00:03<00:01,  1.74it/s][A
 75%|███████▌  | 6/8 [00:03<00:00,  2.14it/s][A
100%|██████████| 8/8 [00:03<00:00,  2.04it/s][A
Epochs:  68%|██████▊   | 43/63 [19:38<09:07, 27.36s/it]

Val Loss: 0.1383 - Val Accuracy: 0.9437



Training:   0%|          | 0/61 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/61 [00:02<02:03,  2.05s/it][A
Training:   3%|▎         | 2/61 [00:02<00:55,  1.05it/s][A
Training:   8%|▊         | 5/61 [00:03<00:30,  1.84it/s][A
Training:  10%|▉         | 6/61 [00:03<00:25,  2.13it/s][A
Training:  13%|█▎        | 8/61 [00:03<00:16,  3.25it/s][A
Training:  15%|█▍        | 9/61 [00:04<00:21,  2.45it/s][A
Training:  16%|█▋        | 10/61 [00:04<00:20,  2.49it/s][A
Training:  18%|█▊        | 11/61 [00:05<00:16,  3.09it/s][A
Training:  20%|█▉        | 12/61 [00:05<00:13,  3.74it/s][A
Training:  21%|██▏       | 13/61 [00:06<00:21,  2.28it/s][A
Training:  23%|██▎       | 14/61 [00:06<00:21,  2.16it/s][A
Training:  28%|██▊       | 17/61 [00:07<00:16,  2.62it/s][A
Training:  30%|██▉       | 18/61 [00:07<00:16,  2.69it/s][A
Training:  31%|███       | 19/61 [00:07<00:13,  3.12it/s][A
Training:  34%|███▍      | 21/61 [00:08<00:15,  2.62it/s][A
Training:  36%|███▌      | 22/61 [00:0

Epoch: 44/63 - Loss: 0.1321 - Accuracy: 0.9489



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:13,  1.89s/it][A
 25%|██▌       | 2/8 [00:02<00:05,  1.11it/s][A
 38%|███▊      | 3/8 [00:02<00:02,  1.77it/s][A
 62%|██████▎   | 5/8 [00:03<00:01,  1.72it/s][A
100%|██████████| 8/8 [00:03<00:00,  2.12it/s][A
Epochs:  70%|██████▉   | 44/63 [20:05<08:36, 27.16s/it]

Val Loss: 0.1422 - Val Accuracy: 0.9405



Training:   0%|          | 0/61 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/61 [00:02<02:03,  2.06s/it][A
Training:   3%|▎         | 2/61 [00:02<00:53,  1.10it/s][A
Training:   8%|▊         | 5/61 [00:03<00:33,  1.69it/s][A
Training:  13%|█▎        | 8/61 [00:03<00:16,  3.21it/s][A
Training:  16%|█▋        | 10/61 [00:05<00:21,  2.35it/s][A
Training:  20%|█▉        | 12/61 [00:05<00:15,  3.23it/s][A
Training:  23%|██▎       | 14/61 [00:06<00:16,  2.82it/s][A
Training:  28%|██▊       | 17/61 [00:07<00:15,  2.80it/s][A
Training:  30%|██▉       | 18/61 [00:07<00:14,  2.89it/s][A
Training:  33%|███▎      | 20/61 [00:07<00:10,  3.86it/s][A
Training:  34%|███▍      | 21/61 [00:08<00:14,  2.74it/s][A
Training:  36%|███▌      | 22/61 [00:09<00:16,  2.32it/s][A
Training:  38%|███▊      | 23/61 [00:09<00:13,  2.81it/s][A
Training:  41%|████      | 25/61 [00:09<00:10,  3.57it/s][A
Training:  43%|████▎     | 26/61 [00:10<00:15,  2.22it/s][A
Training:  46%|████▌     | 28/61 [00

Epoch: 45/63 - Loss: 0.1315 - Accuracy: 0.9487



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:13,  1.95s/it][A
 38%|███▊      | 3/8 [00:02<00:02,  1.78it/s][A
100%|██████████| 8/8 [00:03<00:00,  2.19it/s][A
Epochs:  71%|███████▏  | 45/63 [20:31<08:04, 26.89s/it]

Val Loss: 0.1497 - Val Accuracy: 0.9432



Training:   0%|          | 0/61 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/61 [00:01<01:52,  1.87s/it][A
Training:   3%|▎         | 2/61 [00:01<00:49,  1.20it/s][A
Training:   7%|▋         | 4/61 [00:02<00:19,  2.92it/s][A
Training:  10%|▉         | 6/61 [00:03<00:28,  1.91it/s][A
Training:  13%|█▎        | 8/61 [00:03<00:18,  2.92it/s][A
Training:  15%|█▍        | 9/61 [00:04<00:28,  1.83it/s][A
Training:  18%|█▊        | 11/61 [00:05<00:17,  2.78it/s][A
Training:  21%|██▏       | 13/61 [00:06<00:22,  2.14it/s][A
Training:  25%|██▍       | 15/61 [00:06<00:15,  3.05it/s][A
Training:  28%|██▊       | 17/61 [00:07<00:19,  2.26it/s][A
Training:  33%|███▎      | 20/61 [00:08<00:11,  3.57it/s][A
Training:  36%|███▌      | 22/61 [00:09<00:14,  2.69it/s][A
Training:  39%|███▉      | 24/61 [00:09<00:10,  3.53it/s][A
Training:  43%|████▎     | 26/61 [00:10<00:13,  2.67it/s][A
Training:  48%|████▊     | 29/61 [00:11<00:13,  2.40it/s][A
Training:  51%|█████     | 31/61 [00:1

Epoch: 46/63 - Loss: 0.1334 - Accuracy: 0.9484



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:12,  1.77s/it][A
 25%|██▌       | 2/8 [00:01<00:05,  1.18it/s][A
 50%|█████     | 4/8 [00:02<00:01,  2.73it/s][A
 62%|██████▎   | 5/8 [00:03<00:01,  1.59it/s][A
100%|██████████| 8/8 [00:03<00:00,  2.19it/s][A
Epochs:  73%|███████▎  | 46/63 [20:58<07:38, 26.97s/it]

Val Loss: 0.1416 - Val Accuracy: 0.9426



Training:   0%|          | 0/61 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/61 [00:01<01:44,  1.73s/it][A
Training:   3%|▎         | 2/61 [00:01<00:47,  1.24it/s][A
Training:   5%|▍         | 3/61 [00:02<00:28,  2.03it/s][A
Training:   8%|▊         | 5/61 [00:03<00:32,  1.72it/s][A
Training:  10%|▉         | 6/61 [00:03<00:25,  2.13it/s][A
Training:  15%|█▍        | 9/61 [00:04<00:22,  2.33it/s][A
Training:  20%|█▉        | 12/61 [00:04<00:13,  3.60it/s][A
Training:  21%|██▏       | 13/61 [00:06<00:22,  2.12it/s][A
Training:  26%|██▌       | 16/61 [00:06<00:13,  3.44it/s][A
Training:  30%|██▉       | 18/61 [00:07<00:16,  2.53it/s][A
Training:  33%|███▎      | 20/61 [00:07<00:12,  3.32it/s][A
Training:  34%|███▍      | 21/61 [00:08<00:17,  2.33it/s][A
Training:  36%|███▌      | 22/61 [00:09<00:14,  2.74it/s][A
Training:  39%|███▉      | 24/61 [00:09<00:09,  3.84it/s][A
Training:  41%|████      | 25/61 [00:10<00:16,  2.19it/s][A
Training:  46%|████▌     | 28/61 [00:1

Epoch: 47/63 - Loss: 0.1313 - Accuracy: 0.9477



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:02<00:14,  2.05s/it][A
 50%|█████     | 4/8 [00:02<00:01,  2.36it/s][A
100%|██████████| 8/8 [00:03<00:00,  2.14it/s][A
Epochs:  75%|███████▍  | 47/63 [21:25<07:11, 26.99s/it]

Val Loss: 0.1400 - Val Accuracy: 0.9405



Training:   0%|          | 0/61 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/61 [00:01<01:59,  1.99s/it][A
Training:   3%|▎         | 2/61 [00:02<00:53,  1.09it/s][A
Training:   7%|▋         | 4/61 [00:02<00:21,  2.61it/s][A
Training:   8%|▊         | 5/61 [00:03<00:38,  1.47it/s][A
Training:  11%|█▏        | 7/61 [00:03<00:21,  2.56it/s][A
Training:  15%|█▍        | 9/61 [00:04<00:24,  2.09it/s][A
Training:  16%|█▋        | 10/61 [00:05<00:20,  2.43it/s][A
Training:  21%|██▏       | 13/61 [00:06<00:21,  2.27it/s][A
Training:  23%|██▎       | 14/61 [00:06<00:17,  2.65it/s][A
Training:  26%|██▌       | 16/61 [00:06<00:11,  3.76it/s][A
Training:  28%|██▊       | 17/61 [00:07<00:18,  2.42it/s][A
Training:  30%|██▉       | 18/61 [00:07<00:15,  2.79it/s][A
Training:  33%|███▎      | 20/61 [00:08<00:10,  3.92it/s][A
Training:  34%|███▍      | 21/61 [00:09<00:16,  2.40it/s][A
Training:  36%|███▌      | 22/61 [00:09<00:14,  2.65it/s][A
Training:  39%|███▉      | 24/61 [00:0

Epoch: 48/63 - Loss: 0.1325 - Accuracy: 0.9452



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:12,  1.78s/it][A
 38%|███▊      | 3/8 [00:01<00:02,  1.98it/s][A
 62%|██████▎   | 5/8 [00:03<00:01,  1.88it/s][A
 75%|███████▌  | 6/8 [00:03<00:00,  2.21it/s][A
100%|██████████| 8/8 [00:03<00:00,  2.29it/s][A
Epochs:  76%|███████▌  | 48/63 [21:52<06:42, 26.83s/it]

Val Loss: 0.1383 - Val Accuracy: 0.9405



Training:   0%|          | 0/61 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/61 [00:01<01:56,  1.94s/it][A
Training:   3%|▎         | 2/61 [00:02<00:51,  1.15it/s][A
Training:   7%|▋         | 4/61 [00:02<00:21,  2.60it/s][A
Training:   8%|▊         | 5/61 [00:03<00:32,  1.71it/s][A
Training:  10%|▉         | 6/61 [00:03<00:26,  2.04it/s][A
Training:  13%|█▎        | 8/61 [00:03<00:16,  3.27it/s][A
Training:  15%|█▍        | 9/61 [00:04<00:26,  1.96it/s][A
Training:  16%|█▋        | 10/61 [00:05<00:21,  2.39it/s][A
Training:  20%|█▉        | 12/61 [00:05<00:12,  3.82it/s][A
Training:  21%|██▏       | 13/61 [00:06<00:23,  2.02it/s][A
Training:  23%|██▎       | 14/61 [00:06<00:18,  2.49it/s][A
Training:  26%|██▌       | 16/61 [00:06<00:12,  3.66it/s][A
Training:  28%|██▊       | 17/61 [00:07<00:18,  2.35it/s][A
Training:  30%|██▉       | 18/61 [00:07<00:14,  2.88it/s][A
Training:  34%|███▍      | 21/61 [00:08<00:13,  3.01it/s][A
Training:  36%|███▌      | 22/61 [00:08

Epoch: 49/63 - Loss: 0.1256 - Accuracy: 0.9521



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:13,  1.87s/it][A
 38%|███▊      | 3/8 [00:02<00:02,  1.86it/s][A
100%|██████████| 8/8 [00:03<00:00,  2.22it/s][A
Epochs:  78%|███████▊  | 49/63 [22:18<06:11, 26.55s/it]

Val Loss: 0.1447 - Val Accuracy: 0.9410



Training:   0%|          | 0/61 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/61 [00:01<01:50,  1.85s/it][A
Training:   3%|▎         | 2/61 [00:02<00:54,  1.08it/s][A
Training:   5%|▍         | 3/61 [00:02<00:32,  1.79it/s][A
Training:   7%|▋         | 4/61 [00:02<00:21,  2.65it/s][A
Training:   8%|▊         | 5/61 [00:03<00:34,  1.62it/s][A
Training:  10%|▉         | 6/61 [00:03<00:29,  1.87it/s][A
Training:  13%|█▎        | 8/61 [00:03<00:16,  3.25it/s][A
Training:  15%|█▍        | 9/61 [00:04<00:22,  2.26it/s][A
Training:  16%|█▋        | 10/61 [00:05<00:22,  2.30it/s][A
Training:  21%|██▏       | 13/61 [00:06<00:19,  2.49it/s][A
Training:  23%|██▎       | 14/61 [00:06<00:19,  2.37it/s][A
Training:  26%|██▌       | 16/61 [00:06<00:13,  3.33it/s][A
Training:  28%|██▊       | 17/61 [00:08<00:20,  2.19it/s][A
Training:  30%|██▉       | 18/61 [00:08<00:18,  2.38it/s][A
Training:  34%|███▍      | 21/61 [00:09<00:15,  2.57it/s][A
Training:  36%|███▌      | 22/61 [00:09<

Epoch: 50/63 - Loss: 0.1273 - Accuracy: 0.9492



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:12,  1.85s/it][A
 50%|█████     | 4/8 [00:01<00:01,  2.63it/s][A
100%|██████████| 8/8 [00:03<00:00,  2.29it/s][A
Epochs:  79%|███████▉  | 50/63 [22:45<05:46, 26.68s/it]

Val Loss: 0.1583 - Val Accuracy: 0.9345



Training:   0%|          | 0/61 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/61 [00:01<01:58,  1.97s/it][A
Training:   3%|▎         | 2/61 [00:02<00:52,  1.12it/s][A
Training:   8%|▊         | 5/61 [00:03<00:31,  1.77it/s][A
Training:  11%|█▏        | 7/61 [00:03<00:19,  2.76it/s][A
Training:  15%|█▍        | 9/61 [00:04<00:23,  2.17it/s][A
Training:  16%|█▋        | 10/61 [00:04<00:20,  2.52it/s][A
Training:  18%|█▊        | 11/61 [00:05<00:16,  3.03it/s][A
Training:  20%|█▉        | 12/61 [00:05<00:13,  3.63it/s][A
Training:  21%|██▏       | 13/61 [00:06<00:23,  2.03it/s][A
Training:  23%|██▎       | 14/61 [00:06<00:19,  2.41it/s][A
Training:  28%|██▊       | 17/61 [00:07<00:18,  2.41it/s][A
Training:  30%|██▉       | 18/61 [00:07<00:15,  2.76it/s][A
Training:  33%|███▎      | 20/61 [00:08<00:10,  3.85it/s][A
Training:  34%|███▍      | 21/61 [00:09<00:16,  2.44it/s][A
Training:  36%|███▌      | 22/61 [00:09<00:14,  2.66it/s][A
Training:  41%|████      | 25/61 [00:

Epoch: 51/63 - Loss: 0.1287 - Accuracy: 0.9486



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:13,  1.86s/it][A
 38%|███▊      | 3/8 [00:02<00:02,  1.87it/s][A
 62%|██████▎   | 5/8 [00:03<00:01,  1.64it/s][A
100%|██████████| 8/8 [00:03<00:00,  2.18it/s][A
Epochs:  81%|████████  | 51/63 [23:11<05:20, 26.71s/it]

Val Loss: 0.1505 - Val Accuracy: 0.9394



Training:   0%|          | 0/61 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/61 [00:01<01:37,  1.62s/it][A
Training:   3%|▎         | 2/61 [00:01<00:42,  1.38it/s][A
Training:   5%|▍         | 3/61 [00:01<00:25,  2.27it/s][A
Training:   8%|▊         | 5/61 [00:03<00:33,  1.68it/s][A
Training:  10%|▉         | 6/61 [00:03<00:24,  2.20it/s][A
Training:  11%|█▏        | 7/61 [00:03<00:19,  2.75it/s][A
Training:  15%|█▍        | 9/61 [00:04<00:25,  2.07it/s][A
Training:  16%|█▋        | 10/61 [00:04<00:19,  2.56it/s][A
Training:  20%|█▉        | 12/61 [00:05<00:13,  3.76it/s][A
Training:  21%|██▏       | 13/61 [00:06<00:22,  2.13it/s][A
Training:  23%|██▎       | 14/61 [00:06<00:18,  2.60it/s][A
Training:  26%|██▌       | 16/61 [00:06<00:11,  4.00it/s][A
Training:  28%|██▊       | 17/61 [00:07<00:21,  2.04it/s][A
Training:  30%|██▉       | 18/61 [00:07<00:17,  2.46it/s][A
Training:  33%|███▎      | 20/61 [00:08<00:11,  3.67it/s][A
Training:  34%|███▍      | 21/61 [00:09

Epoch: 52/63 - Loss: 0.1296 - Accuracy: 0.9498



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:12,  1.85s/it][A
 38%|███▊      | 3/8 [00:02<00:02,  1.78it/s][A
 50%|█████     | 4/8 [00:02<00:01,  2.43it/s][A
 62%|██████▎   | 5/8 [00:03<00:01,  1.52it/s][A
100%|██████████| 8/8 [00:03<00:00,  2.21it/s][A
Epochs:  83%|████████▎ | 52/63 [23:39<04:55, 26.85s/it]

Val Loss: 0.1473 - Val Accuracy: 0.9384



Training:   0%|          | 0/61 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/61 [00:01<01:48,  1.81s/it][A
Training:   3%|▎         | 2/61 [00:01<00:47,  1.24it/s][A
Training:   7%|▋         | 4/61 [00:02<00:19,  2.87it/s][A
Training:   8%|▊         | 5/61 [00:03<00:39,  1.43it/s][A
Training:  11%|█▏        | 7/61 [00:03<00:22,  2.43it/s][A
Training:  15%|█▍        | 9/61 [00:04<00:25,  2.03it/s][A
Training:  18%|█▊        | 11/61 [00:05<00:17,  2.89it/s][A
Training:  21%|██▏       | 13/61 [00:06<00:20,  2.31it/s][A
Training:  25%|██▍       | 15/61 [00:06<00:14,  3.22it/s][A
Training:  28%|██▊       | 17/61 [00:07<00:18,  2.35it/s][A
Training:  31%|███       | 19/61 [00:07<00:13,  3.22it/s][A
Training:  34%|███▍      | 21/61 [00:09<00:17,  2.29it/s][A
Training:  39%|███▉      | 24/61 [00:09<00:10,  3.61it/s][A
Training:  43%|████▎     | 26/61 [00:10<00:12,  2.83it/s][A
Training:  48%|████▊     | 29/61 [00:11<00:11,  2.70it/s][A
Training:  49%|████▉     | 30/61 [00:1

Epoch: 53/63 - Loss: 0.1376 - Accuracy: 0.9454



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:11,  1.63s/it][A
 25%|██▌       | 2/8 [00:01<00:04,  1.24it/s][A
 38%|███▊      | 3/8 [00:01<00:02,  2.03it/s][A
 62%|██████▎   | 5/8 [00:03<00:01,  1.85it/s][A
 75%|███████▌  | 6/8 [00:03<00:00,  2.01it/s][A
100%|██████████| 8/8 [00:03<00:00,  2.15it/s][A
Epochs:  84%|████████▍ | 53/63 [24:04<04:25, 26.55s/it]

Val Loss: 0.1406 - Val Accuracy: 0.9405



Training:   0%|          | 0/61 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/61 [00:01<01:41,  1.69s/it][A
Training:   3%|▎         | 2/61 [00:01<00:49,  1.18it/s][A
Training:   5%|▍         | 3/61 [00:02<00:29,  1.94it/s][A
Training:   8%|▊         | 5/61 [00:03<00:35,  1.60it/s][A
Training:  10%|▉         | 6/61 [00:03<00:26,  2.04it/s][A
Training:  13%|█▎        | 8/61 [00:03<00:15,  3.40it/s][A
Training:  15%|█▍        | 9/61 [00:04<00:26,  1.95it/s][A
Training:  18%|█▊        | 11/61 [00:05<00:16,  2.97it/s][A
Training:  21%|██▏       | 13/61 [00:06<00:21,  2.22it/s][A
Training:  23%|██▎       | 14/61 [00:06<00:17,  2.63it/s][A
Training:  25%|██▍       | 15/61 [00:06<00:14,  3.10it/s][A
Training:  26%|██▌       | 16/61 [00:06<00:13,  3.27it/s][A
Training:  28%|██▊       | 17/61 [00:07<00:19,  2.25it/s][A
Training:  30%|██▉       | 18/61 [00:07<00:16,  2.65it/s][A
Training:  33%|███▎      | 20/61 [00:08<00:11,  3.68it/s][A
Training:  34%|███▍      | 21/61 [00:09

Epoch: 54/63 - Loss: 0.1322 - Accuracy: 0.9461



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:13,  1.93s/it][A
 25%|██▌       | 2/8 [00:02<00:05,  1.12it/s][A
 50%|█████     | 4/8 [00:02<00:01,  2.59it/s][A
 62%|██████▎   | 5/8 [00:03<00:01,  1.67it/s][A
 75%|███████▌  | 6/8 [00:03<00:01,  1.98it/s][A
100%|██████████| 8/8 [00:03<00:00,  2.09it/s][A
Epochs:  86%|████████▌ | 54/63 [24:31<03:59, 26.66s/it]

Val Loss: 0.1439 - Val Accuracy: 0.9416



Training:   0%|          | 0/61 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/61 [00:01<01:51,  1.85s/it][A
Training:   3%|▎         | 2/61 [00:02<00:52,  1.12it/s][A
Training:   7%|▋         | 4/61 [00:02<00:20,  2.72it/s][A
Training:   8%|▊         | 5/61 [00:03<00:33,  1.66it/s][A
Training:  10%|▉         | 6/61 [00:03<00:29,  1.85it/s][A
Training:  15%|█▍        | 9/61 [00:04<00:23,  2.26it/s][A
Training:  16%|█▋        | 10/61 [00:05<00:21,  2.42it/s][A
Training:  20%|█▉        | 12/61 [00:05<00:13,  3.52it/s][A
Training:  21%|██▏       | 13/61 [00:06<00:22,  2.10it/s][A
Training:  23%|██▎       | 14/61 [00:06<00:18,  2.49it/s][A
Training:  25%|██▍       | 15/61 [00:06<00:16,  2.87it/s][A
Training:  28%|██▊       | 17/61 [00:07<00:16,  2.59it/s][A
Training:  30%|██▉       | 18/61 [00:07<00:14,  2.89it/s][A
Training:  34%|███▍      | 21/61 [00:09<00:15,  2.65it/s][A
Training:  36%|███▌      | 22/61 [00:09<00:13,  2.85it/s][A
Training:  39%|███▉      | 24/61 [00:0

Epoch: 55/63 - Loss: 0.1310 - Accuracy: 0.9482



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:02<00:15,  2.20s/it][A
 38%|███▊      | 3/8 [00:02<00:03,  1.62it/s][A
 62%|██████▎   | 5/8 [00:03<00:02,  1.47it/s][A
100%|██████████| 8/8 [00:04<00:00,  1.99it/s][A
Epochs:  87%|████████▋ | 55/63 [24:58<03:33, 26.73s/it]

Val Loss: 0.1449 - Val Accuracy: 0.9399



Training:   0%|          | 0/61 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/61 [00:02<02:03,  2.05s/it][A
Training:   5%|▍         | 3/61 [00:02<00:34,  1.69it/s][A
Training:   8%|▊         | 5/61 [00:03<00:36,  1.54it/s][A
Training:  15%|█▍        | 9/61 [00:05<00:25,  2.07it/s][A
Training:  18%|█▊        | 11/61 [00:05<00:17,  2.82it/s][A
Training:  21%|██▏       | 13/61 [00:06<00:22,  2.17it/s][A
Training:  25%|██▍       | 15/61 [00:07<00:17,  2.67it/s][A
Training:  26%|██▌       | 16/61 [00:07<00:15,  2.98it/s][A
Training:  28%|██▊       | 17/61 [00:08<00:19,  2.20it/s][A
Training:  31%|███       | 19/61 [00:08<00:16,  2.61it/s][A
Training:  34%|███▍      | 21/61 [00:09<00:15,  2.55it/s][A
Training:  36%|███▌      | 22/61 [00:09<00:13,  2.96it/s][A
Training:  38%|███▊      | 23/61 [00:09<00:13,  2.78it/s][A
Training:  39%|███▉      | 24/61 [00:10<00:11,  3.31it/s][A
Training:  41%|████      | 25/61 [00:10<00:15,  2.33it/s][A
Training:  43%|████▎     | 26/61 [00

Epoch: 56/63 - Loss: 0.1267 - Accuracy: 0.9495



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:11,  1.71s/it][A
 25%|██▌       | 2/8 [00:02<00:05,  1.11it/s][A
100%|██████████| 8/8 [00:03<00:00,  2.26it/s][A
Epochs:  89%|████████▉ | 56/63 [25:25<03:07, 26.73s/it]

Val Loss: 0.1404 - Val Accuracy: 0.9405



Training:   0%|          | 0/61 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/61 [00:01<01:59,  1.99s/it][A
Training:   3%|▎         | 2/61 [00:02<00:52,  1.13it/s][A
Training:   8%|▊         | 5/61 [00:03<00:31,  1.75it/s][A
Training:  13%|█▎        | 8/61 [00:03<00:17,  3.05it/s][A
Training:  15%|█▍        | 9/61 [00:04<00:25,  2.02it/s][A
Training:  21%|██▏       | 13/61 [00:06<00:20,  2.34it/s][A
Training:  25%|██▍       | 15/61 [00:06<00:15,  2.97it/s][A
Training:  28%|██▊       | 17/61 [00:07<00:18,  2.35it/s][A
Training:  31%|███       | 19/61 [00:08<00:13,  3.01it/s][A
Training:  34%|███▍      | 21/61 [00:08<00:14,  2.69it/s][A
Training:  39%|███▉      | 24/61 [00:09<00:10,  3.63it/s][A
Training:  41%|████      | 25/61 [00:10<00:13,  2.65it/s][A
Training:  43%|████▎     | 26/61 [00:10<00:12,  2.91it/s][A
Training:  46%|████▌     | 28/61 [00:10<00:08,  3.79it/s][A
Training:  48%|████▊     | 29/61 [00:11<00:13,  2.38it/s][A
Training:  49%|████▉     | 30/61 [00:

Epoch: 57/63 - Loss: 0.1298 - Accuracy: 0.9491



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:11,  1.67s/it][A
 25%|██▌       | 2/8 [00:01<00:04,  1.28it/s][A
 62%|██████▎   | 5/8 [00:03<00:01,  1.80it/s][A
100%|██████████| 8/8 [00:03<00:00,  2.24it/s][A
Epochs:  90%|█████████ | 57/63 [25:51<02:39, 26.51s/it]

Val Loss: 0.1401 - Val Accuracy: 0.9405



Training:   0%|          | 0/61 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/61 [00:01<01:48,  1.81s/it][A
Training:   7%|▋         | 4/61 [00:01<00:21,  2.62it/s][A
Training:  10%|▉         | 6/61 [00:03<00:29,  1.85it/s][A
Training:  13%|█▎        | 8/61 [00:03<00:19,  2.78it/s][A
Training:  16%|█▋        | 10/61 [00:05<00:26,  1.95it/s][A
Training:  18%|█▊        | 11/61 [00:05<00:21,  2.31it/s][A
Training:  21%|██▏       | 13/61 [00:06<00:20,  2.31it/s][A
Training:  23%|██▎       | 14/61 [00:06<00:21,  2.22it/s][A
Training:  25%|██▍       | 15/61 [00:06<00:17,  2.68it/s][A
Training:  28%|██▊       | 17/61 [00:07<00:17,  2.45it/s][A
Training:  30%|██▉       | 18/61 [00:08<00:19,  2.24it/s][A
Training:  33%|███▎      | 20/61 [00:08<00:12,  3.28it/s][A
Training:  34%|███▍      | 21/61 [00:09<00:15,  2.55it/s][A
Training:  36%|███▌      | 22/61 [00:09<00:15,  2.47it/s][A
Training:  41%|████      | 25/61 [00:10<00:12,  2.87it/s][A
Training:  43%|████▎     | 26/61 [00

Epoch: 58/63 - Loss: 0.1278 - Accuracy: 0.9490



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:12,  1.84s/it][A
 38%|███▊      | 3/8 [00:01<00:02,  1.90it/s][A
 62%|██████▎   | 5/8 [00:03<00:01,  1.68it/s][A
100%|██████████| 8/8 [00:03<00:00,  2.22it/s][A
Epochs:  92%|█████████▏| 58/63 [26:18<02:12, 26.55s/it]

Val Loss: 0.1519 - Val Accuracy: 0.9420



Training:   0%|          | 0/61 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/61 [00:01<01:50,  1.83s/it][A
Training:   7%|▋         | 4/61 [00:02<00:24,  2.30it/s][A
Training:   8%|▊         | 5/61 [00:03<00:36,  1.54it/s][A
Training:  11%|█▏        | 7/61 [00:03<00:21,  2.49it/s][A
Training:  13%|█▎        | 8/61 [00:03<00:18,  2.86it/s][A
Training:  15%|█▍        | 9/61 [00:05<00:30,  1.69it/s][A
Training:  16%|█▋        | 10/61 [00:05<00:23,  2.16it/s][A
Training:  21%|██▏       | 13/61 [00:06<00:21,  2.23it/s][A
Training:  25%|██▍       | 15/61 [00:06<00:15,  3.05it/s][A
Training:  28%|██▊       | 17/61 [00:08<00:20,  2.12it/s][A
Training:  31%|███       | 19/61 [00:08<00:14,  2.86it/s][A
Training:  34%|███▍      | 21/61 [00:09<00:17,  2.33it/s][A
Training:  36%|███▌      | 22/61 [00:09<00:14,  2.70it/s][A
Training:  38%|███▊      | 23/61 [00:09<00:11,  3.17it/s][A
Training:  41%|████      | 25/61 [00:11<00:15,  2.31it/s][A
Training:  44%|████▍     | 27/61 [00:1

Epoch: 59/63 - Loss: 0.1341 - Accuracy: 0.9456



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:12,  1.79s/it][A
 25%|██▌       | 2/8 [00:01<00:05,  1.16it/s][A
 50%|█████     | 4/8 [00:02<00:01,  2.81it/s][A
 62%|██████▎   | 5/8 [00:03<00:01,  1.52it/s][A
100%|██████████| 8/8 [00:03<00:00,  2.18it/s][A
Epochs:  94%|█████████▎| 59/63 [26:45<01:46, 26.68s/it]

Val Loss: 0.1381 - Val Accuracy: 0.9394



Training:   0%|          | 0/61 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/61 [00:01<01:50,  1.85s/it][A
Training:   3%|▎         | 2/61 [00:01<00:49,  1.20it/s][A
Training:   7%|▋         | 4/61 [00:02<00:20,  2.85it/s][A
Training:   8%|▊         | 5/61 [00:03<00:35,  1.58it/s][A
Training:  11%|█▏        | 7/61 [00:03<00:20,  2.65it/s][A
Training:  15%|█▍        | 9/61 [00:04<00:25,  2.04it/s][A
Training:  16%|█▋        | 10/61 [00:04<00:20,  2.47it/s][A
Training:  20%|█▉        | 12/61 [00:05<00:13,  3.62it/s][A
Training:  21%|██▏       | 13/61 [00:06<00:26,  1.82it/s][A
Training:  25%|██▍       | 15/61 [00:06<00:16,  2.75it/s][A
Training:  28%|██▊       | 17/61 [00:08<00:21,  2.00it/s][A
Training:  31%|███       | 19/61 [00:08<00:15,  2.80it/s][A
Training:  34%|███▍      | 21/61 [00:09<00:17,  2.28it/s][A
Training:  38%|███▊      | 23/61 [00:09<00:12,  3.06it/s][A
Training:  39%|███▉      | 24/61 [00:09<00:10,  3.49it/s][A
Training:  41%|████      | 25/61 [00:1

Epoch: 60/63 - Loss: 0.1253 - Accuracy: 0.9507



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:02<00:14,  2.14s/it][A
 50%|█████     | 4/8 [00:02<00:01,  2.31it/s][A
100%|██████████| 8/8 [00:03<00:00,  2.19it/s][A
Epochs:  95%|█████████▌| 60/63 [27:11<01:19, 26.55s/it]

Val Loss: 0.1612 - Val Accuracy: 0.9330



Training:   0%|          | 0/61 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/61 [00:01<01:58,  1.98s/it][A
Training:   3%|▎         | 2/61 [00:02<00:55,  1.06it/s][A
Training:   8%|▊         | 5/61 [00:03<00:31,  1.77it/s][A
Training:  11%|█▏        | 7/61 [00:03<00:20,  2.65it/s][A
Training:  13%|█▎        | 8/61 [00:03<00:16,  3.14it/s][A
Training:  15%|█▍        | 9/61 [00:05<00:28,  1.80it/s][A
Training:  16%|█▋        | 10/61 [00:05<00:22,  2.27it/s][A
Training:  20%|█▉        | 12/61 [00:05<00:14,  3.44it/s][A
Training:  21%|██▏       | 13/61 [00:06<00:24,  1.99it/s][A
Training:  23%|██▎       | 14/61 [00:06<00:19,  2.44it/s][A
Training:  26%|██▌       | 16/61 [00:06<00:12,  3.65it/s][A
Training:  28%|██▊       | 17/61 [00:07<00:19,  2.20it/s][A
Training:  30%|██▉       | 18/61 [00:08<00:16,  2.54it/s][A
Training:  33%|███▎      | 20/61 [00:08<00:12,  3.38it/s][A
Training:  34%|███▍      | 21/61 [00:09<00:16,  2.37it/s][A
Training:  36%|███▌      | 22/61 [00:0

Epoch: 61/63 - Loss: 0.1275 - Accuracy: 0.9497



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:02<00:14,  2.08s/it][A
 25%|██▌       | 2/8 [00:02<00:05,  1.05it/s][A
 62%|██████▎   | 5/8 [00:03<00:01,  1.81it/s][A
100%|██████████| 8/8 [00:03<00:00,  2.14it/s][A
Epochs:  97%|█████████▋| 61/63 [27:37<00:53, 26.55s/it]

Val Loss: 0.1497 - Val Accuracy: 0.9388



Training:   0%|          | 0/61 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/61 [00:02<02:02,  2.04s/it][A
Training:   5%|▍         | 3/61 [00:02<00:33,  1.71it/s][A
Training:   8%|▊         | 5/61 [00:03<00:34,  1.61it/s][A
Training:  13%|█▎        | 8/61 [00:03<00:17,  3.04it/s][A
Training:  15%|█▍        | 9/61 [00:05<00:28,  1.84it/s][A
Training:  16%|█▋        | 10/61 [00:05<00:22,  2.25it/s][A
Training:  20%|█▉        | 12/61 [00:05<00:14,  3.40it/s][A
Training:  23%|██▎       | 14/61 [00:06<00:20,  2.32it/s][A
Training:  26%|██▌       | 16/61 [00:06<00:14,  3.11it/s][A
Training:  28%|██▊       | 17/61 [00:08<00:22,  1.99it/s][A
Training:  31%|███       | 19/61 [00:08<00:14,  2.85it/s][A
Training:  33%|███▎      | 20/61 [00:08<00:14,  2.88it/s][A
Training:  34%|███▍      | 21/61 [00:09<00:20,  1.94it/s][A
Training:  36%|███▌      | 22/61 [00:09<00:17,  2.29it/s][A
Training:  38%|███▊      | 23/61 [00:10<00:13,  2.82it/s][A
Training:  41%|████      | 25/61 [00:

Epoch: 62/63 - Loss: 0.1311 - Accuracy: 0.9492



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:13,  1.93s/it][A
 38%|███▊      | 3/8 [00:02<00:02,  1.76it/s][A
 62%|██████▎   | 5/8 [00:03<00:01,  1.70it/s][A
100%|██████████| 8/8 [00:03<00:00,  2.24it/s][A
Epochs:  98%|█████████▊| 62/63 [28:04<00:26, 26.69s/it]

Val Loss: 0.1559 - Val Accuracy: 0.9340



Training:   0%|          | 0/61 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/61 [00:01<01:54,  1.91s/it][A
Training:   5%|▍         | 3/61 [00:02<00:32,  1.79it/s][A
Training:   7%|▋         | 4/61 [00:02<00:23,  2.46it/s][A
Training:   8%|▊         | 5/61 [00:03<00:39,  1.43it/s][A
Training:  10%|▉         | 6/61 [00:03<00:27,  1.97it/s][A
Training:  11%|█▏        | 7/61 [00:03<00:20,  2.60it/s][A
Training:  15%|█▍        | 9/61 [00:04<00:25,  2.02it/s][A
Training:  16%|█▋        | 10/61 [00:05<00:20,  2.48it/s][A
Training:  18%|█▊        | 11/61 [00:05<00:16,  3.09it/s][A
Training:  21%|██▏       | 13/61 [00:06<00:22,  2.16it/s][A
Training:  23%|██▎       | 14/61 [00:06<00:19,  2.36it/s][A
Training:  26%|██▌       | 16/61 [00:06<00:12,  3.52it/s][A
Training:  28%|██▊       | 17/61 [00:08<00:20,  2.15it/s][A
Training:  30%|██▉       | 18/61 [00:08<00:16,  2.60it/s][A
Training:  31%|███       | 19/61 [00:08<00:14,  2.96it/s][A
Training:  34%|███▍      | 21/61 [00:09

Epoch: 63/63 - Loss: 0.1327 - Accuracy: 0.9471



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:12,  1.79s/it][A
 25%|██▌       | 2/8 [00:01<00:04,  1.22it/s][A
 50%|█████     | 4/8 [00:02<00:01,  2.88it/s][A
 62%|██████▎   | 5/8 [00:03<00:01,  1.57it/s][A
100%|██████████| 8/8 [00:03<00:00,  2.24it/s][A
Epochs: 100%|██████████| 63/63 [28:32<00:00, 27.18s/it]


Val Loss: 0.1385 - Val Accuracy: 0.9432
Saving best model...


[32m[I 2023-12-14 23:16:11,436][0m Trial 1 finished with value: 0.94315505027771 and parameters: {'learning_rate': 0.0008620992852806465, 'weight_decay': 0.0007106239797227544, 'epsilon': 8.116463668208938e-09, 'batch_size': 232, 'epochs': 63}. Best is trial 1 with value: 0.94315505027771.[0m


Learning rate: 0.0006309153512084874
Weight decay: 0.003266596022466009
Epsilon: 5.483962201164423e-08
Batch size: 57
Number of epochs: 11


Epochs:   0%|          | 0/11 [00:00<?, ?it/s]
Training:   0%|          | 0/246 [00:00<?, ?it/s][A
Training:   0%|          | 1/246 [00:00<02:33,  1.60it/s][A
Training:   2%|▏         | 4/246 [00:00<00:36,  6.66it/s][A
Training:   2%|▏         | 6/246 [00:01<00:36,  6.58it/s][A
Training:   4%|▎         | 9/246 [00:01<00:30,  7.65it/s][A
Training:   5%|▍         | 12/246 [00:01<00:21, 10.86it/s][A
Training:   6%|▌         | 14/246 [00:01<00:27,  8.40it/s][A
Training:   7%|▋         | 17/246 [00:02<00:27,  8.32it/s][A
Training:   9%|▊         | 21/246 [00:02<00:26,  8.63it/s][A
Training:  10%|█         | 25/246 [00:03<00:24,  9.12it/s][A
Training:  12%|█▏        | 29/246 [00:03<00:23,  9.33it/s][A
Training:  13%|█▎        | 33/246 [00:03<00:22,  9.54it/s][A
Training:  15%|█▌        | 37/246 [00:04<00:20, 10.03it/s][A
Training:  17%|█▋        | 41/246 [00:04<00:19, 10.25it/s][A
Training:  18%|█▊        | 45/246 [00:04<00:18, 10.74it/s][A
Training:  20%|█▉        | 48/246 [0

Epoch: 1/11 - Loss: 0.2853 - Accuracy: 0.8737



  0%|          | 0/31 [00:00<?, ?it/s][A
  3%|▎         | 1/31 [00:00<00:20,  1.46it/s][A
 16%|█▌        | 5/31 [00:01<00:04,  5.59it/s][A
 26%|██▌       | 8/31 [00:01<00:02,  9.12it/s][A
 32%|███▏      | 10/31 [00:01<00:03,  6.97it/s][A
 42%|████▏     | 13/31 [00:01<00:02,  7.26it/s][A
 55%|█████▍    | 17/31 [00:02<00:01,  8.30it/s][A
 68%|██████▊   | 21/31 [00:02<00:01,  9.16it/s][A
 81%|████████  | 25/31 [00:03<00:00,  9.00it/s][A
100%|██████████| 31/31 [00:03<00:00,  8.48it/s][A
Epochs:   9%|▉         | 1/11 [00:26<04:25, 26.59s/it]

Val Loss: 0.1762 - Val Accuracy: 0.9218



Training:   0%|          | 0/246 [00:00<?, ?it/s][A
Training:   0%|          | 1/246 [00:00<03:04,  1.33it/s][A
Training:   2%|▏         | 5/246 [00:01<00:41,  5.76it/s][A
Training:   3%|▎         | 8/246 [00:01<00:25,  9.37it/s][A
Training:   4%|▍         | 10/246 [00:01<00:30,  7.66it/s][A
Training:   5%|▌         | 13/246 [00:01<00:31,  7.31it/s][A
Training:   7%|▋         | 16/246 [00:02<00:23,  9.94it/s][A
Training:   7%|▋         | 18/246 [00:02<00:24,  9.38it/s][A
Training:   9%|▊         | 21/246 [00:02<00:26,  8.40it/s][A
Training:  10%|█         | 25/246 [00:03<00:24,  9.07it/s][A
Training:  11%|█▏        | 28/246 [00:03<00:19, 11.43it/s][A
Training:  12%|█▏        | 30/246 [00:03<00:21, 10.06it/s][A
Training:  13%|█▎        | 33/246 [00:03<00:22,  9.46it/s][A
Training:  15%|█▌        | 37/246 [00:04<00:19, 10.59it/s][A
Training:  17%|█▋        | 41/246 [00:04<00:18, 10.89it/s][A
Training:  18%|█▊        | 45/246 [00:04<00:19, 10.47it/s][A
Training:  20%|█▉  

Epoch: 2/11 - Loss: 0.2025 - Accuracy: 0.9164



  0%|          | 0/31 [00:00<?, ?it/s][A
  3%|▎         | 1/31 [00:00<00:19,  1.57it/s][A
 13%|█▎        | 4/31 [00:00<00:04,  6.51it/s][A
 19%|█▉        | 6/31 [00:01<00:03,  6.47it/s][A
 26%|██▌       | 8/31 [00:01<00:02,  7.80it/s][A
 32%|███▏      | 10/31 [00:01<00:02,  8.54it/s][A
 39%|███▊      | 12/31 [00:01<00:02,  8.92it/s][A
 45%|████▌     | 14/31 [00:01<00:01,  9.09it/s][A
 52%|█████▏    | 16/31 [00:02<00:01,  9.91it/s][A
 58%|█████▊    | 18/31 [00:02<00:01,  9.33it/s][A
 65%|██████▍   | 20/31 [00:02<00:01,  9.98it/s][A
 71%|███████   | 22/31 [00:02<00:00,  9.62it/s][A
 77%|███████▋  | 24/31 [00:02<00:00, 10.67it/s][A
 84%|████████▍ | 26/31 [00:03<00:00,  8.38it/s][A
 94%|█████████▎| 29/31 [00:03<00:00, 10.09it/s][A
100%|██████████| 31/31 [00:03<00:00,  8.74it/s][A
Epochs:  18%|█▊        | 2/11 [00:53<03:58, 26.54s/it]

Val Loss: 0.1679 - Val Accuracy: 0.9282



Training:   0%|          | 0/246 [00:00<?, ?it/s][A
Training:   0%|          | 1/246 [00:00<02:46,  1.47it/s][A
Training:   2%|▏         | 4/246 [00:00<00:38,  6.29it/s][A
Training:   2%|▏         | 6/246 [00:01<00:35,  6.85it/s][A
Training:   3%|▎         | 8/246 [00:01<00:27,  8.76it/s][A
Training:   4%|▍         | 10/246 [00:01<00:28,  8.21it/s][A
Training:   5%|▍         | 12/246 [00:01<00:24,  9.60it/s][A
Training:   6%|▌         | 14/246 [00:01<00:25,  9.11it/s][A
Training:   7%|▋         | 16/246 [00:02<00:25,  9.04it/s][A
Training:   7%|▋         | 18/246 [00:02<00:22, 10.08it/s][A
Training:   8%|▊         | 20/246 [00:02<00:22,  9.89it/s][A
Training:   9%|▉         | 22/246 [00:02<00:20, 10.78it/s][A
Training:  10%|▉         | 24/246 [00:02<00:23,  9.61it/s][A
Training:  11%|█         | 26/246 [00:02<00:19, 11.14it/s][A
Training:  11%|█▏        | 28/246 [00:03<00:23,  9.16it/s][A
Training:  13%|█▎        | 32/246 [00:03<00:21, 10.15it/s][A
Training:  14%|█▍   

Epoch: 3/11 - Loss: 0.1736 - Accuracy: 0.9285



  0%|          | 0/31 [00:00<?, ?it/s][A
  3%|▎         | 1/31 [00:00<00:20,  1.46it/s][A
 16%|█▌        | 5/31 [00:00<00:04,  6.09it/s][A
 29%|██▉       | 9/31 [00:01<00:02,  7.66it/s][A
 42%|████▏     | 13/31 [00:01<00:02,  8.83it/s][A
 55%|█████▍    | 17/31 [00:02<00:01,  9.41it/s][A
 68%|██████▊   | 21/31 [00:02<00:01,  9.41it/s][A
 81%|████████  | 25/31 [00:02<00:00,  9.37it/s][A
100%|██████████| 31/31 [00:03<00:00,  9.03it/s][A
Epochs:  27%|██▋       | 3/11 [01:19<03:31, 26.49s/it]

Val Loss: 0.1536 - Val Accuracy: 0.9368



Training:   0%|          | 0/246 [00:00<?, ?it/s][A
Training:   0%|          | 1/246 [00:00<02:40,  1.53it/s][A
Training:   1%|          | 3/246 [00:00<00:55,  4.37it/s][A
Training:   2%|▏         | 6/246 [00:01<00:33,  7.21it/s][A
Training:   3%|▎         | 8/246 [00:01<00:25,  9.26it/s][A
Training:   4%|▍         | 10/246 [00:01<00:29,  8.07it/s][A
Training:   5%|▌         | 13/246 [00:01<00:27,  8.46it/s][A
Training:   6%|▌         | 15/246 [00:02<00:27,  8.27it/s][A
Training:   7%|▋         | 17/246 [00:02<00:25,  8.88it/s][A
Training:   7%|▋         | 18/246 [00:02<00:27,  8.35it/s][A
Training:   9%|▊         | 21/246 [00:02<00:21, 10.26it/s][A
Training:   9%|▉         | 23/246 [00:02<00:21, 10.17it/s][A
Training:  10%|█         | 25/246 [00:02<00:21, 10.49it/s][A
Training:  11%|█         | 27/246 [00:03<00:21, 10.35it/s][A
Training:  12%|█▏        | 29/246 [00:03<00:20, 10.38it/s][A
Training:  13%|█▎        | 31/246 [00:03<00:20, 10.45it/s][A
Training:  13%|█▎   

Epoch: 4/11 - Loss: 0.1673 - Accuracy: 0.9320



  0%|          | 0/31 [00:00<?, ?it/s][A
  3%|▎         | 1/31 [00:00<00:21,  1.38it/s][A
 16%|█▌        | 5/31 [00:01<00:04,  5.64it/s][A
 29%|██▉       | 9/31 [00:01<00:02,  7.81it/s][A
 42%|████▏     | 13/31 [00:01<00:02,  8.70it/s][A
 55%|█████▍    | 17/31 [00:02<00:01,  9.38it/s][A
 61%|██████▏   | 19/31 [00:02<00:01, 10.50it/s][A
 68%|██████▊   | 21/31 [00:02<00:01,  9.23it/s][A
 74%|███████▍  | 23/31 [00:02<00:00, 10.63it/s][A
 81%|████████  | 25/31 [00:02<00:00,  9.46it/s][A
 87%|████████▋ | 27/31 [00:03<00:00, 11.02it/s][A
100%|██████████| 31/31 [00:03<00:00,  8.94it/s][A
Epochs:  36%|███▋      | 4/11 [01:46<03:06, 26.69s/it]

Val Loss: 0.1584 - Val Accuracy: 0.9340



Training:   0%|          | 0/246 [00:00<?, ?it/s][A
Training:   0%|          | 1/246 [00:00<02:35,  1.57it/s][A
Training:   2%|▏         | 5/246 [00:01<00:42,  5.66it/s][A
Training:   3%|▎         | 8/246 [00:01<00:26,  8.82it/s][A
Training:   4%|▍         | 10/246 [00:01<00:31,  7.44it/s][A
Training:   5%|▌         | 13/246 [00:01<00:30,  7.54it/s][A
Training:   7%|▋         | 17/246 [00:02<00:28,  7.94it/s][A
Training:   9%|▊         | 21/246 [00:02<00:25,  8.82it/s][A
Training:  10%|█         | 25/246 [00:03<00:23,  9.32it/s][A
Training:  12%|█▏        | 29/246 [00:03<00:22,  9.44it/s][A
Training:  13%|█▎        | 33/246 [00:03<00:22,  9.66it/s][A
Training:  15%|█▌        | 37/246 [00:04<00:20, 10.01it/s][A
Training:  17%|█▋        | 41/246 [00:04<00:18, 10.95it/s][A
Training:  18%|█▊        | 45/246 [00:04<00:18, 10.88it/s][A
Training:  20%|█▉        | 48/246 [00:05<00:15, 12.57it/s][A
Training:  20%|██        | 50/246 [00:05<00:17, 10.98it/s][A
Training:  22%|██▏ 

Epoch: 5/11 - Loss: 0.1677 - Accuracy: 0.9314



  0%|          | 0/31 [00:00<?, ?it/s][A
  3%|▎         | 1/31 [00:00<00:23,  1.30it/s][A
 16%|█▌        | 5/31 [00:01<00:04,  5.55it/s][A
 29%|██▉       | 9/31 [00:01<00:02,  7.95it/s][A
 42%|████▏     | 13/31 [00:01<00:01,  9.60it/s][A
 48%|████▊     | 15/31 [00:01<00:01, 10.46it/s][A
 55%|█████▍    | 17/31 [00:02<00:01,  9.44it/s][A
 68%|██████▊   | 21/31 [00:02<00:01,  9.45it/s][A
 81%|████████  | 25/31 [00:02<00:00,  9.86it/s][A
100%|██████████| 31/31 [00:03<00:00,  9.36it/s][A
Epochs:  45%|████▌     | 5/11 [02:13<02:39, 26.65s/it]

Val Loss: 0.1459 - Val Accuracy: 0.9385



Training:   0%|          | 0/246 [00:00<?, ?it/s][A
Training:   0%|          | 1/246 [00:00<03:00,  1.36it/s][A
Training:   2%|▏         | 5/246 [00:01<00:42,  5.73it/s][A
Training:   3%|▎         | 8/246 [00:01<00:26,  8.94it/s][A
Training:   4%|▍         | 10/246 [00:01<00:34,  6.94it/s][A
Training:   5%|▌         | 13/246 [00:02<00:33,  6.97it/s][A
Training:   7%|▋         | 17/246 [00:02<00:28,  8.11it/s][A
Training:   9%|▊         | 21/246 [00:02<00:24,  9.28it/s][A
Training:  10%|█         | 25/246 [00:03<00:22,  9.91it/s][A
Training:  12%|█▏        | 29/246 [00:03<00:22,  9.67it/s][A
Training:  13%|█▎        | 33/246 [00:03<00:21, 10.09it/s][A
Training:  15%|█▌        | 37/246 [00:04<00:21,  9.89it/s][A
Training:  17%|█▋        | 41/246 [00:04<00:21,  9.33it/s][A
Training:  18%|█▊        | 45/246 [00:05<00:20,  9.62it/s][A
Training:  20%|█▉        | 49/246 [00:05<00:19, 10.18it/s][A
Training:  21%|██        | 52/246 [00:05<00:15, 12.13it/s][A
Training:  22%|██▏ 

Epoch: 6/11 - Loss: 0.1653 - Accuracy: 0.9316



  0%|          | 0/31 [00:00<?, ?it/s][A
  3%|▎         | 1/31 [00:00<00:18,  1.64it/s][A
 16%|█▌        | 5/31 [00:00<00:04,  6.30it/s][A
 29%|██▉       | 9/31 [00:01<00:02,  8.74it/s][A
 42%|████▏     | 13/31 [00:01<00:01, 10.16it/s][A
 55%|█████▍    | 17/31 [00:01<00:01, 10.64it/s][A
 68%|██████▊   | 21/31 [00:02<00:00, 11.20it/s][A
 74%|███████▍  | 23/31 [00:02<00:00, 12.29it/s][A
 81%|████████  | 25/31 [00:02<00:00, 10.74it/s][A
 87%|████████▋ | 27/31 [00:02<00:00, 11.61it/s][A
100%|██████████| 31/31 [00:02<00:00, 10.37it/s][A
Epochs:  55%|█████▍    | 6/11 [02:39<02:12, 26.56s/it]

Val Loss: 0.1683 - Val Accuracy: 0.9314



Training:   0%|          | 0/246 [00:00<?, ?it/s][A
Training:   0%|          | 1/246 [00:00<02:32,  1.61it/s][A
Training:   2%|▏         | 4/246 [00:00<00:35,  6.89it/s][A
Training:   2%|▏         | 6/246 [00:01<00:36,  6.58it/s][A
Training:   4%|▎         | 9/246 [00:01<00:34,  6.82it/s][A
Training:   5%|▌         | 13/246 [00:01<00:27,  8.47it/s][A
Training:   7%|▋         | 16/246 [00:01<00:20, 11.06it/s][A
Training:   7%|▋         | 18/246 [00:02<00:25,  9.11it/s][A
Training:   9%|▊         | 21/246 [00:02<00:27,  8.23it/s][A
Training:  10%|█         | 25/246 [00:03<00:24,  8.99it/s][A
Training:  12%|█▏        | 29/246 [00:03<00:21, 10.15it/s][A
Training:  13%|█▎        | 33/246 [00:03<00:22,  9.64it/s][A
Training:  15%|█▌        | 37/246 [00:04<00:20, 10.31it/s][A
Training:  17%|█▋        | 41/246 [00:04<00:19, 10.53it/s][A
Training:  18%|█▊        | 44/246 [00:04<00:16, 12.28it/s][A
Training:  19%|█▊        | 46/246 [00:04<00:18, 10.85it/s][A
Training:  20%|█▉   

Epoch: 7/11 - Loss: 0.1534 - Accuracy: 0.9388



  0%|          | 0/31 [00:00<?, ?it/s][A
  3%|▎         | 1/31 [00:00<00:16,  1.81it/s][A
 16%|█▌        | 5/31 [00:00<00:04,  6.39it/s][A
 26%|██▌       | 8/31 [00:01<00:02,  9.13it/s][A
 32%|███▏      | 10/31 [00:01<00:02,  8.62it/s][A
 39%|███▊      | 12/31 [00:01<00:02,  9.43it/s][A
 45%|████▌     | 14/31 [00:01<00:01, 10.49it/s][A
 52%|█████▏    | 16/31 [00:01<00:01, 10.21it/s][A
 58%|█████▊    | 18/31 [00:02<00:01, 10.95it/s][A
 65%|██████▍   | 20/31 [00:02<00:00, 11.77it/s][A
 71%|███████   | 22/31 [00:02<00:00, 11.67it/s][A
 77%|███████▋  | 24/31 [00:02<00:00, 11.78it/s][A
 84%|████████▍ | 26/31 [00:02<00:00, 12.93it/s][A
 90%|█████████ | 28/31 [00:02<00:00, 13.08it/s][A
100%|██████████| 31/31 [00:02<00:00, 10.42it/s][A
Epochs:  64%|██████▎   | 7/11 [03:06<01:46, 26.63s/it]

Val Loss: 0.1619 - Val Accuracy: 0.9346



Training:   0%|          | 0/246 [00:00<?, ?it/s][A
Training:   0%|          | 1/246 [00:00<02:36,  1.56it/s][A
Training:   2%|▏         | 4/246 [00:00<00:36,  6.64it/s][A
Training:   2%|▏         | 6/246 [00:01<00:37,  6.36it/s][A
Training:   4%|▎         | 9/246 [00:01<00:33,  7.09it/s][A
Training:   5%|▌         | 13/246 [00:01<00:27,  8.46it/s][A
Training:   7%|▋         | 16/246 [00:01<00:20, 11.14it/s][A
Training:   7%|▋         | 18/246 [00:02<00:23,  9.74it/s][A
Training:   9%|▊         | 21/246 [00:02<00:24,  9.24it/s][A
Training:   9%|▉         | 23/246 [00:02<00:21, 10.57it/s][A
Training:  10%|█         | 25/246 [00:02<00:24,  9.11it/s][A
Training:  11%|█         | 27/246 [00:03<00:20, 10.45it/s][A
Training:  12%|█▏        | 29/246 [00:03<00:22,  9.56it/s][A
Training:  13%|█▎        | 31/246 [00:03<00:21, 10.11it/s][A
Training:  13%|█▎        | 33/246 [00:03<00:20, 10.34it/s][A
Training:  14%|█▍        | 35/246 [00:03<00:21, 10.01it/s][A
Training:  15%|█▌   

Epoch: 8/11 - Loss: 0.1527 - Accuracy: 0.9384



  0%|          | 0/31 [00:00<?, ?it/s][A
  3%|▎         | 1/31 [00:00<00:16,  1.81it/s][A
 10%|▉         | 3/31 [00:00<00:05,  5.47it/s][A
 16%|█▌        | 5/31 [00:00<00:03,  6.99it/s][A
 23%|██▎       | 7/31 [00:01<00:02,  8.99it/s][A
 29%|██▉       | 9/31 [00:01<00:02,  9.46it/s][A
 35%|███▌      | 11/31 [00:01<00:02,  8.80it/s][A
 42%|████▏     | 13/31 [00:01<00:01,  9.92it/s][A
 48%|████▊     | 15/31 [00:01<00:01,  9.40it/s][A
 55%|█████▍    | 17/31 [00:02<00:01,  9.60it/s][A
 61%|██████▏   | 19/31 [00:02<00:01,  9.21it/s][A
 68%|██████▊   | 21/31 [00:02<00:01,  8.53it/s][A
 74%|███████▍  | 23/31 [00:02<00:00,  9.35it/s][A
 81%|████████  | 25/31 [00:02<00:00,  9.26it/s][A
 87%|████████▋ | 27/31 [00:03<00:00, 10.53it/s][A
100%|██████████| 31/31 [00:03<00:00,  9.25it/s][A
Epochs:  73%|███████▎  | 8/11 [03:33<01:20, 26.67s/it]

Val Loss: 0.1471 - Val Accuracy: 0.9385



Training:   0%|          | 0/246 [00:00<?, ?it/s][A
Training:   0%|          | 1/246 [00:00<02:25,  1.68it/s][A
Training:   2%|▏         | 5/246 [00:00<00:33,  7.15it/s][A
Training:   4%|▎         | 9/246 [00:01<00:26,  8.99it/s][A
Training:   5%|▌         | 13/246 [00:01<00:22, 10.17it/s][A
Training:   7%|▋         | 17/246 [00:01<00:22, 10.26it/s][A
Training:   9%|▊         | 21/246 [00:02<00:21, 10.54it/s][A
Training:  10%|▉         | 24/246 [00:02<00:18, 11.86it/s][A
Training:  11%|█         | 26/246 [00:02<00:21, 10.22it/s][A
Training:  11%|█▏        | 28/246 [00:02<00:19, 11.05it/s][A
Training:  12%|█▏        | 30/246 [00:03<00:20, 10.35it/s][A
Training:  13%|█▎        | 32/246 [00:03<00:18, 11.54it/s][A
Training:  14%|█▍        | 34/246 [00:03<00:21,  9.93it/s][A
Training:  15%|█▍        | 36/246 [00:03<00:18, 11.43it/s][A
Training:  15%|█▌        | 38/246 [00:03<00:20, 10.39it/s][A
Training:  16%|█▋        | 40/246 [00:03<00:17, 11.73it/s][A
Training:  17%|█▋  

Epoch: 9/11 - Loss: 0.1582 - Accuracy: 0.9345



  0%|          | 0/31 [00:00<?, ?it/s][A
  3%|▎         | 1/31 [00:00<00:19,  1.51it/s][A
 16%|█▌        | 5/31 [00:00<00:04,  6.47it/s][A
 29%|██▉       | 9/31 [00:01<00:02,  8.61it/s][A
 42%|████▏     | 13/31 [00:01<00:01,  9.96it/s][A
 55%|█████▍    | 17/31 [00:01<00:01, 11.07it/s][A
 65%|██████▍   | 20/31 [00:01<00:00, 13.54it/s][A
 71%|███████   | 22/31 [00:02<00:00, 10.69it/s][A
 81%|████████  | 25/31 [00:02<00:00, 11.13it/s][A
 87%|████████▋ | 27/31 [00:02<00:00, 11.90it/s][A
 94%|█████████▎| 29/31 [00:02<00:00, 11.10it/s][A
100%|██████████| 31/31 [00:03<00:00,  9.79it/s][A
Epochs:  82%|████████▏ | 9/11 [03:59<00:53, 26.65s/it]

Val Loss: 0.1568 - Val Accuracy: 0.9310



Training:   0%|          | 0/246 [00:00<?, ?it/s][A
Training:   0%|          | 1/246 [00:00<03:17,  1.24it/s][A
Training:   2%|▏         | 4/246 [00:00<00:44,  5.44it/s][A
Training:   2%|▏         | 6/246 [00:01<00:38,  6.30it/s][A
Training:   4%|▎         | 9/246 [00:01<00:31,  7.50it/s][A
Training:   5%|▌         | 13/246 [00:01<00:24,  9.61it/s][A
Training:   7%|▋         | 17/246 [00:02<00:20, 11.08it/s][A
Training:   9%|▊         | 21/246 [00:02<00:18, 12.25it/s][A
Training:  10%|▉         | 24/246 [00:02<00:15, 14.67it/s][A
Training:  11%|█         | 26/246 [00:02<00:17, 12.35it/s][A
Training:  12%|█▏        | 29/246 [00:03<00:19, 11.16it/s][A
Training:  13%|█▎        | 33/246 [00:03<00:19, 10.82it/s][A
Training:  15%|█▍        | 36/246 [00:03<00:16, 13.08it/s][A
Training:  15%|█▌        | 38/246 [00:03<00:18, 11.49it/s][A
Training:  16%|█▋        | 40/246 [00:03<00:16, 12.68it/s][A
Training:  17%|█▋        | 42/246 [00:04<00:19, 10.72it/s][A
Training:  18%|█▊   

Epoch: 10/11 - Loss: 0.1498 - Accuracy: 0.9404



  0%|          | 0/31 [00:00<?, ?it/s][A
  3%|▎         | 1/31 [00:00<00:17,  1.68it/s][A
 16%|█▌        | 5/31 [00:00<00:03,  7.03it/s][A
 29%|██▉       | 9/31 [00:01<00:02,  9.55it/s][A
 42%|████▏     | 13/31 [00:01<00:01, 11.07it/s][A
 52%|█████▏    | 16/31 [00:01<00:01, 13.76it/s][A
 58%|█████▊    | 18/31 [00:01<00:01, 11.25it/s][A
 68%|██████▊   | 21/31 [00:02<00:00, 10.43it/s][A
 81%|████████  | 25/31 [00:02<00:00, 11.07it/s][A
100%|██████████| 31/31 [00:02<00:00, 10.84it/s][A
Epochs:  91%|█████████ | 10/11 [04:25<00:26, 26.32s/it]

Val Loss: 0.1424 - Val Accuracy: 0.9385



Training:   0%|          | 0/246 [00:00<?, ?it/s][A
Training:   0%|          | 1/246 [00:00<02:29,  1.64it/s][A
Training:   2%|▏         | 5/246 [00:00<00:37,  6.47it/s][A
Training:   4%|▎         | 9/246 [00:01<00:28,  8.26it/s][A
Training:   5%|▍         | 12/246 [00:01<00:20, 11.20it/s][A
Training:   6%|▌         | 14/246 [00:01<00:24,  9.55it/s][A
Training:   7%|▋         | 17/246 [00:02<00:29,  7.66it/s][A
Training:   9%|▊         | 21/246 [00:02<00:25,  8.69it/s][A
Training:  10%|█         | 25/246 [00:02<00:22,  9.64it/s][A
Training:  12%|█▏        | 29/246 [00:03<00:19, 10.93it/s][A
Training:  13%|█▎        | 33/246 [00:03<00:17, 11.98it/s][A
Training:  15%|█▌        | 37/246 [00:03<00:15, 13.39it/s][A
Training:  17%|█▋        | 41/246 [00:04<00:15, 12.98it/s][A
Training:  18%|█▊        | 45/246 [00:04<00:15, 12.67it/s][A
Training:  20%|█▉        | 49/246 [00:04<00:16, 11.67it/s][A
Training:  22%|██▏       | 53/246 [00:05<00:16, 11.66it/s][A
Training:  23%|██▎ 

Epoch: 11/11 - Loss: 0.1520 - Accuracy: 0.9380



  0%|          | 0/31 [00:00<?, ?it/s][A
  3%|▎         | 1/31 [00:00<00:17,  1.69it/s][A
 13%|█▎        | 4/31 [00:00<00:03,  6.93it/s][A
 19%|█▉        | 6/31 [00:01<00:04,  6.24it/s][A
 29%|██▉       | 9/31 [00:01<00:03,  7.27it/s][A
 42%|████▏     | 13/31 [00:01<00:02,  8.72it/s][A
 52%|█████▏    | 16/31 [00:01<00:01, 11.03it/s][A
 58%|█████▊    | 18/31 [00:02<00:01,  9.07it/s][A
 68%|██████▊   | 21/31 [00:02<00:01,  9.88it/s][A
 77%|███████▋  | 24/31 [00:02<00:00, 12.40it/s][A
 84%|████████▍ | 26/31 [00:02<00:00, 10.43it/s][A
100%|██████████| 31/31 [00:03<00:00,  9.37it/s][A
Epochs: 100%|██████████| 11/11 [04:51<00:00, 26.52s/it]


Val Loss: 0.1477 - Val Accuracy: 0.9336


[32m[I 2023-12-14 23:21:03,779][0m Trial 2 finished with value: 0.9336405992507935 and parameters: {'learning_rate': 0.0006309153512084874, 'weight_decay': 0.003266596022466009, 'epsilon': 5.483962201164423e-08, 'batch_size': 57, 'epochs': 11}. Best is trial 1 with value: 0.94315505027771.[0m


Learning rate: 0.02816733929912164
Weight decay: 0.001632793638917931
Epsilon: 4.700125142204821e-08
Batch size: 125
Number of epochs: 69


Epochs:   0%|          | 0/69 [00:00<?, ?it/s]
Training:   0%|          | 0/112 [00:00<?, ?it/s][A
Training:   1%|          | 1/112 [00:01<02:02,  1.10s/it][A
Training:   4%|▍         | 5/112 [00:02<00:38,  2.79it/s][A
Training:   6%|▋         | 7/112 [00:02<00:26,  4.03it/s][A
Training:   8%|▊         | 9/112 [00:02<00:30,  3.42it/s][A
Training:  12%|█▏        | 13/112 [00:03<00:24,  4.11it/s][A
Training:  14%|█▍        | 16/112 [00:03<00:16,  5.84it/s][A
Training:  16%|█▌        | 18/112 [00:04<00:20,  4.60it/s][A
Training:  19%|█▉        | 21/112 [00:05<00:19,  4.63it/s][A
Training:  21%|██▏       | 24/112 [00:05<00:13,  6.38it/s][A
Training:  23%|██▎       | 26/112 [00:06<00:18,  4.65it/s][A
Training:  25%|██▌       | 28/112 [00:06<00:14,  5.76it/s][A
Training:  27%|██▋       | 30/112 [00:06<00:18,  4.50it/s][A
Training:  29%|██▉       | 33/112 [00:07<00:17,  4.39it/s][A
Training:  32%|███▏      | 36/112 [00:07<00:12,  6.02it/s][A
Training:  34%|███▍      | 38/112 [0

Epoch: 1/69 - Loss: 7.6669 - Accuracy: 0.7569



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:14,  1.15s/it][A
 14%|█▍        | 2/14 [00:01<00:06,  1.85it/s][A
 21%|██▏       | 3/14 [00:01<00:03,  2.83it/s][A
 36%|███▌      | 5/14 [00:02<00:02,  3.04it/s][A
 50%|█████     | 7/14 [00:02<00:01,  4.62it/s][A
 64%|██████▍   | 9/14 [00:02<00:01,  3.41it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.73it/s][A
Epochs:   1%|▏         | 1/69 [00:27<30:37, 27.03s/it]

Val Loss: 0.2319 - Val Accuracy: 0.9106



Training:   0%|          | 0/112 [00:00<?, ?it/s][A
Training:   1%|          | 1/112 [00:00<01:34,  1.17it/s][A
Training:   3%|▎         | 3/112 [00:00<00:28,  3.77it/s][A
Training:   4%|▍         | 5/112 [00:01<00:27,  3.87it/s][A
Training:   5%|▌         | 6/112 [00:01<00:23,  4.60it/s][A
Training:   8%|▊         | 9/112 [00:02<00:20,  5.12it/s][A
Training:   9%|▉         | 10/112 [00:02<00:20,  5.10it/s][A
Training:  11%|█         | 12/112 [00:02<00:14,  6.72it/s][A
Training:  12%|█▏        | 13/112 [00:02<00:20,  4.72it/s][A
Training:  12%|█▎        | 14/112 [00:03<00:20,  4.80it/s][A
Training:  14%|█▍        | 16/112 [00:03<00:14,  6.54it/s][A
Training:  15%|█▌        | 17/112 [00:03<00:21,  4.41it/s][A
Training:  16%|█▌        | 18/112 [00:03<00:20,  4.51it/s][A
Training:  18%|█▊        | 20/112 [00:04<00:14,  6.49it/s][A
Training:  19%|█▉        | 21/112 [00:04<00:19,  4.59it/s][A
Training:  20%|█▉        | 22/112 [00:04<00:18,  4.79it/s][A
Training:  22%|██▏   

Epoch: 2/69 - Loss: 0.2088 - Accuracy: 0.9111



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:16,  1.23s/it][A
 29%|██▊       | 4/14 [00:01<00:02,  3.77it/s][A
 43%|████▎     | 6/14 [00:02<00:02,  3.11it/s][A
 64%|██████▍   | 9/14 [00:03<00:01,  3.23it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.71it/s][A
Epochs:   3%|▎         | 2/69 [00:53<29:45, 26.65s/it]

Val Loss: 0.2055 - Val Accuracy: 0.9175



Training:   0%|          | 0/112 [00:00<?, ?it/s][A
Training:   1%|          | 1/112 [00:01<02:37,  1.42s/it][A
Training:   4%|▍         | 5/112 [00:02<00:38,  2.79it/s][A
Training:   8%|▊         | 9/112 [00:02<00:25,  3.97it/s][A
Training:  10%|▉         | 11/112 [00:02<00:19,  5.07it/s][A
Training:  12%|█▏        | 13/112 [00:03<00:23,  4.20it/s][A
Training:  13%|█▎        | 15/112 [00:03<00:18,  5.36it/s][A
Training:  15%|█▌        | 17/112 [00:04<00:21,  4.35it/s][A
Training:  19%|█▉        | 21/112 [00:05<00:20,  4.41it/s][A
Training:  22%|██▏       | 25/112 [00:05<00:17,  5.02it/s][A
Training:  26%|██▌       | 29/112 [00:06<00:15,  5.37it/s][A
Training:  29%|██▊       | 32/112 [00:06<00:11,  6.86it/s][A
Training:  30%|███       | 34/112 [00:07<00:14,  5.26it/s][A
Training:  33%|███▎      | 37/112 [00:08<00:15,  4.92it/s][A
Training:  34%|███▍      | 38/112 [00:08<00:15,  4.93it/s][A
Training:  37%|███▋      | 41/112 [00:08<00:14,  4.87it/s][A
Training:  38%|███▊

Epoch: 3/69 - Loss: 0.1986 - Accuracy: 0.9177



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:00<00:12,  1.08it/s][A
 14%|█▍        | 2/14 [00:01<00:05,  2.23it/s][A
 36%|███▌      | 5/14 [00:01<00:02,  3.12it/s][A
 43%|████▎     | 6/14 [00:01<00:02,  3.77it/s][A
 57%|█████▋    | 8/14 [00:02<00:01,  5.65it/s][A
 71%|███████▏  | 10/14 [00:02<00:01,  3.91it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.85it/s][A
Epochs:   4%|▍         | 3/69 [01:20<29:30, 26.83s/it]

Val Loss: 0.1811 - Val Accuracy: 0.9232



Training:   0%|          | 0/112 [00:00<?, ?it/s][A
Training:   1%|          | 1/112 [00:00<01:47,  1.03it/s][A
Training:   3%|▎         | 3/112 [00:01<00:35,  3.10it/s][A
Training:   4%|▍         | 5/112 [00:01<00:28,  3.73it/s][A
Training:   6%|▋         | 7/112 [00:01<00:18,  5.55it/s][A
Training:   8%|▊         | 9/112 [00:02<00:21,  4.90it/s][A
Training:  10%|▉         | 11/112 [00:02<00:18,  5.50it/s][A
Training:  12%|█▏        | 13/112 [00:02<00:19,  5.01it/s][A
Training:  13%|█▎        | 15/112 [00:03<00:19,  5.06it/s][A
Training:  15%|█▌        | 17/112 [00:03<00:19,  4.85it/s][A
Training:  17%|█▋        | 19/112 [00:04<00:19,  4.69it/s][A
Training:  19%|█▉        | 21/112 [00:04<00:17,  5.08it/s][A
Training:  21%|██        | 23/112 [00:05<00:18,  4.76it/s][A
Training:  22%|██▏       | 25/112 [00:05<00:16,  5.38it/s][A
Training:  24%|██▍       | 27/112 [00:05<00:16,  5.17it/s][A
Training:  26%|██▌       | 29/112 [00:05<00:14,  5.93it/s][A
Training:  28%|██▊   

Epoch: 4/69 - Loss: 0.1914 - Accuracy: 0.9220



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:13,  1.01s/it][A
 29%|██▊       | 4/14 [00:01<00:02,  4.10it/s][A
 36%|███▌      | 5/14 [00:01<00:03,  2.80it/s][A
 57%|█████▋    | 8/14 [00:02<00:01,  5.27it/s][A
 71%|███████▏  | 10/14 [00:02<00:00,  4.08it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.90it/s][A
Epochs:   6%|▌         | 4/69 [01:47<29:07, 26.88s/it]

Val Loss: 0.2096 - Val Accuracy: 0.9118



Training:   0%|          | 0/112 [00:00<?, ?it/s][A
Training:   1%|          | 1/112 [00:01<02:13,  1.20s/it][A
Training:   4%|▎         | 4/112 [00:01<00:28,  3.79it/s][A
Training:   5%|▌         | 6/112 [00:01<00:29,  3.62it/s][A
Training:   7%|▋         | 8/112 [00:02<00:20,  5.17it/s][A
Training:   9%|▉         | 10/112 [00:02<00:21,  4.64it/s][A
Training:  10%|▉         | 11/112 [00:02<00:19,  5.18it/s][A
Training:  12%|█▏        | 13/112 [00:03<00:21,  4.57it/s][A
Training:  13%|█▎        | 15/112 [00:03<00:19,  5.09it/s][A
Training:  15%|█▌        | 17/112 [00:04<00:20,  4.53it/s][A
Training:  16%|█▌        | 18/112 [00:04<00:18,  4.95it/s][A
Training:  17%|█▋        | 19/112 [00:04<00:19,  4.69it/s][A
Training:  19%|█▉        | 21/112 [00:04<00:18,  4.84it/s][A
Training:  20%|█▉        | 22/112 [00:05<00:18,  4.82it/s][A
Training:  21%|██        | 23/112 [00:05<00:19,  4.53it/s][A
Training:  22%|██▏       | 25/112 [00:05<00:16,  5.34it/s][A
Training:  23%|██▎  

Epoch: 5/69 - Loss: 0.1810 - Accuracy: 0.9287



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:13,  1.01s/it][A
 14%|█▍        | 2/14 [00:01<00:06,  1.97it/s][A
 36%|███▌      | 5/14 [00:01<00:02,  3.31it/s][A
 43%|████▎     | 6/14 [00:02<00:02,  3.52it/s][A
 64%|██████▍   | 9/14 [00:02<00:01,  3.72it/s][A
 71%|███████▏  | 10/14 [00:02<00:00,  4.22it/s][A
 93%|█████████▎| 13/14 [00:03<00:00,  4.53it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.74it/s][A
Epochs:   7%|▋         | 5/69 [02:14<28:40, 26.88s/it]

Val Loss: 0.2089 - Val Accuracy: 0.9147



Training:   0%|          | 0/112 [00:00<?, ?it/s][A
Training:   1%|          | 1/112 [00:00<01:45,  1.06it/s][A
Training:   2%|▏         | 2/112 [00:01<00:55,  1.98it/s][A
Training:   4%|▍         | 5/112 [00:01<00:29,  3.61it/s][A
Training:   5%|▌         | 6/112 [00:01<00:28,  3.68it/s][A
Training:   8%|▊         | 9/112 [00:02<00:22,  4.63it/s][A
Training:   9%|▉         | 10/112 [00:02<00:21,  4.83it/s][A
Training:  12%|█▏        | 13/112 [00:03<00:18,  5.27it/s][A
Training:  13%|█▎        | 15/112 [00:03<00:14,  6.72it/s][A
Training:  15%|█▌        | 17/112 [00:03<00:18,  5.09it/s][A
Training:  19%|█▉        | 21/112 [00:04<00:18,  5.00it/s][A
Training:  21%|██        | 23/112 [00:04<00:14,  5.95it/s][A
Training:  22%|██▏       | 25/112 [00:05<00:19,  4.50it/s][A
Training:  24%|██▍       | 27/112 [00:05<00:14,  5.68it/s][A
Training:  26%|██▌       | 29/112 [00:06<00:18,  4.41it/s][A
Training:  29%|██▉       | 33/112 [00:07<00:15,  5.01it/s][A
Training:  33%|███▎  

Epoch: 6/69 - Loss: 0.1817 - Accuracy: 0.9272



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:13,  1.06s/it][A
 29%|██▊       | 4/14 [00:01<00:02,  3.72it/s][A
 36%|███▌      | 5/14 [00:01<00:03,  2.78it/s][A
 50%|█████     | 7/14 [00:02<00:01,  4.46it/s][A
 64%|██████▍   | 9/14 [00:02<00:01,  3.58it/s][A
 79%|███████▊  | 11/14 [00:02<00:00,  5.05it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.85it/s][A
Epochs:   9%|▊         | 6/69 [02:40<27:55, 26.60s/it]

Val Loss: 0.2519 - Val Accuracy: 0.9071



Training:   0%|          | 0/112 [00:00<?, ?it/s][A
Training:   1%|          | 1/112 [00:01<01:59,  1.08s/it][A
Training:   2%|▏         | 2/112 [00:01<01:01,  1.78it/s][A
Training:   4%|▎         | 4/112 [00:01<00:26,  4.03it/s][A
Training:   4%|▍         | 5/112 [00:01<00:36,  2.95it/s][A
Training:   5%|▌         | 6/112 [00:02<00:28,  3.69it/s][A
Training:   8%|▊         | 9/112 [00:02<00:26,  3.95it/s][A
Training:   9%|▉         | 10/112 [00:03<00:26,  3.92it/s][A
Training:  11%|█         | 12/112 [00:03<00:18,  5.44it/s][A
Training:  12%|█▏        | 13/112 [00:03<00:25,  3.86it/s][A
Training:  12%|█▎        | 14/112 [00:03<00:21,  4.46it/s][A
Training:  15%|█▌        | 17/112 [00:04<00:21,  4.43it/s][A
Training:  17%|█▋        | 19/112 [00:04<00:15,  5.85it/s][A
Training:  19%|█▉        | 21/112 [00:05<00:19,  4.57it/s][A
Training:  21%|██        | 23/112 [00:05<00:14,  5.95it/s][A
Training:  22%|██▏       | 25/112 [00:06<00:19,  4.37it/s][A
Training:  26%|██▌    

Epoch: 7/69 - Loss: 0.1784 - Accuracy: 0.9279



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:00<00:12,  1.04it/s][A
 21%|██▏       | 3/14 [00:01<00:03,  3.37it/s][A
 36%|███▌      | 5/14 [00:01<00:02,  3.03it/s][A
 57%|█████▋    | 8/14 [00:01<00:01,  5.47it/s][A
 71%|███████▏  | 10/14 [00:02<00:00,  4.13it/s][A
100%|██████████| 14/14 [00:03<00:00,  4.13it/s][A
Epochs:  10%|█         | 7/69 [03:06<27:16, 26.40s/it]

Val Loss: 0.1836 - Val Accuracy: 0.9244



Training:   0%|          | 0/112 [00:00<?, ?it/s][A
Training:   1%|          | 1/112 [00:01<02:08,  1.16s/it][A
Training:   3%|▎         | 3/112 [00:01<00:37,  2.90it/s][A
Training:   4%|▍         | 5/112 [00:02<00:39,  2.69it/s][A
Training:   7%|▋         | 8/112 [00:02<00:20,  4.96it/s][A
Training:   9%|▉         | 10/112 [00:03<00:27,  3.71it/s][A
Training:  12%|█▏        | 13/112 [00:03<00:27,  3.66it/s][A
Training:  13%|█▎        | 15/112 [00:03<00:20,  4.70it/s][A
Training:  15%|█▌        | 17/112 [00:04<00:22,  4.29it/s][A
Training:  19%|█▉        | 21/112 [00:05<00:17,  5.07it/s][A
Training:  21%|██▏       | 24/112 [00:05<00:13,  6.73it/s][A
Training:  23%|██▎       | 26/112 [00:05<00:15,  5.45it/s][A
Training:  26%|██▌       | 29/112 [00:06<00:17,  4.88it/s][A
Training:  29%|██▊       | 32/112 [00:06<00:12,  6.64it/s][A
Training:  30%|███       | 34/112 [00:07<00:15,  5.01it/s][A
Training:  33%|███▎      | 37/112 [00:08<00:16,  4.58it/s][A
Training:  35%|███▍ 

Epoch: 8/69 - Loss: 0.1627 - Accuracy: 0.9325



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:13,  1.07s/it][A
 14%|█▍        | 2/14 [00:01<00:06,  1.90it/s][A
 29%|██▊       | 4/14 [00:01<00:02,  4.17it/s][A
 36%|███▌      | 5/14 [00:02<00:03,  2.66it/s][A
 64%|██████▍   | 9/14 [00:02<00:01,  3.61it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.72it/s][A
Epochs:  12%|█▏        | 8/69 [03:32<26:53, 26.44s/it]

Val Loss: 0.1614 - Val Accuracy: 0.9307



Training:   0%|          | 0/112 [00:00<?, ?it/s][A
Training:   1%|          | 1/112 [00:01<02:24,  1.30s/it][A
Training:   3%|▎         | 3/112 [00:01<00:40,  2.66it/s][A
Training:   4%|▍         | 5/112 [00:02<00:37,  2.87it/s][A
Training:   6%|▋         | 7/112 [00:02<00:23,  4.41it/s][A
Training:   8%|▊         | 9/112 [00:02<00:29,  3.53it/s][A
Training:  11%|█         | 12/112 [00:03<00:17,  5.79it/s][A
Training:  12%|█▎        | 14/112 [00:03<00:24,  3.99it/s][A
Training:  15%|█▌        | 17/112 [00:04<00:24,  3.94it/s][A
Training:  17%|█▋        | 19/112 [00:04<00:18,  5.02it/s][A
Training:  19%|█▉        | 21/112 [00:05<00:21,  4.25it/s][A
Training:  22%|██▏       | 25/112 [00:06<00:17,  4.84it/s][A
Training:  26%|██▌       | 29/112 [00:06<00:15,  5.38it/s][A
Training:  28%|██▊       | 31/112 [00:06<00:12,  6.25it/s][A
Training:  29%|██▉       | 33/112 [00:07<00:15,  5.03it/s][A
Training:  33%|███▎      | 37/112 [00:08<00:15,  4.88it/s][A
Training:  35%|███▍  

Epoch: 9/69 - Loss: 0.2294 - Accuracy: 0.9142



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:16,  1.31s/it][A
 29%|██▊       | 4/14 [00:01<00:02,  3.54it/s][A
 43%|████▎     | 6/14 [00:02<00:02,  3.24it/s][A
 57%|█████▋    | 8/14 [00:02<00:01,  4.57it/s][A
 71%|███████▏  | 10/14 [00:02<00:01,  3.98it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.78it/s][A
Epochs:  13%|█▎        | 9/69 [03:59<26:26, 26.43s/it]

Val Loss: 0.1666 - Val Accuracy: 0.9359



Training:   0%|          | 0/112 [00:00<?, ?it/s][A
Training:   1%|          | 1/112 [00:01<02:00,  1.08s/it][A
Training:   3%|▎         | 3/112 [00:01<00:36,  3.00it/s][A
Training:   4%|▍         | 5/112 [00:01<00:37,  2.85it/s][A
Training:   6%|▋         | 7/112 [00:02<00:24,  4.21it/s][A
Training:   8%|▊         | 9/112 [00:02<00:28,  3.65it/s][A
Training:  11%|█         | 12/112 [00:02<00:17,  5.86it/s][A
Training:  12%|█▎        | 14/112 [00:03<00:24,  4.04it/s][A
Training:  15%|█▌        | 17/112 [00:04<00:23,  4.05it/s][A
Training:  16%|█▌        | 18/112 [00:04<00:21,  4.45it/s][A
Training:  19%|█▉        | 21/112 [00:05<00:21,  4.14it/s][A
Training:  21%|██        | 23/112 [00:05<00:17,  5.22it/s][A
Training:  22%|██▏       | 25/112 [00:06<00:21,  4.13it/s][A
Training:  25%|██▌       | 28/112 [00:06<00:14,  5.93it/s][A
Training:  27%|██▋       | 30/112 [00:07<00:17,  4.76it/s][A
Training:  29%|██▉       | 33/112 [00:07<00:18,  4.38it/s][A
Training:  33%|███▎  

Epoch: 10/69 - Loss: 0.1683 - Accuracy: 0.9352



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:14,  1.15s/it][A
 29%|██▊       | 4/14 [00:01<00:02,  4.00it/s][A
 43%|████▎     | 6/14 [00:02<00:02,  2.97it/s][A
 64%|██████▍   | 9/14 [00:02<00:01,  3.40it/s][A
 86%|████████▌ | 12/14 [00:03<00:00,  4.95it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.80it/s][A
Epochs:  14%|█▍        | 10/69 [04:26<26:10, 26.62s/it]

Val Loss: 0.1612 - Val Accuracy: 0.9336



Training:   0%|          | 0/112 [00:00<?, ?it/s][A
Training:   1%|          | 1/112 [00:01<01:50,  1.01it/s][A
Training:   4%|▎         | 4/112 [00:01<00:25,  4.27it/s][A
Training:   5%|▌         | 6/112 [00:01<00:32,  3.29it/s][A
Training:   8%|▊         | 9/112 [00:02<00:28,  3.63it/s][A
Training:  10%|▉         | 11/112 [00:02<00:21,  4.80it/s][A
Training:  11%|█         | 12/112 [00:02<00:19,  5.22it/s][A
Training:  12%|█▏        | 13/112 [00:03<00:27,  3.58it/s][A
Training:  13%|█▎        | 15/112 [00:03<00:19,  4.98it/s][A
Training:  15%|█▌        | 17/112 [00:04<00:22,  4.31it/s][A
Training:  16%|█▌        | 18/112 [00:04<00:20,  4.69it/s][A
Training:  18%|█▊        | 20/112 [00:04<00:14,  6.45it/s][A
Training:  20%|█▉        | 22/112 [00:05<00:20,  4.37it/s][A
Training:  21%|██▏       | 24/112 [00:05<00:15,  5.73it/s][A
Training:  23%|██▎       | 26/112 [00:06<00:21,  4.04it/s][A
Training:  26%|██▌       | 29/112 [00:06<00:17,  4.82it/s][A
Training:  27%|██▋  

Epoch: 11/69 - Loss: 0.1747 - Accuracy: 0.9318



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:00<00:11,  1.18it/s][A
 14%|█▍        | 2/14 [00:01<00:05,  2.17it/s][A
 29%|██▊       | 4/14 [00:01<00:02,  4.87it/s][A
 43%|████▎     | 6/14 [00:01<00:02,  3.78it/s][A
 64%|██████▍   | 9/14 [00:02<00:01,  3.66it/s][A
 79%|███████▊  | 11/14 [00:02<00:00,  4.96it/s][A
100%|██████████| 14/14 [00:03<00:00,  4.09it/s][A
Epochs:  16%|█▌        | 11/69 [04:52<25:28, 26.36s/it]

Val Loss: 0.1625 - Val Accuracy: 0.9330



Training:   0%|          | 0/112 [00:00<?, ?it/s][A
Training:   1%|          | 1/112 [00:01<02:00,  1.09s/it][A
Training:   4%|▎         | 4/112 [00:01<00:25,  4.27it/s][A
Training:   5%|▌         | 6/112 [00:02<00:32,  3.23it/s][A
Training:   7%|▋         | 8/112 [00:02<00:22,  4.67it/s][A
Training:   9%|▉         | 10/112 [00:02<00:26,  3.88it/s][A
Training:  12%|█▏        | 13/112 [00:03<00:26,  3.75it/s][A
Training:  13%|█▎        | 15/112 [00:03<00:19,  4.86it/s][A
Training:  15%|█▌        | 17/112 [00:04<00:23,  4.03it/s][A
Training:  17%|█▋        | 19/112 [00:04<00:17,  5.17it/s][A
Training:  19%|█▉        | 21/112 [00:05<00:20,  4.36it/s][A
Training:  22%|██▏       | 25/112 [00:06<00:18,  4.63it/s][A
Training:  25%|██▌       | 28/112 [00:06<00:13,  6.31it/s][A
Training:  27%|██▋       | 30/112 [00:06<00:17,  4.61it/s][A
Training:  29%|██▊       | 32/112 [00:07<00:14,  5.70it/s][A
Training:  30%|███       | 34/112 [00:07<00:17,  4.39it/s][A
Training:  33%|███▎ 

Epoch: 12/69 - Loss: 0.2143 - Accuracy: 0.9196



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:15,  1.16s/it][A
 36%|███▌      | 5/14 [00:01<00:03,  2.96it/s][A
 50%|█████     | 7/14 [00:02<00:01,  4.37it/s][A
 64%|██████▍   | 9/14 [00:02<00:01,  3.68it/s][A
 71%|███████▏  | 10/14 [00:02<00:00,  4.04it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.86it/s][A
Epochs:  17%|█▋        | 12/69 [05:18<25:09, 26.49s/it]

Val Loss: 0.2228 - Val Accuracy: 0.9095



Training:   0%|          | 0/112 [00:00<?, ?it/s][A
Training:   1%|          | 1/112 [00:01<02:05,  1.13s/it][A
Training:   3%|▎         | 3/112 [00:01<00:40,  2.69it/s][A
Training:   4%|▍         | 5/112 [00:01<00:36,  2.93it/s][A
Training:   6%|▋         | 7/112 [00:02<00:25,  4.16it/s][A
Training:   8%|▊         | 9/112 [00:02<00:26,  3.85it/s][A
Training:  10%|▉         | 11/112 [00:02<00:21,  4.79it/s][A
Training:  12%|█▏        | 13/112 [00:03<00:23,  4.17it/s][A
Training:  13%|█▎        | 15/112 [00:03<00:17,  5.41it/s][A
Training:  15%|█▌        | 17/112 [00:04<00:22,  4.22it/s][A
Training:  17%|█▋        | 19/112 [00:04<00:18,  5.03it/s][A
Training:  19%|█▉        | 21/112 [00:05<00:21,  4.17it/s][A
Training:  21%|██        | 23/112 [00:05<00:16,  5.37it/s][A
Training:  22%|██▏       | 25/112 [00:06<00:21,  4.08it/s][A
Training:  24%|██▍       | 27/112 [00:06<00:17,  4.90it/s][A
Training:  26%|██▌       | 29/112 [00:06<00:18,  4.46it/s][A
Training:  28%|██▊   

Epoch: 13/69 - Loss: 6.6115 - Accuracy: 0.8433



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:15,  1.21s/it][A
 36%|███▌      | 5/14 [00:02<00:03,  2.77it/s][A
 43%|████▎     | 6/14 [00:02<00:02,  3.25it/s][A
 64%|██████▍   | 9/14 [00:02<00:01,  3.62it/s][A
 79%|███████▊  | 11/14 [00:03<00:00,  4.78it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.72it/s][A
Epochs:  19%|█▉        | 13/69 [05:46<25:00, 26.80s/it]

Val Loss: 1.7536 - Val Accuracy: 0.8871



Training:   0%|          | 0/112 [00:00<?, ?it/s][A
Training:   1%|          | 1/112 [00:01<02:09,  1.17s/it][A
Training:   4%|▍         | 5/112 [00:01<00:35,  2.98it/s][A
Training:   6%|▋         | 7/112 [00:02<00:24,  4.32it/s][A
Training:   8%|▊         | 9/112 [00:02<00:28,  3.60it/s][A
Training:  11%|█         | 12/112 [00:02<00:17,  5.64it/s][A
Training:  12%|█▎        | 14/112 [00:03<00:23,  4.17it/s][A
Training:  15%|█▌        | 17/112 [00:04<00:22,  4.17it/s][A
Training:  18%|█▊        | 20/112 [00:04<00:15,  5.96it/s][A
Training:  20%|█▉        | 22/112 [00:05<00:19,  4.73it/s][A
Training:  22%|██▏       | 25/112 [00:05<00:18,  4.58it/s][A
Training:  24%|██▍       | 27/112 [00:06<00:15,  5.60it/s][A
Training:  26%|██▌       | 29/112 [00:06<00:18,  4.58it/s][A
Training:  28%|██▊       | 31/112 [00:06<00:14,  5.59it/s][A
Training:  29%|██▉       | 33/112 [00:07<00:17,  4.63it/s][A
Training:  31%|███▏      | 35/112 [00:07<00:13,  5.76it/s][A
Training:  33%|███▎ 

Epoch: 14/69 - Loss: 1.3267 - Accuracy: 0.8905



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:16,  1.29s/it][A
 29%|██▊       | 4/14 [00:01<00:02,  3.60it/s][A
 43%|████▎     | 6/14 [00:02<00:02,  3.31it/s][A
 64%|██████▍   | 9/14 [00:02<00:01,  3.53it/s][A
 86%|████████▌ | 12/14 [00:02<00:00,  5.51it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.78it/s][A
Epochs:  20%|██        | 14/69 [06:12<24:23, 26.62s/it]

Val Loss: 0.2916 - Val Accuracy: 0.9222



Training:   0%|          | 0/112 [00:00<?, ?it/s][A
Training:   1%|          | 1/112 [00:01<02:12,  1.19s/it][A
Training:   3%|▎         | 3/112 [00:01<00:42,  2.54it/s][A
Training:   4%|▍         | 5/112 [00:01<00:35,  2.99it/s][A
Training:   5%|▌         | 6/112 [00:02<00:31,  3.38it/s][A
Training:   7%|▋         | 8/112 [00:02<00:20,  5.12it/s][A
Training:   8%|▊         | 9/112 [00:02<00:27,  3.75it/s][A
Training:   9%|▉         | 10/112 [00:03<00:26,  3.82it/s][A
Training:  10%|▉         | 11/112 [00:03<00:22,  4.40it/s][A
Training:  12%|█▏        | 13/112 [00:03<00:19,  4.95it/s][A
Training:  12%|█▎        | 14/112 [00:03<00:22,  4.38it/s][A
Training:  13%|█▎        | 15/112 [00:04<00:23,  4.14it/s][A
Training:  15%|█▌        | 17/112 [00:04<00:17,  5.47it/s][A
Training:  16%|█▌        | 18/112 [00:04<00:25,  3.75it/s][A
Training:  17%|█▋        | 19/112 [00:04<00:21,  4.29it/s][A
Training:  19%|█▉        | 21/112 [00:05<00:15,  5.93it/s][A
Training:  20%|█▉     

Epoch: 15/69 - Loss: 0.3243 - Accuracy: 0.9136



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:15,  1.16s/it][A
 36%|███▌      | 5/14 [00:02<00:03,  2.80it/s][A
 50%|█████     | 7/14 [00:02<00:01,  4.14it/s][A
 64%|██████▍   | 9/14 [00:02<00:01,  3.79it/s][A
 86%|████████▌ | 12/14 [00:02<00:00,  6.00it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.84it/s][A
Epochs:  22%|██▏       | 15/69 [06:38<23:50, 26.49s/it]

Val Loss: 0.2853 - Val Accuracy: 0.8969



Training:   0%|          | 0/112 [00:00<?, ?it/s][A
Training:   1%|          | 1/112 [00:01<02:18,  1.24s/it][A
Training:   3%|▎         | 3/112 [00:01<00:42,  2.57it/s][A
Training:   4%|▍         | 5/112 [00:01<00:35,  2.99it/s][A
Training:   5%|▌         | 6/112 [00:02<00:30,  3.43it/s][A
Training:   7%|▋         | 8/112 [00:02<00:20,  5.18it/s][A
Training:   8%|▊         | 9/112 [00:02<00:29,  3.53it/s][A
Training:   9%|▉         | 10/112 [00:03<00:26,  3.90it/s][A
Training:  11%|█         | 12/112 [00:03<00:17,  5.67it/s][A
Training:  12%|█▏        | 13/112 [00:03<00:21,  4.65it/s][A
Training:  12%|█▎        | 14/112 [00:03<00:22,  4.31it/s][A
Training:  14%|█▍        | 16/112 [00:03<00:15,  6.32it/s][A
Training:  15%|█▌        | 17/112 [00:04<00:21,  4.37it/s][A
Training:  16%|█▌        | 18/112 [00:04<00:23,  4.00it/s][A
Training:  19%|█▉        | 21/112 [00:05<00:19,  4.58it/s][A
Training:  20%|█▉        | 22/112 [00:05<00:22,  3.94it/s][A
Training:  21%|██▏    

Epoch: 16/69 - Loss: 0.4550 - Accuracy: 0.9154



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:14,  1.10s/it][A
 14%|█▍        | 2/14 [00:01<00:06,  1.77it/s][A
 36%|███▌      | 5/14 [00:01<00:02,  3.39it/s][A
 43%|████▎     | 6/14 [00:02<00:02,  3.36it/s][A
 64%|██████▍   | 9/14 [00:02<00:01,  4.41it/s][A
 71%|███████▏  | 10/14 [00:03<00:01,  3.74it/s][A
 93%|█████████▎| 13/14 [00:03<00:00,  5.18it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.62it/s][A
Epochs:  23%|██▎       | 16/69 [07:05<23:30, 26.60s/it]

Val Loss: 1.4407 - Val Accuracy: 0.9232



Training:   0%|          | 0/112 [00:00<?, ?it/s][A
Training:   1%|          | 1/112 [00:01<01:50,  1.00it/s][A
Training:   2%|▏         | 2/112 [00:01<00:51,  2.13it/s][A
Training:   4%|▎         | 4/112 [00:01<00:22,  4.70it/s][A
Training:   5%|▌         | 6/112 [00:02<00:31,  3.34it/s][A
Training:   7%|▋         | 8/112 [00:02<00:21,  4.81it/s][A
Training:   8%|▊         | 9/112 [00:02<00:26,  3.83it/s][A
Training:   9%|▉         | 10/112 [00:02<00:28,  3.63it/s][A
Training:  11%|█         | 12/112 [00:03<00:19,  5.18it/s][A
Training:  12%|█▏        | 13/112 [00:03<00:24,  4.12it/s][A
Training:  12%|█▎        | 14/112 [00:03<00:24,  3.93it/s][A
Training:  14%|█▍        | 16/112 [00:03<00:16,  5.78it/s][A
Training:  15%|█▌        | 17/112 [00:04<00:20,  4.67it/s][A
Training:  16%|█▌        | 18/112 [00:04<00:21,  4.37it/s][A
Training:  18%|█▊        | 20/112 [00:04<00:15,  6.13it/s][A
Training:  19%|█▉        | 21/112 [00:04<00:18,  4.92it/s][A
Training:  20%|█▉     

Epoch: 17/69 - Loss: 5.9168 - Accuracy: 0.8808



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:16,  1.24s/it][A
 29%|██▊       | 4/14 [00:01<00:02,  3.75it/s][A
 43%|████▎     | 6/14 [00:02<00:02,  3.27it/s][A
 64%|██████▍   | 9/14 [00:02<00:01,  3.50it/s][A
 86%|████████▌ | 12/14 [00:03<00:00,  5.33it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.80it/s][A
Epochs:  25%|██▍       | 17/69 [07:31<22:57, 26.49s/it]

Val Loss: 1.4413 - Val Accuracy: 0.8894



Training:   0%|          | 0/112 [00:00<?, ?it/s][A
Training:   1%|          | 1/112 [00:01<02:01,  1.10s/it][A
Training:   3%|▎         | 3/112 [00:01<00:35,  3.07it/s][A
Training:   4%|▍         | 5/112 [00:01<00:34,  3.10it/s][A
Training:   6%|▋         | 7/112 [00:02<00:23,  4.56it/s][A
Training:   8%|▊         | 9/112 [00:02<00:28,  3.68it/s][A
Training:  10%|▉         | 11/112 [00:02<00:20,  4.91it/s][A
Training:  11%|█         | 12/112 [00:03<00:21,  4.59it/s][A
Training:  12%|█▏        | 13/112 [00:03<00:26,  3.77it/s][A
Training:  13%|█▎        | 15/112 [00:03<00:18,  5.30it/s][A
Training:  14%|█▍        | 16/112 [00:04<00:24,  3.93it/s][A
Training:  15%|█▌        | 17/112 [00:04<00:23,  4.09it/s][A
Training:  18%|█▊        | 20/112 [00:05<00:20,  4.53it/s][A
Training:  19%|█▉        | 21/112 [00:05<00:19,  4.69it/s][A
Training:  21%|██        | 23/112 [00:05<00:14,  6.21it/s][A
Training:  21%|██▏       | 24/112 [00:05<00:21,  4.08it/s][A
Training:  22%|██▏   

Epoch: 18/69 - Loss: 0.6506 - Accuracy: 0.9096



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:15,  1.19s/it][A
 21%|██▏       | 3/14 [00:01<00:04,  2.65it/s][A
 36%|███▌      | 5/14 [00:01<00:02,  3.13it/s][A
 50%|█████     | 7/14 [00:02<00:01,  4.28it/s][A
 64%|██████▍   | 9/14 [00:02<00:01,  3.88it/s][A
 79%|███████▊  | 11/14 [00:02<00:00,  5.29it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.95it/s][A
Epochs:  26%|██▌       | 18/69 [07:58<22:32, 26.52s/it]

Val Loss: 0.8195 - Val Accuracy: 0.8326



Training:   0%|          | 0/112 [00:00<?, ?it/s][A
Training:   1%|          | 1/112 [00:01<02:36,  1.41s/it][A
Training:   4%|▎         | 4/112 [00:01<00:31,  3.38it/s][A
Training:   5%|▌         | 6/112 [00:02<00:32,  3.28it/s][A
Training:   8%|▊         | 9/112 [00:02<00:27,  3.71it/s][A
Training:  10%|▉         | 11/112 [00:02<00:20,  4.95it/s][A
Training:  12%|█▏        | 13/112 [00:03<00:24,  4.00it/s][A
Training:  13%|█▎        | 15/112 [00:03<00:18,  5.15it/s][A
Training:  15%|█▌        | 17/112 [00:04<00:22,  4.26it/s][A
Training:  17%|█▋        | 19/112 [00:04<00:17,  5.18it/s][A
Training:  19%|█▉        | 21/112 [00:05<00:20,  4.38it/s][A
Training:  21%|██        | 23/112 [00:05<00:18,  4.84it/s][A
Training:  22%|██▏       | 25/112 [00:05<00:17,  4.90it/s][A
Training:  23%|██▎       | 26/112 [00:06<00:16,  5.07it/s][A
Training:  25%|██▌       | 28/112 [00:06<00:13,  6.22it/s][A
Training:  26%|██▌       | 29/112 [00:06<00:17,  4.82it/s][A
Training:  27%|██▋  

Epoch: 19/69 - Loss: 0.4647 - Accuracy: 0.9176



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:00<00:12,  1.02it/s][A
 36%|███▌      | 5/14 [00:01<00:03,  2.92it/s][A
 50%|█████     | 7/14 [00:02<00:01,  4.29it/s][A
 64%|██████▍   | 9/14 [00:02<00:01,  3.67it/s][A
 86%|████████▌ | 12/14 [00:02<00:00,  5.75it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.96it/s][A
Epochs:  28%|██▊       | 19/69 [08:24<21:54, 26.29s/it]

Val Loss: 0.3598 - Val Accuracy: 0.9273



Training:   0%|          | 0/112 [00:00<?, ?it/s][A
Training:   1%|          | 1/112 [00:01<02:22,  1.29s/it][A
Training:   3%|▎         | 3/112 [00:01<00:40,  2.68it/s][A
Training:   4%|▍         | 5/112 [00:02<00:39,  2.69it/s][A
Training:   6%|▋         | 7/112 [00:02<00:24,  4.22it/s][A
Training:   8%|▊         | 9/112 [00:02<00:26,  3.84it/s][A
Training:  10%|▉         | 11/112 [00:02<00:19,  5.21it/s][A
Training:  12%|█▏        | 13/112 [00:03<00:23,  4.22it/s][A
Training:  13%|█▎        | 15/112 [00:03<00:19,  4.97it/s][A
Training:  15%|█▌        | 17/112 [00:04<00:20,  4.74it/s][A
Training:  16%|█▌        | 18/112 [00:04<00:19,  4.79it/s][A
Training:  17%|█▋        | 19/112 [00:04<00:18,  5.00it/s][A
Training:  19%|█▉        | 21/112 [00:05<00:19,  4.72it/s][A
Training:  20%|█▉        | 22/112 [00:05<00:18,  4.77it/s][A
Training:  21%|██        | 23/112 [00:05<00:20,  4.35it/s][A
Training:  22%|██▏       | 25/112 [00:06<00:18,  4.70it/s][A
Training:  24%|██▍   

Epoch: 20/69 - Loss: 0.3192 - Accuracy: 0.9211



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:13,  1.03s/it][A
 36%|███▌      | 5/14 [00:01<00:02,  3.24it/s][A
 64%|██████▍   | 9/14 [00:02<00:01,  4.09it/s][A
 86%|████████▌ | 12/14 [00:02<00:00,  5.95it/s][A
100%|██████████| 14/14 [00:03<00:00,  4.27it/s][A
Epochs:  29%|██▉       | 20/69 [08:50<21:34, 26.42s/it]

Val Loss: 0.2434 - Val Accuracy: 0.9089



Training:   0%|          | 0/112 [00:00<?, ?it/s][A
Training:   1%|          | 1/112 [00:01<02:16,  1.23s/it][A
Training:   3%|▎         | 3/112 [00:01<00:40,  2.72it/s][A
Training:   4%|▎         | 4/112 [00:01<00:29,  3.63it/s][A
Training:   4%|▍         | 5/112 [00:02<00:40,  2.66it/s][A
Training:   6%|▋         | 7/112 [00:02<00:23,  4.46it/s][A
Training:   8%|▊         | 9/112 [00:02<00:27,  3.79it/s][A
Training:  10%|▉         | 11/112 [00:02<00:19,  5.28it/s][A
Training:  12%|█▏        | 13/112 [00:03<00:24,  4.11it/s][A
Training:  14%|█▍        | 16/112 [00:03<00:15,  6.31it/s][A
Training:  16%|█▌        | 18/112 [00:04<00:21,  4.35it/s][A
Training:  19%|█▉        | 21/112 [00:05<00:22,  3.96it/s][A
Training:  22%|██▏       | 25/112 [00:06<00:20,  4.19it/s][A
Training:  26%|██▌       | 29/112 [00:07<00:18,  4.49it/s][A
Training:  28%|██▊       | 31/112 [00:07<00:15,  5.30it/s][A
Training:  29%|██▉       | 33/112 [00:07<00:17,  4.40it/s][A
Training:  33%|███▎   

Epoch: 21/69 - Loss: 0.7902 - Accuracy: 0.9254



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:13,  1.05s/it][A
 36%|███▌      | 5/14 [00:01<00:02,  3.25it/s][A
 50%|█████     | 7/14 [00:01<00:01,  4.72it/s][A
 64%|██████▍   | 9/14 [00:02<00:01,  4.25it/s][A
 79%|███████▊  | 11/14 [00:02<00:00,  5.20it/s][A
100%|██████████| 14/14 [00:03<00:00,  4.25it/s][A
Epochs:  30%|███       | 21/69 [09:17<21:10, 26.47s/it]

Val Loss: 0.9101 - Val Accuracy: 0.8595



Training:   0%|          | 0/112 [00:00<?, ?it/s][A
Training:   1%|          | 1/112 [00:01<02:31,  1.37s/it][A
Training:   3%|▎         | 3/112 [00:01<00:44,  2.43it/s][A
Training:   4%|▍         | 5/112 [00:02<00:38,  2.80it/s][A
Training:   7%|▋         | 8/112 [00:02<00:20,  5.17it/s][A
Training:   9%|▉         | 10/112 [00:03<00:29,  3.46it/s][A
Training:  12%|█▏        | 13/112 [00:03<00:26,  3.72it/s][A
Training:  14%|█▍        | 16/112 [00:04<00:18,  5.28it/s][A
Training:  16%|█▌        | 18/112 [00:04<00:19,  4.73it/s][A
Training:  18%|█▊        | 20/112 [00:04<00:16,  5.63it/s][A
Training:  19%|█▉        | 21/112 [00:05<00:22,  4.10it/s][A
Training:  21%|██▏       | 24/112 [00:05<00:15,  5.55it/s][A
Training:  22%|██▏       | 25/112 [00:06<00:20,  4.26it/s][A
Training:  24%|██▍       | 27/112 [00:06<00:15,  5.54it/s][A
Training:  25%|██▌       | 28/112 [00:06<00:15,  5.44it/s][A
Training:  26%|██▌       | 29/112 [00:07<00:20,  4.08it/s][A
Training:  29%|██▊  

Epoch: 22/69 - Loss: 0.5123 - Accuracy: 0.9187



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:16,  1.27s/it][A
 29%|██▊       | 4/14 [00:01<00:02,  3.70it/s][A
 43%|████▎     | 6/14 [00:02<00:02,  3.14it/s][A
 64%|██████▍   | 9/14 [00:02<00:01,  3.66it/s][A
 86%|████████▌ | 12/14 [00:02<00:00,  5.59it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.84it/s][A
Epochs:  32%|███▏      | 22/69 [09:44<20:51, 26.62s/it]

Val Loss: 0.4081 - Val Accuracy: 0.8860



Training:   0%|          | 0/112 [00:00<?, ?it/s][A
Training:   1%|          | 1/112 [00:01<02:12,  1.19s/it][A
Training:   3%|▎         | 3/112 [00:01<00:38,  2.81it/s][A
Training:   4%|▍         | 5/112 [00:01<00:35,  3.01it/s][A
Training:   5%|▌         | 6/112 [00:02<00:29,  3.65it/s][A
Training:   7%|▋         | 8/112 [00:02<00:19,  5.28it/s][A
Training:   8%|▊         | 9/112 [00:02<00:27,  3.75it/s][A
Training:   9%|▉         | 10/112 [00:02<00:25,  4.07it/s][A
Training:  11%|█         | 12/112 [00:03<00:16,  5.93it/s][A
Training:  12%|█▏        | 13/112 [00:03<00:21,  4.59it/s][A
Training:  12%|█▎        | 14/112 [00:03<00:23,  4.14it/s][A
Training:  15%|█▌        | 17/112 [00:04<00:18,  5.13it/s][A
Training:  16%|█▌        | 18/112 [00:04<00:19,  4.73it/s][A
Training:  18%|█▊        | 20/112 [00:04<00:14,  6.36it/s][A
Training:  19%|█▉        | 21/112 [00:05<00:20,  4.39it/s][A
Training:  20%|█▉        | 22/112 [00:05<00:19,  4.66it/s][A
Training:  21%|██▏    

Epoch: 23/69 - Loss: 0.5752 - Accuracy: 0.9185



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:00<00:12,  1.03it/s][A
 14%|█▍        | 2/14 [00:01<00:05,  2.14it/s][A
 36%|███▌      | 5/14 [00:01<00:02,  3.36it/s][A
 57%|█████▋    | 8/14 [00:01<00:01,  5.83it/s][A
 71%|███████▏  | 10/14 [00:02<00:00,  4.49it/s][A
100%|██████████| 14/14 [00:03<00:00,  4.42it/s][A
Epochs:  33%|███▎      | 23/69 [10:10<20:15, 26.43s/it]

Val Loss: 0.3692 - Val Accuracy: 0.9347



Training:   0%|          | 0/112 [00:00<?, ?it/s][A
Training:   1%|          | 1/112 [00:01<02:21,  1.27s/it][A
Training:   4%|▎         | 4/112 [00:01<00:29,  3.62it/s][A
Training:   5%|▌         | 6/112 [00:02<00:36,  2.89it/s][A
Training:   8%|▊         | 9/112 [00:03<00:31,  3.31it/s][A
Training:  10%|▉         | 11/112 [00:03<00:22,  4.48it/s][A
Training:  12%|█▏        | 13/112 [00:03<00:25,  3.82it/s][A
Training:  15%|█▌        | 17/112 [00:04<00:23,  4.01it/s][A
Training:  16%|█▌        | 18/112 [00:04<00:21,  4.38it/s][A
Training:  19%|█▉        | 21/112 [00:05<00:21,  4.23it/s][A
Training:  20%|█▉        | 22/112 [00:05<00:19,  4.61it/s][A
Training:  21%|██▏       | 24/112 [00:05<00:14,  5.98it/s][A
Training:  23%|██▎       | 26/112 [00:06<00:20,  4.29it/s][A
Training:  26%|██▌       | 29/112 [00:07<00:17,  4.78it/s][A
Training:  27%|██▋       | 30/112 [00:07<00:18,  4.40it/s][A
Training:  29%|██▉       | 33/112 [00:08<00:16,  4.66it/s][A
Training:  30%|███  

Epoch: 24/69 - Loss: 0.9157 - Accuracy: 0.9100



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:16,  1.27s/it][A
 14%|█▍        | 2/14 [00:01<00:07,  1.71it/s][A
 29%|██▊       | 4/14 [00:01<00:02,  3.83it/s][A
 36%|███▌      | 5/14 [00:02<00:03,  2.93it/s][A
 64%|██████▍   | 9/14 [00:02<00:01,  3.80it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.76it/s][A
Epochs:  35%|███▍      | 24/69 [10:37<19:52, 26.49s/it]

Val Loss: 0.4055 - Val Accuracy: 0.9376



Training:   0%|          | 0/112 [00:00<?, ?it/s][A
Training:   1%|          | 1/112 [00:01<01:51,  1.00s/it][A
Training:   4%|▎         | 4/112 [00:01<00:24,  4.40it/s][A
Training:   5%|▌         | 6/112 [00:01<00:29,  3.59it/s][A
Training:   8%|▊         | 9/112 [00:02<00:27,  3.78it/s][A
Training:  11%|█         | 12/112 [00:02<00:17,  5.64it/s][A
Training:  12%|█▎        | 14/112 [00:03<00:23,  4.21it/s][A
Training:  14%|█▍        | 16/112 [00:03<00:18,  5.22it/s][A
Training:  15%|█▌        | 17/112 [00:04<00:27,  3.49it/s][A
Training:  17%|█▋        | 19/112 [00:04<00:19,  4.75it/s][A
Training:  19%|█▉        | 21/112 [00:05<00:23,  3.81it/s][A
Training:  21%|██        | 23/112 [00:05<00:17,  5.03it/s][A
Training:  22%|██▏       | 25/112 [00:06<00:21,  4.12it/s][A
Training:  24%|██▍       | 27/112 [00:06<00:16,  5.25it/s][A
Training:  26%|██▌       | 29/112 [00:06<00:17,  4.77it/s][A
Training:  28%|██▊       | 31/112 [00:06<00:15,  5.39it/s][A
Training:  29%|██▉  

Epoch: 25/69 - Loss: 0.3781 - Accuracy: 0.9196



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:13,  1.02s/it][A
 14%|█▍        | 2/14 [00:01<00:06,  1.97it/s][A
 36%|███▌      | 5/14 [00:01<00:02,  3.50it/s][A
 64%|██████▍   | 9/14 [00:02<00:01,  4.22it/s][A
 86%|████████▌ | 12/14 [00:02<00:00,  6.00it/s][A
100%|██████████| 14/14 [00:03<00:00,  4.09it/s][A
Epochs:  36%|███▌      | 25/69 [11:03<19:28, 26.57s/it]

Val Loss: 0.5215 - Val Accuracy: 0.8045



Training:   0%|          | 0/112 [00:00<?, ?it/s][A
Training:   1%|          | 1/112 [00:01<02:14,  1.21s/it][A
Training:   4%|▍         | 5/112 [00:01<00:34,  3.07it/s][A
Training:   7%|▋         | 8/112 [00:02<00:20,  5.19it/s][A
Training:   9%|▉         | 10/112 [00:02<00:22,  4.49it/s][A
Training:  11%|█         | 12/112 [00:02<00:17,  5.76it/s][A
Training:  12%|█▎        | 14/112 [00:03<00:22,  4.38it/s][A
Training:  15%|█▌        | 17/112 [00:04<00:22,  4.25it/s][A
Training:  18%|█▊        | 20/112 [00:04<00:15,  6.06it/s][A
Training:  20%|█▉        | 22/112 [00:05<00:19,  4.53it/s][A
Training:  21%|██▏       | 24/112 [00:05<00:15,  5.68it/s][A
Training:  23%|██▎       | 26/112 [00:05<00:19,  4.47it/s][A
Training:  25%|██▌       | 28/112 [00:05<00:14,  5.72it/s][A
Training:  27%|██▋       | 30/112 [00:06<00:17,  4.60it/s][A
Training:  29%|██▊       | 32/112 [00:06<00:13,  5.85it/s][A
Training:  30%|███       | 34/112 [00:07<00:17,  4.45it/s][A
Training:  32%|███▏

Epoch: 26/69 - Loss: 0.5909 - Accuracy: 0.9172



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:00<00:11,  1.09it/s][A
 21%|██▏       | 3/14 [00:01<00:03,  3.42it/s][A
 29%|██▊       | 4/14 [00:01<00:02,  4.00it/s][A
 36%|███▌      | 5/14 [00:01<00:02,  3.58it/s][A
 43%|████▎     | 6/14 [00:01<00:01,  4.15it/s][A
 57%|█████▋    | 8/14 [00:01<00:00,  6.12it/s][A
 64%|██████▍   | 9/14 [00:02<00:01,  4.09it/s][A
 79%|███████▊  | 11/14 [00:02<00:00,  5.35it/s][A
100%|██████████| 14/14 [00:03<00:00,  4.41it/s][A
Epochs:  38%|███▊      | 26/69 [11:30<19:00, 26.52s/it]

Val Loss: 0.2361 - Val Accuracy: 0.9318



Training:   0%|          | 0/112 [00:00<?, ?it/s][A
Training:   1%|          | 1/112 [00:01<02:14,  1.21s/it][A
Training:   3%|▎         | 3/112 [00:01<00:39,  2.77it/s][A
Training:   4%|▍         | 5/112 [00:01<00:35,  3.03it/s][A
Training:   7%|▋         | 8/112 [00:02<00:18,  5.68it/s][A
Training:   9%|▉         | 10/112 [00:02<00:24,  4.13it/s][A
Training:  11%|█         | 12/112 [00:02<00:18,  5.45it/s][A
Training:  12%|█▎        | 14/112 [00:03<00:22,  4.40it/s][A
Training:  15%|█▌        | 17/112 [00:04<00:20,  4.58it/s][A
Training:  18%|█▊        | 20/112 [00:04<00:15,  5.79it/s][A
Training:  19%|█▉        | 21/112 [00:04<00:19,  4.68it/s][A
Training:  21%|██        | 23/112 [00:05<00:16,  5.33it/s][A
Training:  22%|██▏       | 25/112 [00:05<00:18,  4.63it/s][A
Training:  24%|██▍       | 27/112 [00:06<00:16,  5.19it/s][A
Training:  25%|██▌       | 28/112 [00:06<00:17,  4.82it/s][A
Training:  26%|██▌       | 29/112 [00:06<00:17,  4.61it/s][A
Training:  28%|██▊  

Epoch: 27/69 - Loss: 0.3341 - Accuracy: 0.9233



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:00<00:12,  1.04it/s][A
 21%|██▏       | 3/14 [00:01<00:03,  3.45it/s][A
 36%|███▌      | 5/14 [00:01<00:02,  3.62it/s][A
 43%|████▎     | 6/14 [00:01<00:02,  3.48it/s][A
 57%|█████▋    | 8/14 [00:02<00:01,  5.43it/s][A
 71%|███████▏  | 10/14 [00:02<00:00,  4.03it/s][A
 86%|████████▌ | 12/14 [00:02<00:00,  5.39it/s][A
100%|██████████| 14/14 [00:03<00:00,  4.29it/s][A
Epochs:  39%|███▉      | 27/69 [11:56<18:33, 26.50s/it]

Val Loss: 0.2258 - Val Accuracy: 0.9323



Training:   0%|          | 0/112 [00:00<?, ?it/s][A
Training:   1%|          | 1/112 [00:01<01:58,  1.07s/it][A
Training:   3%|▎         | 3/112 [00:01<00:37,  2.90it/s][A
Training:   4%|▍         | 5/112 [00:01<00:34,  3.08it/s][A
Training:   6%|▋         | 7/112 [00:01<00:22,  4.73it/s][A
Training:   8%|▊         | 9/112 [00:02<00:27,  3.72it/s][A
Training:  11%|█         | 12/112 [00:02<00:16,  6.09it/s][A
Training:  12%|█▎        | 14/112 [00:03<00:22,  4.34it/s][A
Training:  14%|█▍        | 16/112 [00:03<00:16,  5.67it/s][A
Training:  16%|█▌        | 18/112 [00:04<00:19,  4.74it/s][A
Training:  19%|█▉        | 21/112 [00:05<00:20,  4.49it/s][A
Training:  21%|██        | 23/112 [00:05<00:16,  5.52it/s][A
Training:  22%|██▏       | 25/112 [00:05<00:20,  4.31it/s][A
Training:  24%|██▍       | 27/112 [00:05<00:15,  5.45it/s][A
Training:  26%|██▌       | 29/112 [00:06<00:19,  4.25it/s][A
Training:  28%|██▊       | 31/112 [00:06<00:14,  5.49it/s][A
Training:  29%|██▉   

Epoch: 28/69 - Loss: 0.8409 - Accuracy: 0.9120



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:13,  1.03s/it][A
 21%|██▏       | 3/14 [00:01<00:03,  2.90it/s][A
 36%|███▌      | 5/14 [00:01<00:02,  3.24it/s][A
 50%|█████     | 7/14 [00:02<00:01,  4.00it/s][A
 64%|██████▍   | 9/14 [00:02<00:01,  4.02it/s][A
 71%|███████▏  | 10/14 [00:02<00:00,  4.31it/s][A
 79%|███████▊  | 11/14 [00:03<00:00,  4.18it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.95it/s][A
Epochs:  41%|████      | 28/69 [12:23<18:12, 26.63s/it]

Val Loss: 0.4031 - Val Accuracy: 0.9284



Training:   0%|          | 0/112 [00:00<?, ?it/s][A
Training:   1%|          | 1/112 [00:01<01:53,  1.02s/it][A
Training:   4%|▎         | 4/112 [00:01<00:24,  4.34it/s][A
Training:   5%|▌         | 6/112 [00:01<00:32,  3.27it/s][A
Training:   7%|▋         | 8/112 [00:02<00:21,  4.78it/s][A
Training:   9%|▉         | 10/112 [00:02<00:26,  3.79it/s][A
Training:  11%|█         | 12/112 [00:02<00:19,  5.09it/s][A
Training:  12%|█▎        | 14/112 [00:03<00:24,  3.98it/s][A
Training:  14%|█▍        | 16/112 [00:03<00:18,  5.20it/s][A
Training:  16%|█▌        | 18/112 [00:04<00:22,  4.23it/s][A
Training:  19%|█▉        | 21/112 [00:04<00:17,  5.12it/s][A
Training:  20%|█▉        | 22/112 [00:05<00:19,  4.65it/s][A
Training:  22%|██▏       | 25/112 [00:05<00:16,  5.30it/s][A
Training:  23%|██▎       | 26/112 [00:06<00:18,  4.57it/s][A
Training:  25%|██▌       | 28/112 [00:06<00:13,  6.00it/s][A
Training:  26%|██▌       | 29/112 [00:06<00:16,  5.18it/s][A
Training:  27%|██▋  

Epoch: 29/69 - Loss: 0.3005 - Accuracy: 0.9260



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:13,  1.06s/it][A
 29%|██▊       | 4/14 [00:01<00:02,  3.93it/s][A
 36%|███▌      | 5/14 [00:01<00:03,  2.93it/s][A
 57%|█████▋    | 8/14 [00:01<00:01,  5.46it/s][A
 71%|███████▏  | 10/14 [00:02<00:00,  4.24it/s][A
 79%|███████▊  | 11/14 [00:02<00:00,  4.75it/s][A
100%|██████████| 14/14 [00:03<00:00,  4.00it/s][A
Epochs:  42%|████▏     | 29/69 [12:50<17:44, 26.62s/it]

Val Loss: 0.2612 - Val Accuracy: 0.9175



Training:   0%|          | 0/112 [00:00<?, ?it/s][A
Training:   1%|          | 1/112 [00:01<01:51,  1.00s/it][A
Training:   4%|▍         | 5/112 [00:01<00:30,  3.51it/s][A
Training:   5%|▌         | 6/112 [00:01<00:26,  4.03it/s][A
Training:   8%|▊         | 9/112 [00:02<00:23,  4.46it/s][A
Training:  10%|▉         | 11/112 [00:02<00:17,  5.77it/s][A
Training:  12%|█▏        | 13/112 [00:03<00:24,  4.03it/s][A
Training:  14%|█▍        | 16/112 [00:03<00:16,  5.99it/s][A
Training:  16%|█▌        | 18/112 [00:04<00:20,  4.64it/s][A
Training:  18%|█▊        | 20/112 [00:04<00:16,  5.73it/s][A
Training:  20%|█▉        | 22/112 [00:05<00:21,  4.23it/s][A
Training:  21%|██▏       | 24/112 [00:05<00:16,  5.42it/s][A
Training:  23%|██▎       | 26/112 [00:05<00:18,  4.64it/s][A
Training:  26%|██▌       | 29/112 [00:06<00:19,  4.22it/s][A
Training:  28%|██▊       | 31/112 [00:06<00:15,  5.19it/s][A
Training:  29%|██▉       | 33/112 [00:07<00:18,  4.30it/s][A
Training:  32%|███▏ 

Epoch: 30/69 - Loss: 0.2766 - Accuracy: 0.9273



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:17,  1.36s/it][A
 21%|██▏       | 3/14 [00:01<00:04,  2.50it/s][A
 36%|███▌      | 5/14 [00:02<00:03,  2.86it/s][A
 50%|█████     | 7/14 [00:02<00:01,  3.99it/s][A
 64%|██████▍   | 9/14 [00:02<00:01,  3.92it/s][A
 79%|███████▊  | 11/14 [00:03<00:00,  5.04it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.84it/s][A
Epochs:  43%|████▎     | 30/69 [13:17<17:20, 26.69s/it]

Val Loss: 0.3100 - Val Accuracy: 0.9210



Training:   0%|          | 0/112 [00:00<?, ?it/s][A
Training:   1%|          | 1/112 [00:01<02:12,  1.19s/it][A
Training:   3%|▎         | 3/112 [00:01<00:38,  2.81it/s][A
Training:   4%|▍         | 5/112 [00:02<00:38,  2.81it/s][A
Training:   7%|▋         | 8/112 [00:02<00:20,  5.19it/s][A
Training:   9%|▉         | 10/112 [00:02<00:24,  4.16it/s][A
Training:  12%|█▏        | 13/112 [00:03<00:25,  3.85it/s][A
Training:  13%|█▎        | 15/112 [00:03<00:19,  4.96it/s][A
Training:  15%|█▌        | 17/112 [00:04<00:24,  3.85it/s][A
Training:  17%|█▋        | 19/112 [00:04<00:19,  4.86it/s][A
Training:  18%|█▊        | 20/112 [00:04<00:17,  5.29it/s][A
Training:  19%|█▉        | 21/112 [00:05<00:24,  3.79it/s][A
Training:  21%|██▏       | 24/112 [00:05<00:13,  6.31it/s][A
Training:  23%|██▎       | 26/112 [00:06<00:18,  4.70it/s][A
Training:  26%|██▌       | 29/112 [00:06<00:17,  4.70it/s][A
Training:  28%|██▊       | 31/112 [00:06<00:13,  5.82it/s][A
Training:  29%|██▉  

Epoch: 31/69 - Loss: 0.3147 - Accuracy: 0.9253



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:13,  1.01s/it][A
 21%|██▏       | 3/14 [00:01<00:03,  3.29it/s][A
 36%|███▌      | 5/14 [00:01<00:02,  3.03it/s][A
 64%|██████▍   | 9/14 [00:02<00:01,  4.20it/s][A
100%|██████████| 14/14 [00:03<00:00,  4.30it/s][A
Epochs:  45%|████▍     | 31/69 [13:43<16:49, 26.57s/it]

Val Loss: 0.3404 - Val Accuracy: 0.8946



Training:   0%|          | 0/112 [00:00<?, ?it/s][A
Training:   1%|          | 1/112 [00:01<01:59,  1.07s/it][A
Training:   4%|▍         | 5/112 [00:01<00:33,  3.16it/s][A
Training:   7%|▋         | 8/112 [00:01<00:19,  5.32it/s][A
Training:   9%|▉         | 10/112 [00:02<00:25,  3.93it/s][A
Training:  12%|█▏        | 13/112 [00:03<00:23,  4.25it/s][A
Training:  13%|█▎        | 15/112 [00:03<00:18,  5.35it/s][A
Training:  15%|█▌        | 17/112 [00:04<00:20,  4.58it/s][A
Training:  18%|█▊        | 20/112 [00:04<00:13,  6.66it/s][A
Training:  20%|█▉        | 22/112 [00:05<00:19,  4.55it/s][A
Training:  22%|██▏       | 25/112 [00:05<00:19,  4.38it/s][A
Training:  26%|██▌       | 29/112 [00:06<00:17,  4.69it/s][A
Training:  27%|██▋       | 30/112 [00:06<00:16,  4.93it/s][A
Training:  29%|██▉       | 33/112 [00:07<00:17,  4.60it/s][A
Training:  32%|███▏      | 36/112 [00:07<00:11,  6.36it/s][A
Training:  34%|███▍      | 38/112 [00:08<00:14,  5.00it/s][A
Training:  37%|███▋

Epoch: 32/69 - Loss: 8.0058 - Accuracy: 0.8878



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:13,  1.05s/it][A
 29%|██▊       | 4/14 [00:01<00:02,  4.34it/s][A
 43%|████▎     | 6/14 [00:01<00:02,  3.61it/s][A
 64%|██████▍   | 9/14 [00:02<00:01,  4.06it/s][A
 71%|███████▏  | 10/14 [00:02<00:00,  4.07it/s][A
 93%|█████████▎| 13/14 [00:03<00:00,  4.96it/s][A
100%|██████████| 14/14 [00:03<00:00,  4.12it/s][A
Epochs:  46%|████▋     | 32/69 [14:09<16:19, 26.48s/it]

Val Loss: 3.1041 - Val Accuracy: 0.8790



Training:   0%|          | 0/112 [00:00<?, ?it/s][A
Training:   1%|          | 1/112 [00:01<02:16,  1.23s/it][A
Training:   4%|▍         | 5/112 [00:02<00:38,  2.79it/s][A
Training:   6%|▋         | 7/112 [00:02<00:25,  4.05it/s][A
Training:   8%|▊         | 9/112 [00:02<00:28,  3.68it/s][A
Training:  10%|▉         | 11/112 [00:02<00:20,  4.89it/s][A
Training:  12%|█▏        | 13/112 [00:03<00:23,  4.19it/s][A
Training:  13%|█▎        | 15/112 [00:03<00:17,  5.47it/s][A
Training:  15%|█▌        | 17/112 [00:04<00:21,  4.49it/s][A
Training:  18%|█▊        | 20/112 [00:04<00:13,  6.78it/s][A
Training:  20%|█▉        | 22/112 [00:05<00:17,  5.06it/s][A
Training:  22%|██▏       | 25/112 [00:05<00:20,  4.34it/s][A
Training:  26%|██▌       | 29/112 [00:06<00:18,  4.58it/s][A
Training:  28%|██▊       | 31/112 [00:06<00:14,  5.50it/s][A
Training:  29%|██▉       | 33/112 [00:07<00:17,  4.46it/s][A
Training:  32%|███▏      | 36/112 [00:07<00:12,  6.09it/s][A
Training:  34%|███▍ 

Epoch: 33/69 - Loss: 1.2242 - Accuracy: 0.9124



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:15,  1.22s/it][A
 36%|███▌      | 5/14 [00:01<00:03,  3.00it/s][A
 43%|████▎     | 6/14 [00:02<00:02,  3.48it/s][A
 64%|██████▍   | 9/14 [00:02<00:01,  4.21it/s][A
 71%|███████▏  | 10/14 [00:02<00:00,  4.13it/s][A
 86%|████████▌ | 12/14 [00:03<00:00,  5.65it/s][A
 93%|█████████▎| 13/14 [00:03<00:00,  4.41it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.79it/s][A
Epochs:  48%|████▊     | 33/69 [14:36<15:58, 26.62s/it]

Val Loss: 1.1148 - Val Accuracy: 0.8098



Training:   0%|          | 0/112 [00:00<?, ?it/s][A
Training:   1%|          | 1/112 [00:01<02:17,  1.24s/it][A
Training:   4%|▎         | 4/112 [00:01<00:28,  3.81it/s][A
Training:   5%|▌         | 6/112 [00:01<00:27,  3.79it/s][A
Training:   7%|▋         | 8/112 [00:02<00:19,  5.26it/s][A
Training:   9%|▉         | 10/112 [00:02<00:25,  4.03it/s][A
Training:  11%|█         | 12/112 [00:02<00:19,  5.25it/s][A
Training:  12%|█▎        | 14/112 [00:03<00:25,  3.79it/s][A
Training:  13%|█▎        | 15/112 [00:03<00:22,  4.23it/s][A
Training:  15%|█▌        | 17/112 [00:04<00:21,  4.52it/s][A
Training:  16%|█▌        | 18/112 [00:04<00:22,  4.10it/s][A
Training:  19%|█▉        | 21/112 [00:05<00:18,  4.85it/s][A
Training:  20%|█▉        | 22/112 [00:05<00:19,  4.52it/s][A
Training:  22%|██▏       | 25/112 [00:05<00:16,  5.21it/s][A
Training:  23%|██▎       | 26/112 [00:06<00:17,  4.86it/s][A
Training:  26%|██▌       | 29/112 [00:06<00:16,  5.12it/s][A
Training:  27%|██▋  

Epoch: 34/69 - Loss: 2.6498 - Accuracy: 0.9077



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:16,  1.29s/it][A
 29%|██▊       | 4/14 [00:01<00:02,  3.67it/s][A
 43%|████▎     | 6/14 [00:02<00:02,  3.35it/s][A
 64%|██████▍   | 9/14 [00:02<00:01,  3.87it/s][A
 79%|███████▊  | 11/14 [00:02<00:00,  5.09it/s][A
 93%|█████████▎| 13/14 [00:03<00:00,  4.78it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.91it/s][A
Epochs:  49%|████▉     | 34/69 [15:03<15:35, 26.74s/it]

Val Loss: 1.1556 - Val Accuracy: 0.9255



Training:   0%|          | 0/112 [00:00<?, ?it/s][A
Training:   1%|          | 1/112 [00:01<02:08,  1.16s/it][A
Training:   3%|▎         | 3/112 [00:01<00:38,  2.86it/s][A
Training:   4%|▍         | 5/112 [00:01<00:37,  2.85it/s][A
Training:   5%|▌         | 6/112 [00:02<00:30,  3.52it/s][A
Training:   8%|▊         | 9/112 [00:02<00:24,  4.13it/s][A
Training:  10%|▉         | 11/112 [00:02<00:19,  5.12it/s][A
Training:  12%|█▏        | 13/112 [00:03<00:20,  4.90it/s][A
Training:  13%|█▎        | 15/112 [00:03<00:16,  5.79it/s][A
Training:  15%|█▌        | 17/112 [00:04<00:22,  4.25it/s][A
Training:  17%|█▋        | 19/112 [00:04<00:18,  5.09it/s][A
Training:  19%|█▉        | 21/112 [00:05<00:21,  4.26it/s][A
Training:  21%|██        | 23/112 [00:05<00:16,  5.55it/s][A
Training:  22%|██▏       | 25/112 [00:05<00:20,  4.33it/s][A
Training:  26%|██▌       | 29/112 [00:06<00:17,  4.83it/s][A
Training:  29%|██▊       | 32/112 [00:06<00:12,  6.52it/s][A
Training:  30%|███   

Epoch: 35/69 - Loss: 0.8887 - Accuracy: 0.9187



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:15,  1.17s/it][A
 29%|██▊       | 4/14 [00:01<00:02,  3.92it/s][A
 43%|████▎     | 6/14 [00:02<00:02,  3.32it/s][A
 64%|██████▍   | 9/14 [00:02<00:01,  3.60it/s][A
100%|██████████| 14/14 [00:03<00:00,  4.14it/s][A
Epochs:  51%|█████     | 35/69 [15:29<15:05, 26.62s/it]

Val Loss: 0.5975 - Val Accuracy: 0.9244



Training:   0%|          | 0/112 [00:00<?, ?it/s][A
Training:   1%|          | 1/112 [00:00<01:38,  1.12it/s][A
Training:   2%|▏         | 2/112 [00:01<00:48,  2.28it/s][A
Training:   4%|▍         | 5/112 [00:01<00:30,  3.46it/s][A
Training:   5%|▌         | 6/112 [00:01<00:27,  3.93it/s][A
Training:   8%|▊         | 9/112 [00:02<00:23,  4.37it/s][A
Training:   9%|▉         | 10/112 [00:02<00:23,  4.39it/s][A
Training:  11%|█         | 12/112 [00:02<00:16,  6.00it/s][A
Training:  12%|█▏        | 13/112 [00:03<00:19,  4.97it/s][A
Training:  12%|█▎        | 14/112 [00:03<00:20,  4.75it/s][A
Training:  14%|█▍        | 16/112 [00:03<00:14,  6.44it/s][A
Training:  15%|█▌        | 17/112 [00:03<00:17,  5.32it/s][A
Training:  16%|█▌        | 18/112 [00:04<00:21,  4.35it/s][A
Training:  19%|█▉        | 21/112 [00:04<00:17,  5.22it/s][A
Training:  20%|█▉        | 22/112 [00:05<00:20,  4.50it/s][A
Training:  21%|██        | 23/112 [00:05<00:17,  5.04it/s][A
Training:  22%|██▏   

Epoch: 36/69 - Loss: 0.4274 - Accuracy: 0.9249



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:13,  1.05s/it][A
 21%|██▏       | 3/14 [00:01<00:03,  2.82it/s][A
 36%|███▌      | 5/14 [00:01<00:02,  3.08it/s][A
 50%|█████     | 7/14 [00:01<00:01,  4.77it/s][A
 64%|██████▍   | 9/14 [00:02<00:01,  3.91it/s][A
 79%|███████▊  | 11/14 [00:02<00:00,  5.25it/s][A
100%|██████████| 14/14 [00:03<00:00,  4.03it/s][A
Epochs:  52%|█████▏    | 36/69 [15:56<14:36, 26.56s/it]

Val Loss: 0.2218 - Val Accuracy: 0.9330



Training:   0%|          | 0/112 [00:00<?, ?it/s][A
Training:   1%|          | 1/112 [00:01<02:11,  1.18s/it][A
Training:   3%|▎         | 3/112 [00:01<00:38,  2.86it/s][A
Training:   4%|▍         | 5/112 [00:01<00:33,  3.16it/s][A
Training:   6%|▋         | 7/112 [00:01<00:21,  4.88it/s][A
Training:   8%|▊         | 9/112 [00:02<00:26,  3.83it/s][A
Training:  11%|█         | 12/112 [00:02<00:15,  6.26it/s][A
Training:  12%|█▎        | 14/112 [00:03<00:22,  4.45it/s][A
Training:  14%|█▍        | 16/112 [00:03<00:17,  5.64it/s][A
Training:  16%|█▌        | 18/112 [00:04<00:22,  4.13it/s][A
Training:  18%|█▊        | 20/112 [00:04<00:17,  5.39it/s][A
Training:  20%|█▉        | 22/112 [00:05<00:21,  4.18it/s][A
Training:  22%|██▏       | 25/112 [00:05<00:16,  5.13it/s][A
Training:  23%|██▎       | 26/112 [00:06<00:20,  4.22it/s][A
Training:  26%|██▌       | 29/112 [00:06<00:16,  4.91it/s][A
Training:  27%|██▋       | 30/112 [00:06<00:18,  4.43it/s][A
Training:  29%|██▊   

Epoch: 37/69 - Loss: 0.3174 - Accuracy: 0.9250



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:14,  1.11s/it][A
 14%|█▍        | 2/14 [00:01<00:06,  1.82it/s][A
 36%|███▌      | 5/14 [00:02<00:03,  2.99it/s][A
 57%|█████▋    | 8/14 [00:02<00:01,  5.08it/s][A
 64%|██████▍   | 9/14 [00:02<00:01,  3.48it/s][A
 86%|████████▌ | 12/14 [00:03<00:00,  5.40it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.80it/s][A
Epochs:  54%|█████▎    | 37/69 [16:23<14:14, 26.70s/it]

Val Loss: 0.5315 - Val Accuracy: 0.9393



Training:   0%|          | 0/112 [00:00<?, ?it/s][A
Training:   1%|          | 1/112 [00:01<01:58,  1.07s/it][A
Training:   3%|▎         | 3/112 [00:01<00:35,  3.08it/s][A
Training:   4%|▍         | 5/112 [00:01<00:33,  3.19it/s][A
Training:   7%|▋         | 8/112 [00:01<00:18,  5.50it/s][A
Training:   9%|▉         | 10/112 [00:02<00:24,  4.11it/s][A
Training:  12%|█▏        | 13/112 [00:03<00:23,  4.18it/s][A
Training:  14%|█▍        | 16/112 [00:03<00:15,  6.09it/s][A
Training:  16%|█▌        | 18/112 [00:04<00:21,  4.42it/s][A
Training:  18%|█▊        | 20/112 [00:04<00:16,  5.61it/s][A
Training:  20%|█▉        | 22/112 [00:05<00:19,  4.51it/s][A
Training:  22%|██▏       | 25/112 [00:05<00:20,  4.27it/s][A
Training:  24%|██▍       | 27/112 [00:06<00:16,  5.15it/s][A
Training:  26%|██▌       | 29/112 [00:06<00:17,  4.65it/s][A
Training:  28%|██▊       | 31/112 [00:06<00:14,  5.48it/s][A
Training:  29%|██▉       | 33/112 [00:07<00:16,  4.82it/s][A
Training:  31%|███▏ 

Epoch: 38/69 - Loss: 0.5213 - Accuracy: 0.9217



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:14,  1.11s/it][A
 21%|██▏       | 3/14 [00:01<00:03,  3.06it/s][A
 36%|███▌      | 5/14 [00:01<00:03,  2.82it/s][A
 57%|█████▋    | 8/14 [00:02<00:01,  5.25it/s][A
 71%|███████▏  | 10/14 [00:02<00:01,  3.97it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.71it/s][A
Epochs:  55%|█████▌    | 38/69 [16:50<13:50, 26.78s/it]

Val Loss: 1.0194 - Val Accuracy: 0.9433



Training:   0%|          | 0/112 [00:00<?, ?it/s][A
Training:   1%|          | 1/112 [00:01<02:30,  1.35s/it][A
Training:   4%|▎         | 4/112 [00:01<00:31,  3.43it/s][A
Training:   5%|▌         | 6/112 [00:02<00:34,  3.07it/s][A
Training:   8%|▊         | 9/112 [00:02<00:28,  3.63it/s][A
Training:  10%|▉         | 11/112 [00:03<00:20,  4.86it/s][A
Training:  12%|█▏        | 13/112 [00:03<00:26,  3.68it/s][A
Training:  13%|█▎        | 15/112 [00:03<00:19,  4.90it/s][A
Training:  15%|█▌        | 17/112 [00:04<00:21,  4.51it/s][A
Training:  18%|█▊        | 20/112 [00:04<00:13,  6.67it/s][A
Training:  20%|█▉        | 22/112 [00:05<00:17,  5.04it/s][A
Training:  22%|██▏       | 25/112 [00:06<00:19,  4.56it/s][A
Training:  24%|██▍       | 27/112 [00:06<00:15,  5.52it/s][A
Training:  26%|██▌       | 29/112 [00:06<00:17,  4.77it/s][A
Training:  27%|██▋       | 30/112 [00:06<00:16,  4.86it/s][A
Training:  29%|██▊       | 32/112 [00:07<00:13,  6.12it/s][A
Training:  29%|██▉  

Epoch: 39/69 - Loss: 5.9973 - Accuracy: 0.8942



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:15,  1.16s/it][A
 36%|███▌      | 5/14 [00:01<00:02,  3.07it/s][A
 64%|██████▍   | 9/14 [00:02<00:01,  3.83it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.87it/s][A
Epochs:  57%|█████▋    | 39/69 [17:17<13:23, 26.77s/it]

Val Loss: 3.1680 - Val Accuracy: 0.9272



Training:   0%|          | 0/112 [00:00<?, ?it/s][A
Training:   1%|          | 1/112 [00:00<01:48,  1.02it/s][A
Training:   4%|▎         | 4/112 [00:01<00:23,  4.63it/s][A
Training:   5%|▌         | 6/112 [00:01<00:27,  3.90it/s][A
Training:   7%|▋         | 8/112 [00:01<00:18,  5.56it/s][A
Training:   9%|▉         | 10/112 [00:02<00:21,  4.68it/s][A
Training:  11%|█         | 12/112 [00:02<00:16,  5.91it/s][A
Training:  12%|█▎        | 14/112 [00:03<00:20,  4.79it/s][A
Training:  14%|█▍        | 16/112 [00:03<00:18,  5.15it/s][A
Training:  15%|█▌        | 17/112 [00:03<00:20,  4.56it/s][A
Training:  16%|█▌        | 18/112 [00:04<00:20,  4.52it/s][A
Training:  18%|█▊        | 20/112 [00:04<00:17,  5.38it/s][A
Training:  19%|█▉        | 21/112 [00:04<00:19,  4.70it/s][A
Training:  20%|█▉        | 22/112 [00:04<00:18,  4.98it/s][A
Training:  21%|██▏       | 24/112 [00:04<00:15,  5.83it/s][A
Training:  22%|██▏       | 25/112 [00:05<00:17,  5.10it/s][A
Training:  23%|██▎  

Epoch: 40/69 - Loss: 1.6300 - Accuracy: 0.9110



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:14,  1.15s/it][A
 36%|███▌      | 5/14 [00:01<00:02,  3.04it/s][A
 50%|█████     | 7/14 [00:02<00:01,  4.36it/s][A
 64%|██████▍   | 9/14 [00:02<00:01,  3.75it/s][A
 71%|███████▏  | 10/14 [00:02<00:00,  4.06it/s][A
 93%|█████████▎| 13/14 [00:03<00:00,  4.34it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.69it/s][A
Epochs:  58%|█████▊    | 40/69 [17:43<12:52, 26.65s/it]

Val Loss: 0.4806 - Val Accuracy: 0.9192



Training:   0%|          | 0/112 [00:00<?, ?it/s][A
Training:   1%|          | 1/112 [00:01<02:00,  1.08s/it][A
Training:   2%|▏         | 2/112 [00:01<01:00,  1.81it/s][A
Training:   4%|▎         | 4/112 [00:01<00:28,  3.84it/s][A
Training:   4%|▍         | 5/112 [00:01<00:30,  3.51it/s][A
Training:   5%|▌         | 6/112 [00:02<00:30,  3.49it/s][A
Training:   7%|▋         | 8/112 [00:02<00:25,  4.07it/s][A
Training:   8%|▊         | 9/112 [00:02<00:22,  4.49it/s][A
Training:   9%|▉         | 10/112 [00:02<00:25,  4.00it/s][A
Training:  11%|█         | 12/112 [00:03<00:24,  4.12it/s][A
Training:  12%|█▎        | 14/112 [00:03<00:20,  4.73it/s][A
Training:  14%|█▍        | 16/112 [00:04<00:20,  4.68it/s][A
Training:  16%|█▌        | 18/112 [00:04<00:17,  5.35it/s][A
Training:  18%|█▊        | 20/112 [00:04<00:19,  4.82it/s][A
Training:  20%|█▉        | 22/112 [00:05<00:16,  5.34it/s][A
Training:  21%|██▏       | 24/112 [00:05<00:20,  4.31it/s][A
Training:  23%|██▎     

Epoch: 41/69 - Loss: 0.4560 - Accuracy: 0.9220



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:18,  1.43s/it][A
 36%|███▌      | 5/14 [00:02<00:03,  2.86it/s][A
 43%|████▎     | 6/14 [00:02<00:02,  3.32it/s][A
 64%|██████▍   | 9/14 [00:02<00:01,  3.70it/s][A
 71%|███████▏  | 10/14 [00:03<00:01,  3.90it/s][A
 93%|█████████▎| 13/14 [00:03<00:00,  4.30it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.52it/s][A
Epochs:  59%|█████▉    | 41/69 [18:11<12:37, 27.07s/it]

Val Loss: 0.6606 - Val Accuracy: 0.9250



Training:   0%|          | 0/112 [00:00<?, ?it/s][A
Training:   1%|          | 1/112 [00:01<02:16,  1.23s/it][A
Training:   3%|▎         | 3/112 [00:01<00:41,  2.61it/s][A
Training:   4%|▍         | 5/112 [00:02<00:39,  2.70it/s][A
Training:   7%|▋         | 8/112 [00:02<00:20,  5.01it/s][A
Training:   9%|▉         | 10/112 [00:02<00:23,  4.25it/s][A
Training:  11%|█         | 12/112 [00:03<00:19,  5.18it/s][A
Training:  12%|█▏        | 13/112 [00:03<00:24,  3.98it/s][A
Training:  14%|█▍        | 16/112 [00:04<00:19,  4.89it/s][A
Training:  15%|█▌        | 17/112 [00:04<00:22,  4.23it/s][A
Training:  17%|█▋        | 19/112 [00:04<00:17,  5.26it/s][A
Training:  18%|█▊        | 20/112 [00:04<00:20,  4.53it/s][A
Training:  19%|█▉        | 21/112 [00:05<00:20,  4.53it/s][A
Training:  20%|█▉        | 22/112 [00:05<00:17,  5.17it/s][A
Training:  21%|██        | 23/112 [00:05<00:17,  5.15it/s][A
Training:  21%|██▏       | 24/112 [00:05<00:18,  4.65it/s][A
Training:  22%|██▏  

Epoch: 42/69 - Loss: 0.4044 - Accuracy: 0.9243



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:14,  1.08s/it][A
 14%|█▍        | 2/14 [00:01<00:06,  1.81it/s][A
 29%|██▊       | 4/14 [00:01<00:02,  4.08it/s][A
 36%|███▌      | 5/14 [00:01<00:02,  3.02it/s][A
 43%|████▎     | 6/14 [00:02<00:02,  3.32it/s][A
 64%|██████▍   | 9/14 [00:02<00:01,  3.78it/s][A
 71%|███████▏  | 10/14 [00:03<00:00,  4.14it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.67it/s][A
Epochs:  61%|██████    | 42/69 [18:39<12:14, 27.20s/it]

Val Loss: 0.5515 - Val Accuracy: 0.9324



Training:   0%|          | 0/112 [00:00<?, ?it/s][A
Training:   1%|          | 1/112 [00:01<02:12,  1.19s/it][A
Training:   3%|▎         | 3/112 [00:01<00:43,  2.50it/s][A
Training:   4%|▍         | 5/112 [00:01<00:34,  3.07it/s][A
Training:   5%|▌         | 6/112 [00:02<00:31,  3.40it/s][A
Training:   7%|▋         | 8/112 [00:02<00:20,  5.13it/s][A
Training:   8%|▊         | 9/112 [00:02<00:26,  3.86it/s][A
Training:   9%|▉         | 10/112 [00:03<00:26,  3.82it/s][A
Training:  12%|█▏        | 13/112 [00:03<00:20,  4.84it/s][A
Training:  12%|█▎        | 14/112 [00:03<00:21,  4.50it/s][A
Training:  15%|█▌        | 17/112 [00:04<00:21,  4.49it/s][A
Training:  16%|█▌        | 18/112 [00:04<00:19,  4.77it/s][A
Training:  17%|█▋        | 19/112 [00:04<00:17,  5.28it/s][A
Training:  19%|█▉        | 21/112 [00:05<00:21,  4.25it/s][A
Training:  20%|█▉        | 22/112 [00:05<00:18,  4.75it/s][A
Training:  21%|██▏       | 24/112 [00:05<00:13,  6.59it/s][A
Training:  23%|██▎    

Epoch: 43/69 - Loss: 0.4951 - Accuracy: 0.9260



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:14,  1.11s/it][A
 36%|███▌      | 5/14 [00:01<00:03,  2.88it/s][A
 57%|█████▋    | 8/14 [00:02<00:01,  4.98it/s][A
 71%|███████▏  | 10/14 [00:02<00:01,  3.98it/s][A
100%|██████████| 14/14 [00:03<00:00,  4.03it/s][A
Epochs:  62%|██████▏   | 43/69 [19:05<11:42, 27.02s/it]

Val Loss: 0.2955 - Val Accuracy: 0.9164



Training:   0%|          | 0/112 [00:00<?, ?it/s][A
Training:   1%|          | 1/112 [00:01<01:53,  1.03s/it][A
Training:   4%|▎         | 4/112 [00:01<00:24,  4.34it/s][A
Training:   5%|▌         | 6/112 [00:01<00:27,  3.90it/s][A
Training:   7%|▋         | 8/112 [00:01<00:20,  5.17it/s][A
Training:   8%|▊         | 9/112 [00:02<00:30,  3.42it/s][A
Training:  10%|▉         | 11/112 [00:02<00:22,  4.43it/s][A
Training:  12%|█▏        | 13/112 [00:03<00:22,  4.42it/s][A
Training:  13%|█▎        | 15/112 [00:03<00:17,  5.50it/s][A
Training:  15%|█▌        | 17/112 [00:03<00:17,  5.49it/s][A
Training:  17%|█▋        | 19/112 [00:04<00:15,  5.99it/s][A
Training:  19%|█▉        | 21/112 [00:04<00:17,  5.09it/s][A
Training:  21%|██        | 23/112 [00:05<00:17,  5.00it/s][A
Training:  22%|██▏       | 25/112 [00:05<00:18,  4.65it/s][A
Training:  24%|██▍       | 27/112 [00:05<00:15,  5.54it/s][A
Training:  26%|██▌       | 29/112 [00:06<00:17,  4.87it/s][A
Training:  28%|██▊   

Epoch: 44/69 - Loss: 2.5716 - Accuracy: 0.9208



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:14,  1.09s/it][A
 21%|██▏       | 3/14 [00:01<00:03,  2.78it/s][A
 36%|███▌      | 5/14 [00:01<00:02,  3.04it/s][A
 50%|█████     | 7/14 [00:02<00:01,  4.20it/s][A
 64%|██████▍   | 9/14 [00:02<00:01,  3.98it/s][A
 71%|███████▏  | 10/14 [00:02<00:00,  4.51it/s][A
 79%|███████▊  | 11/14 [00:03<00:00,  4.21it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.92it/s][A
Epochs:  64%|██████▍   | 44/69 [19:32<11:11, 26.86s/it]

Val Loss: 0.9701 - Val Accuracy: 0.9279



Training:   0%|          | 0/112 [00:00<?, ?it/s][A
Training:   1%|          | 1/112 [00:01<02:07,  1.15s/it][A
Training:   3%|▎         | 3/112 [00:01<00:37,  2.90it/s][A
Training:   4%|▍         | 5/112 [00:01<00:37,  2.87it/s][A
Training:   5%|▌         | 6/112 [00:02<00:30,  3.45it/s][A
Training:   7%|▋         | 8/112 [00:02<00:20,  5.07it/s][A
Training:   8%|▊         | 9/112 [00:02<00:31,  3.32it/s][A
Training:  10%|▉         | 11/112 [00:03<00:20,  4.84it/s][A
Training:  12%|█▏        | 13/112 [00:03<00:27,  3.61it/s][A
Training:  15%|█▌        | 17/112 [00:04<00:21,  4.42it/s][A
Training:  17%|█▋        | 19/112 [00:04<00:16,  5.57it/s][A
Training:  19%|█▉        | 21/112 [00:05<00:22,  4.03it/s][A
Training:  21%|██        | 23/112 [00:05<00:17,  5.20it/s][A
Training:  22%|██▏       | 25/112 [00:06<00:20,  4.15it/s][A
Training:  25%|██▌       | 28/112 [00:06<00:13,  6.04it/s][A
Training:  27%|██▋       | 30/112 [00:07<00:17,  4.67it/s][A
Training:  29%|██▉    

Epoch: 45/69 - Loss: 0.7802 - Accuracy: 0.9209



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:14,  1.14s/it][A
 21%|██▏       | 3/14 [00:01<00:03,  2.88it/s][A
 36%|███▌      | 5/14 [00:02<00:03,  2.78it/s][A
 50%|█████     | 7/14 [00:02<00:01,  3.97it/s][A
 64%|██████▍   | 9/14 [00:02<00:01,  3.72it/s][A
 79%|███████▊  | 11/14 [00:02<00:00,  4.98it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.82it/s][A
Epochs:  65%|██████▌   | 45/69 [19:59<10:48, 27.02s/it]

Val Loss: 1.5982 - Val Accuracy: 0.9123



Training:   0%|          | 0/112 [00:00<?, ?it/s][A
Training:   1%|          | 1/112 [00:01<02:31,  1.37s/it][A
Training:   3%|▎         | 3/112 [00:01<00:44,  2.43it/s][A
Training:   4%|▍         | 5/112 [00:02<00:37,  2.89it/s][A
Training:   6%|▋         | 7/112 [00:02<00:23,  4.40it/s][A
Training:   8%|▊         | 9/112 [00:02<00:28,  3.61it/s][A
Training:   9%|▉         | 10/112 [00:03<00:25,  4.05it/s][A
Training:  12%|█▏        | 13/112 [00:03<00:22,  4.31it/s][A
Training:  13%|█▎        | 15/112 [00:03<00:17,  5.58it/s][A
Training:  15%|█▌        | 17/112 [00:04<00:22,  4.28it/s][A
Training:  17%|█▋        | 19/112 [00:04<00:16,  5.55it/s][A
Training:  19%|█▉        | 21/112 [00:05<00:23,  3.85it/s][A
Training:  21%|██        | 23/112 [00:05<00:18,  4.91it/s][A
Training:  22%|██▏       | 25/112 [00:06<00:21,  4.00it/s][A
Training:  25%|██▌       | 28/112 [00:06<00:14,  5.88it/s][A
Training:  27%|██▋       | 30/112 [00:07<00:17,  4.57it/s][A
Training:  29%|██▉   

Epoch: 46/69 - Loss: 0.4890 - Accuracy: 0.9246



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:15,  1.22s/it][A
 36%|███▌      | 5/14 [00:02<00:03,  2.88it/s][A
 64%|██████▍   | 9/14 [00:02<00:01,  3.77it/s][A
 86%|████████▌ | 12/14 [00:02<00:00,  5.50it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.78it/s][A
Epochs:  67%|██████▋   | 46/69 [20:27<10:27, 27.28s/it]

Val Loss: 0.4280 - Val Accuracy: 0.8900



Training:   0%|          | 0/112 [00:00<?, ?it/s][A
Training:   1%|          | 1/112 [00:01<02:00,  1.09s/it][A
Training:   4%|▎         | 4/112 [00:01<00:25,  4.20it/s][A
Training:   5%|▌         | 6/112 [00:01<00:31,  3.34it/s][A
Training:   8%|▊         | 9/112 [00:02<00:30,  3.42it/s][A
Training:  11%|█         | 12/112 [00:02<00:19,  5.20it/s][A
Training:  12%|█▎        | 14/112 [00:03<00:24,  3.99it/s][A
Training:  15%|█▌        | 17/112 [00:04<00:22,  4.19it/s][A
Training:  17%|█▋        | 19/112 [00:04<00:17,  5.20it/s][A
Training:  19%|█▉        | 21/112 [00:05<00:20,  4.46it/s][A
Training:  20%|█▉        | 22/112 [00:05<00:21,  4.23it/s][A
Training:  22%|██▏       | 25/112 [00:05<00:18,  4.72it/s][A
Training:  23%|██▎       | 26/112 [00:06<00:21,  4.04it/s][A
Training:  25%|██▌       | 28/112 [00:06<00:15,  5.38it/s][A
Training:  26%|██▌       | 29/112 [00:06<00:18,  4.49it/s][A
Training:  27%|██▋       | 30/112 [00:07<00:19,  4.30it/s][A
Training:  29%|██▉  

Epoch: 47/69 - Loss: 0.3734 - Accuracy: 0.9253



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:14,  1.12s/it][A
 21%|██▏       | 3/14 [00:01<00:03,  2.94it/s][A
 36%|███▌      | 5/14 [00:01<00:03,  2.89it/s][A
 50%|█████     | 7/14 [00:02<00:01,  4.12it/s][A
 64%|██████▍   | 9/14 [00:02<00:01,  3.59it/s][A
 79%|███████▊  | 11/14 [00:02<00:00,  4.92it/s][A
 86%|████████▌ | 12/14 [00:03<00:00,  5.43it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.82it/s][A
Epochs:  68%|██████▊   | 47/69 [20:54<09:58, 27.19s/it]

Val Loss: 0.4578 - Val Accuracy: 0.9243



Training:   0%|          | 0/112 [00:00<?, ?it/s][A
Training:   1%|          | 1/112 [00:01<02:14,  1.21s/it][A
Training:   3%|▎         | 3/112 [00:01<00:39,  2.74it/s][A
Training:   4%|▍         | 5/112 [00:02<00:39,  2.70it/s][A
Training:   6%|▋         | 7/112 [00:02<00:25,  4.11it/s][A
Training:   8%|▊         | 9/112 [00:02<00:28,  3.60it/s][A
Training:  11%|█         | 12/112 [00:03<00:17,  5.80it/s][A
Training:  12%|█▎        | 14/112 [00:03<00:21,  4.48it/s][A
Training:  15%|█▌        | 17/112 [00:04<00:18,  5.02it/s][A
Training:  17%|█▋        | 19/112 [00:04<00:14,  6.28it/s][A
Training:  19%|█▉        | 21/112 [00:04<00:17,  5.30it/s][A
Training:  20%|█▉        | 22/112 [00:04<00:15,  5.68it/s][A
Training:  22%|██▏       | 25/112 [00:05<00:17,  4.99it/s][A
Training:  23%|██▎       | 26/112 [00:05<00:16,  5.13it/s][A
Training:  26%|██▌       | 29/112 [00:06<00:17,  4.85it/s][A
Training:  27%|██▋       | 30/112 [00:06<00:16,  5.09it/s][A
Training:  29%|██▊   

Epoch: 48/69 - Loss: 0.4056 - Accuracy: 0.9260



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:00<00:11,  1.12it/s][A
 14%|█▍        | 2/14 [00:01<00:06,  1.91it/s][A
 29%|██▊       | 4/14 [00:01<00:02,  4.29it/s][A
 36%|███▌      | 5/14 [00:01<00:02,  3.70it/s][A
 43%|████▎     | 6/14 [00:01<00:02,  3.65it/s][A
 57%|█████▋    | 8/14 [00:02<00:01,  5.37it/s][A
 64%|██████▍   | 9/14 [00:02<00:01,  3.87it/s][A
 71%|███████▏  | 10/14 [00:02<00:00,  4.05it/s][A
 79%|███████▊  | 11/14 [00:02<00:00,  4.50it/s][A
 93%|█████████▎| 13/14 [00:03<00:00,  4.44it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.85it/s][A
Epochs:  70%|██████▉   | 48/69 [21:21<09:28, 27.07s/it]

Val Loss: 0.4502 - Val Accuracy: 0.9152



Training:   0%|          | 0/112 [00:00<?, ?it/s][A
Training:   1%|          | 1/112 [00:01<02:04,  1.13s/it][A
Training:   3%|▎         | 3/112 [00:01<00:37,  2.91it/s][A
Training:   4%|▍         | 5/112 [00:01<00:35,  2.97it/s][A
Training:   5%|▌         | 6/112 [00:02<00:28,  3.67it/s][A
Training:   8%|▊         | 9/112 [00:02<00:27,  3.73it/s][A
Training:  10%|▉         | 11/112 [00:02<00:19,  5.08it/s][A
Training:  12%|█▏        | 13/112 [00:03<00:24,  4.03it/s][A
Training:  15%|█▌        | 17/112 [00:04<00:19,  4.83it/s][A
Training:  18%|█▊        | 20/112 [00:04<00:13,  6.74it/s][A
Training:  20%|█▉        | 22/112 [00:05<00:18,  4.96it/s][A
Training:  22%|██▏       | 25/112 [00:05<00:18,  4.61it/s][A
Training:  26%|██▌       | 29/112 [00:06<00:18,  4.39it/s][A
Training:  29%|██▊       | 32/112 [00:06<00:13,  5.73it/s][A
Training:  30%|███       | 34/112 [00:07<00:17,  4.58it/s][A
Training:  33%|███▎      | 37/112 [00:08<00:16,  4.63it/s][A
Training:  37%|███▋  

Epoch: 49/69 - Loss: 0.8336 - Accuracy: 0.9179



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:16,  1.25s/it][A
 29%|██▊       | 4/14 [00:01<00:02,  3.76it/s][A
 43%|████▎     | 6/14 [00:02<00:02,  2.91it/s][A
 64%|██████▍   | 9/14 [00:02<00:01,  3.71it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.85it/s][A
Epochs:  71%|███████   | 49/69 [21:48<09:01, 27.08s/it]

Val Loss: 1.0447 - Val Accuracy: 0.9232



Training:   0%|          | 0/112 [00:00<?, ?it/s][A
Training:   1%|          | 1/112 [00:01<02:18,  1.24s/it][A
Training:   3%|▎         | 3/112 [00:01<00:39,  2.73it/s][A
Training:   4%|▍         | 5/112 [00:02<00:37,  2.83it/s][A
Training:   8%|▊         | 9/112 [00:03<00:29,  3.46it/s][A
Training:  12%|█▏        | 13/112 [00:03<00:24,  4.10it/s][A
Training:  15%|█▌        | 17/112 [00:04<00:22,  4.25it/s][A
Training:  18%|█▊        | 20/112 [00:04<00:16,  5.58it/s][A
Training:  20%|█▉        | 22/112 [00:05<00:19,  4.52it/s][A
Training:  21%|██▏       | 24/112 [00:05<00:15,  5.53it/s][A
Training:  23%|██▎       | 26/112 [00:06<00:18,  4.63it/s][A
Training:  24%|██▍       | 27/112 [00:06<00:17,  4.73it/s][A
Training:  26%|██▌       | 29/112 [00:07<00:22,  3.75it/s][A
Training:  28%|██▊       | 31/112 [00:07<00:16,  4.84it/s][A
Training:  29%|██▉       | 33/112 [00:08<00:21,  3.64it/s][A
Training:  33%|███▎      | 37/112 [00:09<00:17,  4.24it/s][A
Training:  37%|███▋ 

Epoch: 50/69 - Loss: 0.6701 - Accuracy: 0.9197



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:14,  1.13s/it][A
 36%|███▌      | 5/14 [00:02<00:03,  2.82it/s][A
 57%|█████▋    | 8/14 [00:02<00:01,  4.85it/s][A
 71%|███████▏  | 10/14 [00:02<00:00,  4.01it/s][A
 86%|████████▌ | 12/14 [00:02<00:00,  5.05it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.90it/s][A
Epochs:  72%|███████▏  | 50/69 [22:16<08:38, 27.28s/it]

Val Loss: 0.4169 - Val Accuracy: 0.9221



Training:   0%|          | 0/112 [00:00<?, ?it/s][A
Training:   1%|          | 1/112 [00:01<02:00,  1.08s/it][A
Training:   4%|▍         | 5/112 [00:01<00:37,  2.84it/s][A
Training:   8%|▊         | 9/112 [00:02<00:28,  3.62it/s][A
Training:  11%|█         | 12/112 [00:02<00:19,  5.26it/s][A
Training:  12%|█▎        | 14/112 [00:03<00:26,  3.74it/s][A
Training:  15%|█▌        | 17/112 [00:04<00:22,  4.15it/s][A
Training:  19%|█▉        | 21/112 [00:05<00:20,  4.41it/s][A
Training:  21%|██▏       | 24/112 [00:05<00:15,  5.77it/s][A
Training:  23%|██▎       | 26/112 [00:06<00:18,  4.65it/s][A
Training:  25%|██▌       | 28/112 [00:06<00:15,  5.37it/s][A
Training:  26%|██▌       | 29/112 [00:06<00:20,  4.11it/s][A
Training:  29%|██▊       | 32/112 [00:07<00:14,  5.42it/s][A
Training:  29%|██▉       | 33/112 [00:07<00:18,  4.35it/s][A
Training:  32%|███▏      | 36/112 [00:08<00:13,  5.72it/s][A
Training:  33%|███▎      | 37/112 [00:08<00:15,  4.85it/s][A
Training:  35%|███▍

Epoch: 51/69 - Loss: 1.2358 - Accuracy: 0.9160



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:14,  1.09s/it][A
 29%|██▊       | 4/14 [00:01<00:02,  4.15it/s][A
 43%|████▎     | 6/14 [00:01<00:02,  3.59it/s][A
 50%|█████     | 7/14 [00:01<00:01,  4.17it/s][A
 64%|██████▍   | 9/14 [00:02<00:01,  3.48it/s][A
 71%|███████▏  | 10/14 [00:02<00:01,  3.75it/s][A
 86%|████████▌ | 12/14 [00:03<00:00,  5.03it/s][A
 93%|█████████▎| 13/14 [00:03<00:00,  4.20it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.75it/s][A
Epochs:  74%|███████▍  | 51/69 [22:43<08:10, 27.23s/it]

Val Loss: 1.8302 - Val Accuracy: 0.9359



Training:   0%|          | 0/112 [00:00<?, ?it/s][A
Training:   1%|          | 1/112 [00:01<01:55,  1.04s/it][A
Training:   3%|▎         | 3/112 [00:01<00:38,  2.86it/s][A
Training:   4%|▍         | 5/112 [00:01<00:36,  2.92it/s][A
Training:   6%|▋         | 7/112 [00:02<00:25,  4.14it/s][A
Training:   8%|▊         | 9/112 [00:02<00:26,  3.83it/s][A
Training:  10%|▉         | 11/112 [00:02<00:20,  5.02it/s][A
Training:  12%|█▏        | 13/112 [00:03<00:25,  3.91it/s][A
Training:  15%|█▌        | 17/112 [00:04<00:20,  4.68it/s][A
Training:  18%|█▊        | 20/112 [00:04<00:14,  6.43it/s][A
Training:  20%|█▉        | 22/112 [00:05<00:19,  4.56it/s][A
Training:  22%|██▏       | 25/112 [00:05<00:19,  4.55it/s][A
Training:  24%|██▍       | 27/112 [00:06<00:15,  5.49it/s][A
Training:  26%|██▌       | 29/112 [00:06<00:17,  4.69it/s][A
Training:  27%|██▋       | 30/112 [00:06<00:16,  5.10it/s][A
Training:  29%|██▉       | 33/112 [00:07<00:14,  5.32it/s][A
Training:  30%|███   

Epoch: 52/69 - Loss: 2.3738 - Accuracy: 0.9046



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:13,  1.07s/it][A
 21%|██▏       | 3/14 [00:01<00:03,  2.98it/s][A
 36%|███▌      | 5/14 [00:01<00:02,  3.02it/s][A
 43%|████▎     | 6/14 [00:01<00:02,  3.65it/s][A
 64%|██████▍   | 9/14 [00:02<00:01,  4.26it/s][A
 71%|███████▏  | 10/14 [00:02<00:00,  4.53it/s][A
 86%|████████▌ | 12/14 [00:02<00:00,  6.24it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.94it/s][A
Epochs:  75%|███████▌  | 52/69 [23:10<07:40, 27.11s/it]

Val Loss: 0.5810 - Val Accuracy: 0.9290



Training:   0%|          | 0/112 [00:00<?, ?it/s][A
Training:   1%|          | 1/112 [00:01<02:15,  1.22s/it][A
Training:   3%|▎         | 3/112 [00:01<00:38,  2.81it/s][A
Training:   4%|▍         | 5/112 [00:01<00:36,  2.97it/s][A
Training:   6%|▋         | 7/112 [00:02<00:23,  4.39it/s][A
Training:   8%|▊         | 9/112 [00:02<00:29,  3.52it/s][A
Training:  10%|▉         | 11/112 [00:02<00:20,  4.89it/s][A
Training:  12%|█▏        | 13/112 [00:03<00:23,  4.24it/s][A
Training:  13%|█▎        | 15/112 [00:03<00:17,  5.40it/s][A
Training:  15%|█▌        | 17/112 [00:04<00:21,  4.50it/s][A
Training:  17%|█▋        | 19/112 [00:04<00:17,  5.32it/s][A
Training:  19%|█▉        | 21/112 [00:05<00:21,  4.23it/s][A
Training:  21%|██        | 23/112 [00:05<00:17,  5.04it/s][A
Training:  22%|██▏       | 25/112 [00:05<00:18,  4.70it/s][A
Training:  23%|██▎       | 26/112 [00:06<00:17,  4.81it/s][A
Training:  25%|██▌       | 28/112 [00:06<00:13,  6.12it/s][A
Training:  26%|██▌   

Epoch: 53/69 - Loss: 0.5146 - Accuracy: 0.9225



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:14,  1.08s/it][A
 29%|██▊       | 4/14 [00:01<00:02,  4.25it/s][A
 43%|████▎     | 6/14 [00:01<00:02,  3.45it/s][A
 57%|█████▋    | 8/14 [00:02<00:01,  5.03it/s][A
 71%|███████▏  | 10/14 [00:02<00:01,  3.96it/s][A
 86%|████████▌ | 12/14 [00:02<00:00,  5.16it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.98it/s][A
Epochs:  77%|███████▋  | 53/69 [23:37<07:14, 27.17s/it]

Val Loss: 0.4133 - Val Accuracy: 0.9175



Training:   0%|          | 0/112 [00:00<?, ?it/s][A
Training:   1%|          | 1/112 [00:01<02:11,  1.18s/it][A
Training:   3%|▎         | 3/112 [00:01<00:40,  2.69it/s][A
Training:   4%|▍         | 5/112 [00:01<00:35,  3.04it/s][A
Training:   6%|▋         | 7/112 [00:02<00:24,  4.33it/s][A
Training:   8%|▊         | 9/112 [00:02<00:30,  3.34it/s][A
Training:  10%|▉         | 11/112 [00:03<00:21,  4.66it/s][A
Training:  12%|█▏        | 13/112 [00:03<00:28,  3.52it/s][A
Training:  13%|█▎        | 15/112 [00:04<00:20,  4.68it/s][A
Training:  15%|█▌        | 17/112 [00:04<00:23,  4.08it/s][A
Training:  18%|█▊        | 20/112 [00:04<00:14,  6.17it/s][A
Training:  20%|█▉        | 22/112 [00:05<00:20,  4.42it/s][A
Training:  21%|██▏       | 24/112 [00:05<00:15,  5.62it/s][A
Training:  23%|██▎       | 26/112 [00:06<00:20,  4.28it/s][A
Training:  25%|██▌       | 28/112 [00:06<00:15,  5.45it/s][A
Training:  27%|██▋       | 30/112 [00:07<00:20,  4.01it/s][A
Training:  29%|██▉   

Epoch: 54/69 - Loss: 4.6968 - Accuracy: 0.9008



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:17,  1.32s/it][A
 36%|███▌      | 5/14 [00:02<00:03,  2.85it/s][A
 64%|██████▍   | 9/14 [00:02<00:01,  3.80it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.87it/s][A
Epochs:  78%|███████▊  | 54/69 [24:04<06:48, 27.23s/it]

Val Loss: 3.8242 - Val Accuracy: 0.9248



Training:   0%|          | 0/112 [00:00<?, ?it/s][A
Training:   1%|          | 1/112 [00:01<02:15,  1.22s/it][A
Training:   3%|▎         | 3/112 [00:01<00:38,  2.83it/s][A
Training:   4%|▍         | 5/112 [00:02<00:38,  2.77it/s][A
Training:   7%|▋         | 8/112 [00:02<00:20,  5.08it/s][A
Training:   9%|▉         | 10/112 [00:02<00:26,  3.82it/s][A
Training:  11%|█         | 12/112 [00:03<00:19,  5.14it/s][A
Training:  12%|█▎        | 14/112 [00:03<00:25,  3.86it/s][A
Training:  15%|█▌        | 17/112 [00:04<00:24,  3.93it/s][A
Training:  18%|█▊        | 20/112 [00:04<00:16,  5.61it/s][A
Training:  20%|█▉        | 22/112 [00:05<00:20,  4.45it/s][A
Training:  21%|██▏       | 24/112 [00:05<00:15,  5.61it/s][A
Training:  23%|██▎       | 26/112 [00:06<00:17,  4.87it/s][A
Training:  26%|██▌       | 29/112 [00:06<00:19,  4.30it/s][A
Training:  29%|██▉       | 33/112 [00:07<00:17,  4.52it/s][A
Training:  33%|███▎      | 37/112 [00:08<00:15,  4.91it/s][A
Training:  35%|███▍ 

Epoch: 55/69 - Loss: 1.2474 - Accuracy: 0.9167



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:00<00:11,  1.18it/s][A
 21%|██▏       | 3/14 [00:00<00:02,  3.74it/s][A
 36%|███▌      | 5/14 [00:01<00:02,  3.16it/s][A
 57%|█████▋    | 8/14 [00:01<00:01,  5.82it/s][A
 71%|███████▏  | 10/14 [00:02<00:00,  4.52it/s][A
100%|██████████| 14/14 [00:03<00:00,  4.32it/s][A
Epochs:  80%|███████▉  | 55/69 [24:31<06:20, 27.21s/it]

Val Loss: 0.8223 - Val Accuracy: 0.9267



Training:   0%|          | 0/112 [00:00<?, ?it/s][A
Training:   1%|          | 1/112 [00:01<02:02,  1.11s/it][A
Training:   2%|▏         | 2/112 [00:01<01:07,  1.64it/s][A
Training:   4%|▍         | 5/112 [00:01<00:31,  3.40it/s][A
Training:   5%|▌         | 6/112 [00:02<00:29,  3.57it/s][A
Training:   7%|▋         | 8/112 [00:02<00:19,  5.26it/s][A
Training:   8%|▊         | 9/112 [00:02<00:24,  4.16it/s][A
Training:   9%|▉         | 10/112 [00:03<00:28,  3.63it/s][A
Training:  11%|█         | 12/112 [00:03<00:18,  5.35it/s][A
Training:  12%|█▏        | 13/112 [00:03<00:22,  4.41it/s][A
Training:  12%|█▎        | 14/112 [00:03<00:26,  3.73it/s][A
Training:  15%|█▌        | 17/112 [00:04<00:17,  5.53it/s][A
Training:  16%|█▌        | 18/112 [00:04<00:21,  4.33it/s][A
Training:  18%|█▊        | 20/112 [00:04<00:16,  5.67it/s][A
Training:  19%|█▉        | 21/112 [00:04<00:14,  6.19it/s][A
Training:  20%|█▉        | 22/112 [00:05<00:23,  3.79it/s][A
Training:  22%|██▏    

Epoch: 56/69 - Loss: 0.6773 - Accuracy: 0.9198



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:16,  1.27s/it][A
 21%|██▏       | 3/14 [00:01<00:04,  2.71it/s][A
 36%|███▌      | 5/14 [00:02<00:03,  2.66it/s][A
 64%|██████▍   | 9/14 [00:02<00:01,  3.82it/s][A
 86%|████████▌ | 12/14 [00:02<00:00,  5.77it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.77it/s][A
Epochs:  81%|████████  | 56/69 [24:59<05:53, 27.23s/it]

Val Loss: 0.8632 - Val Accuracy: 0.9249



Training:   0%|          | 0/112 [00:00<?, ?it/s][A
Training:   1%|          | 1/112 [00:01<02:44,  1.49s/it][A
Training:   3%|▎         | 3/112 [00:01<00:48,  2.23it/s][A
Training:   4%|▍         | 5/112 [00:02<00:39,  2.70it/s][A
Training:   6%|▋         | 7/112 [00:02<00:25,  4.16it/s][A
Training:   8%|▊         | 9/112 [00:02<00:26,  3.82it/s][A
Training:  10%|▉         | 11/112 [00:03<00:19,  5.31it/s][A
Training:  12%|█▏        | 13/112 [00:03<00:25,  3.88it/s][A
Training:  13%|█▎        | 15/112 [00:03<00:18,  5.20it/s][A
Training:  15%|█▌        | 17/112 [00:04<00:21,  4.41it/s][A
Training:  19%|█▉        | 21/112 [00:05<00:19,  4.64it/s][A
Training:  21%|██        | 23/112 [00:05<00:15,  5.73it/s][A
Training:  22%|██▏       | 25/112 [00:06<00:19,  4.42it/s][A
Training:  24%|██▍       | 27/112 [00:06<00:15,  5.51it/s][A
Training:  26%|██▌       | 29/112 [00:07<00:19,  4.25it/s][A
Training:  28%|██▊       | 31/112 [00:07<00:14,  5.42it/s][A
Training:  29%|██▉   

Epoch: 57/69 - Loss: 0.4770 - Accuracy: 0.9236



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:15,  1.19s/it][A
 14%|█▍        | 2/14 [00:01<00:06,  1.77it/s][A
 36%|███▌      | 5/14 [00:02<00:02,  3.09it/s][A
 43%|████▎     | 6/14 [00:02<00:02,  3.34it/s][A
 64%|██████▍   | 9/14 [00:02<00:01,  3.90it/s][A
 71%|███████▏  | 10/14 [00:03<00:00,  4.19it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.82it/s][A
Epochs:  83%|████████▎ | 57/69 [25:26<05:28, 27.35s/it]

Val Loss: 0.3119 - Val Accuracy: 0.9438



Training:   0%|          | 0/112 [00:00<?, ?it/s][A
Training:   1%|          | 1/112 [00:01<02:25,  1.31s/it][A
Training:   3%|▎         | 3/112 [00:01<00:42,  2.59it/s][A
Training:   4%|▍         | 5/112 [00:02<00:38,  2.75it/s][A
Training:   6%|▋         | 7/112 [00:02<00:24,  4.32it/s][A
Training:   8%|▊         | 9/112 [00:02<00:26,  3.85it/s][A
Training:   9%|▉         | 10/112 [00:02<00:23,  4.35it/s][A
Training:  11%|█         | 12/112 [00:03<00:16,  6.13it/s][A
Training:  12%|█▎        | 14/112 [00:03<00:20,  4.82it/s][A
Training:  15%|█▌        | 17/112 [00:04<00:22,  4.25it/s][A
Training:  16%|█▌        | 18/112 [00:04<00:20,  4.56it/s][A
Training:  19%|█▉        | 21/112 [00:05<00:20,  4.44it/s][A
Training:  20%|█▉        | 22/112 [00:05<00:18,  4.75it/s][A
Training:  22%|██▏       | 25/112 [00:06<00:19,  4.50it/s][A
Training:  23%|██▎       | 26/112 [00:06<00:18,  4.66it/s][A
Training:  26%|██▌       | 29/112 [00:06<00:16,  4.92it/s][A
Training:  27%|██▋   

Epoch: 58/69 - Loss: 0.5262 - Accuracy: 0.9235



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:12,  1.00it/s][A
 29%|██▊       | 4/14 [00:01<00:02,  4.51it/s][A
 43%|████▎     | 6/14 [00:01<00:02,  3.22it/s][A
 64%|██████▍   | 9/14 [00:02<00:01,  3.40it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.95it/s][A
Epochs:  84%|████████▍ | 58/69 [25:53<04:59, 27.27s/it]

Val Loss: 0.5354 - Val Accuracy: 0.9427



Training:   0%|          | 0/112 [00:00<?, ?it/s][A
Training:   1%|          | 1/112 [00:01<02:16,  1.23s/it][A
Training:   3%|▎         | 3/112 [00:01<00:39,  2.74it/s][A
Training:   4%|▍         | 5/112 [00:02<00:40,  2.64it/s][A
Training:   6%|▋         | 7/112 [00:02<00:25,  4.10it/s][A
Training:   8%|▊         | 9/112 [00:02<00:29,  3.48it/s][A
Training:  12%|█▏        | 13/112 [00:03<00:23,  4.28it/s][A
Training:  15%|█▌        | 17/112 [00:04<00:22,  4.21it/s][A
Training:  19%|█▉        | 21/112 [00:05<00:19,  4.57it/s][A
Training:  20%|█▉        | 22/112 [00:05<00:18,  4.89it/s][A
Training:  21%|██▏       | 24/112 [00:05<00:14,  5.94it/s][A
Training:  22%|██▏       | 25/112 [00:06<00:20,  4.29it/s][A
Training:  23%|██▎       | 26/112 [00:06<00:19,  4.32it/s][A
Training:  26%|██▌       | 29/112 [00:07<00:17,  4.76it/s][A
Training:  27%|██▋       | 30/112 [00:07<00:17,  4.79it/s][A
Training:  29%|██▉       | 33/112 [00:07<00:14,  5.41it/s][A
Training:  30%|███   

Epoch: 59/69 - Loss: 0.5568 - Accuracy: 0.9224



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:14,  1.14s/it][A
 29%|██▊       | 4/14 [00:01<00:02,  3.92it/s][A
 43%|████▎     | 6/14 [00:01<00:02,  3.76it/s][A
 64%|██████▍   | 9/14 [00:02<00:01,  4.23it/s][A
 71%|███████▏  | 10/14 [00:02<00:00,  4.56it/s][A
100%|██████████| 14/14 [00:03<00:00,  4.13it/s][A
Epochs:  86%|████████▌ | 59/69 [26:21<04:33, 27.31s/it]

Val Loss: 0.5025 - Val Accuracy: 0.9175



Training:   0%|          | 0/112 [00:00<?, ?it/s][A
Training:   1%|          | 1/112 [00:01<02:00,  1.09s/it][A
Training:   3%|▎         | 3/112 [00:01<00:35,  3.09it/s][A
Training:   4%|▍         | 5/112 [00:01<00:33,  3.17it/s][A
Training:   6%|▋         | 7/112 [00:02<00:23,  4.43it/s][A
Training:   8%|▊         | 9/112 [00:02<00:25,  4.03it/s][A
Training:  10%|▉         | 11/112 [00:02<00:20,  4.91it/s][A
Training:  12%|█▏        | 13/112 [00:03<00:22,  4.39it/s][A
Training:  13%|█▎        | 15/112 [00:03<00:19,  5.10it/s][A
Training:  15%|█▌        | 17/112 [00:04<00:21,  4.34it/s][A
Training:  17%|█▋        | 19/112 [00:04<00:17,  5.19it/s][A
Training:  19%|█▉        | 21/112 [00:05<00:20,  4.35it/s][A
Training:  21%|██        | 23/112 [00:05<00:16,  5.55it/s][A
Training:  22%|██▏       | 25/112 [00:05<00:20,  4.31it/s][A
Training:  24%|██▍       | 27/112 [00:06<00:15,  5.60it/s][A
Training:  26%|██▌       | 29/112 [00:06<00:18,  4.41it/s][A
Training:  28%|██▊   

Epoch: 60/69 - Loss: 0.3810 - Accuracy: 0.9249



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:00<00:12,  1.02it/s][A
 36%|███▌      | 5/14 [00:01<00:02,  3.44it/s][A
 43%|████▎     | 6/14 [00:01<00:02,  3.66it/s][A
 64%|██████▍   | 9/14 [00:02<00:01,  4.35it/s][A
 71%|███████▏  | 10/14 [00:02<00:00,  4.28it/s][A
 86%|████████▌ | 12/14 [00:02<00:00,  5.78it/s][A
 93%|█████████▎| 13/14 [00:03<00:00,  4.65it/s][A
100%|██████████| 14/14 [00:03<00:00,  4.04it/s][A
Epochs:  87%|████████▋ | 60/69 [26:47<04:04, 27.12s/it]

Val Loss: 0.5431 - Val Accuracy: 0.9243



Training:   0%|          | 0/112 [00:00<?, ?it/s][A
Training:   1%|          | 1/112 [00:01<02:12,  1.20s/it][A
Training:   4%|▍         | 5/112 [00:02<00:39,  2.71it/s][A
Training:   6%|▋         | 7/112 [00:02<00:26,  3.90it/s][A
Training:   8%|▊         | 9/112 [00:02<00:28,  3.63it/s][A
Training:  11%|█         | 12/112 [00:02<00:17,  5.68it/s][A
Training:  12%|█▎        | 14/112 [00:03<00:20,  4.84it/s][A
Training:  14%|█▍        | 16/112 [00:03<00:16,  5.94it/s][A
Training:  16%|█▌        | 18/112 [00:04<00:21,  4.39it/s][A
Training:  18%|█▊        | 20/112 [00:04<00:17,  5.40it/s][A
Training:  19%|█▉        | 21/112 [00:05<00:25,  3.56it/s][A
Training:  22%|██▏       | 25/112 [00:06<00:20,  4.32it/s][A
Training:  25%|██▌       | 28/112 [00:06<00:13,  6.11it/s][A
Training:  27%|██▋       | 30/112 [00:06<00:17,  4.69it/s][A
Training:  29%|██▉       | 33/112 [00:07<00:17,  4.48it/s][A
Training:  32%|███▏      | 36/112 [00:07<00:12,  6.14it/s][A
Training:  34%|███▍ 

Epoch: 61/69 - Loss: 0.5717 - Accuracy: 0.9215



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:13,  1.00s/it][A
 29%|██▊       | 4/14 [00:01<00:02,  4.53it/s][A
 43%|████▎     | 6/14 [00:01<00:02,  3.26it/s][A
 64%|██████▍   | 9/14 [00:02<00:01,  3.23it/s][A
 86%|████████▌ | 12/14 [00:03<00:00,  5.03it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.91it/s][A
Epochs:  88%|████████▊ | 61/69 [27:15<03:38, 27.34s/it]

Val Loss: 0.6210 - Val Accuracy: 0.9140



Training:   0%|          | 0/112 [00:00<?, ?it/s][A
Training:   1%|          | 1/112 [00:01<02:02,  1.11s/it][A
Training:   3%|▎         | 3/112 [00:01<00:37,  2.93it/s][A
Training:   4%|▍         | 5/112 [00:01<00:34,  3.07it/s][A
Training:   6%|▋         | 7/112 [00:02<00:23,  4.49it/s][A
Training:   8%|▊         | 9/112 [00:02<00:26,  3.91it/s][A
Training:  11%|█         | 12/112 [00:02<00:16,  6.23it/s][A
Training:  12%|█▎        | 14/112 [00:03<00:21,  4.51it/s][A
Training:  15%|█▌        | 17/112 [00:04<00:21,  4.46it/s][A
Training:  16%|█▌        | 18/112 [00:04<00:21,  4.46it/s][A
Training:  18%|█▊        | 20/112 [00:04<00:15,  5.78it/s][A
Training:  19%|█▉        | 21/112 [00:05<00:24,  3.75it/s][A
Training:  20%|█▉        | 22/112 [00:05<00:21,  4.29it/s][A
Training:  21%|██▏       | 24/112 [00:05<00:15,  5.74it/s][A
Training:  22%|██▏       | 25/112 [00:05<00:21,  4.11it/s][A
Training:  23%|██▎       | 26/112 [00:06<00:18,  4.71it/s][A
Training:  25%|██▌   

Epoch: 62/69 - Loss: 0.5463 - Accuracy: 0.9221



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:00<00:12,  1.06it/s][A
 14%|█▍        | 2/14 [00:01<00:05,  2.06it/s][A
 36%|███▌      | 5/14 [00:01<00:02,  3.42it/s][A
 43%|████▎     | 6/14 [00:01<00:01,  4.03it/s][A
 64%|██████▍   | 9/14 [00:02<00:01,  3.75it/s][A
 79%|███████▊  | 11/14 [00:02<00:00,  5.06it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.79it/s][A
Epochs:  90%|████████▉ | 62/69 [27:43<03:12, 27.50s/it]

Val Loss: 0.8214 - Val Accuracy: 0.9192



Training:   0%|          | 0/112 [00:00<?, ?it/s][A
Training:   1%|          | 1/112 [00:01<01:57,  1.06s/it][A
Training:   4%|▎         | 4/112 [00:01<00:26,  4.13it/s][A
Training:   5%|▌         | 6/112 [00:01<00:28,  3.71it/s][A
Training:   8%|▊         | 9/112 [00:02<00:25,  4.09it/s][A
Training:  10%|▉         | 11/112 [00:02<00:19,  5.28it/s][A
Training:  12%|█▏        | 13/112 [00:03<00:23,  4.17it/s][A
Training:  13%|█▎        | 15/112 [00:03<00:17,  5.47it/s][A
Training:  15%|█▌        | 17/112 [00:03<00:20,  4.69it/s][A
Training:  16%|█▌        | 18/112 [00:04<00:18,  5.03it/s][A
Training:  18%|█▊        | 20/112 [00:04<00:14,  6.47it/s][A
Training:  20%|█▉        | 22/112 [00:04<00:19,  4.55it/s][A
Training:  21%|██▏       | 24/112 [00:05<00:15,  5.71it/s][A
Training:  22%|██▏       | 25/112 [00:05<00:20,  4.25it/s][A
Training:  24%|██▍       | 27/112 [00:05<00:15,  5.57it/s][A
Training:  25%|██▌       | 28/112 [00:06<00:15,  5.38it/s][A
Training:  26%|██▌  

Epoch: 63/69 - Loss: 1.2206 - Accuracy: 0.9153



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:00<00:12,  1.05it/s][A
 36%|███▌      | 5/14 [00:01<00:02,  3.56it/s][A
 50%|█████     | 7/14 [00:01<00:01,  5.13it/s][A
 64%|██████▍   | 9/14 [00:02<00:01,  4.24it/s][A
 79%|███████▊  | 11/14 [00:02<00:00,  5.65it/s][A
100%|██████████| 14/14 [00:03<00:00,  4.31it/s][A
Epochs:  91%|█████████▏| 63/69 [28:10<02:43, 27.33s/it]

Val Loss: 1.0619 - Val Accuracy: 0.9192



Training:   0%|          | 0/112 [00:00<?, ?it/s][A
Training:   1%|          | 1/112 [00:01<02:03,  1.11s/it][A
Training:   4%|▍         | 5/112 [00:01<00:35,  3.04it/s][A
Training:   7%|▋         | 8/112 [00:02<00:20,  5.15it/s][A
Training:   9%|▉         | 10/112 [00:02<00:26,  3.80it/s][A
Training:  10%|▉         | 11/112 [00:03<00:24,  4.10it/s][A
Training:  12%|█▏        | 13/112 [00:03<00:27,  3.57it/s][A
Training:  12%|█▎        | 14/112 [00:03<00:24,  4.08it/s][A
Training:  13%|█▎        | 15/112 [00:04<00:23,  4.09it/s][A
Training:  15%|█▌        | 17/112 [00:04<00:21,  4.45it/s][A
Training:  17%|█▋        | 19/112 [00:04<00:18,  5.15it/s][A
Training:  19%|█▉        | 21/112 [00:05<00:18,  5.02it/s][A
Training:  20%|█▉        | 22/112 [00:05<00:18,  4.99it/s][A
Training:  21%|██        | 23/112 [00:05<00:16,  5.56it/s][A
Training:  22%|██▏       | 25/112 [00:06<00:19,  4.47it/s][A
Training:  23%|██▎       | 26/112 [00:06<00:19,  4.49it/s][A
Training:  25%|██▌ 

Epoch: 64/69 - Loss: 1.1883 - Accuracy: 0.9176



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:00<00:12,  1.01it/s][A
 21%|██▏       | 3/14 [00:01<00:03,  3.33it/s][A
 36%|███▌      | 5/14 [00:01<00:02,  3.02it/s][A
 43%|████▎     | 6/14 [00:01<00:02,  3.64it/s][A
 64%|██████▍   | 9/14 [00:02<00:01,  3.89it/s][A
 71%|███████▏  | 10/14 [00:02<00:00,  4.19it/s][A
 86%|████████▌ | 12/14 [00:02<00:00,  5.65it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.89it/s][A
Epochs:  93%|█████████▎| 64/69 [28:38<02:16, 27.36s/it]

Val Loss: 0.5385 - Val Accuracy: 0.9067



Training:   0%|          | 0/112 [00:00<?, ?it/s][A
Training:   1%|          | 1/112 [00:01<01:50,  1.00it/s][A
Training:   2%|▏         | 2/112 [00:01<00:51,  2.13it/s][A
Training:   4%|▍         | 5/112 [00:01<00:30,  3.51it/s][A
Training:   5%|▌         | 6/112 [00:01<00:25,  4.20it/s][A
Training:   7%|▋         | 8/112 [00:01<00:16,  6.17it/s][A
Training:   9%|▉         | 10/112 [00:02<00:26,  3.84it/s][A
Training:  12%|█▏        | 13/112 [00:03<00:23,  4.28it/s][A
Training:  12%|█▎        | 14/112 [00:03<00:21,  4.60it/s][A
Training:  15%|█▌        | 17/112 [00:04<00:18,  5.04it/s][A
Training:  16%|█▌        | 18/112 [00:04<00:20,  4.56it/s][A
Training:  19%|█▉        | 21/112 [00:04<00:16,  5.41it/s][A
Training:  20%|█▉        | 22/112 [00:05<00:19,  4.58it/s][A
Training:  21%|██▏       | 24/112 [00:05<00:15,  5.78it/s][A
Training:  22%|██▏       | 25/112 [00:05<00:17,  5.11it/s][A
Training:  23%|██▎       | 26/112 [00:06<00:20,  4.11it/s][A
Training:  25%|██▌   

Epoch: 65/69 - Loss: 2.6205 - Accuracy: 0.9012



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:14,  1.11s/it][A
 21%|██▏       | 3/14 [00:01<00:03,  3.03it/s][A
 36%|███▌      | 5/14 [00:01<00:02,  3.14it/s][A
 50%|█████     | 7/14 [00:02<00:01,  4.31it/s][A
 64%|██████▍   | 9/14 [00:02<00:01,  4.04it/s][A
 79%|███████▊  | 11/14 [00:02<00:00,  5.11it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.82it/s][A
Epochs:  94%|█████████▍| 65/69 [29:04<01:48, 27.11s/it]

Val Loss: 1.9779 - Val Accuracy: 0.8602



Training:   0%|          | 0/112 [00:00<?, ?it/s][A
Training:   1%|          | 1/112 [00:01<01:51,  1.01s/it][A
Training:   4%|▎         | 4/112 [00:01<00:24,  4.48it/s][A
Training:   5%|▌         | 6/112 [00:01<00:31,  3.33it/s][A
Training:   7%|▋         | 8/112 [00:02<00:21,  4.89it/s][A
Training:   9%|▉         | 10/112 [00:02<00:26,  3.84it/s][A
Training:  12%|█▏        | 13/112 [00:03<00:24,  4.05it/s][A
Training:  14%|█▍        | 16/112 [00:03<00:16,  5.98it/s][A
Training:  16%|█▌        | 18/112 [00:04<00:21,  4.28it/s][A
Training:  18%|█▊        | 20/112 [00:04<00:17,  5.34it/s][A
Training:  20%|█▉        | 22/112 [00:05<00:20,  4.38it/s][A
Training:  21%|██▏       | 24/112 [00:05<00:15,  5.52it/s][A
Training:  23%|██▎       | 26/112 [00:05<00:18,  4.62it/s][A
Training:  25%|██▌       | 28/112 [00:06<00:14,  5.86it/s][A
Training:  27%|██▋       | 30/112 [00:06<00:18,  4.36it/s][A
Training:  29%|██▉       | 33/112 [00:07<00:19,  4.15it/s][A
Training:  31%|███▏ 

Epoch: 66/69 - Loss: 0.9851 - Accuracy: 0.9181



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:15,  1.23s/it][A
 21%|██▏       | 3/14 [00:01<00:04,  2.70it/s][A
 36%|███▌      | 5/14 [00:01<00:02,  3.16it/s][A
 43%|████▎     | 6/14 [00:02<00:02,  3.50it/s][A
 64%|██████▍   | 9/14 [00:02<00:01,  4.32it/s][A
 71%|███████▏  | 10/14 [00:02<00:00,  4.47it/s][A
 93%|█████████▎| 13/14 [00:03<00:00,  5.10it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.92it/s][A
Epochs:  96%|█████████▌| 66/69 [29:31<01:21, 27.11s/it]

Val Loss: 0.8238 - Val Accuracy: 0.9462



Training:   0%|          | 0/112 [00:00<?, ?it/s][A
Training:   1%|          | 1/112 [00:01<02:18,  1.24s/it][A
Training:   3%|▎         | 3/112 [00:01<00:39,  2.76it/s][A
Training:   4%|▍         | 5/112 [00:02<00:38,  2.77it/s][A
Training:   7%|▋         | 8/112 [00:02<00:19,  5.21it/s][A
Training:   9%|▉         | 10/112 [00:02<00:23,  4.25it/s][A
Training:  12%|█▏        | 13/112 [00:03<00:23,  4.20it/s][A
Training:  13%|█▎        | 15/112 [00:03<00:18,  5.28it/s][A
Training:  15%|█▌        | 17/112 [00:04<00:22,  4.28it/s][A
Training:  19%|█▉        | 21/112 [00:05<00:18,  4.87it/s][A
Training:  22%|██▏       | 25/112 [00:05<00:16,  5.26it/s][A
Training:  24%|██▍       | 27/112 [00:05<00:13,  6.09it/s][A
Training:  26%|██▌       | 29/112 [00:06<00:16,  5.13it/s][A
Training:  28%|██▊       | 31/112 [00:06<00:13,  6.11it/s][A
Training:  29%|██▉       | 33/112 [00:07<00:17,  4.42it/s][A
Training:  31%|███▏      | 35/112 [00:07<00:13,  5.52it/s][A
Training:  33%|███▎ 

Epoch: 67/69 - Loss: 1.0077 - Accuracy: 0.9221



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:15,  1.20s/it][A
 29%|██▊       | 4/14 [00:01<00:02,  3.77it/s][A
 43%|████▎     | 6/14 [00:02<00:02,  2.94it/s][A
 57%|█████▋    | 8/14 [00:02<00:01,  4.29it/s][A
 71%|███████▏  | 10/14 [00:03<00:01,  3.51it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.78it/s][A
Epochs:  97%|█████████▋| 67/69 [29:58<00:53, 26.94s/it]

Val Loss: 2.2813 - Val Accuracy: 0.9072



Training:   0%|          | 0/112 [00:00<?, ?it/s][A
Training:   1%|          | 1/112 [00:00<01:45,  1.05it/s][A
Training:   2%|▏         | 2/112 [00:01<00:54,  2.04it/s][A
Training:   4%|▍         | 5/112 [00:01<00:32,  3.30it/s][A
Training:   6%|▋         | 7/112 [00:01<00:21,  4.89it/s][A
Training:   8%|▊         | 9/112 [00:02<00:25,  4.01it/s][A
Training:  11%|█         | 12/112 [00:02<00:15,  6.42it/s][A
Training:  12%|█▎        | 14/112 [00:03<00:20,  4.87it/s][A
Training:  15%|█▌        | 17/112 [00:04<00:20,  4.53it/s][A
Training:  18%|█▊        | 20/112 [00:04<00:14,  6.30it/s][A
Training:  20%|█▉        | 22/112 [00:05<00:19,  4.57it/s][A
Training:  21%|██        | 23/112 [00:05<00:17,  4.97it/s][A
Training:  22%|██▏       | 25/112 [00:05<00:20,  4.28it/s][A
Training:  24%|██▍       | 27/112 [00:05<00:15,  5.47it/s][A
Training:  26%|██▌       | 29/112 [00:06<00:19,  4.31it/s][A
Training:  27%|██▋       | 30/112 [00:06<00:17,  4.75it/s][A
Training:  29%|██▉   

Epoch: 68/69 - Loss: 1.6026 - Accuracy: 0.9126



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:00<00:12,  1.02it/s][A
 14%|█▍        | 2/14 [00:01<00:07,  1.58it/s][A
 36%|███▌      | 5/14 [00:01<00:02,  3.53it/s][A
 43%|████▎     | 6/14 [00:02<00:02,  2.97it/s][A
 64%|██████▍   | 9/14 [00:02<00:01,  4.90it/s][A
 71%|███████▏  | 10/14 [00:03<00:01,  3.74it/s][A
 93%|█████████▎| 13/14 [00:03<00:00,  5.21it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.68it/s][A
Epochs:  99%|█████████▊| 68/69 [30:24<00:26, 26.88s/it]

Val Loss: 1.4613 - Val Accuracy: 0.9250



Training:   0%|          | 0/112 [00:00<?, ?it/s][A
Training:   1%|          | 1/112 [00:01<02:02,  1.11s/it][A
Training:   2%|▏         | 2/112 [00:01<00:57,  1.92it/s][A
Training:   4%|▍         | 5/112 [00:01<00:32,  3.34it/s][A
Training:   5%|▌         | 6/112 [00:02<00:27,  3.80it/s][A
Training:   8%|▊         | 9/112 [00:02<00:25,  4.07it/s][A
Training:  11%|█         | 12/112 [00:02<00:15,  6.34it/s][A
Training:  12%|█▎        | 14/112 [00:03<00:22,  4.43it/s][A
Training:  13%|█▎        | 15/112 [00:03<00:19,  4.85it/s][A
Training:  15%|█▌        | 17/112 [00:04<00:21,  4.39it/s][A
Training:  16%|█▌        | 18/112 [00:04<00:20,  4.61it/s][A
Training:  18%|█▊        | 20/112 [00:04<00:15,  6.05it/s][A
Training:  19%|█▉        | 21/112 [00:05<00:20,  4.48it/s][A
Training:  20%|█▉        | 22/112 [00:05<00:18,  4.80it/s][A
Training:  21%|██        | 23/112 [00:05<00:19,  4.53it/s][A
Training:  22%|██▏       | 25/112 [00:05<00:18,  4.65it/s][A
Training:  24%|██▍   

Epoch: 69/69 - Loss: 0.7823 - Accuracy: 0.9250



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:13,  1.01s/it][A
 21%|██▏       | 3/14 [00:01<00:03,  3.33it/s][A
 36%|███▌      | 5/14 [00:01<00:02,  3.07it/s][A
 50%|█████     | 7/14 [00:02<00:01,  4.30it/s][A
 64%|██████▍   | 9/14 [00:02<00:01,  3.72it/s][A
 79%|███████▊  | 11/14 [00:02<00:00,  4.67it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.83it/s][A
Epochs: 100%|██████████| 69/69 [30:52<00:00, 26.85s/it]


Val Loss: 1.3743 - Val Accuracy: 0.9025


[32m[I 2023-12-14 23:51:56,974][0m Trial 3 finished with value: 0.9025476574897766 and parameters: {'learning_rate': 0.02816733929912164, 'weight_decay': 0.001632793638917931, 'epsilon': 4.700125142204821e-08, 'batch_size': 125, 'epochs': 69}. Best is trial 1 with value: 0.94315505027771.[0m


Learning rate: 3.220616291387027e-05
Weight decay: 0.0010915949385844237
Epsilon: 7.0510050620049406e-09
Batch size: 134
Number of epochs: 66


Epochs:   0%|          | 0/66 [00:00<?, ?it/s]
Training:   0%|          | 0/105 [00:00<?, ?it/s][A
Training:   1%|          | 1/105 [00:01<02:05,  1.21s/it][A
Training:   2%|▏         | 2/105 [00:01<00:58,  1.77it/s][A
Training:   4%|▍         | 4/105 [00:01<00:24,  4.09it/s][A
Training:   6%|▌         | 6/105 [00:02<00:31,  3.12it/s][A
Training:   8%|▊         | 8/105 [00:02<00:20,  4.70it/s][A
Training:  10%|▉         | 10/105 [00:03<00:25,  3.75it/s][A
Training:  12%|█▏        | 13/105 [00:03<00:21,  4.20it/s][A
Training:  15%|█▌        | 16/105 [00:03<00:14,  6.02it/s][A
Training:  17%|█▋        | 18/105 [00:04<00:18,  4.73it/s][A
Training:  18%|█▊        | 19/105 [00:04<00:17,  5.01it/s][A
Training:  20%|██        | 21/105 [00:05<00:18,  4.48it/s][A
Training:  21%|██        | 22/105 [00:05<00:18,  4.46it/s][A
Training:  24%|██▍       | 25/105 [00:06<00:17,  4.61it/s][A
Training:  25%|██▍       | 26/105 [00:06<00:18,  4.30it/s][A
Training:  27%|██▋       | 28/105 [00

Epoch: 1/66 - Loss: 0.5739 - Accuracy: 0.7607



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:16,  1.26s/it][A
 29%|██▊       | 4/14 [00:01<00:02,  3.68it/s][A
 43%|████▎     | 6/14 [00:02<00:02,  3.15it/s][A
 57%|█████▋    | 8/14 [00:02<00:01,  4.45it/s][A
 71%|███████▏  | 10/14 [00:03<00:01,  3.59it/s][A
 79%|███████▊  | 11/14 [00:03<00:00,  3.97it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.62it/s][A
Epochs:   2%|▏         | 1/66 [00:27<29:48, 27.51s/it]

Val Loss: 0.4825 - Val Accuracy: 0.8481



Training:   0%|          | 0/105 [00:00<?, ?it/s][A
Training:   1%|          | 1/105 [00:01<01:57,  1.13s/it][A
Training:   3%|▎         | 3/105 [00:01<00:37,  2.73it/s][A
Training:   5%|▍         | 5/105 [00:01<00:33,  3.01it/s][A
Training:   7%|▋         | 7/105 [00:02<00:24,  4.06it/s][A
Training:   9%|▊         | 9/105 [00:02<00:27,  3.52it/s][A
Training:  10%|█         | 11/105 [00:03<00:21,  4.43it/s][A
Training:  12%|█▏        | 13/105 [00:03<00:23,  3.90it/s][A
Training:  14%|█▍        | 15/105 [00:03<00:18,  4.92it/s][A
Training:  16%|█▌        | 17/105 [00:04<00:21,  4.17it/s][A
Training:  18%|█▊        | 19/105 [00:04<00:16,  5.21it/s][A
Training:  20%|██        | 21/105 [00:05<00:20,  4.18it/s][A
Training:  24%|██▍       | 25/105 [00:06<00:17,  4.66it/s][A
Training:  26%|██▌       | 27/105 [00:06<00:14,  5.28it/s][A
Training:  28%|██▊       | 29/105 [00:06<00:16,  4.67it/s][A
Training:  30%|██▉       | 31/105 [00:07<00:15,  4.91it/s][A
Training:  31%|███▏  

Epoch: 2/66 - Loss: 0.4314 - Accuracy: 0.8511



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:14,  1.12s/it][A
 14%|█▍        | 2/14 [00:01<00:06,  1.88it/s][A
 29%|██▊       | 4/14 [00:01<00:02,  4.12it/s][A
 36%|███▌      | 5/14 [00:02<00:03,  2.73it/s][A
 43%|████▎     | 6/14 [00:02<00:02,  3.45it/s][A
 50%|█████     | 7/14 [00:02<00:01,  4.17it/s][A
 57%|█████▋    | 8/14 [00:02<00:01,  4.87it/s][A
 64%|██████▍   | 9/14 [00:02<00:01,  3.49it/s][A
 79%|███████▊  | 11/14 [00:03<00:00,  4.34it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.68it/s][A
Epochs:   3%|▎         | 2/66 [00:54<29:17, 27.46s/it]

Val Loss: 0.3848 - Val Accuracy: 0.8731



Training:   0%|          | 0/105 [00:00<?, ?it/s][A
Training:   1%|          | 1/105 [00:00<01:35,  1.09it/s][A
Training:   4%|▍         | 4/105 [00:01<00:20,  4.93it/s][A
Training:   6%|▌         | 6/105 [00:01<00:25,  3.93it/s][A
Training:   8%|▊         | 8/105 [00:01<00:19,  5.09it/s][A
Training:  10%|▉         | 10/105 [00:02<00:25,  3.71it/s][A
Training:  12%|█▏        | 13/105 [00:03<00:23,  3.87it/s][A
Training:  13%|█▎        | 14/105 [00:03<00:22,  3.97it/s][A
Training:  16%|█▌        | 17/105 [00:04<00:17,  4.92it/s][A
Training:  17%|█▋        | 18/105 [00:04<00:19,  4.53it/s][A
Training:  19%|█▉        | 20/105 [00:04<00:14,  5.91it/s][A
Training:  20%|██        | 21/105 [00:04<00:17,  4.68it/s][A
Training:  21%|██        | 22/105 [00:05<00:19,  4.31it/s][A
Training:  23%|██▎       | 24/105 [00:05<00:14,  5.76it/s][A
Training:  24%|██▍       | 25/105 [00:05<00:18,  4.42it/s][A
Training:  25%|██▍       | 26/105 [00:06<00:19,  4.03it/s][A
Training:  26%|██▌  

Epoch: 3/66 - Loss: 0.3547 - Accuracy: 0.8753



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:15,  1.18s/it][A
 21%|██▏       | 3/14 [00:01<00:04,  2.65it/s][A
 36%|███▌      | 5/14 [00:02<00:03,  2.84it/s][A
 43%|████▎     | 6/14 [00:02<00:02,  3.22it/s][A
 50%|█████     | 7/14 [00:02<00:01,  3.90it/s][A
 64%|██████▍   | 9/14 [00:02<00:01,  3.55it/s][A
 71%|███████▏  | 10/14 [00:03<00:01,  3.99it/s][A
 79%|███████▊  | 11/14 [00:03<00:00,  4.46it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.67it/s][A
Epochs:   5%|▍         | 3/66 [01:21<28:28, 27.12s/it]

Val Loss: 0.3269 - Val Accuracy: 0.8918



Training:   0%|          | 0/105 [00:00<?, ?it/s][A
Training:   1%|          | 1/105 [00:01<02:02,  1.18s/it][A
Training:   3%|▎         | 3/105 [00:01<00:36,  2.81it/s][A
Training:   5%|▍         | 5/105 [00:01<00:32,  3.04it/s][A
Training:   7%|▋         | 7/105 [00:02<00:23,  4.12it/s][A
Training:   9%|▊         | 9/105 [00:02<00:27,  3.47it/s][A
Training:  10%|█         | 11/105 [00:03<00:22,  4.22it/s][A
Training:  12%|█▏        | 13/105 [00:03<00:22,  4.11it/s][A
Training:  14%|█▍        | 15/105 [00:04<00:20,  4.41it/s][A
Training:  16%|█▌        | 17/105 [00:04<00:19,  4.58it/s][A
Training:  18%|█▊        | 19/105 [00:04<00:18,  4.59it/s][A
Training:  20%|██        | 21/105 [00:05<00:16,  5.12it/s][A
Training:  22%|██▏       | 23/105 [00:05<00:15,  5.28it/s][A
Training:  24%|██▍       | 25/105 [00:05<00:15,  5.17it/s][A
Training:  26%|██▌       | 27/105 [00:06<00:14,  5.25it/s][A
Training:  28%|██▊       | 29/105 [00:06<00:15,  4.89it/s][A
Training:  30%|██▉   

Epoch: 4/66 - Loss: 0.3072 - Accuracy: 0.8893



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:16,  1.29s/it][A
 36%|███▌      | 5/14 [00:02<00:03,  2.82it/s][A
 50%|█████     | 7/14 [00:02<00:01,  4.12it/s][A
 64%|██████▍   | 9/14 [00:03<00:01,  3.19it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.66it/s][A
Epochs:   6%|▌         | 4/66 [01:49<28:10, 27.26s/it]

Val Loss: 0.2872 - Val Accuracy: 0.9009



Training:   0%|          | 0/105 [00:00<?, ?it/s][A
Training:   1%|          | 1/105 [00:01<02:06,  1.21s/it][A
Training:   5%|▍         | 5/105 [00:02<00:35,  2.83it/s][A
Training:   7%|▋         | 7/105 [00:02<00:23,  4.14it/s][A
Training:   9%|▊         | 9/105 [00:02<00:26,  3.61it/s][A
Training:  10%|█         | 11/105 [00:02<00:19,  4.93it/s][A
Training:  12%|█▏        | 13/105 [00:03<00:25,  3.65it/s][A
Training:  15%|█▌        | 16/105 [00:03<00:16,  5.54it/s][A
Training:  17%|█▋        | 18/105 [00:04<00:20,  4.31it/s][A
Training:  20%|██        | 21/105 [00:05<00:19,  4.42it/s][A
Training:  23%|██▎       | 24/105 [00:05<00:13,  6.20it/s][A
Training:  25%|██▍       | 26/105 [00:06<00:17,  4.58it/s][A
Training:  28%|██▊       | 29/105 [00:07<00:18,  4.15it/s][A
Training:  29%|██▊       | 30/105 [00:07<00:16,  4.50it/s][A
Training:  31%|███▏      | 33/105 [00:08<00:17,  4.07it/s][A
Training:  33%|███▎      | 35/105 [00:08<00:14,  4.99it/s][A
Training:  35%|███▌ 

Epoch: 5/66 - Loss: 0.2742 - Accuracy: 0.8996



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:14,  1.14s/it][A
 14%|█▍        | 2/14 [00:01<00:06,  1.88it/s][A
 29%|██▊       | 4/14 [00:01<00:02,  4.30it/s][A
 43%|████▎     | 6/14 [00:02<00:02,  3.24it/s][A
 64%|██████▍   | 9/14 [00:03<00:01,  3.20it/s][A
 86%|████████▌ | 12/14 [00:03<00:00,  5.11it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.58it/s][A
Epochs:   8%|▊         | 5/66 [02:16<27:36, 27.16s/it]

Val Loss: 0.2617 - Val Accuracy: 0.9072



Training:   0%|          | 0/105 [00:00<?, ?it/s][A
Training:   1%|          | 1/105 [00:01<02:04,  1.20s/it][A
Training:   3%|▎         | 3/105 [00:01<00:38,  2.68it/s][A
Training:   5%|▍         | 5/105 [00:02<00:35,  2.78it/s][A
Training:   8%|▊         | 8/105 [00:02<00:18,  5.21it/s][A
Training:  10%|▉         | 10/105 [00:03<00:27,  3.51it/s][A
Training:  12%|█▏        | 13/105 [00:03<00:26,  3.49it/s][A
Training:  14%|█▍        | 15/105 [00:04<00:19,  4.51it/s][A
Training:  16%|█▌        | 17/105 [00:04<00:22,  3.90it/s][A
Training:  19%|█▉        | 20/105 [00:04<00:14,  5.82it/s][A
Training:  21%|██        | 22/105 [00:05<00:17,  4.67it/s][A
Training:  24%|██▍       | 25/105 [00:06<00:16,  4.76it/s][A
Training:  26%|██▌       | 27/105 [00:06<00:13,  5.90it/s][A
Training:  28%|██▊       | 29/105 [00:06<00:16,  4.60it/s][A
Training:  30%|██▉       | 31/105 [00:07<00:13,  5.43it/s][A
Training:  31%|███▏      | 33/105 [00:07<00:14,  4.84it/s][A
Training:  33%|███▎ 

Epoch: 6/66 - Loss: 0.2501 - Accuracy: 0.9078



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:15,  1.20s/it][A
 36%|███▌      | 5/14 [00:02<00:03,  2.54it/s][A
 57%|█████▋    | 8/14 [00:02<00:01,  4.47it/s][A
 71%|███████▏  | 10/14 [00:03<00:01,  3.48it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.55it/s][A
Epochs:   9%|▉         | 6/66 [02:43<27:06, 27.10s/it]

Val Loss: 0.2417 - Val Accuracy: 0.9152



Training:   0%|          | 0/105 [00:00<?, ?it/s][A
Training:   1%|          | 1/105 [00:01<01:56,  1.12s/it][A
Training:   3%|▎         | 3/105 [00:01<00:34,  2.94it/s][A
Training:   5%|▍         | 5/105 [00:01<00:28,  3.46it/s][A
Training:   7%|▋         | 7/105 [00:01<00:18,  5.31it/s][A
Training:   9%|▊         | 9/105 [00:02<00:26,  3.57it/s][A
Training:  12%|█▏        | 13/105 [00:03<00:23,  3.98it/s][A
Training:  15%|█▌        | 16/105 [00:03<00:15,  5.65it/s][A
Training:  17%|█▋        | 18/105 [00:04<00:19,  4.38it/s][A
Training:  20%|██        | 21/105 [00:05<00:19,  4.40it/s][A
Training:  24%|██▍       | 25/105 [00:05<00:15,  5.19it/s][A
Training:  28%|██▊       | 29/105 [00:06<00:15,  4.95it/s][A
Training:  30%|██▉       | 31/105 [00:06<00:12,  5.79it/s][A
Training:  31%|███▏      | 33/105 [00:07<00:16,  4.28it/s][A
Training:  35%|███▌      | 37/105 [00:08<00:15,  4.51it/s][A
Training:  39%|███▉      | 41/105 [00:09<00:14,  4.47it/s][A
Training:  41%|████  

Epoch: 7/66 - Loss: 0.2324 - Accuracy: 0.9137



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:15,  1.21s/it][A
 21%|██▏       | 3/14 [00:01<00:03,  2.79it/s][A
 36%|███▌      | 5/14 [00:02<00:03,  2.82it/s][A
 43%|████▎     | 6/14 [00:02<00:02,  3.40it/s][A
 50%|█████     | 7/14 [00:02<00:01,  4.11it/s][A
 64%|██████▍   | 9/14 [00:02<00:01,  3.47it/s][A
 79%|███████▊  | 11/14 [00:03<00:00,  5.02it/s][A
 86%|████████▌ | 12/14 [00:03<00:00,  4.99it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.59it/s][A
Epochs:  11%|█         | 7/66 [03:09<26:24, 26.86s/it]

Val Loss: 0.2314 - Val Accuracy: 0.9136



Training:   0%|          | 0/105 [00:00<?, ?it/s][A
Training:   1%|          | 1/105 [00:01<01:58,  1.13s/it][A
Training:   5%|▍         | 5/105 [00:01<00:32,  3.03it/s][A
Training:   8%|▊         | 8/105 [00:02<00:18,  5.18it/s][A
Training:  10%|▉         | 10/105 [00:02<00:24,  3.92it/s][A
Training:  11%|█▏        | 12/105 [00:02<00:18,  5.15it/s][A
Training:  13%|█▎        | 14/105 [00:03<00:23,  3.94it/s][A
Training:  15%|█▌        | 16/105 [00:03<00:17,  5.18it/s][A
Training:  17%|█▋        | 18/105 [00:04<00:21,  4.04it/s][A
Training:  19%|█▉        | 20/105 [00:04<00:15,  5.32it/s][A
Training:  21%|██        | 22/105 [00:05<00:21,  3.92it/s][A
Training:  24%|██▍       | 25/105 [00:06<00:18,  4.29it/s][A
Training:  26%|██▌       | 27/105 [00:06<00:14,  5.45it/s][A
Training:  28%|██▊       | 29/105 [00:06<00:17,  4.31it/s][A
Training:  30%|███       | 32/105 [00:07<00:11,  6.25it/s][A
Training:  32%|███▏      | 34/105 [00:07<00:16,  4.21it/s][A
Training:  34%|███▍

Epoch: 8/66 - Loss: 0.2197 - Accuracy: 0.9157



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:13,  1.07s/it][A
 14%|█▍        | 2/14 [00:01<00:06,  1.79it/s][A
 29%|██▊       | 4/14 [00:01<00:02,  4.00it/s][A
 36%|███▌      | 5/14 [00:01<00:02,  3.02it/s][A
 43%|████▎     | 6/14 [00:02<00:02,  3.59it/s][A
 50%|█████     | 7/14 [00:02<00:01,  3.92it/s][A
 64%|██████▍   | 9/14 [00:02<00:01,  3.72it/s][A
 79%|███████▊  | 11/14 [00:03<00:00,  4.35it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.73it/s][A
Epochs:  12%|█▏        | 8/66 [03:36<25:58, 26.87s/it]

Val Loss: 0.2161 - Val Accuracy: 0.9248



Training:   0%|          | 0/105 [00:00<?, ?it/s][A
Training:   1%|          | 1/105 [00:01<01:58,  1.14s/it][A
Training:   2%|▏         | 2/105 [00:01<00:55,  1.86it/s][A
Training:   4%|▍         | 4/105 [00:01<00:23,  4.26it/s][A
Training:   6%|▌         | 6/105 [00:02<00:29,  3.31it/s][A
Training:   9%|▊         | 9/105 [00:02<00:26,  3.58it/s][A
Training:  10%|█         | 11/105 [00:03<00:19,  4.73it/s][A
Training:  12%|█▏        | 13/105 [00:03<00:24,  3.75it/s][A
Training:  14%|█▍        | 15/105 [00:03<00:18,  4.87it/s][A
Training:  16%|█▌        | 17/105 [00:04<00:23,  3.67it/s][A
Training:  19%|█▉        | 20/105 [00:04<00:15,  5.57it/s][A
Training:  21%|██        | 22/105 [00:05<00:19,  4.22it/s][A
Training:  23%|██▎       | 24/105 [00:05<00:15,  5.25it/s][A
Training:  25%|██▍       | 26/105 [00:06<00:17,  4.51it/s][A
Training:  27%|██▋       | 28/105 [00:06<00:13,  5.77it/s][A
Training:  29%|██▊       | 30/105 [00:07<00:15,  4.89it/s][A
Training:  31%|███▏  

Epoch: 9/66 - Loss: 0.2097 - Accuracy: 0.9198



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:17,  1.33s/it][A
 14%|█▍        | 2/14 [00:01<00:07,  1.64it/s][A
 29%|██▊       | 4/14 [00:01<00:02,  3.78it/s][A
 43%|████▎     | 6/14 [00:02<00:02,  3.19it/s][A
 64%|██████▍   | 9/14 [00:03<00:01,  3.52it/s][A
 71%|███████▏  | 10/14 [00:03<00:01,  3.58it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.60it/s][A
Epochs:  14%|█▎        | 9/66 [04:03<25:32, 26.89s/it]

Val Loss: 0.2102 - Val Accuracy: 0.9232



Training:   0%|          | 0/105 [00:00<?, ?it/s][A
Training:   1%|          | 1/105 [00:01<02:03,  1.18s/it][A
Training:   4%|▍         | 4/105 [00:01<00:26,  3.85it/s][A
Training:   6%|▌         | 6/105 [00:02<00:32,  3.06it/s][A
Training:   9%|▊         | 9/105 [00:02<00:27,  3.51it/s][A
Training:  10%|▉         | 10/105 [00:03<00:25,  3.79it/s][A
Training:  12%|█▏        | 13/105 [00:03<00:23,  3.88it/s][A
Training:  13%|█▎        | 14/105 [00:03<00:21,  4.21it/s][A
Training:  15%|█▌        | 16/105 [00:04<00:15,  5.59it/s][A
Training:  16%|█▌        | 17/105 [00:04<00:22,  3.85it/s][A
Training:  17%|█▋        | 18/105 [00:04<00:21,  4.00it/s][A
Training:  20%|██        | 21/105 [00:05<00:20,  4.17it/s][A
Training:  21%|██        | 22/105 [00:05<00:18,  4.48it/s][A
Training:  24%|██▍       | 25/105 [00:06<00:17,  4.45it/s][A
Training:  25%|██▍       | 26/105 [00:06<00:17,  4.48it/s][A
Training:  27%|██▋       | 28/105 [00:06<00:13,  5.74it/s][A
Training:  28%|██▊  

Epoch: 10/66 - Loss: 0.2000 - Accuracy: 0.9234



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:16,  1.28s/it][A
 36%|███▌      | 5/14 [00:02<00:03,  2.50it/s][A
 57%|█████▋    | 8/14 [00:02<00:01,  4.41it/s][A
 71%|███████▏  | 10/14 [00:03<00:01,  3.39it/s][A
100%|██████████| 14/14 [00:04<00:00,  3.39it/s][A
Epochs:  15%|█▌        | 10/66 [04:30<25:13, 27.02s/it]

Val Loss: 0.2018 - Val Accuracy: 0.9264



Training:   0%|          | 0/105 [00:00<?, ?it/s][A
Training:   1%|          | 1/105 [00:01<01:50,  1.07s/it][A
Training:   3%|▎         | 3/105 [00:01<00:33,  3.07it/s][A
Training:   5%|▍         | 5/105 [00:01<00:34,  2.93it/s][A
Training:   7%|▋         | 7/105 [00:02<00:21,  4.55it/s][A
Training:   9%|▊         | 9/105 [00:02<00:23,  4.06it/s][A
Training:  10%|█         | 11/105 [00:02<00:16,  5.60it/s][A
Training:  12%|█▏        | 13/105 [00:03<00:20,  4.42it/s][A
Training:  13%|█▎        | 14/105 [00:03<00:19,  4.77it/s][A
Training:  16%|█▌        | 17/105 [00:04<00:19,  4.61it/s][A
Training:  18%|█▊        | 19/105 [00:04<00:14,  5.74it/s][A
Training:  19%|█▉        | 20/105 [00:04<00:13,  6.19it/s][A
Training:  20%|██        | 21/105 [00:05<00:22,  3.75it/s][A
Training:  21%|██        | 22/105 [00:05<00:19,  4.21it/s][A
Training:  24%|██▍       | 25/105 [00:06<00:20,  3.95it/s][A
Training:  27%|██▋       | 28/105 [00:06<00:12,  6.00it/s][A
Training:  29%|██▊   

Epoch: 11/66 - Loss: 0.1924 - Accuracy: 0.9256



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:16,  1.31s/it][A
 29%|██▊       | 4/14 [00:01<00:02,  3.63it/s][A
 43%|████▎     | 6/14 [00:02<00:02,  3.00it/s][A
 64%|██████▍   | 9/14 [00:03<00:01,  3.21it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.54it/s][A
Epochs:  17%|█▋        | 11/66 [04:56<24:33, 26.80s/it]

Val Loss: 0.1949 - Val Accuracy: 0.9286



Training:   0%|          | 0/105 [00:00<?, ?it/s][A
Training:   1%|          | 1/105 [00:01<01:59,  1.15s/it][A
Training:   2%|▏         | 2/105 [00:01<01:00,  1.71it/s][A
Training:   4%|▍         | 4/105 [00:01<00:25,  3.94it/s][A
Training:   5%|▍         | 5/105 [00:02<00:36,  2.76it/s][A
Training:   7%|▋         | 7/105 [00:02<00:21,  4.58it/s][A
Training:   9%|▊         | 9/105 [00:02<00:26,  3.56it/s][A
Training:  10%|█         | 11/105 [00:03<00:19,  4.94it/s][A
Training:  12%|█▏        | 13/105 [00:03<00:22,  4.04it/s][A
Training:  15%|█▌        | 16/105 [00:04<00:18,  4.90it/s][A
Training:  16%|█▌        | 17/105 [00:04<00:19,  4.44it/s][A
Training:  18%|█▊        | 19/105 [00:04<00:15,  5.51it/s][A
Training:  19%|█▉        | 20/105 [00:05<00:18,  4.63it/s][A
Training:  20%|██        | 21/105 [00:05<00:17,  4.83it/s][A
Training:  22%|██▏       | 23/105 [00:05<00:16,  4.86it/s][A
Training:  23%|██▎       | 24/105 [00:05<00:18,  4.26it/s][A
Training:  24%|██▍    

Epoch: 12/66 - Loss: 0.1861 - Accuracy: 0.9271



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:00<00:12,  1.05it/s][A
 14%|█▍        | 2/14 [00:01<00:05,  2.08it/s][A
 21%|██▏       | 3/14 [00:01<00:03,  3.21it/s][A
 36%|███▌      | 5/14 [00:01<00:02,  3.11it/s][A
 43%|████▎     | 6/14 [00:01<00:02,  3.88it/s][A
 57%|█████▋    | 8/14 [00:02<00:00,  6.01it/s][A
 71%|███████▏  | 10/14 [00:02<00:01,  3.78it/s][A
 79%|███████▊  | 11/14 [00:03<00:00,  4.23it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.91it/s][A
Epochs:  18%|█▊        | 12/66 [05:23<24:07, 26.81s/it]

Val Loss: 0.1902 - Val Accuracy: 0.9291



Training:   0%|          | 0/105 [00:00<?, ?it/s][A
Training:   1%|          | 1/105 [00:01<02:13,  1.28s/it][A
Training:   3%|▎         | 3/105 [00:01<00:38,  2.64it/s][A
Training:   5%|▍         | 5/105 [00:02<00:39,  2.54it/s][A
Training:   8%|▊         | 8/105 [00:02<00:20,  4.78it/s][A
Training:  10%|▉         | 10/105 [00:03<00:26,  3.62it/s][A
Training:  10%|█         | 11/105 [00:03<00:22,  4.12it/s][A
Training:  12%|█▏        | 13/105 [00:04<00:26,  3.41it/s][A
Training:  14%|█▍        | 15/105 [00:04<00:20,  4.43it/s][A
Training:  16%|█▌        | 17/105 [00:04<00:23,  3.80it/s][A
Training:  18%|█▊        | 19/105 [00:05<00:17,  4.92it/s][A
Training:  20%|██        | 21/105 [00:05<00:20,  4.02it/s][A
Training:  22%|██▏       | 23/105 [00:05<00:16,  4.94it/s][A
Training:  24%|██▍       | 25/105 [00:06<00:18,  4.32it/s][A
Training:  27%|██▋       | 28/105 [00:06<00:11,  6.49it/s][A
Training:  29%|██▊       | 30/105 [00:07<00:16,  4.56it/s][A
Training:  30%|██▉  

Epoch: 13/66 - Loss: 0.1811 - Accuracy: 0.9290



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:15,  1.17s/it][A
 21%|██▏       | 3/14 [00:01<00:03,  2.86it/s][A
 36%|███▌      | 5/14 [00:02<00:03,  2.52it/s][A
 64%|██████▍   | 9/14 [00:03<00:01,  3.34it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.51it/s][A
Epochs:  20%|█▉        | 13/66 [05:51<23:57, 27.12s/it]

Val Loss: 0.1865 - Val Accuracy: 0.9312



Training:   0%|          | 0/105 [00:00<?, ?it/s][A
Training:   1%|          | 1/105 [00:01<02:14,  1.29s/it][A
Training:   4%|▍         | 4/105 [00:01<00:28,  3.54it/s][A
Training:   6%|▌         | 6/105 [00:02<00:34,  2.90it/s][A
Training:   9%|▊         | 9/105 [00:03<00:29,  3.21it/s][A
Training:  10%|█         | 11/105 [00:03<00:21,  4.35it/s][A
Training:  12%|█▏        | 13/105 [00:03<00:24,  3.76it/s][A
Training:  14%|█▍        | 15/105 [00:04<00:19,  4.72it/s][A
Training:  16%|█▌        | 17/105 [00:04<00:22,  3.90it/s][A
Training:  20%|██        | 21/105 [00:05<00:19,  4.32it/s][A
Training:  22%|██▏       | 23/105 [00:05<00:15,  5.27it/s][A
Training:  23%|██▎       | 24/105 [00:05<00:14,  5.66it/s][A
Training:  24%|██▍       | 25/105 [00:06<00:19,  4.11it/s][A
Training:  26%|██▌       | 27/105 [00:06<00:16,  4.84it/s][A
Training:  28%|██▊       | 29/105 [00:07<00:16,  4.56it/s][A
Training:  30%|██▉       | 31/105 [00:07<00:14,  5.23it/s][A
Training:  31%|███▏ 

Epoch: 14/66 - Loss: 0.1781 - Accuracy: 0.9301



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:14,  1.14s/it][A
 14%|█▍        | 2/14 [00:01<00:06,  1.83it/s][A
 29%|██▊       | 4/14 [00:01<00:02,  4.14it/s][A
 43%|████▎     | 6/14 [00:02<00:02,  3.32it/s][A
 64%|██████▍   | 9/14 [00:02<00:01,  3.49it/s][A
 71%|███████▏  | 10/14 [00:03<00:01,  3.66it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.68it/s][A
Epochs:  21%|██        | 14/66 [06:18<23:21, 26.94s/it]

Val Loss: 0.1813 - Val Accuracy: 0.9323



Training:   0%|          | 0/105 [00:00<?, ?it/s][A
Training:   1%|          | 1/105 [00:01<02:04,  1.20s/it][A
Training:   3%|▎         | 3/105 [00:01<00:37,  2.71it/s][A
Training:   5%|▍         | 5/105 [00:02<00:37,  2.65it/s][A
Training:   6%|▌         | 6/105 [00:02<00:30,  3.30it/s][A
Training:   8%|▊         | 8/105 [00:02<00:19,  4.93it/s][A
Training:   9%|▊         | 9/105 [00:03<00:30,  3.12it/s][A
Training:  12%|█▏        | 13/105 [00:03<00:22,  4.02it/s][A
Training:  14%|█▍        | 15/105 [00:03<00:17,  5.23it/s][A
Training:  16%|█▌        | 17/105 [00:04<00:22,  3.87it/s][A
Training:  20%|██        | 21/105 [00:05<00:20,  4.19it/s][A
Training:  23%|██▎       | 24/105 [00:05<00:14,  5.78it/s][A
Training:  25%|██▍       | 26/105 [00:06<00:16,  4.75it/s][A
Training:  28%|██▊       | 29/105 [00:06<00:15,  4.94it/s][A
Training:  31%|███▏      | 33/105 [00:07<00:14,  5.12it/s][A
Training:  35%|███▌      | 37/105 [00:08<00:14,  4.67it/s][A
Training:  36%|███▌   

Epoch: 15/66 - Loss: 0.1739 - Accuracy: 0.9329



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:18,  1.39s/it][A
 29%|██▊       | 4/14 [00:01<00:02,  3.44it/s][A
 43%|████▎     | 6/14 [00:02<00:02,  2.82it/s][A
 64%|██████▍   | 9/14 [00:03<00:01,  3.23it/s][A
 71%|███████▏  | 10/14 [00:03<00:01,  3.51it/s][A
100%|██████████| 14/14 [00:04<00:00,  3.44it/s][A
Epochs:  23%|██▎       | 15/66 [06:45<22:54, 26.94s/it]

Val Loss: 0.1828 - Val Accuracy: 0.9344



Training:   0%|          | 0/105 [00:00<?, ?it/s][A
Training:   1%|          | 1/105 [00:01<02:11,  1.26s/it][A
Training:   4%|▍         | 4/105 [00:01<00:28,  3.57it/s][A
Training:   6%|▌         | 6/105 [00:02<00:32,  3.07it/s][A
Training:   8%|▊         | 8/105 [00:02<00:22,  4.39it/s][A
Training:  10%|▉         | 10/105 [00:03<00:26,  3.56it/s][A
Training:  11%|█▏        | 12/105 [00:03<00:19,  4.81it/s][A
Training:  13%|█▎        | 14/105 [00:04<00:26,  3.45it/s][A
Training:  16%|█▌        | 17/105 [00:05<00:28,  3.13it/s][A
Training:  18%|█▊        | 19/105 [00:05<00:21,  3.99it/s][A
Training:  20%|██        | 21/105 [00:06<00:25,  3.30it/s][A
Training:  24%|██▍       | 25/105 [00:07<00:21,  3.80it/s][A
Training:  27%|██▋       | 28/105 [00:07<00:14,  5.24it/s][A
Training:  29%|██▊       | 30/105 [00:07<00:17,  4.24it/s][A
Training:  31%|███▏      | 33/105 [00:08<00:16,  4.30it/s][A
Training:  34%|███▍      | 36/105 [00:08<00:11,  5.88it/s][A
Training:  36%|███▌ 

Epoch: 16/66 - Loss: 0.1702 - Accuracy: 0.9340



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:17,  1.32s/it][A
 29%|██▊       | 4/14 [00:01<00:02,  3.45it/s][A
 43%|████▎     | 6/14 [00:02<00:02,  3.22it/s][A
 57%|█████▋    | 8/14 [00:02<00:01,  4.61it/s][A
 71%|███████▏  | 10/14 [00:03<00:01,  3.68it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.72it/s][A
Epochs:  24%|██▍       | 16/66 [07:12<22:38, 27.16s/it]

Val Loss: 0.1762 - Val Accuracy: 0.9350



Training:   0%|          | 0/105 [00:00<?, ?it/s][A
Training:   1%|          | 1/105 [00:01<02:29,  1.44s/it][A
Training:   5%|▍         | 5/105 [00:02<00:40,  2.50it/s][A
Training:   7%|▋         | 7/105 [00:02<00:26,  3.69it/s][A
Training:   9%|▊         | 9/105 [00:03<00:31,  3.08it/s][A
Training:  11%|█▏        | 12/105 [00:03<00:18,  5.00it/s][A
Training:  13%|█▎        | 14/105 [00:04<00:23,  3.91it/s][A
Training:  15%|█▌        | 16/105 [00:04<00:17,  5.08it/s][A
Training:  17%|█▋        | 18/105 [00:05<00:24,  3.54it/s][A
Training:  20%|██        | 21/105 [00:06<00:23,  3.58it/s][A
Training:  24%|██▍       | 25/105 [00:06<00:19,  4.16it/s][A
Training:  25%|██▍       | 26/105 [00:06<00:18,  4.39it/s][A
Training:  28%|██▊       | 29/105 [00:07<00:16,  4.51it/s][A
Training:  30%|██▉       | 31/105 [00:07<00:13,  5.35it/s][A
Training:  31%|███▏      | 33/105 [00:08<00:15,  4.77it/s][A
Training:  32%|███▏      | 34/105 [00:08<00:15,  4.68it/s][A
Training:  34%|███▍ 

Epoch: 17/66 - Loss: 0.1680 - Accuracy: 0.9337



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:16,  1.27s/it][A
 14%|█▍        | 2/14 [00:01<00:07,  1.55it/s][A
 29%|██▊       | 4/14 [00:01<00:02,  3.67it/s][A
 43%|████▎     | 6/14 [00:02<00:02,  3.12it/s][A
 64%|██████▍   | 9/14 [00:03<00:01,  3.37it/s][A
 79%|███████▊  | 11/14 [00:03<00:00,  4.48it/s][A
100%|██████████| 14/14 [00:04<00:00,  3.49it/s][A
Epochs:  26%|██▌       | 17/66 [07:40<22:21, 27.38s/it]

Val Loss: 0.1785 - Val Accuracy: 0.9339



Training:   0%|          | 0/105 [00:00<?, ?it/s][A
Training:   1%|          | 1/105 [00:01<02:14,  1.29s/it][A
Training:   3%|▎         | 3/105 [00:01<00:38,  2.64it/s][A
Training:   5%|▍         | 5/105 [00:02<00:35,  2.79it/s][A
Training:   9%|▊         | 9/105 [00:02<00:25,  3.69it/s][A
Training:  10%|█         | 11/105 [00:03<00:19,  4.72it/s][A
Training:  12%|█▏        | 13/105 [00:04<00:26,  3.49it/s][A
Training:  15%|█▌        | 16/105 [00:04<00:16,  5.28it/s][A
Training:  17%|█▋        | 18/105 [00:04<00:20,  4.14it/s][A
Training:  20%|██        | 21/105 [00:05<00:22,  3.69it/s][A
Training:  24%|██▍       | 25/105 [00:06<00:19,  4.03it/s][A
Training:  26%|██▌       | 27/105 [00:06<00:15,  4.88it/s][A
Training:  28%|██▊       | 29/105 [00:07<00:17,  4.28it/s][A
Training:  31%|███▏      | 33/105 [00:08<00:15,  4.74it/s][A
Training:  32%|███▏      | 34/105 [00:08<00:14,  4.74it/s][A
Training:  35%|███▌      | 37/105 [00:08<00:13,  5.21it/s][A
Training:  36%|███▌ 

Epoch: 18/66 - Loss: 0.1665 - Accuracy: 0.9348



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:16,  1.29s/it][A
 14%|█▍        | 2/14 [00:01<00:08,  1.47it/s][A
 29%|██▊       | 4/14 [00:01<00:02,  3.50it/s][A
 43%|████▎     | 6/14 [00:02<00:02,  3.07it/s][A
 57%|█████▋    | 8/14 [00:02<00:01,  4.56it/s][A
 71%|███████▏  | 10/14 [00:03<00:01,  4.00it/s][A
 79%|███████▊  | 11/14 [00:03<00:00,  4.16it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.55it/s][A
Epochs:  27%|██▋       | 18/66 [08:07<21:53, 27.37s/it]

Val Loss: 0.1721 - Val Accuracy: 0.9355



Training:   0%|          | 0/105 [00:00<?, ?it/s][A
Training:   1%|          | 1/105 [00:01<02:13,  1.29s/it][A
Training:   3%|▎         | 3/105 [00:01<00:38,  2.68it/s][A
Training:   5%|▍         | 5/105 [00:02<00:39,  2.52it/s][A
Training:   7%|▋         | 7/105 [00:02<00:25,  3.83it/s][A
Training:   8%|▊         | 8/105 [00:02<00:21,  4.42it/s][A
Training:   9%|▊         | 9/105 [00:03<00:31,  3.01it/s][A
Training:  12%|█▏        | 13/105 [00:03<00:21,  4.22it/s][A
Training:  13%|█▎        | 14/105 [00:03<00:19,  4.61it/s][A
Training:  16%|█▌        | 17/105 [00:04<00:18,  4.75it/s][A
Training:  17%|█▋        | 18/105 [00:04<00:18,  4.68it/s][A
Training:  20%|██        | 21/105 [00:05<00:17,  4.92it/s][A
Training:  21%|██        | 22/105 [00:05<00:19,  4.22it/s][A
Training:  24%|██▍       | 25/105 [00:06<00:16,  4.89it/s][A
Training:  25%|██▍       | 26/105 [00:06<00:16,  4.70it/s][A
Training:  28%|██▊       | 29/105 [00:07<00:15,  5.04it/s][A
Training:  29%|██▊    

Epoch: 19/66 - Loss: 0.1627 - Accuracy: 0.9375



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:15,  1.23s/it][A
 36%|███▌      | 5/14 [00:02<00:03,  2.86it/s][A
 43%|████▎     | 6/14 [00:02<00:02,  3.36it/s][A
 57%|█████▋    | 8/14 [00:02<00:01,  4.93it/s][A
 64%|██████▍   | 9/14 [00:02<00:01,  3.24it/s][A
 71%|███████▏  | 10/14 [00:03<00:01,  3.58it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.65it/s][A
Epochs:  29%|██▉       | 19/66 [08:34<21:20, 27.25s/it]

Val Loss: 0.1716 - Val Accuracy: 0.9334



Training:   0%|          | 0/105 [00:00<?, ?it/s][A
Training:   1%|          | 1/105 [00:01<02:11,  1.27s/it][A
Training:   2%|▏         | 2/105 [00:01<01:00,  1.71it/s][A
Training:   5%|▍         | 5/105 [00:02<00:31,  3.13it/s][A
Training:   6%|▌         | 6/105 [00:02<00:29,  3.33it/s][A
Training:   8%|▊         | 8/105 [00:02<00:19,  4.89it/s][A
Training:   9%|▊         | 9/105 [00:02<00:25,  3.71it/s][A
Training:  10%|▉         | 10/105 [00:03<00:25,  3.74it/s][A
Training:  11%|█▏        | 12/105 [00:03<00:16,  5.60it/s][A
Training:  12%|█▏        | 13/105 [00:03<00:22,  4.07it/s][A
Training:  13%|█▎        | 14/105 [00:04<00:22,  3.98it/s][A
Training:  15%|█▌        | 16/105 [00:04<00:15,  5.76it/s][A
Training:  16%|█▌        | 17/105 [00:04<00:24,  3.63it/s][A
Training:  17%|█▋        | 18/105 [00:04<00:23,  3.78it/s][A
Training:  20%|██        | 21/105 [00:05<00:18,  4.62it/s][A
Training:  21%|██        | 22/105 [00:05<00:20,  4.06it/s][A
Training:  24%|██▍    

Epoch: 20/66 - Loss: 0.1610 - Accuracy: 0.9366



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:17,  1.31s/it][A
 21%|██▏       | 3/14 [00:01<00:04,  2.49it/s][A
 29%|██▊       | 4/14 [00:01<00:03,  3.30it/s][A
 36%|███▌      | 5/14 [00:02<00:03,  2.84it/s][A
 43%|████▎     | 6/14 [00:02<00:02,  3.22it/s][A
 50%|█████     | 7/14 [00:02<00:01,  3.87it/s][A
 64%|██████▍   | 9/14 [00:02<00:01,  3.85it/s][A
 71%|███████▏  | 10/14 [00:03<00:00,  4.13it/s][A
 79%|███████▊  | 11/14 [00:03<00:00,  4.69it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.62it/s][A
Epochs:  30%|███       | 20/66 [09:02<21:01, 27.43s/it]

Val Loss: 0.1675 - Val Accuracy: 0.9360



Training:   0%|          | 0/105 [00:00<?, ?it/s][A
Training:   1%|          | 1/105 [00:01<02:36,  1.50s/it][A
Training:   4%|▍         | 4/105 [00:01<00:31,  3.18it/s][A
Training:   6%|▌         | 6/105 [00:02<00:33,  2.98it/s][A
Training:   9%|▊         | 9/105 [00:03<00:27,  3.45it/s][A
Training:  10%|▉         | 10/105 [00:03<00:25,  3.77it/s][A
Training:  11%|█▏        | 12/105 [00:03<00:18,  4.96it/s][A
Training:  12%|█▏        | 13/105 [00:04<00:26,  3.43it/s][A
Training:  13%|█▎        | 14/105 [00:04<00:23,  3.93it/s][A
Training:  15%|█▌        | 16/105 [00:04<00:16,  5.51it/s][A
Training:  16%|█▌        | 17/105 [00:04<00:24,  3.59it/s][A
Training:  17%|█▋        | 18/105 [00:05<00:21,  4.05it/s][A
Training:  19%|█▉        | 20/105 [00:05<00:14,  5.95it/s][A
Training:  21%|██        | 22/105 [00:05<00:20,  4.01it/s][A
Training:  23%|██▎       | 24/105 [00:06<00:14,  5.48it/s][A
Training:  25%|██▍       | 26/105 [00:06<00:20,  3.91it/s][A
Training:  28%|██▊  

Epoch: 21/66 - Loss: 0.1590 - Accuracy: 0.9388



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:16,  1.27s/it][A
 14%|█▍        | 2/14 [00:01<00:07,  1.64it/s][A
 36%|███▌      | 5/14 [00:02<00:03,  2.93it/s][A
 43%|████▎     | 6/14 [00:02<00:02,  3.53it/s][A
 64%|██████▍   | 9/14 [00:03<00:01,  3.71it/s][A
 71%|███████▏  | 10/14 [00:03<00:00,  4.18it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.66it/s][A
Epochs:  32%|███▏      | 21/66 [09:30<20:35, 27.46s/it]

Val Loss: 0.1667 - Val Accuracy: 0.9350



Training:   0%|          | 0/105 [00:00<?, ?it/s][A
Training:   1%|          | 1/105 [00:01<02:25,  1.39s/it][A
Training:   4%|▍         | 4/105 [00:01<00:30,  3.28it/s][A
Training:   6%|▌         | 6/105 [00:02<00:33,  2.99it/s][A
Training:   9%|▊         | 9/105 [00:03<00:29,  3.30it/s][A
Training:  10%|▉         | 10/105 [00:03<00:26,  3.65it/s][A
Training:  12%|█▏        | 13/105 [00:03<00:23,  3.88it/s][A
Training:  13%|█▎        | 14/105 [00:04<00:22,  4.12it/s][A
Training:  15%|█▌        | 16/105 [00:04<00:17,  5.22it/s][A
Training:  16%|█▌        | 17/105 [00:04<00:24,  3.65it/s][A
Training:  18%|█▊        | 19/105 [00:05<00:17,  4.91it/s][A
Training:  20%|██        | 21/105 [00:05<00:20,  4.02it/s][A
Training:  21%|██        | 22/105 [00:05<00:18,  4.54it/s][A
Training:  23%|██▎       | 24/105 [00:05<00:13,  6.22it/s][A
Training:  25%|██▍       | 26/105 [00:06<00:17,  4.52it/s][A
Training:  27%|██▋       | 28/105 [00:06<00:13,  5.83it/s][A
Training:  29%|██▊  

Epoch: 22/66 - Loss: 0.1579 - Accuracy: 0.9384



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:18,  1.39s/it][A
 21%|██▏       | 3/14 [00:01<00:04,  2.46it/s][A
 36%|███▌      | 5/14 [00:02<00:03,  2.60it/s][A
 50%|█████     | 7/14 [00:02<00:01,  3.86it/s][A
 64%|██████▍   | 9/14 [00:03<00:01,  3.30it/s][A
 79%|███████▊  | 11/14 [00:03<00:00,  4.49it/s][A
100%|██████████| 14/14 [00:04<00:00,  3.44it/s][A
Epochs:  33%|███▎      | 22/66 [09:57<20:05, 27.39s/it]

Val Loss: 0.1696 - Val Accuracy: 0.9112



Training:   0%|          | 0/105 [00:00<?, ?it/s][A
Training:   1%|          | 1/105 [00:01<02:18,  1.33s/it][A
Training:   5%|▍         | 5/105 [00:02<00:37,  2.68it/s][A
Training:   7%|▋         | 7/105 [00:02<00:25,  3.83it/s][A
Training:   8%|▊         | 8/105 [00:02<00:23,  4.18it/s][A
Training:   9%|▊         | 9/105 [00:03<00:30,  3.16it/s][A
Training:  11%|█▏        | 12/105 [00:03<00:20,  4.60it/s][A
Training:  12%|█▏        | 13/105 [00:04<00:27,  3.34it/s][A
Training:  14%|█▍        | 15/105 [00:04<00:19,  4.64it/s][A
Training:  15%|█▌        | 16/105 [00:04<00:18,  4.83it/s][A
Training:  16%|█▌        | 17/105 [00:04<00:27,  3.25it/s][A
Training:  19%|█▉        | 20/105 [00:05<00:17,  4.93it/s][A
Training:  20%|██        | 21/105 [00:05<00:23,  3.58it/s][A
Training:  23%|██▎       | 24/105 [00:06<00:14,  5.75it/s][A
Training:  25%|██▍       | 26/105 [00:06<00:16,  4.66it/s][A
Training:  27%|██▋       | 28/105 [00:06<00:13,  5.79it/s][A
Training:  28%|██▊   

Epoch: 23/66 - Loss: 0.1561 - Accuracy: 0.9390



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:17,  1.31s/it][A
 36%|███▌      | 5/14 [00:02<00:03,  2.64it/s][A
 57%|█████▋    | 8/14 [00:02<00:01,  4.61it/s][A
 71%|███████▏  | 10/14 [00:03<00:01,  3.48it/s][A
100%|██████████| 14/14 [00:04<00:00,  3.49it/s][A
Epochs:  35%|███▍      | 23/66 [10:25<19:39, 27.43s/it]

Val Loss: 0.1693 - Val Accuracy: 0.9112



Training:   0%|          | 0/105 [00:00<?, ?it/s][A
Training:   1%|          | 1/105 [00:01<02:11,  1.26s/it][A
Training:   4%|▍         | 4/105 [00:01<00:28,  3.49it/s][A
Training:   6%|▌         | 6/105 [00:02<00:33,  2.96it/s][A
Training:   9%|▊         | 9/105 [00:03<00:33,  2.89it/s][A
Training:  11%|█▏        | 12/105 [00:03<00:20,  4.57it/s][A
Training:  13%|█▎        | 14/105 [00:04<00:24,  3.70it/s][A
Training:  16%|█▌        | 17/105 [00:05<00:23,  3.70it/s][A
Training:  20%|██        | 21/105 [00:06<00:22,  3.75it/s][A
Training:  23%|██▎       | 24/105 [00:06<00:16,  5.00it/s][A
Training:  25%|██▍       | 26/105 [00:06<00:19,  4.16it/s][A
Training:  28%|██▊       | 29/105 [00:07<00:18,  4.01it/s][A
Training:  30%|██▉       | 31/105 [00:07<00:15,  4.86it/s][A
Training:  31%|███▏      | 33/105 [00:08<00:16,  4.36it/s][A
Training:  34%|███▍      | 36/105 [00:08<00:11,  5.96it/s][A
Training:  36%|███▌      | 38/105 [00:09<00:12,  5.19it/s][A
Training:  37%|███▋ 

Epoch: 24/66 - Loss: 0.1545 - Accuracy: 0.9385



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:15,  1.16s/it][A
 14%|█▍        | 2/14 [00:01<00:06,  1.85it/s][A
 29%|██▊       | 4/14 [00:01<00:02,  4.16it/s][A
 43%|████▎     | 6/14 [00:02<00:02,  3.14it/s][A
 57%|█████▋    | 8/14 [00:02<00:01,  4.62it/s][A
 71%|███████▏  | 10/14 [00:03<00:01,  3.61it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.51it/s][A
Epochs:  36%|███▋      | 24/66 [10:53<19:19, 27.60s/it]

Val Loss: 0.1611 - Val Accuracy: 0.9387



Training:   0%|          | 0/105 [00:00<?, ?it/s][A
Training:   1%|          | 1/105 [00:01<02:13,  1.28s/it][A
Training:   5%|▍         | 5/105 [00:02<00:38,  2.57it/s][A
Training:   7%|▋         | 7/105 [00:02<00:25,  3.81it/s][A
Training:   9%|▊         | 9/105 [00:03<00:30,  3.11it/s][A
Training:  10%|█         | 11/105 [00:03<00:21,  4.29it/s][A
Training:  12%|█▏        | 13/105 [00:04<00:27,  3.31it/s][A
Training:  15%|█▌        | 16/105 [00:04<00:17,  5.16it/s][A
Training:  17%|█▋        | 18/105 [00:05<00:22,  3.95it/s][A
Training:  20%|██        | 21/105 [00:05<00:20,  4.11it/s][A
Training:  22%|██▏       | 23/105 [00:05<00:16,  5.10it/s][A
Training:  24%|██▍       | 25/105 [00:06<00:18,  4.28it/s][A
Training:  27%|██▋       | 28/105 [00:06<00:12,  6.24it/s][A
Training:  29%|██▊       | 30/105 [00:07<00:17,  4.40it/s][A
Training:  30%|███       | 32/105 [00:07<00:13,  5.48it/s][A
Training:  32%|███▏      | 34/105 [00:08<00:17,  4.11it/s][A
Training:  35%|███▌ 

Epoch: 25/66 - Loss: 0.1533 - Accuracy: 0.9395



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:16,  1.28s/it][A
 21%|██▏       | 3/14 [00:01<00:04,  2.70it/s][A
 36%|███▌      | 5/14 [00:02<00:03,  2.32it/s][A
 64%|██████▍   | 9/14 [00:03<00:01,  3.28it/s][A
 86%|████████▌ | 12/14 [00:03<00:00,  5.03it/s][A
100%|██████████| 14/14 [00:04<00:00,  3.34it/s][A
Epochs:  38%|███▊      | 25/66 [11:20<18:55, 27.69s/it]

Val Loss: 0.1621 - Val Accuracy: 0.9366



Training:   0%|          | 0/105 [00:00<?, ?it/s][A
Training:   1%|          | 1/105 [00:01<02:27,  1.42s/it][A
Training:   3%|▎         | 3/105 [00:01<00:42,  2.40it/s][A
Training:   5%|▍         | 5/105 [00:02<00:39,  2.55it/s][A
Training:   7%|▋         | 7/105 [00:02<00:25,  3.86it/s][A
Training:   9%|▊         | 9/105 [00:03<00:31,  3.05it/s][A
Training:  10%|█         | 11/105 [00:03<00:21,  4.28it/s][A
Training:  12%|█▏        | 13/105 [00:04<00:25,  3.59it/s][A
Training:  16%|█▌        | 17/105 [00:05<00:23,  3.81it/s][A
Training:  18%|█▊        | 19/105 [00:05<00:18,  4.67it/s][A
Training:  20%|██        | 21/105 [00:06<00:21,  3.97it/s][A
Training:  24%|██▍       | 25/105 [00:06<00:18,  4.25it/s][A
Training:  26%|██▌       | 27/105 [00:07<00:15,  5.15it/s][A
Training:  28%|██▊       | 29/105 [00:07<00:18,  4.17it/s][A
Training:  30%|███       | 32/105 [00:07<00:12,  5.88it/s][A
Training:  32%|███▏      | 34/105 [00:08<00:15,  4.55it/s][A
Training:  34%|███▍  

Epoch: 26/66 - Loss: 0.1514 - Accuracy: 0.9408



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:13,  1.06s/it][A
 29%|██▊       | 4/14 [00:01<00:02,  4.12it/s][A
 43%|████▎     | 6/14 [00:02<00:02,  3.06it/s][A
 57%|█████▋    | 8/14 [00:02<00:01,  4.45it/s][A
 71%|███████▏  | 10/14 [00:03<00:01,  3.48it/s][A
 86%|████████▌ | 12/14 [00:03<00:00,  4.80it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.64it/s][A
Epochs:  39%|███▉      | 26/66 [11:48<18:24, 27.62s/it]

Val Loss: 0.1595 - Val Accuracy: 0.9382



Training:   0%|          | 0/105 [00:00<?, ?it/s][A
Training:   1%|          | 1/105 [00:01<01:47,  1.03s/it][A
Training:   2%|▏         | 2/105 [00:01<01:00,  1.70it/s][A
Training:   5%|▍         | 5/105 [00:01<00:32,  3.05it/s][A
Training:   7%|▋         | 7/105 [00:02<00:21,  4.62it/s][A
Training:   9%|▊         | 9/105 [00:02<00:26,  3.61it/s][A
Training:  10%|▉         | 10/105 [00:02<00:22,  4.14it/s][A
Training:  12%|█▏        | 13/105 [00:03<00:24,  3.77it/s][A
Training:  14%|█▍        | 15/105 [00:03<00:18,  4.96it/s][A
Training:  16%|█▌        | 17/105 [00:04<00:21,  4.00it/s][A
Training:  19%|█▉        | 20/105 [00:04<00:14,  5.97it/s][A
Training:  21%|██        | 22/105 [00:05<00:18,  4.57it/s][A
Training:  24%|██▍       | 25/105 [00:06<00:19,  4.06it/s][A
Training:  27%|██▋       | 28/105 [00:06<00:13,  5.77it/s][A
Training:  29%|██▊       | 30/105 [00:07<00:18,  4.03it/s][A
Training:  31%|███▏      | 33/105 [00:08<00:17,  4.01it/s][A
Training:  35%|███▌  

Epoch: 27/66 - Loss: 0.1514 - Accuracy: 0.9397



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:17,  1.31s/it][A
 21%|██▏       | 3/14 [00:01<00:04,  2.49it/s][A
 36%|███▌      | 5/14 [00:02<00:03,  2.68it/s][A
 50%|█████     | 7/14 [00:02<00:01,  3.92it/s][A
 64%|██████▍   | 9/14 [00:03<00:01,  3.48it/s][A
 79%|███████▊  | 11/14 [00:03<00:00,  4.44it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.64it/s][A
Epochs:  41%|████      | 27/66 [12:15<17:48, 27.39s/it]

Val Loss: 0.1598 - Val Accuracy: 0.9398



Training:   0%|          | 0/105 [00:00<?, ?it/s][A
Training:   1%|          | 1/105 [00:01<02:27,  1.42s/it][A
Training:   3%|▎         | 3/105 [00:01<00:43,  2.33it/s][A
Training:   5%|▍         | 5/105 [00:02<00:39,  2.54it/s][A
Training:   7%|▋         | 7/105 [00:02<00:24,  4.03it/s][A
Training:   9%|▊         | 9/105 [00:03<00:27,  3.45it/s][A
Training:  10%|█         | 11/105 [00:03<00:20,  4.62it/s][A
Training:  12%|█▏        | 13/105 [00:04<00:26,  3.50it/s][A
Training:  14%|█▍        | 15/105 [00:04<00:19,  4.71it/s][A
Training:  16%|█▌        | 17/105 [00:05<00:24,  3.63it/s][A
Training:  18%|█▊        | 19/105 [00:05<00:18,  4.66it/s][A
Training:  20%|██        | 21/105 [00:05<00:20,  4.08it/s][A
Training:  22%|██▏       | 23/105 [00:06<00:17,  4.65it/s][A
Training:  24%|██▍       | 25/105 [00:06<00:17,  4.46it/s][A
Training:  26%|██▌       | 27/105 [00:06<00:15,  4.99it/s][A
Training:  28%|██▊       | 29/105 [00:07<00:18,  4.20it/s][A
Training:  30%|███   

Epoch: 28/66 - Loss: 0.1495 - Accuracy: 0.9421



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:17,  1.37s/it][A
 36%|███▌      | 5/14 [00:02<00:03,  2.46it/s][A
 64%|██████▍   | 9/14 [00:03<00:01,  3.32it/s][A
100%|██████████| 14/14 [00:04<00:00,  3.43it/s][A
Epochs:  42%|████▏     | 28/66 [12:43<17:29, 27.62s/it]

Val Loss: 0.1568 - Val Accuracy: 0.9408



Training:   0%|          | 0/105 [00:00<?, ?it/s][A
Training:   1%|          | 1/105 [00:01<02:16,  1.32s/it][A
Training:   5%|▍         | 5/105 [00:02<00:37,  2.64it/s][A
Training:   7%|▋         | 7/105 [00:02<00:25,  3.84it/s][A
Training:   9%|▊         | 9/105 [00:03<00:29,  3.22it/s][A
Training:  10%|▉         | 10/105 [00:03<00:25,  3.66it/s][A
Training:  11%|█▏        | 12/105 [00:03<00:18,  5.04it/s][A
Training:  12%|█▏        | 13/105 [00:04<00:26,  3.48it/s][A
Training:  13%|█▎        | 14/105 [00:04<00:24,  3.77it/s][A
Training:  15%|█▌        | 16/105 [00:04<00:16,  5.29it/s][A
Training:  16%|█▌        | 17/105 [00:05<00:26,  3.32it/s][A
Training:  18%|█▊        | 19/105 [00:05<00:17,  4.80it/s][A
Training:  20%|██        | 21/105 [00:06<00:23,  3.51it/s][A
Training:  23%|██▎       | 24/105 [00:06<00:14,  5.65it/s][A
Training:  25%|██▍       | 26/105 [00:07<00:20,  3.83it/s][A
Training:  28%|██▊       | 29/105 [00:07<00:20,  3.66it/s][A
Training:  31%|███▏ 

Epoch: 29/66 - Loss: 0.1493 - Accuracy: 0.9402



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:16,  1.30s/it][A
 21%|██▏       | 3/14 [00:01<00:04,  2.48it/s][A
 36%|███▌      | 5/14 [00:02<00:03,  2.48it/s][A
 57%|█████▋    | 8/14 [00:02<00:01,  4.70it/s][A
 71%|███████▏  | 10/14 [00:03<00:01,  3.72it/s][A
 86%|████████▌ | 12/14 [00:03<00:00,  5.00it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.55it/s][A
Epochs:  44%|████▍     | 29/66 [13:11<17:06, 27.76s/it]

Val Loss: 0.1595 - Val Accuracy: 0.9181



Training:   0%|          | 0/105 [00:00<?, ?it/s][A
Training:   1%|          | 1/105 [00:01<02:10,  1.25s/it][A
Training:   2%|▏         | 2/105 [00:01<00:59,  1.74it/s][A
Training:   4%|▍         | 4/105 [00:01<00:25,  3.94it/s][A
Training:   6%|▌         | 6/105 [00:02<00:33,  2.96it/s][A
Training:   8%|▊         | 8/105 [00:02<00:22,  4.38it/s][A
Training:  10%|▉         | 10/105 [00:03<00:29,  3.24it/s][A
Training:  11%|█▏        | 12/105 [00:03<00:21,  4.41it/s][A
Training:  12%|█▏        | 13/105 [00:04<00:29,  3.17it/s][A
Training:  14%|█▍        | 15/105 [00:04<00:19,  4.52it/s][A
Training:  16%|█▌        | 17/105 [00:05<00:24,  3.63it/s][A
Training:  20%|██        | 21/105 [00:05<00:19,  4.40it/s][A
Training:  24%|██▍       | 25/105 [00:06<00:17,  4.44it/s][A
Training:  26%|██▌       | 27/105 [00:06<00:14,  5.34it/s][A
Training:  28%|██▊       | 29/105 [00:07<00:17,  4.33it/s][A
Training:  30%|██▉       | 31/105 [00:07<00:13,  5.30it/s][A
Training:  31%|███▏  

Epoch: 30/66 - Loss: 0.1498 - Accuracy: 0.9408



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:14,  1.14s/it][A
 21%|██▏       | 3/14 [00:01<00:03,  2.92it/s][A
 36%|███▌      | 5/14 [00:02<00:03,  2.79it/s][A
 50%|█████     | 7/14 [00:02<00:01,  4.14it/s][A
 64%|██████▍   | 9/14 [00:03<00:01,  3.13it/s][A
 79%|███████▊  | 11/14 [00:03<00:00,  4.43it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.58it/s][A
Epochs:  45%|████▌     | 30/66 [13:39<16:37, 27.72s/it]

Val Loss: 0.1583 - Val Accuracy: 0.9371



Training:   0%|          | 0/105 [00:00<?, ?it/s][A
Training:   1%|          | 1/105 [00:01<02:08,  1.24s/it][A
Training:   4%|▍         | 4/105 [00:01<00:29,  3.38it/s][A
Training:   5%|▍         | 5/105 [00:01<00:35,  2.80it/s][A
Training:   7%|▋         | 7/105 [00:02<00:22,  4.44it/s][A
Training:   8%|▊         | 8/105 [00:02<00:22,  4.39it/s][A
Training:   9%|▊         | 9/105 [00:02<00:29,  3.29it/s][A
Training:  10%|█         | 11/105 [00:03<00:19,  4.86it/s][A
Training:  11%|█▏        | 12/105 [00:03<00:20,  4.54it/s][A
Training:  12%|█▏        | 13/105 [00:03<00:23,  3.96it/s][A
Training:  13%|█▎        | 14/105 [00:03<00:19,  4.64it/s][A
Training:  15%|█▌        | 16/105 [00:04<00:17,  5.19it/s][A
Training:  16%|█▌        | 17/105 [00:04<00:19,  4.55it/s][A
Training:  18%|█▊        | 19/105 [00:04<00:13,  6.22it/s][A
Training:  19%|█▉        | 20/105 [00:04<00:16,  5.12it/s][A
Training:  20%|██        | 21/105 [00:05<00:17,  4.91it/s][A
Training:  22%|██▏    

Epoch: 31/66 - Loss: 0.1472 - Accuracy: 0.9428



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:15,  1.17s/it][A
 29%|██▊       | 4/14 [00:01<00:02,  3.98it/s][A
 43%|████▎     | 6/14 [00:02<00:02,  3.05it/s][A
 64%|██████▍   | 9/14 [00:02<00:01,  3.32it/s][A
 71%|███████▏  | 10/14 [00:03<00:01,  3.60it/s][A
 86%|████████▌ | 12/14 [00:03<00:00,  5.01it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.68it/s][A
Epochs:  47%|████▋     | 31/66 [14:06<16:03, 27.52s/it]

Val Loss: 0.1563 - Val Accuracy: 0.9435



Training:   0%|          | 0/105 [00:00<?, ?it/s][A
Training:   1%|          | 1/105 [00:01<02:08,  1.24s/it][A
Training:   3%|▎         | 3/105 [00:01<00:38,  2.68it/s][A
Training:   4%|▍         | 4/105 [00:01<00:28,  3.51it/s][A
Training:   5%|▍         | 5/105 [00:02<00:42,  2.36it/s][A
Training:   7%|▋         | 7/105 [00:02<00:23,  4.11it/s][A
Training:   9%|▊         | 9/105 [00:03<00:30,  3.16it/s][A
Training:  10%|▉         | 10/105 [00:03<00:25,  3.74it/s][A
Training:  11%|█▏        | 12/105 [00:03<00:17,  5.42it/s][A
Training:  13%|█▎        | 14/105 [00:04<00:22,  4.04it/s][A
Training:  15%|█▌        | 16/105 [00:04<00:16,  5.51it/s][A
Training:  17%|█▋        | 18/105 [00:04<00:21,  4.02it/s][A
Training:  19%|█▉        | 20/105 [00:05<00:15,  5.36it/s][A
Training:  21%|██        | 22/105 [00:05<00:20,  4.05it/s][A
Training:  24%|██▍       | 25/105 [00:06<00:20,  3.85it/s][A
Training:  26%|██▌       | 27/105 [00:06<00:15,  4.94it/s][A
Training:  28%|██▊    

Epoch: 32/66 - Loss: 0.1456 - Accuracy: 0.9428



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:13,  1.01s/it][A
 14%|█▍        | 2/14 [00:01<00:06,  1.90it/s][A
 21%|██▏       | 3/14 [00:01<00:03,  2.96it/s][A
 36%|███▌      | 5/14 [00:02<00:03,  2.97it/s][A
 43%|████▎     | 6/14 [00:02<00:02,  3.60it/s][A
 50%|█████     | 7/14 [00:02<00:01,  4.35it/s][A
 64%|██████▍   | 9/14 [00:02<00:01,  3.68it/s][A
 71%|███████▏  | 10/14 [00:03<00:00,  4.05it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.77it/s][A
Epochs:  48%|████▊     | 32/66 [14:33<15:34, 27.47s/it]

Val Loss: 0.1563 - Val Accuracy: 0.9419



Training:   0%|          | 0/105 [00:00<?, ?it/s][A
Training:   1%|          | 1/105 [00:01<02:22,  1.37s/it][A
Training:   4%|▍         | 4/105 [00:01<00:29,  3.47it/s][A
Training:   6%|▌         | 6/105 [00:02<00:35,  2.82it/s][A
Training:   8%|▊         | 8/105 [00:02<00:23,  4.07it/s][A
Training:  10%|▉         | 10/105 [00:03<00:27,  3.47it/s][A
Training:  11%|█▏        | 12/105 [00:03<00:19,  4.72it/s][A
Training:  13%|█▎        | 14/105 [00:03<00:21,  4.14it/s][A
Training:  14%|█▍        | 15/105 [00:04<00:20,  4.45it/s][A
Training:  15%|█▌        | 16/105 [00:04<00:19,  4.60it/s][A
Training:  16%|█▌        | 17/105 [00:04<00:23,  3.72it/s][A
Training:  18%|█▊        | 19/105 [00:05<00:19,  4.48it/s][A
Training:  19%|█▉        | 20/105 [00:05<00:17,  4.84it/s][A
Training:  20%|██        | 21/105 [00:05<00:20,  4.14it/s][A
Training:  22%|██▏       | 23/105 [00:05<00:18,  4.40it/s][A
Training:  23%|██▎       | 24/105 [00:06<00:17,  4.73it/s][A
Training:  24%|██▍  

Epoch: 33/66 - Loss: 0.1456 - Accuracy: 0.9420



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:16,  1.28s/it][A
 21%|██▏       | 3/14 [00:01<00:04,  2.58it/s][A
 36%|███▌      | 5/14 [00:02<00:03,  2.73it/s][A
 50%|█████     | 7/14 [00:02<00:01,  4.29it/s][A
 64%|██████▍   | 9/14 [00:03<00:01,  3.21it/s][A
 79%|███████▊  | 11/14 [00:03<00:00,  4.44it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.50it/s][A
Epochs:  50%|█████     | 33/66 [15:01<15:11, 27.63s/it]

Val Loss: 0.1595 - Val Accuracy: 0.9165



Training:   0%|          | 0/105 [00:00<?, ?it/s][A
Training:   1%|          | 1/105 [00:01<02:18,  1.33s/it][A
Training:   4%|▍         | 4/105 [00:01<00:28,  3.49it/s][A
Training:   6%|▌         | 6/105 [00:02<00:33,  2.98it/s][A
Training:   8%|▊         | 8/105 [00:02<00:22,  4.40it/s][A
Training:  10%|▉         | 10/105 [00:03<00:27,  3.45it/s][A
Training:  11%|█▏        | 12/105 [00:03<00:20,  4.61it/s][A
Training:  13%|█▎        | 14/105 [00:04<00:23,  3.85it/s][A
Training:  15%|█▌        | 16/105 [00:04<00:17,  5.15it/s][A
Training:  17%|█▋        | 18/105 [00:04<00:20,  4.34it/s][A
Training:  18%|█▊        | 19/105 [00:04<00:18,  4.77it/s][A
Training:  20%|██        | 21/105 [00:05<00:19,  4.20it/s][A
Training:  22%|██▏       | 23/105 [00:05<00:15,  5.35it/s][A
Training:  24%|██▍       | 25/105 [00:06<00:18,  4.25it/s][A
Training:  25%|██▍       | 26/105 [00:06<00:17,  4.50it/s][A
Training:  28%|██▊       | 29/105 [00:07<00:16,  4.56it/s][A
Training:  29%|██▊  

Epoch: 34/66 - Loss: 0.1446 - Accuracy: 0.9425



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:17,  1.35s/it][A
 36%|███▌      | 5/14 [00:02<00:03,  2.68it/s][A
 50%|█████     | 7/14 [00:02<00:01,  3.85it/s][A
 64%|██████▍   | 9/14 [00:03<00:01,  3.33it/s][A
 79%|███████▊  | 11/14 [00:03<00:00,  4.57it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.56it/s][A
Epochs:  52%|█████▏    | 34/66 [15:28<14:33, 27.30s/it]

Val Loss: 0.1629 - Val Accuracy: 0.9128



Training:   0%|          | 0/105 [00:00<?, ?it/s][A
Training:   1%|          | 1/105 [00:01<02:22,  1.37s/it][A
Training:   5%|▍         | 5/105 [00:02<00:36,  2.73it/s][A
Training:   6%|▌         | 6/105 [00:02<00:30,  3.27it/s][A
Training:   8%|▊         | 8/105 [00:02<00:20,  4.76it/s][A
Training:   9%|▊         | 9/105 [00:03<00:32,  2.96it/s][A
Training:  10%|█         | 11/105 [00:03<00:21,  4.31it/s][A
Training:  12%|█▏        | 13/105 [00:04<00:26,  3.53it/s][A
Training:  15%|█▌        | 16/105 [00:04<00:16,  5.55it/s][A
Training:  17%|█▋        | 18/105 [00:04<00:20,  4.33it/s][A
Training:  20%|██        | 21/105 [00:05<00:20,  4.16it/s][A
Training:  22%|██▏       | 23/105 [00:05<00:15,  5.27it/s][A
Training:  24%|██▍       | 25/105 [00:06<00:17,  4.47it/s][A
Training:  26%|██▌       | 27/105 [00:06<00:13,  5.70it/s][A
Training:  28%|██▊       | 29/105 [00:07<00:17,  4.43it/s][A
Training:  30%|██▉       | 31/105 [00:07<00:13,  5.60it/s][A
Training:  31%|███▏  

Epoch: 35/66 - Loss: 0.1440 - Accuracy: 0.9438



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:15,  1.19s/it][A
 14%|█▍        | 2/14 [00:01<00:06,  1.80it/s][A
 36%|███▌      | 5/14 [00:01<00:02,  3.26it/s][A
 43%|████▎     | 6/14 [00:02<00:02,  3.76it/s][A
 57%|█████▋    | 8/14 [00:02<00:01,  5.64it/s][A
 71%|███████▏  | 10/14 [00:02<00:01,  3.84it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.70it/s][A
Epochs:  53%|█████▎    | 35/66 [15:54<13:58, 27.04s/it]

Val Loss: 0.1537 - Val Accuracy: 0.9419



Training:   0%|          | 0/105 [00:00<?, ?it/s][A
Training:   1%|          | 1/105 [00:01<02:07,  1.22s/it][A
Training:   5%|▍         | 5/105 [00:02<00:37,  2.69it/s][A
Training:   8%|▊         | 8/105 [00:02<00:21,  4.55it/s][A
Training:  10%|▉         | 10/105 [00:03<00:26,  3.57it/s][A
Training:  11%|█▏        | 12/105 [00:03<00:20,  4.56it/s][A
Training:  12%|█▏        | 13/105 [00:03<00:27,  3.40it/s][A
Training:  13%|█▎        | 14/105 [00:04<00:23,  3.87it/s][A
Training:  14%|█▍        | 15/105 [00:04<00:20,  4.48it/s][A
Training:  16%|█▌        | 17/105 [00:04<00:22,  3.90it/s][A
Training:  18%|█▊        | 19/105 [00:04<00:17,  5.04it/s][A
Training:  19%|█▉        | 20/105 [00:05<00:15,  5.50it/s][A
Training:  20%|██        | 21/105 [00:05<00:22,  3.77it/s][A
Training:  21%|██        | 22/105 [00:05<00:22,  3.74it/s][A
Training:  24%|██▍       | 25/105 [00:06<00:19,  4.14it/s][A
Training:  25%|██▍       | 26/105 [00:06<00:21,  3.74it/s][A
Training:  27%|██▋ 

Epoch: 36/66 - Loss: 0.1432 - Accuracy: 0.9428



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:16,  1.24s/it][A
 36%|███▌      | 5/14 [00:02<00:03,  2.65it/s][A
 57%|█████▋    | 8/14 [00:02<00:01,  4.66it/s][A
 71%|███████▏  | 10/14 [00:03<00:01,  3.57it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.56it/s][A
Epochs:  55%|█████▍    | 36/66 [16:21<13:26, 26.90s/it]

Val Loss: 0.1554 - Val Accuracy: 0.9419



Training:   0%|          | 0/105 [00:00<?, ?it/s][A
Training:   1%|          | 1/105 [00:01<02:02,  1.18s/it][A
Training:   3%|▎         | 3/105 [00:01<00:35,  2.91it/s][A
Training:   5%|▍         | 5/105 [00:02<00:36,  2.77it/s][A
Training:   7%|▋         | 7/105 [00:02<00:23,  4.23it/s][A
Training:   9%|▊         | 9/105 [00:02<00:28,  3.33it/s][A
Training:  11%|█▏        | 12/105 [00:03<00:16,  5.52it/s][A
Training:  13%|█▎        | 14/105 [00:04<00:24,  3.74it/s][A
Training:  16%|█▌        | 17/105 [00:04<00:23,  3.74it/s][A
Training:  20%|██        | 21/105 [00:05<00:21,  3.97it/s][A
Training:  22%|██▏       | 23/105 [00:05<00:16,  4.88it/s][A
Training:  24%|██▍       | 25/105 [00:06<00:20,  3.93it/s][A
Training:  26%|██▌       | 27/105 [00:06<00:15,  4.92it/s][A
Training:  28%|██▊       | 29/105 [00:07<00:19,  3.96it/s][A
Training:  30%|██▉       | 31/105 [00:07<00:14,  4.99it/s][A
Training:  31%|███▏      | 33/105 [00:08<00:16,  4.38it/s][A
Training:  33%|███▎  

Epoch: 37/66 - Loss: 0.1429 - Accuracy: 0.9439



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:14,  1.11s/it][A
 21%|██▏       | 3/14 [00:01<00:03,  3.01it/s][A
 36%|███▌      | 5/14 [00:02<00:03,  2.65it/s][A
 50%|█████     | 7/14 [00:02<00:01,  4.02it/s][A
 64%|██████▍   | 9/14 [00:03<00:01,  3.20it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.61it/s][A
Epochs:  56%|█████▌    | 37/66 [16:47<12:57, 26.81s/it]

Val Loss: 0.1514 - Val Accuracy: 0.9419



Training:   0%|          | 0/105 [00:00<?, ?it/s][A
Training:   1%|          | 1/105 [00:01<02:19,  1.34s/it][A
Training:   4%|▍         | 4/105 [00:01<00:28,  3.53it/s][A
Training:   6%|▌         | 6/105 [00:02<00:37,  2.65it/s][A
Training:   9%|▊         | 9/105 [00:03<00:32,  2.96it/s][A
Training:  12%|█▏        | 13/105 [00:04<00:25,  3.66it/s][A
Training:  15%|█▌        | 16/105 [00:04<00:17,  5.19it/s][A
Training:  17%|█▋        | 18/105 [00:05<00:21,  4.03it/s][A
Training:  20%|██        | 21/105 [00:06<00:23,  3.61it/s][A
Training:  22%|██▏       | 23/105 [00:06<00:18,  4.52it/s][A
Training:  24%|██▍       | 25/105 [00:06<00:20,  3.86it/s][A
Training:  28%|██▊       | 29/105 [00:07<00:17,  4.38it/s][A
Training:  30%|███       | 32/105 [00:07<00:12,  5.95it/s][A
Training:  32%|███▏      | 34/105 [00:08<00:16,  4.29it/s][A
Training:  34%|███▍      | 36/105 [00:08<00:12,  5.31it/s][A
Training:  36%|███▌      | 38/105 [00:09<00:16,  4.15it/s][A
Training:  39%|███▉ 

Epoch: 38/66 - Loss: 0.1420 - Accuracy: 0.9454



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:16,  1.24s/it][A
 14%|█▍        | 2/14 [00:01<00:07,  1.53it/s][A
 36%|███▌      | 5/14 [00:02<00:03,  2.71it/s][A
 43%|████▎     | 6/14 [00:02<00:02,  3.23it/s][A
 64%|██████▍   | 9/14 [00:03<00:01,  3.82it/s][A
 71%|███████▏  | 10/14 [00:03<00:01,  3.89it/s][A
 86%|████████▌ | 12/14 [00:03<00:00,  5.45it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.58it/s][A
Epochs:  58%|█████▊    | 38/66 [17:14<12:33, 26.89s/it]

Val Loss: 0.1550 - Val Accuracy: 0.9186



Training:   0%|          | 0/105 [00:00<?, ?it/s][A
Training:   1%|          | 1/105 [00:01<02:43,  1.57s/it][A
Training:   5%|▍         | 5/105 [00:02<00:38,  2.57it/s][A
Training:   7%|▋         | 7/105 [00:02<00:26,  3.72it/s][A
Training:   9%|▊         | 9/105 [00:03<00:27,  3.52it/s][A
Training:  10%|█         | 11/105 [00:03<00:19,  4.73it/s][A
Training:  12%|█▏        | 13/105 [00:03<00:23,  3.93it/s][A
Training:  13%|█▎        | 14/105 [00:04<00:21,  4.26it/s][A
Training:  14%|█▍        | 15/105 [00:04<00:18,  4.79it/s][A
Training:  16%|█▌        | 17/105 [00:04<00:19,  4.58it/s][A
Training:  17%|█▋        | 18/105 [00:04<00:20,  4.26it/s][A
Training:  20%|██        | 21/105 [00:05<00:16,  5.13it/s][A
Training:  21%|██        | 22/105 [00:05<00:16,  5.09it/s][A
Training:  24%|██▍       | 25/105 [00:06<00:14,  5.46it/s][A
Training:  25%|██▍       | 26/105 [00:06<00:15,  5.22it/s][A
Training:  28%|██▊       | 29/105 [00:06<00:15,  5.03it/s][A
Training:  29%|██▊  

Epoch: 39/66 - Loss: 0.1411 - Accuracy: 0.9442



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:18,  1.41s/it][A
 36%|███▌      | 5/14 [00:02<00:03,  2.71it/s][A
 64%|██████▍   | 9/14 [00:02<00:01,  3.65it/s][A
 71%|███████▏  | 10/14 [00:03<00:01,  3.83it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.62it/s][A
Epochs:  59%|█████▉    | 39/66 [17:40<11:58, 26.61s/it]

Val Loss: 0.1498 - Val Accuracy: 0.9446



Training:   0%|          | 0/105 [00:00<?, ?it/s][A
Training:   1%|          | 1/105 [00:01<02:14,  1.29s/it][A
Training:   3%|▎         | 3/105 [00:01<00:38,  2.66it/s][A
Training:   5%|▍         | 5/105 [00:02<00:36,  2.72it/s][A
Training:   6%|▌         | 6/105 [00:02<00:29,  3.38it/s][A
Training:   9%|▊         | 9/105 [00:03<00:26,  3.56it/s][A
Training:  10%|█         | 11/105 [00:03<00:19,  4.74it/s][A
Training:  12%|█▏        | 13/105 [00:03<00:24,  3.80it/s][A
Training:  14%|█▍        | 15/105 [00:04<00:18,  4.95it/s][A
Training:  16%|█▌        | 17/105 [00:04<00:23,  3.71it/s][A
Training:  20%|██        | 21/105 [00:05<00:19,  4.28it/s][A
Training:  22%|██▏       | 23/105 [00:05<00:15,  5.21it/s][A
Training:  24%|██▍       | 25/105 [00:06<00:19,  4.14it/s][A
Training:  26%|██▌       | 27/105 [00:06<00:15,  5.12it/s][A
Training:  28%|██▊       | 29/105 [00:07<00:18,  4.07it/s][A
Training:  29%|██▊       | 30/105 [00:07<00:16,  4.46it/s][A
Training:  31%|███▏  

Epoch: 40/66 - Loss: 0.1420 - Accuracy: 0.9436



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:15,  1.20s/it][A
 14%|█▍        | 2/14 [00:01<00:06,  1.78it/s][A
 29%|██▊       | 4/14 [00:01<00:02,  4.10it/s][A
 43%|████▎     | 6/14 [00:02<00:02,  3.18it/s][A
 64%|██████▍   | 9/14 [00:02<00:01,  3.69it/s][A
 71%|███████▏  | 10/14 [00:03<00:01,  3.58it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.67it/s][A
Epochs:  61%|██████    | 40/66 [18:07<11:31, 26.58s/it]

Val Loss: 0.1497 - Val Accuracy: 0.9414



Training:   0%|          | 0/105 [00:00<?, ?it/s][A
Training:   1%|          | 1/105 [00:01<02:00,  1.16s/it][A
Training:   2%|▏         | 2/105 [00:01<00:56,  1.81it/s][A
Training:   4%|▍         | 4/105 [00:01<00:29,  3.47it/s][A
Training:   5%|▍         | 5/105 [00:02<00:35,  2.83it/s][A
Training:   7%|▋         | 7/105 [00:02<00:22,  4.39it/s][A
Training:   9%|▊         | 9/105 [00:02<00:25,  3.79it/s][A
Training:  10%|▉         | 10/105 [00:03<00:22,  4.17it/s][A
Training:  11%|█▏        | 12/105 [00:03<00:19,  4.86it/s][A
Training:  12%|█▏        | 13/105 [00:03<00:20,  4.45it/s][A
Training:  13%|█▎        | 14/105 [00:03<00:22,  3.97it/s][A
Training:  15%|█▌        | 16/105 [00:04<00:16,  5.53it/s][A
Training:  16%|█▌        | 17/105 [00:04<00:17,  5.04it/s][A
Training:  17%|█▋        | 18/105 [00:04<00:23,  3.68it/s][A
Training:  20%|██        | 21/105 [00:05<00:17,  4.77it/s][A
Training:  21%|██        | 22/105 [00:05<00:21,  3.86it/s][A
Training:  23%|██▎    

Epoch: 41/66 - Loss: 0.1413 - Accuracy: 0.9428



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:15,  1.15s/it][A
 14%|█▍        | 2/14 [00:01<00:07,  1.66it/s][A
 29%|██▊       | 4/14 [00:01<00:02,  3.91it/s][A
 43%|████▎     | 6/14 [00:02<00:02,  3.39it/s][A
 57%|█████▋    | 8/14 [00:02<00:01,  4.99it/s][A
 71%|███████▏  | 10/14 [00:03<00:01,  3.79it/s][A
 86%|████████▌ | 12/14 [00:03<00:00,  5.11it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.84it/s][A
Epochs:  62%|██████▏   | 41/66 [18:33<11:01, 26.45s/it]

Val Loss: 0.1551 - Val Accuracy: 0.9154



Training:   0%|          | 0/105 [00:00<?, ?it/s][A
Training:   1%|          | 1/105 [00:01<02:21,  1.36s/it][A
Training:   3%|▎         | 3/105 [00:01<00:42,  2.42it/s][A
Training:   5%|▍         | 5/105 [00:02<00:38,  2.57it/s][A
Training:   8%|▊         | 8/105 [00:02<00:20,  4.84it/s][A
Training:  10%|▉         | 10/105 [00:03<00:25,  3.78it/s][A
Training:  12%|█▏        | 13/105 [00:03<00:24,  3.72it/s][A
Training:  15%|█▌        | 16/105 [00:04<00:16,  5.51it/s][A
Training:  17%|█▋        | 18/105 [00:05<00:22,  3.93it/s][A
Training:  19%|█▉        | 20/105 [00:05<00:16,  5.03it/s][A
Training:  21%|██        | 22/105 [00:05<00:22,  3.76it/s][A
Training:  24%|██▍       | 25/105 [00:06<00:21,  3.67it/s][A
Training:  27%|██▋       | 28/105 [00:06<00:14,  5.24it/s][A
Training:  29%|██▊       | 30/105 [00:07<00:18,  4.15it/s][A
Training:  30%|███       | 32/105 [00:07<00:14,  5.18it/s][A
Training:  32%|███▏      | 34/105 [00:08<00:17,  4.16it/s][A
Training:  35%|███▌ 

Epoch: 42/66 - Loss: 0.1394 - Accuracy: 0.9454



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:17,  1.31s/it][A
 21%|██▏       | 3/14 [00:01<00:04,  2.56it/s][A
 36%|███▌      | 5/14 [00:02<00:03,  2.63it/s][A
 50%|█████     | 7/14 [00:02<00:01,  3.96it/s][A
 64%|██████▍   | 9/14 [00:03<00:01,  3.57it/s][A
 79%|███████▊  | 11/14 [00:03<00:00,  4.80it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.62it/s][A
Epochs:  64%|██████▎   | 42/66 [19:00<10:38, 26.59s/it]

Val Loss: 0.1504 - Val Accuracy: 0.9451



Training:   0%|          | 0/105 [00:00<?, ?it/s][A
Training:   1%|          | 1/105 [00:01<02:11,  1.27s/it][A
Training:   2%|▏         | 2/105 [00:01<01:01,  1.68it/s][A
Training:   4%|▍         | 4/105 [00:01<00:27,  3.64it/s][A
Training:   5%|▍         | 5/105 [00:02<00:36,  2.74it/s][A
Training:   7%|▋         | 7/105 [00:02<00:21,  4.49it/s][A
Training:   9%|▊         | 9/105 [00:03<00:27,  3.46it/s][A
Training:  10%|█         | 11/105 [00:03<00:20,  4.52it/s][A
Training:  12%|█▏        | 13/105 [00:03<00:24,  3.82it/s][A
Training:  14%|█▍        | 15/105 [00:04<00:17,  5.08it/s][A
Training:  16%|█▌        | 17/105 [00:04<00:21,  4.08it/s][A
Training:  18%|█▊        | 19/105 [00:05<00:18,  4.66it/s][A
Training:  19%|█▉        | 20/105 [00:05<00:16,  5.14it/s][A
Training:  20%|██        | 21/105 [00:05<00:22,  3.68it/s][A
Training:  22%|██▏       | 23/105 [00:06<00:18,  4.38it/s][A
Training:  24%|██▍       | 25/105 [00:06<00:19,  4.10it/s][A
Training:  26%|██▌    

Epoch: 43/66 - Loss: 0.1399 - Accuracy: 0.9438



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:16,  1.28s/it][A
 21%|██▏       | 3/14 [00:01<00:04,  2.70it/s][A
 36%|███▌      | 5/14 [00:02<00:03,  2.73it/s][A
 64%|██████▍   | 9/14 [00:03<00:01,  3.35it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.55it/s][A
Epochs:  65%|██████▌   | 43/66 [19:26<10:10, 26.55s/it]

Val Loss: 0.1483 - Val Accuracy: 0.9435



Training:   0%|          | 0/105 [00:00<?, ?it/s][A
Training:   1%|          | 1/105 [00:01<02:18,  1.33s/it][A
Training:   4%|▍         | 4/105 [00:01<00:29,  3.48it/s][A
Training:   6%|▌         | 6/105 [00:02<00:35,  2.75it/s][A
Training:   9%|▊         | 9/105 [00:03<00:32,  2.92it/s][A
Training:  10%|█         | 11/105 [00:03<00:23,  3.97it/s][A
Training:  12%|█▏        | 13/105 [00:04<00:27,  3.39it/s][A
Training:  15%|█▌        | 16/105 [00:04<00:17,  5.15it/s][A
Training:  17%|█▋        | 18/105 [00:05<00:21,  4.04it/s][A
Training:  19%|█▉        | 20/105 [00:05<00:16,  5.18it/s][A
Training:  21%|██        | 22/105 [00:05<00:20,  4.11it/s][A
Training:  23%|██▎       | 24/105 [00:06<00:15,  5.23it/s][A
Training:  25%|██▍       | 26/105 [00:06<00:19,  4.00it/s][A
Training:  28%|██▊       | 29/105 [00:07<00:18,  4.10it/s][A
Training:  31%|███▏      | 33/105 [00:08<00:16,  4.34it/s][A
Training:  33%|███▎      | 35/105 [00:08<00:13,  5.27it/s][A
Training:  35%|███▌ 

Epoch: 44/66 - Loss: 0.1394 - Accuracy: 0.9458



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:19,  1.47s/it][A
 36%|███▌      | 5/14 [00:02<00:03,  2.51it/s][A
 57%|█████▋    | 8/14 [00:02<00:01,  4.33it/s][A
 71%|███████▏  | 10/14 [00:03<00:01,  3.50it/s][A
100%|██████████| 14/14 [00:04<00:00,  3.33it/s][A
Epochs:  67%|██████▋   | 44/66 [19:54<09:49, 26.80s/it]

Val Loss: 0.1518 - Val Accuracy: 0.9403



Training:   0%|          | 0/105 [00:00<?, ?it/s][A
Training:   1%|          | 1/105 [00:01<02:24,  1.39s/it][A
Training:   5%|▍         | 5/105 [00:02<00:36,  2.75it/s][A
Training:   7%|▋         | 7/105 [00:02<00:24,  4.08it/s][A
Training:   9%|▊         | 9/105 [00:03<00:31,  3.03it/s][A
Training:  10%|█         | 11/105 [00:03<00:22,  4.19it/s][A
Training:  12%|█▏        | 13/105 [00:04<00:26,  3.50it/s][A
Training:  14%|█▍        | 15/105 [00:04<00:19,  4.69it/s][A
Training:  16%|█▌        | 17/105 [00:04<00:22,  3.90it/s][A
Training:  18%|█▊        | 19/105 [00:05<00:16,  5.18it/s][A
Training:  20%|██        | 21/105 [00:05<00:18,  4.45it/s][A
Training:  22%|██▏       | 23/105 [00:05<00:14,  5.60it/s][A
Training:  24%|██▍       | 25/105 [00:06<00:18,  4.35it/s][A
Training:  26%|██▌       | 27/105 [00:06<00:15,  5.05it/s][A
Training:  27%|██▋       | 28/105 [00:06<00:15,  4.92it/s][A
Training:  28%|██▊       | 29/105 [00:07<00:20,  3.69it/s][A
Training:  30%|██▉  

Epoch: 45/66 - Loss: 0.1380 - Accuracy: 0.9468



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:13,  1.06s/it][A
 29%|██▊       | 4/14 [00:01<00:02,  4.15it/s][A
 43%|████▎     | 6/14 [00:02<00:02,  3.02it/s][A
 50%|█████     | 7/14 [00:02<00:01,  3.57it/s][A
 64%|██████▍   | 9/14 [00:02<00:01,  3.38it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.83it/s][A
Epochs:  68%|██████▊   | 45/66 [20:20<09:21, 26.73s/it]

Val Loss: 0.1486 - Val Accuracy: 0.9424



Training:   0%|          | 0/105 [00:00<?, ?it/s][A
Training:   1%|          | 1/105 [00:01<01:55,  1.11s/it][A
Training:   4%|▍         | 4/105 [00:01<00:24,  4.08it/s][A
Training:   6%|▌         | 6/105 [00:02<00:32,  3.03it/s][A
Training:   9%|▊         | 9/105 [00:03<00:31,  3.08it/s][A
Training:  11%|█▏        | 12/105 [00:03<00:20,  4.54it/s][A
Training:  12%|█▏        | 13/105 [00:03<00:25,  3.54it/s][A
Training:  14%|█▍        | 15/105 [00:04<00:19,  4.56it/s][A
Training:  16%|█▌        | 17/105 [00:04<00:24,  3.64it/s][A
Training:  17%|█▋        | 18/105 [00:04<00:21,  4.09it/s][A
Training:  20%|██        | 21/105 [00:05<00:20,  4.04it/s][A
Training:  22%|██▏       | 23/105 [00:05<00:15,  5.25it/s][A
Training:  24%|██▍       | 25/105 [00:06<00:20,  3.91it/s][A
Training:  26%|██▌       | 27/105 [00:06<00:15,  5.10it/s][A
Training:  28%|██▊       | 29/105 [00:07<00:20,  3.71it/s][A
Training:  30%|██▉       | 31/105 [00:07<00:15,  4.79it/s][A
Training:  31%|███▏ 

Epoch: 46/66 - Loss: 0.1387 - Accuracy: 0.9452



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:15,  1.22s/it][A
 29%|██▊       | 4/14 [00:01<00:02,  3.79it/s][A
 43%|████▎     | 6/14 [00:02<00:02,  3.21it/s][A
 64%|██████▍   | 9/14 [00:02<00:01,  3.54it/s][A
 86%|████████▌ | 12/14 [00:02<00:00,  5.43it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.72it/s][A
Epochs:  70%|██████▉   | 46/66 [20:47<08:57, 26.90s/it]

Val Loss: 0.1479 - Val Accuracy: 0.9424



Training:   0%|          | 0/105 [00:00<?, ?it/s][A
Training:   1%|          | 1/105 [00:01<02:14,  1.29s/it][A
Training:   3%|▎         | 3/105 [00:01<00:37,  2.69it/s][A
Training:   5%|▍         | 5/105 [00:02<00:36,  2.72it/s][A
Training:   7%|▋         | 7/105 [00:02<00:23,  4.24it/s][A
Training:   9%|▊         | 9/105 [00:02<00:27,  3.48it/s][A
Training:  10%|█         | 11/105 [00:03<00:19,  4.79it/s][A
Training:  12%|█▏        | 13/105 [00:03<00:23,  3.90it/s][A
Training:  14%|█▍        | 15/105 [00:03<00:17,  5.18it/s][A
Training:  16%|█▌        | 17/105 [00:04<00:21,  4.06it/s][A
Training:  19%|█▉        | 20/105 [00:04<00:13,  6.12it/s][A
Training:  21%|██        | 22/105 [00:05<00:20,  4.00it/s][A
Training:  23%|██▎       | 24/105 [00:05<00:15,  5.13it/s][A
Training:  25%|██▍       | 26/105 [00:06<00:19,  4.08it/s][A
Training:  28%|██▊       | 29/105 [00:07<00:17,  4.41it/s][A
Training:  31%|███▏      | 33/105 [00:07<00:15,  4.79it/s][A
Training:  32%|███▏  

Epoch: 47/66 - Loss: 0.1367 - Accuracy: 0.9469



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:18,  1.40s/it][A
 36%|███▌      | 5/14 [00:02<00:03,  2.76it/s][A
 64%|██████▍   | 9/14 [00:02<00:01,  3.66it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.62it/s][A
Epochs:  71%|███████   | 47/66 [21:14<08:28, 26.78s/it]

Val Loss: 0.1513 - Val Accuracy: 0.9424



Training:   0%|          | 0/105 [00:00<?, ?it/s][A
Training:   1%|          | 1/105 [00:01<01:56,  1.12s/it][A
Training:   2%|▏         | 2/105 [00:01<00:55,  1.84it/s][A
Training:   5%|▍         | 5/105 [00:02<00:35,  2.80it/s][A
Training:   7%|▋         | 7/105 [00:02<00:24,  4.08it/s][A
Training:   9%|▊         | 9/105 [00:03<00:28,  3.31it/s][A
Training:  10%|█         | 11/105 [00:03<00:21,  4.42it/s][A
Training:  12%|█▏        | 13/105 [00:04<00:26,  3.54it/s][A
Training:  14%|█▍        | 15/105 [00:04<00:18,  4.77it/s][A
Training:  16%|█▌        | 17/105 [00:04<00:23,  3.80it/s][A
Training:  19%|█▉        | 20/105 [00:05<00:14,  5.76it/s][A
Training:  21%|██        | 22/105 [00:05<00:20,  3.97it/s][A
Training:  23%|██▎       | 24/105 [00:06<00:16,  4.89it/s][A
Training:  25%|██▍       | 26/105 [00:07<00:22,  3.55it/s][A
Training:  27%|██▋       | 28/105 [00:07<00:16,  4.65it/s][A
Training:  29%|██▊       | 30/105 [00:07<00:19,  3.90it/s][A
Training:  31%|███▏  

Epoch: 48/66 - Loss: 0.1374 - Accuracy: 0.9449



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:15,  1.23s/it][A
 29%|██▊       | 4/14 [00:01<00:02,  3.75it/s][A
 43%|████▎     | 6/14 [00:02<00:02,  2.93it/s][A
 64%|██████▍   | 9/14 [00:02<00:01,  3.60it/s][A
 71%|███████▏  | 10/14 [00:03<00:01,  3.64it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.82it/s][A
Epochs:  73%|███████▎  | 48/66 [21:41<08:02, 26.82s/it]

Val Loss: 0.1432 - Val Accuracy: 0.9456



Training:   0%|          | 0/105 [00:00<?, ?it/s][A
Training:   1%|          | 1/105 [00:01<01:55,  1.11s/it][A
Training:   3%|▎         | 3/105 [00:01<00:34,  2.94it/s][A
Training:   5%|▍         | 5/105 [00:01<00:31,  3.19it/s][A
Training:   6%|▌         | 6/105 [00:01<00:25,  3.90it/s][A
Training:   8%|▊         | 8/105 [00:02<00:16,  5.83it/s][A
Training:  10%|▉         | 10/105 [00:02<00:26,  3.63it/s][A
Training:  12%|█▏        | 13/105 [00:03<00:24,  3.76it/s][A
Training:  13%|█▎        | 14/105 [00:03<00:22,  4.03it/s][A
Training:  15%|█▌        | 16/105 [00:03<00:16,  5.46it/s][A
Training:  17%|█▋        | 18/105 [00:04<00:21,  3.97it/s][A
Training:  19%|█▉        | 20/105 [00:04<00:16,  5.24it/s][A
Training:  21%|██        | 22/105 [00:05<00:23,  3.56it/s][A
Training:  24%|██▍       | 25/105 [00:06<00:23,  3.44it/s][A
Training:  28%|██▊       | 29/105 [00:07<00:19,  3.91it/s][A
Training:  30%|██▉       | 31/105 [00:07<00:15,  4.74it/s][A
Training:  31%|███▏  

Epoch: 49/66 - Loss: 0.1355 - Accuracy: 0.9473



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:15,  1.16s/it][A
 21%|██▏       | 3/14 [00:01<00:03,  2.93it/s][A
 36%|███▌      | 5/14 [00:01<00:02,  3.14it/s][A
 50%|█████     | 7/14 [00:02<00:01,  4.54it/s][A
 64%|██████▍   | 9/14 [00:02<00:01,  3.68it/s][A
 79%|███████▊  | 11/14 [00:02<00:00,  5.14it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.87it/s][A
Epochs:  74%|███████▍  | 49/66 [22:08<07:38, 26.96s/it]

Val Loss: 0.1478 - Val Accuracy: 0.9440



Training:   0%|          | 0/105 [00:00<?, ?it/s][A
Training:   1%|          | 1/105 [00:01<02:06,  1.22s/it][A
Training:   3%|▎         | 3/105 [00:01<00:36,  2.81it/s][A
Training:   5%|▍         | 5/105 [00:02<00:36,  2.77it/s][A
Training:   7%|▋         | 7/105 [00:02<00:23,  4.25it/s][A
Training:   9%|▊         | 9/105 [00:02<00:26,  3.62it/s][A
Training:  10%|█         | 11/105 [00:02<00:18,  5.07it/s][A
Training:  12%|█▏        | 13/105 [00:03<00:20,  4.60it/s][A
Training:  13%|█▎        | 14/105 [00:03<00:19,  4.55it/s][A
Training:  15%|█▌        | 16/105 [00:03<00:14,  6.19it/s][A
Training:  17%|█▋        | 18/105 [00:04<00:22,  3.88it/s][A
Training:  19%|█▉        | 20/105 [00:04<00:16,  5.24it/s][A
Training:  21%|██        | 22/105 [00:05<00:21,  3.94it/s][A
Training:  23%|██▎       | 24/105 [00:05<00:16,  4.96it/s][A
Training:  24%|██▍       | 25/105 [00:06<00:17,  4.59it/s][A
Training:  25%|██▍       | 26/105 [00:06<00:19,  4.07it/s][A
Training:  26%|██▌   

Epoch: 50/66 - Loss: 0.1361 - Accuracy: 0.9460



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:17,  1.33s/it][A
 36%|███▌      | 5/14 [00:02<00:03,  2.86it/s][A
 64%|██████▍   | 9/14 [00:02<00:01,  3.74it/s][A
 86%|████████▌ | 12/14 [00:03<00:00,  5.41it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.87it/s][A
Epochs:  76%|███████▌  | 50/66 [22:35<07:11, 26.96s/it]

Val Loss: 0.1494 - Val Accuracy: 0.9435



Training:   0%|          | 0/105 [00:00<?, ?it/s][A
Training:   1%|          | 1/105 [00:01<02:13,  1.28s/it][A
Training:   2%|▏         | 2/105 [00:01<01:02,  1.66it/s][A
Training:   5%|▍         | 5/105 [00:02<00:32,  3.10it/s][A
Training:   6%|▌         | 6/105 [00:02<00:27,  3.65it/s][A
Training:   9%|▊         | 9/105 [00:02<00:25,  3.75it/s][A
Training:  10%|█         | 11/105 [00:03<00:18,  5.12it/s][A
Training:  12%|█▏        | 13/105 [00:03<00:24,  3.74it/s][A
Training:  15%|█▌        | 16/105 [00:04<00:15,  5.73it/s][A
Training:  17%|█▋        | 18/105 [00:04<00:20,  4.31it/s][A
Training:  20%|██        | 21/105 [00:05<00:20,  4.17it/s][A
Training:  22%|██▏       | 23/105 [00:05<00:15,  5.18it/s][A
Training:  24%|██▍       | 25/105 [00:06<00:17,  4.49it/s][A
Training:  25%|██▍       | 26/105 [00:06<00:18,  4.32it/s][A
Training:  27%|██▋       | 28/105 [00:06<00:13,  5.73it/s][A
Training:  29%|██▊       | 30/105 [00:07<00:17,  4.39it/s][A
Training:  31%|███▏  

Epoch: 51/66 - Loss: 0.1358 - Accuracy: 0.9477



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:17,  1.32s/it][A
 36%|███▌      | 5/14 [00:02<00:03,  2.85it/s][A
 64%|██████▍   | 9/14 [00:02<00:01,  3.94it/s][A
 86%|████████▌ | 12/14 [00:02<00:00,  5.57it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.98it/s][A
Epochs:  77%|███████▋  | 51/66 [23:01<06:41, 26.76s/it]

Val Loss: 0.1436 - Val Accuracy: 0.9451



Training:   0%|          | 0/105 [00:00<?, ?it/s][A
Training:   1%|          | 1/105 [00:01<02:05,  1.20s/it][A
Training:   3%|▎         | 3/105 [00:01<00:36,  2.78it/s][A
Training:   5%|▍         | 5/105 [00:02<00:35,  2.82it/s][A
Training:   7%|▋         | 7/105 [00:02<00:25,  3.90it/s][A
Training:   9%|▊         | 9/105 [00:02<00:25,  3.84it/s][A
Training:  10%|█         | 11/105 [00:03<00:22,  4.26it/s][A
Training:  12%|█▏        | 13/105 [00:03<00:20,  4.42it/s][A
Training:  14%|█▍        | 15/105 [00:03<00:18,  4.77it/s][A
Training:  16%|█▌        | 17/105 [00:04<00:18,  4.68it/s][A
Training:  18%|█▊        | 19/105 [00:04<00:17,  4.93it/s][A
Training:  20%|██        | 21/105 [00:05<00:18,  4.48it/s][A
Training:  22%|██▏       | 23/105 [00:05<00:16,  4.87it/s][A
Training:  24%|██▍       | 25/105 [00:06<00:18,  4.43it/s][A
Training:  26%|██▌       | 27/105 [00:06<00:17,  4.55it/s][A
Training:  28%|██▊       | 29/105 [00:07<00:18,  4.09it/s][A
Training:  30%|██▉   

Epoch: 52/66 - Loss: 0.1353 - Accuracy: 0.9468



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:17,  1.34s/it][A
 36%|███▌      | 5/14 [00:02<00:03,  2.68it/s][A
 50%|█████     | 7/14 [00:02<00:01,  3.86it/s][A
 64%|██████▍   | 9/14 [00:03<00:01,  3.39it/s][A
 79%|███████▊  | 11/14 [00:03<00:00,  4.53it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.56it/s][A
Epochs:  79%|███████▉  | 52/66 [23:28<06:16, 26.86s/it]

Val Loss: 0.1511 - Val Accuracy: 0.9435



Training:   0%|          | 0/105 [00:00<?, ?it/s][A
Training:   1%|          | 1/105 [00:01<01:58,  1.14s/it][A
Training:   2%|▏         | 2/105 [00:01<00:55,  1.87it/s][A
Training:   4%|▍         | 4/105 [00:01<00:25,  3.96it/s][A
Training:   5%|▍         | 5/105 [00:02<00:39,  2.54it/s][A
Training:   7%|▋         | 7/105 [00:02<00:23,  4.24it/s][A
Training:   9%|▊         | 9/105 [00:02<00:25,  3.80it/s][A
Training:  10%|▉         | 10/105 [00:03<00:23,  4.11it/s][A
Training:  12%|█▏        | 13/105 [00:03<00:19,  4.65it/s][A
Training:  13%|█▎        | 14/105 [00:03<00:19,  4.78it/s][A
Training:  16%|█▌        | 17/105 [00:04<00:18,  4.69it/s][A
Training:  17%|█▋        | 18/105 [00:04<00:17,  4.95it/s][A
Training:  19%|█▉        | 20/105 [00:04<00:12,  6.61it/s][A
Training:  21%|██        | 22/105 [00:05<00:17,  4.80it/s][A
Training:  24%|██▍       | 25/105 [00:06<00:17,  4.57it/s][A
Training:  26%|██▌       | 27/105 [00:06<00:13,  5.64it/s][A
Training:  27%|██▋    

Epoch: 53/66 - Loss: 0.1335 - Accuracy: 0.9483



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:14,  1.15s/it][A
 36%|███▌      | 5/14 [00:01<00:03,  2.93it/s][A
 50%|█████     | 7/14 [00:02<00:01,  4.11it/s][A
 64%|██████▍   | 9/14 [00:02<00:01,  3.49it/s][A
 79%|███████▊  | 11/14 [00:03<00:00,  4.57it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.86it/s][A
Epochs:  80%|████████  | 53/66 [23:55<05:49, 26.85s/it]

Val Loss: 0.1455 - Val Accuracy: 0.9446



Training:   0%|          | 0/105 [00:00<?, ?it/s][A
Training:   1%|          | 1/105 [00:01<02:05,  1.20s/it][A
Training:   3%|▎         | 3/105 [00:01<00:35,  2.85it/s][A
Training:   5%|▍         | 5/105 [00:01<00:33,  2.98it/s][A
Training:   7%|▋         | 7/105 [00:02<00:21,  4.47it/s][A
Training:   9%|▊         | 9/105 [00:02<00:24,  3.86it/s][A
Training:  10%|█         | 11/105 [00:02<00:17,  5.23it/s][A
Training:  12%|█▏        | 13/105 [00:03<00:21,  4.35it/s][A
Training:  13%|█▎        | 14/105 [00:03<00:19,  4.61it/s][A
Training:  15%|█▌        | 16/105 [00:03<00:14,  6.31it/s][A
Training:  17%|█▋        | 18/105 [00:04<00:19,  4.50it/s][A
Training:  18%|█▊        | 19/105 [00:04<00:17,  4.97it/s][A
Training:  20%|██        | 21/105 [00:05<00:21,  3.88it/s][A
Training:  22%|██▏       | 23/105 [00:05<00:16,  5.10it/s][A
Training:  24%|██▍       | 25/105 [00:06<00:20,  3.85it/s][A
Training:  27%|██▋       | 28/105 [00:06<00:13,  5.85it/s][A
Training:  29%|██▊   

Epoch: 54/66 - Loss: 0.1346 - Accuracy: 0.9474



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:17,  1.34s/it][A
 29%|██▊       | 4/14 [00:01<00:02,  3.43it/s][A
 43%|████▎     | 6/14 [00:02<00:02,  3.13it/s][A
 50%|█████     | 7/14 [00:02<00:01,  3.63it/s][A
 64%|██████▍   | 9/14 [00:03<00:01,  3.16it/s][A
 79%|███████▊  | 11/14 [00:03<00:00,  4.29it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.55it/s][A
Epochs:  82%|████████▏ | 54/66 [24:22<05:20, 26.75s/it]

Val Loss: 0.1427 - Val Accuracy: 0.9456



Training:   0%|          | 0/105 [00:00<?, ?it/s][A
Training:   1%|          | 1/105 [00:01<02:02,  1.18s/it][A
Training:   4%|▍         | 4/105 [00:01<00:25,  3.99it/s][A
Training:   6%|▌         | 6/105 [00:01<00:29,  3.37it/s][A
Training:   8%|▊         | 8/105 [00:02<00:20,  4.74it/s][A
Training:  10%|▉         | 10/105 [00:02<00:25,  3.67it/s][A
Training:  12%|█▏        | 13/105 [00:03<00:23,  3.94it/s][A
Training:  13%|█▎        | 14/105 [00:03<00:21,  4.19it/s][A
Training:  16%|█▌        | 17/105 [00:04<00:21,  4.05it/s][A
Training:  17%|█▋        | 18/105 [00:04<00:21,  3.95it/s][A
Training:  19%|█▉        | 20/105 [00:04<00:16,  5.18it/s][A
Training:  20%|██        | 21/105 [00:05<00:18,  4.48it/s][A
Training:  21%|██        | 22/105 [00:05<00:21,  3.79it/s][A
Training:  24%|██▍       | 25/105 [00:06<00:14,  5.42it/s][A
Training:  25%|██▍       | 26/105 [00:06<00:20,  3.92it/s][A
Training:  28%|██▊       | 29/105 [00:06<00:14,  5.35it/s][A
Training:  29%|██▊  

Epoch: 55/66 - Loss: 0.1334 - Accuracy: 0.9481



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:14,  1.11s/it][A
 14%|█▍        | 2/14 [00:01<00:06,  1.93it/s][A
 36%|███▌      | 5/14 [00:02<00:03,  2.82it/s][A
 64%|██████▍   | 9/14 [00:03<00:01,  3.40it/s][A
 86%|████████▌ | 12/14 [00:03<00:00,  5.11it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.53it/s][A
Epochs:  83%|████████▎ | 55/66 [24:48<04:53, 26.71s/it]

Val Loss: 0.1464 - Val Accuracy: 0.9414



Training:   0%|          | 0/105 [00:00<?, ?it/s][A
Training:   1%|          | 1/105 [00:01<02:03,  1.19s/it][A
Training:   2%|▏         | 2/105 [00:01<00:56,  1.81it/s][A
Training:   5%|▍         | 5/105 [00:02<00:35,  2.80it/s][A
Training:   6%|▌         | 6/105 [00:02<00:31,  3.13it/s][A
Training:   8%|▊         | 8/105 [00:02<00:20,  4.83it/s][A
Training:  10%|▉         | 10/105 [00:03<00:25,  3.72it/s][A
Training:  12%|█▏        | 13/105 [00:03<00:19,  4.68it/s][A
Training:  13%|█▎        | 14/105 [00:03<00:21,  4.18it/s][A
Training:  14%|█▍        | 15/105 [00:04<00:19,  4.62it/s][A
Training:  16%|█▌        | 17/105 [00:04<00:18,  4.71it/s][A
Training:  17%|█▋        | 18/105 [00:04<00:19,  4.57it/s][A
Training:  18%|█▊        | 19/105 [00:04<00:18,  4.74it/s][A
Training:  20%|██        | 21/105 [00:05<00:17,  4.85it/s][A
Training:  21%|██        | 22/105 [00:05<00:17,  4.81it/s][A
Training:  23%|██▎       | 24/105 [00:05<00:12,  6.66it/s][A
Training:  24%|██▍   

Epoch: 56/66 - Loss: 0.1347 - Accuracy: 0.9473



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:16,  1.29s/it][A
 14%|█▍        | 2/14 [00:01<00:07,  1.69it/s][A
 29%|██▊       | 4/14 [00:01<00:02,  3.92it/s][A
 43%|████▎     | 6/14 [00:02<00:02,  2.83it/s][A
 64%|██████▍   | 9/14 [00:03<00:01,  3.12it/s][A
 71%|███████▏  | 10/14 [00:03<00:01,  3.53it/s][A
100%|██████████| 14/14 [00:04<00:00,  3.42it/s][A
Epochs:  85%|████████▍ | 56/66 [25:16<04:28, 26.88s/it]

Val Loss: 0.1474 - Val Accuracy: 0.9414



Training:   0%|          | 0/105 [00:00<?, ?it/s][A
Training:   1%|          | 1/105 [00:01<02:23,  1.38s/it][A
Training:   4%|▍         | 4/105 [00:01<00:30,  3.36it/s][A
Training:   6%|▌         | 6/105 [00:02<00:33,  2.96it/s][A
Training:   9%|▊         | 9/105 [00:03<00:30,  3.15it/s][A
Training:  11%|█▏        | 12/105 [00:03<00:18,  4.95it/s][A
Training:  13%|█▎        | 14/105 [00:04<00:24,  3.78it/s][A
Training:  16%|█▌        | 17/105 [00:04<00:23,  3.75it/s][A
Training:  19%|█▉        | 20/105 [00:05<00:15,  5.38it/s][A
Training:  21%|██        | 22/105 [00:05<00:20,  4.07it/s][A
Training:  24%|██▍       | 25/105 [00:06<00:18,  4.27it/s][A
Training:  25%|██▍       | 26/105 [00:06<00:16,  4.65it/s][A
Training:  26%|██▌       | 27/105 [00:06<00:15,  5.09it/s][A
Training:  28%|██▊       | 29/105 [00:07<00:16,  4.50it/s][A
Training:  29%|██▊       | 30/105 [00:07<00:17,  4.31it/s][A
Training:  30%|███       | 32/105 [00:07<00:12,  5.76it/s][A
Training:  31%|███▏ 

Epoch: 57/66 - Loss: 0.1322 - Accuracy: 0.9490



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:13,  1.01s/it][A
 14%|█▍        | 2/14 [00:01<00:06,  1.74it/s][A
 29%|██▊       | 4/14 [00:01<00:02,  3.81it/s][A
 36%|███▌      | 5/14 [00:01<00:02,  3.29it/s][A
 43%|████▎     | 6/14 [00:02<00:02,  3.29it/s][A
 50%|█████     | 7/14 [00:02<00:01,  3.80it/s][A
 64%|██████▍   | 9/14 [00:02<00:01,  4.23it/s][A
 71%|███████▏  | 10/14 [00:03<00:01,  3.95it/s][A
 79%|███████▊  | 11/14 [00:03<00:00,  4.28it/s][A
100%|██████████| 14/14 [00:03<00:00,  4.03it/s][A
Epochs:  86%|████████▋ | 57/66 [25:42<04:00, 26.72s/it]

Val Loss: 0.1421 - Val Accuracy: 0.9451



Training:   0%|          | 0/105 [00:00<?, ?it/s][A
Training:   1%|          | 1/105 [00:01<02:07,  1.23s/it][A
Training:   3%|▎         | 3/105 [00:01<00:37,  2.72it/s][A
Training:   5%|▍         | 5/105 [00:02<00:35,  2.80it/s][A
Training:   8%|▊         | 8/105 [00:02<00:18,  5.30it/s][A
Training:  10%|▉         | 10/105 [00:02<00:24,  3.91it/s][A
Training:  11%|█▏        | 12/105 [00:03<00:18,  4.95it/s][A
Training:  13%|█▎        | 14/105 [00:03<00:22,  4.10it/s][A
Training:  15%|█▌        | 16/105 [00:03<00:16,  5.38it/s][A
Training:  17%|█▋        | 18/105 [00:04<00:21,  4.13it/s][A
Training:  19%|█▉        | 20/105 [00:04<00:15,  5.41it/s][A
Training:  21%|██        | 22/105 [00:05<00:20,  3.96it/s][A
Training:  23%|██▎       | 24/105 [00:05<00:15,  5.21it/s][A
Training:  25%|██▍       | 26/105 [00:06<00:20,  3.78it/s][A
Training:  28%|██▊       | 29/105 [00:07<00:19,  3.94it/s][A
Training:  30%|██▉       | 31/105 [00:07<00:14,  5.03it/s][A
Training:  31%|███▏ 

Epoch: 58/66 - Loss: 0.1345 - Accuracy: 0.9473



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:14,  1.10s/it][A
 14%|█▍        | 2/14 [00:01<00:06,  1.74it/s][A
 36%|███▌      | 5/14 [00:01<00:02,  3.10it/s][A
 43%|████▎     | 6/14 [00:02<00:02,  3.45it/s][A
 64%|██████▍   | 9/14 [00:02<00:01,  3.87it/s][A
 71%|███████▏  | 10/14 [00:03<00:00,  4.08it/s][A
 79%|███████▊  | 11/14 [00:03<00:00,  4.56it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.75it/s][A
Epochs:  88%|████████▊ | 58/66 [26:09<03:33, 26.69s/it]

Val Loss: 0.1431 - Val Accuracy: 0.9446



Training:   0%|          | 0/105 [00:00<?, ?it/s][A
Training:   1%|          | 1/105 [00:01<02:16,  1.32s/it][A
Training:   4%|▍         | 4/105 [00:01<00:34,  2.90it/s][A
Training:   5%|▍         | 5/105 [00:02<00:38,  2.61it/s][A
Training:   8%|▊         | 8/105 [00:02<00:22,  4.37it/s][A
Training:   9%|▊         | 9/105 [00:02<00:27,  3.55it/s][A
Training:  10%|█         | 11/105 [00:03<00:19,  4.91it/s][A
Training:  11%|█▏        | 12/105 [00:03<00:18,  4.94it/s][A
Training:  12%|█▏        | 13/105 [00:03<00:29,  3.17it/s][A
Training:  16%|█▌        | 17/105 [00:04<00:23,  3.77it/s][A
Training:  18%|█▊        | 19/105 [00:04<00:17,  4.92it/s][A
Training:  20%|██        | 21/105 [00:05<00:21,  3.87it/s][A
Training:  22%|██▏       | 23/105 [00:05<00:16,  4.97it/s][A
Training:  24%|██▍       | 25/105 [00:06<00:19,  4.21it/s][A
Training:  27%|██▋       | 28/105 [00:06<00:13,  5.77it/s][A
Training:  28%|██▊       | 29/105 [00:07<00:18,  4.18it/s][A
Training:  30%|██▉   

Epoch: 59/66 - Loss: 0.1334 - Accuracy: 0.9483



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:18,  1.41s/it][A
 36%|███▌      | 5/14 [00:02<00:03,  2.72it/s][A
 50%|█████     | 7/14 [00:02<00:01,  4.02it/s][A
 64%|██████▍   | 9/14 [00:03<00:01,  3.35it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.64it/s][A
Epochs:  89%|████████▉ | 59/66 [26:35<03:06, 26.61s/it]

Val Loss: 0.1421 - Val Accuracy: 0.9451



Training:   0%|          | 0/105 [00:00<?, ?it/s][A
Training:   1%|          | 1/105 [00:01<01:57,  1.13s/it][A
Training:   3%|▎         | 3/105 [00:01<00:36,  2.78it/s][A
Training:   5%|▍         | 5/105 [00:02<00:36,  2.74it/s][A
Training:   7%|▋         | 7/105 [00:02<00:23,  4.15it/s][A
Training:   9%|▊         | 9/105 [00:03<00:29,  3.22it/s][A
Training:  10%|█         | 11/105 [00:03<00:22,  4.27it/s][A
Training:  12%|█▏        | 13/105 [00:04<00:27,  3.33it/s][A
Training:  14%|█▍        | 15/105 [00:04<00:19,  4.52it/s][A
Training:  16%|█▌        | 17/105 [00:05<00:25,  3.49it/s][A
Training:  18%|█▊        | 19/105 [00:05<00:18,  4.54it/s][A
Training:  20%|██        | 21/105 [00:05<00:22,  3.71it/s][A
Training:  23%|██▎       | 24/105 [00:06<00:14,  5.66it/s][A
Training:  25%|██▍       | 26/105 [00:06<00:19,  4.04it/s][A
Training:  28%|██▊       | 29/105 [00:07<00:19,  3.89it/s][A
Training:  30%|███       | 32/105 [00:07<00:13,  5.51it/s][A
Training:  32%|███▏  

Epoch: 60/66 - Loss: 0.1320 - Accuracy: 0.9487



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:16,  1.26s/it][A
 29%|██▊       | 4/14 [00:01<00:02,  3.43it/s][A
 36%|███▌      | 5/14 [00:02<00:03,  2.55it/s][A
 50%|█████     | 7/14 [00:02<00:01,  4.04it/s][A
 64%|██████▍   | 9/14 [00:02<00:01,  3.39it/s][A
 79%|███████▊  | 11/14 [00:03<00:00,  4.76it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.54it/s][A
Epochs:  91%|█████████ | 60/66 [27:03<02:41, 26.97s/it]

Val Loss: 0.1412 - Val Accuracy: 0.9462



Training:   0%|          | 0/105 [00:00<?, ?it/s][A
Training:   1%|          | 1/105 [00:01<01:50,  1.07s/it][A
Training:   2%|▏         | 2/105 [00:01<01:00,  1.70it/s][A
Training:   5%|▍         | 5/105 [00:02<00:32,  3.03it/s][A
Training:   6%|▌         | 6/105 [00:02<00:29,  3.36it/s][A
Training:   9%|▊         | 9/105 [00:02<00:25,  3.72it/s][A
Training:  10%|▉         | 10/105 [00:03<00:24,  3.87it/s][A
Training:  12%|█▏        | 13/105 [00:03<00:21,  4.27it/s][A
Training:  13%|█▎        | 14/105 [00:04<00:21,  4.25it/s][A
Training:  15%|█▌        | 16/105 [00:04<00:15,  5.74it/s][A
Training:  16%|█▌        | 17/105 [00:04<00:20,  4.30it/s][A
Training:  18%|█▊        | 19/105 [00:04<00:16,  5.17it/s][A
Training:  20%|██        | 21/105 [00:05<00:19,  4.39it/s][A
Training:  21%|██        | 22/105 [00:05<00:17,  4.72it/s][A
Training:  23%|██▎       | 24/105 [00:05<00:12,  6.30it/s][A
Training:  24%|██▍       | 25/105 [00:06<00:20,  3.92it/s][A
Training:  25%|██▍   

Epoch: 61/66 - Loss: 0.1321 - Accuracy: 0.9488



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:14,  1.08s/it][A
 14%|█▍        | 2/14 [00:01<00:06,  1.72it/s][A
 36%|███▌      | 5/14 [00:01<00:02,  3.07it/s][A
 43%|████▎     | 6/14 [00:02<00:02,  3.26it/s][A
 57%|█████▋    | 8/14 [00:02<00:01,  5.01it/s][A
 64%|██████▍   | 9/14 [00:02<00:01,  3.60it/s][A
 71%|███████▏  | 10/14 [00:03<00:01,  3.76it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.66it/s][A
Epochs:  92%|█████████▏| 61/66 [27:29<02:14, 26.81s/it]

Val Loss: 0.1418 - Val Accuracy: 0.9456



Training:   0%|          | 0/105 [00:00<?, ?it/s][A
Training:   1%|          | 1/105 [00:01<01:50,  1.06s/it][A
Training:   3%|▎         | 3/105 [00:01<00:32,  3.17it/s][A
Training:   5%|▍         | 5/105 [00:01<00:32,  3.07it/s][A
Training:   6%|▌         | 6/105 [00:01<00:26,  3.72it/s][A
Training:   8%|▊         | 8/105 [00:02<00:18,  5.37it/s][A
Training:   9%|▊         | 9/105 [00:02<00:28,  3.37it/s][A
Training:  10%|▉         | 10/105 [00:02<00:23,  4.02it/s][A
Training:  11%|█▏        | 12/105 [00:03<00:15,  5.83it/s][A
Training:  13%|█▎        | 14/105 [00:03<00:22,  4.09it/s][A
Training:  15%|█▌        | 16/105 [00:03<00:16,  5.52it/s][A
Training:  17%|█▋        | 18/105 [00:04<00:22,  3.95it/s][A
Training:  20%|██        | 21/105 [00:05<00:21,  3.89it/s][A
Training:  22%|██▏       | 23/105 [00:05<00:16,  5.00it/s][A
Training:  24%|██▍       | 25/105 [00:06<00:20,  3.83it/s][A
Training:  26%|██▌       | 27/105 [00:06<00:16,  4.68it/s][A
Training:  28%|██▊    

Epoch: 62/66 - Loss: 0.1324 - Accuracy: 0.9481



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:15,  1.22s/it][A
 29%|██▊       | 4/14 [00:01<00:02,  3.70it/s][A
 43%|████▎     | 6/14 [00:02<00:02,  3.14it/s][A
 64%|██████▍   | 9/14 [00:02<00:01,  3.35it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.78it/s][A
Epochs:  94%|█████████▍| 62/66 [27:56<01:47, 26.78s/it]

Val Loss: 0.1530 - Val Accuracy: 0.9154



Training:   0%|          | 0/105 [00:00<?, ?it/s][A
Training:   1%|          | 1/105 [00:01<02:06,  1.22s/it][A
Training:   3%|▎         | 3/105 [00:01<00:36,  2.82it/s][A
Training:   5%|▍         | 5/105 [00:02<00:41,  2.41it/s][A
Training:   7%|▋         | 7/105 [00:02<00:25,  3.81it/s][A
Training:   9%|▊         | 9/105 [00:03<00:30,  3.17it/s][A
Training:  10%|█         | 11/105 [00:03<00:20,  4.49it/s][A
Training:  12%|█▏        | 13/105 [00:04<00:24,  3.70it/s][A
Training:  15%|█▌        | 16/105 [00:04<00:15,  5.70it/s][A
Training:  17%|█▋        | 18/105 [00:04<00:19,  4.40it/s][A
Training:  20%|██        | 21/105 [00:05<00:20,  4.15it/s][A
Training:  22%|██▏       | 23/105 [00:05<00:15,  5.15it/s][A
Training:  24%|██▍       | 25/105 [00:06<00:19,  4.03it/s][A
Training:  26%|██▌       | 27/105 [00:06<00:15,  4.99it/s][A
Training:  28%|██▊       | 29/105 [00:07<00:18,  4.17it/s][A
Training:  30%|██▉       | 31/105 [00:07<00:13,  5.37it/s][A
Training:  31%|███▏  

Epoch: 63/66 - Loss: 0.1322 - Accuracy: 0.9487



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:15,  1.23s/it][A
 21%|██▏       | 3/14 [00:01<00:04,  2.73it/s][A
 36%|███▌      | 5/14 [00:02<00:03,  2.84it/s][A
 43%|████▎     | 6/14 [00:02<00:02,  3.26it/s][A
 64%|██████▍   | 9/14 [00:03<00:01,  3.40it/s][A
 71%|███████▏  | 10/14 [00:03<00:01,  3.79it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.65it/s][A
Epochs:  95%|█████████▌| 63/66 [28:22<01:19, 26.57s/it]

Val Loss: 0.1401 - Val Accuracy: 0.9462



Training:   0%|          | 0/105 [00:00<?, ?it/s][A
Training:   1%|          | 1/105 [00:01<02:16,  1.32s/it][A
Training:   4%|▍         | 4/105 [00:01<00:28,  3.50it/s][A
Training:   6%|▌         | 6/105 [00:02<00:35,  2.79it/s][A
Training:   8%|▊         | 8/105 [00:02<00:23,  4.10it/s][A
Training:  10%|▉         | 10/105 [00:03<00:28,  3.37it/s][A
Training:  12%|█▏        | 13/105 [00:04<00:26,  3.53it/s][A
Training:  15%|█▌        | 16/105 [00:04<00:16,  5.28it/s][A
Training:  17%|█▋        | 18/105 [00:04<00:21,  4.02it/s][A
Training:  20%|██        | 21/105 [00:05<00:21,  3.86it/s][A
Training:  22%|██▏       | 23/105 [00:05<00:17,  4.70it/s][A
Training:  24%|██▍       | 25/105 [00:06<00:22,  3.63it/s][A
Training:  28%|██▊       | 29/105 [00:07<00:18,  4.13it/s][A
Training:  30%|███       | 32/105 [00:07<00:12,  5.63it/s][A
Training:  32%|███▏      | 34/105 [00:08<00:16,  4.39it/s][A
Training:  34%|███▍      | 36/105 [00:08<00:12,  5.44it/s][A
Training:  36%|███▌ 

Epoch: 64/66 - Loss: 0.1313 - Accuracy: 0.9495



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:15,  1.19s/it][A
 21%|██▏       | 3/14 [00:01<00:03,  2.86it/s][A
 36%|███▌      | 5/14 [00:02<00:03,  2.65it/s][A
 50%|█████     | 7/14 [00:02<00:01,  4.15it/s][A
 64%|██████▍   | 9/14 [00:03<00:01,  3.35it/s][A
100%|██████████| 14/14 [00:04<00:00,  3.49it/s][A
Epochs:  97%|█████████▋| 64/66 [28:50<00:53, 26.92s/it]

Val Loss: 0.1539 - Val Accuracy: 0.9149



Training:   0%|          | 0/105 [00:00<?, ?it/s][A
Training:   1%|          | 1/105 [00:01<02:17,  1.33s/it][A
Training:   4%|▍         | 4/105 [00:01<00:28,  3.59it/s][A
Training:   6%|▌         | 6/105 [00:02<00:31,  3.13it/s][A
Training:   8%|▊         | 8/105 [00:02<00:21,  4.55it/s][A
Training:  10%|▉         | 10/105 [00:03<00:27,  3.49it/s][A
Training:  11%|█▏        | 12/105 [00:03<00:20,  4.64it/s][A
Training:  13%|█▎        | 14/105 [00:04<00:25,  3.50it/s][A
Training:  16%|█▌        | 17/105 [00:04<00:24,  3.58it/s][A
Training:  18%|█▊        | 19/105 [00:05<00:19,  4.51it/s][A
Training:  20%|██        | 21/105 [00:05<00:21,  3.86it/s][A
Training:  22%|██▏       | 23/105 [00:05<00:16,  4.83it/s][A
Training:  24%|██▍       | 25/105 [00:06<00:19,  4.11it/s][A
Training:  26%|██▌       | 27/105 [00:06<00:14,  5.22it/s][A
Training:  28%|██▊       | 29/105 [00:07<00:18,  4.17it/s][A
Training:  30%|██▉       | 31/105 [00:07<00:14,  5.19it/s][A
Training:  31%|███▏ 

Epoch: 65/66 - Loss: 0.1322 - Accuracy: 0.9493



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:17,  1.37s/it][A
 29%|██▊       | 4/14 [00:01<00:02,  3.50it/s][A
 43%|████▎     | 6/14 [00:02<00:02,  3.11it/s][A
 64%|██████▍   | 9/14 [00:03<00:01,  3.14it/s][A
 86%|████████▌ | 12/14 [00:03<00:00,  4.86it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.53it/s][A
Epochs:  98%|█████████▊| 65/66 [29:17<00:26, 26.97s/it]

Val Loss: 0.1422 - Val Accuracy: 0.9446



Training:   0%|          | 0/105 [00:00<?, ?it/s][A
Training:   1%|          | 1/105 [00:01<02:08,  1.24s/it][A
Training:   3%|▎         | 3/105 [00:01<00:36,  2.78it/s][A
Training:   5%|▍         | 5/105 [00:02<00:34,  2.88it/s][A
Training:   8%|▊         | 8/105 [00:02<00:18,  5.28it/s][A
Training:  10%|▉         | 10/105 [00:03<00:26,  3.55it/s][A
Training:  12%|█▏        | 13/105 [00:03<00:25,  3.62it/s][A
Training:  15%|█▌        | 16/105 [00:04<00:16,  5.37it/s][A
Training:  17%|█▋        | 18/105 [00:04<00:21,  4.08it/s][A
Training:  20%|██        | 21/105 [00:05<00:21,  3.94it/s][A
Training:  22%|██▏       | 23/105 [00:05<00:16,  4.94it/s][A
Training:  24%|██▍       | 25/105 [00:06<00:19,  4.04it/s][A
Training:  28%|██▊       | 29/105 [00:07<00:18,  4.11it/s][A
Training:  30%|██▉       | 31/105 [00:07<00:14,  5.01it/s][A
Training:  31%|███▏      | 33/105 [00:08<00:17,  4.01it/s][A
Training:  35%|███▌      | 37/105 [00:09<00:15,  4.45it/s][A
Training:  38%|███▊ 

Epoch: 66/66 - Loss: 0.1312 - Accuracy: 0.9494



  0%|          | 0/14 [00:00<?, ?it/s][A
  7%|▋         | 1/14 [00:01<00:16,  1.24s/it][A
 21%|██▏       | 3/14 [00:01<00:04,  2.72it/s][A
 36%|███▌      | 5/14 [00:02<00:03,  2.89it/s][A
 50%|█████     | 7/14 [00:02<00:01,  4.42it/s][A
 64%|██████▍   | 9/14 [00:02<00:01,  3.48it/s][A
 79%|███████▊  | 11/14 [00:03<00:00,  4.82it/s][A
100%|██████████| 14/14 [00:03<00:00,  3.76it/s][A
Epochs: 100%|██████████| 66/66 [29:43<00:00, 27.03s/it]


Val Loss: 0.1411 - Val Accuracy: 0.9451
Saving best model...


[32m[I 2023-12-15 00:21:41,388][0m Trial 4 finished with value: 0.9450960159301758 and parameters: {'learning_rate': 3.220616291387027e-05, 'weight_decay': 0.0010915949385844237, 'epsilon': 7.0510050620049406e-09, 'batch_size': 134, 'epochs': 66}. Best is trial 4 with value: 0.9450960159301758.[0m


Learning rate: 4.9359561612064165e-05
Weight decay: 0.0017282908819438848
Epsilon: 2.5803316647343055e-08
Batch size: 278
Number of epochs: 91


Epochs:   0%|          | 0/91 [00:00<?, ?it/s]
Training:   0%|          | 0/51 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/51 [00:02<01:47,  2.14s/it][A
Training:   6%|▌         | 3/51 [00:02<00:30,  1.59it/s][A
Training:  10%|▉         | 5/51 [00:04<00:35,  1.29it/s][A
Training:  12%|█▏        | 6/51 [00:04<00:27,  1.66it/s][A
Training:  18%|█▊        | 9/51 [00:06<00:25,  1.68it/s][A
Training:  22%|██▏       | 11/51 [00:06<00:16,  2.40it/s][A
Training:  25%|██▌       | 13/51 [00:07<00:21,  1.77it/s][A
Training:  29%|██▉       | 15/51 [00:08<00:14,  2.47it/s][A
Training:  33%|███▎      | 17/51 [00:09<00:16,  2.06it/s][A
Training:  37%|███▋      | 19/51 [00:09<00:11,  2.82it/s][A
Training:  41%|████      | 21/51 [00:11<00:16,  1.82it/s][A
Training:  45%|████▌     | 23/51 [00:11<00:11,  2.47it/s][A
Training:  49%|████▉     | 25/51 [00:13<00:13,  1.97it/s][A
Training:  53%|█████▎    | 27/51 [00:13<00:09,  2.62it/s][A
Training:  55%|█████▍    | 28/51 [00:13<00:07,  2.98

Epoch: 1/91 - Loss: 0.5873 - Accuracy: 0.7400



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:02<00:13,  2.27s/it][A
 29%|██▊       | 2/7 [00:02<00:05,  1.01s/it][A
 57%|█████▋    | 4/7 [00:02<00:01,  2.27it/s][A
 71%|███████▏  | 5/7 [00:04<00:01,  1.31it/s][A
100%|██████████| 7/7 [00:04<00:00,  1.62it/s][A
Epochs:   0%|          | 0/91 [00:27<?, ?it/s]
[32m[I 2023-12-15 00:22:09,526][0m Trial 5 pruned. [0m


Val Loss: 0.5016 - Val Accuracy: 0.8353
Learning rate: 9.224631812375132e-05
Weight decay: 0.009571773104112032
Epsilon: 4.371363667289597e-08
Batch size: 120
Number of epochs: 99


Epochs:   0%|          | 0/99 [00:00<?, ?it/s]
Training:   0%|          | 0/117 [00:00<?, ?it/s][A
Training:   1%|          | 1/117 [00:01<02:21,  1.22s/it][A
Training:   4%|▍         | 5/117 [00:01<00:38,  2.94it/s][A
Training:   6%|▌         | 7/117 [00:02<00:25,  4.28it/s][A
Training:   8%|▊         | 9/117 [00:02<00:28,  3.74it/s][A
Training:   9%|▊         | 10/117 [00:02<00:26,  4.06it/s][A
Training:  11%|█         | 13/117 [00:03<00:23,  4.45it/s][A
Training:  12%|█▏        | 14/117 [00:03<00:21,  4.72it/s][A
Training:  14%|█▎        | 16/117 [00:03<00:18,  5.56it/s][A
Training:  15%|█▍        | 17/117 [00:04<00:22,  4.41it/s][A
Training:  15%|█▌        | 18/117 [00:04<00:21,  4.63it/s][A
Training:  17%|█▋        | 20/117 [00:04<00:14,  6.50it/s][A
Training:  18%|█▊        | 21/117 [00:05<00:21,  4.55it/s][A
Training:  19%|█▉        | 22/117 [00:05<00:20,  4.68it/s][A
Training:  21%|██▏       | 25/117 [00:05<00:18,  4.93it/s][A
Training:  22%|██▏       | 26/117 [0

Epoch: 1/99 - Loss: 0.4651 - Accuracy: 0.8080



  0%|          | 0/15 [00:00<?, ?it/s][A
  7%|▋         | 1/15 [00:01<00:15,  1.11s/it][A
 27%|██▋       | 4/15 [00:01<00:02,  4.07it/s][A
 40%|████      | 6/15 [00:01<00:02,  3.43it/s][A
 60%|██████    | 9/15 [00:02<00:01,  3.91it/s][A
 67%|██████▋   | 10/15 [00:02<00:01,  4.33it/s][A
100%|██████████| 15/15 [00:03<00:00,  4.23it/s][A
Epochs:   0%|          | 0/99 [00:26<?, ?it/s]
[32m[I 2023-12-15 00:22:36,331][0m Trial 6 pruned. [0m


Val Loss: 0.3309 - Val Accuracy: 0.8895
Learning rate: 0.0032843110488633004
Weight decay: 0.0007127469704402247
Epsilon: 1.9878696237499133e-09
Batch size: 120
Number of epochs: 81


Epochs:   0%|          | 0/81 [00:00<?, ?it/s]
Training:   0%|          | 0/117 [00:00<?, ?it/s][A
Training:   1%|          | 1/117 [00:01<02:05,  1.08s/it][A
Training:   2%|▏         | 2/117 [00:01<00:58,  1.96it/s][A
Training:   4%|▍         | 5/117 [00:01<00:33,  3.36it/s][A
Training:   7%|▋         | 8/117 [00:01<00:18,  5.84it/s][A
Training:   9%|▊         | 10/117 [00:02<00:26,  4.11it/s][A
Training:  10%|█         | 12/117 [00:02<00:20,  5.25it/s][A
Training:  11%|█         | 13/117 [00:03<00:27,  3.79it/s][A
Training:  12%|█▏        | 14/117 [00:03<00:23,  4.30it/s][A
Training:  14%|█▎        | 16/117 [00:03<00:17,  5.89it/s][A
Training:  15%|█▌        | 18/117 [00:04<00:23,  4.21it/s][A
Training:  17%|█▋        | 20/117 [00:04<00:17,  5.66it/s][A
Training:  19%|█▉        | 22/117 [00:05<00:21,  4.35it/s][A
Training:  21%|██▏       | 25/117 [00:06<00:21,  4.19it/s][A
Training:  25%|██▍       | 29/117 [00:06<00:19,  4.59it/s][A
Training:  26%|██▋       | 31/117 [0

Epoch: 1/81 - Loss: 0.4739 - Accuracy: 0.8159



  0%|          | 0/15 [00:00<?, ?it/s][A
  7%|▋         | 1/15 [00:00<00:13,  1.02it/s][A
 13%|█▎        | 2/15 [00:01<00:06,  2.08it/s][A
 27%|██▋       | 4/15 [00:01<00:02,  4.64it/s][A
 40%|████      | 6/15 [00:01<00:02,  3.45it/s][A
 60%|██████    | 9/15 [00:02<00:01,  3.95it/s][A
 73%|███████▎  | 11/15 [00:02<00:00,  4.79it/s][A
 87%|████████▋ | 13/15 [00:03<00:00,  4.42it/s][A
100%|██████████| 15/15 [00:03<00:00,  4.21it/s][A
Epochs:   1%|          | 1/81 [00:26<35:29, 26.62s/it]

Val Loss: 0.2023 - Val Accuracy: 0.9133



Training:   0%|          | 0/117 [00:00<?, ?it/s][A
Training:   1%|          | 1/117 [00:01<02:15,  1.17s/it][A
Training:   2%|▏         | 2/117 [00:01<01:09,  1.65it/s][A
Training:   3%|▎         | 4/117 [00:01<00:29,  3.83it/s][A
Training:   4%|▍         | 5/117 [00:02<00:39,  2.84it/s][A
Training:   5%|▌         | 6/117 [00:02<00:30,  3.62it/s][A
Training:   8%|▊         | 9/117 [00:02<00:25,  4.32it/s][A
Training:   9%|▊         | 10/117 [00:03<00:26,  4.11it/s][A
Training:  10%|█         | 12/117 [00:03<00:18,  5.58it/s][A
Training:  11%|█         | 13/117 [00:03<00:21,  4.87it/s][A
Training:  12%|█▏        | 14/117 [00:03<00:27,  3.70it/s][A
Training:  15%|█▍        | 17/117 [00:04<00:18,  5.27it/s][A
Training:  15%|█▌        | 18/117 [00:04<00:25,  3.90it/s][A
Training:  17%|█▋        | 20/117 [00:04<00:18,  5.35it/s][A
Training:  18%|█▊        | 21/117 [00:05<00:18,  5.27it/s][A
Training:  19%|█▉        | 22/117 [00:05<00:23,  3.99it/s][A
Training:  21%|██▏    

Epoch: 2/81 - Loss: 0.1982 - Accuracy: 0.9179



  0%|          | 0/15 [00:00<?, ?it/s][A
  7%|▋         | 1/15 [00:00<00:13,  1.07it/s][A
 13%|█▎        | 2/15 [00:01<00:06,  2.12it/s][A
 33%|███▎      | 5/15 [00:01<00:02,  3.91it/s][A
 40%|████      | 6/15 [00:01<00:02,  4.12it/s][A
 60%|██████    | 9/15 [00:02<00:01,  5.20it/s][A
 67%|██████▋   | 10/15 [00:02<00:01,  4.63it/s][A
 87%|████████▋ | 13/15 [00:03<00:00,  5.34it/s][A
100%|██████████| 15/15 [00:03<00:00,  4.32it/s][A
Epochs:   2%|▏         | 2/81 [00:53<35:18, 26.81s/it]

Val Loss: 0.1744 - Val Accuracy: 0.9276



Training:   0%|          | 0/117 [00:00<?, ?it/s][A
Training:   1%|          | 1/117 [00:01<02:45,  1.43s/it][A
Training:   3%|▎         | 4/117 [00:01<00:33,  3.35it/s][A
Training:   5%|▌         | 6/117 [00:02<00:33,  3.28it/s][A
Training:   7%|▋         | 8/117 [00:02<00:23,  4.69it/s][A
Training:   9%|▊         | 10/117 [00:02<00:27,  3.83it/s][A
Training:  11%|█         | 13/117 [00:03<00:26,  3.96it/s][A
Training:  12%|█▏        | 14/117 [00:03<00:23,  4.39it/s][A
Training:  14%|█▎        | 16/117 [00:03<00:17,  5.85it/s][A
Training:  15%|█▌        | 18/117 [00:04<00:22,  4.38it/s][A
Training:  17%|█▋        | 20/117 [00:04<00:17,  5.63it/s][A
Training:  19%|█▉        | 22/117 [00:05<00:22,  4.16it/s][A
Training:  21%|██▏       | 25/117 [00:06<00:21,  4.21it/s][A
Training:  25%|██▍       | 29/117 [00:06<00:17,  4.95it/s][A
Training:  28%|██▊       | 33/117 [00:07<00:15,  5.37it/s][A
Training:  32%|███▏      | 37/117 [00:08<00:14,  5.58it/s][A
Training:  34%|███▍ 

Epoch: 3/81 - Loss: 0.1800 - Accuracy: 0.9239



  0%|          | 0/15 [00:00<?, ?it/s][A
  7%|▋         | 1/15 [00:01<00:17,  1.23s/it][A
 27%|██▋       | 4/15 [00:01<00:03,  3.66it/s][A
 40%|████      | 6/15 [00:02<00:02,  3.24it/s][A
 60%|██████    | 9/15 [00:02<00:01,  3.75it/s][A
 80%|████████  | 12/15 [00:02<00:00,  5.79it/s][A
100%|██████████| 15/15 [00:03<00:00,  4.27it/s][A
Epochs:   4%|▎         | 3/81 [01:19<34:16, 26.37s/it]

Val Loss: 0.1806 - Val Accuracy: 0.9247



Training:   0%|          | 0/117 [00:00<?, ?it/s][A
Training:   1%|          | 1/117 [00:01<02:42,  1.40s/it][A
Training:   3%|▎         | 3/117 [00:01<00:46,  2.44it/s][A
Training:   4%|▍         | 5/117 [00:02<00:42,  2.64it/s][A
Training:   6%|▌         | 7/117 [00:02<00:26,  4.17it/s][A
Training:   8%|▊         | 9/117 [00:02<00:26,  4.03it/s][A
Training:   9%|▉         | 11/117 [00:02<00:19,  5.56it/s][A
Training:  11%|█         | 13/117 [00:03<00:24,  4.24it/s][A
Training:  14%|█▎        | 16/117 [00:03<00:15,  6.41it/s][A
Training:  15%|█▌        | 18/117 [00:04<00:21,  4.60it/s][A
Training:  17%|█▋        | 20/117 [00:04<00:16,  5.82it/s][A
Training:  19%|█▉        | 22/117 [00:05<00:20,  4.58it/s][A
Training:  21%|██        | 24/117 [00:05<00:15,  5.90it/s][A
Training:  22%|██▏       | 26/117 [00:06<00:19,  4.60it/s][A
Training:  25%|██▍       | 29/117 [00:06<00:19,  4.51it/s][A
Training:  26%|██▋       | 31/117 [00:06<00:15,  5.67it/s][A
Training:  28%|██▊   

Epoch: 4/81 - Loss: 0.1709 - Accuracy: 0.9308



  0%|          | 0/15 [00:00<?, ?it/s][A
  7%|▋         | 1/15 [00:01<00:14,  1.00s/it][A
 27%|██▋       | 4/15 [00:01<00:02,  4.10it/s][A
 33%|███▎      | 5/15 [00:01<00:03,  2.76it/s][A
 47%|████▋     | 7/15 [00:02<00:01,  4.40it/s][A
 60%|██████    | 9/15 [00:02<00:01,  3.59it/s][A
 80%|████████  | 12/15 [00:02<00:00,  5.82it/s][A
100%|██████████| 15/15 [00:03<00:00,  4.35it/s][A
Epochs:   5%|▍         | 4/81 [01:46<34:05, 26.56s/it]

Val Loss: 0.1637 - Val Accuracy: 0.9326



Training:   0%|          | 0/117 [00:00<?, ?it/s][A
Training:   1%|          | 1/117 [00:00<01:50,  1.05it/s][A
Training:   3%|▎         | 3/117 [00:01<00:36,  3.09it/s][A
Training:   4%|▍         | 5/117 [00:01<00:35,  3.14it/s][A
Training:   6%|▌         | 7/117 [00:01<00:23,  4.77it/s][A
Training:   8%|▊         | 9/117 [00:02<00:27,  3.98it/s][A
Training:   9%|▉         | 11/117 [00:02<00:19,  5.33it/s][A
Training:  11%|█         | 13/117 [00:03<00:25,  4.06it/s][A
Training:  15%|█▍        | 17/117 [00:04<00:21,  4.66it/s][A
Training:  16%|█▌        | 19/117 [00:04<00:18,  5.26it/s][A
Training:  18%|█▊        | 21/117 [00:04<00:19,  4.86it/s][A
Training:  20%|█▉        | 23/117 [00:05<00:18,  5.18it/s][A
Training:  21%|██▏       | 25/117 [00:05<00:20,  4.50it/s][A
Training:  23%|██▎       | 27/117 [00:06<00:17,  5.20it/s][A
Training:  25%|██▍       | 29/117 [00:06<00:18,  4.80it/s][A
Training:  26%|██▋       | 31/117 [00:06<00:15,  5.63it/s][A
Training:  28%|██▊   

Epoch: 5/81 - Loss: 0.1671 - Accuracy: 0.9332



  0%|          | 0/15 [00:00<?, ?it/s][A
  7%|▋         | 1/15 [00:00<00:13,  1.07it/s][A
 20%|██        | 3/15 [00:01<00:03,  3.44it/s][A
 33%|███▎      | 5/15 [00:01<00:03,  3.27it/s][A
 47%|████▋     | 7/15 [00:01<00:01,  4.84it/s][A
 60%|██████    | 9/15 [00:02<00:01,  4.12it/s][A
 73%|███████▎  | 11/15 [00:02<00:00,  5.15it/s][A
100%|██████████| 15/15 [00:03<00:00,  4.38it/s][A
Epochs:   6%|▌         | 5/81 [02:13<33:46, 26.67s/it]

Val Loss: 0.1624 - Val Accuracy: 0.9298



Training:   0%|          | 0/117 [00:00<?, ?it/s][A
Training:   1%|          | 1/117 [00:01<01:59,  1.03s/it][A
Training:   2%|▏         | 2/117 [00:01<00:55,  2.07it/s][A
Training:   3%|▎         | 4/117 [00:01<00:26,  4.31it/s][A
Training:   4%|▍         | 5/117 [00:01<00:38,  2.94it/s][A
Training:   7%|▋         | 8/117 [00:02<00:18,  5.87it/s][A
Training:   9%|▊         | 10/117 [00:02<00:24,  4.38it/s][A
Training:  10%|█         | 12/117 [00:02<00:17,  5.88it/s][A
Training:  12%|█▏        | 14/117 [00:03<00:23,  4.30it/s][A
Training:  15%|█▍        | 17/117 [00:04<00:22,  4.50it/s][A
Training:  17%|█▋        | 20/117 [00:04<00:15,  6.21it/s][A
Training:  19%|█▉        | 22/117 [00:04<00:19,  4.79it/s][A
Training:  21%|██        | 24/117 [00:05<00:15,  5.85it/s][A
Training:  22%|██▏       | 26/117 [00:05<00:19,  4.78it/s][A
Training:  24%|██▍       | 28/117 [00:05<00:15,  5.57it/s][A
Training:  25%|██▍       | 29/117 [00:06<00:21,  4.05it/s][A
Training:  26%|██▋   

Epoch: 6/81 - Loss: 0.1649 - Accuracy: 0.9342



  0%|          | 0/15 [00:00<?, ?it/s][A
  7%|▋         | 1/15 [00:01<00:15,  1.12s/it][A
 20%|██        | 3/15 [00:01<00:04,  2.69it/s][A
 33%|███▎      | 5/15 [00:01<00:03,  3.03it/s][A
 53%|█████▎    | 8/15 [00:02<00:01,  5.69it/s][A
 67%|██████▋   | 10/15 [00:02<00:01,  4.35it/s][A
 80%|████████  | 12/15 [00:02<00:00,  5.80it/s][A
100%|██████████| 15/15 [00:03<00:00,  4.38it/s][A
Epochs:   7%|▋         | 6/81 [02:40<33:28, 26.78s/it]

Val Loss: 0.1614 - Val Accuracy: 0.9287



Training:   0%|          | 0/117 [00:00<?, ?it/s][A
Training:   1%|          | 1/117 [00:01<02:15,  1.17s/it][A
Training:   3%|▎         | 3/117 [00:01<00:39,  2.85it/s][A
Training:   4%|▍         | 5/117 [00:01<00:38,  2.91it/s][A
Training:   7%|▋         | 8/117 [00:02<00:20,  5.23it/s][A
Training:   9%|▊         | 10/117 [00:02<00:26,  4.01it/s][A
Training:  11%|█         | 13/117 [00:03<00:24,  4.19it/s][A
Training:  15%|█▍        | 17/117 [00:04<00:21,  4.76it/s][A
Training:  17%|█▋        | 20/117 [00:04<00:15,  6.15it/s][A
Training:  18%|█▊        | 21/117 [00:05<00:21,  4.54it/s][A
Training:  21%|██        | 24/117 [00:05<00:14,  6.34it/s][A
Training:  22%|██▏       | 26/117 [00:05<00:17,  5.15it/s][A
Training:  24%|██▍       | 28/117 [00:05<00:14,  6.20it/s][A
Training:  26%|██▌       | 30/117 [00:06<00:18,  4.80it/s][A
Training:  27%|██▋       | 32/117 [00:06<00:15,  5.65it/s][A
Training:  28%|██▊       | 33/117 [00:07<00:19,  4.39it/s][A
Training:  31%|███  

Epoch: 7/81 - Loss: 0.1618 - Accuracy: 0.9361



  0%|          | 0/15 [00:00<?, ?it/s][A
  7%|▋         | 1/15 [00:01<00:15,  1.08s/it][A
 13%|█▎        | 2/15 [00:01<00:06,  1.95it/s][A
 33%|███▎      | 5/15 [00:01<00:02,  3.41it/s][A
 40%|████      | 6/15 [00:01<00:02,  3.82it/s][A
 60%|██████    | 9/15 [00:02<00:01,  4.50it/s][A
 67%|██████▋   | 10/15 [00:02<00:01,  4.46it/s][A
 87%|████████▋ | 13/15 [00:03<00:00,  5.09it/s][A
100%|██████████| 15/15 [00:03<00:00,  4.21it/s][A
Epochs:   9%|▊         | 7/81 [03:06<32:46, 26.57s/it]

Val Loss: 0.1824 - Val Accuracy: 0.9177



Training:   0%|          | 0/117 [00:00<?, ?it/s][A
Training:   1%|          | 1/117 [00:01<01:55,  1.01it/s][A
Training:   4%|▍         | 5/117 [00:01<00:31,  3.50it/s][A
Training:   7%|▋         | 8/117 [00:01<00:20,  5.38it/s][A
Training:   8%|▊         | 9/117 [00:02<00:28,  3.77it/s][A
Training:   9%|▉         | 11/117 [00:02<00:20,  5.18it/s][A
Training:  11%|█         | 13/117 [00:03<00:25,  4.07it/s][A
Training:  15%|█▍        | 17/117 [00:04<00:21,  4.61it/s][A
Training:  17%|█▋        | 20/117 [00:04<00:16,  6.02it/s][A
Training:  18%|█▊        | 21/117 [00:04<00:19,  4.88it/s][A
Training:  21%|██        | 24/117 [00:05<00:15,  6.03it/s][A
Training:  21%|██▏       | 25/117 [00:05<00:17,  5.19it/s][A
Training:  23%|██▎       | 27/117 [00:05<00:13,  6.62it/s][A
Training:  24%|██▍       | 28/117 [00:05<00:15,  5.70it/s][A
Training:  25%|██▍       | 29/117 [00:06<00:20,  4.36it/s][A
Training:  26%|██▌       | 30/117 [00:06<00:17,  4.90it/s][A
Training:  27%|██▋  

Epoch: 8/81 - Loss: 0.1554 - Accuracy: 0.9383



  0%|          | 0/15 [00:00<?, ?it/s][A
  7%|▋         | 1/15 [00:01<00:14,  1.07s/it][A
 33%|███▎      | 5/15 [00:01<00:03,  3.09it/s][A
 47%|████▋     | 7/15 [00:01<00:01,  4.40it/s][A
 60%|██████    | 9/15 [00:02<00:01,  3.82it/s][A
 80%|████████  | 12/15 [00:02<00:00,  5.96it/s][A
100%|██████████| 15/15 [00:03<00:00,  4.19it/s][A
Epochs:  10%|▉         | 8/81 [03:32<32:17, 26.54s/it]

Val Loss: 0.1647 - Val Accuracy: 0.9330



Training:   0%|          | 0/117 [00:00<?, ?it/s][A
Training:   1%|          | 1/117 [00:01<02:11,  1.13s/it][A
Training:   4%|▍         | 5/117 [00:01<00:37,  2.97it/s][A
Training:   8%|▊         | 9/117 [00:02<00:27,  3.98it/s][A
Training:  10%|█         | 12/117 [00:02<00:18,  5.72it/s][A
Training:  12%|█▏        | 14/117 [00:03<00:20,  5.00it/s][A
Training:  14%|█▎        | 16/117 [00:03<00:16,  5.99it/s][A
Training:  15%|█▌        | 18/117 [00:04<00:21,  4.69it/s][A
Training:  18%|█▊        | 21/117 [00:04<00:22,  4.36it/s][A
Training:  21%|██▏       | 25/117 [00:05<00:19,  4.80it/s][A
Training:  23%|██▎       | 27/117 [00:05<00:15,  5.76it/s][A
Training:  25%|██▍       | 29/117 [00:06<00:18,  4.88it/s][A
Training:  26%|██▋       | 31/117 [00:06<00:14,  6.05it/s][A
Training:  28%|██▊       | 33/117 [00:07<00:17,  4.90it/s][A
Training:  31%|███       | 36/117 [00:07<00:13,  6.06it/s][A
Training:  32%|███▏      | 37/117 [00:07<00:16,  4.90it/s][A
Training:  33%|███▎

Epoch: 9/81 - Loss: 0.1567 - Accuracy: 0.9363



  0%|          | 0/15 [00:00<?, ?it/s][A
  7%|▋         | 1/15 [00:01<00:15,  1.09s/it][A
 20%|██        | 3/15 [00:01<00:03,  3.11it/s][A
 33%|███▎      | 5/15 [00:01<00:03,  3.11it/s][A
 60%|██████    | 9/15 [00:02<00:01,  4.15it/s][A
 80%|████████  | 12/15 [00:02<00:00,  6.18it/s][A
100%|██████████| 15/15 [00:03<00:00,  4.17it/s][A
Epochs:  11%|█         | 9/81 [03:59<31:50, 26.54s/it]

Val Loss: 0.1633 - Val Accuracy: 0.9330



Training:   0%|          | 0/117 [00:00<?, ?it/s][A
Training:   1%|          | 1/117 [00:01<02:00,  1.04s/it][A
Training:   2%|▏         | 2/117 [00:01<01:08,  1.69it/s][A
Training:   4%|▍         | 5/117 [00:01<00:28,  3.90it/s][A
Training:   5%|▌         | 6/117 [00:01<00:29,  3.74it/s][A
Training:   7%|▋         | 8/117 [00:02<00:19,  5.66it/s][A
Training:   8%|▊         | 9/117 [00:02<00:22,  4.89it/s][A
Training:   9%|▊         | 10/117 [00:02<00:25,  4.16it/s][A
Training:   9%|▉         | 11/117 [00:02<00:23,  4.49it/s][A
Training:  11%|█         | 13/117 [00:03<00:17,  5.84it/s][A
Training:  12%|█▏        | 14/117 [00:03<00:23,  4.38it/s][A
Training:  14%|█▎        | 16/117 [00:03<00:16,  6.23it/s][A
Training:  15%|█▍        | 17/117 [00:03<00:15,  6.54it/s][A
Training:  15%|█▌        | 18/117 [00:04<00:23,  4.21it/s][A
Training:  18%|█▊        | 21/117 [00:04<00:14,  6.59it/s][A
Training:  19%|█▉        | 22/117 [00:04<00:19,  4.85it/s][A
Training:  21%|██     

Epoch: 10/81 - Loss: 0.1570 - Accuracy: 0.9344



  0%|          | 0/15 [00:00<?, ?it/s][A
  7%|▋         | 1/15 [00:01<00:14,  1.06s/it][A
 13%|█▎        | 2/15 [00:01<00:06,  1.97it/s][A
 20%|██        | 3/15 [00:01<00:03,  3.03it/s][A
 33%|███▎      | 5/15 [00:02<00:03,  2.89it/s][A
 47%|████▋     | 7/15 [00:02<00:01,  4.09it/s][A
 60%|██████    | 9/15 [00:02<00:01,  3.83it/s][A
 73%|███████▎  | 11/15 [00:03<00:00,  4.63it/s][A
100%|██████████| 15/15 [00:03<00:00,  4.09it/s][A
Epochs:  12%|█▏        | 10/81 [04:25<31:23, 26.53s/it]

Val Loss: 0.1748 - Val Accuracy: 0.9274



Training:   0%|          | 0/117 [00:00<?, ?it/s][A
Training:   1%|          | 1/117 [00:01<02:33,  1.32s/it][A
Training:   3%|▎         | 3/117 [00:01<00:43,  2.63it/s][A
Training:   4%|▍         | 5/117 [00:02<00:39,  2.82it/s][A
Training:   8%|▊         | 9/117 [00:02<00:29,  3.72it/s][A
Training:  11%|█         | 13/117 [00:03<00:24,  4.25it/s][A
Training:  14%|█▎        | 16/117 [00:03<00:17,  5.79it/s][A
Training:  15%|█▌        | 18/117 [00:04<00:21,  4.53it/s][A
Training:  17%|█▋        | 20/117 [00:04<00:17,  5.40it/s][A
Training:  18%|█▊        | 21/117 [00:05<00:23,  4.16it/s][A
Training:  20%|█▉        | 23/117 [00:05<00:17,  5.45it/s][A
Training:  21%|██▏       | 25/117 [00:06<00:20,  4.59it/s][A
Training:  25%|██▍       | 29/117 [00:06<00:16,  5.30it/s][A
Training:  26%|██▋       | 31/117 [00:06<00:14,  5.99it/s][A
Training:  28%|██▊       | 33/117 [00:07<00:15,  5.31it/s][A
Training:  30%|██▉       | 35/117 [00:07<00:13,  6.19it/s][A
Training:  32%|███▏ 

Epoch: 11/81 - Loss: 0.1550 - Accuracy: 0.9381



  0%|          | 0/15 [00:00<?, ?it/s][A
  7%|▋         | 1/15 [00:01<00:14,  1.03s/it][A
 20%|██        | 3/15 [00:01<00:03,  3.23it/s][A
 33%|███▎      | 5/15 [00:01<00:03,  2.86it/s][A
 53%|█████▎    | 8/15 [00:02<00:01,  5.29it/s][A
 67%|██████▋   | 10/15 [00:02<00:01,  4.11it/s][A
100%|██████████| 15/15 [00:03<00:00,  4.15it/s][A
Epochs:  14%|█▎        | 11/81 [04:52<30:53, 26.48s/it]

Val Loss: 0.1538 - Val Accuracy: 0.9358



Training:   0%|          | 0/117 [00:00<?, ?it/s][A
Training:   1%|          | 1/117 [00:00<01:50,  1.05it/s][A
Training:   2%|▏         | 2/117 [00:01<01:01,  1.86it/s][A
Training:   3%|▎         | 4/117 [00:01<00:26,  4.19it/s][A
Training:   4%|▍         | 5/117 [00:01<00:33,  3.33it/s][A
Training:   5%|▌         | 6/117 [00:01<00:27,  4.00it/s][A
Training:   7%|▋         | 8/117 [00:02<00:18,  6.04it/s][A
Training:   8%|▊         | 9/117 [00:02<00:33,  3.21it/s][A
Training:  11%|█         | 13/117 [00:03<00:24,  4.27it/s][A
Training:  13%|█▎        | 15/117 [00:03<00:18,  5.55it/s][A
Training:  15%|█▍        | 17/117 [00:04<00:24,  4.05it/s][A
Training:  17%|█▋        | 20/117 [00:04<00:16,  5.93it/s][A
Training:  19%|█▉        | 22/117 [00:05<00:19,  4.76it/s][A
Training:  20%|█▉        | 23/117 [00:05<00:18,  5.15it/s][A
Training:  21%|██▏       | 25/117 [00:05<00:22,  4.14it/s][A
Training:  24%|██▍       | 28/117 [00:06<00:14,  6.16it/s][A
Training:  26%|██▌     

Epoch: 12/81 - Loss: 0.1469 - Accuracy: 0.9411



  0%|          | 0/15 [00:00<?, ?it/s][A
  7%|▋         | 1/15 [00:00<00:13,  1.04it/s][A
 20%|██        | 3/15 [00:01<00:03,  3.45it/s][A
 33%|███▎      | 5/15 [00:01<00:03,  3.13it/s][A
 47%|████▋     | 7/15 [00:01<00:01,  4.84it/s][A
 60%|██████    | 9/15 [00:02<00:01,  3.68it/s][A
100%|██████████| 15/15 [00:03<00:00,  4.28it/s][A
Epochs:  15%|█▍        | 12/81 [05:18<30:31, 26.55s/it]

Val Loss: 0.1476 - Val Accuracy: 0.9397



Training:   0%|          | 0/117 [00:00<?, ?it/s][A
Training:   1%|          | 1/117 [00:01<02:21,  1.22s/it][A
Training:   2%|▏         | 2/117 [00:01<01:09,  1.66it/s][A
Training:   4%|▍         | 5/117 [00:01<00:31,  3.52it/s][A
Training:   5%|▌         | 6/117 [00:02<00:28,  3.89it/s][A
Training:   7%|▋         | 8/117 [00:02<00:18,  5.74it/s][A
Training:   8%|▊         | 9/117 [00:02<00:30,  3.55it/s][A
Training:   9%|▉         | 11/117 [00:02<00:21,  5.03it/s][A
Training:  11%|█         | 13/117 [00:03<00:27,  3.78it/s][A
Training:  13%|█▎        | 15/117 [00:03<00:20,  4.96it/s][A
Training:  15%|█▍        | 17/117 [00:04<00:22,  4.37it/s][A
Training:  15%|█▌        | 18/117 [00:04<00:21,  4.64it/s][A
Training:  17%|█▋        | 20/117 [00:04<00:15,  6.35it/s][A
Training:  19%|█▉        | 22/117 [00:05<00:21,  4.50it/s][A
Training:  21%|██        | 24/117 [00:05<00:15,  5.89it/s][A
Training:  22%|██▏       | 26/117 [00:06<00:21,  4.31it/s][A
Training:  23%|██▎    

Epoch: 13/81 - Loss: 0.1517 - Accuracy: 0.9389



  0%|          | 0/15 [00:00<?, ?it/s][A
  7%|▋         | 1/15 [00:01<00:15,  1.11s/it][A
 20%|██        | 3/15 [00:01<00:04,  2.92it/s][A
 33%|███▎      | 5/15 [00:01<00:03,  3.05it/s][A
 47%|████▋     | 7/15 [00:02<00:01,  4.56it/s][A
 60%|██████    | 9/15 [00:02<00:01,  3.91it/s][A
 67%|██████▋   | 10/15 [00:02<00:01,  4.45it/s][A
 73%|███████▎  | 11/15 [00:02<00:00,  4.97it/s][A
 87%|████████▋ | 13/15 [00:03<00:00,  4.60it/s][A
100%|██████████| 15/15 [00:03<00:00,  4.23it/s][A
Epochs:  16%|█▌        | 13/81 [05:45<30:07, 26.58s/it]

Val Loss: 0.1435 - Val Accuracy: 0.9386



Training:   0%|          | 0/117 [00:00<?, ?it/s][A
Training:   1%|          | 1/117 [00:00<01:52,  1.04it/s][A
Training:   2%|▏         | 2/117 [00:01<00:55,  2.07it/s][A
Training:   3%|▎         | 3/117 [00:01<00:35,  3.19it/s][A
Training:   4%|▍         | 5/117 [00:01<00:33,  3.35it/s][A
Training:   5%|▌         | 6/117 [00:01<00:28,  3.95it/s][A
Training:   7%|▋         | 8/117 [00:02<00:18,  5.93it/s][A
Training:   8%|▊         | 9/117 [00:02<00:27,  3.88it/s][A
Training:   9%|▊         | 10/117 [00:02<00:24,  4.31it/s][A
Training:   9%|▉         | 11/117 [00:02<00:21,  4.90it/s][A
Training:  11%|█         | 13/117 [00:03<00:24,  4.17it/s][A
Training:  13%|█▎        | 15/117 [00:03<00:18,  5.57it/s][A
Training:  15%|█▍        | 17/117 [00:04<00:19,  5.13it/s][A
Training:  15%|█▌        | 18/117 [00:04<00:18,  5.47it/s][A
Training:  16%|█▌        | 19/117 [00:04<00:19,  4.96it/s][A
Training:  18%|█▊        | 21/117 [00:04<00:20,  4.78it/s][A
Training:  19%|█▉      

Epoch: 14/81 - Loss: 0.1433 - Accuracy: 0.9424



  0%|          | 0/15 [00:00<?, ?it/s][A
  7%|▋         | 1/15 [00:01<00:14,  1.01s/it][A
 20%|██        | 3/15 [00:01<00:03,  3.22it/s][A
 33%|███▎      | 5/15 [00:01<00:03,  2.85it/s][A
 47%|████▋     | 7/15 [00:02<00:01,  4.48it/s][A
 60%|██████    | 9/15 [00:02<00:01,  3.82it/s][A
 80%|████████  | 12/15 [00:02<00:00,  5.33it/s][A
 87%|████████▋ | 13/15 [00:03<00:00,  4.73it/s][A
100%|██████████| 15/15 [00:03<00:00,  4.28it/s][A
Epochs:  17%|█▋        | 14/81 [06:11<29:34, 26.49s/it]

Val Loss: 0.1365 - Val Accuracy: 0.9424



Training:   0%|          | 0/117 [00:00<?, ?it/s][A
Training:   1%|          | 1/117 [00:01<02:06,  1.09s/it][A
Training:   3%|▎         | 4/117 [00:01<00:27,  4.09it/s][A
Training:   5%|▌         | 6/117 [00:02<00:34,  3.26it/s][A
Training:   7%|▋         | 8/117 [00:02<00:23,  4.68it/s][A
Training:   9%|▊         | 10/117 [00:02<00:28,  3.73it/s][A
Training:  11%|█         | 13/117 [00:03<00:26,  3.91it/s][A
Training:  13%|█▎        | 15/117 [00:03<00:20,  4.96it/s][A
Training:  15%|█▍        | 17/117 [00:04<00:23,  4.32it/s][A
Training:  17%|█▋        | 20/117 [00:04<00:15,  6.45it/s][A
Training:  19%|█▉        | 22/117 [00:05<00:19,  4.92it/s][A
Training:  21%|██▏       | 25/117 [00:05<00:20,  4.55it/s][A
Training:  23%|██▎       | 27/117 [00:05<00:16,  5.55it/s][A
Training:  25%|██▍       | 29/117 [00:06<00:19,  4.57it/s][A
Training:  26%|██▋       | 31/117 [00:06<00:15,  5.43it/s][A
Training:  28%|██▊       | 33/117 [00:07<00:18,  4.54it/s][A
Training:  30%|██▉  

Epoch: 15/81 - Loss: 0.1479 - Accuracy: 0.9433



  0%|          | 0/15 [00:00<?, ?it/s][A
  7%|▋         | 1/15 [00:01<00:15,  1.10s/it][A
 20%|██        | 3/15 [00:01<00:03,  3.01it/s][A
 33%|███▎      | 5/15 [00:01<00:03,  3.01it/s][A
 53%|█████▎    | 8/15 [00:02<00:01,  5.43it/s][A
 67%|██████▋   | 10/15 [00:02<00:01,  3.92it/s][A
 87%|████████▋ | 13/15 [00:03<00:00,  4.15it/s][A
100%|██████████| 15/15 [00:03<00:00,  4.10it/s][A
Epochs:  19%|█▊        | 15/81 [06:37<28:58, 26.35s/it]

Val Loss: 0.1389 - Val Accuracy: 0.9418



Training:   0%|          | 0/117 [00:00<?, ?it/s][A
Training:   1%|          | 1/117 [00:01<02:15,  1.17s/it][A
Training:   3%|▎         | 4/117 [00:01<00:28,  3.98it/s][A
Training:   5%|▌         | 6/117 [00:02<00:34,  3.19it/s][A
Training:   7%|▋         | 8/117 [00:02<00:23,  4.62it/s][A
Training:   9%|▊         | 10/117 [00:03<00:30,  3.52it/s][A
Training:  10%|█         | 12/117 [00:03<00:21,  4.82it/s][A
Training:  12%|█▏        | 14/117 [00:03<00:25,  4.00it/s][A
Training:  14%|█▎        | 16/117 [00:03<00:19,  5.17it/s][A
Training:  15%|█▌        | 18/117 [00:04<00:22,  4.40it/s][A
Training:  17%|█▋        | 20/117 [00:04<00:17,  5.46it/s][A
Training:  18%|█▊        | 21/117 [00:05<00:24,  3.94it/s][A
Training:  21%|██        | 24/117 [00:05<00:16,  5.54it/s][A
Training:  21%|██▏       | 25/117 [00:06<00:22,  4.01it/s][A
Training:  24%|██▍       | 28/117 [00:06<00:14,  6.07it/s][A
Training:  26%|██▌       | 30/117 [00:06<00:17,  4.99it/s][A
Training:  27%|██▋  

Epoch: 16/81 - Loss: 0.1564 - Accuracy: 0.9363



  0%|          | 0/15 [00:00<?, ?it/s][A
  7%|▋         | 1/15 [00:01<00:15,  1.12s/it][A
 13%|█▎        | 2/15 [00:01<00:06,  1.90it/s][A
 33%|███▎      | 5/15 [00:01<00:02,  3.46it/s][A
 40%|████      | 6/15 [00:01<00:02,  4.00it/s][A
 60%|██████    | 9/15 [00:02<00:01,  4.21it/s][A
 87%|████████▋ | 13/15 [00:03<00:00,  5.24it/s][A
100%|██████████| 15/15 [00:03<00:00,  4.43it/s][A
Epochs:  20%|█▉        | 16/81 [07:04<28:33, 26.36s/it]

Val Loss: 0.1729 - Val Accuracy: 0.9375



Training:   0%|          | 0/117 [00:00<?, ?it/s][A
Training:   1%|          | 1/117 [00:01<02:27,  1.27s/it][A
Training:   2%|▏         | 2/117 [00:01<01:08,  1.67it/s][A
Training:   4%|▍         | 5/117 [00:02<00:36,  3.04it/s][A
Training:   6%|▌         | 7/117 [00:02<00:24,  4.56it/s][A
Training:   8%|▊         | 9/117 [00:02<00:25,  4.23it/s][A
Training:  10%|█         | 12/117 [00:02<00:16,  6.48it/s][A
Training:  12%|█▏        | 14/117 [00:03<00:21,  4.82it/s][A
Training:  15%|█▍        | 17/117 [00:04<00:21,  4.66it/s][A
Training:  17%|█▋        | 20/117 [00:04<00:15,  6.08it/s][A
Training:  18%|█▊        | 21/117 [00:05<00:22,  4.25it/s][A
Training:  21%|██        | 24/117 [00:05<00:15,  6.09it/s][A
Training:  22%|██▏       | 26/117 [00:06<00:20,  4.42it/s][A
Training:  24%|██▍       | 28/117 [00:06<00:15,  5.60it/s][A
Training:  26%|██▌       | 30/117 [00:06<00:20,  4.33it/s][A
Training:  28%|██▊       | 33/117 [00:07<00:18,  4.54it/s][A
Training:  30%|██▉   

Epoch: 17/81 - Loss: 0.1498 - Accuracy: 0.9394



  0%|          | 0/15 [00:00<?, ?it/s][A
  7%|▋         | 1/15 [00:01<00:15,  1.12s/it][A
 13%|█▎        | 2/15 [00:01<00:07,  1.74it/s][A
 33%|███▎      | 5/15 [00:01<00:03,  3.25it/s][A
 40%|████      | 6/15 [00:02<00:02,  3.50it/s][A
 60%|██████    | 9/15 [00:02<00:01,  4.23it/s][A
 67%|██████▋   | 10/15 [00:03<00:01,  4.01it/s][A
 87%|████████▋ | 13/15 [00:03<00:00,  4.74it/s][A
100%|██████████| 15/15 [00:03<00:00,  4.04it/s][A
Epochs:  21%|██        | 17/81 [07:30<28:04, 26.32s/it]

Val Loss: 0.1422 - Val Accuracy: 0.9424



Training:   0%|          | 0/117 [00:00<?, ?it/s][A
Training:   1%|          | 1/117 [00:01<02:13,  1.15s/it][A
Training:   3%|▎         | 3/117 [00:01<00:38,  2.98it/s][A
Training:   4%|▍         | 5/117 [00:02<00:41,  2.68it/s][A
Training:   6%|▌         | 7/117 [00:02<00:26,  4.19it/s][A
Training:   8%|▊         | 9/117 [00:02<00:31,  3.45it/s][A
Training:   9%|▉         | 11/117 [00:03<00:22,  4.74it/s][A
Training:  11%|█         | 13/117 [00:03<00:25,  4.13it/s][A
Training:  13%|█▎        | 15/117 [00:03<00:18,  5.49it/s][A
Training:  15%|█▍        | 17/117 [00:04<00:22,  4.39it/s][A
Training:  17%|█▋        | 20/117 [00:04<00:14,  6.70it/s][A
Training:  19%|█▉        | 22/117 [00:05<00:20,  4.68it/s][A
Training:  21%|██▏       | 25/117 [00:06<00:21,  4.29it/s][A
Training:  23%|██▎       | 27/117 [00:06<00:16,  5.39it/s][A
Training:  25%|██▍       | 29/117 [00:06<00:20,  4.34it/s][A
Training:  26%|██▋       | 31/117 [00:07<00:15,  5.50it/s][A
Training:  28%|██▊   

Epoch: 18/81 - Loss: 0.1533 - Accuracy: 0.9400



  0%|          | 0/15 [00:00<?, ?it/s][A
  7%|▋         | 1/15 [00:01<00:17,  1.25s/it][A
 27%|██▋       | 4/15 [00:01<00:03,  3.61it/s][A
 40%|████      | 6/15 [00:02<00:02,  3.20it/s][A
 60%|██████    | 9/15 [00:02<00:01,  3.70it/s][A
 80%|████████  | 12/15 [00:02<00:00,  5.66it/s][A
100%|██████████| 15/15 [00:03<00:00,  4.25it/s][A
Epochs:  22%|██▏       | 18/81 [07:56<27:39, 26.35s/it]

Val Loss: 0.1527 - Val Accuracy: 0.9382



Training:   0%|          | 0/117 [00:00<?, ?it/s][A
Training:   1%|          | 1/117 [00:01<02:14,  1.16s/it][A
Training:   3%|▎         | 4/117 [00:01<00:28,  4.01it/s][A
Training:   5%|▌         | 6/117 [00:02<00:33,  3.31it/s][A
Training:   8%|▊         | 9/117 [00:02<00:30,  3.50it/s][A
Training:   9%|▉         | 11/117 [00:02<00:23,  4.58it/s][A
Training:  11%|█         | 13/117 [00:03<00:27,  3.76it/s][A
Training:  15%|█▍        | 17/117 [00:04<00:23,  4.31it/s][A
Training:  17%|█▋        | 20/117 [00:04<00:16,  5.85it/s][A
Training:  19%|█▉        | 22/117 [00:05<00:20,  4.66it/s][A
Training:  21%|██▏       | 25/117 [00:06<00:22,  4.15it/s][A
Training:  24%|██▍       | 28/117 [00:06<00:15,  5.73it/s][A
Training:  26%|██▌       | 30/117 [00:07<00:18,  4.63it/s][A
Training:  28%|██▊       | 33/117 [00:07<00:18,  4.48it/s][A
Training:  31%|███       | 36/117 [00:07<00:13,  6.14it/s][A
Training:  32%|███▏      | 38/117 [00:08<00:16,  4.85it/s][A
Training:  34%|███▍ 

Epoch: 19/81 - Loss: 0.1618 - Accuracy: 0.9374



  0%|          | 0/15 [00:00<?, ?it/s][A
  7%|▋         | 1/15 [00:01<00:15,  1.10s/it][A
 20%|██        | 3/15 [00:01<00:03,  3.00it/s][A
 33%|███▎      | 5/15 [00:01<00:03,  3.19it/s][A
 60%|██████    | 9/15 [00:02<00:01,  4.51it/s][A
100%|██████████| 15/15 [00:03<00:00,  4.51it/s][A
Epochs:  23%|██▎       | 19/81 [08:22<27:05, 26.22s/it]

Val Loss: 0.1555 - Val Accuracy: 0.9369



Training:   0%|          | 0/117 [00:00<?, ?it/s][A
Training:   1%|          | 1/117 [00:01<02:23,  1.23s/it][A
Training:   3%|▎         | 3/117 [00:01<00:42,  2.68it/s][A
Training:   4%|▍         | 5/117 [00:02<00:39,  2.84it/s][A
Training:   6%|▌         | 7/117 [00:02<00:25,  4.33it/s][A
Training:   8%|▊         | 9/117 [00:02<00:27,  3.88it/s][A
Training:  10%|█         | 12/117 [00:02<00:17,  6.03it/s][A
Training:  12%|█▏        | 14/117 [00:03<00:22,  4.66it/s][A
Training:  14%|█▎        | 16/117 [00:03<00:18,  5.35it/s][A
Training:  15%|█▍        | 17/117 [00:04<00:22,  4.41it/s][A
Training:  16%|█▌        | 19/117 [00:04<00:17,  5.55it/s][A
Training:  17%|█▋        | 20/117 [00:04<00:19,  4.88it/s][A
Training:  18%|█▊        | 21/117 [00:05<00:23,  4.01it/s][A
Training:  20%|█▉        | 23/117 [00:05<00:16,  5.59it/s][A
Training:  21%|██        | 24/117 [00:05<00:19,  4.75it/s][A
Training:  21%|██▏       | 25/117 [00:05<00:22,  4.04it/s][A
Training:  24%|██▍   

Epoch: 20/81 - Loss: 0.1501 - Accuracy: 0.9400



  0%|          | 0/15 [00:00<?, ?it/s][A
  7%|▋         | 1/15 [00:01<00:16,  1.19s/it][A
 33%|███▎      | 5/15 [00:01<00:03,  3.18it/s][A
 47%|████▋     | 7/15 [00:01<00:01,  4.64it/s][A
 60%|██████    | 9/15 [00:02<00:01,  3.85it/s][A
 80%|████████  | 12/15 [00:02<00:00,  6.13it/s][A
100%|██████████| 15/15 [00:03<00:00,  4.35it/s][A
Epochs:  25%|██▍       | 20/81 [08:49<26:52, 26.43s/it]

Val Loss: 0.1558 - Val Accuracy: 0.9372



Training:   0%|          | 0/117 [00:00<?, ?it/s][A
Training:   1%|          | 1/117 [00:01<02:38,  1.37s/it][A
Training:   3%|▎         | 3/117 [00:01<00:45,  2.51it/s][A
Training:   4%|▍         | 5/117 [00:02<00:37,  3.00it/s][A
Training:   5%|▌         | 6/117 [00:02<00:30,  3.60it/s][A
Training:   7%|▋         | 8/117 [00:02<00:19,  5.58it/s][A
Training:   9%|▊         | 10/117 [00:02<00:25,  4.16it/s][A
Training:  11%|█         | 13/117 [00:03<00:22,  4.54it/s][A
Training:  12%|█▏        | 14/117 [00:03<00:21,  4.80it/s][A
Training:  15%|█▍        | 17/117 [00:04<00:21,  4.73it/s][A
Training:  16%|█▌        | 19/117 [00:04<00:16,  5.97it/s][A
Training:  18%|█▊        | 21/117 [00:05<00:19,  4.87it/s][A
Training:  20%|█▉        | 23/117 [00:05<00:17,  5.53it/s][A
Training:  21%|██▏       | 25/117 [00:05<00:18,  5.06it/s][A
Training:  23%|██▎       | 27/117 [00:06<00:17,  5.29it/s][A
Training:  25%|██▍       | 29/117 [00:06<00:16,  5.36it/s][A
Training:  26%|██▌   

Epoch: 21/81 - Loss: 0.1522 - Accuracy: 0.9417



  0%|          | 0/15 [00:00<?, ?it/s][A
  7%|▋         | 1/15 [00:01<00:15,  1.13s/it][A
 20%|██        | 3/15 [00:01<00:03,  3.02it/s][A
 33%|███▎      | 5/15 [00:01<00:03,  3.31it/s][A
 53%|█████▎    | 8/15 [00:01<00:01,  5.82it/s][A
 67%|██████▋   | 10/15 [00:02<00:00,  5.26it/s][A
 73%|███████▎  | 11/15 [00:02<00:00,  5.51it/s][A
100%|██████████| 15/15 [00:03<00:00,  4.68it/s][A
Epochs:  26%|██▌       | 21/81 [09:16<26:23, 26.40s/it]

Val Loss: 0.1562 - Val Accuracy: 0.9341



Training:   0%|          | 0/117 [00:00<?, ?it/s][A
Training:   1%|          | 1/117 [00:01<02:12,  1.14s/it][A
Training:   2%|▏         | 2/117 [00:01<01:08,  1.68it/s][A
Training:   4%|▍         | 5/117 [00:02<00:36,  3.03it/s][A
Training:   6%|▌         | 7/117 [00:02<00:23,  4.59it/s][A
Training:   8%|▊         | 9/117 [00:02<00:28,  3.75it/s][A
Training:   9%|▉         | 11/117 [00:03<00:21,  4.92it/s][A
Training:  11%|█         | 13/117 [00:03<00:24,  4.20it/s][A
Training:  14%|█▎        | 16/117 [00:03<00:15,  6.45it/s][A
Training:  15%|█▌        | 18/117 [00:04<00:21,  4.55it/s][A
Training:  17%|█▋        | 20/117 [00:04<00:18,  5.37it/s][A
Training:  18%|█▊        | 21/117 [00:05<00:25,  3.83it/s][A
Training:  20%|█▉        | 23/117 [00:05<00:19,  4.82it/s][A
Training:  21%|██▏       | 25/117 [00:06<00:19,  4.62it/s][A
Training:  23%|██▎       | 27/117 [00:06<00:17,  5.17it/s][A
Training:  25%|██▍       | 29/117 [00:06<00:19,  4.60it/s][A
Training:  26%|██▋   

Epoch: 22/81 - Loss: 0.1566 - Accuracy: 0.9367



  0%|          | 0/15 [00:00<?, ?it/s][A
  7%|▋         | 1/15 [00:01<00:16,  1.15s/it][A
 20%|██        | 3/15 [00:01<00:04,  2.91it/s][A
 33%|███▎      | 5/15 [00:01<00:03,  2.86it/s][A
 40%|████      | 6/15 [00:02<00:02,  3.51it/s][A
 60%|██████    | 9/15 [00:02<00:01,  3.95it/s][A
100%|██████████| 15/15 [00:03<00:00,  4.23it/s][A
Epochs:  27%|██▋       | 22/81 [09:43<26:12, 26.65s/it]

Val Loss: 0.1532 - Val Accuracy: 0.9374



Training:   0%|          | 0/117 [00:00<?, ?it/s][A
Training:   1%|          | 1/117 [00:01<02:04,  1.07s/it][A
Training:   2%|▏         | 2/117 [00:01<00:58,  1.98it/s][A
Training:   4%|▍         | 5/117 [00:01<00:32,  3.43it/s][A
Training:   5%|▌         | 6/117 [00:01<00:28,  3.88it/s][A
Training:   8%|▊         | 9/117 [00:02<00:24,  4.50it/s][A
Training:   9%|▊         | 10/117 [00:02<00:22,  4.69it/s][A
Training:  11%|█         | 13/117 [00:03<00:22,  4.66it/s][A
Training:  12%|█▏        | 14/117 [00:03<00:22,  4.64it/s][A
Training:  14%|█▎        | 16/117 [00:03<00:17,  5.90it/s][A
Training:  15%|█▍        | 17/117 [00:04<00:22,  4.40it/s][A
Training:  15%|█▌        | 18/117 [00:04<00:20,  4.90it/s][A
Training:  16%|█▌        | 19/117 [00:04<00:17,  5.54it/s][A
Training:  18%|█▊        | 21/117 [00:05<00:22,  4.21it/s][A
Training:  20%|█▉        | 23/117 [00:05<00:16,  5.74it/s][A
Training:  21%|██▏       | 25/117 [00:05<00:20,  4.40it/s][A
Training:  22%|██▏   

Epoch: 23/81 - Loss: 0.1493 - Accuracy: 0.9388



  0%|          | 0/15 [00:00<?, ?it/s][A
  7%|▋         | 1/15 [00:01<00:13,  1.00it/s][A
 33%|███▎      | 5/15 [00:01<00:02,  3.53it/s][A
 53%|█████▎    | 8/15 [00:01<00:01,  6.02it/s][A
 67%|██████▋   | 10/15 [00:02<00:01,  4.55it/s][A
 80%|████████  | 12/15 [00:02<00:00,  5.95it/s][A
100%|██████████| 15/15 [00:03<00:00,  4.62it/s][A
Epochs:  28%|██▊       | 23/81 [10:09<25:40, 26.57s/it]

Val Loss: 0.1851 - Val Accuracy: 0.9237



Training:   0%|          | 0/117 [00:00<?, ?it/s][A
Training:   1%|          | 1/117 [00:01<02:13,  1.15s/it][A
Training:   4%|▍         | 5/117 [00:01<00:36,  3.07it/s][A
Training:   7%|▋         | 8/117 [00:02<00:20,  5.23it/s][A
Training:   9%|▊         | 10/117 [00:02<00:24,  4.32it/s][A
Training:  10%|█         | 12/117 [00:02<00:18,  5.64it/s][A
Training:  12%|█▏        | 14/117 [00:03<00:24,  4.22it/s][A
Training:  14%|█▎        | 16/117 [00:03<00:18,  5.44it/s][A
Training:  15%|█▌        | 18/117 [00:04<00:22,  4.50it/s][A
Training:  17%|█▋        | 20/117 [00:04<00:16,  5.86it/s][A
Training:  19%|█▉        | 22/117 [00:05<00:23,  4.11it/s][A
Training:  21%|██        | 24/117 [00:05<00:17,  5.36it/s][A
Training:  22%|██▏       | 26/117 [00:06<00:21,  4.21it/s][A
Training:  25%|██▍       | 29/117 [00:06<00:21,  4.03it/s][A
Training:  28%|██▊       | 33/117 [00:07<00:18,  4.54it/s][A
Training:  32%|███▏      | 37/117 [00:08<00:17,  4.71it/s][A
Training:  33%|███▎

Epoch: 24/81 - Loss: 0.1469 - Accuracy: 0.9405



  0%|          | 0/15 [00:00<?, ?it/s][A
  7%|▋         | 1/15 [00:01<00:17,  1.22s/it][A
 20%|██        | 3/15 [00:01<00:04,  2.81it/s][A
 33%|███▎      | 5/15 [00:01<00:03,  2.95it/s][A
 53%|█████▎    | 8/15 [00:02<00:01,  5.42it/s][A
 67%|██████▋   | 10/15 [00:02<00:01,  4.35it/s][A
 80%|████████  | 12/15 [00:02<00:00,  5.82it/s][A
100%|██████████| 15/15 [00:03<00:00,  4.23it/s][A
Epochs:  30%|██▉       | 24/81 [10:36<25:26, 26.78s/it]

Val Loss: 0.1453 - Val Accuracy: 0.9397



Training:   0%|          | 0/117 [00:00<?, ?it/s][A
Training:   1%|          | 1/117 [00:01<02:11,  1.13s/it][A
Training:   3%|▎         | 4/117 [00:01<00:30,  3.75it/s][A
Training:   4%|▍         | 5/117 [00:01<00:38,  2.95it/s][A
Training:   7%|▋         | 8/117 [00:01<00:18,  5.77it/s][A
Training:   9%|▊         | 10/117 [00:02<00:23,  4.64it/s][A
Training:  10%|█         | 12/117 [00:02<00:17,  6.17it/s][A
Training:  12%|█▏        | 14/117 [00:03<00:25,  3.97it/s][A
Training:  14%|█▎        | 16/117 [00:03<00:19,  5.17it/s][A
Training:  15%|█▌        | 18/117 [00:04<00:23,  4.25it/s][A
Training:  17%|█▋        | 20/117 [00:04<00:17,  5.55it/s][A
Training:  19%|█▉        | 22/117 [00:05<00:23,  3.96it/s][A
Training:  21%|██▏       | 25/117 [00:05<00:22,  4.17it/s][A
Training:  24%|██▍       | 28/117 [00:06<00:14,  5.98it/s][A
Training:  26%|██▌       | 30/117 [00:06<00:19,  4.37it/s][A
Training:  28%|██▊       | 33/117 [00:07<00:20,  4.07it/s][A
Training:  30%|██▉  

Epoch: 25/81 - Loss: 0.1493 - Accuracy: 0.9405



  0%|          | 0/15 [00:00<?, ?it/s][A
  7%|▋         | 1/15 [00:01<00:19,  1.37s/it][A
 27%|██▋       | 4/15 [00:01<00:03,  3.39it/s][A
 40%|████      | 6/15 [00:02<00:02,  3.28it/s][A
 60%|██████    | 9/15 [00:02<00:01,  3.94it/s][A
 80%|████████  | 12/15 [00:02<00:00,  6.07it/s][A
100%|██████████| 15/15 [00:03<00:00,  4.34it/s][A
Epochs:  31%|███       | 25/81 [11:04<25:07, 26.93s/it]

Val Loss: 0.1486 - Val Accuracy: 0.9391



Training:   0%|          | 0/117 [00:00<?, ?it/s][A
Training:   1%|          | 1/117 [00:00<01:53,  1.02it/s][A
Training:   2%|▏         | 2/117 [00:01<01:02,  1.83it/s][A
Training:   3%|▎         | 4/117 [00:01<00:27,  4.11it/s][A
Training:   4%|▍         | 5/117 [00:01<00:33,  3.36it/s][A
Training:   5%|▌         | 6/117 [00:01<00:29,  3.74it/s][A
Training:   7%|▋         | 8/117 [00:02<00:18,  5.84it/s][A
Training:   8%|▊         | 9/117 [00:02<00:25,  4.23it/s][A
Training:   9%|▉         | 11/117 [00:02<00:17,  6.06it/s][A
Training:  10%|█         | 12/117 [00:02<00:17,  6.08it/s][A
Training:  11%|█         | 13/117 [00:03<00:22,  4.65it/s][A
Training:  12%|█▏        | 14/117 [00:03<00:19,  5.26it/s][A
Training:  14%|█▎        | 16/117 [00:03<00:14,  7.02it/s][A
Training:  15%|█▍        | 17/117 [00:03<00:19,  5.02it/s][A
Training:  15%|█▌        | 18/117 [00:04<00:18,  5.29it/s][A
Training:  17%|█▋        | 20/117 [00:04<00:13,  7.14it/s][A
Training:  18%|█▊      

Epoch: 26/81 - Loss: 0.1553 - Accuracy: 0.9393



  0%|          | 0/15 [00:00<?, ?it/s][A
  7%|▋         | 1/15 [00:01<00:16,  1.17s/it][A
 27%|██▋       | 4/15 [00:01<00:02,  3.70it/s][A
 40%|████      | 6/15 [00:02<00:02,  3.41it/s][A
 53%|█████▎    | 8/15 [00:02<00:01,  4.91it/s][A
 67%|██████▋   | 10/15 [00:02<00:01,  4.09it/s][A
100%|██████████| 15/15 [00:03<00:00,  4.38it/s][A
Epochs:  32%|███▏      | 26/81 [11:30<24:39, 26.89s/it]

Val Loss: 0.1824 - Val Accuracy: 0.9221



Training:   0%|          | 0/117 [00:00<?, ?it/s][A
Training:   1%|          | 1/117 [00:01<02:23,  1.24s/it][A
Training:   4%|▍         | 5/117 [00:01<00:37,  3.02it/s][A
Training:   6%|▌         | 7/117 [00:02<00:25,  4.35it/s][A
Training:   8%|▊         | 9/117 [00:02<00:29,  3.69it/s][A
Training:  10%|█         | 12/117 [00:02<00:18,  5.75it/s][A
Training:  12%|█▏        | 14/117 [00:03<00:20,  4.99it/s][A
Training:  15%|█▍        | 17/117 [00:04<00:21,  4.75it/s][A
Training:  16%|█▌        | 19/117 [00:04<00:16,  5.91it/s][A
Training:  18%|█▊        | 21/117 [00:04<00:19,  4.87it/s][A
Training:  20%|█▉        | 23/117 [00:05<00:16,  5.68it/s][A
Training:  21%|██▏       | 25/117 [00:05<00:20,  4.48it/s][A
Training:  23%|██▎       | 27/117 [00:05<00:15,  5.73it/s][A
Training:  25%|██▍       | 29/117 [00:06<00:19,  4.61it/s][A
Training:  26%|██▋       | 31/117 [00:06<00:14,  5.91it/s][A
Training:  28%|██▊       | 33/117 [00:07<00:17,  4.67it/s][A
Training:  30%|██▉  

Epoch: 27/81 - Loss: 0.1521 - Accuracy: 0.9381



  0%|          | 0/15 [00:00<?, ?it/s][A
  7%|▋         | 1/15 [00:00<00:12,  1.09it/s][A
 27%|██▋       | 4/15 [00:01<00:02,  4.16it/s][A
 33%|███▎      | 5/15 [00:01<00:03,  3.27it/s][A
 53%|█████▎    | 8/15 [00:01<00:01,  5.96it/s][A
 67%|██████▋   | 10/15 [00:02<00:01,  4.69it/s][A
 80%|████████  | 12/15 [00:02<00:00,  6.07it/s][A
100%|██████████| 15/15 [00:03<00:00,  4.69it/s][A
Epochs:  33%|███▎      | 27/81 [11:56<23:56, 26.59s/it]

Val Loss: 0.1602 - Val Accuracy: 0.9292



Training:   0%|          | 0/117 [00:00<?, ?it/s][A
Training:   1%|          | 1/117 [00:01<02:08,  1.11s/it][A
Training:   4%|▍         | 5/117 [00:01<00:33,  3.37it/s][A
Training:   6%|▌         | 7/117 [00:01<00:22,  4.88it/s][A
Training:   8%|▊         | 9/117 [00:02<00:29,  3.68it/s][A
Training:  10%|█         | 12/117 [00:02<00:18,  5.74it/s][A
Training:  12%|█▏        | 14/117 [00:03<00:24,  4.24it/s][A
Training:  14%|█▎        | 16/117 [00:03<00:18,  5.38it/s][A
Training:  15%|█▌        | 18/117 [00:04<00:24,  4.12it/s][A
Training:  18%|█▊        | 21/117 [00:05<00:23,  4.11it/s][A
Training:  20%|█▉        | 23/117 [00:05<00:18,  5.16it/s][A
Training:  21%|██▏       | 25/117 [00:05<00:19,  4.70it/s][A
Training:  24%|██▍       | 28/117 [00:05<00:13,  6.77it/s][A
Training:  26%|██▌       | 30/117 [00:06<00:16,  5.39it/s][A
Training:  28%|██▊       | 33/117 [00:07<00:18,  4.48it/s][A
Training:  31%|███       | 36/117 [00:07<00:13,  6.17it/s][A
Training:  32%|███▏ 

Epoch: 28/81 - Loss: 0.1450 - Accuracy: 0.9432



  0%|          | 0/15 [00:00<?, ?it/s][A
  7%|▋         | 1/15 [00:01<00:14,  1.05s/it][A
 27%|██▋       | 4/15 [00:01<00:02,  4.36it/s][A
 40%|████      | 6/15 [00:01<00:02,  3.36it/s][A
 60%|██████    | 9/15 [00:02<00:01,  3.54it/s][A
100%|██████████| 15/15 [00:03<00:00,  3.95it/s][A
Epochs:  35%|███▍      | 28/81 [12:23<23:37, 26.74s/it]

Val Loss: 0.1437 - Val Accuracy: 0.9393



Training:   0%|          | 0/117 [00:00<?, ?it/s][A
Training:   1%|          | 1/117 [00:01<02:06,  1.09s/it][A
Training:   3%|▎         | 4/117 [00:01<00:26,  4.20it/s][A
Training:   5%|▌         | 6/117 [00:01<00:32,  3.46it/s][A
Training:   7%|▋         | 8/117 [00:02<00:22,  4.94it/s][A
Training:   9%|▊         | 10/117 [00:02<00:29,  3.63it/s][A
Training:  11%|█         | 13/117 [00:03<00:22,  4.57it/s][A
Training:  12%|█▏        | 14/117 [00:03<00:23,  4.31it/s][A
Training:  14%|█▎        | 16/117 [00:03<00:17,  5.68it/s][A
Training:  15%|█▍        | 17/117 [00:03<00:18,  5.27it/s][A
Training:  15%|█▌        | 18/117 [00:04<00:22,  4.41it/s][A
Training:  18%|█▊        | 21/117 [00:04<00:16,  5.88it/s][A
Training:  19%|█▉        | 22/117 [00:05<00:20,  4.62it/s][A
Training:  21%|██▏       | 25/117 [00:05<00:13,  6.69it/s][A
Training:  22%|██▏       | 26/117 [00:05<00:18,  4.88it/s][A
Training:  25%|██▍       | 29/117 [00:05<00:12,  7.18it/s][A
Training:  26%|██▋  

Epoch: 29/81 - Loss: 0.1561 - Accuracy: 0.9389



  0%|          | 0/15 [00:00<?, ?it/s][A
  7%|▋         | 1/15 [00:01<00:14,  1.06s/it][A
 33%|███▎      | 5/15 [00:01<00:02,  3.68it/s][A
 60%|██████    | 9/15 [00:02<00:01,  4.37it/s][A
100%|██████████| 15/15 [00:03<00:00,  4.49it/s][A
Epochs:  36%|███▌      | 29/81 [12:50<23:04, 26.62s/it]

Val Loss: 0.1451 - Val Accuracy: 0.9420



Training:   0%|          | 0/117 [00:00<?, ?it/s][A
Training:   1%|          | 1/117 [00:01<01:58,  1.03s/it][A
Training:   3%|▎         | 3/117 [00:01<00:35,  3.18it/s][A
Training:   4%|▍         | 5/117 [00:01<00:32,  3.47it/s][A
Training:   6%|▌         | 7/117 [00:01<00:22,  4.91it/s][A
Training:   8%|▊         | 9/117 [00:02<00:23,  4.63it/s][A
Training:   9%|▊         | 10/117 [00:02<00:21,  5.08it/s][A
Training:   9%|▉         | 11/117 [00:02<00:20,  5.10it/s][A
Training:  11%|█         | 13/117 [00:03<00:20,  4.97it/s][A
Training:  13%|█▎        | 15/117 [00:03<00:19,  5.26it/s][A
Training:  15%|█▍        | 17/117 [00:04<00:24,  4.15it/s][A
Training:  16%|█▌        | 19/117 [00:04<00:18,  5.39it/s][A
Training:  18%|█▊        | 21/117 [00:04<00:22,  4.20it/s][A
Training:  21%|██        | 24/117 [00:05<00:14,  6.21it/s][A
Training:  22%|██▏       | 26/117 [00:05<00:18,  4.95it/s][A
Training:  23%|██▎       | 27/117 [00:05<00:19,  4.72it/s][A
Training:  25%|██▍   

Epoch: 30/81 - Loss: 0.1491 - Accuracy: 0.9419



  0%|          | 0/15 [00:00<?, ?it/s][A
  7%|▋         | 1/15 [00:01<00:16,  1.21s/it][A
 27%|██▋       | 4/15 [00:01<00:02,  3.87it/s][A
 40%|████      | 6/15 [00:02<00:02,  3.34it/s][A
 60%|██████    | 9/15 [00:02<00:01,  3.35it/s][A
100%|██████████| 15/15 [00:03<00:00,  3.94it/s][A
Epochs:  37%|███▋      | 30/81 [13:17<22:52, 26.92s/it]

Val Loss: 0.1748 - Val Accuracy: 0.9316



Training:   0%|          | 0/117 [00:00<?, ?it/s][A
Training:   1%|          | 1/117 [00:01<02:04,  1.08s/it][A
Training:   3%|▎         | 3/117 [00:01<00:36,  3.14it/s][A
Training:   4%|▍         | 5/117 [00:01<00:32,  3.40it/s][A
Training:   5%|▌         | 6/117 [00:01<00:30,  3.69it/s][A
Training:   8%|▊         | 9/117 [00:02<00:26,  4.05it/s][A
Training:   9%|▉         | 11/117 [00:02<00:19,  5.48it/s][A
Training:  11%|█         | 13/117 [00:03<00:22,  4.58it/s][A
Training:  15%|█▍        | 17/117 [00:04<00:19,  5.05it/s][A
Training:  18%|█▊        | 21/117 [00:04<00:17,  5.38it/s][A
Training:  20%|█▉        | 23/117 [00:04<00:14,  6.38it/s][A
Training:  21%|██▏       | 25/117 [00:05<00:18,  4.88it/s][A
Training:  23%|██▎       | 27/117 [00:05<00:15,  5.94it/s][A
Training:  25%|██▍       | 29/117 [00:06<00:17,  4.91it/s][A
Training:  26%|██▌       | 30/117 [00:06<00:17,  5.08it/s][A
Training:  28%|██▊       | 33/117 [00:06<00:16,  5.05it/s][A
Training:  29%|██▉   

Epoch: 31/81 - Loss: 0.1440 - Accuracy: 0.9441



  0%|          | 0/15 [00:00<?, ?it/s][A
  7%|▋         | 1/15 [00:00<00:13,  1.01it/s][A
 33%|███▎      | 5/15 [00:01<00:02,  3.62it/s][A
 53%|█████▎    | 8/15 [00:01<00:01,  6.20it/s][A
 67%|██████▋   | 10/15 [00:02<00:01,  4.74it/s][A
 80%|████████  | 12/15 [00:02<00:00,  5.89it/s][A
100%|██████████| 15/15 [00:03<00:00,  4.64it/s][A
Epochs:  38%|███▊      | 31/81 [13:43<22:09, 26.59s/it]

Val Loss: 0.1772 - Val Accuracy: 0.9292



Training:   0%|          | 0/117 [00:00<?, ?it/s][A
Training:   1%|          | 1/117 [00:01<02:21,  1.22s/it][A
Training:   4%|▍         | 5/117 [00:01<00:38,  2.94it/s][A
Training:   6%|▌         | 7/117 [00:02<00:25,  4.26it/s][A
Training:   8%|▊         | 9/117 [00:02<00:30,  3.52it/s][A
Training:   9%|▉         | 11/117 [00:02<00:22,  4.77it/s][A
Training:  11%|█         | 13/117 [00:03<00:26,  3.93it/s][A
Training:  14%|█▎        | 16/117 [00:03<00:17,  5.90it/s][A
Training:  15%|█▌        | 18/117 [00:04<00:23,  4.26it/s][A
Training:  18%|█▊        | 21/117 [00:05<00:21,  4.54it/s][A
Training:  21%|██        | 24/117 [00:05<00:14,  6.33it/s][A
Training:  22%|██▏       | 26/117 [00:06<00:19,  4.63it/s][A
Training:  25%|██▍       | 29/117 [00:06<00:20,  4.33it/s][A
Training:  26%|██▋       | 31/117 [00:07<00:16,  5.25it/s][A
Training:  28%|██▊       | 33/117 [00:07<00:19,  4.23it/s][A
Training:  31%|███       | 36/117 [00:07<00:13,  6.11it/s][A
Training:  32%|███▏ 

Epoch: 32/81 - Loss: 0.1565 - Accuracy: 0.9379



  0%|          | 0/15 [00:00<?, ?it/s][A
  7%|▋         | 1/15 [00:01<00:17,  1.27s/it][A
 33%|███▎      | 5/15 [00:01<00:03,  3.13it/s][A
 47%|████▋     | 7/15 [00:02<00:01,  4.36it/s][A
 60%|██████    | 9/15 [00:02<00:01,  3.44it/s][A
 73%|███████▎  | 11/15 [00:02<00:00,  4.62it/s][A
100%|██████████| 15/15 [00:03<00:00,  4.08it/s][A
Epochs:  40%|███▉      | 32/81 [14:11<21:54, 26.82s/it]

Val Loss: 0.1968 - Val Accuracy: 0.9231



Training:   0%|          | 0/117 [00:00<?, ?it/s][A
Training:   1%|          | 1/117 [00:01<02:08,  1.11s/it][A
Training:   2%|▏         | 2/117 [00:01<01:00,  1.90it/s][A
Training:   4%|▍         | 5/117 [00:01<00:32,  3.44it/s][A
Training:   5%|▌         | 6/117 [00:02<00:30,  3.61it/s][A
Training:   7%|▋         | 8/117 [00:02<00:24,  4.54it/s][A
Training:   8%|▊         | 9/117 [00:02<00:24,  4.33it/s][A
Training:   9%|▊         | 10/117 [00:02<00:23,  4.51it/s][A
Training:  10%|█         | 12/117 [00:03<00:23,  4.53it/s][A
Training:  11%|█         | 13/117 [00:03<00:27,  3.73it/s][A
Training:  13%|█▎        | 15/117 [00:03<00:19,  5.30it/s][A
Training:  14%|█▎        | 16/117 [00:03<00:18,  5.53it/s][A
Training:  15%|█▍        | 17/117 [00:04<00:24,  4.15it/s][A
Training:  16%|█▌        | 19/117 [00:04<00:16,  5.89it/s][A
Training:  17%|█▋        | 20/117 [00:04<00:16,  5.96it/s][A
Training:  18%|█▊        | 21/117 [00:05<00:26,  3.60it/s][A
Training:  20%|█▉     

Epoch: 33/81 - Loss: 0.1400 - Accuracy: 0.9466



  0%|          | 0/15 [00:00<?, ?it/s][A
  7%|▋         | 1/15 [00:01<00:17,  1.28s/it][A
 33%|███▎      | 5/15 [00:01<00:03,  2.92it/s][A
 60%|██████    | 9/15 [00:02<00:01,  3.95it/s][A
100%|██████████| 15/15 [00:03<00:00,  4.17it/s][A
Epochs:  41%|████      | 33/81 [14:38<21:29, 26.85s/it]

Val Loss: 0.2112 - Val Accuracy: 0.9165



Training:   0%|          | 0/117 [00:00<?, ?it/s][A
Training:   1%|          | 1/117 [00:01<02:31,  1.31s/it][A
Training:   3%|▎         | 3/117 [00:01<00:43,  2.59it/s][A
Training:   4%|▍         | 5/117 [00:02<00:39,  2.84it/s][A
Training:   7%|▋         | 8/117 [00:02<00:20,  5.29it/s][A
Training:   9%|▊         | 10/117 [00:03<00:27,  3.85it/s][A
Training:  10%|█         | 12/117 [00:03<00:20,  5.12it/s][A
Training:  12%|█▏        | 14/117 [00:03<00:26,  3.92it/s][A
Training:  15%|█▍        | 17/117 [00:04<00:27,  3.65it/s][A
Training:  17%|█▋        | 20/117 [00:04<00:18,  5.29it/s][A
Training:  19%|█▉        | 22/117 [00:05<00:22,  4.19it/s][A
Training:  21%|██        | 24/117 [00:05<00:17,  5.30it/s][A
Training:  22%|██▏       | 26/117 [00:06<00:21,  4.27it/s][A
Training:  25%|██▍       | 29/117 [00:07<00:23,  3.82it/s][A
Training:  28%|██▊       | 33/117 [00:08<00:18,  4.47it/s][A
Training:  31%|███       | 36/117 [00:08<00:13,  6.06it/s][A
Training:  32%|███▏ 

Epoch: 34/81 - Loss: 0.1555 - Accuracy: 0.9378



  0%|          | 0/15 [00:00<?, ?it/s][A
  7%|▋         | 1/15 [00:01<00:14,  1.00s/it][A
 13%|█▎        | 2/15 [00:01<00:06,  2.03it/s][A
 27%|██▋       | 4/15 [00:01<00:02,  4.56it/s][A
 40%|████      | 6/15 [00:01<00:02,  3.62it/s][A
 60%|██████    | 9/15 [00:02<00:01,  3.86it/s][A
 73%|███████▎  | 11/15 [00:02<00:00,  5.15it/s][A
 87%|████████▋ | 13/15 [00:03<00:00,  4.28it/s][A
100%|██████████| 15/15 [00:03<00:00,  4.15it/s][A
Epochs:  42%|████▏     | 34/81 [15:05<21:16, 27.16s/it]

Val Loss: 0.1935 - Val Accuracy: 0.9237



Training:   0%|          | 0/117 [00:00<?, ?it/s][A
Training:   1%|          | 1/117 [00:01<02:16,  1.17s/it][A
Training:   3%|▎         | 4/117 [00:01<00:29,  3.84it/s][A
Training:   5%|▌         | 6/117 [00:01<00:31,  3.51it/s][A
Training:   8%|▊         | 9/117 [00:02<00:29,  3.61it/s][A
Training:  10%|█         | 12/117 [00:02<00:18,  5.54it/s][A
Training:  12%|█▏        | 14/117 [00:03<00:22,  4.59it/s][A
Training:  13%|█▎        | 15/117 [00:03<00:20,  4.98it/s][A
Training:  14%|█▎        | 16/117 [00:03<00:18,  5.48it/s][A
Training:  15%|█▍        | 17/117 [00:04<00:24,  4.09it/s][A
Training:  16%|█▌        | 19/117 [00:04<00:21,  4.50it/s][A
Training:  18%|█▊        | 21/117 [00:05<00:22,  4.27it/s][A
Training:  20%|█▉        | 23/117 [00:05<00:20,  4.65it/s][A
Training:  21%|██▏       | 25/117 [00:05<00:20,  4.58it/s][A
Training:  23%|██▎       | 27/117 [00:06<00:19,  4.58it/s][A
Training:  25%|██▍       | 29/117 [00:06<00:19,  4.44it/s][A
Training:  26%|██▋  

Epoch: 35/81 - Loss: 0.1364 - Accuracy: 0.9463



  0%|          | 0/15 [00:00<?, ?it/s][A
  7%|▋         | 1/15 [00:01<00:15,  1.12s/it][A
 33%|███▎      | 5/15 [00:01<00:02,  3.34it/s][A
 60%|██████    | 9/15 [00:02<00:01,  4.19it/s][A
 80%|████████  | 12/15 [00:02<00:00,  5.93it/s][A
100%|██████████| 15/15 [00:03<00:00,  4.42it/s][A
Epochs:  43%|████▎     | 35/81 [15:32<20:38, 26.92s/it]

Val Loss: 0.1690 - Val Accuracy: 0.9342



Training:   0%|          | 0/117 [00:00<?, ?it/s][A
Training:   1%|          | 1/117 [00:01<02:11,  1.13s/it][A
Training:   3%|▎         | 3/117 [00:01<00:38,  2.96it/s][A
Training:   4%|▍         | 5/117 [00:01<00:36,  3.07it/s][A
Training:   6%|▌         | 7/117 [00:02<00:23,  4.62it/s][A
Training:   8%|▊         | 9/117 [00:02<00:28,  3.83it/s][A
Training:   9%|▉         | 11/117 [00:02<00:20,  5.25it/s][A
Training:  11%|█         | 13/117 [00:03<00:26,  3.86it/s][A
Training:  13%|█▎        | 15/117 [00:03<00:20,  5.03it/s][A
Training:  15%|█▍        | 17/117 [00:04<00:23,  4.23it/s][A
Training:  17%|█▋        | 20/117 [00:04<00:16,  5.89it/s][A
Training:  18%|█▊        | 21/117 [00:05<00:22,  4.27it/s][A
Training:  21%|██        | 24/117 [00:05<00:15,  5.93it/s][A
Training:  21%|██▏       | 25/117 [00:05<00:20,  4.38it/s][A
Training:  23%|██▎       | 27/117 [00:06<00:15,  5.75it/s][A
Training:  25%|██▍       | 29/117 [00:06<00:19,  4.49it/s][A
Training:  27%|██▋   

Epoch: 36/81 - Loss: 0.1539 - Accuracy: 0.9393



  0%|          | 0/15 [00:00<?, ?it/s][A
  7%|▋         | 1/15 [00:01<00:14,  1.04s/it][A
 27%|██▋       | 4/15 [00:01<00:02,  4.28it/s][A
 40%|████      | 6/15 [00:01<00:02,  3.57it/s][A
 60%|██████    | 9/15 [00:02<00:01,  3.80it/s][A
 73%|███████▎  | 11/15 [00:02<00:00,  5.02it/s][A
100%|██████████| 15/15 [00:03<00:00,  4.23it/s][A
Epochs:  44%|████▍     | 36/81 [15:59<20:12, 26.95s/it]

Val Loss: 0.1961 - Val Accuracy: 0.9221



Training:   0%|          | 0/117 [00:00<?, ?it/s][A
Training:   1%|          | 1/117 [00:01<02:24,  1.25s/it][A
Training:   3%|▎         | 4/117 [00:01<00:30,  3.70it/s][A
Training:   5%|▌         | 6/117 [00:02<00:33,  3.36it/s][A
Training:   8%|▊         | 9/117 [00:02<00:31,  3.45it/s][A
Training:   9%|▉         | 11/117 [00:03<00:22,  4.63it/s][A
Training:  11%|█         | 13/117 [00:03<00:26,  3.89it/s][A
Training:  15%|█▍        | 17/117 [00:04<00:22,  4.51it/s][A
Training:  16%|█▌        | 19/117 [00:04<00:17,  5.56it/s][A
Training:  18%|█▊        | 21/117 [00:05<00:20,  4.60it/s][A
Training:  21%|██        | 24/117 [00:05<00:14,  6.35it/s][A
Training:  22%|██▏       | 26/117 [00:05<00:17,  5.32it/s][A
Training:  25%|██▍       | 29/117 [00:06<00:18,  4.87it/s][A
Training:  27%|██▋       | 32/117 [00:06<00:12,  6.68it/s][A
Training:  29%|██▉       | 34/117 [00:07<00:16,  5.17it/s][A
Training:  31%|███       | 36/117 [00:07<00:13,  6.12it/s][A
Training:  32%|███▏ 

Epoch: 37/81 - Loss: 0.1413 - Accuracy: 0.9451



  0%|          | 0/15 [00:00<?, ?it/s][A
  7%|▋         | 1/15 [00:01<00:16,  1.15s/it][A
 33%|███▎      | 5/15 [00:02<00:03,  2.79it/s][A
 53%|█████▎    | 8/15 [00:02<00:01,  4.80it/s][A
 67%|██████▋   | 10/15 [00:03<00:01,  3.63it/s][A
100%|██████████| 15/15 [00:03<00:00,  3.98it/s][A
Epochs:  46%|████▌     | 37/81 [16:26<19:43, 26.90s/it]

Val Loss: 0.1519 - Val Accuracy: 0.9370



Training:   0%|          | 0/117 [00:00<?, ?it/s][A
Training:   1%|          | 1/117 [00:01<02:12,  1.14s/it][A
Training:   3%|▎         | 4/117 [00:01<00:28,  3.95it/s][A
Training:   5%|▌         | 6/117 [00:01<00:32,  3.44it/s][A
Training:   8%|▊         | 9/117 [00:02<00:30,  3.50it/s][A
Training:   9%|▉         | 11/117 [00:02<00:22,  4.68it/s][A
Training:  11%|█         | 13/117 [00:03<00:26,  3.86it/s][A
Training:  13%|█▎        | 15/117 [00:03<00:19,  5.10it/s][A
Training:  15%|█▍        | 17/117 [00:04<00:21,  4.70it/s][A
Training:  17%|█▋        | 20/117 [00:04<00:14,  6.67it/s][A
Training:  19%|█▉        | 22/117 [00:04<00:17,  5.29it/s][A
Training:  21%|██▏       | 25/117 [00:06<00:22,  4.11it/s][A
Training:  24%|██▍       | 28/117 [00:06<00:15,  5.80it/s][A
Training:  26%|██▌       | 30/117 [00:06<00:19,  4.57it/s][A
Training:  27%|██▋       | 32/117 [00:06<00:14,  5.68it/s][A
Training:  29%|██▉       | 34/117 [00:07<00:17,  4.86it/s][A
Training:  32%|███▏ 

Epoch: 38/81 - Loss: 0.1404 - Accuracy: 0.9443



  0%|          | 0/15 [00:00<?, ?it/s][A
  7%|▋         | 1/15 [00:01<00:15,  1.11s/it][A
 20%|██        | 3/15 [00:01<00:04,  2.85it/s][A
 33%|███▎      | 5/15 [00:01<00:03,  3.10it/s][A
 40%|████      | 6/15 [00:02<00:02,  3.51it/s][A
 47%|████▋     | 7/15 [00:02<00:02,  3.89it/s][A
 60%|██████    | 9/15 [00:02<00:01,  4.19it/s][A
 67%|██████▋   | 10/15 [00:02<00:01,  4.42it/s][A
 73%|███████▎  | 11/15 [00:03<00:00,  4.54it/s][A
100%|██████████| 15/15 [00:03<00:00,  4.14it/s][A
Epochs:  47%|████▋     | 38/81 [16:52<19:15, 26.86s/it]

Val Loss: 0.1924 - Val Accuracy: 0.9292



Training:   0%|          | 0/117 [00:00<?, ?it/s][A
Training:   1%|          | 1/117 [00:01<02:01,  1.04s/it][A
Training:   2%|▏         | 2/117 [00:01<00:57,  1.99it/s][A
Training:   4%|▍         | 5/117 [00:01<00:33,  3.33it/s][A
Training:   6%|▌         | 7/117 [00:01<00:21,  5.02it/s][A
Training:   8%|▊         | 9/117 [00:02<00:27,  3.88it/s][A
Training:  10%|█         | 12/117 [00:02<00:19,  5.51it/s][A
Training:  11%|█         | 13/117 [00:03<00:25,  4.11it/s][A
Training:  13%|█▎        | 15/117 [00:03<00:18,  5.50it/s][A
Training:  15%|█▍        | 17/117 [00:04<00:23,  4.18it/s][A
Training:  17%|█▋        | 20/117 [00:04<00:16,  5.89it/s][A
Training:  18%|█▊        | 21/117 [00:05<00:25,  3.75it/s][A
Training:  21%|██        | 24/117 [00:05<00:16,  5.69it/s][A
Training:  22%|██▏       | 26/117 [00:06<00:21,  4.26it/s][A
Training:  25%|██▍       | 29/117 [00:06<00:20,  4.22it/s][A
Training:  27%|██▋       | 32/117 [00:07<00:14,  5.86it/s][A
Training:  29%|██▉   

Epoch: 39/81 - Loss: 0.1755 - Accuracy: 0.9306



  0%|          | 0/15 [00:00<?, ?it/s][A
  7%|▋         | 1/15 [00:01<00:15,  1.09s/it][A
 27%|██▋       | 4/15 [00:01<00:02,  4.24it/s][A
 40%|████      | 6/15 [00:01<00:02,  3.63it/s][A
 53%|█████▎    | 8/15 [00:01<00:01,  5.23it/s][A
 67%|██████▋   | 10/15 [00:02<00:01,  4.95it/s][A
 80%|████████  | 12/15 [00:02<00:00,  6.44it/s][A
100%|██████████| 15/15 [00:03<00:00,  4.60it/s][A
Epochs:  48%|████▊     | 39/81 [17:19<18:45, 26.79s/it]

Val Loss: 0.1925 - Val Accuracy: 0.9260



Training:   0%|          | 0/117 [00:00<?, ?it/s][A
Training:   1%|          | 1/117 [00:01<02:15,  1.16s/it][A
Training:   3%|▎         | 4/117 [00:01<00:33,  3.38it/s][A
Training:   4%|▍         | 5/117 [00:02<00:42,  2.66it/s][A
Training:   7%|▋         | 8/117 [00:02<00:23,  4.69it/s][A
Training:   8%|▊         | 9/117 [00:02<00:31,  3.44it/s][A
Training:  10%|█         | 12/117 [00:03<00:20,  5.21it/s][A
Training:  11%|█         | 13/117 [00:03<00:27,  3.82it/s][A
Training:  14%|█▎        | 16/117 [00:03<00:17,  5.78it/s][A
Training:  15%|█▍        | 17/117 [00:04<00:24,  4.03it/s][A
Training:  17%|█▋        | 20/117 [00:04<00:16,  5.99it/s][A
Training:  19%|█▉        | 22/117 [00:05<00:22,  4.23it/s][A
Training:  21%|██        | 24/117 [00:05<00:16,  5.48it/s][A
Training:  22%|██▏       | 26/117 [00:06<00:20,  4.43it/s][A
Training:  24%|██▍       | 28/117 [00:06<00:16,  5.50it/s][A
Training:  26%|██▌       | 30/117 [00:07<00:20,  4.26it/s][A
Training:  27%|██▋   

Epoch: 40/81 - Loss: 0.1626 - Accuracy: 0.9372



  0%|          | 0/15 [00:00<?, ?it/s][A
  7%|▋         | 1/15 [00:01<00:15,  1.12s/it][A
 27%|██▋       | 4/15 [00:01<00:02,  3.90it/s][A
 40%|████      | 6/15 [00:01<00:02,  3.49it/s][A
 60%|██████    | 9/15 [00:02<00:01,  3.79it/s][A
 73%|███████▎  | 11/15 [00:02<00:00,  5.07it/s][A
100%|██████████| 15/15 [00:03<00:00,  4.27it/s][A
Epochs:  49%|████▉     | 40/81 [17:46<18:20, 26.85s/it]

Val Loss: 0.1451 - Val Accuracy: 0.9419



Training:   0%|          | 0/117 [00:00<?, ?it/s][A
Training:   1%|          | 1/117 [00:01<02:10,  1.12s/it][A
Training:   2%|▏         | 2/117 [00:01<01:06,  1.73it/s][A
Training:   4%|▍         | 5/117 [00:01<00:32,  3.43it/s][A
Training:   5%|▌         | 6/117 [00:02<00:31,  3.47it/s][A
Training:   8%|▊         | 9/117 [00:02<00:22,  4.77it/s][A
Training:   9%|▊         | 10/117 [00:02<00:25,  4.23it/s][A
Training:  11%|█         | 13/117 [00:03<00:19,  5.30it/s][A
Training:  12%|█▏        | 14/117 [00:03<00:22,  4.49it/s][A
Training:  14%|█▎        | 16/117 [00:03<00:16,  6.00it/s][A
Training:  15%|█▍        | 17/117 [00:04<00:20,  4.92it/s][A
Training:  15%|█▌        | 18/117 [00:04<00:22,  4.41it/s][A
Training:  17%|█▋        | 20/117 [00:04<00:15,  6.15it/s][A
Training:  18%|█▊        | 21/117 [00:05<00:21,  4.48it/s][A
Training:  19%|█▉        | 22/117 [00:05<00:22,  4.20it/s][A
Training:  21%|██▏       | 25/117 [00:05<00:20,  4.54it/s][A
Training:  22%|██▏   

Epoch: 41/81 - Loss: 0.1369 - Accuracy: 0.9452



  0%|          | 0/15 [00:00<?, ?it/s][A
  7%|▋         | 1/15 [00:01<00:17,  1.26s/it][A
 33%|███▎      | 5/15 [00:02<00:03,  2.85it/s][A
 60%|██████    | 9/15 [00:02<00:01,  3.67it/s][A
 80%|████████  | 12/15 [00:02<00:00,  5.38it/s][A
100%|██████████| 15/15 [00:03<00:00,  3.99it/s][A
Epochs:  51%|█████     | 41/81 [18:13<17:56, 26.90s/it]

Val Loss: 0.1528 - Val Accuracy: 0.9392



Training:   0%|          | 0/117 [00:00<?, ?it/s][A
Training:   1%|          | 1/117 [00:01<02:29,  1.29s/it][A
Training:   4%|▍         | 5/117 [00:02<00:43,  2.60it/s][A
Training:   7%|▋         | 8/117 [00:02<00:24,  4.51it/s][A
Training:   9%|▊         | 10/117 [00:03<00:28,  3.76it/s][A
Training:  10%|█         | 12/117 [00:03<00:21,  4.95it/s][A
Training:  12%|█▏        | 14/117 [00:03<00:23,  4.42it/s][A
Training:  15%|█▍        | 17/117 [00:04<00:23,  4.18it/s][A
Training:  16%|█▌        | 19/117 [00:04<00:18,  5.31it/s][A
Training:  18%|█▊        | 21/117 [00:05<00:22,  4.32it/s][A
Training:  21%|██▏       | 25/117 [00:06<00:19,  4.70it/s][A
Training:  23%|██▎       | 27/117 [00:06<00:15,  5.75it/s][A
Training:  25%|██▍       | 29/117 [00:06<00:19,  4.49it/s][A
Training:  28%|██▊       | 33/117 [00:07<00:17,  4.81it/s][A
Training:  32%|███▏      | 37/117 [00:08<00:16,  5.00it/s][A
Training:  33%|███▎      | 39/117 [00:08<00:13,  5.76it/s][A
Training:  35%|███▌

Epoch: 42/81 - Loss: 0.1479 - Accuracy: 0.9430



  0%|          | 0/15 [00:00<?, ?it/s][A
  7%|▋         | 1/15 [00:01<00:14,  1.04s/it][A
 33%|███▎      | 5/15 [00:01<00:02,  3.40it/s][A
 60%|██████    | 9/15 [00:02<00:01,  4.37it/s][A
 73%|███████▎  | 11/15 [00:02<00:00,  5.35it/s][A
100%|██████████| 15/15 [00:03<00:00,  4.47it/s][A
Epochs:  52%|█████▏    | 42/81 [18:40<17:29, 26.90s/it]

Val Loss: 0.1468 - Val Accuracy: 0.9437



Training:   0%|          | 0/117 [00:00<?, ?it/s][A
Training:   1%|          | 1/117 [00:01<02:23,  1.24s/it][A
Training:   3%|▎         | 4/117 [00:01<00:29,  3.80it/s][A
Training:   5%|▌         | 6/117 [00:02<00:33,  3.32it/s][A
Training:   8%|▊         | 9/117 [00:02<00:29,  3.70it/s][A
Training:  11%|█         | 13/117 [00:03<00:25,  4.10it/s][A
Training:  13%|█▎        | 15/117 [00:03<00:20,  5.05it/s][A
Training:  15%|█▍        | 17/117 [00:04<00:23,  4.25it/s][A
Training:  18%|█▊        | 21/117 [00:05<00:21,  4.57it/s][A
Training:  20%|█▉        | 23/117 [00:05<00:16,  5.55it/s][A
Training:  21%|██▏       | 25/117 [00:06<00:20,  4.42it/s][A
Training:  25%|██▍       | 29/117 [00:06<00:19,  4.54it/s][A
Training:  27%|██▋       | 32/117 [00:07<00:13,  6.13it/s][A
Training:  29%|██▉       | 34/117 [00:07<00:17,  4.70it/s][A
Training:  31%|███       | 36/117 [00:07<00:14,  5.70it/s][A
Training:  32%|███▏      | 38/117 [00:08<00:19,  4.12it/s][A
Training:  34%|███▍ 

Epoch: 43/81 - Loss: 0.1399 - Accuracy: 0.9462



  0%|          | 0/15 [00:00<?, ?it/s][A
  7%|▋         | 1/15 [00:00<00:13,  1.02it/s][A
 13%|█▎        | 2/15 [00:01<00:06,  1.95it/s][A
 33%|███▎      | 5/15 [00:01<00:02,  3.61it/s][A
 40%|████      | 6/15 [00:01<00:02,  3.76it/s][A
 60%|██████    | 9/15 [00:02<00:01,  5.03it/s][A
 67%|██████▋   | 10/15 [00:02<00:01,  5.00it/s][A
 87%|████████▋ | 13/15 [00:03<00:00,  5.46it/s][A
100%|██████████| 15/15 [00:03<00:00,  4.57it/s][A
Epochs:  53%|█████▎    | 43/81 [19:06<16:56, 26.74s/it]

Val Loss: 0.1821 - Val Accuracy: 0.9238



Training:   0%|          | 0/117 [00:00<?, ?it/s][A
Training:   1%|          | 1/117 [00:01<01:57,  1.01s/it][A
Training:   3%|▎         | 3/117 [00:01<00:34,  3.33it/s][A
Training:   4%|▍         | 5/117 [00:01<00:32,  3.44it/s][A
Training:   7%|▋         | 8/117 [00:01<00:18,  6.04it/s][A
Training:   9%|▊         | 10/117 [00:02<00:24,  4.32it/s][A
Training:  10%|█         | 12/117 [00:02<00:18,  5.56it/s][A
Training:  12%|█▏        | 14/117 [00:03<00:21,  4.83it/s][A
Training:  14%|█▎        | 16/117 [00:03<00:18,  5.55it/s][A
Training:  15%|█▍        | 17/117 [00:04<00:26,  3.77it/s][A
Training:  16%|█▌        | 19/117 [00:04<00:19,  5.11it/s][A
Training:  17%|█▋        | 20/117 [00:04<00:17,  5.50it/s][A
Training:  18%|█▊        | 21/117 [00:04<00:24,  3.89it/s][A
Training:  21%|██        | 24/117 [00:05<00:17,  5.45it/s][A
Training:  21%|██▏       | 25/117 [00:05<00:20,  4.42it/s][A
Training:  23%|██▎       | 27/117 [00:05<00:14,  6.06it/s][A
Training:  25%|██▍  

Epoch: 44/81 - Loss: 0.1389 - Accuracy: 0.9450



  0%|          | 0/15 [00:00<?, ?it/s][A
  7%|▋         | 1/15 [00:00<00:13,  1.01it/s][A
 13%|█▎        | 2/15 [00:01<00:06,  2.14it/s][A
 33%|███▎      | 5/15 [00:01<00:03,  3.32it/s][A
 60%|██████    | 9/15 [00:02<00:01,  4.02it/s][A
 67%|██████▋   | 10/15 [00:02<00:01,  4.44it/s][A
 87%|████████▋ | 13/15 [00:03<00:00,  4.50it/s][A
100%|██████████| 15/15 [00:03<00:00,  4.17it/s][A
Epochs:  54%|█████▍    | 44/81 [19:34<16:37, 26.95s/it]

Val Loss: 0.1480 - Val Accuracy: 0.9353



Training:   0%|          | 0/117 [00:00<?, ?it/s][A
Training:   1%|          | 1/117 [00:00<01:49,  1.06it/s][A
Training:   3%|▎         | 4/117 [00:01<00:23,  4.74it/s][A
Training:   5%|▌         | 6/117 [00:01<00:30,  3.65it/s][A
Training:   8%|▊         | 9/117 [00:02<00:25,  4.30it/s][A
Training:   9%|▊         | 10/117 [00:02<00:23,  4.51it/s][A
Training:  11%|█         | 13/117 [00:03<00:24,  4.27it/s][A
Training:  13%|█▎        | 15/117 [00:03<00:19,  5.28it/s][A
Training:  15%|█▍        | 17/117 [00:04<00:23,  4.17it/s][A
Training:  16%|█▌        | 19/117 [00:04<00:18,  5.32it/s][A
Training:  18%|█▊        | 21/117 [00:05<00:23,  4.09it/s][A
Training:  20%|█▉        | 23/117 [00:05<00:18,  5.06it/s][A
Training:  21%|██▏       | 25/117 [00:05<00:20,  4.41it/s][A
Training:  23%|██▎       | 27/117 [00:05<00:15,  5.67it/s][A
Training:  25%|██▍       | 29/117 [00:06<00:19,  4.58it/s][A
Training:  26%|██▋       | 31/117 [00:06<00:14,  5.81it/s][A
Training:  28%|██▊  

Epoch: 45/81 - Loss: 0.1442 - Accuracy: 0.9431



  0%|          | 0/15 [00:00<?, ?it/s][A
  7%|▋         | 1/15 [00:01<00:14,  1.01s/it][A
 33%|███▎      | 5/15 [00:01<00:03,  3.17it/s][A
 60%|██████    | 9/15 [00:02<00:01,  4.02it/s][A
100%|██████████| 15/15 [00:03<00:00,  4.31it/s][A
Epochs:  56%|█████▌    | 45/81 [20:01<16:11, 26.99s/it]

Val Loss: 0.1704 - Val Accuracy: 0.9276



Training:   0%|          | 0/117 [00:00<?, ?it/s][A
Training:   1%|          | 1/117 [00:00<01:50,  1.05it/s][A
Training:   2%|▏         | 2/117 [00:01<00:57,  1.99it/s][A
Training:   3%|▎         | 4/117 [00:01<00:25,  4.47it/s][A
Training:   4%|▍         | 5/117 [00:01<00:30,  3.70it/s][A
Training:   5%|▌         | 6/117 [00:01<00:27,  4.11it/s][A
Training:   7%|▋         | 8/117 [00:01<00:16,  6.50it/s][A
Training:   9%|▊         | 10/117 [00:02<00:24,  4.40it/s][A
Training:  10%|█         | 12/117 [00:02<00:17,  6.02it/s][A
Training:  12%|█▏        | 14/117 [00:03<00:23,  4.34it/s][A
Training:  14%|█▎        | 16/117 [00:03<00:18,  5.59it/s][A
Training:  15%|█▌        | 18/117 [00:04<00:20,  4.73it/s][A
Training:  17%|█▋        | 20/117 [00:04<00:15,  6.16it/s][A
Training:  19%|█▉        | 22/117 [00:04<00:18,  5.04it/s][A
Training:  21%|██▏       | 25/117 [00:05<00:18,  5.09it/s][A
Training:  22%|██▏       | 26/117 [00:05<00:17,  5.24it/s][A
Training:  24%|██▍    

Epoch: 46/81 - Loss: 0.1487 - Accuracy: 0.9435



  0%|          | 0/15 [00:00<?, ?it/s][A
  7%|▋         | 1/15 [00:00<00:13,  1.00it/s][A
 13%|█▎        | 2/15 [00:01<00:07,  1.84it/s][A
 33%|███▎      | 5/15 [00:01<00:02,  3.39it/s][A
 40%|████      | 6/15 [00:02<00:02,  3.68it/s][A
 53%|█████▎    | 8/15 [00:02<00:01,  5.52it/s][A
 60%|██████    | 9/15 [00:02<00:01,  3.90it/s][A
 67%|██████▋   | 10/15 [00:02<00:01,  4.07it/s][A
 87%|████████▋ | 13/15 [00:03<00:00,  4.87it/s][A
100%|██████████| 15/15 [00:03<00:00,  4.08it/s][A
Epochs:  57%|█████▋    | 46/81 [20:28<15:45, 27.02s/it]

Val Loss: 0.1444 - Val Accuracy: 0.9409



Training:   0%|          | 0/117 [00:00<?, ?it/s][A
Training:   1%|          | 1/117 [00:01<02:16,  1.18s/it][A
Training:   3%|▎         | 3/117 [00:01<00:39,  2.85it/s][A
Training:   4%|▍         | 5/117 [00:02<00:39,  2.86it/s][A
Training:   8%|▊         | 9/117 [00:02<00:25,  4.21it/s][A
Training:  10%|█         | 12/117 [00:02<00:16,  6.32it/s][A
Training:  12%|█▏        | 14/117 [00:03<00:21,  4.84it/s][A
Training:  15%|█▍        | 17/117 [00:04<00:21,  4.75it/s][A
Training:  16%|█▌        | 19/117 [00:04<00:16,  5.78it/s][A
Training:  18%|█▊        | 21/117 [00:04<00:19,  4.92it/s][A
Training:  20%|█▉        | 23/117 [00:04<00:15,  6.01it/s][A
Training:  21%|██▏       | 25/117 [00:05<00:21,  4.35it/s][A
Training:  24%|██▍       | 28/117 [00:05<00:15,  5.74it/s][A
Training:  25%|██▍       | 29/117 [00:06<00:21,  4.02it/s][A
Training:  27%|██▋       | 32/117 [00:06<00:16,  5.06it/s][A
Training:  28%|██▊       | 33/117 [00:07<00:19,  4.20it/s][A
Training:  31%|███  

Epoch: 47/81 - Loss: 0.1424 - Accuracy: 0.9426



  0%|          | 0/15 [00:00<?, ?it/s][A
  7%|▋         | 1/15 [00:00<00:13,  1.01it/s][A
 13%|█▎        | 2/15 [00:01<00:06,  2.12it/s][A
 27%|██▋       | 4/15 [00:01<00:02,  4.49it/s][A
 33%|███▎      | 5/15 [00:01<00:03,  2.99it/s][A
 40%|████      | 6/15 [00:01<00:02,  3.72it/s][A
 60%|██████    | 9/15 [00:02<00:01,  4.07it/s][A
 67%|██████▋   | 10/15 [00:02<00:01,  4.57it/s][A
100%|██████████| 15/15 [00:03<00:00,  4.38it/s][A
Epochs:  58%|█████▊    | 47/81 [20:55<15:14, 26.91s/it]

Val Loss: 0.1454 - Val Accuracy: 0.9413



Training:   0%|          | 0/117 [00:00<?, ?it/s][A
Training:   1%|          | 1/117 [00:00<01:39,  1.17it/s][A
Training:   3%|▎         | 3/117 [00:00<00:30,  3.70it/s][A
Training:   4%|▍         | 5/117 [00:01<00:29,  3.78it/s][A
Training:   6%|▌         | 7/117 [00:01<00:20,  5.27it/s][A
Training:   8%|▊         | 9/117 [00:02<00:24,  4.33it/s][A
Training:   9%|▉         | 11/117 [00:02<00:18,  5.60it/s][A
Training:  10%|█         | 12/117 [00:02<00:17,  6.10it/s][A
Training:  11%|█         | 13/117 [00:03<00:26,  3.92it/s][A
Training:  13%|█▎        | 15/117 [00:03<00:19,  5.13it/s][A
Training:  15%|█▍        | 17/117 [00:03<00:20,  4.99it/s][A
Training:  16%|█▌        | 19/117 [00:04<00:18,  5.19it/s][A
Training:  18%|█▊        | 21/117 [00:04<00:17,  5.48it/s][A
Training:  20%|█▉        | 23/117 [00:04<00:20,  4.67it/s][A
Training:  21%|██▏       | 25/117 [00:05<00:17,  5.36it/s][A
Training:  23%|██▎       | 27/117 [00:05<00:18,  4.94it/s][A
Training:  25%|██▍   

Epoch: 48/81 - Loss: 0.1422 - Accuracy: 0.9435



  0%|          | 0/15 [00:00<?, ?it/s][A
  7%|▋         | 1/15 [00:01<00:16,  1.18s/it][A
 33%|███▎      | 5/15 [00:01<00:03,  3.03it/s][A
 60%|██████    | 9/15 [00:02<00:01,  3.83it/s][A
100%|██████████| 15/15 [00:03<00:00,  4.16it/s][A
Epochs:  59%|█████▉    | 48/81 [21:22<14:53, 27.07s/it]

Val Loss: 0.1692 - Val Accuracy: 0.9365



Training:   0%|          | 0/117 [00:00<?, ?it/s][A
Training:   1%|          | 1/117 [00:00<01:53,  1.02it/s][A
Training:   3%|▎         | 4/117 [00:01<00:24,  4.67it/s][A
Training:   5%|▌         | 6/117 [00:01<00:28,  3.87it/s][A
Training:   7%|▋         | 8/117 [00:01<00:20,  5.27it/s][A
Training:   9%|▊         | 10/117 [00:02<00:24,  4.39it/s][A
Training:  11%|█         | 13/117 [00:03<00:26,  3.85it/s][A
Training:  13%|█▎        | 15/117 [00:03<00:20,  4.95it/s][A
Training:  15%|█▍        | 17/117 [00:04<00:24,  4.04it/s][A
Training:  18%|█▊        | 21/117 [00:04<00:20,  4.62it/s][A
Training:  21%|██▏       | 25/117 [00:05<00:18,  5.07it/s][A
Training:  25%|██▍       | 29/117 [00:06<00:17,  5.09it/s][A
Training:  26%|██▋       | 31/117 [00:06<00:14,  5.93it/s][A
Training:  28%|██▊       | 33/117 [00:07<00:16,  5.06it/s][A
Training:  32%|███▏      | 37/117 [00:07<00:16,  4.94it/s][A
Training:  33%|███▎      | 39/117 [00:08<00:13,  5.83it/s][A
Training:  35%|███▌ 

Epoch: 49/81 - Loss: 0.1411 - Accuracy: 0.9459



  0%|          | 0/15 [00:00<?, ?it/s][A
  7%|▋         | 1/15 [00:01<00:15,  1.08s/it][A
 20%|██        | 3/15 [00:01<00:04,  2.92it/s][A
 33%|███▎      | 5/15 [00:02<00:03,  2.77it/s][A
 47%|████▋     | 7/15 [00:02<00:01,  4.25it/s][A
 60%|██████    | 9/15 [00:02<00:01,  3.54it/s][A
100%|██████████| 15/15 [00:03<00:00,  4.09it/s][A
Epochs:  60%|██████    | 49/81 [21:49<14:25, 27.03s/it]

Val Loss: 0.1591 - Val Accuracy: 0.9326



Training:   0%|          | 0/117 [00:00<?, ?it/s][A
Training:   1%|          | 1/117 [00:01<02:11,  1.14s/it][A
Training:   3%|▎         | 4/117 [00:01<00:27,  4.10it/s][A
Training:   5%|▌         | 6/117 [00:01<00:33,  3.34it/s][A
Training:   8%|▊         | 9/117 [00:02<00:28,  3.82it/s][A
Training:  10%|█         | 12/117 [00:02<00:17,  5.85it/s][A
Training:  12%|█▏        | 14/117 [00:03<00:21,  4.79it/s][A
Training:  14%|█▎        | 16/117 [00:03<00:16,  6.11it/s][A
Training:  15%|█▌        | 18/117 [00:04<00:21,  4.54it/s][A
Training:  17%|█▋        | 20/117 [00:04<00:16,  5.77it/s][A
Training:  19%|█▉        | 22/117 [00:04<00:21,  4.52it/s][A
Training:  21%|██▏       | 25/117 [00:05<00:21,  4.38it/s][A
Training:  23%|██▎       | 27/117 [00:05<00:16,  5.50it/s][A
Training:  25%|██▍       | 29/117 [00:06<00:18,  4.72it/s][A
Training:  26%|██▌       | 30/117 [00:06<00:17,  4.87it/s][A
Training:  28%|██▊       | 33/117 [00:07<00:15,  5.37it/s][A
Training:  29%|██▉  

Epoch: 50/81 - Loss: 0.1491 - Accuracy: 0.9395



  0%|          | 0/15 [00:00<?, ?it/s][A
  7%|▋         | 1/15 [00:01<00:15,  1.13s/it][A
 13%|█▎        | 2/15 [00:01<00:07,  1.84it/s][A
 27%|██▋       | 4/15 [00:01<00:02,  4.17it/s][A
 40%|████      | 6/15 [00:02<00:02,  3.55it/s][A
 53%|█████▎    | 8/15 [00:02<00:01,  5.18it/s][A
 67%|██████▋   | 10/15 [00:02<00:01,  4.12it/s][A
 73%|███████▎  | 11/15 [00:02<00:00,  4.68it/s][A
100%|██████████| 15/15 [00:03<00:00,  4.14it/s][A
Epochs:  62%|██████▏   | 50/81 [22:16<13:58, 27.06s/it]

Val Loss: 0.1389 - Val Accuracy: 0.9441



Training:   0%|          | 0/117 [00:00<?, ?it/s][A
Training:   1%|          | 1/117 [00:01<02:28,  1.28s/it][A
Training:   3%|▎         | 4/117 [00:01<00:30,  3.68it/s][A
Training:   5%|▌         | 6/117 [00:02<00:37,  2.94it/s][A
Training:   8%|▊         | 9/117 [00:02<00:30,  3.57it/s][A
Training:   9%|▊         | 10/117 [00:03<00:27,  3.88it/s][A
Training:  11%|█         | 13/117 [00:03<00:23,  4.50it/s][A
Training:  12%|█▏        | 14/117 [00:03<00:21,  4.80it/s][A
Training:  15%|█▍        | 17/117 [00:04<00:22,  4.52it/s][A
Training:  17%|█▋        | 20/117 [00:04<00:14,  6.57it/s][A
Training:  19%|█▉        | 22/117 [00:05<00:19,  4.80it/s][A
Training:  21%|██▏       | 25/117 [00:05<00:20,  4.59it/s][A
Training:  22%|██▏       | 26/117 [00:06<00:18,  4.86it/s][A
Training:  24%|██▍       | 28/117 [00:06<00:14,  6.15it/s][A
Training:  26%|██▌       | 30/117 [00:06<00:19,  4.47it/s][A
Training:  28%|██▊       | 33/117 [00:07<00:17,  4.88it/s][A
Training:  29%|██▉  

Epoch: 51/81 - Loss: 0.1462 - Accuracy: 0.9430



  0%|          | 0/15 [00:00<?, ?it/s][A
  7%|▋         | 1/15 [00:01<00:14,  1.06s/it][A
 13%|█▎        | 2/15 [00:01<00:06,  1.87it/s][A
 27%|██▋       | 4/15 [00:01<00:02,  4.24it/s][A
 40%|████      | 6/15 [00:01<00:02,  3.83it/s][A
 53%|█████▎    | 8/15 [00:02<00:01,  5.56it/s][A
 67%|██████▋   | 10/15 [00:02<00:01,  4.21it/s][A
 80%|████████  | 12/15 [00:02<00:00,  5.46it/s][A
 87%|████████▋ | 13/15 [00:03<00:00,  4.15it/s][A
100%|██████████| 15/15 [00:03<00:00,  4.19it/s][A
Epochs:  63%|██████▎   | 51/81 [22:43<13:30, 27.00s/it]

Val Loss: 0.1577 - Val Accuracy: 0.9375



Training:   0%|          | 0/117 [00:00<?, ?it/s][A
Training:   1%|          | 1/117 [00:01<02:08,  1.10s/it][A
Training:   3%|▎         | 3/117 [00:01<00:38,  3.00it/s][A
Training:   4%|▍         | 5/117 [00:01<00:34,  3.28it/s][A
Training:   7%|▋         | 8/117 [00:01<00:18,  5.88it/s][A
Training:   9%|▊         | 10/117 [00:02<00:23,  4.56it/s][A
Training:  10%|█         | 12/117 [00:02<00:18,  5.83it/s][A
Training:  12%|█▏        | 14/117 [00:03<00:23,  4.34it/s][A
Training:  14%|█▎        | 16/117 [00:03<00:17,  5.73it/s][A
Training:  15%|█▌        | 18/117 [00:04<00:22,  4.36it/s][A
Training:  18%|█▊        | 21/117 [00:04<00:22,  4.34it/s][A
Training:  21%|██        | 24/117 [00:05<00:15,  6.16it/s][A
Training:  22%|██▏       | 26/117 [00:05<00:18,  5.01it/s][A
Training:  25%|██▍       | 29/117 [00:06<00:19,  4.52it/s][A
Training:  26%|██▋       | 31/117 [00:06<00:15,  5.46it/s][A
Training:  28%|██▊       | 33/117 [00:07<00:18,  4.55it/s][A
Training:  32%|███▏ 

Epoch: 52/81 - Loss: 0.1421 - Accuracy: 0.9455



  0%|          | 0/15 [00:00<?, ?it/s][A
  7%|▋         | 1/15 [00:01<00:14,  1.05s/it][A
 20%|██        | 3/15 [00:01<00:03,  3.22it/s][A
 33%|███▎      | 5/15 [00:01<00:03,  3.11it/s][A
 60%|██████    | 9/15 [00:02<00:01,  3.91it/s][A
 80%|████████  | 12/15 [00:02<00:00,  5.88it/s][A
100%|██████████| 15/15 [00:03<00:00,  4.27it/s][A
Epochs:  64%|██████▍   | 52/81 [23:09<12:59, 26.87s/it]

Val Loss: 0.1519 - Val Accuracy: 0.9398



Training:   0%|          | 0/117 [00:00<?, ?it/s][A
Training:   1%|          | 1/117 [00:01<02:08,  1.11s/it][A
Training:   3%|▎         | 4/117 [00:01<00:27,  4.11it/s][A
Training:   5%|▌         | 6/117 [00:01<00:32,  3.43it/s][A
Training:   8%|▊         | 9/117 [00:02<00:28,  3.75it/s][A
Training:   9%|▉         | 11/117 [00:02<00:21,  4.89it/s][A
Training:  11%|█         | 13/117 [00:03<00:25,  4.02it/s][A
Training:  14%|█▎        | 16/117 [00:03<00:17,  5.88it/s][A
Training:  15%|█▌        | 18/117 [00:04<00:23,  4.29it/s][A
Training:  17%|█▋        | 20/117 [00:04<00:17,  5.48it/s][A
Training:  19%|█▉        | 22/117 [00:05<00:21,  4.46it/s][A
Training:  21%|██        | 24/117 [00:05<00:16,  5.67it/s][A
Training:  22%|██▏       | 26/117 [00:06<00:21,  4.17it/s][A
Training:  24%|██▍       | 28/117 [00:06<00:16,  5.33it/s][A
Training:  26%|██▌       | 30/117 [00:06<00:20,  4.34it/s][A
Training:  27%|██▋       | 32/117 [00:07<00:15,  5.63it/s][A
Training:  29%|██▉  

Epoch: 53/81 - Loss: 0.1392 - Accuracy: 0.9451



  0%|          | 0/15 [00:00<?, ?it/s][A
  7%|▋         | 1/15 [00:00<00:13,  1.01it/s][A
 13%|█▎        | 2/15 [00:01<00:06,  2.05it/s][A
 33%|███▎      | 5/15 [00:01<00:03,  3.31it/s][A
 40%|████      | 6/15 [00:02<00:02,  3.65it/s][A
 60%|██████    | 9/15 [00:02<00:01,  4.74it/s][A
 67%|██████▋   | 10/15 [00:02<00:01,  4.14it/s][A
 87%|████████▋ | 13/15 [00:03<00:00,  4.90it/s][A
100%|██████████| 15/15 [00:03<00:00,  4.15it/s][A
Epochs:  65%|██████▌   | 53/81 [23:36<12:32, 26.87s/it]

Val Loss: 0.1462 - Val Accuracy: 0.9353



Training:   0%|          | 0/117 [00:00<?, ?it/s][A
Training:   1%|          | 1/117 [00:01<02:15,  1.17s/it][A
Training:   4%|▍         | 5/117 [00:01<00:36,  3.09it/s][A
Training:   6%|▌         | 7/117 [00:01<00:24,  4.54it/s][A
Training:   8%|▊         | 9/117 [00:02<00:29,  3.65it/s][A
Training:   9%|▉         | 11/117 [00:02<00:21,  4.95it/s][A
Training:  11%|█         | 13/117 [00:03<00:26,  3.90it/s][A
Training:  14%|█▎        | 16/117 [00:03<00:17,  5.93it/s][A
Training:  15%|█▌        | 18/117 [00:04<00:21,  4.71it/s][A
Training:  17%|█▋        | 20/117 [00:04<00:16,  5.97it/s][A
Training:  19%|█▉        | 22/117 [00:05<00:19,  4.75it/s][A
Training:  21%|██▏       | 25/117 [00:05<00:22,  4.15it/s][A
Training:  24%|██▍       | 28/117 [00:06<00:15,  5.82it/s][A
Training:  26%|██▌       | 30/117 [00:06<00:20,  4.31it/s][A
Training:  28%|██▊       | 33/117 [00:07<00:20,  4.05it/s][A
Training:  31%|███       | 36/117 [00:07<00:14,  5.59it/s][A
Training:  32%|███▏ 

Epoch: 54/81 - Loss: 0.1437 - Accuracy: 0.9434



  0%|          | 0/15 [00:00<?, ?it/s][A
  7%|▋         | 1/15 [00:01<00:14,  1.06s/it][A
 33%|███▎      | 5/15 [00:01<00:03,  3.09it/s][A
 40%|████      | 6/15 [00:02<00:02,  3.54it/s][A
 60%|██████    | 9/15 [00:02<00:01,  3.81it/s][A
 67%|██████▋   | 10/15 [00:02<00:01,  4.21it/s][A
100%|██████████| 15/15 [00:03<00:00,  4.13it/s][A
Epochs:  67%|██████▋   | 54/81 [24:03<12:06, 26.92s/it]

Val Loss: 0.1591 - Val Accuracy: 0.9368



Training:   0%|          | 0/117 [00:00<?, ?it/s][A
Training:   1%|          | 1/117 [00:01<02:05,  1.08s/it][A
Training:   2%|▏         | 2/117 [00:01<01:00,  1.90it/s][A
Training:   4%|▍         | 5/117 [00:01<00:36,  3.04it/s][A
Training:   6%|▌         | 7/117 [00:02<00:24,  4.55it/s][A
Training:   8%|▊         | 9/117 [00:02<00:30,  3.53it/s][A
Training:  10%|█         | 12/117 [00:03<00:19,  5.50it/s][A
Training:  12%|█▏        | 14/117 [00:03<00:23,  4.48it/s][A
Training:  14%|█▎        | 16/117 [00:03<00:17,  5.81it/s][A
Training:  15%|█▌        | 18/117 [00:04<00:22,  4.37it/s][A
Training:  18%|█▊        | 21/117 [00:05<00:23,  4.11it/s][A
Training:  21%|██        | 24/117 [00:05<00:16,  5.76it/s][A
Training:  22%|██▏       | 26/117 [00:06<00:19,  4.62it/s][A
Training:  24%|██▍       | 28/117 [00:06<00:15,  5.65it/s][A
Training:  26%|██▌       | 30/117 [00:06<00:19,  4.44it/s][A
Training:  27%|██▋       | 32/117 [00:07<00:16,  5.05it/s][A
Training:  28%|██▊   

Epoch: 55/81 - Loss: 0.1428 - Accuracy: 0.9448



  0%|          | 0/15 [00:00<?, ?it/s][A
  7%|▋         | 1/15 [00:01<00:17,  1.26s/it][A
 33%|███▎      | 5/15 [00:02<00:03,  2.61it/s][A
 53%|█████▎    | 8/15 [00:02<00:01,  4.56it/s][A
 67%|██████▋   | 10/15 [00:02<00:01,  3.93it/s][A
100%|██████████| 15/15 [00:03<00:00,  4.05it/s][A
Epochs:  68%|██████▊   | 55/81 [24:31<11:41, 27.00s/it]

Val Loss: 0.1514 - Val Accuracy: 0.9343



Training:   0%|          | 0/117 [00:00<?, ?it/s][A
Training:   1%|          | 1/117 [00:01<02:26,  1.27s/it][A
Training:   3%|▎         | 4/117 [00:01<00:30,  3.65it/s][A
Training:   5%|▌         | 6/117 [00:02<00:35,  3.14it/s][A
Training:   7%|▋         | 8/117 [00:02<00:23,  4.61it/s][A
Training:   9%|▊         | 10/117 [00:02<00:28,  3.70it/s][A
Training:  11%|█         | 13/117 [00:03<00:22,  4.64it/s][A
Training:  12%|█▏        | 14/117 [00:03<00:21,  4.69it/s][A
Training:  15%|█▍        | 17/117 [00:04<00:19,  5.01it/s][A
Training:  15%|█▌        | 18/117 [00:04<00:19,  5.11it/s][A
Training:  17%|█▋        | 20/117 [00:04<00:14,  6.56it/s][A
Training:  18%|█▊        | 21/117 [00:05<00:23,  4.08it/s][A
Training:  20%|█▉        | 23/117 [00:05<00:17,  5.45it/s][A
Training:  21%|██▏       | 25/117 [00:05<00:21,  4.24it/s][A
Training:  24%|██▍       | 28/117 [00:06<00:14,  6.33it/s][A
Training:  26%|██▌       | 30/117 [00:06<00:18,  4.76it/s][A
Training:  28%|██▊  

Epoch: 56/81 - Loss: 0.1373 - Accuracy: 0.9472



  0%|          | 0/15 [00:00<?, ?it/s][A
  7%|▋         | 1/15 [00:01<00:14,  1.05s/it][A
 20%|██        | 3/15 [00:01<00:03,  3.20it/s][A
 33%|███▎      | 5/15 [00:02<00:03,  2.70it/s][A
 60%|██████    | 9/15 [00:02<00:01,  3.60it/s][A
100%|██████████| 15/15 [00:03<00:00,  4.17it/s][A
Epochs:  69%|██████▉   | 56/81 [24:57<11:12, 26.90s/it]

Val Loss: 0.1663 - Val Accuracy: 0.9337



Training:   0%|          | 0/117 [00:00<?, ?it/s][A
Training:   1%|          | 1/117 [00:01<02:14,  1.16s/it][A
Training:   2%|▏         | 2/117 [00:01<01:05,  1.75it/s][A
Training:   3%|▎         | 4/117 [00:01<00:27,  4.05it/s][A
Training:   5%|▌         | 6/117 [00:02<00:32,  3.41it/s][A
Training:   8%|▊         | 9/117 [00:02<00:27,  3.94it/s][A
Training:   9%|▊         | 10/117 [00:02<00:25,  4.19it/s][A
Training:  10%|█         | 12/117 [00:03<00:18,  5.70it/s][A
Training:  11%|█         | 13/117 [00:03<00:24,  4.23it/s][A
Training:  12%|█▏        | 14/117 [00:03<00:21,  4.76it/s][A
Training:  15%|█▍        | 17/117 [00:04<00:19,  5.10it/s][A
Training:  15%|█▌        | 18/117 [00:04<00:19,  5.04it/s][A
Training:  17%|█▋        | 20/117 [00:04<00:14,  6.68it/s][A
Training:  18%|█▊        | 21/117 [00:05<00:21,  4.41it/s][A
Training:  19%|█▉        | 22/117 [00:05<00:19,  4.84it/s][A
Training:  21%|██▏       | 25/117 [00:05<00:19,  4.80it/s][A
Training:  22%|██▏   

Epoch: 57/81 - Loss: 0.1441 - Accuracy: 0.9412



  0%|          | 0/15 [00:00<?, ?it/s][A
  7%|▋         | 1/15 [00:01<00:16,  1.17s/it][A
 20%|██        | 3/15 [00:01<00:04,  2.88it/s][A
 33%|███▎      | 5/15 [00:02<00:03,  2.85it/s][A
 40%|████      | 6/15 [00:02<00:02,  3.12it/s][A
 60%|██████    | 9/15 [00:02<00:01,  3.89it/s][A
 67%|██████▋   | 10/15 [00:02<00:01,  4.41it/s][A
 87%|████████▋ | 13/15 [00:03<00:00,  4.65it/s][A
100%|██████████| 15/15 [00:03<00:00,  3.97it/s][A
Epochs:  70%|███████   | 57/81 [25:24<10:45, 26.88s/it]

Val Loss: 0.1888 - Val Accuracy: 0.9343



Training:   0%|          | 0/117 [00:00<?, ?it/s][A
Training:   1%|          | 1/117 [00:01<02:11,  1.14s/it][A
Training:   2%|▏         | 2/117 [00:01<01:10,  1.62it/s][A
Training:   4%|▍         | 5/117 [00:02<00:36,  3.08it/s][A
Training:   5%|▌         | 6/117 [00:02<00:31,  3.47it/s][A
Training:   7%|▋         | 8/117 [00:02<00:21,  5.18it/s][A
Training:   8%|▊         | 9/117 [00:02<00:28,  3.77it/s][A
Training:   9%|▉         | 11/117 [00:02<00:20,  5.30it/s][A
Training:  11%|█         | 13/117 [00:03<00:23,  4.39it/s][A
Training:  12%|█▏        | 14/117 [00:03<00:22,  4.58it/s][A
Training:  14%|█▎        | 16/117 [00:03<00:15,  6.38it/s][A
Training:  15%|█▌        | 18/117 [00:04<00:21,  4.68it/s][A
Training:  18%|█▊        | 21/117 [00:05<00:21,  4.43it/s][A
Training:  21%|██        | 24/117 [00:05<00:14,  6.47it/s][A
Training:  22%|██▏       | 26/117 [00:06<00:19,  4.70it/s][A
Training:  25%|██▍       | 29/117 [00:06<00:20,  4.32it/s][A
Training:  26%|██▋    

Epoch: 58/81 - Loss: 0.1466 - Accuracy: 0.9436



  0%|          | 0/15 [00:00<?, ?it/s][A
  7%|▋         | 1/15 [00:01<00:15,  1.13s/it][A
 20%|██        | 3/15 [00:01<00:04,  2.81it/s][A
 33%|███▎      | 5/15 [00:01<00:03,  3.11it/s][A
 40%|████      | 6/15 [00:02<00:02,  3.50it/s][A
 53%|█████▎    | 8/15 [00:02<00:01,  5.29it/s][A
 60%|██████    | 9/15 [00:02<00:01,  3.90it/s][A
 67%|██████▋   | 10/15 [00:02<00:01,  4.27it/s][A
 87%|████████▋ | 13/15 [00:03<00:00,  4.80it/s][A
100%|██████████| 15/15 [00:03<00:00,  4.07it/s][A
Epochs:  72%|███████▏  | 58/81 [25:51<10:19, 26.94s/it]

Val Loss: 0.1667 - Val Accuracy: 0.9338



Training:   0%|          | 0/117 [00:00<?, ?it/s][A
Training:   1%|          | 1/117 [00:01<02:25,  1.25s/it][A
Training:   3%|▎         | 3/117 [00:01<00:43,  2.62it/s][A
Training:   4%|▍         | 5/117 [00:02<00:38,  2.90it/s][A
Training:   5%|▌         | 6/117 [00:02<00:34,  3.20it/s][A
Training:   8%|▊         | 9/117 [00:02<00:25,  4.25it/s][A
Training:   9%|▊         | 10/117 [00:02<00:23,  4.57it/s][A
Training:  11%|█         | 13/117 [00:03<00:22,  4.72it/s][A
Training:  12%|█▏        | 14/117 [00:03<00:20,  4.91it/s][A
Training:  14%|█▎        | 16/117 [00:03<00:15,  6.49it/s][A
Training:  15%|█▍        | 17/117 [00:04<00:20,  4.93it/s][A
Training:  15%|█▌        | 18/117 [00:04<00:23,  4.18it/s][A
Training:  18%|█▊        | 21/117 [00:05<00:19,  5.04it/s][A
Training:  19%|█▉        | 22/117 [00:05<00:20,  4.55it/s][A
Training:  21%|██        | 24/117 [00:05<00:14,  6.21it/s][A
Training:  21%|██▏       | 25/117 [00:05<00:20,  4.60it/s][A
Training:  22%|██▏   

Epoch: 59/81 - Loss: 0.1442 - Accuracy: 0.9435



  0%|          | 0/15 [00:00<?, ?it/s][A
  7%|▋         | 1/15 [00:01<00:17,  1.22s/it][A
 13%|█▎        | 2/15 [00:01<00:07,  1.70it/s][A
 33%|███▎      | 5/15 [00:02<00:03,  3.13it/s][A
 53%|█████▎    | 8/15 [00:02<00:01,  5.56it/s][A
 67%|██████▋   | 10/15 [00:02<00:01,  3.91it/s][A
100%|██████████| 15/15 [00:03<00:00,  3.99it/s][A
Epochs:  73%|███████▎  | 59/81 [26:18<09:52, 26.91s/it]

Val Loss: 0.1532 - Val Accuracy: 0.9388



Training:   0%|          | 0/117 [00:00<?, ?it/s][A
Training:   1%|          | 1/117 [00:01<02:20,  1.21s/it][A
Training:   3%|▎         | 3/117 [00:01<00:40,  2.82it/s][A
Training:   4%|▍         | 5/117 [00:01<00:37,  3.01it/s][A
Training:   6%|▌         | 7/117 [00:02<00:24,  4.46it/s][A
Training:   8%|▊         | 9/117 [00:02<00:29,  3.65it/s][A
Training:   9%|▉         | 11/117 [00:02<00:20,  5.10it/s][A
Training:  11%|█         | 13/117 [00:03<00:23,  4.52it/s][A
Training:  14%|█▎        | 16/117 [00:03<00:16,  6.29it/s][A
Training:  15%|█▌        | 18/117 [00:04<00:18,  5.34it/s][A
Training:  17%|█▋        | 20/117 [00:04<00:14,  6.58it/s][A
Training:  19%|█▉        | 22/117 [00:04<00:19,  4.91it/s][A
Training:  21%|██▏       | 25/117 [00:05<00:22,  4.11it/s][A
Training:  23%|██▎       | 27/117 [00:06<00:17,  5.22it/s][A
Training:  25%|██▍       | 29/117 [00:06<00:20,  4.25it/s][A
Training:  28%|██▊       | 33/117 [00:07<00:17,  4.82it/s][A
Training:  32%|███▏  

Epoch: 60/81 - Loss: 0.1464 - Accuracy: 0.9423



  0%|          | 0/15 [00:00<?, ?it/s][A
  7%|▋         | 1/15 [00:01<00:14,  1.05s/it][A
 27%|██▋       | 4/15 [00:01<00:02,  4.24it/s][A
 40%|████      | 6/15 [00:01<00:02,  3.72it/s][A
 47%|████▋     | 7/15 [00:01<00:01,  4.37it/s][A
 53%|█████▎    | 8/15 [00:02<00:01,  4.73it/s][A
 60%|██████    | 9/15 [00:02<00:01,  3.36it/s][A
 73%|███████▎  | 11/15 [00:02<00:00,  4.95it/s][A
 80%|████████  | 12/15 [00:03<00:00,  4.70it/s][A
100%|██████████| 15/15 [00:03<00:00,  4.24it/s][A
Epochs:  74%|███████▍  | 60/81 [26:44<09:22, 26.79s/it]

Val Loss: 0.1474 - Val Accuracy: 0.9380



Training:   0%|          | 0/117 [00:00<?, ?it/s][A
Training:   1%|          | 1/117 [00:01<01:59,  1.03s/it][A
Training:   3%|▎         | 3/117 [00:01<00:35,  3.23it/s][A
Training:   4%|▍         | 5/117 [00:01<00:33,  3.31it/s][A
Training:   5%|▌         | 6/117 [00:01<00:29,  3.78it/s][A
Training:   7%|▋         | 8/117 [00:02<00:19,  5.72it/s][A
Training:   9%|▊         | 10/117 [00:02<00:26,  4.10it/s][A
Training:  11%|█         | 13/117 [00:03<00:23,  4.44it/s][A
Training:  12%|█▏        | 14/117 [00:03<00:23,  4.46it/s][A
Training:  15%|█▍        | 17/117 [00:04<00:20,  4.83it/s][A
Training:  15%|█▌        | 18/117 [00:04<00:20,  4.80it/s][A
Training:  18%|█▊        | 21/117 [00:04<00:18,  5.23it/s][A
Training:  19%|█▉        | 22/117 [00:05<00:19,  4.98it/s][A
Training:  21%|██▏       | 25/117 [00:05<00:16,  5.69it/s][A
Training:  22%|██▏       | 26/117 [00:05<00:19,  4.71it/s][A
Training:  25%|██▍       | 29/117 [00:06<00:14,  5.89it/s][A
Training:  26%|██▌   

Epoch: 61/81 - Loss: 0.1352 - Accuracy: 0.9461



  0%|          | 0/15 [00:00<?, ?it/s][A
  7%|▋         | 1/15 [00:00<00:12,  1.16it/s][A
 27%|██▋       | 4/15 [00:01<00:02,  4.97it/s][A
 40%|████      | 6/15 [00:01<00:02,  3.96it/s][A
 60%|██████    | 9/15 [00:02<00:01,  4.24it/s][A
 80%|████████  | 12/15 [00:02<00:00,  6.52it/s][A
100%|██████████| 15/15 [00:03<00:00,  4.59it/s][A
Epochs:  75%|███████▌  | 61/81 [27:11<08:54, 26.70s/it]

Val Loss: 0.1458 - Val Accuracy: 0.9403



Training:   0%|          | 0/117 [00:00<?, ?it/s][A
Training:   1%|          | 1/117 [00:01<02:07,  1.10s/it][A
Training:   3%|▎         | 3/117 [00:01<00:36,  3.09it/s][A
Training:   4%|▍         | 5/117 [00:01<00:36,  3.08it/s][A
Training:   7%|▋         | 8/117 [00:01<00:18,  5.76it/s][A
Training:   9%|▊         | 10/117 [00:02<00:24,  4.30it/s][A
Training:  10%|█         | 12/117 [00:02<00:18,  5.72it/s][A
Training:  12%|█▏        | 14/117 [00:03<00:22,  4.53it/s][A
Training:  14%|█▎        | 16/117 [00:03<00:20,  5.05it/s][A
Training:  15%|█▍        | 17/117 [00:04<00:26,  3.83it/s][A
Training:  16%|█▌        | 19/117 [00:04<00:18,  5.21it/s][A
Training:  18%|█▊        | 21/117 [00:05<00:23,  4.09it/s][A
Training:  20%|█▉        | 23/117 [00:05<00:17,  5.32it/s][A
Training:  21%|██▏       | 25/117 [00:05<00:20,  4.41it/s][A
Training:  23%|██▎       | 27/117 [00:06<00:16,  5.41it/s][A
Training:  25%|██▍       | 29/117 [00:06<00:17,  5.01it/s][A
Training:  26%|██▌  

Epoch: 62/81 - Loss: 0.1383 - Accuracy: 0.9438



  0%|          | 0/15 [00:00<?, ?it/s][A
  7%|▋         | 1/15 [00:00<00:13,  1.04it/s][A
 20%|██        | 3/15 [00:01<00:03,  3.19it/s][A
 33%|███▎      | 5/15 [00:01<00:02,  3.45it/s][A
 40%|████      | 6/15 [00:01<00:02,  3.95it/s][A
 47%|████▋     | 7/15 [00:01<00:01,  4.73it/s][A
 60%|██████    | 9/15 [00:02<00:01,  4.01it/s][A
 67%|██████▋   | 10/15 [00:02<00:01,  4.24it/s][A
100%|██████████| 15/15 [00:03<00:00,  4.38it/s][A
Epochs:  77%|███████▋  | 62/81 [27:38<08:26, 26.67s/it]

Val Loss: 0.1774 - Val Accuracy: 0.9331



Training:   0%|          | 0/117 [00:00<?, ?it/s][A
Training:   1%|          | 1/117 [00:01<02:01,  1.05s/it][A
Training:   3%|▎         | 4/117 [00:01<00:26,  4.33it/s][A
Training:   5%|▌         | 6/117 [00:01<00:28,  3.91it/s][A
Training:   6%|▌         | 7/117 [00:01<00:25,  4.39it/s][A
Training:   8%|▊         | 9/117 [00:02<00:24,  4.39it/s][A
Training:   9%|▉         | 11/117 [00:02<00:21,  5.02it/s][A
Training:  11%|█         | 13/117 [00:03<00:22,  4.67it/s][A
Training:  12%|█▏        | 14/117 [00:03<00:21,  4.79it/s][A
Training:  13%|█▎        | 15/117 [00:03<00:23,  4.40it/s][A
Training:  14%|█▎        | 16/117 [00:03<00:20,  4.99it/s][A
Training:  15%|█▍        | 17/117 [00:04<00:24,  4.00it/s][A
Training:  16%|█▌        | 19/117 [00:04<00:21,  4.57it/s][A
Training:  18%|█▊        | 21/117 [00:04<00:20,  4.63it/s][A
Training:  20%|█▉        | 23/117 [00:05<00:21,  4.38it/s][A
Training:  21%|██▏       | 25/117 [00:05<00:18,  4.94it/s][A
Training:  23%|██▎   

Epoch: 63/81 - Loss: 0.1514 - Accuracy: 0.9392



  0%|          | 0/15 [00:00<?, ?it/s][A
  7%|▋         | 1/15 [00:01<00:16,  1.17s/it][A
 20%|██        | 3/15 [00:01<00:04,  2.68it/s][A
 33%|███▎      | 5/15 [00:02<00:03,  2.65it/s][A
 53%|█████▎    | 8/15 [00:02<00:01,  4.98it/s][A
 67%|██████▋   | 10/15 [00:02<00:01,  4.46it/s][A
100%|██████████| 15/15 [00:03<00:00,  4.10it/s][A
Epochs:  78%|███████▊  | 63/81 [28:05<08:03, 26.84s/it]

Val Loss: 0.1595 - Val Accuracy: 0.9403



Training:   0%|          | 0/117 [00:00<?, ?it/s][A
Training:   1%|          | 1/117 [00:01<02:12,  1.15s/it][A
Training:   3%|▎         | 3/117 [00:01<00:39,  2.91it/s][A
Training:   4%|▍         | 5/117 [00:01<00:35,  3.17it/s][A
Training:   6%|▌         | 7/117 [00:01<00:22,  4.79it/s][A
Training:   8%|▊         | 9/117 [00:02<00:23,  4.57it/s][A
Training:   9%|▉         | 11/117 [00:02<00:17,  6.22it/s][A
Training:  11%|█         | 13/117 [00:03<00:22,  4.59it/s][A
Training:  13%|█▎        | 15/117 [00:03<00:17,  5.74it/s][A
Training:  15%|█▍        | 17/117 [00:03<00:21,  4.65it/s][A
Training:  16%|█▌        | 19/117 [00:04<00:16,  6.05it/s][A
Training:  18%|█▊        | 21/117 [00:04<00:21,  4.39it/s][A
Training:  20%|█▉        | 23/117 [00:04<00:16,  5.60it/s][A
Training:  21%|██▏       | 25/117 [00:05<00:18,  4.88it/s][A
Training:  24%|██▍       | 28/117 [00:05<00:14,  6.05it/s][A
Training:  25%|██▍       | 29/117 [00:06<00:17,  5.04it/s][A
Training:  26%|██▋   

Epoch: 64/81 - Loss: 0.1403 - Accuracy: 0.9449



  0%|          | 0/15 [00:00<?, ?it/s][A
  7%|▋         | 1/15 [00:01<00:14,  1.04s/it][A
 13%|█▎        | 2/15 [00:01<00:07,  1.85it/s][A
 27%|██▋       | 4/15 [00:01<00:02,  4.04it/s][A
 33%|███▎      | 5/15 [00:01<00:03,  3.15it/s][A
 40%|████      | 6/15 [00:02<00:02,  3.75it/s][A
 53%|█████▎    | 8/15 [00:02<00:01,  5.84it/s][A
 60%|██████    | 9/15 [00:02<00:01,  4.21it/s][A
 67%|██████▋   | 10/15 [00:02<00:01,  4.27it/s][A
 80%|████████  | 12/15 [00:02<00:00,  6.34it/s][A
 87%|████████▋ | 13/15 [00:03<00:00,  5.20it/s][A
100%|██████████| 15/15 [00:03<00:00,  4.26it/s][A
Epochs:  79%|███████▉  | 64/81 [28:31<07:35, 26.80s/it]

Val Loss: 0.1516 - Val Accuracy: 0.9403



Training:   0%|          | 0/117 [00:00<?, ?it/s][A
Training:   1%|          | 1/117 [00:01<01:58,  1.02s/it][A
Training:   3%|▎         | 4/117 [00:01<00:25,  4.36it/s][A
Training:   5%|▌         | 6/117 [00:02<00:37,  2.96it/s][A
Training:   8%|▊         | 9/117 [00:02<00:27,  3.86it/s][A
Training:   9%|▊         | 10/117 [00:03<00:29,  3.59it/s][A
Training:  10%|█         | 12/117 [00:03<00:21,  4.85it/s][A
Training:  11%|█         | 13/117 [00:03<00:26,  3.92it/s][A
Training:  12%|█▏        | 14/117 [00:03<00:28,  3.68it/s][A
Training:  15%|█▍        | 17/117 [00:04<00:20,  4.90it/s][A
Training:  15%|█▌        | 18/117 [00:04<00:23,  4.18it/s][A
Training:  18%|█▊        | 21/117 [00:05<00:18,  5.07it/s][A
Training:  19%|█▉        | 22/117 [00:05<00:21,  4.50it/s][A
Training:  21%|██        | 24/117 [00:05<00:15,  5.94it/s][A
Training:  21%|██▏       | 25/117 [00:05<00:15,  6.00it/s][A
Training:  22%|██▏       | 26/117 [00:06<00:19,  4.56it/s][A
Training:  23%|██▎  

Epoch: 65/81 - Loss: 0.1432 - Accuracy: 0.9428



  0%|          | 0/15 [00:00<?, ?it/s][A
  7%|▋         | 1/15 [00:01<00:17,  1.24s/it][A
 33%|███▎      | 5/15 [00:02<00:03,  2.82it/s][A
 60%|██████    | 9/15 [00:02<00:01,  3.49it/s][A
 80%|████████  | 12/15 [00:03<00:00,  5.13it/s][A
100%|██████████| 15/15 [00:03<00:00,  3.94it/s][A
Epochs:  80%|████████  | 65/81 [29:00<07:15, 27.23s/it]

Val Loss: 0.1582 - Val Accuracy: 0.9335



Training:   0%|          | 0/117 [00:00<?, ?it/s][A
Training:   1%|          | 1/117 [00:00<01:50,  1.05it/s][A
Training:   4%|▍         | 5/117 [00:01<00:31,  3.58it/s][A
Training:   8%|▊         | 9/117 [00:02<00:23,  4.51it/s][A
Training:  10%|█         | 12/117 [00:02<00:16,  6.36it/s][A
Training:  12%|█▏        | 14/117 [00:03<00:20,  4.91it/s][A
Training:  13%|█▎        | 15/117 [00:03<00:19,  5.19it/s][A
Training:  15%|█▍        | 17/117 [00:03<00:20,  4.90it/s][A
Training:  15%|█▌        | 18/117 [00:03<00:21,  4.62it/s][A
Training:  16%|█▌        | 19/117 [00:04<00:19,  5.08it/s][A
Training:  18%|█▊        | 21/117 [00:04<00:19,  4.98it/s][A
Training:  19%|█▉        | 22/117 [00:04<00:22,  4.16it/s][A
Training:  21%|██▏       | 25/117 [00:05<00:17,  5.32it/s][A
Training:  22%|██▏       | 26/117 [00:05<00:19,  4.74it/s][A
Training:  25%|██▍       | 29/117 [00:05<00:14,  6.03it/s][A
Training:  26%|██▌       | 30/117 [00:06<00:17,  4.97it/s][A
Training:  27%|██▋ 

Epoch: 66/81 - Loss: 0.1472 - Accuracy: 0.9434



  0%|          | 0/15 [00:00<?, ?it/s][A
  7%|▋         | 1/15 [00:01<00:19,  1.38s/it][A
 33%|███▎      | 5/15 [00:02<00:03,  2.57it/s][A
 53%|█████▎    | 8/15 [00:02<00:01,  4.52it/s][A
 67%|██████▋   | 10/15 [00:03<00:01,  3.87it/s][A
100%|██████████| 15/15 [00:03<00:00,  3.89it/s][A
Epochs:  80%|████████  | 65/81 [29:27<07:14, 27.19s/it]
[32m[I 2023-12-15 00:52:04,045][0m Trial 7 pruned. [0m


Val Loss: 0.1526 - Val Accuracy: 0.9380
Learning rate: 8.19622214040848e-05
Weight decay: 0.0006651175912530341
Epsilon: 2.0431682685958338e-08
Batch size: 99
Number of epochs: 97


Epochs:   0%|          | 0/97 [00:00<?, ?it/s]
Training:   0%|          | 0/142 [00:00<?, ?it/s][A
Training:   1%|          | 1/142 [00:01<02:27,  1.05s/it][A
Training:   2%|▏         | 3/142 [00:01<00:46,  3.01it/s][A
Training:   4%|▎         | 5/142 [00:01<00:36,  3.80it/s][A
Training:   4%|▍         | 6/142 [00:01<00:30,  4.50it/s][A
Training:   6%|▋         | 9/142 [00:02<00:24,  5.46it/s][A
Training:   7%|▋         | 10/142 [00:02<00:22,  5.99it/s][A
Training:   9%|▉         | 13/142 [00:02<00:20,  6.42it/s][A
Training:  10%|▉         | 14/142 [00:03<00:23,  5.37it/s][A
Training:  11%|█▏        | 16/142 [00:03<00:18,  6.92it/s][A
Training:  12%|█▏        | 17/142 [00:03<00:21,  5.79it/s][A
Training:  13%|█▎        | 18/142 [00:03<00:23,  5.25it/s][A
Training:  15%|█▍        | 21/142 [00:04<00:19,  6.10it/s][A
Training:  15%|█▌        | 22/142 [00:04<00:21,  5.59it/s][A
Training:  17%|█▋        | 24/142 [00:04<00:16,  7.12it/s][A
Training:  18%|█▊        | 25/142 [00

Epoch: 1/97 - Loss: 0.4710 - Accuracy: 0.8054



  0%|          | 0/18 [00:00<?, ?it/s][A
  6%|▌         | 1/18 [00:00<00:16,  1.02it/s][A
 17%|█▋        | 3/18 [00:01<00:04,  3.11it/s][A
 28%|██▊       | 5/18 [00:01<00:03,  3.62it/s][A
 39%|███▉      | 7/18 [00:01<00:02,  5.19it/s][A
 50%|█████     | 9/18 [00:02<00:01,  4.92it/s][A
 61%|██████    | 11/18 [00:02<00:01,  5.69it/s][A
 72%|███████▏  | 13/18 [00:02<00:00,  5.90it/s][A
 78%|███████▊  | 14/18 [00:02<00:00,  6.21it/s][A
 83%|████████▎ | 15/18 [00:03<00:00,  6.09it/s][A
100%|██████████| 18/18 [00:03<00:00,  4.98it/s][A
Epochs:   0%|          | 0/97 [00:27<?, ?it/s]


Val Loss: 0.3301 - Val Accuracy: 0.8851


[32m[I 2023-12-15 00:52:31,767][0m Trial 8 pruned. [0m


Learning rate: 0.002005785451589527
Weight decay: 0.00012253607234297403
Epsilon: 4.799570380034638e-08
Batch size: 137
Number of epochs: 85


Epochs:   0%|          | 0/85 [00:00<?, ?it/s]
Training:   0%|          | 0/102 [00:00<?, ?it/s][A
Training:   1%|          | 1/102 [00:01<01:52,  1.11s/it][A
Training:   2%|▏         | 2/102 [00:01<00:54,  1.83it/s][A
Training:   5%|▍         | 5/102 [00:01<00:29,  3.25it/s][A
Training:   6%|▌         | 6/102 [00:02<00:24,  3.88it/s][A
Training:   8%|▊         | 8/102 [00:02<00:16,  5.59it/s][A
Training:   9%|▉         | 9/102 [00:02<00:26,  3.53it/s][A
Training:  12%|█▏        | 12/102 [00:02<00:14,  6.26it/s][A
Training:  14%|█▎        | 14/102 [00:03<00:24,  3.58it/s][A
Training:  17%|█▋        | 17/102 [00:04<00:20,  4.08it/s][A
Training:  20%|█▉        | 20/102 [00:04<00:13,  5.94it/s][A
Training:  22%|██▏       | 22/102 [00:05<00:17,  4.60it/s][A
Training:  25%|██▍       | 25/102 [00:05<00:16,  4.72it/s][A
Training:  25%|██▌       | 26/102 [00:06<00:16,  4.55it/s][A
Training:  28%|██▊       | 29/102 [00:06<00:13,  5.37it/s][A
Training:  29%|██▉       | 30/102 [00:

Epoch: 1/85 - Loss: 0.3867 - Accuracy: 0.8330



  0%|          | 0/13 [00:00<?, ?it/s][A
  8%|▊         | 1/13 [00:01<00:17,  1.44s/it][A
 31%|███       | 4/13 [00:01<00:02,  3.27it/s][A
 46%|████▌     | 6/13 [00:02<00:02,  2.97it/s][A
 69%|██████▉   | 9/13 [00:03<00:01,  3.38it/s][A
 77%|███████▋  | 10/13 [00:03<00:00,  3.69it/s][A
100%|██████████| 13/13 [00:03<00:00,  3.53it/s][A
Epochs:   0%|          | 0/85 [00:27<?, ?it/s]
[32m[I 2023-12-15 00:52:59,563][0m Trial 9 pruned. [0m


Val Loss: 0.2268 - Val Accuracy: 0.9027
Learning rate: 1.4538307885462702e-05
Weight decay: 0.0002172635852988645
Epsilon: 4.147277776013085e-09
Batch size: 195
Number of epochs: 36


Epochs:   0%|          | 0/36 [00:00<?, ?it/s]
Training:   0%|          | 0/72 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/72 [00:01<01:59,  1.68s/it][A
Training:   3%|▎         | 2/72 [00:01<00:56,  1.24it/s][A
Training:   6%|▌         | 4/72 [00:01<00:22,  3.01it/s][A
Training:   8%|▊         | 6/72 [00:03<00:28,  2.28it/s][A
Training:  11%|█         | 8/72 [00:03<00:18,  3.38it/s][A
Training:  12%|█▎        | 9/72 [00:04<00:27,  2.29it/s][A
Training:  14%|█▍        | 10/72 [00:04<00:24,  2.56it/s][A
Training:  18%|█▊        | 13/72 [00:05<00:21,  2.74it/s][A
Training:  19%|█▉        | 14/72 [00:05<00:18,  3.15it/s][A
Training:  24%|██▎       | 17/72 [00:06<00:16,  3.29it/s][A
Training:  25%|██▌       | 18/72 [00:06<00:17,  3.14it/s][A
Training:  28%|██▊       | 20/72 [00:06<00:11,  4.35it/s][A
Training:  29%|██▉       | 21/72 [00:07<00:18,  2.74it/s][A
Training:  31%|███       | 22/72 [00:08<00:16,  3.08it/s][A
Training:  33%|███▎      | 24/72 [00:08<00:11,  4.30i

Epoch: 1/36 - Loss: 0.6754 - Accuracy: 0.5792



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:01<00:13,  1.70s/it][A
 22%|██▏       | 2/9 [00:01<00:05,  1.17it/s][A
 33%|███▎      | 3/9 [00:02<00:03,  1.97it/s][A
 56%|█████▌    | 5/9 [00:03<00:02,  1.95it/s][A
 67%|██████▋   | 6/9 [00:03<00:01,  2.45it/s][A
100%|██████████| 9/9 [00:04<00:00,  2.14it/s][A
Epochs:   0%|          | 0/36 [00:27<?, ?it/s]
[32m[I 2023-12-15 00:53:28,082][0m Trial 10 pruned. [0m


Val Loss: 0.6369 - Val Accuracy: 0.6727
Learning rate: 0.000570460761203135
Weight decay: 0.00042617738933726666
Epsilon: 7.279481359440188e-09
Batch size: 212
Number of epochs: 48


Epochs:   0%|          | 0/48 [00:00<?, ?it/s]
Training:   0%|          | 0/66 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/66 [00:01<01:59,  1.83s/it][A
Training:   3%|▎         | 2/66 [00:01<00:52,  1.22it/s][A
Training:   6%|▌         | 4/66 [00:02<00:21,  2.87it/s][A
Training:   8%|▊         | 5/66 [00:03<00:38,  1.59it/s][A
Training:  11%|█         | 7/66 [00:03<00:21,  2.69it/s][A
Training:  14%|█▎        | 9/66 [00:04<00:28,  2.03it/s][A
Training:  15%|█▌        | 10/66 [00:04<00:22,  2.45it/s][A
Training:  20%|█▉        | 13/66 [00:05<00:19,  2.70it/s][A
Training:  21%|██        | 14/66 [00:06<00:16,  3.08it/s][A
Training:  23%|██▎       | 15/66 [00:06<00:14,  3.56it/s][A
Training:  26%|██▌       | 17/66 [00:07<00:19,  2.49it/s][A
Training:  29%|██▉       | 19/66 [00:07<00:13,  3.46it/s][A
Training:  30%|███       | 20/66 [00:07<00:11,  3.96it/s][A
Training:  32%|███▏      | 21/66 [00:08<00:21,  2.11it/s][A
Training:  36%|███▋      | 24/66 [00:09<00:11,  3.67i

Epoch: 1/48 - Loss: 0.4391 - Accuracy: 0.7922



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:01<00:13,  1.64s/it][A
 33%|███▎      | 3/9 [00:01<00:03,  1.91it/s][A
 56%|█████▌    | 5/9 [00:03<00:02,  1.82it/s][A
 67%|██████▋   | 6/9 [00:03<00:01,  2.25it/s][A
100%|██████████| 9/9 [00:03<00:00,  2.60it/s][A
Epochs:   0%|          | 0/48 [00:27<?, ?it/s]
[32m[I 2023-12-15 00:53:56,704][0m Trial 11 pruned. [0m


Val Loss: 0.2731 - Val Accuracy: 0.8931
Learning rate: 0.05948026968537991
Weight decay: 0.00034787947770947993
Epsilon: 8.078943657181766e-09
Batch size: 248
Number of epochs: 54


Epochs:   0%|          | 0/54 [00:00<?, ?it/s]
Training:   0%|          | 0/57 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/57 [00:02<01:59,  2.13s/it][A
Training:   4%|▎         | 2/57 [00:02<00:52,  1.04it/s][A
Training:   7%|▋         | 4/57 [00:02<00:21,  2.47it/s][A
Training:   9%|▉         | 5/57 [00:03<00:35,  1.45it/s][A
Training:  12%|█▏        | 7/57 [00:03<00:19,  2.53it/s][A
Training:  16%|█▌        | 9/57 [00:05<00:27,  1.75it/s][A
Training:  19%|█▉        | 11/57 [00:05<00:18,  2.55it/s][A
Training:  23%|██▎       | 13/57 [00:07<00:23,  1.88it/s][A
Training:  26%|██▋       | 15/57 [00:07<00:16,  2.61it/s][A
Training:  28%|██▊       | 16/57 [00:07<00:13,  2.98it/s][A
Training:  30%|██▉       | 17/57 [00:09<00:24,  1.63it/s][A
Training:  33%|███▎      | 19/57 [00:09<00:15,  2.44it/s][A
Training:  37%|███▋      | 21/57 [00:10<00:18,  1.98it/s][A
Training:  40%|████      | 23/57 [00:10<00:12,  2.77it/s][A
Training:  44%|████▍     | 25/57 [00:12<00:15,  2.07i

Epoch: 1/54 - Loss: 50.3775 - Accuracy: 0.6534



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:13,  1.97s/it][A
 62%|██████▎   | 5/8 [00:03<00:01,  1.57it/s][A
 75%|███████▌  | 6/8 [00:03<00:01,  1.89it/s][A
100%|██████████| 8/8 [00:03<00:00,  2.03it/s][A
Epochs:   0%|          | 0/54 [00:27<?, ?it/s]
[32m[I 2023-12-15 00:54:25,164][0m Trial 12 pruned. [0m


Val Loss: 0.9847 - Val Accuracy: 0.8056
Learning rate: 1.1317403035941938e-05
Weight decay: 0.0011705693693100725
Epsilon: 3.2898539137350323e-09
Batch size: 174
Number of epochs: 38


Epochs:   0%|          | 0/38 [00:00<?, ?it/s]
Training:   0%|          | 0/81 [00:00<?, ?it/s][A
Training:   1%|          | 1/81 [00:01<01:37,  1.22s/it][A
Training:   2%|▏         | 2/81 [00:01<00:47,  1.65it/s][A
Training:   5%|▍         | 4/81 [00:01<00:21,  3.66it/s][A
Training:   6%|▌         | 5/81 [00:02<00:36,  2.06it/s][A
Training:   9%|▊         | 7/81 [00:02<00:22,  3.34it/s][A
Training:  10%|▉         | 8/81 [00:02<00:20,  3.59it/s][A
Training:  11%|█         | 9/81 [00:03<00:28,  2.56it/s][A
Training:  12%|█▏        | 10/81 [00:03<00:22,  3.21it/s][A
Training:  15%|█▍        | 12/81 [00:04<00:16,  4.14it/s][A
Training:  16%|█▌        | 13/81 [00:04<00:24,  2.79it/s][A
Training:  19%|█▊        | 15/81 [00:04<00:15,  4.15it/s][A
Training:  20%|█▉        | 16/81 [00:05<00:18,  3.61it/s][A
Training:  21%|██        | 17/81 [00:05<00:23,  2.73it/s][A
Training:  23%|██▎       | 19/81 [00:06<00:17,  3.62it/s][A
Training:  25%|██▍       | 20/81 [00:06<00:16,  3.73it

Epoch: 1/38 - Loss: 0.6521 - Accuracy: 0.6459



  0%|          | 0/11 [00:00<?, ?it/s][A
  9%|▉         | 1/11 [00:01<00:16,  1.65s/it][A
 27%|██▋       | 3/11 [00:01<00:03,  2.14it/s][A
 45%|████▌     | 5/11 [00:02<00:02,  2.32it/s][A
 55%|█████▍    | 6/11 [00:02<00:01,  2.91it/s][A
100%|██████████| 11/11 [00:03<00:00,  3.06it/s][A
Epochs:   0%|          | 0/38 [00:27<?, ?it/s]
[32m[I 2023-12-15 00:54:52,872][0m Trial 13 pruned. [0m


Val Loss: 0.6200 - Val Accuracy: 0.7347
Learning rate: 0.0002368647611919522
Weight decay: 0.005253290197793034
Epsilon: 1.024280390884668e-09
Batch size: 241
Number of epochs: 68


Epochs:   0%|          | 0/68 [00:00<?, ?it/s]
Training:   0%|          | 0/58 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/58 [00:02<02:03,  2.17s/it][A
Training:   9%|▊         | 5/58 [00:03<00:35,  1.47it/s][A
Training:  12%|█▏        | 7/58 [00:04<00:23,  2.19it/s][A
Training:  14%|█▍        | 8/58 [00:04<00:19,  2.59it/s][A
Training:  16%|█▌        | 9/58 [00:05<00:30,  1.62it/s][A
Training:  22%|██▏       | 13/58 [00:07<00:23,  1.89it/s][A
Training:  24%|██▍       | 14/58 [00:07<00:20,  2.17it/s][A
Training:  26%|██▌       | 15/58 [00:07<00:17,  2.51it/s][A
Training:  29%|██▉       | 17/58 [00:09<00:20,  2.00it/s][A
Training:  33%|███▎      | 19/58 [00:09<00:13,  2.81it/s][A
Training:  36%|███▌      | 21/58 [00:10<00:17,  2.06it/s][A
Training:  40%|███▉      | 23/58 [00:10<00:12,  2.83it/s][A
Training:  43%|████▎     | 25/58 [00:12<00:15,  2.17it/s][A
Training:  48%|████▊     | 28/58 [00:12<00:08,  3.45it/s][A
Training:  52%|█████▏    | 30/58 [00:13<00:11,  2.35

Epoch: 1/68 - Loss: 0.4745 - Accuracy: 0.7752



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:12,  1.76s/it][A
 25%|██▌       | 2/8 [00:01<00:05,  1.20it/s][A
 62%|██████▎   | 5/8 [00:03<00:01,  1.79it/s][A
100%|██████████| 8/8 [00:03<00:00,  2.24it/s][A
Epochs:   0%|          | 0/68 [00:28<?, ?it/s]
[32m[I 2023-12-15 00:55:22,174][0m Trial 14 pruned. [0m


Val Loss: 0.3275 - Val Accuracy: 0.8730
Learning rate: 0.011120328919873822
Weight decay: 0.0009021908416559254
Epsilon: 1.3856544340527937e-08
Batch size: 162
Number of epochs: 60


Epochs:   0%|          | 0/60 [00:00<?, ?it/s]
Training:   0%|          | 0/87 [00:00<?, ?it/s][A
Training:   1%|          | 1/87 [00:01<01:55,  1.34s/it][A
Training:   3%|▎         | 3/87 [00:01<00:34,  2.47it/s][A
Training:   6%|▌         | 5/87 [00:02<00:35,  2.29it/s][A
Training:   7%|▋         | 6/87 [00:02<00:31,  2.58it/s][A
Training:   9%|▉         | 8/87 [00:02<00:19,  4.15it/s][A
Training:  11%|█▏        | 10/87 [00:03<00:25,  2.98it/s][A
Training:  14%|█▍        | 12/87 [00:03<00:18,  4.08it/s][A
Training:  15%|█▍        | 13/87 [00:04<00:25,  2.88it/s][A
Training:  16%|█▌        | 14/87 [00:05<00:25,  2.89it/s][A
Training:  17%|█▋        | 15/87 [00:05<00:21,  3.38it/s][A
Training:  20%|█▉        | 17/87 [00:05<00:22,  3.17it/s][A
Training:  21%|██        | 18/87 [00:06<00:20,  3.43it/s][A
Training:  22%|██▏       | 19/87 [00:06<00:17,  3.88it/s][A
Training:  24%|██▍       | 21/87 [00:06<00:18,  3.49it/s][A
Training:  25%|██▌       | 22/87 [00:07<00:17,  3.68

Epoch: 1/60 - Loss: 0.6754 - Accuracy: 0.8227



  0%|          | 0/11 [00:00<?, ?it/s][A
  9%|▉         | 1/11 [00:01<00:15,  1.57s/it][A
 45%|████▌     | 5/11 [00:02<00:02,  2.38it/s][A
100%|██████████| 11/11 [00:03<00:00,  3.07it/s][A
Epochs:   2%|▏         | 1/60 [00:26<26:29, 26.95s/it]

Val Loss: 0.2025 - Val Accuracy: 0.9146



Training:   0%|          | 0/87 [00:00<?, ?it/s][A
Training:   1%|          | 1/87 [00:01<01:52,  1.31s/it][A
Training:   2%|▏         | 2/87 [00:01<01:01,  1.37it/s][A
Training:   5%|▍         | 4/87 [00:01<00:25,  3.23it/s][A
Training:   6%|▌         | 5/87 [00:02<00:29,  2.80it/s][A
Training:   7%|▋         | 6/87 [00:02<00:26,  3.00it/s][A
Training:   9%|▉         | 8/87 [00:02<00:16,  4.81it/s][A
Training:  10%|█         | 9/87 [00:03<00:25,  3.05it/s][A
Training:  11%|█▏        | 10/87 [00:03<00:21,  3.55it/s][A
Training:  13%|█▎        | 11/87 [00:03<00:18,  4.11it/s][A
Training:  15%|█▍        | 13/87 [00:04<00:23,  3.08it/s][A
Training:  16%|█▌        | 14/87 [00:04<00:21,  3.40it/s][A
Training:  17%|█▋        | 15/87 [00:04<00:17,  4.09it/s][A
Training:  20%|█▉        | 17/87 [00:05<00:22,  3.16it/s][A
Training:  21%|██        | 18/87 [00:05<00:20,  3.35it/s][A
Training:  23%|██▎       | 20/87 [00:05<00:14,  4.71it/s][A
Training:  24%|██▍       | 21/87 [00:06

Epoch: 2/60 - Loss: 0.2174 - Accuracy: 0.9083



  0%|          | 0/11 [00:00<?, ?it/s][A
  9%|▉         | 1/11 [00:01<00:13,  1.40s/it][A
 45%|████▌     | 5/11 [00:02<00:02,  2.61it/s][A
 73%|███████▎  | 8/11 [00:02<00:00,  4.56it/s][A
100%|██████████| 11/11 [00:03<00:00,  3.21it/s][A
Epochs:   2%|▏         | 1/60 [00:53<52:39, 53.54s/it]
[32m[I 2023-12-15 00:56:16,430][0m Trial 15 pruned. [0m


Val Loss: 0.2637 - Val Accuracy: 0.8871
Learning rate: 0.00021047614680916088
Weight decay: 0.00036071850880326466
Epsilon: 4.662333380755921e-09
Batch size: 295
Number of epochs: 78


Epochs:   0%|          | 0/78 [00:00<?, ?it/s]
Training:   0%|          | 0/48 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/48 [00:02<01:43,  2.20s/it][A
Training:   6%|▋         | 3/48 [00:02<00:27,  1.61it/s][A
Training:  10%|█         | 5/48 [00:04<00:35,  1.20it/s][A
Training:  15%|█▍        | 7/48 [00:04<00:20,  1.96it/s][A
Training:  19%|█▉        | 9/48 [00:06<00:25,  1.50it/s][A
Training:  21%|██        | 10/48 [00:06<00:20,  1.81it/s][A
Training:  23%|██▎       | 11/48 [00:06<00:16,  2.23it/s][A
Training:  27%|██▋       | 13/48 [00:08<00:20,  1.73it/s][A
Training:  31%|███▏      | 15/48 [00:08<00:13,  2.52it/s][A
Training:  35%|███▌      | 17/48 [00:09<00:15,  1.94it/s][A
Training:  42%|████▏     | 20/48 [00:10<00:09,  3.05it/s][A
Training:  44%|████▍     | 21/48 [00:11<00:15,  1.75it/s][A
Training:  48%|████▊     | 23/48 [00:11<00:10,  2.44it/s][A
Training:  52%|█████▏    | 25/48 [00:13<00:13,  1.71it/s][A
Training:  56%|█████▋    | 27/48 [00:14<00:08,  2.34

Epoch: 1/78 - Loss: 0.4750 - Accuracy: 0.8037



  0%|          | 0/6 [00:00<?, ?it/s][A
 17%|█▋        | 1/6 [00:02<00:09,  1.99s/it][A
 50%|█████     | 3/6 [00:02<00:01,  1.71it/s][A
100%|██████████| 6/6 [00:03<00:00,  1.64it/s][A
Epochs:   0%|          | 0/78 [00:27<?, ?it/s]
[32m[I 2023-12-15 00:56:44,313][0m Trial 16 pruned. [0m


Val Loss: 0.3283 - Val Accuracy: 0.8835
Learning rate: 3.065990017216129e-05
Weight decay: 0.0020192397673603965
Epsilon: 1.53889328547201e-08
Batch size: 219
Number of epochs: 44


Epochs:   0%|          | 0/44 [00:00<?, ?it/s]
Training:   0%|          | 0/64 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/64 [00:01<01:57,  1.87s/it][A
Training:   3%|▎         | 2/64 [00:02<00:52,  1.19it/s][A
Training:   5%|▍         | 3/64 [00:02<00:30,  1.98it/s][A
Training:   6%|▋         | 4/64 [00:02<00:21,  2.85it/s][A
Training:   8%|▊         | 5/64 [00:03<00:38,  1.54it/s][A
Training:  11%|█         | 7/64 [00:03<00:20,  2.81it/s][A
Training:  14%|█▍        | 9/64 [00:04<00:27,  1.99it/s][A
Training:  17%|█▋        | 11/64 [00:05<00:18,  2.90it/s][A
Training:  20%|██        | 13/64 [00:06<00:22,  2.28it/s][A
Training:  22%|██▏       | 14/64 [00:06<00:18,  2.69it/s][A
Training:  25%|██▌       | 16/64 [00:06<00:12,  3.90it/s][A
Training:  28%|██▊       | 18/64 [00:07<00:15,  2.90it/s][A
Training:  31%|███▏      | 20/64 [00:07<00:11,  3.97it/s][A
Training:  34%|███▍      | 22/64 [00:08<00:15,  2.73it/s][A
Training:  38%|███▊      | 24/64 [00:09<00:10,  3.71it

Epoch: 1/44 - Loss: 0.6232 - Accuracy: 0.6907



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:01<00:10,  1.54s/it][A
 38%|███▊      | 3/8 [00:01<00:02,  2.03it/s][A
 62%|██████▎   | 5/8 [00:02<00:01,  1.87it/s][A
100%|██████████| 8/8 [00:03<00:00,  2.44it/s][A
Epochs:   0%|          | 0/44 [00:26<?, ?it/s]
[32m[I 2023-12-15 00:57:11,366][0m Trial 17 pruned. [0m


Val Loss: 0.5492 - Val Accuracy: 0.8125
Learning rate: 0.008898488984532577
Weight decay: 0.00019237086128139516
Epsilon: 2.2589140295533423e-09
Batch size: 74
Number of epochs: 18


Epochs:   0%|          | 0/18 [00:00<?, ?it/s]
Training:   0%|          | 0/189 [00:00<?, ?it/s][A
Training:   1%|          | 1/189 [00:00<02:32,  1.24it/s][A
Training:   3%|▎         | 5/189 [00:01<00:39,  4.66it/s][A
Training:   4%|▍         | 8/189 [00:01<00:23,  7.78it/s][A
Training:   5%|▌         | 10/189 [00:01<00:27,  6.47it/s][A
Training:   7%|▋         | 13/189 [00:02<00:26,  6.63it/s][A
Training:   9%|▉         | 17/189 [00:02<00:22,  7.65it/s][A
Training:  11%|█         | 20/189 [00:02<00:17,  9.72it/s][A
Training:  12%|█▏        | 22/189 [00:03<00:21,  7.67it/s][A
Training:  13%|█▎        | 24/189 [00:03<00:19,  8.68it/s][A
Training:  14%|█▍        | 26/189 [00:03<00:22,  7.36it/s][A
Training:  15%|█▍        | 28/189 [00:03<00:19,  8.26it/s][A
Training:  16%|█▌        | 30/189 [00:04<00:21,  7.37it/s][A
Training:  17%|█▋        | 32/189 [00:04<00:21,  7.31it/s][A
Training:  17%|█▋        | 33/189 [00:04<00:24,  6.40it/s][A
Training:  19%|█▉        | 36/189 [

Epoch: 1/18 - Loss: 0.6354 - Accuracy: 0.8405



  0%|          | 0/24 [00:00<?, ?it/s][A
  4%|▍         | 1/24 [00:00<00:16,  1.39it/s][A
 21%|██        | 5/24 [00:01<00:04,  4.62it/s][A
 33%|███▎      | 8/24 [00:01<00:02,  7.34it/s][A
 42%|████▏     | 10/24 [00:01<00:02,  6.43it/s][A
 54%|█████▍    | 13/24 [00:02<00:01,  5.85it/s][A
 71%|███████   | 17/24 [00:02<00:00,  7.11it/s][A
 83%|████████▎ | 20/24 [00:02<00:00,  9.17it/s][A
100%|██████████| 24/24 [00:03<00:00,  7.05it/s][A
Epochs:   6%|▌         | 1/18 [00:26<07:33, 26.67s/it]

Val Loss: 0.1949 - Val Accuracy: 0.9152



Training:   0%|          | 0/189 [00:00<?, ?it/s][A
Training:   1%|          | 1/189 [00:00<02:17,  1.37it/s][A
Training:   3%|▎         | 5/189 [00:01<00:36,  5.10it/s][A
Training:   4%|▍         | 8/189 [00:01<00:22,  8.06it/s][A
Training:   5%|▌         | 10/189 [00:01<00:24,  7.17it/s][A
Training:   7%|▋         | 13/189 [00:02<00:24,  7.14it/s][A
Training:   8%|▊         | 16/189 [00:02<00:18,  9.50it/s][A
Training:  10%|▉         | 18/189 [00:02<00:23,  7.41it/s][A
Training:  11%|█         | 21/189 [00:03<00:23,  7.13it/s][A
Training:  13%|█▎        | 25/189 [00:03<00:22,  7.34it/s][A
Training:  15%|█▌        | 29/189 [00:04<00:23,  6.85it/s][A
Training:  17%|█▋        | 33/189 [00:04<00:21,  7.31it/s][A
Training:  19%|█▊        | 35/189 [00:04<00:18,  8.31it/s][A
Training:  20%|█▉        | 37/189 [00:05<00:20,  7.32it/s][A
Training:  22%|██▏       | 41/189 [00:05<00:19,  7.65it/s][A
Training:  23%|██▎       | 44/189 [00:05<00:14,  9.70it/s][A
Training:  24%|██▍ 

Epoch: 2/18 - Loss: 0.1930 - Accuracy: 0.9182



  0%|          | 0/24 [00:00<?, ?it/s][A
  4%|▍         | 1/24 [00:00<00:17,  1.29it/s][A
  8%|▊         | 2/24 [00:00<00:08,  2.63it/s][A
 21%|██        | 5/24 [00:01<00:03,  5.72it/s][A
 25%|██▌       | 6/24 [00:01<00:02,  6.24it/s][A
 38%|███▊      | 9/24 [00:01<00:02,  7.41it/s][A
 42%|████▏     | 10/24 [00:01<00:02,  6.66it/s][A
 54%|█████▍    | 13/24 [00:02<00:01,  8.06it/s][A
 58%|█████▊    | 14/24 [00:02<00:01,  7.80it/s][A
 71%|███████   | 17/24 [00:02<00:00,  8.87it/s][A
 75%|███████▌  | 18/24 [00:02<00:00,  8.52it/s][A
 88%|████████▊ | 21/24 [00:03<00:00,  8.70it/s][A
100%|██████████| 24/24 [00:03<00:00,  7.40it/s][A
Epochs:  11%|█         | 2/18 [00:52<06:57, 26.12s/it]

Val Loss: 0.1686 - Val Accuracy: 0.9292



Training:   0%|          | 0/189 [00:00<?, ?it/s][A
Training:   1%|          | 1/189 [00:00<02:33,  1.23it/s][A
Training:   3%|▎         | 5/189 [00:01<00:42,  4.31it/s][A
Training:   5%|▍         | 9/189 [00:01<00:29,  6.05it/s][A
Training:   6%|▋         | 12/189 [00:01<00:20,  8.43it/s][A
Training:   7%|▋         | 14/189 [00:02<00:23,  7.54it/s][A
Training:   9%|▉         | 17/189 [00:02<00:24,  7.09it/s][A
Training:  11%|█         | 21/189 [00:03<00:23,  7.29it/s][A
Training:  12%|█▏        | 23/189 [00:03<00:19,  8.46it/s][A
Training:  13%|█▎        | 25/189 [00:03<00:20,  7.82it/s][A
Training:  15%|█▌        | 29/189 [00:04<00:19,  8.24it/s][A
Training:  17%|█▋        | 32/189 [00:04<00:15, 10.35it/s][A
Training:  18%|█▊        | 34/189 [00:04<00:17,  8.99it/s][A
Training:  19%|█▉        | 36/189 [00:04<00:15,  9.85it/s][A
Training:  20%|██        | 38/189 [00:05<00:17,  8.64it/s][A
Training:  21%|██        | 40/189 [00:05<00:17,  8.54it/s][A
Training:  22%|██▏ 

Epoch: 3/18 - Loss: 0.1986 - Accuracy: 0.9201



  0%|          | 0/24 [00:00<?, ?it/s][A
  4%|▍         | 1/24 [00:00<00:19,  1.18it/s][A
 21%|██        | 5/24 [00:01<00:04,  3.93it/s][A
 38%|███▊      | 9/24 [00:01<00:02,  5.52it/s][A
 54%|█████▍    | 13/24 [00:02<00:01,  6.89it/s][A
 71%|███████   | 17/24 [00:02<00:00,  8.01it/s][A
 88%|████████▊ | 21/24 [00:03<00:00,  8.43it/s][A
100%|██████████| 24/24 [00:03<00:00,  7.22it/s][A
Epochs:  17%|█▋        | 3/18 [01:19<06:35, 26.34s/it]

Val Loss: 0.1599 - Val Accuracy: 0.9365



Training:   0%|          | 0/189 [00:00<?, ?it/s][A
Training:   1%|          | 1/189 [00:00<02:39,  1.18it/s][A
Training:   1%|          | 2/189 [00:00<01:21,  2.30it/s][A
Training:   3%|▎         | 5/189 [00:01<00:34,  5.33it/s][A
Training:   3%|▎         | 6/189 [00:01<00:32,  5.67it/s][A
Training:   5%|▍         | 9/189 [00:01<00:27,  6.52it/s][A
Training:   5%|▌         | 10/189 [00:01<00:26,  6.76it/s][A
Training:   7%|▋         | 13/189 [00:02<00:25,  6.89it/s][A
Training:   8%|▊         | 15/189 [00:02<00:20,  8.60it/s][A
Training:   9%|▉         | 17/189 [00:02<00:25,  6.68it/s][A
Training:  11%|█         | 21/189 [00:03<00:22,  7.48it/s][A
Training:  12%|█▏        | 23/189 [00:03<00:18,  8.78it/s][A
Training:  13%|█▎        | 25/189 [00:03<00:24,  6.82it/s][A
Training:  15%|█▌        | 29/189 [00:04<00:21,  7.61it/s][A
Training:  17%|█▋        | 33/189 [00:04<00:18,  8.55it/s][A
Training:  19%|█▉        | 36/189 [00:04<00:14, 10.53it/s][A
Training:  20%|██    

Epoch: 4/18 - Loss: 0.1924 - Accuracy: 0.9227



  0%|          | 0/24 [00:00<?, ?it/s][A
  4%|▍         | 1/24 [00:00<00:19,  1.17it/s][A
 21%|██        | 5/24 [00:01<00:04,  4.57it/s][A
 38%|███▊      | 9/24 [00:01<00:02,  6.24it/s][A
 54%|█████▍    | 13/24 [00:02<00:01,  7.02it/s][A
 71%|███████   | 17/24 [00:02<00:00,  7.57it/s][A
 83%|████████▎ | 20/24 [00:02<00:00,  9.58it/s][A
 92%|█████████▏| 22/24 [00:03<00:00,  8.07it/s][A
100%|██████████| 24/24 [00:03<00:00,  7.16it/s][A
Epochs:  22%|██▏       | 4/18 [01:46<06:16, 26.91s/it]

Val Loss: 0.1601 - Val Accuracy: 0.9320



Training:   0%|          | 0/189 [00:00<?, ?it/s][A
Training:   1%|          | 1/189 [00:00<02:30,  1.25it/s][A
Training:   2%|▏         | 4/189 [00:00<00:33,  5.55it/s][A
Training:   3%|▎         | 6/189 [00:01<00:32,  5.55it/s][A
Training:   5%|▍         | 9/189 [00:01<00:28,  6.25it/s][A
Training:   6%|▌         | 11/189 [00:01<00:22,  7.96it/s][A
Training:   7%|▋         | 13/189 [00:02<00:23,  7.58it/s][A
Training:   8%|▊         | 15/189 [00:02<00:21,  7.96it/s][A
Training:   9%|▉         | 17/189 [00:02<00:19,  8.66it/s][A
Training:  10%|█         | 19/189 [00:02<00:22,  7.47it/s][A
Training:  11%|█         | 21/189 [00:02<00:19,  8.82it/s][A
Training:  12%|█▏        | 23/189 [00:03<00:23,  6.95it/s][A
Training:  14%|█▍        | 26/189 [00:03<00:17,  9.07it/s][A
Training:  15%|█▍        | 28/189 [00:03<00:20,  7.98it/s][A
Training:  16%|█▌        | 30/189 [00:04<00:19,  8.03it/s][A
Training:  16%|█▋        | 31/189 [00:04<00:23,  6.73it/s][A
Training:  18%|█▊   

Epoch: 5/18 - Loss: 0.1881 - Accuracy: 0.9241



  0%|          | 0/24 [00:00<?, ?it/s][A
  4%|▍         | 1/24 [00:00<00:17,  1.33it/s][A
 17%|█▋        | 4/24 [00:00<00:03,  5.83it/s][A
 25%|██▌       | 6/24 [00:01<00:03,  5.12it/s][A
 38%|███▊      | 9/24 [00:01<00:02,  5.44it/s][A
 54%|█████▍    | 13/24 [00:02<00:01,  6.74it/s][A
 71%|███████   | 17/24 [00:02<00:00,  7.25it/s][A
100%|██████████| 24/24 [00:03<00:00,  7.44it/s][A
Epochs:  28%|██▊       | 5/18 [02:13<05:50, 26.93s/it]

Val Loss: 0.2041 - Val Accuracy: 0.9104



Training:   0%|          | 0/189 [00:00<?, ?it/s][A
Training:   1%|          | 1/189 [00:00<02:20,  1.34it/s][A
Training:   2%|▏         | 3/189 [00:00<00:43,  4.30it/s][A
Training:   3%|▎         | 5/189 [00:01<00:40,  4.52it/s][A
Training:   4%|▍         | 8/189 [00:01<00:22,  7.99it/s][A
Training:   5%|▌         | 10/189 [00:01<00:27,  6.44it/s][A
Training:   7%|▋         | 13/189 [00:02<00:28,  6.27it/s][A
Training:   8%|▊         | 16/189 [00:02<00:19,  8.74it/s][A
Training:  10%|▉         | 18/189 [00:02<00:23,  7.27it/s][A
Training:  11%|█         | 21/189 [00:03<00:23,  7.05it/s][A
Training:  13%|█▎        | 25/189 [00:03<00:21,  7.58it/s][A
Training:  15%|█▌        | 29/189 [00:04<00:20,  7.94it/s][A
Training:  17%|█▋        | 33/189 [00:04<00:19,  8.01it/s][A
Training:  19%|█▉        | 36/189 [00:04<00:15,  9.95it/s][A
Training:  20%|██        | 38/189 [00:05<00:18,  8.23it/s][A
Training:  22%|██▏       | 41/189 [00:05<00:19,  7.54it/s][A
Training:  24%|██▍  

Epoch: 6/18 - Loss: 0.2210 - Accuracy: 0.9167



  0%|          | 0/24 [00:00<?, ?it/s][A
  4%|▍         | 1/24 [00:00<00:17,  1.30it/s][A
 17%|█▋        | 4/24 [00:00<00:03,  5.67it/s][A
 25%|██▌       | 6/24 [00:01<00:03,  5.90it/s][A
 33%|███▎      | 8/24 [00:01<00:02,  7.47it/s][A
 42%|████▏     | 10/24 [00:01<00:02,  6.86it/s][A
 54%|█████▍    | 13/24 [00:02<00:01,  6.82it/s][A
 71%|███████   | 17/24 [00:02<00:00,  7.48it/s][A
 83%|████████▎ | 20/24 [00:02<00:00,  9.88it/s][A
100%|██████████| 24/24 [00:03<00:00,  7.65it/s][A
Epochs:  33%|███▎      | 6/18 [02:39<05:18, 26.57s/it]

Val Loss: 0.4806 - Val Accuracy: 0.8718



Training:   0%|          | 0/189 [00:00<?, ?it/s][A
Training:   1%|          | 1/189 [00:00<02:14,  1.40it/s][A
Training:   3%|▎         | 5/189 [00:01<00:37,  4.96it/s][A
Training:   4%|▎         | 7/189 [00:01<00:26,  6.81it/s][A
Training:   5%|▍         | 9/189 [00:01<00:27,  6.52it/s][A
Training:   5%|▌         | 10/189 [00:01<00:29,  6.02it/s][A
Training:   7%|▋         | 13/189 [00:02<00:23,  7.59it/s][A
Training:   7%|▋         | 14/189 [00:02<00:23,  7.37it/s][A
Training:   9%|▉         | 17/189 [00:02<00:23,  7.25it/s][A
Training:  11%|█         | 20/189 [00:02<00:17,  9.85it/s][A
Training:  12%|█▏        | 22/189 [00:03<00:21,  7.74it/s][A
Training:  13%|█▎        | 25/189 [00:03<00:23,  7.06it/s][A
Training:  15%|█▌        | 29/189 [00:04<00:19,  8.04it/s][A
Training:  17%|█▋        | 33/189 [00:04<00:17,  8.78it/s][A
Training:  19%|█▉        | 36/189 [00:04<00:14, 10.82it/s][A
Training:  20%|██        | 38/189 [00:05<00:17,  8.59it/s][A
Training:  22%|██▏  

Epoch: 7/18 - Loss: 0.4560 - Accuracy: 0.8962



  0%|          | 0/24 [00:00<?, ?it/s][A
  4%|▍         | 1/24 [00:01<00:24,  1.07s/it][A
 21%|██        | 5/24 [00:01<00:04,  3.90it/s][A
 38%|███▊      | 9/24 [00:01<00:02,  5.69it/s][A
 50%|█████     | 12/24 [00:02<00:01,  7.71it/s][A
 58%|█████▊    | 14/24 [00:02<00:01,  6.61it/s][A
 71%|███████   | 17/24 [00:03<00:01,  6.17it/s][A
100%|██████████| 24/24 [00:03<00:00,  6.73it/s][A
Epochs:  39%|███▉      | 7/18 [03:07<04:55, 26.87s/it]

Val Loss: 0.2625 - Val Accuracy: 0.9105



Training:   0%|          | 0/189 [00:00<?, ?it/s][A
Training:   1%|          | 1/189 [00:00<02:29,  1.25it/s][A
Training:   1%|          | 2/189 [00:00<01:15,  2.48it/s][A
Training:   3%|▎         | 5/189 [00:01<00:35,  5.25it/s][A
Training:   3%|▎         | 6/189 [00:01<00:33,  5.46it/s][A
Training:   5%|▍         | 9/189 [00:01<00:26,  6.74it/s][A
Training:   5%|▌         | 10/189 [00:01<00:26,  6.81it/s][A
Training:   7%|▋         | 13/189 [00:02<00:22,  7.96it/s][A
Training:   7%|▋         | 14/189 [00:02<00:24,  7.05it/s][A
Training:   9%|▉         | 17/189 [00:02<00:22,  7.80it/s][A
Training:  10%|▉         | 18/189 [00:02<00:23,  7.25it/s][A
Training:  11%|█         | 21/189 [00:03<00:22,  7.57it/s][A
Training:  12%|█▏        | 22/189 [00:03<00:24,  6.78it/s][A
Training:  13%|█▎        | 25/189 [00:03<00:20,  7.94it/s][A
Training:  14%|█▍        | 26/189 [00:04<00:23,  6.98it/s][A
Training:  15%|█▌        | 29/189 [00:04<00:20,  7.83it/s][A
Training:  17%|█▋    

Epoch: 8/18 - Loss: 0.2016 - Accuracy: 0.9242



  0%|          | 0/24 [00:00<?, ?it/s][A
  4%|▍         | 1/24 [00:00<00:18,  1.27it/s][A
 17%|█▋        | 4/24 [00:00<00:03,  5.43it/s][A
 25%|██▌       | 6/24 [00:01<00:03,  5.49it/s][A
 33%|███▎      | 8/24 [00:01<00:02,  7.11it/s][A
 42%|████▏     | 10/24 [00:01<00:02,  5.96it/s][A
 50%|█████     | 12/24 [00:01<00:01,  7.69it/s][A
 58%|█████▊    | 14/24 [00:02<00:01,  6.06it/s][A
 62%|██████▎   | 15/24 [00:02<00:01,  6.31it/s][A
 71%|███████   | 17/24 [00:02<00:01,  5.68it/s][A
 79%|███████▉  | 19/24 [00:03<00:00,  6.65it/s][A
 88%|████████▊ | 21/24 [00:03<00:00,  6.73it/s][A
100%|██████████| 24/24 [00:03<00:00,  6.35it/s][A
Epochs:  44%|████▍     | 8/18 [03:34<04:28, 26.90s/it]

Val Loss: 0.2039 - Val Accuracy: 0.9167



Training:   0%|          | 0/189 [00:00<?, ?it/s][A
Training:   1%|          | 1/189 [00:00<02:29,  1.26it/s][A
Training:   3%|▎         | 5/189 [00:01<00:37,  4.88it/s][A
Training:   5%|▍         | 9/189 [00:01<00:29,  6.19it/s][A
Training:   6%|▋         | 12/189 [00:01<00:21,  8.34it/s][A
Training:   7%|▋         | 14/189 [00:02<00:22,  7.86it/s][A
Training:   8%|▊         | 16/189 [00:02<00:19,  8.82it/s][A
Training:  10%|▉         | 18/189 [00:02<00:23,  7.30it/s][A
Training:  10%|█         | 19/189 [00:02<00:26,  6.53it/s][A
Training:  11%|█         | 21/189 [00:03<00:28,  5.92it/s][A
Training:  13%|█▎        | 25/189 [00:03<00:24,  6.59it/s][A
Training:  15%|█▌        | 29/189 [00:04<00:22,  7.13it/s][A
Training:  17%|█▋        | 33/189 [00:04<00:21,  7.16it/s][A
Training:  20%|█▉        | 37/189 [00:05<00:19,  7.68it/s][A
Training:  22%|██▏       | 41/189 [00:05<00:17,  8.23it/s][A
Training:  24%|██▍       | 45/189 [00:06<00:18,  7.99it/s][A
Training:  26%|██▌ 

Epoch: 9/18 - Loss: 0.1992 - Accuracy: 0.9282



  0%|          | 0/24 [00:00<?, ?it/s][A
  4%|▍         | 1/24 [00:00<00:18,  1.22it/s][A
 17%|█▋        | 4/24 [00:00<00:04,  4.99it/s][A
 25%|██▌       | 6/24 [00:01<00:03,  4.89it/s][A
 38%|███▊      | 9/24 [00:01<00:02,  5.85it/s][A
 42%|████▏     | 10/24 [00:01<00:02,  6.09it/s][A
 54%|█████▍    | 13/24 [00:02<00:01,  6.93it/s][A
 62%|██████▎   | 15/24 [00:02<00:01,  8.60it/s][A
 71%|███████   | 17/24 [00:02<00:01,  6.82it/s][A
 83%|████████▎ | 20/24 [00:02<00:00,  9.13it/s][A
100%|██████████| 24/24 [00:03<00:00,  6.89it/s][A
Epochs:  50%|█████     | 9/18 [04:01<04:02, 26.98s/it]

Val Loss: 0.1858 - Val Accuracy: 0.9297



Training:   0%|          | 0/189 [00:00<?, ?it/s][A
Training:   1%|          | 1/189 [00:00<02:11,  1.43it/s][A
Training:   1%|          | 2/189 [00:00<01:12,  2.59it/s][A
Training:   3%|▎         | 5/189 [00:01<00:38,  4.77it/s][A
Training:   3%|▎         | 6/189 [00:01<00:33,  5.47it/s][A
Training:   5%|▍         | 9/189 [00:01<00:27,  6.66it/s][A
Training:   5%|▌         | 10/189 [00:01<00:27,  6.48it/s][A
Training:   7%|▋         | 13/189 [00:02<00:22,  7.94it/s][A
Training:   7%|▋         | 14/189 [00:02<00:23,  7.33it/s][A
Training:   9%|▉         | 17/189 [00:02<00:21,  8.17it/s][A
Training:  10%|▉         | 18/189 [00:02<00:21,  7.81it/s][A
Training:  11%|█         | 21/189 [00:03<00:17,  9.59it/s][A
Training:  12%|█▏        | 22/189 [00:03<00:20,  8.20it/s][A
Training:  13%|█▎        | 25/189 [00:03<00:18,  8.77it/s][A
Training:  14%|█▍        | 26/189 [00:03<00:20,  8.11it/s][A
Training:  15%|█▌        | 29/189 [00:04<00:18,  8.58it/s][A
Training:  16%|█▌    

Epoch: 10/18 - Loss: 0.1991 - Accuracy: 0.9264



  0%|          | 0/24 [00:00<?, ?it/s][A
  4%|▍         | 1/24 [00:00<00:13,  1.74it/s][A
 21%|██        | 5/24 [00:00<00:02,  6.46it/s][A
 33%|███▎      | 8/24 [00:01<00:01, 10.23it/s][A
 42%|████▏     | 10/24 [00:01<00:01,  8.31it/s][A
 54%|█████▍    | 13/24 [00:01<00:01,  8.14it/s][A
 62%|██████▎   | 15/24 [00:01<00:00,  9.52it/s][A
 71%|███████   | 17/24 [00:02<00:00,  8.06it/s][A
100%|██████████| 24/24 [00:02<00:00,  9.30it/s][A
Epochs:  56%|█████▌    | 10/18 [04:24<03:27, 25.95s/it]

Val Loss: 0.1807 - Val Accuracy: 0.9344



Training:   0%|          | 0/189 [00:00<?, ?it/s][A
Training:   1%|          | 1/189 [00:00<01:39,  1.89it/s][A
Training:   2%|▏         | 4/189 [00:00<00:27,  6.71it/s][A
Training:   3%|▎         | 6/189 [00:00<00:26,  6.88it/s][A
Training:   5%|▍         | 9/189 [00:01<00:20,  8.71it/s][A
Training:   6%|▌         | 11/189 [00:01<00:17, 10.17it/s][A
Training:   7%|▋         | 13/189 [00:01<00:16, 10.49it/s][A
Training:   8%|▊         | 15/189 [00:01<00:15, 11.10it/s][A
Training:   9%|▉         | 17/189 [00:01<00:15, 11.38it/s][A
Training:  10%|█         | 19/189 [00:01<00:13, 12.66it/s][A
Training:  11%|█         | 21/189 [00:02<00:12, 13.08it/s][A
Training:  12%|█▏        | 23/189 [00:02<00:11, 14.13it/s][A
Training:  13%|█▎        | 25/189 [00:02<00:14, 11.54it/s][A
Training:  14%|█▍        | 27/189 [00:02<00:13, 12.23it/s][A
Training:  15%|█▌        | 29/189 [00:02<00:14, 11.06it/s][A
Training:  16%|█▋        | 31/189 [00:02<00:13, 12.05it/s][A
Training:  17%|█▋   

Epoch: 11/18 - Loss: 0.2037 - Accuracy: 0.9267



  0%|          | 0/24 [00:00<?, ?it/s][A
  4%|▍         | 1/24 [00:00<00:16,  1.41it/s][A
 21%|██        | 5/24 [00:01<00:03,  5.32it/s][A
 38%|███▊      | 9/24 [00:01<00:02,  6.99it/s][A
 54%|█████▍    | 13/24 [00:01<00:01,  8.34it/s][A
 71%|███████   | 17/24 [00:02<00:00,  8.89it/s][A
100%|██████████| 24/24 [00:02<00:00,  8.97it/s][A
Epochs:  61%|██████    | 11/18 [04:45<02:50, 24.40s/it]

Val Loss: 0.1827 - Val Accuracy: 0.9295



Training:   0%|          | 0/189 [00:00<?, ?it/s][A
Training:   1%|          | 1/189 [00:00<02:02,  1.54it/s][A
Training:   2%|▏         | 4/189 [00:00<00:28,  6.52it/s][A
Training:   3%|▎         | 6/189 [00:01<00:27,  6.72it/s][A
Training:   5%|▍         | 9/189 [00:01<00:24,  7.34it/s][A
Training:   6%|▋         | 12/189 [00:01<00:16, 10.59it/s][A
Training:   7%|▋         | 14/189 [00:01<00:19,  8.95it/s][A
Training:   9%|▉         | 17/189 [00:02<00:19,  9.01it/s][A
Training:  11%|█         | 21/189 [00:02<00:16, 10.47it/s][A
Training:  13%|█▎        | 25/189 [00:02<00:14, 11.43it/s][A
Training:  15%|█▌        | 29/189 [00:03<00:14, 10.68it/s][A
Training:  17%|█▋        | 32/189 [00:03<00:12, 12.90it/s][A
Training:  18%|█▊        | 34/189 [00:03<00:14, 10.75it/s][A
Training:  20%|█▉        | 37/189 [00:03<00:14, 10.29it/s][A
Training:  21%|██        | 39/189 [00:04<00:14, 10.43it/s][A
Training:  22%|██▏       | 41/189 [00:04<00:14,  9.97it/s][A
Training:  23%|██▎  

Epoch: 12/18 - Loss: 0.2750 - Accuracy: 0.9158



  0%|          | 0/24 [00:00<?, ?it/s][A
  4%|▍         | 1/24 [00:00<00:12,  1.80it/s][A
 17%|█▋        | 4/24 [00:00<00:02,  7.43it/s][A
 25%|██▌       | 6/24 [00:00<00:02,  7.23it/s][A
 38%|███▊      | 9/24 [00:01<00:02,  7.50it/s][A
 54%|█████▍    | 13/24 [00:01<00:01,  8.55it/s][A
 71%|███████   | 17/24 [00:02<00:00,  9.23it/s][A
100%|██████████| 24/24 [00:02<00:00,  9.41it/s][A
Epochs:  67%|██████▋   | 12/18 [05:06<02:20, 23.39s/it]

Val Loss: 0.1992 - Val Accuracy: 0.9211



Training:   0%|          | 0/189 [00:00<?, ?it/s][A
Training:   1%|          | 1/189 [00:00<01:56,  1.62it/s][A
Training:   3%|▎         | 5/189 [00:00<00:30,  5.99it/s][A
Training:   5%|▍         | 9/189 [00:01<00:23,  7.68it/s][A
Training:   7%|▋         | 13/189 [00:01<00:19,  8.81it/s][A
Training:   8%|▊         | 16/189 [00:01<00:15, 11.34it/s][A
Training:  10%|▉         | 18/189 [00:02<00:16, 10.14it/s][A
Training:  11%|█         | 21/189 [00:02<00:18,  9.25it/s][A
Training:  13%|█▎        | 25/189 [00:02<00:15, 10.42it/s][A
Training:  14%|█▍        | 27/189 [00:02<00:14, 11.03it/s][A
Training:  15%|█▌        | 29/189 [00:03<00:15, 10.48it/s][A
Training:  16%|█▋        | 31/189 [00:03<00:14, 11.01it/s][A
Training:  17%|█▋        | 33/189 [00:03<00:13, 11.51it/s][A
Training:  19%|█▊        | 35/189 [00:03<00:13, 11.09it/s][A
Training:  20%|█▉        | 37/189 [00:03<00:13, 11.24it/s][A
Training:  21%|██        | 39/189 [00:04<00:13, 11.19it/s][A
Training:  22%|██▏ 

Epoch: 13/18 - Loss: 0.6376 - Accuracy: 0.8991



  0%|          | 0/24 [00:00<?, ?it/s][A
  4%|▍         | 1/24 [00:00<00:12,  1.78it/s][A
 21%|██        | 5/24 [00:00<00:03,  5.89it/s][A
 33%|███▎      | 8/24 [00:01<00:01,  9.47it/s][A
 42%|████▏     | 10/24 [00:01<00:01,  8.01it/s][A
 54%|█████▍    | 13/24 [00:01<00:01,  8.32it/s][A
 67%|██████▋   | 16/24 [00:01<00:00, 10.38it/s][A
 75%|███████▌  | 18/24 [00:02<00:00,  9.06it/s][A
 83%|████████▎ | 20/24 [00:02<00:00, 10.41it/s][A
100%|██████████| 24/24 [00:02<00:00,  9.09it/s][A
Epochs:  67%|██████▋   | 12/18 [05:27<02:43, 27.33s/it]
[32m[I 2023-12-15 01:02:39,853][0m Trial 18 pruned. [0m


Val Loss: 1.1321 - Val Accuracy: 0.8989
Learning rate: 0.0002414304307703839
Weight decay: 0.0006287430339754604
Epsilon: 6.640626574918036e-09
Batch size: 160
Number of epochs: 28


Epochs:   0%|          | 0/28 [00:00<?, ?it/s]
Training:   0%|          | 0/88 [00:00<?, ?it/s][A
Training:   1%|          | 1/88 [00:01<01:35,  1.10s/it][A
Training:   5%|▍         | 4/88 [00:01<00:20,  4.16it/s][A
Training:   7%|▋         | 6/88 [00:02<00:25,  3.23it/s][A
Training:   9%|▉         | 8/88 [00:02<00:16,  4.74it/s][A
Training:  11%|█▏        | 10/88 [00:02<00:19,  3.92it/s][A
Training:  15%|█▍        | 13/88 [00:03<00:19,  3.94it/s][A
Training:  18%|█▊        | 16/88 [00:03<00:12,  5.71it/s][A
Training:  20%|██        | 18/88 [00:04<00:16,  4.34it/s][A
Training:  23%|██▎       | 20/88 [00:04<00:12,  5.49it/s][A
Training:  25%|██▌       | 22/88 [00:05<00:15,  4.19it/s][A
Training:  28%|██▊       | 25/88 [00:05<00:14,  4.39it/s][A
Training:  33%|███▎      | 29/88 [00:06<00:12,  4.70it/s][A
Training:  38%|███▊      | 33/88 [00:07<00:11,  4.90it/s][A
Training:  39%|███▊      | 34/88 [00:07<00:10,  5.08it/s][A
Training:  42%|████▏     | 37/88 [00:08<00:09,  5.1

Epoch: 1/28 - Loss: 0.4147 - Accuracy: 0.8175



  0%|          | 0/11 [00:00<?, ?it/s][A
  9%|▉         | 1/11 [00:01<00:10,  1.07s/it][A
 36%|███▋      | 4/11 [00:01<00:01,  4.31it/s][A
 55%|█████▍    | 6/11 [00:01<00:01,  3.39it/s][A
 82%|████████▏ | 9/11 [00:02<00:00,  3.67it/s][A
100%|██████████| 11/11 [00:02<00:00,  3.73it/s][A
Epochs:   0%|          | 0/28 [00:21<?, ?it/s]
[32m[I 2023-12-15 01:03:01,501][0m Trial 19 pruned. [0m


Val Loss: 0.2655 - Val Accuracy: 0.8986

Study statistics: 
  Number of finished trials:  20
  Number of pruned trials:  15
  Number of complete trials:  5


In [20]:
print("Best trial:")
trial = study.best_trial

print("  Value: ", trial.value)

print("  Params: ")
for key, value in trial.params.items():
    print("    {}: {}".format(key, value))

Best trial:
  Value:  0.9450960159301758
  Params: 
    batch_size: 134
    epochs: 66
    epsilon: 7.0510050620049406e-09
    learning_rate: 3.220616291387027e-05
    weight_decay: 0.0010915949385844237


In [None]:
# ViT P12-S8 Mean

Best trial:
Value:  0.9450960159301758
Params: 
batch_size: 134
epochs: 66
epsilon: 7.0510050620049406e-09
learning_rate: 3.220616291387027e-05
weight_decay: 0.0010915949385844237