In [25]:
import os
import random
import pandas as pd
import numpy as np
import mxnet as mx
import torch
import torch.nn as nn
import torch.nn.functional as F
import torch.optim as opt
from torch.utils.data import Dataset, DataLoader
from pytorch_metric_learning import losses
from einops import rearrange, repeat
import optuna
from optuna.trial import TrialState
from tqdm import tqdm

In [2]:
def file_to_embed(embeds, file):
    emb = []
    for f in file:
        emb.append(embeds[f][0])
    return torch.stack(emb)

In [3]:
MIN_NUM_PATCHES = 16

In [4]:
device = torch.device("cuda:2" if torch.cuda.is_available() else "cpu")
device

device(type='cuda', index=2)

In [5]:
class AdienceDataset(Dataset):
    def __init__(self, annot_file, img_dir, train=False):
        self.img_lbls = pd.read_csv(annot_file, header=None)
        self.img_dir = img_dir
        self.is_train = train
    
    def __len__(self):
        return len(self.img_lbls)
    
    def __getitem__(self, idx):
        img_file = self.img_lbls.iloc[idx, 0]
        img_path = os.path.join(self.img_dir, img_file)
        image = mx.image.imread(img_path)
        if image.shape[1] != 112:
            image = mx.image.resize_short(image, 112)
        image = mx.nd.transpose(image, axes=(2,0,1))
        image = torch.tensor(image.asnumpy()).type(torch.FloatTensor)
        label = self.img_lbls.iloc[idx, 1]
        
        if self.is_train:
            positive_list = self.img_lbls[self.img_lbls.iloc[:, 1] == label].index.values
            positive_list = np.setdiff1d(positive_list, np.array([idx]))
            positive_item = random.choice(positive_list)
            positive_img = self.img_lbls.iloc[positive_item, 0]
            pos_img_path = os.path.join(self.img_dir, positive_img)
            pos_image = mx.image.imread(pos_img_path)
            if pos_image.shape[1] != 112:
                pos_image = mx.image.resize_short(pos_image, 112)
            pos_image = mx.nd.transpose(pos_image, axes=(2,0,1))
            pos_image = torch.tensor(pos_image.asnumpy()).type(torch.FloatTensor)
            
            negative_list = self.img_lbls[self.img_lbls.iloc[:, 1] != label].index.values
            negative_item = random.choice(negative_list)
            negative_img = self.img_lbls.iloc[negative_item, 0]
            neg_img_path = os.path.join(self.img_dir, negative_img)
            neg_image = mx.image.imread(neg_img_path)
            if neg_image.shape[1] != 112:
                neg_image = mx.image.resize_short(neg_image, 112)
            neg_image = mx.nd.transpose(neg_image, axes=(2,0,1))
            neg_image = torch.tensor(neg_image.asnumpy()).type(torch.FloatTensor)
            
            return image, pos_image, neg_image, label, img_file, positive_img, negative_img

        return image, label, img_file

In [6]:
train_data = AdienceDataset("../train.csv", "../cropped_Adience/", train=False)
val_data = AdienceDataset("../val.csv", "../cropped_Adience/", train=False)

In [22]:
train_data = AdienceDataset("../train.csv", "../cropped_Adience/", train=True)
val_data = AdienceDataset("../val.csv", "../cropped_Adience/", train=True)

In [7]:
class TripletLoss(nn.Module):
    def __init__(self, margin=1.0):
        super(TripletLoss, self).__init__()
        self.margin = margin
        
    def calc_euclidean(self, x1, x2):
        return (x1 - x2).pow(2).sum(1)
    
    def forward(self, anchor, positive, negative):
        distance_positive = self.calc_euclidean(anchor, positive)
        distance_negative = self.calc_euclidean(anchor, negative)
        losses = torch.relu(distance_positive - distance_negative + self.margin)

        return losses.mean()

In [8]:
class CombinedLoss(nn.Module):
    def __init__(self, beta=1.0):
        super(CombinedLoss, self).__init__()
        self.beta = beta
        self.triplet = TripletLoss(margin=1.0)
        self.classification = nn.CrossEntropyLoss()
        
    def forward(self, anchor, positive, negative, classification_out, labels):
        triplet_loss = self.triplet(anchor, positive, negative)
        classification_loss = self.classification(classification_out, labels)
        total_loss = (self.beta * triplet_loss) + classification_loss
        
        return total_loss

In [9]:
class CosFace(nn.Module):
    r"""Implement of CosFace (https://arxiv.org/pdf/1801.09414.pdf):
    Args:
        in_features: size of each input sample
        out_features: size of each output sample
        device_id: the ID of GPU where the model will be trained by model parallel.
                       if device_id=None, it will be trained on CPU without model parallel.
        s: norm of input feature
        m: margin
        cos(theta)-m
    """

    def __init__(self, in_features, out_features, device_id, s=64.0, m=0.35):
        super(CosFace, self).__init__()
        self.in_features = in_features
        self.out_features = out_features
        self.device_id = device_id
        self.s = s
        self.m = m
        print("self.device_id", self.device_id)
        self.weight = nn.Parameter(torch.FloatTensor(out_features, in_features))
        nn.init.xavier_uniform_(self.weight)

    def forward(self, input, label):
        # --------------------------- cos(theta) & phi(theta) ---------------------------

        if self.device_id == None:
            cosine = F.linear(F.normalize(input), F.normalize(self.weight))
        else:
            x = input
            sub_weights = torch.chunk(self.weight, len(self.device_id), dim=0)
            temp_x = x.cuda(self.device_id[0])
            weight = sub_weights[0].cuda(self.device_id[0])
            cosine = F.linear(F.normalize(temp_x), F.normalize(weight))
            for i in range(1, len(self.device_id)):
                temp_x = x.cuda(self.device_id[i])
                weight = sub_weights[i].cuda(self.device_id[i])
                cosine = torch.cat((cosine, F.linear(F.normalize(temp_x), F.normalize(weight)).cuda(self.device_id[0])),
                                   dim=1)
        phi = cosine - self.m
        # --------------------------- convert label to one-hot ---------------------------
        one_hot = torch.zeros(cosine.size())
        if self.device_id != None:
            one_hot = one_hot.cuda(self.device_id[0])
        # one_hot = one_hot.cuda() if cosine.is_cuda else one_hot

        one_hot.scatter_(1, label.view(-1, 1).long(), 1)
        # -------------torch.where(out_i = {x_i if condition_i else y_i) -------------
        output = (one_hot * phi) + (
                    (1.0 - one_hot) * cosine)  # you can use torch.where if your torch.__version__ is 0.4
        output *= self.s

        return output

    def __repr__(self):
        return self.__class__.__name__ + '(' \
               + 'in_features = ' + str(self.in_features) \
               + ', out_features = ' + str(self.out_features) \
               + ', s = ' + str(self.s) \
               + ', m = ' + str(self.m) + ')'

In [10]:
class Residual(nn.Module):
    def __init__(self, fn):
        super().__init__()
        self.fn = fn
    def forward(self, x, **kwargs):
        return self.fn(x, **kwargs) + x

In [11]:
class PreNorm(nn.Module):
    def __init__(self, dim, fn):
        super().__init__()
        self.norm = nn.LayerNorm(dim)
        self.fn = fn
    def forward(self, x, **kwargs):
        return self.fn(self.norm(x), **kwargs)

In [12]:
class FeedForward(nn.Module):
    def __init__(self, dim, hidden_dim, dropout = 0.):
        super().__init__()
        self.net = nn.Sequential(
            nn.Linear(dim, hidden_dim),
            nn.GELU(),
            nn.Dropout(dropout),
            nn.Linear(hidden_dim, dim),
            nn.Dropout(dropout)
        )
    def forward(self, x):
        return self.net(x)

In [13]:
class Attention(nn.Module):
    def __init__(self, dim, heads = 8, dim_head = 64, dropout = 0.):
        super().__init__()
        inner_dim = dim_head *  heads
        self.heads = heads
        self.scale = dim ** -0.5

        self.to_qkv = nn.Linear(dim, inner_dim * 3, bias = False)
        self.to_out = nn.Sequential(
            nn.Linear(inner_dim, dim),
            nn.Dropout(dropout)
        )

    def forward(self, x, mask = None):
        b, n, _, h = *x.shape, self.heads
        qkv = self.to_qkv(x).chunk(3, dim = -1)

        q, k, v = map(lambda t: rearrange(t, 'b n (h d) -> b h n d', h = h), qkv)
        dots = torch.einsum('bhid,bhjd->bhij', q, k) * self.scale
        mask_value = -torch.finfo(dots.dtype).max
        #embed()
        if mask is not None:
            mask = F.pad(mask.flatten(1), (1, 0), value = True)
            assert mask.shape[-1] == dots.shape[-1], 'mask has incorrect dimensions'
            mask = mask[:, None, :] * mask[:, :, None]
            dots.masked_fill_(~mask, mask_value)
            del mask

        attn = dots.softmax(dim=-1)

        out = torch.einsum('bhij,bhjd->bhid', attn, v)
        out = rearrange(out, 'b h n d -> b n (h d)')
        out =  self.to_out(out)

        return out

In [14]:
class Transformer(nn.Module):
    def __init__(self, dim, depth, heads, dim_head, mlp_dim, dropout):
        super().__init__()
        self.layers = nn.ModuleList([])
        for _ in range(depth):
            self.layers.append(nn.ModuleList([
                Residual(PreNorm(dim, Attention(dim, heads = heads, dim_head = dim_head, dropout = dropout))),
                Residual(PreNorm(dim, FeedForward(dim, mlp_dim, dropout = dropout)))
            ]))
    def forward(self, x, mask = None):
        for attn, ff in self.layers:
            x = attn(x, mask = mask)
            #embed()
            x = ff(x)
        return x

In [15]:
class ViTs_face(nn.Module):
    def __init__(self, *, loss_type, GPU_ID, num_class, image_size, patch_size, ac_patch_size,
                         pad, dim, depth, heads, mlp_dim, pool = 'mean', channels = 3, dim_head = 64, dropout = 0., emb_dropout = 0.):
        super().__init__()
        assert image_size % patch_size == 0, 'Image dimensions must be divisible by the patch size.'
        num_patches = (image_size // patch_size) ** 2
        patch_dim = channels * ac_patch_size ** 2
        assert num_patches > MIN_NUM_PATCHES, f'your number of patches ({num_patches}) is way too small for attention to be effective (at least 16). Try decreasing your patch size'
        assert pool in {'cls', 'mean'}, 'pool type must be either cls (cls token) or mean (mean pooling)'

        self.patch_size = patch_size
        self.soft_split = nn.Unfold(kernel_size=(ac_patch_size, ac_patch_size), stride=(self.patch_size, self.patch_size), padding=(pad, pad))


        self.pos_embedding = nn.Parameter(torch.randn(1, num_patches + 1, dim))
        self.patch_to_embedding = nn.Linear(patch_dim, dim)
        self.cls_token = nn.Parameter(torch.randn(1, 1, dim))
        self.dropout = nn.Dropout(emb_dropout)

        self.transformer = Transformer(dim, depth, heads, dim_head, mlp_dim, dropout)

        self.pool = pool
        self.to_latent = nn.Identity()

        self.mlp_head = nn.Sequential(
            nn.LayerNorm(dim),
        )
        self.loss_type = loss_type
        self.GPU_ID = GPU_ID
        if self.loss_type == 'None':
            print("no loss for vit_face")
        else:
            if self.loss_type == 'Softmax':
                self.loss = Softmax(in_features=dim, out_features=num_class, device_id=self.GPU_ID)
            elif self.loss_type == 'CosFace':
                self.loss = CosFace(in_features=dim, out_features=num_class, device_id=self.GPU_ID)
            elif self.loss_type == 'ArcFace':
                self.loss = ArcFace(in_features=dim, out_features=num_class, device_id=self.GPU_ID)
            elif self.loss_type == 'SFace':
                self.loss = SFaceLoss(in_features=dim, out_features=num_class, device_id=self.GPU_ID)

    def forward(self, img, label= None , mask = None):
        p = self.patch_size
        x = self.soft_split(img).transpose(1, 2)
        x = self.patch_to_embedding(x)
        b, n, _ = x.shape

        cls_tokens = repeat(self.cls_token, '() n d -> b n d', b = b)
        x = torch.cat((cls_tokens, x), dim=1)
        x += self.pos_embedding[:, :(n + 1)]
        x = self.dropout(x)
        x = self.transformer(x, mask)

        y = x[:, 0]
        z = x[:, 1:].mean(dim = 1)

        y = self.to_latent(y)
        emb_y = self.mlp_head(y)
        z = self.to_latent(z)
        emb_z = self.mlp_head(z)
        emb = torch.cat((emb_y, emb_z), dim=1)
        if label is not None:
            x = self.loss(emb, label)
            return x, emb
        else:
            return emb

In [16]:
class ViT_plus(nn.Module):
    def __init__(self):
        super(ViT_plus, self).__init__()
        
        self.fc1 = nn.Linear(in_features=1024, out_features=1024)
        self.fc2 = nn.Linear(in_features=1024, out_features=2)
        
    def forward(self, x):
        x = self.fc1(x)
        x_cosface = x
        x_classification = self.fc2(x)
        
        return x_cosface, x_classification

In [19]:
model = ViTs_face(
            loss_type='CosFace',
            GPU_ID=[device],
            num_class=93431,
            image_size=112,
            patch_size=8,
            ac_patch_size=12,
            pad=4,
            dim=512,
            depth=20,
            heads=8,
            mlp_dim=2048,
            dropout=0.1,
            emb_dropout=0.1
        ).to(device)
model.load_state_dict(
    torch.load("../Backbone_VITs_Epoch_2_Batch_12000_Time_2021-03-17-04-05_checkpoint.pth", map_location=device)
)

self.device_id [device(type='cuda', index=2)]


<All keys matched successfully>

In [20]:
for param in model.parameters():
    param.requires_grad = False

In [21]:
embeds = {}
model.eval()

with torch.no_grad():
    for img, _, file in train_data:
        img = img.to(device)
        embeds[file] = model(torch.unsqueeze(img, 0))

    for img, _, file in val_data:
        img = img.to(device)
        embeds[file] = model(torch.unsqueeze(img, 0))

In [23]:
best_accu = 0.0
def objective(trial):
    model_xtr = ViT_plus().to(device)
    
    loss_lr = trial.suggest_float("loss_learning_rate", 1e-4, 1e-2, log=True)
    arc_margin = losses.ArcFaceLoss(2, 1024).to(device)
    loss_optimizer = opt.AdamW(arc_margin.parameters(), lr=loss_lr)
    
    lr = trial.suggest_float("learning_rate", 1e-5, 1e-1, log=True)
    wd = trial.suggest_float('weight_decay', 1e-4, 1e-2, log=True)
    eps = trial.suggest_float("epsilon", 1e-9, 1e-7, log=True)
    optimizer = opt.AdamW(model_xtr.parameters(), lr=lr, eps=eps, weight_decay=wd)
    
    beta = trial.suggest_float("beta", 0.1, 1.0, step=0.1)
    gamma = trial.suggest_float("gamma", 0.1, 1.0, step=0.1)
    criterion = CombinedLoss(beta=beta).to(device)
    
    batch_size = trial.suggest_int('batch_size', 50, 300)
    num_epochs = trial.suggest_int('epochs', 10, 100)
    
    print("Learning rate for Loss: "+ str(loss_lr))
    print("Learning rate: "+ str(lr))
    print("Weight decay: "+ str(wd))
    print("Epsilon: "+ str(eps))
    print("Beta: "+ str(beta))
    print("Gamma: "+ str(gamma))
    print("Batch size: "+ str(batch_size))
    print("Number of epochs: "+ str(num_epochs))
    
    for epoch in tqdm(range(num_epochs), desc="Epochs"):
        train_loader = DataLoader(train_data, batch_size=batch_size, shuffle=True, num_workers=4)
        val_loader = DataLoader(val_data, batch_size=batch_size, shuffle=False, num_workers=4)
        
        # training loop
        running_loss = []
        running_accu = []
        
        model_xtr.train()
        for img, pos_img, neg_img, label, img_file, pos_file, neg_file in tqdm(train_loader, desc="Training", leave=False):
            img, pos_img, neg_img, label = img.to(device), pos_img.to(device), neg_img.to(device), label.to(device)

            x1 = file_to_embed(embeds, img_file)
            x2 = file_to_embed(embeds, pos_file)
            x3 = file_to_embed(embeds, neg_file)
            
            optimizer.zero_grad()
            anchor, output = model_xtr(x1)
            pos, _ = model_xtr(x2)
            neg, _ = model_xtr(x3)
            
            pred = torch.argmax(output, 1)
            accuracy = torch.eq(pred, label).sum() / len(img)

            class_triplet_loss = criterion(anchor, pos, neg, output, label)
            arc_loss = arc_margin(anchor, label)
            loss = (gamma * arc_loss) + class_triplet_loss
            loss.backward()
            loss_optimizer.step()
            optimizer.step()

            running_accu.append(accuracy.cpu().detach().numpy())
            running_loss.append(loss.cpu().detach().numpy())
        print("Epoch: {}/{} - Loss: {:.4f} - Accuracy: {:.4f}".format(epoch+1, num_epochs, np.mean(running_loss), np.mean(running_accu)))
        
        # validation loop
        val_loss = []
        val_accu = []

        model_xtr.eval()
        with torch.no_grad():
            for img, pos_img, neg_img, label, img_file, pos_file, neg_file in tqdm(val_loader):
                img, pos_img, neg_img, label = img.to(device), pos_img.to(device), neg_img.to(device), label.to(device)
                
                x1 = file_to_embed(embeds, img_file)
                x2 = file_to_embed(embeds, pos_file)
                x3 = file_to_embed(embeds, neg_file)
                
                anchor, output = model_xtr(x1)
                pos, _ = model_xtr(x2)
                neg, _ = model_xtr(x3)
                
                pred = torch.argmax(output, 1)
                accuracy = torch.eq(pred, label).sum() / len(img)
                
                class_triplet_loss = criterion(anchor, pos, neg, output, label)
                arc_loss = arc_margin(anchor, label)
                loss = (gamma * arc_loss) + class_triplet_loss
                
                val_accu.append(accuracy.cpu().detach().numpy())
                val_loss.append(loss.cpu().detach().numpy())
        val_accu = np.mean(val_accu)
        val_loss = np.mean(val_loss)
        print("Val Loss: {:.4f} - Val Accuracy: {:.4f}".format(val_loss, val_accu))
        
        trial.report(val_accu, epoch)
        if trial.should_prune():
            raise optuna.exceptions.TrialPruned()
    
    global best_accu
    if val_accu > best_accu:
        best_accu = val_accu
        print("Saving best model...")
        torch.save(model_xtr.state_dict(), "../vit_12-8_triplet_arcface_mean.pt")
            
    return val_accu

In [26]:
study = optuna.create_study(direction='maximize',
                            study_name='triplet-arcface-12-8-mean-vit-study',
                            storage='sqlite:///study5.db',
                            load_if_exists=True)
study.optimize(objective, n_trials=5)

pruned_trials = study.get_trials(deepcopy=False, states=[TrialState.PRUNED])
complete_trials = study.get_trials(deepcopy=False, states=[TrialState.COMPLETE])

# Display the study statistics
print("\nStudy statistics: ")
print("  Number of finished trials: ", len(study.trials))
print("  Number of pruned trials: ", len(pruned_trials))
print("  Number of complete trials: ", len(complete_trials))

[32m[I 2023-12-08 09:37:03,248][0m A new study created in RDB with name: triplet-arcface-12-8-mean-vit-study[0m


Learning rate for Loss: 0.0035987381095719333
Learning rate: 1.1042719857613235e-05
Weight decay: 0.0009341013224507427
Epsilon: 1.0684926352395233e-09
Beta: 0.1
Gamma: 0.7000000000000001
Batch size: 218
Number of epochs: 33


Epochs:   0%|          | 0/33 [00:00<?, ?it/s]
Training:   0%|          | 0/65 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/65 [00:04<04:53,  4.59s/it][A
Training:   3%|▎         | 2/65 [00:04<02:03,  1.96s/it][A
Training:   5%|▍         | 3/65 [00:04<01:09,  1.12s/it][A
Training:   8%|▊         | 5/65 [00:08<01:36,  1.60s/it][A
Training:   9%|▉         | 6/65 [00:08<01:10,  1.19s/it][A
Training:  12%|█▏        | 8/65 [00:09<00:38,  1.46it/s][A
Training:  14%|█▍        | 9/65 [00:13<01:23,  1.49s/it][A
Training:  17%|█▋        | 11/65 [00:13<00:49,  1.10it/s][A
Training:  20%|██        | 13/65 [00:17<01:07,  1.30s/it][A
Training:  23%|██▎       | 15/65 [00:17<00:43,  1.14it/s][A
Training:  26%|██▌       | 17/65 [00:21<01:00,  1.25s/it][A
Training:  29%|██▉       | 19/65 [00:21<00:40,  1.15it/s][A
Training:  32%|███▏      | 21/65 [00:26<00:58,  1.32s/it][A
Training:  34%|███▍      | 22/65 [00:26<00:47,  1.10s/it][A
Training:  35%|███▌      | 23/65 [00:26<00:37,  1.12it

Epoch: 1/33 - Loss: 21.4630 - Accuracy: 0.5781



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:05<00:43,  5.47s/it][A
 22%|██▏       | 2/9 [00:05<00:16,  2.36s/it][A
 33%|███▎      | 3/9 [00:05<00:08,  1.37s/it][A
 44%|████▍     | 4/9 [00:05<00:04,  1.15it/s][A
 56%|█████▌    | 5/9 [00:10<00:08,  2.17s/it][A
 67%|██████▋   | 6/9 [00:10<00:04,  1.55s/it][A
100%|██████████| 9/9 [00:11<00:00,  1.23s/it][A
Epochs:   3%|▎         | 1/33 [01:29<47:49, 89.68s/it]

Val Loss: 18.5190 - Val Accuracy: 0.6845



Training:   0%|          | 0/65 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/65 [00:06<06:47,  6.36s/it][A
Training:   5%|▍         | 3/65 [00:06<01:47,  1.74s/it][A
Training:   8%|▊         | 5/65 [00:11<02:09,  2.16s/it][A
Training:   9%|▉         | 6/65 [00:11<01:35,  1.63s/it][A
Training:  12%|█▏        | 8/65 [00:12<00:54,  1.05it/s][A
Training:  14%|█▍        | 9/65 [00:17<01:46,  1.91s/it][A
Training:  15%|█▌        | 10/65 [00:17<01:21,  1.49s/it][A
Training:  18%|█▊        | 12/65 [00:17<00:47,  1.12it/s][A
Training:  20%|██        | 13/65 [00:22<01:32,  1.77s/it][A
Training:  22%|██▏       | 14/65 [00:22<01:12,  1.42s/it][A
Training:  25%|██▍       | 16/65 [00:22<00:42,  1.16it/s][A
Training:  26%|██▌       | 17/65 [00:27<01:25,  1.77s/it][A
Training:  28%|██▊       | 18/65 [00:27<01:06,  1.41s/it][A
Training:  29%|██▉       | 19/65 [00:27<00:49,  1.08s/it][A
Training:  32%|███▏      | 21/65 [00:32<01:07,  1.53s/it][A
Training:  34%|███▍      | 22/65 [00:3

Epoch: 2/33 - Loss: 16.6646 - Accuracy: 0.6864



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:05<00:45,  5.65s/it][A
 22%|██▏       | 2/9 [00:05<00:16,  2.42s/it][A
 44%|████▍     | 4/9 [00:05<00:04,  1.05it/s][A
 56%|█████▌    | 5/9 [00:10<00:08,  2.07s/it][A
 67%|██████▋   | 6/9 [00:10<00:04,  1.47s/it][A
100%|██████████| 9/9 [00:10<00:00,  1.22s/it][A
Epochs:   6%|▌         | 2/33 [03:06<48:22, 93.63s/it]

Val Loss: 13.7103 - Val Accuracy: 0.7722



Training:   0%|          | 0/65 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/65 [00:06<06:49,  6.40s/it][A
Training:   3%|▎         | 2/65 [00:06<02:52,  2.74s/it][A
Training:   6%|▌         | 4/65 [00:06<01:04,  1.06s/it][A
Training:   9%|▉         | 6/65 [00:12<01:47,  1.83s/it][A
Training:  12%|█▏        | 8/65 [00:12<01:03,  1.11s/it][A
Training:  15%|█▌        | 10/65 [00:17<01:29,  1.62s/it][A
Training:  18%|█▊        | 12/65 [00:17<00:58,  1.09s/it][A
Training:  20%|██        | 13/65 [00:22<01:36,  1.86s/it][A
Training:  23%|██▎       | 15/65 [00:22<01:00,  1.21s/it][A
Training:  26%|██▌       | 17/65 [00:27<01:20,  1.67s/it][A
Training:  28%|██▊       | 18/65 [00:27<01:04,  1.37s/it][A
Training:  29%|██▉       | 19/65 [00:27<00:50,  1.11s/it][A
Training:  31%|███       | 20/65 [00:28<00:39,  1.15it/s][A
Training:  32%|███▏      | 21/65 [00:31<01:12,  1.65s/it][A
Training:  35%|███▌      | 23/65 [00:32<00:41,  1.01it/s][A
Training:  38%|███▊      | 25/65 [00:

Epoch: 3/33 - Loss: 12.9850 - Accuracy: 0.7915



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:05<00:42,  5.34s/it][A
 33%|███▎      | 3/9 [00:05<00:08,  1.47s/it][A
 44%|████▍     | 4/9 [00:05<00:05,  1.06s/it][A
 56%|█████▌    | 5/9 [00:10<00:08,  2.23s/it][A
100%|██████████| 9/9 [00:10<00:00,  1.20s/it][A
Epochs:   9%|▉         | 3/33 [04:41<47:14, 94.50s/it]

Val Loss: 11.2301 - Val Accuracy: 0.8614



Training:   0%|          | 0/65 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/65 [00:06<06:49,  6.39s/it][A
Training:   3%|▎         | 2/65 [00:06<02:49,  2.70s/it][A
Training:   6%|▌         | 4/65 [00:06<01:03,  1.04s/it][A
Training:   9%|▉         | 6/65 [00:11<01:46,  1.81s/it][A
Training:  11%|█         | 7/65 [00:12<01:20,  1.38s/it][A
Training:  12%|█▏        | 8/65 [00:12<01:00,  1.07s/it][A
Training:  14%|█▍        | 9/65 [00:17<01:59,  2.14s/it][A
Training:  15%|█▌        | 10/65 [00:17<01:26,  1.58s/it][A
Training:  17%|█▋        | 11/65 [00:17<01:02,  1.16s/it][A
Training:  18%|█▊        | 12/65 [00:17<00:45,  1.16it/s][A
Training:  20%|██        | 13/65 [00:22<01:46,  2.05s/it][A
Training:  23%|██▎       | 15/65 [00:22<00:57,  1.15s/it][A
Training:  26%|██▌       | 17/65 [00:28<01:24,  1.77s/it][A
Training:  28%|██▊       | 18/65 [00:28<01:06,  1.41s/it][A
Training:  31%|███       | 20/65 [00:28<00:39,  1.13it/s][A
Training:  32%|███▏      | 21/65 [00:32

Epoch: 4/33 - Loss: 10.6680 - Accuracy: 0.8570



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:05<00:43,  5.46s/it][A
 22%|██▏       | 2/9 [00:05<00:16,  2.37s/it][A
 44%|████▍     | 4/9 [00:05<00:04,  1.07it/s][A
 56%|█████▌    | 5/9 [00:10<00:08,  2.03s/it][A
 67%|██████▋   | 6/9 [00:10<00:04,  1.51s/it][A
100%|██████████| 9/9 [00:10<00:00,  1.21s/it][A
Epochs:  12%|█▏        | 4/33 [06:18<46:04, 95.31s/it]

Val Loss: 9.3463 - Val Accuracy: 0.8986



Training:   0%|          | 0/65 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/65 [00:06<06:28,  6.07s/it][A
Training:   3%|▎         | 2/65 [00:06<02:47,  2.67s/it][A
Training:   6%|▌         | 4/65 [00:06<01:03,  1.04s/it][A
Training:   8%|▊         | 5/65 [00:11<02:16,  2.28s/it][A
Training:   9%|▉         | 6/65 [00:12<01:41,  1.72s/it][A
Training:  11%|█         | 7/65 [00:12<01:12,  1.25s/it][A
Training:  12%|█▏        | 8/65 [00:12<00:52,  1.09it/s][A
Training:  14%|█▍        | 9/65 [00:16<01:53,  2.03s/it][A
Training:  15%|█▌        | 10/65 [00:17<01:24,  1.54s/it][A
Training:  17%|█▋        | 11/65 [00:17<01:00,  1.11s/it][A
Training:  18%|█▊        | 12/65 [00:17<00:43,  1.22it/s][A
Training:  20%|██        | 13/65 [00:22<01:41,  1.95s/it][A
Training:  22%|██▏       | 14/65 [00:22<01:15,  1.48s/it][A
Training:  23%|██▎       | 15/65 [00:22<00:54,  1.09s/it][A
Training:  25%|██▍       | 16/65 [00:22<00:39,  1.24it/s][A
Training:  26%|██▌       | 17/65 [00:27<

Epoch: 5/33 - Loss: 9.1216 - Accuracy: 0.8907



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:05<00:43,  5.44s/it][A
 33%|███▎      | 3/9 [00:05<00:08,  1.47s/it][A
 44%|████▍     | 4/9 [00:05<00:05,  1.01s/it][A
 56%|█████▌    | 5/9 [00:10<00:09,  2.26s/it][A
100%|██████████| 9/9 [00:10<00:00,  1.21s/it][A
Epochs:  15%|█▌        | 5/33 [07:55<44:52, 96.17s/it]

Val Loss: 8.0325 - Val Accuracy: 0.9159



Training:   0%|          | 0/65 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/65 [00:06<06:41,  6.28s/it][A
Training:   5%|▍         | 3/65 [00:06<01:44,  1.68s/it][A
Training:   6%|▌         | 4/65 [00:06<01:09,  1.14s/it][A
Training:   8%|▊         | 5/65 [00:12<02:35,  2.60s/it][A
Training:   9%|▉         | 6/65 [00:12<01:46,  1.81s/it][A
Training:  12%|█▏        | 8/65 [00:12<00:57,  1.00s/it][A
Training:  14%|█▍        | 9/65 [00:17<01:58,  2.12s/it][A
Training:  15%|█▌        | 10/65 [00:18<01:27,  1.59s/it][A
Training:  17%|█▋        | 11/65 [00:18<01:04,  1.19s/it][A
Training:  20%|██        | 13/65 [00:23<01:30,  1.75s/it][A
Training:  23%|██▎       | 15/65 [00:23<00:54,  1.09s/it][A
Training:  26%|██▌       | 17/65 [00:28<01:17,  1.62s/it][A
Training:  28%|██▊       | 18/65 [00:28<01:02,  1.32s/it][A
Training:  29%|██▉       | 19/65 [00:28<00:48,  1.06s/it][A
Training:  31%|███       | 20/65 [00:28<00:37,  1.20it/s][A
Training:  32%|███▏      | 21/65 [00:33

Epoch: 6/33 - Loss: 7.9902 - Accuracy: 0.9112



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:05<00:44,  5.53s/it][A
 33%|███▎      | 3/9 [00:05<00:08,  1.49s/it][A
 56%|█████▌    | 5/9 [00:10<00:08,  2.01s/it][A
100%|██████████| 9/9 [00:10<00:00,  1.22s/it][A
Epochs:  18%|█▊        | 6/33 [09:33<43:31, 96.73s/it]

Val Loss: 7.1481 - Val Accuracy: 0.9307



Training:   0%|          | 0/65 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/65 [00:06<06:38,  6.22s/it][A
Training:   3%|▎         | 2/65 [00:06<02:47,  2.66s/it][A
Training:   5%|▍         | 3/65 [00:06<01:34,  1.53s/it][A
Training:   6%|▌         | 4/65 [00:06<00:59,  1.03it/s][A
Training:   8%|▊         | 5/65 [00:12<02:32,  2.55s/it][A
Training:   9%|▉         | 6/65 [00:12<01:44,  1.76s/it][A
Training:  11%|█         | 7/65 [00:12<01:10,  1.22s/it][A
Training:  12%|█▏        | 8/65 [00:12<00:49,  1.14it/s][A
Training:  14%|█▍        | 9/65 [00:17<01:58,  2.12s/it][A
Training:  15%|█▌        | 10/65 [00:17<01:24,  1.54s/it][A
Training:  18%|█▊        | 12/65 [00:17<00:45,  1.17it/s][A
Training:  20%|██        | 13/65 [00:22<01:37,  1.88s/it][A
Training:  22%|██▏       | 14/65 [00:23<01:15,  1.49s/it][A
Training:  25%|██▍       | 16/65 [00:23<00:43,  1.14it/s][A
Training:  26%|██▌       | 17/65 [00:27<01:24,  1.76s/it][A
Training:  28%|██▊       | 18/65 [00:28<0

Epoch: 7/33 - Loss: 7.1424 - Accuracy: 0.9214



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:05<00:43,  5.49s/it][A
 33%|███▎      | 3/9 [00:05<00:09,  1.51s/it][A
 44%|████▍     | 4/9 [00:05<00:05,  1.03s/it][A
 56%|█████▌    | 5/9 [00:10<00:08,  2.22s/it][A
100%|██████████| 9/9 [00:10<00:00,  1.20s/it][A
Epochs:  21%|██        | 7/33 [11:10<41:59, 96.92s/it]

Val Loss: 6.3691 - Val Accuracy: 0.9363



Training:   0%|          | 0/65 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/65 [00:06<06:45,  6.34s/it][A
Training:   3%|▎         | 2/65 [00:06<02:48,  2.67s/it][A
Training:   5%|▍         | 3/65 [00:06<01:33,  1.51s/it][A
Training:   6%|▌         | 4/65 [00:06<00:59,  1.02it/s][A
Training:   8%|▊         | 5/65 [00:12<02:34,  2.57s/it][A
Training:  11%|█         | 7/65 [00:12<01:16,  1.32s/it][A
Training:  12%|█▏        | 8/65 [00:12<00:57,  1.02s/it][A
Training:  14%|█▍        | 9/65 [00:17<01:59,  2.13s/it][A
Training:  15%|█▌        | 10/65 [00:17<01:25,  1.56s/it][A
Training:  17%|█▋        | 11/65 [00:17<01:01,  1.15s/it][A
Training:  18%|█▊        | 12/65 [00:17<00:44,  1.18it/s][A
Training:  20%|██        | 13/65 [00:23<01:48,  2.09s/it][A
Training:  22%|██▏       | 14/65 [00:23<01:17,  1.51s/it][A
Training:  23%|██▎       | 15/65 [00:23<00:55,  1.12s/it][A
Training:  25%|██▍       | 16/65 [00:23<00:40,  1.22it/s][A
Training:  26%|██▌       | 17/65 [00:28<

Epoch: 8/33 - Loss: 6.4735 - Accuracy: 0.9274



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:05<00:42,  5.34s/it][A
 22%|██▏       | 2/9 [00:05<00:15,  2.28s/it][A
 33%|███▎      | 3/9 [00:05<00:07,  1.30s/it][A
 56%|█████▌    | 5/9 [00:10<00:07,  1.88s/it][A
 67%|██████▋   | 6/9 [00:10<00:04,  1.39s/it][A
100%|██████████| 9/9 [00:10<00:00,  1.19s/it][A
Epochs:  24%|██▍       | 8/33 [12:47<40:22, 96.90s/it]

Val Loss: 5.6681 - Val Accuracy: 0.9393



Training:   0%|          | 0/65 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/65 [00:06<07:21,  6.90s/it][A
Training:   5%|▍         | 3/65 [00:07<01:54,  1.85s/it][A
Training:   8%|▊         | 5/65 [00:13<02:26,  2.45s/it][A
Training:   9%|▉         | 6/65 [00:13<01:51,  1.89s/it][A
Training:  11%|█         | 7/65 [00:13<01:21,  1.41s/it][A
Training:  12%|█▏        | 8/65 [00:13<00:59,  1.05s/it][A
Training:  14%|█▍        | 9/65 [00:20<02:28,  2.65s/it][A
Training:  15%|█▌        | 10/65 [00:20<01:48,  1.98s/it][A
Training:  17%|█▋        | 11/65 [00:20<01:18,  1.46s/it][A
Training:  18%|█▊        | 12/65 [00:21<00:57,  1.08s/it][A
Training:  20%|██        | 13/65 [00:28<02:35,  2.99s/it][A
Training:  22%|██▏       | 14/65 [00:28<01:50,  2.17s/it][A
Training:  23%|██▎       | 15/65 [00:28<01:17,  1.56s/it][A
Training:  25%|██▍       | 16/65 [00:29<00:57,  1.17s/it][A
Training:  26%|██▌       | 17/65 [00:37<02:42,  3.39s/it][A
Training:  28%|██▊       | 18/65 [00:37

Epoch: 9/33 - Loss: 5.9266 - Accuracy: 0.9314



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:12<01:36, 12.09s/it][A
 22%|██▏       | 2/9 [00:12<00:36,  5.17s/it][A
 33%|███▎      | 3/9 [00:12<00:17,  2.90s/it][A
 44%|████▍     | 4/9 [00:13<00:09,  1.92s/it][A
 56%|█████▌    | 5/9 [00:22<00:18,  4.68s/it][A
 67%|██████▋   | 6/9 [00:22<00:09,  3.12s/it][A
100%|██████████| 9/9 [00:23<00:00,  2.58s/it][A
Epochs:  27%|██▋       | 9/33 [15:59<50:39, 126.66s/it]

Val Loss: 5.0329 - Val Accuracy: 0.9439



Training:   0%|          | 0/65 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/65 [00:13<14:39, 13.73s/it][A
Training:   3%|▎         | 2/65 [00:14<06:08,  5.86s/it][A
Training:   5%|▍         | 3/65 [00:14<03:29,  3.39s/it][A
Training:   6%|▌         | 4/65 [00:14<02:09,  2.12s/it][A
Training:   8%|▊         | 5/65 [00:27<05:48,  5.81s/it][A
Training:   9%|▉         | 6/65 [00:27<03:52,  3.93s/it][A
Training:  11%|█         | 7/65 [00:27<02:40,  2.76s/it][A
Training:  12%|█▏        | 8/65 [00:27<01:49,  1.92s/it][A
Training:  14%|█▍        | 9/65 [00:38<04:19,  4.64s/it][A
Training:  15%|█▌        | 10/65 [00:38<02:59,  3.27s/it][A
Training:  17%|█▋        | 11/65 [00:38<02:08,  2.38s/it][A
Training:  18%|█▊        | 12/65 [00:39<01:30,  1.71s/it][A
Training:  20%|██        | 13/65 [00:50<03:52,  4.47s/it][A
Training:  22%|██▏       | 14/65 [00:50<02:46,  3.27s/it][A
Training:  23%|██▎       | 15/65 [00:51<02:02,  2.46s/it][A
Training:  25%|██▍       | 16/65 [00:51<0

Epoch: 10/33 - Loss: 5.3768 - Accuracy: 0.9369



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:12<01:41, 12.66s/it][A
 22%|██▏       | 2/9 [00:13<00:37,  5.41s/it][A
 33%|███▎      | 3/9 [00:13<00:18,  3.02s/it][A
 56%|█████▌    | 5/9 [00:23<00:17,  4.36s/it][A
 78%|███████▊  | 7/9 [00:24<00:04,  2.44s/it][A
100%|██████████| 9/9 [00:25<00:00,  2.81s/it][A
Epochs:  30%|███       | 10/33 [19:39<59:35, 155.47s/it]

Val Loss: 4.5281 - Val Accuracy: 0.9475



Training:   0%|          | 0/65 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/65 [00:14<15:13, 14.27s/it][A
Training:   3%|▎         | 2/65 [00:14<06:20,  6.04s/it][A
Training:   5%|▍         | 3/65 [00:14<03:28,  3.36s/it][A
Training:   6%|▌         | 4/65 [00:15<02:12,  2.18s/it][A
Training:   8%|▊         | 5/65 [00:26<05:24,  5.41s/it][A
Training:   9%|▉         | 6/65 [00:26<03:39,  3.72s/it][A
Training:  11%|█         | 7/65 [00:26<02:30,  2.59s/it][A
Training:  12%|█▏        | 8/65 [00:27<01:46,  1.86s/it][A
Training:  14%|█▍        | 9/65 [00:38<04:26,  4.76s/it][A
Training:  15%|█▌        | 10/65 [00:38<03:08,  3.42s/it][A
Training:  17%|█▋        | 11/65 [00:38<02:10,  2.42s/it][A
Training:  18%|█▊        | 12/65 [00:39<01:32,  1.75s/it][A
Training:  20%|██        | 13/65 [00:50<03:57,  4.56s/it][A
Training:  22%|██▏       | 14/65 [00:50<02:48,  3.30s/it][A
Training:  23%|██▎       | 15/65 [00:50<01:57,  2.35s/it][A
Training:  25%|██▍       | 16/65 [00:51<0

Epoch: 11/33 - Loss: 4.9857 - Accuracy: 0.9397



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:11<01:32, 11.58s/it][A
 22%|██▏       | 2/9 [00:11<00:33,  4.86s/it][A
 44%|████▍     | 4/9 [00:12<00:10,  2.01s/it][A
 56%|█████▌    | 5/9 [00:22<00:17,  4.41s/it][A
 67%|██████▋   | 6/9 [00:22<00:09,  3.18s/it][A
 78%|███████▊  | 7/9 [00:22<00:04,  2.33s/it][A
 89%|████████▉ | 8/9 [00:23<00:01,  1.72s/it][A
100%|██████████| 9/9 [00:23<00:00,  2.62s/it][A
Epochs:  33%|███▎      | 11/33 [23:16<1:03:49, 174.08s/it]

Val Loss: 4.6540 - Val Accuracy: 0.9506



Training:   0%|          | 0/65 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/65 [00:14<15:09, 14.21s/it][A
Training:   3%|▎         | 2/65 [00:14<06:12,  5.92s/it][A
Training:   5%|▍         | 3/65 [00:14<03:24,  3.31s/it][A
Training:   8%|▊         | 5/65 [00:26<04:41,  4.69s/it][A
Training:   9%|▉         | 6/65 [00:26<03:27,  3.52s/it][A
Training:  11%|█         | 7/65 [00:26<02:30,  2.59s/it][A
Training:  12%|█▏        | 8/65 [00:27<01:46,  1.87s/it][A
Training:  14%|█▍        | 9/65 [00:38<04:16,  4.57s/it][A
Training:  15%|█▌        | 10/65 [00:38<03:01,  3.31s/it][A
Training:  18%|█▊        | 12/65 [00:38<01:38,  1.85s/it][A
Training:  20%|██        | 13/65 [00:50<03:39,  4.22s/it][A
Training:  22%|██▏       | 14/65 [00:50<02:41,  3.17s/it][A
Training:  23%|██▎       | 15/65 [00:50<01:57,  2.34s/it][A
Training:  25%|██▍       | 16/65 [00:50<01:26,  1.76s/it][A
Training:  26%|██▌       | 17/65 [01:01<03:33,  4.45s/it][A
Training:  29%|██▉       | 19/65 [01:02<

Epoch: 12/33 - Loss: 4.6485 - Accuracy: 0.9420



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:11<01:33, 11.66s/it][A
 22%|██▏       | 2/9 [00:12<00:34,  5.00s/it][A
 33%|███▎      | 3/9 [00:12<00:16,  2.77s/it][A
 44%|████▍     | 4/9 [00:12<00:09,  1.81s/it][A
 56%|█████▌    | 5/9 [00:22<00:18,  4.63s/it][A
 67%|██████▋   | 6/9 [00:22<00:09,  3.13s/it][A
 78%|███████▊  | 7/9 [00:22<00:04,  2.18s/it][A
 89%|████████▉ | 8/9 [00:22<00:01,  1.62s/it][A
100%|██████████| 9/9 [00:23<00:00,  2.59s/it][A
Epochs:  36%|███▋      | 12/33 [26:50<1:05:14, 186.38s/it]

Val Loss: 3.9197 - Val Accuracy: 0.9521



Training:   0%|          | 0/65 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/65 [00:14<15:32, 14.57s/it][A
Training:   3%|▎         | 2/65 [00:14<06:30,  6.20s/it][A
Training:   5%|▍         | 3/65 [00:15<03:33,  3.44s/it][A
Training:   6%|▌         | 4/65 [00:15<02:09,  2.12s/it][A
Training:   8%|▊         | 5/65 [00:27<05:47,  5.79s/it][A
Training:   9%|▉         | 6/65 [00:27<03:50,  3.91s/it][A
Training:  11%|█         | 7/65 [00:28<02:42,  2.80s/it][A
Training:  12%|█▏        | 8/65 [00:28<01:51,  1.96s/it][A
Training:  14%|█▍        | 9/65 [00:40<04:39,  5.00s/it][A
Training:  15%|█▌        | 10/65 [00:40<03:15,  3.55s/it][A
Training:  17%|█▋        | 11/65 [00:40<02:14,  2.50s/it][A
Training:  18%|█▊        | 12/65 [00:40<01:36,  1.82s/it][A
Training:  20%|██        | 13/65 [00:52<04:08,  4.77s/it][A
Training:  22%|██▏       | 14/65 [00:52<02:51,  3.37s/it][A
Training:  23%|██▎       | 15/65 [00:52<01:59,  2.40s/it][A
Training:  26%|██▌       | 17/65 [01:04<0

Epoch: 13/33 - Loss: 4.3509 - Accuracy: 0.9445



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:08<01:09,  8.64s/it][A
 22%|██▏       | 2/9 [00:08<00:25,  3.66s/it][A
 33%|███▎      | 3/9 [00:09<00:12,  2.16s/it][A
 44%|████▍     | 4/9 [00:09<00:07,  1.42s/it][A
 56%|█████▌    | 5/9 [00:16<00:14,  3.59s/it][A
 67%|██████▋   | 6/9 [00:17<00:07,  2.42s/it][A
 78%|███████▊  | 7/9 [00:17<00:03,  1.69s/it][A
 89%|████████▉ | 8/9 [00:17<00:01,  1.20s/it][A
100%|██████████| 9/9 [00:17<00:00,  1.98s/it][A
Epochs:  39%|███▉      | 13/33 [30:16<1:04:05, 192.29s/it]

Val Loss: 3.6220 - Val Accuracy: 0.9541



Training:   0%|          | 0/65 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/65 [00:10<10:47, 10.12s/it][A
Training:   3%|▎         | 2/65 [00:10<04:33,  4.34s/it][A
Training:   5%|▍         | 3/65 [00:10<02:31,  2.45s/it][A
Training:   6%|▌         | 4/65 [00:10<01:34,  1.55s/it][A
Training:   8%|▊         | 5/65 [00:19<03:58,  3.98s/it][A
Training:   9%|▉         | 6/65 [00:19<02:38,  2.69s/it][A
Training:  11%|█         | 7/65 [00:19<01:49,  1.88s/it][A
Training:  12%|█▏        | 8/65 [00:19<01:15,  1.32s/it][A
Training:  14%|█▍        | 9/65 [00:28<03:17,  3.53s/it][A
Training:  15%|█▌        | 10/65 [00:28<02:22,  2.59s/it][A
Training:  17%|█▋        | 11/65 [00:28<01:41,  1.88s/it][A
Training:  18%|█▊        | 12/65 [00:29<01:13,  1.39s/it][A
Training:  20%|██        | 13/65 [00:36<02:55,  3.37s/it][A
Training:  22%|██▏       | 14/65 [00:37<02:02,  2.39s/it][A
Training:  23%|██▎       | 15/65 [00:37<01:25,  1.71s/it][A
Training:  26%|██▌       | 17/65 [00:45<0

Epoch: 14/33 - Loss: 4.1330 - Accuracy: 0.9461



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:09<01:13,  9.25s/it][A
 33%|███▎      | 3/9 [00:09<00:14,  2.44s/it][A
 56%|█████▌    | 5/9 [00:17<00:13,  3.35s/it][A
 67%|██████▋   | 6/9 [00:17<00:07,  2.48s/it][A
 78%|███████▊  | 7/9 [00:18<00:03,  1.84s/it][A
100%|██████████| 9/9 [00:18<00:00,  2.05s/it][A
Epochs:  42%|████▏     | 14/33 [32:58<57:57, 183.05s/it]  

Val Loss: 3.4708 - Val Accuracy: 0.9541



Training:   0%|          | 0/65 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/65 [00:10<11:22, 10.67s/it][A
Training:   3%|▎         | 2/65 [00:10<04:45,  4.53s/it][A
Training:   5%|▍         | 3/65 [00:11<02:39,  2.57s/it][A
Training:   6%|▌         | 4/65 [00:11<01:37,  1.60s/it][A
Training:   8%|▊         | 5/65 [00:20<04:10,  4.18s/it][A
Training:   9%|▉         | 6/65 [00:20<02:48,  2.86s/it][A
Training:  11%|█         | 7/65 [00:20<01:54,  1.98s/it][A
Training:  12%|█▏        | 8/65 [00:20<01:21,  1.44s/it][A
Training:  14%|█▍        | 9/65 [00:28<03:08,  3.36s/it][A
Training:  15%|█▌        | 10/65 [00:28<02:10,  2.37s/it][A
Training:  17%|█▋        | 11/65 [00:29<01:41,  1.89s/it][A
Training:  18%|█▊        | 12/65 [00:29<01:14,  1.40s/it][A
Training:  20%|██        | 13/65 [00:36<02:43,  3.15s/it][A
Training:  22%|██▏       | 14/65 [00:38<02:14,  2.63s/it][A
Training:  23%|██▎       | 15/65 [00:38<01:34,  1.89s/it][A
Training:  25%|██▍       | 16/65 [00:38<0

Epoch: 15/33 - Loss: 3.9165 - Accuracy: 0.9497



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:08<01:05,  8.21s/it][A
 22%|██▏       | 2/9 [00:08<00:25,  3.58s/it][A
 33%|███▎      | 3/9 [00:08<00:12,  2.08s/it][A
 44%|████▍     | 4/9 [00:09<00:06,  1.33s/it][A
 56%|█████▌    | 5/9 [00:16<00:13,  3.46s/it][A
 67%|██████▋   | 6/9 [00:16<00:07,  2.36s/it][A
 78%|███████▊  | 7/9 [00:17<00:03,  1.87s/it][A
100%|██████████| 9/9 [00:17<00:00,  1.96s/it][A
Epochs:  45%|████▌     | 15/33 [35:39<52:57, 176.53s/it]

Val Loss: 3.3357 - Val Accuracy: 0.9557



Training:   0%|          | 0/65 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/65 [00:11<11:56, 11.20s/it][A
Training:   3%|▎         | 2/65 [00:11<04:59,  4.76s/it][A
Training:   5%|▍         | 3/65 [00:11<02:47,  2.70s/it][A
Training:   6%|▌         | 4/65 [00:11<01:44,  1.72s/it][A
Training:   8%|▊         | 5/65 [00:20<04:09,  4.15s/it][A
Training:  11%|█         | 7/65 [00:20<02:03,  2.13s/it][A
Training:  14%|█▍        | 9/65 [00:29<02:51,  3.07s/it][A
Training:  15%|█▌        | 10/65 [00:29<02:12,  2.41s/it][A
Training:  18%|█▊        | 12/65 [00:29<01:18,  1.47s/it][A
Training:  20%|██        | 13/65 [00:38<02:34,  2.98s/it][A
Training:  22%|██▏       | 14/65 [00:38<01:56,  2.29s/it][A
Training:  23%|██▎       | 15/65 [00:38<01:26,  1.74s/it][A
Training:  25%|██▍       | 16/65 [00:38<01:04,  1.32s/it][A
Training:  26%|██▌       | 17/65 [00:46<02:38,  3.30s/it][A
Training:  28%|██▊       | 18/65 [00:47<01:55,  2.46s/it][A
Training:  29%|██▉       | 19/65 [00:47

Epoch: 16/33 - Loss: 3.7690 - Accuracy: 0.9508



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:08<01:11,  8.97s/it][A
 22%|██▏       | 2/9 [00:09<00:26,  3.80s/it][A
 33%|███▎      | 3/9 [00:09<00:12,  2.15s/it][A
 44%|████▍     | 4/9 [00:09<00:07,  1.49s/it][A
 56%|█████▌    | 5/9 [00:17<00:14,  3.54s/it][A
 67%|██████▋   | 6/9 [00:17<00:07,  2.42s/it][A
100%|██████████| 9/9 [00:17<00:00,  1.97s/it][A
Epochs:  48%|████▊     | 16/33 [38:21<48:47, 172.23s/it]

Val Loss: 3.2191 - Val Accuracy: 0.9567



Training:   0%|          | 0/65 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/65 [00:10<10:47, 10.11s/it][A
Training:   3%|▎         | 2/65 [00:10<04:35,  4.37s/it][A
Training:   5%|▍         | 3/65 [00:10<02:31,  2.45s/it][A
Training:   6%|▌         | 4/65 [00:10<01:36,  1.58s/it][A
Training:   8%|▊         | 5/65 [00:18<03:55,  3.93s/it][A
Training:   9%|▉         | 6/65 [00:19<02:39,  2.71s/it][A
Training:  11%|█         | 7/65 [00:19<01:50,  1.90s/it][A
Training:  12%|█▏        | 8/65 [00:19<01:19,  1.39s/it][A
Training:  14%|█▍        | 9/65 [00:27<03:11,  3.41s/it][A
Training:  17%|█▋        | 11/65 [00:27<01:39,  1.84s/it][A
Training:  18%|█▊        | 12/65 [00:28<01:18,  1.48s/it][A
Training:  20%|██        | 13/65 [00:36<02:54,  3.35s/it][A
Training:  22%|██▏       | 14/65 [00:37<02:07,  2.49s/it][A
Training:  23%|██▎       | 15/65 [00:37<01:30,  1.82s/it][A
Training:  25%|██▍       | 16/65 [00:37<01:06,  1.35s/it][A
Training:  26%|██▌       | 17/65 [00:45<0

Epoch: 17/33 - Loss: 3.6534 - Accuracy: 0.9511



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:05<00:43,  5.46s/it][A
 33%|███▎      | 3/9 [00:05<00:09,  1.50s/it][A
 44%|████▍     | 4/9 [00:05<00:05,  1.04s/it][A
 56%|█████▌    | 5/9 [00:10<00:09,  2.29s/it][A
 78%|███████▊  | 7/9 [00:10<00:02,  1.21s/it][A
100%|██████████| 9/9 [00:11<00:00,  1.24s/it][A
Epochs:  52%|█████▏    | 17/33 [40:48<43:50, 164.41s/it]

Val Loss: 3.0853 - Val Accuracy: 0.9592



Training:   0%|          | 0/65 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/65 [00:06<06:33,  6.15s/it][A
Training:   3%|▎         | 2/65 [00:06<02:49,  2.68s/it][A
Training:   5%|▍         | 3/65 [00:06<01:35,  1.54s/it][A
Training:   6%|▌         | 4/65 [00:06<00:59,  1.02it/s][A
Training:   8%|▊         | 5/65 [00:11<02:23,  2.40s/it][A
Training:   9%|▉         | 6/65 [00:12<01:49,  1.85s/it][A
Training:  11%|█         | 7/65 [00:12<01:14,  1.28s/it][A
Training:  12%|█▏        | 8/65 [00:12<00:51,  1.10it/s][A
Training:  14%|█▍        | 9/65 [00:17<01:54,  2.04s/it][A
Training:  15%|█▌        | 10/65 [00:18<01:34,  1.71s/it][A
Training:  17%|█▋        | 11/65 [00:18<01:06,  1.24s/it][A
Training:  18%|█▊        | 12/65 [00:18<00:47,  1.11it/s][A
Training:  20%|██        | 13/65 [00:22<01:36,  1.86s/it][A
Training:  22%|██▏       | 14/65 [00:23<01:20,  1.57s/it][A
Training:  25%|██▍       | 16/65 [00:23<00:43,  1.12it/s][A
Training:  26%|██▌       | 17/65 [00:28<0

Epoch: 18/33 - Loss: 3.5651 - Accuracy: 0.9518



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:05<00:44,  5.57s/it][A
 33%|███▎      | 3/9 [00:05<00:08,  1.49s/it][A
 56%|█████▌    | 5/9 [00:10<00:08,  2.04s/it][A
100%|██████████| 9/9 [00:11<00:00,  1.24s/it][A
Epochs:  55%|█████▍    | 18/33 [42:28<36:17, 145.19s/it]

Val Loss: 3.0633 - Val Accuracy: 0.9577



Training:   0%|          | 0/65 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/65 [00:06<06:39,  6.24s/it][A
Training:   3%|▎         | 2/65 [00:06<02:47,  2.66s/it][A
Training:   5%|▍         | 3/65 [00:06<01:33,  1.50s/it][A
Training:   6%|▌         | 4/65 [00:06<01:02,  1.03s/it][A
Training:   8%|▊         | 5/65 [00:12<02:33,  2.55s/it][A
Training:   9%|▉         | 6/65 [00:12<01:41,  1.73s/it][A
Training:  11%|█         | 7/65 [00:12<01:09,  1.20s/it][A
Training:  12%|█▏        | 8/65 [00:12<00:49,  1.15it/s][A
Training:  14%|█▍        | 9/65 [00:17<02:00,  2.16s/it][A
Training:  17%|█▋        | 11/65 [00:17<01:05,  1.21s/it][A
Training:  20%|██        | 13/65 [00:22<01:31,  1.75s/it][A
Training:  22%|██▏       | 14/65 [00:23<01:10,  1.39s/it][A
Training:  23%|██▎       | 15/65 [00:23<00:54,  1.09s/it][A
Training:  25%|██▍       | 16/65 [00:23<00:41,  1.17it/s][A
Training:  26%|██▌       | 17/65 [00:28<01:35,  1.98s/it][A
Training:  28%|██▊       | 18/65 [00:28<0

Epoch: 19/33 - Loss: 3.4235 - Accuracy: 0.9528



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:05<00:42,  5.27s/it][A
 22%|██▏       | 2/9 [00:05<00:16,  2.39s/it][A
 33%|███▎      | 3/9 [00:05<00:08,  1.36s/it][A
 44%|████▍     | 4/9 [00:05<00:04,  1.14it/s][A
 56%|█████▌    | 5/9 [00:10<00:08,  2.13s/it][A
 67%|██████▋   | 6/9 [00:10<00:04,  1.55s/it][A
100%|██████████| 9/9 [00:10<00:00,  1.22s/it][A
Epochs:  58%|█████▊    | 19/33 [44:07<30:38, 131.34s/it]

Val Loss: 3.0445 - Val Accuracy: 0.9587



Training:   0%|          | 0/65 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/65 [00:06<06:38,  6.22s/it][A
Training:   3%|▎         | 2/65 [00:06<02:51,  2.73s/it][A
Training:   6%|▌         | 4/65 [00:06<01:06,  1.09s/it][A
Training:   8%|▊         | 5/65 [00:12<02:26,  2.45s/it][A
Training:   9%|▉         | 6/65 [00:12<01:41,  1.73s/it][A
Training:  12%|█▏        | 8/65 [00:12<00:54,  1.04it/s][A
Training:  14%|█▍        | 9/65 [00:17<01:51,  2.00s/it][A
Training:  15%|█▌        | 10/65 [00:17<01:23,  1.52s/it][A
Training:  17%|█▋        | 11/65 [00:17<01:01,  1.13s/it][A
Training:  20%|██        | 13/65 [00:22<01:30,  1.75s/it][A
Training:  22%|██▏       | 14/65 [00:23<01:09,  1.36s/it][A
Training:  23%|██▎       | 15/65 [00:23<00:52,  1.04s/it][A
Training:  25%|██▍       | 16/65 [00:23<00:38,  1.27it/s][A
Training:  26%|██▌       | 17/65 [00:28<01:35,  1.98s/it][A
Training:  28%|██▊       | 18/65 [00:28<01:08,  1.45s/it][A
Training:  29%|██▉       | 19/65 [00:28

Epoch: 20/33 - Loss: 3.3839 - Accuracy: 0.9526



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:05<00:43,  5.38s/it][A
 22%|██▏       | 2/9 [00:05<00:16,  2.31s/it][A
 44%|████▍     | 4/9 [00:05<00:04,  1.11it/s][A
 56%|█████▌    | 5/9 [00:10<00:08,  2.15s/it][A
100%|██████████| 9/9 [00:10<00:00,  1.21s/it][A
Epochs:  61%|██████    | 20/33 [45:46<26:19, 121.46s/it]

Val Loss: 2.8926 - Val Accuracy: 0.9577



Training:   0%|          | 0/65 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/65 [00:06<06:44,  6.31s/it][A
Training:   3%|▎         | 2/65 [00:06<02:55,  2.78s/it][A
Training:   5%|▍         | 3/65 [00:06<01:37,  1.57s/it][A
Training:   6%|▌         | 4/65 [00:06<01:00,  1.01it/s][A
Training:   8%|▊         | 5/65 [00:12<02:31,  2.52s/it][A
Training:   9%|▉         | 6/65 [00:12<01:48,  1.84s/it][A
Training:  11%|█         | 7/65 [00:12<01:14,  1.29s/it][A
Training:  12%|█▏        | 8/65 [00:12<00:53,  1.07it/s][A
Training:  14%|█▍        | 9/65 [00:17<01:58,  2.11s/it][A
Training:  15%|█▌        | 10/65 [00:17<01:25,  1.56s/it][A
Training:  18%|█▊        | 12/65 [00:18<00:46,  1.15it/s][A
Training:  20%|██        | 13/65 [00:22<01:37,  1.87s/it][A
Training:  22%|██▏       | 14/65 [00:23<01:14,  1.46s/it][A
Training:  23%|██▎       | 15/65 [00:23<00:55,  1.10s/it][A
Training:  25%|██▍       | 16/65 [00:23<00:41,  1.18it/s][A
Training:  26%|██▌       | 17/65 [00:28<0

Epoch: 21/33 - Loss: 3.2469 - Accuracy: 0.9546



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:05<00:41,  5.18s/it][A
 22%|██▏       | 2/9 [00:05<00:15,  2.23s/it][A
 44%|████▍     | 4/9 [00:05<00:04,  1.13it/s][A
 56%|█████▌    | 5/9 [00:10<00:08,  2.07s/it][A
 67%|██████▋   | 6/9 [00:10<00:04,  1.49s/it][A
100%|██████████| 9/9 [00:10<00:00,  1.19s/it][A
Epochs:  64%|██████▎   | 21/33 [47:24<22:55, 114.65s/it]

Val Loss: 2.8568 - Val Accuracy: 0.9602



Training:   0%|          | 0/65 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/65 [00:06<06:42,  6.29s/it][A
Training:   3%|▎         | 2/65 [00:06<02:57,  2.82s/it][A
Training:   6%|▌         | 4/65 [00:06<01:07,  1.10s/it][A
Training:   8%|▊         | 5/65 [00:11<02:16,  2.28s/it][A
Training:  11%|█         | 7/65 [00:12<01:14,  1.29s/it][A
Training:  12%|█▏        | 8/65 [00:12<00:57,  1.02s/it][A
Training:  14%|█▍        | 9/65 [00:17<01:56,  2.07s/it][A
Training:  15%|█▌        | 10/65 [00:17<01:24,  1.54s/it][A
Training:  17%|█▋        | 11/65 [00:17<01:01,  1.15s/it][A
Training:  20%|██        | 13/65 [00:22<01:27,  1.69s/it][A
Training:  22%|██▏       | 14/65 [00:22<01:08,  1.33s/it][A
Training:  23%|██▎       | 15/65 [00:22<00:51,  1.03s/it][A
Training:  26%|██▌       | 17/65 [00:27<01:19,  1.65s/it][A
Training:  28%|██▊       | 18/65 [00:27<01:00,  1.29s/it][A
Training:  29%|██▉       | 19/65 [00:28<00:47,  1.03s/it][A
Training:  31%|███       | 20/65 [00:28

Epoch: 22/33 - Loss: 3.2127 - Accuracy: 0.9552



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:05<00:43,  5.40s/it][A
 22%|██▏       | 2/9 [00:05<00:16,  2.29s/it][A
 33%|███▎      | 3/9 [00:05<00:07,  1.30s/it][A
 44%|████▍     | 4/9 [00:05<00:04,  1.21it/s][A
 56%|█████▌    | 5/9 [00:10<00:08,  2.24s/it][A
100%|██████████| 9/9 [00:10<00:00,  1.21s/it][A
Epochs:  67%|██████▋   | 22/33 [49:02<20:06, 109.65s/it]

Val Loss: 2.8085 - Val Accuracy: 0.9618



Training:   0%|          | 0/65 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/65 [00:06<06:53,  6.46s/it][A
Training:   3%|▎         | 2/65 [00:06<02:53,  2.76s/it][A
Training:   5%|▍         | 3/65 [00:06<01:38,  1.58s/it][A
Training:   6%|▌         | 4/65 [00:07<01:04,  1.05s/it][A
Training:   8%|▊         | 5/65 [00:12<02:32,  2.55s/it][A
Training:  11%|█         | 7/65 [00:12<01:14,  1.29s/it][A
Training:  14%|█▍        | 9/65 [00:17<01:42,  1.83s/it][A
Training:  17%|█▋        | 11/65 [00:17<01:03,  1.18s/it][A
Training:  18%|█▊        | 12/65 [00:17<00:51,  1.03it/s][A
Training:  20%|██        | 13/65 [00:22<01:37,  1.88s/it][A
Training:  23%|██▎       | 15/65 [00:22<00:58,  1.16s/it][A
Training:  26%|██▌       | 17/65 [00:28<01:19,  1.66s/it][A
Training:  28%|██▊       | 18/65 [00:28<01:03,  1.35s/it][A
Training:  29%|██▉       | 19/65 [00:28<00:48,  1.06s/it][A
Training:  31%|███       | 20/65 [00:28<00:37,  1.19it/s][A
Training:  32%|███▏      | 21/65 [00:33

Epoch: 23/33 - Loss: 3.1524 - Accuracy: 0.9557



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:04<00:39,  4.97s/it][A
 22%|██▏       | 2/9 [00:05<00:15,  2.15s/it][A
 33%|███▎      | 3/9 [00:05<00:07,  1.22s/it][A
 44%|████▍     | 4/9 [00:05<00:03,  1.26it/s][A
 56%|█████▌    | 5/9 [00:09<00:08,  2.14s/it][A
 67%|██████▋   | 6/9 [00:10<00:04,  1.45s/it][A
100%|██████████| 9/9 [00:10<00:00,  1.15s/it][A
Epochs:  70%|██████▉   | 23/33 [50:40<17:40, 106.03s/it]

Val Loss: 2.7735 - Val Accuracy: 0.9618



Training:   0%|          | 0/65 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/65 [00:06<06:35,  6.17s/it][A
Training:   5%|▍         | 3/65 [00:06<01:42,  1.65s/it][A
Training:   6%|▌         | 4/65 [00:06<01:09,  1.13s/it][A
Training:   8%|▊         | 5/65 [00:11<02:32,  2.54s/it][A
Training:   9%|▉         | 6/65 [00:11<01:43,  1.76s/it][A
Training:  11%|█         | 7/65 [00:12<01:12,  1.25s/it][A
Training:  12%|█▏        | 8/65 [00:12<00:51,  1.11it/s][A
Training:  14%|█▍        | 9/65 [00:17<02:01,  2.16s/it][A
Training:  15%|█▌        | 10/65 [00:17<01:25,  1.55s/it][A
Training:  17%|█▋        | 11/65 [00:17<00:59,  1.11s/it][A
Training:  20%|██        | 13/65 [00:22<01:33,  1.80s/it][A
Training:  22%|██▏       | 14/65 [00:22<01:10,  1.39s/it][A
Training:  23%|██▎       | 15/65 [00:22<00:53,  1.07s/it][A
Training:  25%|██▍       | 16/65 [00:23<00:40,  1.21it/s][A
Training:  26%|██▌       | 17/65 [00:28<01:34,  1.97s/it][A
Training:  28%|██▊       | 18/65 [00:28<

Epoch: 24/33 - Loss: 3.0521 - Accuracy: 0.9572



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:05<00:42,  5.30s/it][A
 22%|██▏       | 2/9 [00:05<00:16,  2.34s/it][A
 44%|████▍     | 4/9 [00:05<00:04,  1.08it/s][A
 56%|█████▌    | 5/9 [00:10<00:08,  2.00s/it][A
 67%|██████▋   | 6/9 [00:10<00:04,  1.45s/it][A
 78%|███████▊  | 7/9 [00:10<00:02,  1.07s/it][A
100%|██████████| 9/9 [00:10<00:00,  1.21s/it][A
Epochs:  73%|███████▎  | 24/33 [52:18<15:33, 103.70s/it]

Val Loss: 2.7438 - Val Accuracy: 0.9618



Training:   0%|          | 0/65 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/65 [00:06<06:38,  6.23s/it][A
Training:   5%|▍         | 3/65 [00:06<01:43,  1.68s/it][A
Training:   8%|▊         | 5/65 [00:11<02:12,  2.21s/it][A
Training:  11%|█         | 7/65 [00:12<01:18,  1.35s/it][A
Training:  12%|█▏        | 8/65 [00:12<01:01,  1.07s/it][A
Training:  14%|█▍        | 9/65 [00:17<01:55,  2.07s/it][A
Training:  17%|█▋        | 11/65 [00:17<01:07,  1.25s/it][A
Training:  20%|██        | 13/65 [00:22<01:30,  1.74s/it][A
Training:  23%|██▎       | 15/65 [00:22<00:58,  1.16s/it][A
Training:  26%|██▌       | 17/65 [00:28<01:19,  1.65s/it][A
Training:  29%|██▉       | 19/65 [00:28<00:53,  1.16s/it][A
Training:  32%|███▏      | 21/65 [00:33<01:07,  1.53s/it][A
Training:  35%|███▌      | 23/65 [00:33<00:46,  1.10s/it][A
Training:  38%|███▊      | 25/65 [00:37<00:58,  1.46s/it][A
Training:  42%|████▏     | 27/65 [00:38<00:40,  1.07s/it][A
Training:  43%|████▎     | 28/65 [00:3

Epoch: 25/33 - Loss: 3.0648 - Accuracy: 0.9570



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:05<00:44,  5.57s/it][A
 33%|███▎      | 3/9 [00:05<00:09,  1.53s/it][A
 56%|█████▌    | 5/9 [00:10<00:07,  1.99s/it][A
 67%|██████▋   | 6/9 [00:10<00:04,  1.48s/it][A
100%|██████████| 9/9 [00:11<00:00,  1.23s/it][A
Epochs:  76%|███████▌  | 25/33 [53:56<13:35, 101.92s/it]

Val Loss: 2.7008 - Val Accuracy: 0.9633



Training:   0%|          | 0/65 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/65 [00:07<07:34,  7.10s/it][A
Training:   3%|▎         | 2/65 [00:07<03:10,  3.03s/it][A
Training:   6%|▌         | 4/65 [00:07<01:11,  1.18s/it][A
Training:   8%|▊         | 5/65 [00:13<02:47,  2.80s/it][A
Training:   9%|▉         | 6/65 [00:14<02:02,  2.07s/it][A
Training:  12%|█▏        | 8/65 [00:14<01:05,  1.15s/it][A
Training:  14%|█▍        | 9/65 [00:21<02:25,  2.60s/it][A
Training:  15%|█▌        | 10/65 [00:21<01:49,  1.99s/it][A
Training:  17%|█▋        | 11/65 [00:21<01:19,  1.48s/it][A
Training:  18%|█▊        | 12/65 [00:22<01:01,  1.15s/it][A
Training:  20%|██        | 13/65 [00:30<02:48,  3.24s/it][A
Training:  22%|██▏       | 14/65 [00:30<02:02,  2.41s/it][A
Training:  23%|██▎       | 15/65 [00:31<01:26,  1.73s/it][A
Training:  25%|██▍       | 16/65 [00:32<01:17,  1.58s/it][A
Training:  26%|██▌       | 17/65 [00:40<02:51,  3.58s/it][A
Training:  28%|██▊       | 18/65 [00:40

Epoch: 26/33 - Loss: 2.9560 - Accuracy: 0.9571



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:12<01:43, 12.95s/it][A
 22%|██▏       | 2/9 [00:13<00:38,  5.55s/it][A
 33%|███▎      | 3/9 [00:13<00:18,  3.08s/it][A
 44%|████▍     | 4/9 [00:13<00:09,  1.92s/it][A
 56%|█████▌    | 5/9 [00:23<00:18,  4.62s/it][A
 67%|██████▋   | 6/9 [00:23<00:09,  3.13s/it][A
 78%|███████▊  | 7/9 [00:23<00:04,  2.22s/it][A
 89%|████████▉ | 8/9 [00:23<00:01,  1.59s/it][A
100%|██████████| 9/9 [00:24<00:00,  2.71s/it][A
Epochs:  79%|███████▉  | 26/33 [57:10<15:07, 129.58s/it]

Val Loss: 2.6826 - Val Accuracy: 0.9613



Training:   0%|          | 0/65 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/65 [00:13<14:40, 13.75s/it][A
Training:   3%|▎         | 2/65 [00:14<06:16,  5.97s/it][A
Training:   5%|▍         | 3/65 [00:14<03:28,  3.36s/it][A
Training:   6%|▌         | 4/65 [00:14<02:09,  2.12s/it][A
Training:   8%|▊         | 5/65 [00:26<05:25,  5.42s/it][A
Training:   9%|▉         | 6/65 [00:26<03:38,  3.70s/it][A
Training:  11%|█         | 7/65 [00:26<02:26,  2.53s/it][A
Training:  12%|█▏        | 8/65 [00:26<01:44,  1.83s/it][A
Training:  14%|█▍        | 9/65 [00:37<04:21,  4.67s/it][A
Training:  15%|█▌        | 10/65 [00:37<02:59,  3.26s/it][A
Training:  17%|█▋        | 11/65 [00:38<02:07,  2.37s/it][A
Training:  18%|█▊        | 12/65 [00:38<01:31,  1.72s/it][A
Training:  20%|██        | 13/65 [00:48<03:47,  4.37s/it][A
Training:  23%|██▎       | 15/65 [00:49<02:00,  2.41s/it][A
Training:  25%|██▍       | 16/65 [00:49<01:34,  1.93s/it][A
Training:  26%|██▌       | 17/65 [01:00<0

Epoch: 27/33 - Loss: 2.9205 - Accuracy: 0.9583



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:12<01:42, 12.87s/it][A
 22%|██▏       | 2/9 [00:13<00:37,  5.38s/it][A
 33%|███▎      | 3/9 [00:13<00:18,  3.07s/it][A
 44%|████▍     | 4/9 [00:13<00:09,  1.94s/it][A
 56%|█████▌    | 5/9 [00:23<00:19,  4.84s/it][A
 67%|██████▋   | 6/9 [00:24<00:10,  3.41s/it][A
 78%|███████▊  | 7/9 [00:24<00:04,  2.38s/it][A
100%|██████████| 9/9 [00:24<00:00,  2.77s/it][A
Epochs:  82%|████████▏ | 27/33 [1:00:49<15:37, 156.25s/it]

Val Loss: 2.6057 - Val Accuracy: 0.9633



Training:   0%|          | 0/65 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/65 [00:13<14:11, 13.31s/it][A
Training:   3%|▎         | 2/65 [00:13<05:57,  5.67s/it][A
Training:   5%|▍         | 3/65 [00:14<03:37,  3.51s/it][A
Training:   6%|▌         | 4/65 [00:14<02:14,  2.20s/it][A
Training:   8%|▊         | 5/65 [00:25<05:27,  5.45s/it][A
Training:   9%|▉         | 6/65 [00:26<03:35,  3.65s/it][A
Training:  11%|█         | 7/65 [00:26<02:35,  2.68s/it][A
Training:  12%|█▏        | 8/65 [00:26<01:46,  1.87s/it][A
Training:  14%|█▍        | 9/65 [00:37<04:09,  4.45s/it][A
Training:  15%|█▌        | 10/65 [00:37<02:51,  3.11s/it][A
Training:  17%|█▋        | 11/65 [00:39<02:30,  2.79s/it][A
Training:  18%|█▊        | 12/65 [00:39<01:48,  2.05s/it][A
Training:  20%|██        | 13/65 [00:47<03:21,  3.87s/it][A
Training:  22%|██▏       | 14/65 [00:47<02:20,  2.76s/it][A
Training:  23%|██▎       | 15/65 [00:50<02:15,  2.72s/it][A
Training:  25%|██▍       | 16/65 [00:50<0

Epoch: 28/33 - Loss: 2.8520 - Accuracy: 0.9592



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:12<01:36, 12.06s/it][A
 22%|██▏       | 2/9 [00:12<00:36,  5.15s/it][A
 33%|███▎      | 3/9 [00:12<00:17,  2.85s/it][A
 44%|████▍     | 4/9 [00:12<00:08,  1.77s/it][A
 56%|█████▌    | 5/9 [00:22<00:18,  4.64s/it][A
 67%|██████▋   | 6/9 [00:22<00:09,  3.14s/it][A
 78%|███████▊  | 7/9 [00:22<00:04,  2.22s/it][A
100%|██████████| 9/9 [00:23<00:00,  2.59s/it][A
Epochs:  85%|████████▍ | 28/33 [1:04:21<14:25, 173.11s/it]

Val Loss: 2.7362 - Val Accuracy: 0.9643



Training:   0%|          | 0/65 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/65 [00:13<14:30, 13.59s/it][A
Training:   3%|▎         | 2/65 [00:14<06:09,  5.87s/it][A
Training:   5%|▍         | 3/65 [00:14<03:28,  3.36s/it][A
Training:   6%|▌         | 4/65 [00:14<02:07,  2.09s/it][A
Training:   8%|▊         | 5/65 [00:25<05:20,  5.33s/it][A
Training:   9%|▉         | 6/65 [00:25<03:30,  3.56s/it][A
Training:  12%|█▏        | 8/65 [00:25<01:45,  1.84s/it][A
Training:  14%|█▍        | 9/65 [00:37<03:58,  4.27s/it][A
Training:  15%|█▌        | 10/65 [00:37<02:53,  3.16s/it][A
Training:  17%|█▋        | 11/65 [00:37<02:05,  2.32s/it][A
Training:  18%|█▊        | 12/65 [00:37<01:29,  1.69s/it][A
Training:  20%|██        | 13/65 [00:48<03:45,  4.33s/it][A
Training:  22%|██▏       | 14/65 [00:49<02:48,  3.30s/it][A
Training:  25%|██▍       | 16/65 [00:49<01:29,  1.83s/it][A
Training:  26%|██▌       | 17/65 [01:00<03:15,  4.08s/it][A
Training:  28%|██▊       | 18/65 [01:00<

Epoch: 29/33 - Loss: 2.8018 - Accuracy: 0.9596



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:12<01:38, 12.33s/it][A
 22%|██▏       | 2/9 [00:12<00:36,  5.15s/it][A
 44%|████▍     | 4/9 [00:13<00:10,  2.14s/it][A
 56%|█████▌    | 5/9 [00:23<00:18,  4.66s/it][A
 78%|███████▊  | 7/9 [00:23<00:05,  2.50s/it][A
100%|██████████| 9/9 [00:24<00:00,  2.69s/it][A
Epochs:  88%|████████▊ | 29/33 [1:08:00<12:27, 186.98s/it]

Val Loss: 2.6324 - Val Accuracy: 0.9633



Training:   0%|          | 0/65 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/65 [00:14<15:17, 14.34s/it][A
Training:   3%|▎         | 2/65 [00:14<06:19,  6.03s/it][A
Training:   5%|▍         | 3/65 [00:14<03:29,  3.39s/it][A
Training:   6%|▌         | 4/65 [00:15<02:12,  2.18s/it][A
Training:   8%|▊         | 5/65 [00:26<05:31,  5.52s/it][A
Training:   9%|▉         | 6/65 [00:27<03:49,  3.90s/it][A
Training:  11%|█         | 7/65 [00:27<02:36,  2.70s/it][A
Training:  14%|█▍        | 9/65 [00:37<03:38,  3.90s/it][A
Training:  15%|█▌        | 10/65 [00:38<02:46,  3.03s/it][A
Training:  17%|█▋        | 11/65 [00:38<02:01,  2.25s/it][A
Training:  18%|█▊        | 12/65 [00:38<01:31,  1.73s/it][A
Training:  20%|██        | 13/65 [00:49<03:46,  4.35s/it][A
Training:  22%|██▏       | 14/65 [00:50<02:46,  3.27s/it][A
Training:  23%|██▎       | 15/65 [00:50<02:01,  2.43s/it][A
Training:  25%|██▍       | 16/65 [00:51<01:28,  1.81s/it][A
Training:  26%|██▌       | 17/65 [01:01<

Epoch: 30/33 - Loss: 2.7820 - Accuracy: 0.9606



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:08<01:11,  8.89s/it][A
 22%|██▏       | 2/9 [00:09<00:26,  3.76s/it][A
 33%|███▎      | 3/9 [00:09<00:12,  2.15s/it][A
 44%|████▍     | 4/9 [00:09<00:06,  1.37s/it][A
 56%|█████▌    | 5/9 [00:16<00:14,  3.56s/it][A
 67%|██████▋   | 6/9 [00:17<00:07,  2.42s/it][A
 78%|███████▊  | 7/9 [00:17<00:03,  1.68s/it][A
100%|██████████| 9/9 [00:17<00:00,  1.98s/it][A
Epochs:  91%|█████████ | 30/33 [1:11:26<09:37, 192.48s/it]

Val Loss: 2.5691 - Val Accuracy: 0.9643



Training:   0%|          | 0/65 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/65 [00:09<10:26,  9.80s/it][A
Training:   3%|▎         | 2/65 [00:10<04:47,  4.56s/it][A
Training:   5%|▍         | 3/65 [00:10<02:37,  2.54s/it][A
Training:   6%|▌         | 4/65 [00:11<01:47,  1.77s/it][A
Training:   8%|▊         | 5/65 [00:19<03:57,  3.95s/it][A
Training:   9%|▉         | 6/65 [00:19<02:46,  2.83s/it][A
Training:  11%|█         | 7/65 [00:20<01:53,  1.96s/it][A
Training:  12%|█▏        | 8/65 [00:20<01:24,  1.49s/it][A
Training:  14%|█▍        | 9/65 [00:27<03:06,  3.33s/it][A
Training:  15%|█▌        | 10/65 [00:28<02:11,  2.39s/it][A
Training:  17%|█▋        | 11/65 [00:28<01:32,  1.71s/it][A
Training:  18%|█▊        | 12/65 [00:29<01:17,  1.46s/it][A
Training:  20%|██        | 13/65 [00:36<02:48,  3.24s/it][A
Training:  22%|██▏       | 14/65 [00:37<02:09,  2.54s/it][A
Training:  23%|██▎       | 15/65 [00:37<01:33,  1.87s/it][A
Training:  25%|██▍       | 16/65 [00:38<0

Epoch: 31/33 - Loss: 2.7716 - Accuracy: 0.9613



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:09<01:18,  9.76s/it][A
 22%|██▏       | 2/9 [00:10<00:29,  4.16s/it][A
 33%|███▎      | 3/9 [00:10<00:14,  2.40s/it][A
 44%|████▍     | 4/9 [00:10<00:07,  1.54s/it][A
 56%|█████▌    | 5/9 [00:17<00:14,  3.55s/it][A
100%|██████████| 9/9 [00:18<00:00,  2.01s/it][A
Epochs:  94%|█████████▍| 31/33 [1:14:06<06:05, 182.78s/it]

Val Loss: 2.5281 - Val Accuracy: 0.9648



Training:   0%|          | 0/65 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/65 [00:10<10:42, 10.03s/it][A
Training:   3%|▎         | 2/65 [00:10<04:50,  4.61s/it][A
Training:   5%|▍         | 3/65 [00:11<02:40,  2.59s/it][A
Training:   6%|▌         | 4/65 [00:11<01:39,  1.64s/it][A
Training:   8%|▊         | 5/65 [00:19<03:52,  3.87s/it][A
Training:   9%|▉         | 6/65 [00:19<02:41,  2.73s/it][A
Training:  11%|█         | 7/65 [00:19<01:48,  1.87s/it][A
Training:  12%|█▏        | 8/65 [00:19<01:17,  1.35s/it][A
Training:  14%|█▍        | 9/65 [00:28<03:19,  3.56s/it][A
Training:  15%|█▌        | 10/65 [00:28<02:19,  2.54s/it][A
Training:  17%|█▋        | 11/65 [00:28<01:38,  1.82s/it][A
Training:  18%|█▊        | 12/65 [00:28<01:09,  1.31s/it][A
Training:  20%|██        | 13/65 [00:36<02:52,  3.32s/it][A
Training:  22%|██▏       | 14/65 [00:36<01:59,  2.35s/it][A
Training:  23%|██▎       | 15/65 [00:37<01:23,  1.68s/it][A
Training:  26%|██▌       | 17/65 [00:45<0

Epoch: 32/33 - Loss: 2.7670 - Accuracy: 0.9603



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:09<01:14,  9.26s/it][A
 22%|██▏       | 2/9 [00:09<00:27,  3.92s/it][A
 33%|███▎      | 3/9 [00:09<00:13,  2.21s/it][A
 44%|████▍     | 4/9 [00:09<00:07,  1.40s/it][A
 56%|█████▌    | 5/9 [00:17<00:14,  3.64s/it][A
 67%|██████▋   | 6/9 [00:17<00:07,  2.46s/it][A
 78%|███████▊  | 7/9 [00:17<00:03,  1.71s/it][A
100%|██████████| 9/9 [00:18<00:00,  2.03s/it][A
Epochs:  97%|█████████▋| 32/33 [1:16:47<02:56, 176.28s/it]

Val Loss: 2.4938 - Val Accuracy: 0.9653



Training:   0%|          | 0/65 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/65 [00:09<10:32,  9.88s/it][A
Training:   3%|▎         | 2/65 [00:10<04:40,  4.46s/it][A
Training:   5%|▍         | 3/65 [00:10<02:34,  2.48s/it][A
Training:   6%|▌         | 4/65 [00:11<01:44,  1.71s/it][A
Training:   8%|▊         | 5/65 [00:18<03:40,  3.67s/it][A
Training:   9%|▉         | 6/65 [00:18<02:30,  2.55s/it][A
Training:  11%|█         | 7/65 [00:18<01:43,  1.79s/it][A
Training:  12%|█▏        | 8/65 [00:19<01:16,  1.34s/it][A
Training:  14%|█▍        | 9/65 [00:27<03:19,  3.57s/it][A
Training:  15%|█▌        | 10/65 [00:27<02:18,  2.53s/it][A
Training:  17%|█▋        | 11/65 [00:28<01:39,  1.84s/it][A
Training:  18%|█▊        | 12/65 [00:28<01:10,  1.32s/it][A
Training:  20%|██        | 13/65 [00:36<02:54,  3.36s/it][A
Training:  23%|██▎       | 15/65 [00:36<01:33,  1.88s/it][A
Training:  26%|██▌       | 17/65 [00:45<02:15,  2.83s/it][A
Training:  28%|██▊       | 18/65 [00:45<0

Epoch: 33/33 - Loss: 2.7715 - Accuracy: 0.9607



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:08<01:11,  8.88s/it][A
 22%|██▏       | 2/9 [00:09<00:26,  3.79s/it][A
 33%|███▎      | 3/9 [00:09<00:12,  2.16s/it][A
 56%|█████▌    | 5/9 [00:16<00:12,  3.02s/it][A
 67%|██████▋   | 6/9 [00:17<00:06,  2.25s/it][A
 78%|███████▊  | 7/9 [00:17<00:03,  1.64s/it][A
100%|██████████| 9/9 [00:17<00:00,  1.95s/it][A
Epochs: 100%|██████████| 33/33 [1:19:28<00:00, 144.51s/it]


Val Loss: 2.5540 - Val Accuracy: 0.9648
Saving best model...


[32m[I 2023-12-08 10:56:33,132][0m Trial 0 finished with value: 0.9648317694664001 and parameters: {'loss_learning_rate': 0.0035987381095719333, 'learning_rate': 1.1042719857613235e-05, 'weight_decay': 0.0009341013224507427, 'epsilon': 1.0684926352395233e-09, 'beta': 0.1, 'gamma': 0.7000000000000001, 'batch_size': 218, 'epochs': 33}. Best is trial 0 with value: 0.9648317694664001.[0m


Learning rate for Loss: 0.0037047485989424762
Learning rate: 0.02088792830186936
Weight decay: 0.003283560684544378
Epsilon: 7.115743039074607e-09
Beta: 0.5
Gamma: 0.2
Batch size: 103
Number of epochs: 23


Epochs:   0%|          | 0/23 [00:00<?, ?it/s]
Training:   0%|          | 0/136 [00:00<?, ?it/s][A
Training:   1%|          | 1/136 [00:05<12:36,  5.60s/it][A
Training:   1%|▏         | 2/136 [00:05<05:31,  2.47s/it][A
Training:   3%|▎         | 4/136 [00:06<02:07,  1.04it/s][A
Training:   4%|▎         | 5/136 [00:09<03:54,  1.79s/it][A
Training:   4%|▍         | 6/136 [00:09<02:51,  1.32s/it][A
Training:   6%|▌         | 8/136 [00:10<01:33,  1.36it/s][A
Training:   7%|▋         | 9/136 [00:14<03:17,  1.55s/it][A
Training:   7%|▋         | 10/136 [00:14<02:28,  1.18s/it][A
Training:   9%|▉         | 12/136 [00:14<01:29,  1.39it/s][A
Training:  10%|▉         | 13/136 [00:18<03:03,  1.49s/it][A
Training:  10%|█         | 14/136 [00:18<02:26,  1.20s/it][A
Training:  11%|█         | 15/136 [00:18<01:52,  1.08it/s][A
Training:  12%|█▏        | 16/136 [00:19<01:27,  1.37it/s][A
Training:  12%|█▎        | 17/136 [00:22<03:01,  1.52s/it][A
Training:  13%|█▎        | 18/136 [00:2

Epoch: 1/23 - Loss: 1038.9761 - Accuracy: 0.9023



  0%|          | 0/17 [00:00<?, ?it/s][A
  6%|▌         | 1/17 [00:02<00:43,  2.74s/it][A
 18%|█▊        | 3/17 [00:02<00:10,  1.32it/s][A
 29%|██▉       | 5/17 [00:05<00:11,  1.07it/s][A
 41%|████      | 7/17 [00:05<00:05,  1.75it/s][A
 53%|█████▎    | 9/17 [00:07<00:05,  1.37it/s][A
 65%|██████▍   | 11/17 [00:07<00:03,  1.94it/s][A
 76%|███████▋  | 13/17 [00:09<00:02,  1.46it/s][A
 88%|████████▊ | 15/17 [00:09<00:00,  2.05it/s][A
100%|██████████| 17/17 [00:11<00:00,  1.47it/s][A
Epochs:   4%|▍         | 1/23 [02:21<51:55, 141.59s/it]

Val Loss: 1403.6344 - Val Accuracy: 0.9484



Training:   0%|          | 0/136 [00:00<?, ?it/s][A
Training:   1%|          | 1/136 [00:02<06:39,  2.96s/it][A
Training:   2%|▏         | 3/136 [00:03<01:47,  1.24it/s][A
Training:   4%|▎         | 5/136 [00:05<02:12,  1.02s/it][A
Training:   4%|▍         | 6/136 [00:05<01:41,  1.28it/s][A
Training:   5%|▌         | 7/136 [00:05<01:16,  1.68it/s][A
Training:   6%|▌         | 8/136 [00:05<00:59,  2.16it/s][A
Training:   7%|▋         | 9/136 [00:08<02:01,  1.05it/s][A
Training:   8%|▊         | 11/136 [00:08<01:10,  1.77it/s][A
Training:   9%|▉         | 12/136 [00:08<00:56,  2.18it/s][A
Training:  10%|▉         | 13/136 [00:10<02:01,  1.01it/s][A
Training:  12%|█▏        | 16/136 [00:11<00:59,  2.02it/s][A
Training:  12%|█▎        | 17/136 [00:13<01:48,  1.10it/s][A
Training:  14%|█▍        | 19/136 [00:13<01:10,  1.65it/s][A
Training:  15%|█▍        | 20/136 [00:13<00:58,  1.98it/s][A
Training:  15%|█▌        | 21/136 [00:15<01:35,  1.21it/s][A
Training:  18%|█▊      

Epoch: 2/23 - Loss: 1741.8860 - Accuracy: 0.9328



  0%|          | 0/17 [00:00<?, ?it/s][A
  6%|▌         | 1/17 [00:02<00:45,  2.85s/it][A
 12%|█▏        | 2/17 [00:02<00:18,  1.23s/it][A
 24%|██▎       | 4/17 [00:03<00:06,  1.99it/s][A
 35%|███▌      | 6/17 [00:05<00:08,  1.31it/s][A
 41%|████      | 7/17 [00:05<00:06,  1.58it/s][A
 53%|█████▎    | 9/17 [00:07<00:06,  1.32it/s][A
 65%|██████▍   | 11/17 [00:07<00:03,  1.92it/s][A
 76%|███████▋  | 13/17 [00:09<00:02,  1.39it/s][A
 88%|████████▊ | 15/17 [00:09<00:00,  2.00it/s][A
100%|██████████| 17/17 [00:11<00:00,  1.42it/s][A
Epochs:   9%|▊         | 2/23 [03:59<40:30, 115.73s/it]

Val Loss: 1923.1025 - Val Accuracy: 0.9289



Training:   0%|          | 0/136 [00:00<?, ?it/s][A
Training:   1%|          | 1/136 [00:03<07:28,  3.32s/it][A
Training:   2%|▏         | 3/136 [00:03<01:59,  1.11it/s][A
Training:   4%|▎         | 5/136 [00:05<02:23,  1.10s/it][A
Training:   5%|▌         | 7/136 [00:06<01:25,  1.50it/s][A
Training:   7%|▋         | 9/136 [00:08<01:50,  1.15it/s][A
Training:   7%|▋         | 10/136 [00:08<01:29,  1.40it/s][A
Training:   9%|▉         | 12/136 [00:08<00:58,  2.12it/s][A
Training:  10%|▉         | 13/136 [00:11<01:44,  1.18it/s][A
Training:  10%|█         | 14/136 [00:11<01:22,  1.48it/s][A
Training:  12%|█▏        | 16/136 [00:11<00:52,  2.29it/s][A
Training:  12%|█▎        | 17/136 [00:13<01:41,  1.18it/s][A
Training:  13%|█▎        | 18/136 [00:13<01:20,  1.47it/s][A
Training:  15%|█▍        | 20/136 [00:14<00:51,  2.23it/s][A
Training:  15%|█▌        | 21/136 [00:15<01:29,  1.29it/s][A
Training:  16%|█▌        | 22/136 [00:16<01:12,  1.57it/s][A
Training:  18%|█▊    

Epoch: 3/23 - Loss: 1928.4117 - Accuracy: 0.9381



  0%|          | 0/17 [00:00<?, ?it/s][A
  6%|▌         | 1/17 [00:02<00:45,  2.86s/it][A
 18%|█▊        | 3/17 [00:02<00:10,  1.27it/s][A
 29%|██▉       | 5/17 [00:05<00:10,  1.10it/s][A
 47%|████▋     | 8/17 [00:05<00:04,  2.21it/s][A
 59%|█████▉    | 10/17 [00:07<00:04,  1.46it/s][A
 65%|██████▍   | 11/17 [00:07<00:03,  1.73it/s][A
 76%|███████▋  | 13/17 [00:09<00:02,  1.35it/s][A
100%|██████████| 17/17 [00:11<00:00,  1.45it/s][A
Epochs:  13%|█▎        | 3/23 [05:37<35:58, 107.91s/it]

Val Loss: 1671.4069 - Val Accuracy: 0.9472



Training:   0%|          | 0/136 [00:00<?, ?it/s][A
Training:   1%|          | 1/136 [00:03<07:23,  3.28s/it][A
Training:   2%|▏         | 3/136 [00:03<01:59,  1.12it/s][A
Training:   4%|▎         | 5/136 [00:05<02:12,  1.01s/it][A
Training:   6%|▌         | 8/136 [00:05<01:04,  1.98it/s][A
Training:   7%|▋         | 10/136 [00:08<01:35,  1.32it/s][A
Training:   8%|▊         | 11/136 [00:08<01:19,  1.58it/s][A
Training:  10%|▉         | 13/136 [00:10<01:44,  1.18it/s][A
Training:  11%|█         | 15/136 [00:11<01:11,  1.69it/s][A
Training:  12%|█▎        | 17/136 [00:13<01:33,  1.27it/s][A
Training:  15%|█▍        | 20/136 [00:13<00:55,  2.09it/s][A
Training:  16%|█▌        | 22/136 [00:15<01:14,  1.53it/s][A
Training:  18%|█▊        | 24/136 [00:15<00:54,  2.05it/s][A
Training:  19%|█▉        | 26/136 [00:18<01:17,  1.43it/s][A
Training:  21%|██▏       | 29/136 [00:21<01:23,  1.28it/s][A
Training:  23%|██▎       | 31/136 [00:21<01:01,  1.71it/s][A
Training:  24%|██▍  

Epoch: 4/23 - Loss: 2024.3622 - Accuracy: 0.9413



  0%|          | 0/17 [00:00<?, ?it/s][A
  6%|▌         | 1/17 [00:02<00:44,  2.80s/it][A
 12%|█▏        | 2/17 [00:02<00:18,  1.23s/it][A
 24%|██▎       | 4/17 [00:03<00:07,  1.85it/s][A
 29%|██▉       | 5/17 [00:04<00:11,  1.09it/s][A
 35%|███▌      | 6/17 [00:05<00:08,  1.34it/s][A
 53%|█████▎    | 9/17 [00:07<00:05,  1.48it/s][A
 59%|█████▉    | 10/17 [00:07<00:04,  1.59it/s][A
 65%|██████▍   | 11/17 [00:07<00:03,  1.96it/s][A
 76%|███████▋  | 13/17 [00:09<00:02,  1.50it/s][A
 82%|████████▏ | 14/17 [00:10<00:01,  1.60it/s][A
 88%|████████▊ | 15/17 [00:10<00:01,  1.83it/s][A
100%|██████████| 17/17 [00:11<00:00,  1.45it/s][A
Epochs:  17%|█▋        | 4/23 [07:22<33:47, 106.70s/it]

Val Loss: 2093.5969 - Val Accuracy: 0.9507



Training:   0%|          | 0/136 [00:00<?, ?it/s][A
Training:   1%|          | 1/136 [00:03<07:24,  3.30s/it][A
Training:   1%|▏         | 2/136 [00:03<03:09,  1.42s/it][A
Training:   2%|▏         | 3/136 [00:03<01:49,  1.22it/s][A
Training:   3%|▎         | 4/136 [00:03<01:12,  1.82it/s][A
Training:   4%|▎         | 5/136 [00:06<02:40,  1.22s/it][A
Training:   6%|▌         | 8/136 [00:06<01:04,  1.99it/s][A
Training:   7%|▋         | 10/136 [00:09<01:45,  1.19it/s][A
Training:   9%|▉         | 12/136 [00:09<01:11,  1.73it/s][A
Training:  10%|█         | 14/136 [00:11<01:39,  1.22it/s][A
Training:  12%|█▎        | 17/136 [00:14<01:36,  1.24it/s][A
Training:  13%|█▎        | 18/136 [00:14<01:21,  1.44it/s][A
Training:  15%|█▍        | 20/136 [00:14<00:57,  2.01it/s][A
Training:  15%|█▌        | 21/136 [00:16<01:35,  1.20it/s][A
Training:  18%|█▊        | 24/136 [00:16<00:53,  2.08it/s][A
Training:  19%|█▉        | 26/136 [00:19<01:22,  1.33it/s][A
Training:  21%|██     

Epoch: 5/23 - Loss: 2016.9435 - Accuracy: 0.9444



  0%|          | 0/17 [00:00<?, ?it/s][A
  6%|▌         | 1/17 [00:02<00:46,  2.90s/it][A
 24%|██▎       | 4/17 [00:03<00:07,  1.73it/s][A
 35%|███▌      | 6/17 [00:05<00:09,  1.19it/s][A
 53%|█████▎    | 9/17 [00:07<00:06,  1.19it/s][A
 76%|███████▋  | 13/17 [00:10<00:02,  1.38it/s][A
100%|██████████| 17/17 [00:12<00:00,  1.38it/s][A
Epochs:  22%|██▏       | 5/23 [09:05<31:38, 105.48s/it]

Val Loss: 2353.5566 - Val Accuracy: 0.9593



Training:   0%|          | 0/136 [00:00<?, ?it/s][A
Training:   1%|          | 1/136 [00:03<07:10,  3.19s/it][A
Training:   1%|▏         | 2/136 [00:03<03:05,  1.38s/it][A
Training:   4%|▎         | 5/136 [00:05<02:12,  1.01s/it][A
Training:   6%|▌         | 8/136 [00:06<01:06,  1.92it/s][A
Training:   7%|▋         | 10/136 [00:08<01:44,  1.21it/s][A
Training:   9%|▉         | 12/136 [00:09<01:12,  1.70it/s][A
Training:  10%|█         | 14/136 [00:11<01:32,  1.31it/s][A
Training:  12%|█▎        | 17/136 [00:13<01:28,  1.34it/s][A
Training:  14%|█▍        | 19/136 [00:13<01:06,  1.76it/s][A
Training:  15%|█▍        | 20/136 [00:13<00:57,  2.03it/s][A
Training:  15%|█▌        | 21/136 [00:16<01:38,  1.17it/s][A
Training:  17%|█▋        | 23/136 [00:16<01:05,  1.74it/s][A
Training:  18%|█▊        | 25/136 [00:19<01:31,  1.21it/s][A
Training:  20%|█▉        | 27/136 [00:19<01:03,  1.71it/s][A
Training:  21%|██▏       | 29/136 [00:21<01:28,  1.21it/s][A
Training:  22%|██▏  

Epoch: 6/23 - Loss: 2181.8806 - Accuracy: 0.9462



  0%|          | 0/17 [00:00<?, ?it/s][A
  6%|▌         | 1/17 [00:03<00:47,  3.00s/it][A
 18%|█▊        | 3/17 [00:03<00:11,  1.22it/s][A
 29%|██▉       | 5/17 [00:05<00:12,  1.03s/it][A
 41%|████      | 7/17 [00:05<00:06,  1.61it/s][A
 53%|█████▎    | 9/17 [00:08<00:06,  1.21it/s][A
 71%|███████   | 12/17 [00:08<00:02,  2.07it/s][A
 82%|████████▏ | 14/17 [00:10<00:02,  1.45it/s][A
100%|██████████| 17/17 [00:12<00:00,  1.35it/s][A
Epochs:  26%|██▌       | 6/23 [10:48<29:34, 104.40s/it]

Val Loss: 2338.7222 - Val Accuracy: 0.9502



Training:   0%|          | 0/136 [00:00<?, ?it/s][A
Training:   1%|          | 1/136 [00:03<07:49,  3.48s/it][A
Training:   1%|▏         | 2/136 [00:03<03:22,  1.51s/it][A
Training:   2%|▏         | 3/136 [00:03<01:59,  1.11it/s][A
Training:   4%|▎         | 5/136 [00:06<02:40,  1.22s/it][A
Training:   5%|▌         | 7/136 [00:06<01:31,  1.42it/s][A
Training:   7%|▋         | 9/136 [00:09<02:03,  1.03it/s][A
Training:   8%|▊         | 11/136 [00:09<01:20,  1.55it/s][A
Training:  10%|▉         | 13/136 [00:12<01:43,  1.19it/s][A
Training:  11%|█         | 15/136 [00:12<01:11,  1.70it/s][A
Training:  12%|█▏        | 16/136 [00:12<00:59,  2.01it/s][A
Training:  12%|█▎        | 17/136 [00:15<01:55,  1.03it/s][A
Training:  14%|█▍        | 19/136 [00:15<01:14,  1.58it/s][A
Training:  15%|█▍        | 20/136 [00:15<01:00,  1.91it/s][A
Training:  15%|█▌        | 21/136 [00:18<02:02,  1.06s/it][A
Training:  16%|█▌        | 22/136 [00:18<01:34,  1.21it/s][A
Training:  18%|█▊     

Epoch: 7/23 - Loss: 2280.2573 - Accuracy: 0.9463



  0%|          | 0/17 [00:00<?, ?it/s][A
  6%|▌         | 1/17 [00:03<00:48,  3.04s/it][A
 24%|██▎       | 4/17 [00:03<00:08,  1.62it/s][A
 35%|███▌      | 6/17 [00:05<00:09,  1.16it/s][A
 47%|████▋     | 8/17 [00:05<00:04,  1.81it/s][A
 59%|█████▉    | 10/17 [00:07<00:05,  1.40it/s][A
 76%|███████▋  | 13/17 [00:10<00:02,  1.35it/s][A
100%|██████████| 17/17 [00:12<00:00,  1.41it/s][A
Epochs:  30%|███       | 7/23 [12:30<27:41, 103.84s/it]

Val Loss: 2474.2122 - Val Accuracy: 0.9477



Training:   0%|          | 0/136 [00:00<?, ?it/s][A
Training:   1%|          | 1/136 [00:03<07:06,  3.16s/it][A
Training:   1%|▏         | 2/136 [00:03<03:06,  1.39s/it][A
Training:   2%|▏         | 3/136 [00:03<01:46,  1.24it/s][A
Training:   4%|▎         | 5/136 [00:05<02:04,  1.06it/s][A
Training:   4%|▍         | 6/136 [00:05<01:33,  1.39it/s][A
Training:   5%|▌         | 7/136 [00:05<01:12,  1.79it/s][A
Training:   7%|▋         | 9/136 [00:08<01:43,  1.23it/s][A
Training:   7%|▋         | 10/136 [00:08<01:24,  1.50it/s][A
Training:  10%|▉         | 13/136 [00:10<01:30,  1.36it/s][A
Training:  10%|█         | 14/136 [00:11<01:20,  1.52it/s][A
Training:  12%|█▎        | 17/136 [00:13<01:26,  1.38it/s][A
Training:  13%|█▎        | 18/136 [00:13<01:15,  1.56it/s][A
Training:  15%|█▌        | 21/136 [00:16<01:24,  1.36it/s][A
Training:  16%|█▌        | 22/136 [00:16<01:13,  1.55it/s][A
Training:  18%|█▊        | 24/136 [00:16<00:51,  2.20it/s][A
Training:  18%|█▊      

Epoch: 8/23 - Loss: 2323.2556 - Accuracy: 0.9444



  0%|          | 0/17 [00:00<?, ?it/s][A
  6%|▌         | 1/17 [00:03<00:50,  3.18s/it][A
 12%|█▏        | 2/17 [00:03<00:21,  1.42s/it][A
 29%|██▉       | 5/17 [00:05<00:10,  1.09it/s][A
 35%|███▌      | 6/17 [00:05<00:08,  1.26it/s][A
 53%|█████▎    | 9/17 [00:07<00:05,  1.47it/s][A
 59%|█████▉    | 10/17 [00:08<00:04,  1.56it/s][A
 76%|███████▋  | 13/17 [00:10<00:02,  1.50it/s][A
 82%|████████▏ | 14/17 [00:10<00:01,  1.62it/s][A
100%|██████████| 17/17 [00:12<00:00,  1.38it/s][A
Epochs:  35%|███▍      | 8/23 [14:11<25:42, 102.85s/it]

Val Loss: 2780.0017 - Val Accuracy: 0.9506



Training:   0%|          | 0/136 [00:00<?, ?it/s][A
Training:   1%|          | 1/136 [00:03<07:58,  3.54s/it][A
Training:   2%|▏         | 3/136 [00:03<02:07,  1.05it/s][A
Training:   4%|▎         | 5/136 [00:05<02:17,  1.05s/it][A
Training:   5%|▌         | 7/136 [00:06<01:20,  1.60it/s][A
Training:   7%|▋         | 9/136 [00:09<02:01,  1.05it/s][A
Training:   8%|▊         | 11/136 [00:09<01:21,  1.53it/s][A
Training:  10%|▉         | 13/136 [00:11<01:48,  1.13it/s][A
Training:  11%|█         | 15/136 [00:12<01:14,  1.62it/s][A
Training:  12%|█▎        | 17/136 [00:14<01:40,  1.18it/s][A
Training:  14%|█▍        | 19/136 [00:14<01:10,  1.66it/s][A
Training:  15%|█▍        | 20/136 [00:14<00:59,  1.95it/s][A
Training:  15%|█▌        | 21/136 [00:17<01:50,  1.04it/s][A
Training:  17%|█▋        | 23/136 [00:17<01:11,  1.57it/s][A
Training:  18%|█▊        | 24/136 [00:17<00:58,  1.90it/s][A
Training:  18%|█▊        | 25/136 [00:20<01:48,  1.03it/s][A
Training:  19%|█▉    

Epoch: 9/23 - Loss: 2391.9839 - Accuracy: 0.9472



  0%|          | 0/17 [00:00<?, ?it/s][A
  6%|▌         | 1/17 [00:02<00:41,  2.58s/it][A
 24%|██▎       | 4/17 [00:02<00:06,  1.91it/s][A
 35%|███▌      | 6/17 [00:04<00:08,  1.31it/s][A
 53%|█████▎    | 9/17 [00:07<00:06,  1.28it/s][A
 59%|█████▉    | 10/17 [00:07<00:04,  1.52it/s][A
 76%|███████▋  | 13/17 [00:09<00:02,  1.42it/s][A
100%|██████████| 17/17 [00:11<00:00,  1.44it/s][A
Epochs:  39%|███▉      | 9/23 [15:56<24:09, 103.57s/it]

Val Loss: 2755.6152 - Val Accuracy: 0.9524



Training:   0%|          | 0/136 [00:00<?, ?it/s][A
Training:   1%|          | 1/136 [00:02<06:17,  2.80s/it][A
Training:   2%|▏         | 3/136 [00:02<01:43,  1.28it/s][A
Training:   4%|▎         | 5/136 [00:05<02:11,  1.00s/it][A
Training:   6%|▌         | 8/136 [00:05<01:03,  2.02it/s][A
Training:   7%|▋         | 10/136 [00:08<01:40,  1.26it/s][A
Training:   8%|▊         | 11/136 [00:08<01:23,  1.51it/s][A
Training:  10%|▉         | 13/136 [00:10<01:44,  1.18it/s][A
Training:  10%|█         | 14/136 [00:10<01:26,  1.41it/s][A
Training:  11%|█         | 15/136 [00:11<01:09,  1.74it/s][A
Training:  12%|█▏        | 16/136 [00:11<00:56,  2.12it/s][A
Training:  12%|█▎        | 17/136 [00:13<01:51,  1.07it/s][A
Training:  13%|█▎        | 18/136 [00:13<01:28,  1.33it/s][A
Training:  15%|█▍        | 20/136 [00:13<00:54,  2.13it/s][A
Training:  15%|█▌        | 21/136 [00:16<01:39,  1.15it/s][A
Training:  16%|█▌        | 22/136 [00:16<01:23,  1.36it/s][A
Training:  18%|█▊   

Epoch: 10/23 - Loss: 2350.8818 - Accuracy: 0.9495



  0%|          | 0/17 [00:00<?, ?it/s][A
  6%|▌         | 1/17 [00:02<00:39,  2.50s/it][A
 24%|██▎       | 4/17 [00:02<00:06,  1.99it/s][A
 35%|███▌      | 6/17 [00:04<00:08,  1.32it/s][A
 47%|████▋     | 8/17 [00:04<00:04,  2.01it/s][A
 59%|█████▉    | 10/17 [00:07<00:05,  1.34it/s][A
 65%|██████▍   | 11/17 [00:07<00:03,  1.61it/s][A
 76%|███████▋  | 13/17 [00:09<00:03,  1.17it/s][A
100%|██████████| 17/17 [00:12<00:00,  1.41it/s][A
Epochs:  43%|████▎     | 10/23 [17:39<22:22, 103.25s/it]

Val Loss: 2556.0166 - Val Accuracy: 0.9496



Training:   0%|          | 0/136 [00:00<?, ?it/s][A
Training:   1%|          | 1/136 [00:02<06:21,  2.82s/it][A
Training:   3%|▎         | 4/136 [00:02<01:14,  1.78it/s][A
Training:   4%|▍         | 6/136 [00:05<01:52,  1.16it/s][A
Training:   6%|▌         | 8/136 [00:05<01:11,  1.79it/s][A
Training:   7%|▋         | 10/136 [00:08<01:44,  1.20it/s][A
Training:  10%|▉         | 13/136 [00:10<01:44,  1.18it/s][A
Training:  10%|█         | 14/136 [00:10<01:28,  1.38it/s][A
Training:  12%|█▏        | 16/136 [00:11<01:00,  1.98it/s][A
Training:  12%|█▎        | 17/136 [00:13<01:45,  1.13it/s][A
Training:  14%|█▍        | 19/136 [00:13<01:11,  1.64it/s][A
Training:  15%|█▌        | 21/136 [00:16<01:33,  1.23it/s][A
Training:  17%|█▋        | 23/136 [00:16<01:05,  1.74it/s][A
Training:  18%|█▊        | 25/136 [00:18<01:27,  1.27it/s][A
Training:  20%|█▉        | 27/136 [00:18<01:01,  1.78it/s][A
Training:  21%|██▏       | 29/136 [00:21<01:22,  1.29it/s][A
Training:  24%|██▎  

Epoch: 11/23 - Loss: 2400.9495 - Accuracy: 0.9492



  0%|          | 0/17 [00:00<?, ?it/s][A
  6%|▌         | 1/17 [00:02<00:41,  2.61s/it][A
 24%|██▎       | 4/17 [00:02<00:06,  1.87it/s][A
 35%|███▌      | 6/17 [00:04<00:08,  1.32it/s][A
 47%|████▋     | 8/17 [00:04<00:04,  2.03it/s][A
 59%|█████▉    | 10/17 [00:07<00:04,  1.44it/s][A
 71%|███████   | 12/17 [00:07<00:02,  2.04it/s][A
 76%|███████▋  | 13/17 [00:09<00:03,  1.25it/s][A
100%|██████████| 17/17 [00:11<00:00,  1.49it/s][A
Epochs:  48%|████▊     | 11/23 [19:19<20:28, 102.41s/it]

Val Loss: 3314.7671 - Val Accuracy: 0.9575



Training:   0%|          | 0/136 [00:00<?, ?it/s][A
Training:   1%|          | 1/136 [00:03<07:13,  3.21s/it][A
Training:   2%|▏         | 3/136 [00:03<01:56,  1.14it/s][A
Training:   3%|▎         | 4/136 [00:03<01:21,  1.62it/s][A
Training:   4%|▎         | 5/136 [00:05<02:43,  1.25s/it][A
Training:   4%|▍         | 6/136 [00:06<01:54,  1.13it/s][A
Training:   6%|▌         | 8/136 [00:06<01:05,  1.95it/s][A
Training:   7%|▋         | 9/136 [00:09<02:16,  1.07s/it][A
Training:   8%|▊         | 11/136 [00:09<01:22,  1.52it/s][A
Training:   9%|▉         | 12/136 [00:09<01:05,  1.89it/s][A
Training:  10%|▉         | 13/136 [00:11<02:10,  1.06s/it][A
Training:  11%|█         | 15/136 [00:12<01:19,  1.52it/s][A
Training:  12%|█▎        | 17/136 [00:14<01:44,  1.14it/s][A
Training:  13%|█▎        | 18/136 [00:14<01:24,  1.39it/s][A
Training:  14%|█▍        | 19/136 [00:14<01:07,  1.72it/s][A
Training:  15%|█▍        | 20/136 [00:15<00:53,  2.15it/s][A
Training:  15%|█▌      

Epoch: 12/23 - Loss: 2630.2207 - Accuracy: 0.9508



  0%|          | 0/17 [00:00<?, ?it/s][A
  6%|▌         | 1/17 [00:02<00:43,  2.70s/it][A
 12%|█▏        | 2/17 [00:02<00:18,  1.20s/it][A
 18%|█▊        | 3/17 [00:03<00:10,  1.37it/s][A
 29%|██▉       | 5/17 [00:05<00:10,  1.14it/s][A
 35%|███▌      | 6/17 [00:05<00:07,  1.43it/s][A
 41%|████      | 7/17 [00:05<00:05,  1.86it/s][A
 53%|█████▎    | 9/17 [00:07<00:05,  1.42it/s][A
 59%|█████▉    | 10/17 [00:07<00:04,  1.63it/s][A
 65%|██████▍   | 11/17 [00:07<00:02,  2.01it/s][A
 76%|███████▋  | 13/17 [00:09<00:02,  1.69it/s][A
 82%|████████▏ | 14/17 [00:09<00:01,  2.02it/s][A
 88%|████████▊ | 15/17 [00:09<00:00,  2.33it/s][A
100%|██████████| 17/17 [00:10<00:00,  1.57it/s][A
Epochs:  52%|█████▏    | 12/23 [21:01<18:42, 102.03s/it]

Val Loss: 2956.8889 - Val Accuracy: 0.9617



Training:   0%|          | 0/136 [00:00<?, ?it/s][A
Training:   1%|          | 1/136 [00:03<06:59,  3.11s/it][A
Training:   2%|▏         | 3/136 [00:03<01:54,  1.16it/s][A
Training:   4%|▎         | 5/136 [00:05<02:18,  1.06s/it][A
Training:   4%|▍         | 6/136 [00:05<01:45,  1.23it/s][A
Training:   5%|▌         | 7/136 [00:06<01:20,  1.61it/s][A
Training:   6%|▌         | 8/136 [00:06<01:01,  2.10it/s][A
Training:   7%|▋         | 9/136 [00:08<02:08,  1.01s/it][A
Training:   8%|▊         | 11/136 [00:08<01:19,  1.58it/s][A
Training:  10%|▉         | 13/136 [00:11<01:40,  1.22it/s][A
Training:  10%|█         | 14/136 [00:11<01:22,  1.48it/s][A
Training:  11%|█         | 15/136 [00:11<01:13,  1.66it/s][A
Training:  12%|█▎        | 17/136 [00:13<01:38,  1.21it/s][A
Training:  14%|█▍        | 19/136 [00:14<01:08,  1.72it/s][A
Training:  15%|█▌        | 21/136 [00:16<01:28,  1.30it/s][A
Training:  17%|█▋        | 23/136 [00:16<01:04,  1.76it/s][A
Training:  18%|█▊      

Epoch: 13/23 - Loss: 2466.7434 - Accuracy: 0.9507



  0%|          | 0/17 [00:00<?, ?it/s][A
  6%|▌         | 1/17 [00:02<00:36,  2.27s/it][A
 18%|█▊        | 3/17 [00:02<00:09,  1.54it/s][A
 29%|██▉       | 5/17 [00:04<00:09,  1.21it/s][A
 41%|████      | 7/17 [00:04<00:05,  1.85it/s][A
 53%|█████▎    | 9/17 [00:06<00:05,  1.41it/s][A
 59%|█████▉    | 10/17 [00:06<00:04,  1.71it/s][A
 65%|██████▍   | 11/17 [00:06<00:02,  2.08it/s][A
 76%|███████▋  | 13/17 [00:08<00:02,  1.48it/s][A
100%|██████████| 17/17 [00:10<00:00,  1.59it/s][A
Epochs:  57%|█████▋    | 13/23 [22:41<16:54, 101.46s/it]

Val Loss: 2814.9167 - Val Accuracy: 0.9547



Training:   0%|          | 0/136 [00:00<?, ?it/s][A
Training:   1%|          | 1/136 [00:02<06:39,  2.96s/it][A
Training:   2%|▏         | 3/136 [00:03<01:49,  1.22it/s][A
Training:   4%|▎         | 5/136 [00:05<02:21,  1.08s/it][A
Training:   4%|▍         | 6/136 [00:05<01:46,  1.22it/s][A
Training:   5%|▌         | 7/136 [00:05<01:19,  1.61it/s][A
Training:   6%|▌         | 8/136 [00:06<01:00,  2.12it/s][A
Training:   7%|▋         | 9/136 [00:08<02:11,  1.04s/it][A
Training:   7%|▋         | 10/136 [00:08<01:41,  1.25it/s][A
Training:   9%|▉         | 12/136 [00:08<00:58,  2.12it/s][A
Training:  10%|▉         | 13/136 [00:11<01:59,  1.03it/s][A
Training:  10%|█         | 14/136 [00:11<01:39,  1.23it/s][A
Training:  11%|█         | 15/136 [00:11<01:15,  1.59it/s][A
Training:  12%|█▎        | 17/136 [00:14<01:43,  1.15it/s][A
Training:  13%|█▎        | 18/136 [00:14<01:29,  1.33it/s][A
Training:  14%|█▍        | 19/136 [00:14<01:09,  1.69it/s][A
Training:  15%|█▌      

Epoch: 14/23 - Loss: 2485.2495 - Accuracy: 0.9493



  0%|          | 0/17 [00:00<?, ?it/s][A
  6%|▌         | 1/17 [00:02<00:40,  2.56s/it][A
 18%|█▊        | 3/17 [00:02<00:09,  1.41it/s][A
 29%|██▉       | 5/17 [00:04<00:09,  1.22it/s][A
 47%|████▋     | 8/17 [00:04<00:03,  2.43it/s][A
 59%|█████▉    | 10/17 [00:06<00:04,  1.59it/s][A
 71%|███████   | 12/17 [00:06<00:02,  2.24it/s][A
 82%|████████▏ | 14/17 [00:08<00:01,  1.67it/s][A
 88%|████████▊ | 15/17 [00:08<00:01,  1.97it/s][A
100%|██████████| 17/17 [00:10<00:00,  1.59it/s][A
Epochs:  61%|██████    | 14/23 [24:26<15:22, 102.52s/it]

Val Loss: 3188.5842 - Val Accuracy: 0.9483



Training:   0%|          | 0/136 [00:00<?, ?it/s][A
Training:   1%|          | 1/136 [00:03<07:19,  3.26s/it][A
Training:   2%|▏         | 3/136 [00:03<01:58,  1.12it/s][A
Training:   4%|▎         | 5/136 [00:05<02:24,  1.10s/it][A
Training:   5%|▌         | 7/136 [00:06<01:25,  1.51it/s][A
Training:   7%|▋         | 9/136 [00:08<01:49,  1.16it/s][A
Training:   8%|▊         | 11/136 [00:08<01:12,  1.73it/s][A
Training:  10%|▉         | 13/136 [00:11<01:39,  1.23it/s][A
Training:  10%|█         | 14/136 [00:11<01:22,  1.48it/s][A
Training:  12%|█▏        | 16/136 [00:11<00:54,  2.19it/s][A
Training:  13%|█▎        | 18/136 [00:14<01:31,  1.28it/s][A
Training:  15%|█▌        | 21/136 [00:17<01:36,  1.19it/s][A
Training:  17%|█▋        | 23/136 [00:17<01:11,  1.58it/s][A
Training:  18%|█▊        | 25/136 [00:19<01:28,  1.26it/s][A
Training:  20%|█▉        | 27/136 [00:19<01:03,  1.72it/s][A
Training:  21%|██▏       | 29/136 [00:22<01:27,  1.23it/s][A
Training:  23%|██▎   

Epoch: 15/23 - Loss: 2400.4485 - Accuracy: 0.9527



  0%|          | 0/17 [00:00<?, ?it/s][A
  6%|▌         | 1/17 [00:06<01:45,  6.59s/it][A
 12%|█▏        | 2/17 [00:07<00:44,  2.96s/it][A
 24%|██▎       | 4/17 [00:07<00:14,  1.13s/it][A
 29%|██▉       | 5/17 [00:11<00:26,  2.20s/it][A
 35%|███▌      | 6/17 [00:11<00:17,  1.58s/it][A
 41%|████      | 7/17 [00:12<00:11,  1.17s/it][A
 53%|█████▎    | 9/17 [00:16<00:12,  1.56s/it][A
 59%|█████▉    | 10/17 [00:16<00:08,  1.25s/it][A
 65%|██████▍   | 11/17 [00:16<00:05,  1.04it/s][A
 71%|███████   | 12/17 [00:16<00:03,  1.32it/s][A
 76%|███████▋  | 13/17 [00:20<00:06,  1.66s/it][A
 82%|████████▏ | 14/17 [00:21<00:04,  1.40s/it][A
100%|██████████| 17/17 [00:26<00:00,  1.56s/it][A


Val Loss: 2750.9565 - Val Accuracy: 0.9593


Epochs:  65%|██████▌   | 15/23 [27:05<15:56, 119.56s/it]
Training:   0%|          | 0/136 [00:00<?, ?it/s][A
Training:   1%|          | 1/136 [00:07<16:35,  7.38s/it][A
Training:   1%|▏         | 2/136 [00:07<06:55,  3.10s/it][A
Training:   2%|▏         | 3/136 [00:07<04:05,  1.85s/it][A
Training:   3%|▎         | 4/136 [00:08<02:39,  1.21s/it][A
Training:   4%|▎         | 5/136 [00:13<06:00,  2.75s/it][A
Training:   4%|▍         | 6/136 [00:13<04:00,  1.85s/it][A
Training:   5%|▌         | 7/136 [00:14<03:02,  1.41s/it][A
Training:   6%|▌         | 8/136 [00:14<02:16,  1.07s/it][A
Training:   7%|▋         | 9/136 [00:19<04:46,  2.26s/it][A
Training:   7%|▋         | 10/136 [00:19<03:21,  1.60s/it][A
Training:   8%|▊         | 11/136 [00:20<02:44,  1.32s/it][A
Training:   9%|▉         | 12/136 [00:20<01:57,  1.06it/s][A
Training:  10%|▉         | 13/136 [00:25<04:17,  2.09s/it][A
Training:  10%|█         | 14/136 [00:25<03:15,  1.60s/it][A
Training:  11%|█         | 15/1

Epoch: 16/23 - Loss: 2475.6519 - Accuracy: 0.9533



  0%|          | 0/17 [00:00<?, ?it/s][A
  6%|▌         | 1/17 [00:06<01:44,  6.53s/it][A
 12%|█▏        | 2/17 [00:06<00:42,  2.86s/it][A
 24%|██▎       | 4/17 [00:06<00:14,  1.11s/it][A
 29%|██▉       | 5/17 [00:11<00:25,  2.14s/it][A
 35%|███▌      | 6/17 [00:11<00:16,  1.54s/it][A
 41%|████      | 7/17 [00:11<00:11,  1.16s/it][A
 47%|████▋     | 8/17 [00:12<00:07,  1.15it/s][A
 53%|█████▎    | 9/17 [00:16<00:15,  1.96s/it][A
 65%|██████▍   | 11/17 [00:16<00:06,  1.08s/it][A
 76%|███████▋  | 13/17 [00:20<00:05,  1.39s/it][A
 82%|████████▏ | 14/17 [00:21<00:03,  1.22s/it][A
 94%|█████████▍| 16/17 [00:21<00:00,  1.29it/s][A
100%|██████████| 17/17 [00:24<00:00,  1.46s/it][A
Epochs:  70%|██████▉   | 16/23 [30:56<17:51, 153.04s/it]

Val Loss: 2910.0017 - Val Accuracy: 0.9622



Training:   0%|          | 0/136 [00:00<?, ?it/s][A
Training:   1%|          | 1/136 [00:06<15:32,  6.90s/it][A
Training:   1%|▏         | 2/136 [00:07<06:29,  2.91s/it][A
Training:   2%|▏         | 3/136 [00:07<03:54,  1.76s/it][A
Training:   3%|▎         | 4/136 [00:07<02:30,  1.14s/it][A
Training:   4%|▎         | 5/136 [00:12<05:34,  2.55s/it][A
Training:   4%|▍         | 6/136 [00:12<03:47,  1.75s/it][A
Training:   5%|▌         | 7/136 [00:13<02:49,  1.31s/it][A
Training:   6%|▌         | 8/136 [00:13<02:01,  1.05it/s][A
Training:   7%|▋         | 9/136 [00:19<05:25,  2.57s/it][A
Training:   7%|▋         | 10/136 [00:19<03:52,  1.85s/it][A
Training:   8%|▊         | 11/136 [00:19<02:45,  1.33s/it][A
Training:   9%|▉         | 12/136 [00:20<02:00,  1.03it/s][A
Training:  10%|▉         | 13/136 [00:24<04:09,  2.03s/it][A
Training:  10%|█         | 14/136 [00:25<03:19,  1.63s/it][A
Training:  11%|█         | 15/136 [00:25<02:27,  1.22s/it][A
Training:  12%|█▏        

Epoch: 17/23 - Loss: 2572.0659 - Accuracy: 0.9512



  0%|          | 0/17 [00:00<?, ?it/s][A
  6%|▌         | 1/17 [00:56<15:02, 56.38s/it][A
 12%|█▏        | 2/17 [00:56<05:49, 23.30s/it][A
 18%|█▊        | 3/17 [00:56<02:58, 12.72s/it][A
 24%|██▎       | 4/17 [00:56<01:40,  7.76s/it][A
 29%|██▉       | 5/17 [00:57<01:00,  5.08s/it][A
 35%|███▌      | 6/17 [00:57<00:37,  3.41s/it][A
 41%|████      | 7/17 [00:57<00:23,  2.35s/it][A
 47%|████▋     | 8/17 [00:57<00:14,  1.65s/it][A
 53%|█████▎    | 9/17 [01:01<00:18,  2.28s/it][A
 59%|█████▉    | 10/17 [01:01<00:11,  1.61s/it][A
 65%|██████▍   | 11/17 [01:02<00:08,  1.34s/it][A
 71%|███████   | 12/17 [01:02<00:04,  1.04it/s][A
 76%|███████▋  | 13/17 [01:06<00:07,  1.92s/it][A
 82%|████████▏ | 14/17 [01:06<00:04,  1.39s/it][A
 88%|████████▊ | 15/17 [01:06<00:02,  1.07s/it][A
100%|██████████| 17/17 [01:10<00:00,  4.14s/it][A
Epochs:  74%|███████▍  | 17/23 [35:40<19:15, 192.55s/it]

Val Loss: 3193.1338 - Val Accuracy: 0.9512



Training:   0%|          | 0/136 [00:00<?, ?it/s][A
Training:   1%|          | 1/136 [00:07<16:22,  7.28s/it][A
Training:   1%|▏         | 2/136 [00:08<07:47,  3.49s/it][A
Training:   2%|▏         | 3/136 [00:08<04:31,  2.04s/it][A
Training:   3%|▎         | 4/136 [00:08<02:49,  1.28s/it][A
Training:   4%|▎         | 5/136 [00:13<05:23,  2.47s/it][A
Training:   4%|▍         | 6/136 [00:14<04:31,  2.09s/it][A
Training:   5%|▌         | 7/136 [00:14<03:10,  1.48s/it][A
Training:   6%|▌         | 8/136 [00:14<02:19,  1.09s/it][A
Training:   7%|▋         | 9/136 [00:19<04:14,  2.00s/it][A
Training:   7%|▋         | 10/136 [00:20<03:48,  1.81s/it][A
Training:   8%|▊         | 11/136 [00:20<02:42,  1.30s/it][A
Training:   9%|▉         | 12/136 [00:20<01:57,  1.06it/s][A
Training:  10%|▉         | 13/136 [00:24<03:48,  1.86s/it][A
Training:  10%|█         | 14/136 [00:25<03:20,  1.65s/it][A
Training:  11%|█         | 15/136 [00:26<02:29,  1.23s/it][A
Training:  12%|█▎        

Epoch: 18/23 - Loss: 2670.7278 - Accuracy: 0.9507



  0%|          | 0/17 [00:00<?, ?it/s][A
  6%|▌         | 1/17 [00:06<01:42,  6.43s/it][A
 12%|█▏        | 2/17 [00:06<00:42,  2.80s/it][A
 18%|█▊        | 3/17 [00:06<00:22,  1.60s/it][A
 24%|██▎       | 4/17 [00:07<00:13,  1.07s/it][A
 29%|██▉       | 5/17 [00:11<00:28,  2.40s/it][A
 35%|███▌      | 6/17 [00:12<00:18,  1.65s/it][A
 41%|████      | 7/17 [00:13<00:14,  1.44s/it][A
 47%|████▋     | 8/17 [00:13<00:09,  1.03s/it][A
 53%|█████▎    | 9/17 [00:16<00:14,  1.78s/it][A
 65%|██████▍   | 11/17 [00:18<00:08,  1.37s/it][A
 71%|███████   | 12/17 [00:18<00:05,  1.06s/it][A
 76%|███████▋  | 13/17 [00:21<00:06,  1.56s/it][A
 88%|████████▊ | 15/17 [00:23<00:02,  1.25s/it][A
100%|██████████| 17/17 [00:25<00:00,  1.52s/it][A
Epochs:  78%|███████▊  | 18/23 [39:27<16:54, 202.83s/it]

Val Loss: 2961.1575 - Val Accuracy: 0.9513



Training:   0%|          | 0/136 [00:00<?, ?it/s][A
Training:   1%|          | 1/136 [00:08<19:56,  8.86s/it][A
Training:   1%|▏         | 2/136 [00:09<08:27,  3.79s/it][A
Training:   2%|▏         | 3/136 [00:09<04:40,  2.11s/it][A
Training:   3%|▎         | 4/136 [00:09<03:02,  1.38s/it][A
Training:   4%|▎         | 5/136 [00:15<06:40,  3.05s/it][A
Training:   4%|▍         | 6/136 [00:15<04:41,  2.16s/it][A
Training:   5%|▌         | 7/136 [00:16<03:18,  1.54s/it][A
Training:   6%|▌         | 8/136 [00:16<02:22,  1.12s/it][A
Training:   7%|▋         | 9/136 [00:22<05:54,  2.79s/it][A
Training:   8%|▊         | 11/136 [00:22<03:07,  1.50s/it][A
Training:  10%|▉         | 13/136 [00:29<04:42,  2.30s/it][A
Training:  11%|█         | 15/136 [00:30<03:00,  1.49s/it][A
Training:  12%|█▏        | 16/136 [00:30<02:25,  1.22s/it][A
Training:  12%|█▎        | 17/136 [00:36<04:33,  2.30s/it][A
Training:  14%|█▍        | 19/136 [00:36<02:47,  1.43s/it][A
Training:  15%|█▍        

Epoch: 19/23 - Loss: 2634.0659 - Accuracy: 0.9536



  0%|          | 0/17 [00:00<?, ?it/s][A
  6%|▌         | 1/17 [00:04<01:13,  4.60s/it][A
 18%|█▊        | 3/17 [00:04<00:17,  1.24s/it][A
 29%|██▉       | 5/17 [00:08<00:17,  1.49s/it][A
 35%|███▌      | 6/17 [00:08<00:12,  1.12s/it][A
 41%|████      | 7/17 [00:08<00:08,  1.19it/s][A
 47%|████▋     | 8/17 [00:08<00:05,  1.57it/s][A
 53%|█████▎    | 9/17 [00:11<00:11,  1.42s/it][A
 59%|█████▉    | 10/17 [00:12<00:07,  1.06s/it][A
 71%|███████   | 12/17 [00:12<00:03,  1.64it/s][A
 76%|███████▋  | 13/17 [00:15<00:05,  1.25s/it][A
 94%|█████████▍| 16/17 [00:15<00:00,  1.52it/s][A
100%|██████████| 17/17 [00:18<00:00,  1.09s/it][A
Epochs:  83%|████████▎ | 19/23 [42:54<13:36, 204.05s/it]

Val Loss: 3027.1191 - Val Accuracy: 0.9421



Training:   0%|          | 0/136 [00:00<?, ?it/s][A
Training:   1%|          | 1/136 [00:04<11:09,  4.96s/it][A
Training:   2%|▏         | 3/136 [00:05<03:00,  1.36s/it][A
Training:   3%|▎         | 4/136 [00:05<02:10,  1.01it/s][A
Training:   4%|▎         | 5/136 [00:09<04:07,  1.89s/it][A
Training:   4%|▍         | 6/136 [00:09<02:54,  1.34s/it][A
Training:   5%|▌         | 7/136 [00:09<02:04,  1.03it/s][A
Training:   6%|▌         | 8/136 [00:09<01:35,  1.34it/s][A
Training:   7%|▋         | 9/136 [00:13<03:18,  1.56s/it][A
Training:   7%|▋         | 10/136 [00:13<02:29,  1.19s/it][A
Training:   8%|▊         | 11/136 [00:13<01:54,  1.09it/s][A
Training:   9%|▉         | 12/136 [00:13<01:23,  1.48it/s][A
Training:  10%|▉         | 13/136 [00:17<03:25,  1.67s/it][A
Training:  12%|█▏        | 16/136 [00:18<01:35,  1.25it/s][A
Training:  12%|█▎        | 17/136 [00:21<02:48,  1.42s/it][A
Training:  13%|█▎        | 18/136 [00:22<02:20,  1.19s/it][A
Training:  14%|█▍       

Epoch: 20/23 - Loss: 2805.3245 - Accuracy: 0.9543



  0%|          | 0/17 [00:00<?, ?it/s][A
  6%|▌         | 1/17 [00:04<01:13,  4.59s/it][A
 18%|█▊        | 3/17 [00:04<00:17,  1.23s/it][A
 24%|██▎       | 4/17 [00:04<00:11,  1.16it/s][A
 29%|██▉       | 5/17 [00:08<00:20,  1.71s/it][A
 41%|████      | 7/17 [00:08<00:09,  1.09it/s][A
 47%|████▋     | 8/17 [00:08<00:06,  1.40it/s][A
 53%|█████▎    | 9/17 [00:11<00:10,  1.37s/it][A
 65%|██████▍   | 11/17 [00:11<00:04,  1.24it/s][A
 76%|███████▋  | 13/17 [00:15<00:05,  1.25s/it][A
 82%|████████▏ | 14/17 [00:15<00:03,  1.01s/it][A
 88%|████████▊ | 15/17 [00:16<00:01,  1.23it/s][A
100%|██████████| 17/17 [00:19<00:00,  1.14s/it][A
Epochs:  87%|████████▋ | 20/23 [45:43<09:41, 193.78s/it]

Val Loss: 4097.6426 - Val Accuracy: 0.9604



Training:   0%|          | 0/136 [00:00<?, ?it/s][A
Training:   1%|          | 1/136 [00:05<11:46,  5.24s/it][A
Training:   1%|▏         | 2/136 [00:05<05:16,  2.37s/it][A
Training:   3%|▎         | 4/136 [00:05<02:01,  1.09it/s][A
Training:   4%|▎         | 5/136 [00:09<03:39,  1.68s/it][A
Training:   4%|▍         | 6/136 [00:10<03:13,  1.49s/it][A
Training:   5%|▌         | 7/136 [00:10<02:20,  1.09s/it][A
Training:   6%|▌         | 8/136 [00:10<01:42,  1.25it/s][A
Training:   7%|▋         | 9/136 [00:13<03:09,  1.49s/it][A
Training:   7%|▋         | 10/136 [00:14<02:48,  1.34s/it][A
Training:   8%|▊         | 11/136 [00:14<02:02,  1.02it/s][A
Training:  10%|▉         | 13/136 [00:18<02:46,  1.35s/it][A
Training:  10%|█         | 14/136 [00:18<02:23,  1.18s/it][A
Training:  11%|█         | 15/136 [00:19<01:52,  1.08it/s][A
Training:  12%|█▏        | 16/136 [00:19<01:27,  1.37it/s][A
Training:  12%|█▎        | 17/136 [00:22<02:57,  1.49s/it][A
Training:  13%|█▎       

Epoch: 21/23 - Loss: 2629.8652 - Accuracy: 0.9541



  0%|          | 0/17 [00:00<?, ?it/s][A
  6%|▌         | 1/17 [00:05<01:20,  5.01s/it][A
 12%|█▏        | 2/17 [00:05<00:32,  2.14s/it][A
 18%|█▊        | 3/17 [00:05<00:17,  1.26s/it][A
 29%|██▉       | 5/17 [00:08<00:16,  1.37s/it][A
 41%|████      | 7/17 [00:08<00:08,  1.23it/s][A
 47%|████▋     | 8/17 [00:08<00:06,  1.46it/s][A
 53%|█████▎    | 9/17 [00:11<00:10,  1.25s/it][A
 59%|█████▉    | 10/17 [00:11<00:06,  1.06it/s][A
 71%|███████   | 12/17 [00:12<00:02,  1.69it/s][A
 76%|███████▋  | 13/17 [00:15<00:04,  1.17s/it][A
 82%|████████▏ | 14/17 [00:15<00:03,  1.00s/it][A
 88%|████████▊ | 15/17 [00:15<00:01,  1.29it/s][A
 94%|█████████▍| 16/17 [00:15<00:00,  1.65it/s][A
100%|██████████| 17/17 [00:18<00:00,  1.09s/it][A
Epochs:  91%|█████████▏| 21/23 [48:28<06:09, 184.92s/it]

Val Loss: 3518.0137 - Val Accuracy: 0.9650



Training:   0%|          | 0/136 [00:00<?, ?it/s][A
Training:   1%|          | 1/136 [00:05<11:56,  5.31s/it][A
Training:   1%|▏         | 2/136 [00:05<05:04,  2.27s/it][A
Training:   2%|▏         | 3/136 [00:05<02:54,  1.31s/it][A
Training:   3%|▎         | 4/136 [00:05<01:53,  1.16it/s][A
Training:   4%|▎         | 5/136 [00:09<03:53,  1.79s/it][A
Training:   4%|▍         | 6/136 [00:09<02:39,  1.23s/it][A
Training:   7%|▋         | 9/136 [00:13<02:53,  1.37s/it][A
Training:   7%|▋         | 10/136 [00:13<02:19,  1.11s/it][A
Training:   8%|▊         | 11/136 [00:14<01:51,  1.12it/s][A
Training:   9%|▉         | 12/136 [00:14<01:27,  1.41it/s][A
Training:  10%|▉         | 13/136 [00:18<03:07,  1.52s/it][A
Training:  10%|█         | 14/136 [00:18<02:23,  1.18s/it][A
Training:  11%|█         | 15/136 [00:18<01:45,  1.15it/s][A
Training:  12%|█▏        | 16/136 [00:18<01:21,  1.47it/s][A
Training:  12%|█▎        | 17/136 [00:22<03:06,  1.57s/it][A
Training:  13%|█▎      

Epoch: 22/23 - Loss: 2643.7385 - Accuracy: 0.9539



  0%|          | 0/17 [00:00<?, ?it/s][A
  6%|▌         | 1/17 [00:04<01:13,  4.59s/it][A
 12%|█▏        | 2/17 [00:04<00:29,  1.97s/it][A
 24%|██▎       | 4/17 [00:04<00:10,  1.28it/s][A
 29%|██▉       | 5/17 [00:08<00:19,  1.64s/it][A
 41%|████      | 7/17 [00:08<00:09,  1.11it/s][A
 53%|█████▎    | 9/17 [00:12<00:09,  1.24s/it][A
 59%|█████▉    | 10/17 [00:12<00:06,  1.01it/s][A
 65%|██████▍   | 11/17 [00:12<00:04,  1.28it/s][A
 71%|███████   | 12/17 [00:12<00:03,  1.61it/s][A
 76%|███████▋  | 13/17 [00:14<00:04,  1.13s/it][A
 88%|████████▊ | 15/17 [00:15<00:01,  1.46it/s][A
 94%|█████████▍| 16/17 [00:15<00:00,  1.61it/s][A
100%|██████████| 17/17 [00:18<00:00,  1.07s/it][A
Epochs:  96%|█████████▌| 22/23 [51:08<02:57, 177.43s/it]

Val Loss: 3634.8757 - Val Accuracy: 0.9565



Training:   0%|          | 0/136 [00:00<?, ?it/s][A
Training:   1%|          | 1/136 [00:05<12:54,  5.74s/it][A
Training:   1%|▏         | 2/136 [00:05<05:33,  2.49s/it][A
Training:   2%|▏         | 3/136 [00:06<03:11,  1.44s/it][A
Training:   3%|▎         | 4/136 [00:06<02:02,  1.08it/s][A
Training:   4%|▎         | 5/136 [00:09<04:03,  1.86s/it][A
Training:   4%|▍         | 6/136 [00:09<02:46,  1.28s/it][A
Training:   5%|▌         | 7/136 [00:10<02:00,  1.07it/s][A
Training:   6%|▌         | 8/136 [00:10<01:26,  1.48it/s][A
Training:   7%|▋         | 9/136 [00:14<03:38,  1.72s/it][A
Training:   8%|▊         | 11/136 [00:14<01:59,  1.04it/s][A
Training:   9%|▉         | 12/136 [00:14<01:35,  1.30it/s][A
Training:  10%|▉         | 13/136 [00:18<03:04,  1.50s/it][A
Training:  10%|█         | 14/136 [00:18<02:16,  1.12s/it][A
Training:  11%|█         | 15/136 [00:18<01:44,  1.15it/s][A
Training:  12%|█▎        | 17/136 [00:22<02:39,  1.34s/it][A
Training:  14%|█▍        

Epoch: 23/23 - Loss: 2548.5808 - Accuracy: 0.9544



  0%|          | 0/17 [00:00<?, ?it/s][A
  6%|▌         | 1/17 [00:02<00:45,  2.86s/it][A
 18%|█▊        | 3/17 [00:02<00:10,  1.28it/s][A
 29%|██▉       | 5/17 [00:05<00:11,  1.08it/s][A
 41%|████      | 7/17 [00:05<00:05,  1.81it/s][A
 53%|█████▎    | 9/17 [00:07<00:06,  1.29it/s][A
 65%|██████▍   | 11/17 [00:07<00:03,  1.91it/s][A
 76%|███████▋  | 13/17 [00:09<00:02,  1.46it/s][A
100%|██████████| 17/17 [00:11<00:00,  1.51it/s][A
Epochs: 100%|██████████| 23/23 [53:10<00:00, 138.71s/it]


Val Loss: 3646.2012 - Val Accuracy: 0.9483


[32m[I 2023-12-08 11:49:44,713][0m Trial 1 finished with value: 0.9483182430267334 and parameters: {'loss_learning_rate': 0.0037047485989424762, 'learning_rate': 0.02088792830186936, 'weight_decay': 0.003283560684544378, 'epsilon': 7.115743039074607e-09, 'beta': 0.5, 'gamma': 0.2, 'batch_size': 103, 'epochs': 23}. Best is trial 0 with value: 0.9648317694664001.[0m


Learning rate for Loss: 0.0008958261761009699
Learning rate: 1.5218716314145224e-05
Weight decay: 0.0049081536466633905
Epsilon: 1.7968823637993475e-08
Beta: 0.4
Gamma: 0.5
Batch size: 186
Number of epochs: 88


Epochs:   0%|          | 0/88 [00:00<?, ?it/s]
Training:   0%|          | 0/76 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/76 [00:05<06:27,  5.17s/it][A
Training:   3%|▎         | 2/76 [00:05<02:49,  2.29s/it][A
Training:   4%|▍         | 3/76 [00:05<01:34,  1.29s/it][A
Training:   7%|▋         | 5/76 [00:10<02:13,  1.88s/it][A
Training:   9%|▉         | 7/76 [00:10<01:14,  1.08s/it][A
Training:  12%|█▏        | 9/76 [00:15<01:44,  1.56s/it][A
Training:  13%|█▎        | 10/76 [00:15<01:22,  1.25s/it][A
Training:  16%|█▌        | 12/76 [00:15<00:51,  1.25it/s][A
Training:  17%|█▋        | 13/76 [00:20<01:43,  1.65s/it][A
Training:  20%|█▉        | 15/76 [00:20<01:04,  1.05s/it][A
Training:  21%|██        | 16/76 [00:20<00:51,  1.17it/s][A
Training:  22%|██▏       | 17/76 [00:24<01:36,  1.63s/it][A
Training:  24%|██▎       | 18/76 [00:24<01:12,  1.26s/it][A
Training:  25%|██▌       | 19/76 [00:24<00:54,  1.05it/s][A
Training:  26%|██▋       | 20/76 [00:24<00:40,  1.38i

Epoch: 1/88 - Loss: 21.1716 - Accuracy: 0.5792



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:04<00:40,  4.45s/it][A
 20%|██        | 2/10 [00:04<00:15,  1.94s/it][A
 40%|████      | 4/10 [00:04<00:04,  1.29it/s][A
 50%|█████     | 5/10 [00:08<00:08,  1.76s/it][A
 60%|██████    | 6/10 [00:08<00:05,  1.26s/it][A
 80%|████████  | 8/10 [00:08<00:01,  1.44it/s][A
100%|██████████| 10/10 [00:12<00:00,  1.22s/it][A
Epochs:   1%|          | 1/88 [01:39<2:24:26, 99.62s/it]

Val Loss: 19.1349 - Val Accuracy: 0.6486



Training:   0%|          | 0/76 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/76 [00:05<06:53,  5.52s/it][A
Training:   4%|▍         | 3/76 [00:05<01:47,  1.47s/it][A
Training:   7%|▋         | 5/76 [00:10<02:19,  1.97s/it][A
Training:   8%|▊         | 6/76 [00:10<01:42,  1.47s/it][A
Training:  11%|█         | 8/76 [00:10<00:58,  1.17it/s][A
Training:  13%|█▎        | 10/76 [00:15<01:32,  1.41s/it][A
Training:  16%|█▌        | 12/76 [00:15<01:00,  1.06it/s][A
Training:  17%|█▋        | 13/76 [00:20<01:45,  1.68s/it][A
Training:  18%|█▊        | 14/76 [00:20<01:23,  1.35s/it][A
Training:  21%|██        | 16/76 [00:20<00:51,  1.17it/s][A
Training:  22%|██▏       | 17/76 [00:24<01:32,  1.56s/it][A
Training:  25%|██▌       | 19/76 [00:24<00:56,  1.02it/s][A
Training:  26%|██▋       | 20/76 [00:24<00:44,  1.26it/s][A
Training:  28%|██▊       | 21/76 [00:29<01:32,  1.68s/it][A
Training:  29%|██▉       | 22/76 [00:29<01:09,  1.29s/it][A
Training:  32%|███▏      | 24/76 [00:

Epoch: 2/88 - Loss: 17.5646 - Accuracy: 0.6956



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:04<00:44,  4.90s/it][A
 20%|██        | 2/10 [00:05<00:16,  2.08s/it][A
 30%|███       | 3/10 [00:05<00:08,  1.21s/it][A
 50%|█████     | 5/10 [00:09<00:08,  1.61s/it][A
 80%|████████  | 8/10 [00:09<00:01,  1.32it/s][A
100%|██████████| 10/10 [00:12<00:00,  1.25s/it][A
Epochs:   2%|▏         | 2/88 [03:20<2:23:48, 100.33s/it]

Val Loss: 16.2561 - Val Accuracy: 0.7742



Training:   0%|          | 0/76 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/76 [00:05<06:38,  5.31s/it][A
Training:   3%|▎         | 2/76 [00:05<03:02,  2.46s/it][A
Training:   4%|▍         | 3/76 [00:05<01:41,  1.39s/it][A
Training:   7%|▋         | 5/76 [00:10<02:12,  1.87s/it][A
Training:   8%|▊         | 6/76 [00:10<01:42,  1.46s/it][A
Training:   9%|▉         | 7/76 [00:11<01:15,  1.09s/it][A
Training:  12%|█▏        | 9/76 [00:15<01:43,  1.54s/it][A
Training:  13%|█▎        | 10/76 [00:15<01:23,  1.26s/it][A
Training:  16%|█▌        | 12/76 [00:15<00:49,  1.29it/s][A
Training:  17%|█▋        | 13/76 [00:20<01:38,  1.57s/it][A
Training:  18%|█▊        | 14/76 [00:20<01:17,  1.25s/it][A
Training:  21%|██        | 16/76 [00:20<00:45,  1.32it/s][A
Training:  22%|██▏       | 17/76 [00:24<01:31,  1.55s/it][A
Training:  24%|██▎       | 18/76 [00:25<01:15,  1.30s/it][A
Training:  25%|██▌       | 19/76 [00:25<00:57,  1.00s/it][A
Training:  28%|██▊       | 21/76 [00:29

Epoch: 3/88 - Loss: 14.7211 - Accuracy: 0.8088



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:04<00:41,  4.65s/it][A
 20%|██        | 2/10 [00:04<00:16,  2.09s/it][A
 40%|████      | 4/10 [00:05<00:04,  1.23it/s][A
 50%|█████     | 5/10 [00:08<00:08,  1.68s/it][A
 60%|██████    | 6/10 [00:08<00:04,  1.24s/it][A
100%|██████████| 10/10 [00:12<00:00,  1.23s/it][A
Epochs:   3%|▎         | 3/88 [05:01<2:22:26, 100.55s/it]

Val Loss: 13.7749 - Val Accuracy: 0.8594



Training:   0%|          | 0/76 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/76 [00:05<06:38,  5.32s/it][A
Training:   4%|▍         | 3/76 [00:05<01:47,  1.47s/it][A
Training:   5%|▌         | 4/76 [00:05<01:12,  1.01s/it][A
Training:   7%|▋         | 5/76 [00:10<02:32,  2.14s/it][A
Training:   8%|▊         | 6/76 [00:10<01:45,  1.51s/it][A
Training:   9%|▉         | 7/76 [00:10<01:14,  1.09s/it][A
Training:  11%|█         | 8/76 [00:10<00:55,  1.23it/s][A
Training:  12%|█▏        | 9/76 [00:14<02:06,  1.89s/it][A
Training:  13%|█▎        | 10/76 [00:15<01:29,  1.35s/it][A
Training:  14%|█▍        | 11/76 [00:15<01:03,  1.03it/s][A
Training:  16%|█▌        | 12/76 [00:15<00:46,  1.37it/s][A
Training:  17%|█▋        | 13/76 [00:19<01:54,  1.82s/it][A
Training:  18%|█▊        | 14/76 [00:19<01:21,  1.31s/it][A
Training:  21%|██        | 16/76 [00:20<00:47,  1.27it/s][A
Training:  22%|██▏       | 17/76 [00:24<01:37,  1.65s/it][A
Training:  26%|██▋       | 20/76 [00:24<

Epoch: 4/88 - Loss: 12.3971 - Accuracy: 0.8736



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:04<00:44,  4.93s/it][A
 20%|██        | 2/10 [00:05<00:16,  2.09s/it][A
 30%|███       | 3/10 [00:05<00:08,  1.20s/it][A
 50%|█████     | 5/10 [00:08<00:07,  1.56s/it][A
 70%|███████   | 7/10 [00:08<00:02,  1.12it/s][A
100%|██████████| 10/10 [00:12<00:00,  1.25s/it][A
Epochs:   5%|▍         | 4/88 [06:41<2:20:22, 100.26s/it]

Val Loss: 11.3845 - Val Accuracy: 0.9018



Training:   0%|          | 0/76 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/76 [00:05<06:56,  5.56s/it][A
Training:   3%|▎         | 2/76 [00:05<02:56,  2.39s/it][A
Training:   5%|▌         | 4/76 [00:05<01:08,  1.06it/s][A
Training:   7%|▋         | 5/76 [00:10<02:27,  2.08s/it][A
Training:  11%|█         | 8/76 [00:10<01:02,  1.09it/s][A
Training:  13%|█▎        | 10/76 [00:15<01:33,  1.42s/it][A
Training:  14%|█▍        | 11/76 [00:15<01:16,  1.17s/it][A
Training:  16%|█▌        | 12/76 [00:15<01:00,  1.06it/s][A
Training:  17%|█▋        | 13/76 [00:19<01:50,  1.75s/it][A
Training:  20%|█▉        | 15/76 [00:20<01:04,  1.06s/it][A
Training:  21%|██        | 16/76 [00:20<00:51,  1.16it/s][A
Training:  22%|██▏       | 17/76 [00:24<01:40,  1.70s/it][A
Training:  24%|██▎       | 18/76 [00:24<01:15,  1.30s/it][A
Training:  25%|██▌       | 19/76 [00:24<00:56,  1.00it/s][A
Training:  26%|██▋       | 20/76 [00:24<00:42,  1.33it/s][A
Training:  28%|██▊       | 21/76 [00:

Epoch: 5/88 - Loss: 10.4805 - Accuracy: 0.9058



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:04<00:43,  4.79s/it][A
 20%|██        | 2/10 [00:04<00:16,  2.06s/it][A
 30%|███       | 3/10 [00:05<00:08,  1.18s/it][A
 50%|█████     | 5/10 [00:08<00:07,  1.49s/it][A
 60%|██████    | 6/10 [00:08<00:04,  1.14s/it][A
 70%|███████   | 7/10 [00:08<00:02,  1.19it/s][A
100%|██████████| 10/10 [00:12<00:00,  1.24s/it][A
Epochs:   6%|▌         | 5/88 [08:21<2:18:41, 100.26s/it]

Val Loss: 9.6671 - Val Accuracy: 0.9199



Training:   0%|          | 0/76 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/76 [00:05<06:55,  5.54s/it][A
Training:   3%|▎         | 2/76 [00:05<02:54,  2.36s/it][A
Training:   5%|▌         | 4/76 [00:05<01:06,  1.09it/s][A
Training:   7%|▋         | 5/76 [00:10<02:27,  2.08s/it][A
Training:   9%|▉         | 7/76 [00:10<01:18,  1.14s/it][A
Training:  12%|█▏        | 9/76 [00:15<01:48,  1.61s/it][A
Training:  13%|█▎        | 10/76 [00:15<01:25,  1.30s/it][A
Training:  16%|█▌        | 12/76 [00:15<00:52,  1.22it/s][A
Training:  17%|█▋        | 13/76 [00:19<01:40,  1.59s/it][A
Training:  18%|█▊        | 14/76 [00:20<01:17,  1.24s/it][A
Training:  20%|█▉        | 15/76 [00:20<00:58,  1.04it/s][A
Training:  21%|██        | 16/76 [00:20<00:45,  1.33it/s][A
Training:  22%|██▏       | 17/76 [00:24<01:39,  1.69s/it][A
Training:  25%|██▌       | 19/76 [00:24<00:57,  1.01s/it][A
Training:  26%|██▋       | 20/76 [00:25<00:45,  1.24it/s][A
Training:  28%|██▊       | 21/76 [00:2

Epoch: 6/88 - Loss: 9.1702 - Accuracy: 0.9218



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:04<00:43,  4.82s/it][A
 30%|███       | 3/10 [00:04<00:09,  1.29s/it][A
 50%|█████     | 5/10 [00:08<00:07,  1.58s/it][A
 80%|████████  | 8/10 [00:08<00:01,  1.29it/s][A
100%|██████████| 10/10 [00:12<00:00,  1.25s/it][A
Epochs:   7%|▋         | 6/88 [10:01<2:17:05, 100.31s/it]

Val Loss: 8.5569 - Val Accuracy: 0.9274



Training:   0%|          | 0/76 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/76 [00:05<06:52,  5.50s/it][A
Training:   4%|▍         | 3/76 [00:05<01:47,  1.48s/it][A
Training:   7%|▋         | 5/76 [00:10<02:16,  1.92s/it][A
Training:   8%|▊         | 6/76 [00:10<01:40,  1.44s/it][A
Training:   9%|▉         | 7/76 [00:10<01:14,  1.08s/it][A
Training:  11%|█         | 8/76 [00:10<00:54,  1.24it/s][A
Training:  12%|█▏        | 9/76 [00:15<02:03,  1.84s/it][A
Training:  13%|█▎        | 10/76 [00:15<01:29,  1.35s/it][A
Training:  16%|█▌        | 12/76 [00:15<00:49,  1.30it/s][A
Training:  17%|█▋        | 13/76 [00:19<01:43,  1.64s/it][A
Training:  20%|█▉        | 15/76 [00:19<01:00,  1.01it/s][A
Training:  21%|██        | 16/76 [00:20<00:48,  1.23it/s][A
Training:  22%|██▏       | 17/76 [00:24<01:39,  1.68s/it][A
Training:  25%|██▌       | 19/76 [00:24<00:59,  1.04s/it][A
Training:  28%|██▊       | 21/76 [00:28<01:19,  1.45s/it][A
Training:  29%|██▉       | 22/76 [00:29

Epoch: 7/88 - Loss: 8.1789 - Accuracy: 0.9296



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:04<00:43,  4.87s/it][A
 20%|██        | 2/10 [00:04<00:16,  2.08s/it][A
 40%|████      | 4/10 [00:05<00:04,  1.22it/s][A
 50%|█████     | 5/10 [00:08<00:08,  1.69s/it][A
 80%|████████  | 8/10 [00:08<00:01,  1.33it/s][A
100%|██████████| 10/10 [00:12<00:00,  1.27s/it][A
Epochs:   8%|▊         | 7/88 [11:41<2:15:02, 100.03s/it]

Val Loss: 7.7516 - Val Accuracy: 0.9342



Training:   0%|          | 0/76 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/76 [00:05<07:09,  5.73s/it][A
Training:   4%|▍         | 3/76 [00:05<01:52,  1.54s/it][A
Training:   7%|▋         | 5/76 [00:10<02:19,  1.96s/it][A
Training:   8%|▊         | 6/76 [00:10<01:43,  1.47s/it][A
Training:   9%|▉         | 7/76 [00:10<01:16,  1.10s/it][A
Training:  12%|█▏        | 9/76 [00:15<01:47,  1.60s/it][A
Training:  14%|█▍        | 11/76 [00:15<01:05,  1.00s/it][A
Training:  17%|█▋        | 13/76 [00:19<01:30,  1.43s/it][A
Training:  18%|█▊        | 14/76 [00:19<01:12,  1.17s/it][A
Training:  21%|██        | 16/76 [00:20<00:47,  1.27it/s][A
Training:  22%|██▏       | 17/76 [00:24<01:27,  1.48s/it][A
Training:  25%|██▌       | 19/76 [00:24<00:55,  1.03it/s][A
Training:  26%|██▋       | 20/76 [00:24<00:44,  1.26it/s][A
Training:  28%|██▊       | 21/76 [00:29<01:28,  1.60s/it][A
Training:  29%|██▉       | 22/76 [00:29<01:07,  1.24s/it][A
Training:  30%|███       | 23/76 [00:2

Epoch: 8/88 - Loss: 7.3470 - Accuracy: 0.9340



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:04<00:39,  4.43s/it][A
 30%|███       | 3/10 [00:04<00:08,  1.19s/it][A
 50%|█████     | 5/10 [00:08<00:07,  1.58s/it][A
 80%|████████  | 8/10 [00:08<00:01,  1.25it/s][A
100%|██████████| 10/10 [00:12<00:00,  1.22s/it][A
Epochs:   9%|▉         | 8/88 [13:20<2:13:06, 99.83s/it] 

Val Loss: 6.9307 - Val Accuracy: 0.9380



Training:   0%|          | 0/76 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/76 [00:05<06:44,  5.39s/it][A
Training:   3%|▎         | 2/76 [00:05<02:50,  2.30s/it][A
Training:   4%|▍         | 3/76 [00:05<01:35,  1.31s/it][A
Training:   7%|▋         | 5/76 [00:10<02:11,  1.85s/it][A
Training:   8%|▊         | 6/76 [00:10<01:37,  1.40s/it][A
Training:   9%|▉         | 7/76 [00:10<01:10,  1.03s/it][A
Training:  11%|█         | 8/76 [00:10<00:52,  1.30it/s][A
Training:  12%|█▏        | 9/76 [00:14<01:58,  1.77s/it][A
Training:  13%|█▎        | 10/76 [00:15<01:24,  1.28s/it][A
Training:  14%|█▍        | 11/76 [00:15<01:00,  1.07it/s][A
Training:  17%|█▋        | 13/76 [00:19<01:38,  1.56s/it][A
Training:  18%|█▊        | 14/76 [00:19<01:14,  1.21s/it][A
Training:  21%|██        | 16/76 [00:20<00:44,  1.35it/s][A
Training:  22%|██▏       | 17/76 [00:24<01:34,  1.60s/it][A
Training:  25%|██▌       | 19/76 [00:24<00:57,  1.01s/it][A
Training:  28%|██▊       | 21/76 [00:29<

Epoch: 9/88 - Loss: 6.7331 - Accuracy: 0.9396



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:04<00:41,  4.59s/it][A
 30%|███       | 3/10 [00:04<00:08,  1.24s/it][A
 50%|█████     | 5/10 [00:08<00:08,  1.67s/it][A
 80%|████████  | 8/10 [00:09<00:01,  1.22it/s][A
100%|██████████| 10/10 [00:12<00:00,  1.29s/it][A
Epochs:  10%|█         | 9/88 [15:01<2:11:57, 100.22s/it]

Val Loss: 6.6083 - Val Accuracy: 0.9412



Training:   0%|          | 0/76 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/76 [00:05<06:42,  5.37s/it][A
Training:   3%|▎         | 2/76 [00:05<02:48,  2.27s/it][A
Training:   4%|▍         | 3/76 [00:05<01:34,  1.29s/it][A
Training:   7%|▋         | 5/76 [00:10<02:13,  1.88s/it][A
Training:   8%|▊         | 6/76 [00:10<01:36,  1.38s/it][A
Training:   9%|▉         | 7/76 [00:10<01:12,  1.05s/it][A
Training:  12%|█▏        | 9/76 [00:14<01:41,  1.52s/it][A
Training:  13%|█▎        | 10/76 [00:15<01:21,  1.23s/it][A
Training:  14%|█▍        | 11/76 [00:15<01:01,  1.05it/s][A
Training:  16%|█▌        | 12/76 [00:15<00:47,  1.35it/s][A
Training:  17%|█▋        | 13/76 [00:19<01:41,  1.61s/it][A
Training:  18%|█▊        | 14/76 [00:19<01:16,  1.23s/it][A
Training:  20%|█▉        | 15/76 [00:20<01:01,  1.01s/it][A
Training:  22%|██▏       | 17/76 [00:24<01:26,  1.46s/it][A
Training:  24%|██▎       | 18/76 [00:24<01:09,  1.19s/it][A
Training:  25%|██▌       | 19/76 [00:24

Epoch: 10/88 - Loss: 6.3614 - Accuracy: 0.9414



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:04<00:36,  4.11s/it][A
 20%|██        | 2/10 [00:04<00:14,  1.78s/it][A
 30%|███       | 3/10 [00:04<00:07,  1.07s/it][A
 50%|█████     | 5/10 [00:08<00:08,  1.61s/it][A
 70%|███████   | 7/10 [00:08<00:02,  1.07it/s][A
100%|██████████| 10/10 [00:12<00:00,  1.24s/it][A
Epochs:  11%|█▏        | 10/88 [16:41<2:10:17, 100.23s/it]

Val Loss: 6.1780 - Val Accuracy: 0.9448



Training:   0%|          | 0/76 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/76 [00:05<06:55,  5.55s/it][A
Training:   3%|▎         | 2/76 [00:05<02:55,  2.38s/it][A
Training:   4%|▍         | 3/76 [00:05<01:38,  1.35s/it][A
Training:   5%|▌         | 4/76 [00:05<01:02,  1.16it/s][A
Training:   7%|▋         | 5/76 [00:10<02:36,  2.20s/it][A
Training:   8%|▊         | 6/76 [00:10<01:44,  1.50s/it][A
Training:  11%|█         | 8/76 [00:10<00:53,  1.27it/s][A
Training:  12%|█▏        | 9/76 [00:15<01:56,  1.73s/it][A
Training:  14%|█▍        | 11/76 [00:15<01:06,  1.03s/it][A
Training:  16%|█▌        | 12/76 [00:15<00:51,  1.23it/s][A
Training:  17%|█▋        | 13/76 [00:19<01:47,  1.71s/it][A
Training:  18%|█▊        | 14/76 [00:19<01:19,  1.29s/it][A
Training:  20%|█▉        | 15/76 [00:20<01:00,  1.00it/s][A
Training:  21%|██        | 16/76 [00:20<00:45,  1.31it/s][A
Training:  22%|██▏       | 17/76 [00:24<01:44,  1.76s/it][A
Training:  25%|██▌       | 19/76 [00:24<

Epoch: 11/88 - Loss: 5.8979 - Accuracy: 0.9443



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:04<00:39,  4.36s/it][A
 20%|██        | 2/10 [00:04<00:15,  1.89s/it][A
 30%|███       | 3/10 [00:04<00:07,  1.08s/it][A
 50%|█████     | 5/10 [00:08<00:08,  1.64s/it][A
 70%|███████   | 7/10 [00:08<00:02,  1.06it/s][A
100%|██████████| 10/10 [00:12<00:00,  1.26s/it][A
Epochs:  12%|█▎        | 11/88 [18:22<2:08:38, 100.24s/it]

Val Loss: 5.6967 - Val Accuracy: 0.9453



Training:   0%|          | 0/76 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/76 [00:05<06:57,  5.56s/it][A
Training:   4%|▍         | 3/76 [00:05<01:52,  1.54s/it][A
Training:   7%|▋         | 5/76 [00:10<02:14,  1.90s/it][A
Training:   9%|▉         | 7/76 [00:10<01:18,  1.13s/it][A
Training:  11%|█         | 8/76 [00:10<01:01,  1.11it/s][A
Training:  12%|█▏        | 9/76 [00:14<01:56,  1.74s/it][A
Training:  14%|█▍        | 11/76 [00:15<01:08,  1.05s/it][A
Training:  16%|█▌        | 12/76 [00:15<00:53,  1.19it/s][A
Training:  17%|█▋        | 13/76 [00:19<01:50,  1.76s/it][A
Training:  18%|█▊        | 14/76 [00:19<01:23,  1.34s/it][A
Training:  20%|█▉        | 15/76 [00:20<01:01,  1.01s/it][A
Training:  22%|██▏       | 17/76 [00:24<01:31,  1.56s/it][A
Training:  24%|██▎       | 18/76 [00:24<01:10,  1.22s/it][A
Training:  26%|██▋       | 20/76 [00:24<00:42,  1.33it/s][A
Training:  28%|██▊       | 21/76 [00:29<01:27,  1.59s/it][A
Training:  29%|██▉       | 22/76 [00:2

Epoch: 12/88 - Loss: 5.5722 - Accuracy: 0.9469



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:04<00:43,  4.81s/it][A
 20%|██        | 2/10 [00:04<00:16,  2.06s/it][A
 40%|████      | 4/10 [00:05<00:04,  1.24it/s][A
 50%|█████     | 5/10 [00:09<00:09,  1.82s/it][A
 70%|███████   | 7/10 [00:09<00:02,  1.01it/s][A
100%|██████████| 10/10 [00:13<00:00,  1.31s/it][A
Epochs:  14%|█▎        | 12/88 [20:02<2:07:07, 100.36s/it]

Val Loss: 5.2441 - Val Accuracy: 0.9469



Training:   0%|          | 0/76 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/76 [00:05<06:27,  5.17s/it][A
Training:   3%|▎         | 2/76 [00:05<02:44,  2.22s/it][A
Training:   4%|▍         | 3/76 [00:05<01:32,  1.27s/it][A
Training:   5%|▌         | 4/76 [00:05<01:01,  1.17it/s][A
Training:   7%|▋         | 5/76 [00:09<02:26,  2.06s/it][A
Training:   8%|▊         | 6/76 [00:10<01:46,  1.52s/it][A
Training:  11%|█         | 8/76 [00:10<00:55,  1.24it/s][A
Training:  12%|█▏        | 9/76 [00:14<01:50,  1.65s/it][A
Training:  13%|█▎        | 10/76 [00:15<01:30,  1.37s/it][A
Training:  16%|█▌        | 12/76 [00:15<00:51,  1.25it/s][A
Training:  17%|█▋        | 13/76 [00:19<01:37,  1.55s/it][A
Training:  18%|█▊        | 14/76 [00:19<01:19,  1.29s/it][A
Training:  20%|█▉        | 15/76 [00:19<00:59,  1.02it/s][A
Training:  21%|██        | 16/76 [00:20<00:44,  1.34it/s][A
Training:  22%|██▏       | 17/76 [00:23<01:36,  1.64s/it][A
Training:  24%|██▎       | 18/76 [00:24<

Epoch: 13/88 - Loss: 5.3039 - Accuracy: 0.9485



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:04<00:42,  4.75s/it][A
 30%|███       | 3/10 [00:04<00:09,  1.31s/it][A
 40%|████      | 4/10 [00:05<00:05,  1.12it/s][A
 50%|█████     | 5/10 [00:09<00:10,  2.01s/it][A
 70%|███████   | 7/10 [00:09<00:03,  1.06s/it][A
100%|██████████| 10/10 [00:13<00:00,  1.33s/it][A
Epochs:  15%|█▍        | 13/88 [21:43<2:05:43, 100.58s/it]

Val Loss: 5.2103 - Val Accuracy: 0.9485



Training:   0%|          | 0/76 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/76 [00:05<06:45,  5.40s/it][A
Training:   4%|▍         | 3/76 [00:05<01:46,  1.45s/it][A
Training:   5%|▌         | 4/76 [00:05<01:11,  1.01it/s][A
Training:   7%|▋         | 5/76 [00:10<02:43,  2.30s/it][A
Training:   9%|▉         | 7/76 [00:10<01:23,  1.21s/it][A
Training:  12%|█▏        | 9/76 [00:15<01:47,  1.61s/it][A
Training:  13%|█▎        | 10/76 [00:15<01:23,  1.27s/it][A
Training:  16%|█▌        | 12/76 [00:15<00:51,  1.24it/s][A
Training:  17%|█▋        | 13/76 [00:19<01:40,  1.59s/it][A
Training:  18%|█▊        | 14/76 [00:19<01:16,  1.24s/it][A
Training:  20%|█▉        | 15/76 [00:20<00:58,  1.05it/s][A
Training:  21%|██        | 16/76 [00:20<00:44,  1.34it/s][A
Training:  22%|██▏       | 17/76 [00:24<01:40,  1.70s/it][A
Training:  25%|██▌       | 19/76 [00:24<00:55,  1.02it/s][A
Training:  28%|██▊       | 21/76 [00:28<01:19,  1.45s/it][A
Training:  29%|██▉       | 22/76 [00:2

Epoch: 14/88 - Loss: 4.9831 - Accuracy: 0.9503



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:04<00:42,  4.75s/it][A
 30%|███       | 3/10 [00:04<00:08,  1.27s/it][A
 50%|█████     | 5/10 [00:09<00:08,  1.74s/it][A
 80%|████████  | 8/10 [00:09<00:01,  1.18it/s][A
100%|██████████| 10/10 [00:13<00:00,  1.30s/it][A
Epochs:  16%|█▌        | 14/88 [23:23<2:03:51, 100.42s/it]

Val Loss: 5.0766 - Val Accuracy: 0.9526



Training:   0%|          | 0/76 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/76 [00:05<06:58,  5.57s/it][A
Training:   3%|▎         | 2/76 [00:05<02:54,  2.36s/it][A
Training:   4%|▍         | 3/76 [00:05<01:37,  1.34s/it][A
Training:   5%|▌         | 4/76 [00:05<01:03,  1.13it/s][A
Training:   7%|▋         | 5/76 [00:10<02:34,  2.18s/it][A
Training:   8%|▊         | 6/76 [00:10<01:43,  1.48s/it][A
Training:  11%|█         | 8/76 [00:10<00:54,  1.25it/s][A
Training:  12%|█▏        | 9/76 [00:14<01:52,  1.68s/it][A
Training:  14%|█▍        | 11/76 [00:15<01:08,  1.05s/it][A
Training:  16%|█▌        | 12/76 [00:15<00:53,  1.20it/s][A
Training:  17%|█▋        | 13/76 [00:19<01:42,  1.63s/it][A
Training:  18%|█▊        | 14/76 [00:19<01:16,  1.23s/it][A
Training:  20%|█▉        | 15/76 [00:20<01:03,  1.04s/it][A
Training:  22%|██▏       | 17/76 [00:24<01:28,  1.51s/it][A
Training:  25%|██▌       | 19/76 [00:24<00:55,  1.03it/s][A
Training:  26%|██▋       | 20/76 [00:24<

Epoch: 15/88 - Loss: 4.8279 - Accuracy: 0.9518



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:04<00:41,  4.64s/it][A
 20%|██        | 2/10 [00:04<00:16,  2.03s/it][A
 40%|████      | 4/10 [00:04<00:04,  1.25it/s][A
 50%|█████     | 5/10 [00:09<00:09,  1.81s/it][A
 60%|██████    | 6/10 [00:09<00:05,  1.31s/it][A
 70%|███████   | 7/10 [00:09<00:02,  1.05it/s][A
100%|██████████| 10/10 [00:12<00:00,  1.30s/it][A
Epochs:  17%|█▋        | 15/88 [25:03<2:01:59, 100.27s/it]

Val Loss: 4.7611 - Val Accuracy: 0.9521



Training:   0%|          | 0/76 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/76 [00:05<06:53,  5.51s/it][A
Training:   4%|▍         | 3/76 [00:05<01:47,  1.47s/it][A
Training:   5%|▌         | 4/76 [00:05<01:12,  1.01s/it][A
Training:   7%|▋         | 5/76 [00:10<02:34,  2.17s/it][A
Training:   8%|▊         | 6/76 [00:10<01:48,  1.55s/it][A
Training:  11%|█         | 8/76 [00:10<00:58,  1.16it/s][A
Training:  12%|█▏        | 9/76 [00:14<01:54,  1.71s/it][A
Training:  13%|█▎        | 10/76 [00:15<01:30,  1.37s/it][A
Training:  14%|█▍        | 11/76 [00:15<01:07,  1.04s/it][A
Training:  16%|█▌        | 12/76 [00:15<00:49,  1.28it/s][A
Training:  17%|█▋        | 13/76 [00:19<01:45,  1.67s/it][A
Training:  18%|█▊        | 14/76 [00:19<01:21,  1.32s/it][A
Training:  21%|██        | 16/76 [00:20<00:45,  1.31it/s][A
Training:  22%|██▏       | 17/76 [00:23<01:27,  1.49s/it][A
Training:  24%|██▎       | 18/76 [00:24<01:18,  1.35s/it][A
Training:  25%|██▌       | 19/76 [00:25

Epoch: 16/88 - Loss: 4.6806 - Accuracy: 0.9527



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:04<00:40,  4.54s/it][A
 30%|███       | 3/10 [00:04<00:08,  1.22s/it][A
 50%|█████     | 5/10 [00:08<00:08,  1.69s/it][A
 70%|███████   | 7/10 [00:09<00:03,  1.00s/it][A
 80%|████████  | 8/10 [00:09<00:01,  1.22it/s][A
100%|██████████| 10/10 [00:12<00:00,  1.29s/it][A
Epochs:  18%|█▊        | 16/88 [26:43<2:00:07, 100.11s/it]

Val Loss: 4.4363 - Val Accuracy: 0.9526



Training:   0%|          | 0/76 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/76 [00:05<06:33,  5.25s/it][A
Training:   3%|▎         | 2/76 [00:05<02:53,  2.35s/it][A
Training:   4%|▍         | 3/76 [00:05<01:37,  1.33s/it][A
Training:   7%|▋         | 5/76 [00:10<02:07,  1.80s/it][A
Training:   8%|▊         | 6/76 [00:10<01:37,  1.39s/it][A
Training:  11%|█         | 8/76 [00:10<00:56,  1.21it/s][A
Training:  12%|█▏        | 9/76 [00:14<01:46,  1.59s/it][A
Training:  13%|█▎        | 10/76 [00:15<01:27,  1.32s/it][A
Training:  16%|█▌        | 12/76 [00:15<00:51,  1.25it/s][A
Training:  17%|█▋        | 13/76 [00:19<01:33,  1.49s/it][A
Training:  18%|█▊        | 14/76 [00:19<01:18,  1.26s/it][A
Training:  21%|██        | 16/76 [00:20<00:49,  1.22it/s][A
Training:  22%|██▏       | 17/76 [00:23<01:26,  1.47s/it][A
Training:  24%|██▎       | 18/76 [00:24<01:13,  1.27s/it][A
Training:  25%|██▌       | 19/76 [00:24<00:55,  1.03it/s][A
Training:  26%|██▋       | 20/76 [00:24

Epoch: 17/88 - Loss: 4.5045 - Accuracy: 0.9523



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:04<00:38,  4.29s/it][A
 20%|██        | 2/10 [00:04<00:14,  1.83s/it][A
 30%|███       | 3/10 [00:04<00:07,  1.13s/it][A
 40%|████      | 4/10 [00:04<00:04,  1.33it/s][A
 50%|█████     | 5/10 [00:08<00:09,  1.82s/it][A
 60%|██████    | 6/10 [00:08<00:05,  1.27s/it][A
 70%|███████   | 7/10 [00:09<00:02,  1.06it/s][A
100%|██████████| 10/10 [00:12<00:00,  1.25s/it][A
Epochs:  19%|█▉        | 17/88 [28:23<1:58:20, 100.01s/it]

Val Loss: 4.3100 - Val Accuracy: 0.9532



Training:   0%|          | 0/76 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/76 [00:05<06:57,  5.57s/it][A
Training:   3%|▎         | 2/76 [00:05<02:57,  2.39s/it][A
Training:   4%|▍         | 3/76 [00:05<01:40,  1.37s/it][A
Training:   5%|▌         | 4/76 [00:06<01:03,  1.14it/s][A
Training:   7%|▋         | 5/76 [00:10<02:38,  2.23s/it][A
Training:   8%|▊         | 6/76 [00:10<01:45,  1.51s/it][A
Training:  11%|█         | 8/76 [00:10<00:54,  1.25it/s][A
Training:  12%|█▏        | 9/76 [00:15<02:01,  1.81s/it][A
Training:  13%|█▎        | 10/76 [00:15<01:29,  1.35s/it][A
Training:  14%|█▍        | 11/76 [00:15<01:06,  1.02s/it][A
Training:  16%|█▌        | 12/76 [00:16<00:49,  1.29it/s][A
Training:  17%|█▋        | 13/76 [00:20<01:52,  1.78s/it][A
Training:  18%|█▊        | 14/76 [00:20<01:20,  1.30s/it][A
Training:  22%|██▏       | 17/76 [00:24<01:22,  1.41s/it][A
Training:  26%|██▋       | 20/76 [00:25<00:45,  1.24it/s][A
Training:  28%|██▊       | 21/76 [00:29<

Epoch: 18/88 - Loss: 4.2504 - Accuracy: 0.9544



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:04<00:38,  4.28s/it][A
 20%|██        | 2/10 [00:04<00:14,  1.82s/it][A
 30%|███       | 3/10 [00:04<00:08,  1.17s/it][A
 40%|████      | 4/10 [00:04<00:04,  1.32it/s][A
 50%|█████     | 5/10 [00:08<00:09,  1.87s/it][A
 60%|██████    | 6/10 [00:08<00:05,  1.29s/it][A
 70%|███████   | 7/10 [00:09<00:02,  1.10it/s][A
100%|██████████| 10/10 [00:12<00:00,  1.26s/it][A
Epochs:  20%|██        | 18/88 [30:03<1:56:48, 100.12s/it]

Val Loss: 4.2113 - Val Accuracy: 0.9542



Training:   0%|          | 0/76 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/76 [00:05<06:58,  5.59s/it][A
Training:   3%|▎         | 2/76 [00:05<02:55,  2.37s/it][A
Training:   4%|▍         | 3/76 [00:05<01:38,  1.35s/it][A
Training:   7%|▋         | 5/76 [00:10<02:14,  1.90s/it][A
Training:   8%|▊         | 6/76 [00:10<01:40,  1.43s/it][A
Training:   9%|▉         | 7/76 [00:10<01:12,  1.05s/it][A
Training:  11%|█         | 8/76 [00:10<00:52,  1.30it/s][A
Training:  12%|█▏        | 9/76 [00:14<01:54,  1.71s/it][A
Training:  13%|█▎        | 10/76 [00:15<01:29,  1.35s/it][A
Training:  14%|█▍        | 11/76 [00:15<01:04,  1.01it/s][A
Training:  16%|█▌        | 12/76 [00:15<00:46,  1.36it/s][A
Training:  17%|█▋        | 13/76 [00:19<01:50,  1.75s/it][A
Training:  18%|█▊        | 14/76 [00:20<01:21,  1.32s/it][A
Training:  21%|██        | 16/76 [00:20<00:45,  1.33it/s][A
Training:  22%|██▏       | 17/76 [00:23<01:26,  1.47s/it][A
Training:  24%|██▎       | 18/76 [00:24<

Epoch: 19/88 - Loss: 4.1180 - Accuracy: 0.9551



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:04<00:40,  4.54s/it][A
 20%|██        | 2/10 [00:04<00:15,  1.94s/it][A
 30%|███       | 3/10 [00:04<00:07,  1.10s/it][A
 40%|████      | 4/10 [00:04<00:04,  1.39it/s][A
 50%|█████     | 5/10 [00:08<00:09,  1.89s/it][A
 80%|████████  | 8/10 [00:08<00:01,  1.30it/s][A
100%|██████████| 10/10 [00:12<00:00,  1.28s/it][A
Epochs:  22%|██▏       | 19/88 [31:44<1:55:10, 100.16s/it]

Val Loss: 3.9736 - Val Accuracy: 0.9559



Training:   0%|          | 0/76 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/76 [00:05<06:50,  5.47s/it][A
Training:   3%|▎         | 2/76 [00:05<02:55,  2.37s/it][A
Training:   5%|▌         | 4/76 [00:05<01:06,  1.09it/s][A
Training:   7%|▋         | 5/76 [00:10<02:25,  2.04s/it][A
Training:   8%|▊         | 6/76 [00:10<01:47,  1.53s/it][A
Training:  12%|█▏        | 9/76 [00:15<01:40,  1.51s/it][A
Training:  13%|█▎        | 10/76 [00:15<01:21,  1.23s/it][A
Training:  16%|█▌        | 12/76 [00:15<00:50,  1.26it/s][A
Training:  17%|█▋        | 13/76 [00:19<01:34,  1.50s/it][A
Training:  18%|█▊        | 14/76 [00:20<01:16,  1.24s/it][A
Training:  20%|█▉        | 15/76 [00:20<00:59,  1.03it/s][A
Training:  22%|██▏       | 17/76 [00:23<01:17,  1.31s/it][A
Training:  24%|██▎       | 18/76 [00:24<01:03,  1.10s/it][A
Training:  26%|██▋       | 20/76 [00:24<00:39,  1.41it/s][A
Training:  28%|██▊       | 21/76 [00:28<01:16,  1.39s/it][A
Training:  29%|██▉       | 22/76 [00:2

Epoch: 20/88 - Loss: 3.9855 - Accuracy: 0.9574



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:04<00:38,  4.22s/it][A
 20%|██        | 2/10 [00:04<00:14,  1.82s/it][A
 30%|███       | 3/10 [00:04<00:07,  1.04s/it][A
 40%|████      | 4/10 [00:04<00:04,  1.45it/s][A
 50%|█████     | 5/10 [00:08<00:09,  1.91s/it][A
 60%|██████    | 6/10 [00:08<00:05,  1.30s/it][A
 80%|████████  | 8/10 [00:08<00:01,  1.44it/s][A
100%|██████████| 10/10 [00:12<00:00,  1.25s/it][A
Epochs:  23%|██▎       | 20/88 [33:23<1:53:24, 100.07s/it]

Val Loss: 3.9565 - Val Accuracy: 0.9564



Training:   0%|          | 0/76 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/76 [00:05<07:00,  5.61s/it][A
Training:   4%|▍         | 3/76 [00:05<01:50,  1.51s/it][A
Training:   5%|▌         | 4/76 [00:05<01:15,  1.05s/it][A
Training:   7%|▋         | 5/76 [00:10<02:34,  2.18s/it][A
Training:   9%|▉         | 7/76 [00:10<01:20,  1.16s/it][A
Training:  11%|█         | 8/76 [00:10<01:02,  1.08it/s][A
Training:  12%|█▏        | 9/76 [00:15<02:03,  1.84s/it][A
Training:  13%|█▎        | 10/76 [00:15<01:30,  1.37s/it][A
Training:  14%|█▍        | 11/76 [00:15<01:06,  1.02s/it][A
Training:  16%|█▌        | 12/76 [00:15<00:49,  1.29it/s][A
Training:  17%|█▋        | 13/76 [00:19<01:47,  1.71s/it][A
Training:  18%|█▊        | 14/76 [00:19<01:17,  1.25s/it][A
Training:  20%|█▉        | 15/76 [00:19<00:56,  1.09it/s][A
Training:  22%|██▏       | 17/76 [00:24<01:25,  1.45s/it][A
Training:  26%|██▋       | 20/76 [00:24<00:46,  1.20it/s][A
Training:  28%|██▊       | 21/76 [00:28

Epoch: 21/88 - Loss: 3.8730 - Accuracy: 0.9573



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:04<00:38,  4.30s/it][A
 20%|██        | 2/10 [00:04<00:14,  1.85s/it][A
 40%|████      | 4/10 [00:04<00:04,  1.35it/s][A
 50%|█████     | 5/10 [00:08<00:08,  1.68s/it][A
 60%|██████    | 6/10 [00:08<00:05,  1.25s/it][A
100%|██████████| 10/10 [00:12<00:00,  1.24s/it][A
Epochs:  24%|██▍       | 21/88 [35:03<1:51:40, 100.00s/it]

Val Loss: 3.9757 - Val Accuracy: 0.9569



Training:   0%|          | 0/76 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/76 [00:05<06:45,  5.41s/it][A
Training:   3%|▎         | 2/76 [00:05<03:01,  2.45s/it][A
Training:   5%|▌         | 4/76 [00:05<01:08,  1.05it/s][A
Training:   7%|▋         | 5/76 [00:10<02:27,  2.08s/it][A
Training:   8%|▊         | 6/76 [00:10<01:48,  1.55s/it][A
Training:  11%|█         | 8/76 [00:11<00:58,  1.16it/s][A
Training:  12%|█▏        | 9/76 [00:15<01:50,  1.65s/it][A
Training:  13%|█▎        | 10/76 [00:15<01:30,  1.37s/it][A
Training:  14%|█▍        | 11/76 [00:15<01:06,  1.03s/it][A
Training:  17%|█▋        | 13/76 [00:19<01:30,  1.43s/it][A
Training:  18%|█▊        | 14/76 [00:19<01:12,  1.18s/it][A
Training:  21%|██        | 16/76 [00:20<00:43,  1.39it/s][A
Training:  22%|██▏       | 17/76 [00:23<01:23,  1.42s/it][A
Training:  24%|██▎       | 18/76 [00:24<01:05,  1.12s/it][A
Training:  25%|██▌       | 19/76 [00:24<00:49,  1.16it/s][A
Training:  26%|██▋       | 20/76 [00:24

Epoch: 22/88 - Loss: 3.7679 - Accuracy: 0.9585



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:04<00:38,  4.29s/it][A
 20%|██        | 2/10 [00:04<00:14,  1.85s/it][A
 30%|███       | 3/10 [00:04<00:07,  1.07s/it][A
 50%|█████     | 5/10 [00:08<00:08,  1.61s/it][A
 60%|██████    | 6/10 [00:08<00:04,  1.18s/it][A
 70%|███████   | 7/10 [00:08<00:02,  1.14it/s][A
100%|██████████| 10/10 [00:12<00:00,  1.26s/it][A
Epochs:  25%|██▌       | 22/88 [36:44<1:50:20, 100.30s/it]

Val Loss: 3.7935 - Val Accuracy: 0.9569



Training:   0%|          | 0/76 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/76 [00:05<06:51,  5.48s/it][A
Training:   4%|▍         | 3/76 [00:05<01:49,  1.50s/it][A
Training:   5%|▌         | 4/76 [00:05<01:14,  1.04s/it][A
Training:   7%|▋         | 5/76 [00:10<02:38,  2.23s/it][A
Training:   8%|▊         | 6/76 [00:10<01:48,  1.55s/it][A
Training:   9%|▉         | 7/76 [00:10<01:16,  1.10s/it][A
Training:  11%|█         | 8/76 [00:10<00:54,  1.25it/s][A
Training:  12%|█▏        | 9/76 [00:15<02:05,  1.88s/it][A
Training:  13%|█▎        | 10/76 [00:15<01:28,  1.34s/it][A
Training:  16%|█▌        | 12/76 [00:15<00:47,  1.34it/s][A
Training:  17%|█▋        | 13/76 [00:19<01:47,  1.70s/it][A
Training:  18%|█▊        | 14/76 [00:20<01:19,  1.28s/it][A
Training:  20%|█▉        | 15/76 [00:20<00:58,  1.04it/s][A
Training:  21%|██        | 16/76 [00:20<00:43,  1.37it/s][A
Training:  22%|██▏       | 17/76 [00:23<01:26,  1.46s/it][A
Training:  25%|██▌       | 19/76 [00:23<

Epoch: 23/88 - Loss: 3.6565 - Accuracy: 0.9585



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:04<00:41,  4.60s/it][A
 30%|███       | 3/10 [00:04<00:08,  1.25s/it][A
 50%|█████     | 5/10 [00:08<00:08,  1.69s/it][A
 60%|██████    | 6/10 [00:09<00:05,  1.27s/it][A
 80%|████████  | 8/10 [00:09<00:01,  1.34it/s][A
100%|██████████| 10/10 [00:12<00:00,  1.29s/it][A
Epochs:  26%|██▌       | 23/88 [38:26<1:49:00, 100.62s/it]

Val Loss: 3.9238 - Val Accuracy: 0.9580



Training:   0%|          | 0/76 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/76 [00:05<06:54,  5.52s/it][A
Training:   3%|▎         | 2/76 [00:05<02:53,  2.34s/it][A
Training:   5%|▌         | 4/76 [00:05<01:06,  1.09it/s][A
Training:   7%|▋         | 5/76 [00:10<02:21,  1.99s/it][A
Training:   9%|▉         | 7/76 [00:10<01:14,  1.08s/it][A
Training:  12%|█▏        | 9/76 [00:14<01:45,  1.58s/it][A
Training:  14%|█▍        | 11/76 [00:15<01:06,  1.02s/it][A
Training:  17%|█▋        | 13/76 [00:19<01:28,  1.40s/it][A
Training:  20%|█▉        | 15/76 [00:19<00:58,  1.04it/s][A
Training:  22%|██▏       | 17/76 [00:23<01:14,  1.26s/it][A
Training:  24%|██▎       | 18/76 [00:23<01:00,  1.05s/it][A
Training:  25%|██▌       | 19/76 [00:23<00:48,  1.17it/s][A
Training:  26%|██▋       | 20/76 [00:23<00:38,  1.46it/s][A
Training:  28%|██▊       | 21/76 [00:27<01:26,  1.57s/it][A
Training:  29%|██▉       | 22/76 [00:27<01:04,  1.20s/it][A
Training:  30%|███       | 23/76 [00:2

Epoch: 24/88 - Loss: 3.5718 - Accuracy: 0.9590



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:04<00:38,  4.32s/it][A
 20%|██        | 2/10 [00:04<00:14,  1.87s/it][A
 30%|███       | 3/10 [00:04<00:07,  1.14s/it][A
 40%|████      | 4/10 [00:04<00:04,  1.33it/s][A
 50%|█████     | 5/10 [00:08<00:08,  1.80s/it][A
 60%|██████    | 6/10 [00:08<00:05,  1.29s/it][A
 70%|███████   | 7/10 [00:09<00:02,  1.05it/s][A
100%|██████████| 10/10 [00:12<00:00,  1.26s/it][A
Epochs:  27%|██▋       | 24/88 [40:06<1:47:15, 100.55s/it]

Val Loss: 3.4444 - Val Accuracy: 0.9585



Training:   0%|          | 0/76 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/76 [00:05<07:08,  5.72s/it][A
Training:   3%|▎         | 2/76 [00:05<02:58,  2.42s/it][A
Training:   5%|▌         | 4/76 [00:05<01:07,  1.07it/s][A
Training:   8%|▊         | 6/76 [00:10<01:49,  1.57s/it][A
Training:  11%|█         | 8/76 [00:10<01:05,  1.04it/s][A
Training:  13%|█▎        | 10/76 [00:15<01:39,  1.50s/it][A
Training:  16%|█▌        | 12/76 [00:15<01:05,  1.02s/it][A
Training:  17%|█▋        | 13/76 [00:19<01:34,  1.50s/it][A
Training:  18%|█▊        | 14/76 [00:19<01:14,  1.20s/it][A
Training:  21%|██        | 16/76 [00:19<00:47,  1.26it/s][A
Training:  22%|██▏       | 17/76 [00:23<01:31,  1.54s/it][A
Training:  24%|██▎       | 18/76 [00:23<01:10,  1.21s/it][A
Training:  25%|██▌       | 19/76 [00:24<00:52,  1.08it/s][A
Training:  28%|██▊       | 21/76 [00:28<01:22,  1.50s/it][A
Training:  30%|███       | 23/76 [00:28<00:50,  1.04it/s][A
Training:  33%|███▎      | 25/76 [00:

Epoch: 25/88 - Loss: 3.4878 - Accuracy: 0.9595



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:04<00:40,  4.46s/it][A
 20%|██        | 2/10 [00:04<00:15,  1.98s/it][A
 30%|███       | 3/10 [00:04<00:07,  1.14s/it][A
 40%|████      | 4/10 [00:04<00:04,  1.37it/s][A
 50%|█████     | 5/10 [00:08<00:09,  1.92s/it][A
 70%|███████   | 7/10 [00:09<00:02,  1.01it/s][A
100%|██████████| 10/10 [00:12<00:00,  1.29s/it][A
Epochs:  28%|██▊       | 25/88 [41:48<1:45:57, 100.92s/it]

Val Loss: 3.5833 - Val Accuracy: 0.9585



Training:   0%|          | 0/76 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/76 [00:04<06:01,  4.83s/it][A
Training:   3%|▎         | 2/76 [00:05<02:43,  2.21s/it][A
Training:   4%|▍         | 3/76 [00:05<01:31,  1.25s/it][A
Training:   5%|▌         | 4/76 [00:05<00:58,  1.24it/s][A
Training:   7%|▋         | 5/76 [00:09<02:20,  1.99s/it][A
Training:   8%|▊         | 6/76 [00:10<01:47,  1.54s/it][A
Training:   9%|▉         | 7/76 [00:10<01:13,  1.07s/it][A
Training:  12%|█▏        | 9/76 [00:13<01:36,  1.44s/it][A
Training:  13%|█▎        | 10/76 [00:14<01:20,  1.22s/it][A
Training:  16%|█▌        | 12/76 [00:14<00:46,  1.37it/s][A
Training:  17%|█▋        | 13/76 [00:17<01:21,  1.30s/it][A
Training:  18%|█▊        | 14/76 [00:18<01:12,  1.17s/it][A
Training:  20%|█▉        | 15/76 [00:18<00:57,  1.06it/s][A
Training:  22%|██▏       | 17/76 [00:22<01:16,  1.30s/it][A
Training:  24%|██▎       | 18/76 [00:23<01:08,  1.18s/it][A
Training:  25%|██▌       | 19/76 [00:23<

Epoch: 26/88 - Loss: 3.4417 - Accuracy: 0.9597



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:04<00:42,  4.77s/it][A
 30%|███       | 3/10 [00:04<00:09,  1.29s/it][A
 50%|█████     | 5/10 [00:09<00:08,  1.71s/it][A
 70%|███████   | 7/10 [00:09<00:03,  1.01s/it][A
100%|██████████| 10/10 [00:13<00:00,  1.30s/it][A
Epochs:  30%|██▉       | 26/88 [43:29<1:44:26, 101.08s/it]

Val Loss: 3.5064 - Val Accuracy: 0.9602



Training:   0%|          | 0/76 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/76 [00:05<06:28,  5.19s/it][A
Training:   4%|▍         | 3/76 [00:05<01:41,  1.39s/it][A
Training:   5%|▌         | 4/76 [00:05<01:08,  1.05it/s][A
Training:   7%|▋         | 5/76 [00:09<02:30,  2.13s/it][A
Training:   9%|▉         | 7/76 [00:10<01:17,  1.13s/it][A
Training:  12%|█▏        | 9/76 [00:13<01:30,  1.35s/it][A
Training:  14%|█▍        | 11/76 [00:13<00:56,  1.14it/s][A
Training:  17%|█▋        | 13/76 [00:18<01:24,  1.34s/it][A
Training:  20%|█▉        | 15/76 [00:18<00:57,  1.06it/s][A
Training:  22%|██▏       | 17/76 [00:22<01:18,  1.33s/it][A
Training:  24%|██▎       | 18/76 [00:22<01:04,  1.11s/it][A
Training:  25%|██▌       | 19/76 [00:22<00:51,  1.11it/s][A
Training:  26%|██▋       | 20/76 [00:22<00:40,  1.39it/s][A
Training:  28%|██▊       | 21/76 [00:27<01:26,  1.58s/it][A
Training:  29%|██▉       | 22/76 [00:27<01:04,  1.19s/it][A
Training:  32%|███▏      | 24/76 [00:2

Epoch: 27/88 - Loss: 3.3422 - Accuracy: 0.9605



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:04<00:43,  4.83s/it][A
 30%|███       | 3/10 [00:05<00:09,  1.34s/it][A
 40%|████      | 4/10 [00:05<00:05,  1.08it/s][A
 50%|█████     | 5/10 [00:09<00:09,  1.96s/it][A
 60%|██████    | 6/10 [00:09<00:05,  1.37s/it][A
 80%|████████  | 8/10 [00:09<00:01,  1.26it/s][A
100%|██████████| 10/10 [00:12<00:00,  1.30s/it][A
Epochs:  31%|███       | 27/88 [45:10<1:42:32, 100.85s/it]

Val Loss: 3.3851 - Val Accuracy: 0.9602



Training:   0%|          | 0/76 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/76 [00:05<06:33,  5.25s/it][A
Training:   3%|▎         | 2/76 [00:05<02:47,  2.26s/it][A
Training:   4%|▍         | 3/76 [00:05<01:33,  1.28s/it][A
Training:   7%|▋         | 5/76 [00:09<02:07,  1.80s/it][A
Training:   9%|▉         | 7/76 [00:10<01:11,  1.04s/it][A
Training:  12%|█▏        | 9/76 [00:14<01:36,  1.45s/it][A
Training:  13%|█▎        | 10/76 [00:14<01:16,  1.16s/it][A
Training:  14%|█▍        | 11/76 [00:14<00:59,  1.09it/s][A
Training:  17%|█▋        | 13/76 [00:18<01:29,  1.41s/it][A
Training:  20%|█▉        | 15/76 [00:19<00:56,  1.07it/s][A
Training:  21%|██        | 16/76 [00:19<00:48,  1.23it/s][A
Training:  22%|██▏       | 17/76 [00:23<01:29,  1.52s/it][A
Training:  25%|██▌       | 19/76 [00:23<00:53,  1.06it/s][A
Training:  26%|██▋       | 20/76 [00:23<00:45,  1.24it/s][A
Training:  28%|██▊       | 21/76 [00:27<01:28,  1.61s/it][A
Training:  29%|██▉       | 22/76 [00:2

Epoch: 28/88 - Loss: 3.2614 - Accuracy: 0.9610



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:04<00:44,  4.90s/it][A
 40%|████      | 4/10 [00:05<00:05,  1.04it/s][A
 60%|██████    | 6/10 [00:09<00:05,  1.49s/it][A
100%|██████████| 10/10 [00:13<00:00,  1.32s/it][A
Epochs:  32%|███▏      | 28/88 [46:50<1:40:49, 100.83s/it]

Val Loss: 3.2693 - Val Accuracy: 0.9607



Training:   0%|          | 0/76 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/76 [00:05<06:35,  5.27s/it][A
Training:   3%|▎         | 2/76 [00:05<02:50,  2.31s/it][A
Training:   4%|▍         | 3/76 [00:05<01:37,  1.34s/it][A
Training:   7%|▋         | 5/76 [00:09<01:56,  1.64s/it][A
Training:   8%|▊         | 6/76 [00:09<01:25,  1.22s/it][A
Training:   9%|▉         | 7/76 [00:09<01:03,  1.08it/s][A
Training:  12%|█▏        | 9/76 [00:14<01:38,  1.48s/it][A
Training:  13%|█▎        | 10/76 [00:14<01:18,  1.19s/it][A
Training:  14%|█▍        | 11/76 [00:14<00:59,  1.09it/s][A
Training:  17%|█▋        | 13/76 [00:18<01:28,  1.41s/it][A
Training:  18%|█▊        | 14/76 [00:18<01:10,  1.14s/it][A
Training:  20%|█▉        | 15/76 [00:19<00:55,  1.11it/s][A
Training:  22%|██▏       | 17/76 [00:23<01:19,  1.35s/it][A
Training:  24%|██▎       | 18/76 [00:23<01:04,  1.11s/it][A
Training:  25%|██▌       | 19/76 [00:23<00:53,  1.06it/s][A
Training:  26%|██▋       | 20/76 [00:23

Epoch: 29/88 - Loss: 3.2403 - Accuracy: 0.9602



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:04<00:43,  4.81s/it][A
 20%|██        | 2/10 [00:05<00:17,  2.15s/it][A
 50%|█████     | 5/10 [00:08<00:07,  1.49s/it][A
 60%|██████    | 6/10 [00:09<00:04,  1.24s/it][A
 80%|████████  | 8/10 [00:09<00:01,  1.33it/s][A
100%|██████████| 10/10 [00:12<00:00,  1.27s/it][A
Epochs:  33%|███▎      | 29/88 [48:31<1:39:06, 100.79s/it]

Val Loss: 3.3091 - Val Accuracy: 0.9602



Training:   0%|          | 0/76 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/76 [00:04<06:05,  4.87s/it][A
Training:   3%|▎         | 2/76 [00:05<02:37,  2.13s/it][A
Training:   5%|▌         | 4/76 [00:05<01:00,  1.18it/s][A
Training:   7%|▋         | 5/76 [00:09<02:16,  1.92s/it][A
Training:   8%|▊         | 6/76 [00:09<01:36,  1.38s/it][A
Training:   9%|▉         | 7/76 [00:09<01:09,  1.00s/it][A
Training:  11%|█         | 8/76 [00:10<00:50,  1.35it/s][A
Training:  12%|█▏        | 9/76 [00:14<02:02,  1.83s/it][A
Training:  13%|█▎        | 10/76 [00:14<01:27,  1.32s/it][A
Training:  14%|█▍        | 11/76 [00:14<01:02,  1.04it/s][A
Training:  16%|█▌        | 12/76 [00:14<00:45,  1.40it/s][A
Training:  17%|█▋        | 13/76 [00:19<01:52,  1.79s/it][A
Training:  20%|█▉        | 15/76 [00:19<01:00,  1.01it/s][A
Training:  22%|██▏       | 17/76 [00:23<01:27,  1.48s/it][A
Training:  24%|██▎       | 18/76 [00:23<01:09,  1.21s/it][A
Training:  26%|██▋       | 20/76 [00:23<

Epoch: 30/88 - Loss: 3.1905 - Accuracy: 0.9617



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:04<00:39,  4.40s/it][A
 20%|██        | 2/10 [00:04<00:15,  1.93s/it][A
 40%|████      | 4/10 [00:04<00:04,  1.31it/s][A
 50%|█████     | 5/10 [00:08<00:08,  1.75s/it][A
 60%|██████    | 6/10 [00:08<00:05,  1.25s/it][A
100%|██████████| 10/10 [00:12<00:00,  1.24s/it][A
Epochs:  34%|███▍      | 30/88 [50:12<1:37:26, 100.80s/it]

Val Loss: 3.4620 - Val Accuracy: 0.9607



Training:   0%|          | 0/76 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/76 [00:04<06:08,  4.92s/it][A
Training:   4%|▍         | 3/76 [00:05<01:36,  1.32s/it][A
Training:   7%|▋         | 5/76 [00:09<02:09,  1.83s/it][A
Training:   9%|▉         | 7/76 [00:09<01:14,  1.08s/it][A
Training:  11%|█         | 8/76 [00:09<00:59,  1.14it/s][A
Training:  12%|█▏        | 9/76 [00:14<01:56,  1.75s/it][A
Training:  13%|█▎        | 10/76 [00:14<01:27,  1.33s/it][A
Training:  14%|█▍        | 11/76 [00:14<01:05,  1.01s/it][A
Training:  16%|█▌        | 12/76 [00:14<00:49,  1.29it/s][A
Training:  17%|█▋        | 13/76 [00:18<01:49,  1.74s/it][A
Training:  18%|█▊        | 14/76 [00:19<01:19,  1.28s/it][A
Training:  20%|█▉        | 15/76 [00:19<00:58,  1.05it/s][A
Training:  21%|██        | 16/76 [00:19<00:43,  1.39it/s][A
Training:  22%|██▏       | 17/76 [00:23<01:40,  1.71s/it][A
Training:  24%|██▎       | 18/76 [00:23<01:12,  1.26s/it][A
Training:  25%|██▌       | 19/76 [00:2

Epoch: 31/88 - Loss: 3.1624 - Accuracy: 0.9622



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:04<00:42,  4.77s/it][A
 30%|███       | 3/10 [00:04<00:09,  1.31s/it][A
 40%|████      | 4/10 [00:05<00:05,  1.11it/s][A
 50%|█████     | 5/10 [00:09<00:09,  1.94s/it][A
 70%|███████   | 7/10 [00:09<00:03,  1.04s/it][A
100%|██████████| 10/10 [00:12<00:00,  1.26s/it][A
Epochs:  35%|███▌      | 31/88 [51:52<1:35:35, 100.62s/it]

Val Loss: 3.3248 - Val Accuracy: 0.9607



Training:   0%|          | 0/76 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/76 [00:05<06:18,  5.04s/it][A
Training:   3%|▎         | 2/76 [00:05<02:40,  2.17s/it][A
Training:   4%|▍         | 3/76 [00:05<01:34,  1.29s/it][A
Training:   7%|▋         | 5/76 [00:09<02:06,  1.78s/it][A
Training:   8%|▊         | 6/76 [00:09<01:31,  1.31s/it][A
Training:   9%|▉         | 7/76 [00:10<01:13,  1.07s/it][A
Training:  12%|█▏        | 9/76 [00:14<01:41,  1.51s/it][A
Training:  13%|█▎        | 10/76 [00:14<01:17,  1.18s/it][A
Training:  14%|█▍        | 11/76 [00:14<01:01,  1.06it/s][A
Training:  17%|█▋        | 13/76 [00:19<01:32,  1.46s/it][A
Training:  18%|█▊        | 14/76 [00:19<01:11,  1.15s/it][A
Training:  20%|█▉        | 15/76 [00:19<01:01,  1.01s/it][A
Training:  21%|██        | 16/76 [00:20<00:47,  1.25it/s][A
Training:  22%|██▏       | 17/76 [00:24<01:38,  1.67s/it][A
Training:  24%|██▎       | 18/76 [00:24<01:16,  1.32s/it][A
Training:  25%|██▌       | 19/76 [00:25

Epoch: 32/88 - Loss: 3.1156 - Accuracy: 0.9622



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:04<00:42,  4.76s/it][A
 20%|██        | 2/10 [00:04<00:16,  2.04s/it][A
 30%|███       | 3/10 [00:05<00:08,  1.20s/it][A
 40%|████      | 4/10 [00:05<00:04,  1.30it/s][A
 50%|█████     | 5/10 [00:08<00:09,  1.83s/it][A
 60%|██████    | 6/10 [00:09<00:05,  1.25s/it][A
 80%|████████  | 8/10 [00:09<00:01,  1.48it/s][A
100%|██████████| 10/10 [00:12<00:00,  1.24s/it][A
Epochs:  36%|███▋      | 32/88 [53:38<1:35:30, 102.32s/it]

Val Loss: 3.2568 - Val Accuracy: 0.9612



Training:   0%|          | 0/76 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/76 [00:05<06:49,  5.46s/it][A
Training:   3%|▎         | 2/76 [00:05<03:03,  2.48s/it][A
Training:   4%|▍         | 3/76 [00:05<01:41,  1.39s/it][A
Training:   7%|▋         | 5/76 [00:10<02:09,  1.83s/it][A
Training:   8%|▊         | 6/76 [00:10<01:40,  1.43s/it][A
Training:   9%|▉         | 7/76 [00:10<01:13,  1.07s/it][A
Training:  11%|█         | 8/76 [00:11<00:53,  1.26it/s][A
Training:  12%|█▏        | 9/76 [00:15<01:55,  1.73s/it][A
Training:  13%|█▎        | 10/76 [00:15<01:29,  1.36s/it][A
Training:  16%|█▌        | 12/76 [00:15<00:50,  1.26it/s][A
Training:  17%|█▋        | 13/76 [00:19<01:36,  1.54s/it][A
Training:  18%|█▊        | 14/76 [00:20<01:20,  1.29s/it][A
Training:  21%|██        | 16/76 [00:20<00:45,  1.31it/s][A
Training:  22%|██▏       | 17/76 [00:24<01:28,  1.50s/it][A
Training:  24%|██▎       | 18/76 [00:24<01:16,  1.32s/it][A
Training:  25%|██▌       | 19/76 [00:25<

Epoch: 33/88 - Loss: 3.0298 - Accuracy: 0.9632



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:04<00:44,  4.92s/it][A
 20%|██        | 2/10 [00:05<00:17,  2.20s/it][A
 30%|███       | 3/10 [00:05<00:08,  1.26s/it][A
 40%|████      | 4/10 [00:05<00:04,  1.23it/s][A
 50%|█████     | 5/10 [00:08<00:08,  1.70s/it][A
 60%|██████    | 6/10 [00:09<00:04,  1.21s/it][A
 80%|████████  | 8/10 [00:09<00:01,  1.54it/s][A
100%|██████████| 10/10 [00:12<00:00,  1.29s/it][A
Epochs:  38%|███▊      | 33/88 [55:21<1:33:57, 102.51s/it]

Val Loss: 3.0337 - Val Accuracy: 0.9607



Training:   0%|          | 0/76 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/76 [00:05<06:42,  5.37s/it][A
Training:   4%|▍         | 3/76 [00:05<01:45,  1.45s/it][A
Training:   5%|▌         | 4/76 [00:05<01:12,  1.00s/it][A
Training:   7%|▋         | 5/76 [00:10<02:34,  2.18s/it][A
Training:   8%|▊         | 6/76 [00:10<01:46,  1.52s/it][A
Training:   9%|▉         | 7/76 [00:10<01:14,  1.07s/it][A
Training:  12%|█▏        | 9/76 [00:15<01:53,  1.69s/it][A
Training:  14%|█▍        | 11/76 [00:15<01:07,  1.04s/it][A
Training:  17%|█▋        | 13/76 [00:19<01:32,  1.47s/it][A
Training:  18%|█▊        | 14/76 [00:19<01:14,  1.21s/it][A
Training:  21%|██        | 16/76 [00:20<00:46,  1.28it/s][A
Training:  22%|██▏       | 17/76 [00:25<01:38,  1.67s/it][A
Training:  24%|██▎       | 18/76 [00:25<01:16,  1.32s/it][A
Training:  25%|██▌       | 19/76 [00:25<00:58,  1.03s/it][A
Training:  28%|██▊       | 21/76 [00:30<01:30,  1.64s/it][A
Training:  29%|██▉       | 22/76 [00:30

Epoch: 34/88 - Loss: 3.0068 - Accuracy: 0.9624



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:05<00:48,  5.38s/it][A
 20%|██        | 2/10 [00:05<00:18,  2.31s/it][A
 30%|███       | 3/10 [00:05<00:09,  1.30s/it][A
 40%|████      | 4/10 [00:05<00:05,  1.18it/s][A
 50%|█████     | 5/10 [00:10<00:10,  2.16s/it][A
 70%|███████   | 7/10 [00:10<00:03,  1.10s/it][A
100%|██████████| 10/10 [00:14<00:00,  1.45s/it][A
Epochs:  39%|███▊      | 34/88 [57:13<1:34:40, 105.19s/it]

Val Loss: 3.1368 - Val Accuracy: 0.9596



Training:   0%|          | 0/76 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/76 [00:07<09:57,  7.97s/it][A
Training:   3%|▎         | 2/76 [00:08<04:08,  3.35s/it][A
Training:   5%|▌         | 4/76 [00:08<01:37,  1.35s/it][A
Training:   7%|▋         | 5/76 [00:14<03:17,  2.78s/it][A
Training:   8%|▊         | 6/76 [00:14<02:18,  1.98s/it][A
Training:   9%|▉         | 7/76 [00:14<01:39,  1.44s/it][A
Training:  12%|█▏        | 9/76 [00:19<02:09,  1.94s/it][A
Training:  14%|█▍        | 11/76 [00:20<01:20,  1.24s/it][A
Training:  16%|█▌        | 12/76 [00:20<01:03,  1.00it/s][A
Training:  17%|█▋        | 13/76 [00:24<01:51,  1.76s/it][A
Training:  18%|█▊        | 14/76 [00:24<01:22,  1.34s/it][A
Training:  20%|█▉        | 15/76 [00:24<01:05,  1.07s/it][A
Training:  22%|██▏       | 17/76 [00:29<01:35,  1.61s/it][A
Training:  25%|██▌       | 19/76 [00:29<01:01,  1.07s/it][A
Training:  26%|██▋       | 20/76 [00:30<00:48,  1.16it/s][A
Training:  28%|██▊       | 21/76 [00:34

Epoch: 35/88 - Loss: 3.0094 - Accuracy: 0.9621



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:04<00:43,  4.85s/it][A
 20%|██        | 2/10 [00:05<00:17,  2.13s/it][A
 40%|████      | 4/10 [00:05<00:04,  1.21it/s][A
 60%|██████    | 6/10 [00:09<00:05,  1.42s/it][A
 80%|████████  | 8/10 [00:09<00:01,  1.14it/s][A
100%|██████████| 10/10 [00:13<00:00,  1.32s/it][A
Epochs:  40%|███▉      | 35/88 [59:04<1:34:26, 106.92s/it]

Val Loss: 3.0377 - Val Accuracy: 0.9591



Training:   0%|          | 0/76 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/76 [00:05<06:50,  5.48s/it][A
Training:   3%|▎         | 2/76 [00:05<03:01,  2.45s/it][A
Training:   4%|▍         | 3/76 [00:05<01:40,  1.38s/it][A
Training:   7%|▋         | 5/76 [00:10<02:13,  1.88s/it][A
Training:   8%|▊         | 6/76 [00:10<01:38,  1.41s/it][A
Training:   9%|▉         | 7/76 [00:10<01:11,  1.03s/it][A
Training:  11%|█         | 8/76 [00:10<00:52,  1.30it/s][A
Training:  12%|█▏        | 9/76 [00:15<02:08,  1.92s/it][A
Training:  13%|█▎        | 10/76 [00:15<01:33,  1.41s/it][A
Training:  14%|█▍        | 11/76 [00:15<01:06,  1.03s/it][A
Training:  17%|█▋        | 13/76 [00:20<01:36,  1.53s/it][A
Training:  18%|█▊        | 14/76 [00:20<01:18,  1.27s/it][A
Training:  21%|██        | 16/76 [00:20<00:45,  1.31it/s][A
Training:  22%|██▏       | 17/76 [00:25<01:32,  1.57s/it][A
Training:  24%|██▎       | 18/76 [00:25<01:19,  1.37s/it][A
Training:  25%|██▌       | 19/76 [00:26<

Epoch: 36/88 - Loss: 2.9148 - Accuracy: 0.9629



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:05<00:46,  5.13s/it][A
 20%|██        | 2/10 [00:05<00:17,  2.21s/it][A
 30%|███       | 3/10 [00:05<00:08,  1.25s/it][A
 40%|████      | 4/10 [00:05<00:04,  1.25it/s][A
 50%|█████     | 5/10 [00:09<00:09,  1.91s/it][A
 70%|███████   | 7/10 [00:09<00:02,  1.02it/s][A
 80%|████████  | 8/10 [00:09<00:01,  1.34it/s][A
100%|██████████| 10/10 [00:13<00:00,  1.34s/it][A
Epochs:  41%|████      | 36/88 [1:00:47<1:31:48, 105.93s/it]

Val Loss: 3.2165 - Val Accuracy: 0.9585



Training:   0%|          | 0/76 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/76 [00:06<07:36,  6.09s/it][A
Training:   4%|▍         | 3/76 [00:06<01:59,  1.63s/it][A
Training:   7%|▋         | 5/76 [00:11<02:28,  2.09s/it][A
Training:   8%|▊         | 6/76 [00:11<01:49,  1.56s/it][A
Training:  11%|█         | 8/76 [00:11<01:02,  1.09it/s][A
Training:  12%|█▏        | 9/76 [00:15<01:54,  1.70s/it][A
Training:  14%|█▍        | 11/76 [00:15<01:07,  1.04s/it][A
Training:  16%|█▌        | 12/76 [00:16<00:54,  1.18it/s][A
Training:  17%|█▋        | 13/76 [00:20<01:46,  1.69s/it][A
Training:  18%|█▊        | 14/76 [00:20<01:21,  1.32s/it][A
Training:  21%|██        | 16/76 [00:20<00:47,  1.27it/s][A
Training:  22%|██▏       | 17/76 [00:25<01:36,  1.64s/it][A
Training:  24%|██▎       | 18/76 [00:25<01:14,  1.28s/it][A
Training:  25%|██▌       | 19/76 [00:25<00:55,  1.02it/s][A
Training:  26%|██▋       | 20/76 [00:25<00:42,  1.33it/s][A
Training:  28%|██▊       | 21/76 [00:2

Epoch: 37/88 - Loss: 2.9857 - Accuracy: 0.9628



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:04<00:43,  4.83s/it][A
 20%|██        | 2/10 [00:05<00:16,  2.11s/it][A
 40%|████      | 4/10 [00:05<00:05,  1.19it/s][A
 50%|█████     | 5/10 [00:09<00:08,  1.78s/it][A
 60%|██████    | 6/10 [00:09<00:05,  1.33s/it][A
 80%|████████  | 8/10 [00:09<00:01,  1.36it/s][A
100%|██████████| 10/10 [00:13<00:00,  1.32s/it][A
Epochs:  42%|████▏     | 37/88 [1:02:30<1:29:20, 105.10s/it]

Val Loss: 3.0031 - Val Accuracy: 0.9591



Training:   0%|          | 0/76 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/76 [00:05<07:00,  5.61s/it][A
Training:   4%|▍         | 3/76 [00:05<01:50,  1.52s/it][A
Training:   7%|▋         | 5/76 [00:10<02:19,  1.96s/it][A
Training:   8%|▊         | 6/76 [00:10<01:42,  1.47s/it][A
Training:   9%|▉         | 7/76 [00:10<01:15,  1.09s/it][A
Training:  11%|█         | 8/76 [00:10<00:57,  1.19it/s][A
Training:  12%|█▏        | 9/76 [00:15<02:03,  1.85s/it][A
Training:  13%|█▎        | 10/76 [00:15<01:34,  1.42s/it][A
Training:  14%|█▍        | 11/76 [00:15<01:07,  1.04s/it][A
Training:  17%|█▋        | 13/76 [00:20<01:39,  1.58s/it][A
Training:  18%|█▊        | 14/76 [00:20<01:23,  1.35s/it][A
Training:  21%|██        | 16/76 [00:21<00:48,  1.23it/s][A
Training:  22%|██▏       | 17/76 [00:25<01:32,  1.57s/it][A
Training:  24%|██▎       | 18/76 [00:25<01:15,  1.30s/it][A
Training:  25%|██▌       | 19/76 [00:25<00:56,  1.00it/s][A
Training:  26%|██▋       | 20/76 [00:25

Epoch: 38/88 - Loss: 2.8180 - Accuracy: 0.9639



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:05<00:45,  5.06s/it][A
 20%|██        | 2/10 [00:05<00:17,  2.16s/it][A
 30%|███       | 3/10 [00:05<00:08,  1.25s/it][A
 50%|█████     | 5/10 [00:09<00:08,  1.69s/it][A
 70%|███████   | 7/10 [00:09<00:02,  1.05it/s][A
100%|██████████| 10/10 [00:13<00:00,  1.35s/it][A
Epochs:  43%|████▎     | 38/88 [1:04:15<1:27:30, 105.01s/it]

Val Loss: 3.0122 - Val Accuracy: 0.9591



Training:   0%|          | 0/76 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/76 [00:06<07:53,  6.31s/it][A
Training:   4%|▍         | 3/76 [00:06<02:05,  1.72s/it][A
Training:   7%|▋         | 5/76 [00:11<02:30,  2.11s/it][A
Training:   8%|▊         | 6/76 [00:11<01:50,  1.58s/it][A
Training:   9%|▉         | 7/76 [00:11<01:20,  1.17s/it][A
Training:  12%|█▏        | 9/76 [00:16<01:52,  1.67s/it][A
Training:  13%|█▎        | 10/76 [00:16<01:26,  1.30s/it][A
Training:  14%|█▍        | 11/76 [00:16<01:05,  1.01s/it][A
Training:  17%|█▋        | 13/76 [00:21<01:40,  1.60s/it][A
Training:  20%|█▉        | 15/76 [00:21<01:02,  1.02s/it][A
Training:  22%|██▏       | 17/76 [00:26<01:27,  1.49s/it][A
Training:  25%|██▌       | 19/76 [00:26<00:57,  1.01s/it][A
Training:  28%|██▊       | 21/76 [00:31<01:19,  1.44s/it][A
Training:  30%|███       | 23/76 [00:31<00:53,  1.02s/it][A
Training:  32%|███▏      | 24/76 [00:31<00:44,  1.16it/s][A
Training:  33%|███▎      | 25/76 [00:3

Epoch: 39/88 - Loss: 2.7730 - Accuracy: 0.9644



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:04<00:43,  4.88s/it][A
 20%|██        | 2/10 [00:04<00:16,  2.07s/it][A
 30%|███       | 3/10 [00:05<00:08,  1.18s/it][A
 50%|█████     | 5/10 [00:09<00:08,  1.77s/it][A
 60%|██████    | 6/10 [00:09<00:05,  1.30s/it][A
 80%|████████  | 8/10 [00:09<00:01,  1.35it/s][A
100%|██████████| 10/10 [00:13<00:00,  1.35s/it][A
Epochs:  44%|████▍     | 39/88 [1:06:00<1:25:43, 104.96s/it]

Val Loss: 3.2337 - Val Accuracy: 0.9602



Training:   0%|          | 0/76 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/76 [00:05<06:59,  5.59s/it][A
Training:   3%|▎         | 2/76 [00:05<02:55,  2.37s/it][A
Training:   4%|▍         | 3/76 [00:05<01:39,  1.36s/it][A
Training:   5%|▌         | 4/76 [00:05<01:02,  1.16it/s][A
Training:   7%|▋         | 5/76 [00:10<02:32,  2.15s/it][A
Training:   9%|▉         | 7/76 [00:10<01:16,  1.11s/it][A
Training:  11%|█         | 8/76 [00:10<00:59,  1.15it/s][A
Training:  12%|█▏        | 9/76 [00:15<02:03,  1.84s/it][A
Training:  13%|█▎        | 10/76 [00:15<01:29,  1.36s/it][A
Training:  14%|█▍        | 11/76 [00:15<01:05,  1.00s/it][A
Training:  16%|█▌        | 12/76 [00:15<00:49,  1.30it/s][A
Training:  17%|█▋        | 13/76 [00:20<01:56,  1.85s/it][A
Training:  18%|█▊        | 14/76 [00:20<01:22,  1.34s/it][A
Training:  20%|█▉        | 15/76 [00:20<00:59,  1.03it/s][A
Training:  21%|██        | 16/76 [00:20<00:45,  1.31it/s][A
Training:  22%|██▏       | 17/76 [00:24<

Epoch: 40/88 - Loss: 2.7773 - Accuracy: 0.9633



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:05<00:45,  5.00s/it][A
 20%|██        | 2/10 [00:05<00:17,  2.14s/it][A
 30%|███       | 3/10 [00:05<00:08,  1.24s/it][A
 40%|████      | 4/10 [00:05<00:04,  1.25it/s][A
 50%|█████     | 5/10 [00:09<00:09,  1.96s/it][A
 80%|████████  | 8/10 [00:09<00:01,  1.22it/s][A
 90%|█████████ | 9/10 [00:13<00:01,  1.44s/it][A
100%|██████████| 10/10 [00:13<00:00,  1.35s/it][A
Epochs:  45%|████▌     | 40/88 [1:07:43<1:23:26, 104.30s/it]

Val Loss: 2.9746 - Val Accuracy: 0.9591



Training:   0%|          | 0/76 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/76 [00:05<07:23,  5.91s/it][A
Training:   3%|▎         | 2/76 [00:06<03:08,  2.55s/it][A
Training:   4%|▍         | 3/76 [00:06<01:44,  1.43s/it][A
Training:   7%|▋         | 5/76 [00:10<02:10,  1.84s/it][A
Training:   8%|▊         | 6/76 [00:10<01:35,  1.36s/it][A
Training:   9%|▉         | 7/76 [00:10<01:10,  1.02s/it][A
Training:  11%|█         | 8/76 [00:11<00:52,  1.31it/s][A
Training:  12%|█▏        | 9/76 [00:15<02:02,  1.83s/it][A
Training:  14%|█▍        | 11/76 [00:15<01:06,  1.02s/it][A
Training:  16%|█▌        | 12/76 [00:15<00:51,  1.25it/s][A
Training:  17%|█▋        | 13/76 [00:21<02:06,  2.02s/it][A
Training:  20%|█▉        | 15/76 [00:21<01:12,  1.19s/it][A
Training:  21%|██        | 16/76 [00:21<00:56,  1.06it/s][A
Training:  22%|██▏       | 17/76 [00:26<02:04,  2.11s/it][A
Training:  25%|██▌       | 19/76 [00:27<01:11,  1.25s/it][A
Training:  26%|██▋       | 20/76 [00:27<

Epoch: 41/88 - Loss: 2.7747 - Accuracy: 0.9649



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:05<00:52,  5.82s/it][A
 20%|██        | 2/10 [00:05<00:19,  2.50s/it][A
 40%|████      | 4/10 [00:06<00:05,  1.02it/s][A
 50%|█████     | 5/10 [00:10<00:10,  2.11s/it][A
 60%|██████    | 6/10 [00:10<00:05,  1.50s/it][A
 70%|███████   | 7/10 [00:11<00:03,  1.09s/it][A
100%|██████████| 10/10 [00:15<00:00,  1.53s/it][A
Epochs:  47%|████▋     | 41/88 [1:09:42<1:25:07, 108.67s/it]

Val Loss: 3.0488 - Val Accuracy: 0.9596



Training:   0%|          | 0/76 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/76 [00:06<07:56,  6.35s/it][A
Training:   4%|▍         | 3/76 [00:06<02:08,  1.76s/it][A
Training:   5%|▌         | 4/76 [00:06<01:25,  1.19s/it][A
Training:   7%|▋         | 5/76 [00:12<03:05,  2.61s/it][A
Training:   8%|▊         | 6/76 [00:12<02:07,  1.82s/it][A
Training:  11%|█         | 8/76 [00:12<01:09,  1.02s/it][A
Training:  12%|█▏        | 9/76 [00:17<02:13,  1.99s/it][A
Training:  13%|█▎        | 10/76 [00:17<01:38,  1.49s/it][A
Training:  14%|█▍        | 11/76 [00:17<01:13,  1.14s/it][A
Training:  17%|█▋        | 13/76 [00:22<01:51,  1.77s/it][A
Training:  20%|█▉        | 15/76 [00:23<01:13,  1.21s/it][A
Training:  22%|██▏       | 17/76 [00:28<01:37,  1.66s/it][A
Training:  24%|██▎       | 18/76 [00:28<01:18,  1.35s/it][A
Training:  25%|██▌       | 19/76 [00:29<01:09,  1.21s/it][A
Training:  28%|██▊       | 21/76 [00:34<01:30,  1.64s/it][A
Training:  30%|███       | 23/76 [00:35

Epoch: 42/88 - Loss: 2.6765 - Accuracy: 0.9647



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:05<00:51,  5.69s/it][A
 20%|██        | 2/10 [00:05<00:19,  2.42s/it][A
 40%|████      | 4/10 [00:06<00:05,  1.03it/s][A
 50%|█████     | 5/10 [00:11<00:11,  2.23s/it][A
 60%|██████    | 6/10 [00:11<00:06,  1.63s/it][A
 70%|███████   | 7/10 [00:11<00:03,  1.17s/it][A
 80%|████████  | 8/10 [00:11<00:01,  1.18it/s][A
100%|██████████| 10/10 [00:16<00:00,  1.62s/it][A
Epochs:  48%|████▊     | 42/88 [1:11:43<1:26:09, 112.39s/it]

Val Loss: 3.0899 - Val Accuracy: 0.9585



Training:   0%|          | 0/76 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/76 [00:06<08:16,  6.62s/it][A
Training:   3%|▎         | 2/76 [00:06<03:28,  2.82s/it][A
Training:   5%|▌         | 4/76 [00:06<01:18,  1.09s/it][A
Training:   7%|▋         | 5/76 [00:13<03:09,  2.66s/it][A
Training:   9%|▉         | 7/76 [00:13<01:39,  1.45s/it][A
Training:  11%|█         | 8/76 [00:13<01:16,  1.12s/it][A
Training:  12%|█▏        | 9/76 [00:18<02:32,  2.27s/it][A
Training:  14%|█▍        | 11/76 [00:19<01:26,  1.32s/it][A
Training:  16%|█▌        | 12/76 [00:19<01:08,  1.07s/it][A
Training:  17%|█▋        | 13/76 [00:24<02:07,  2.03s/it][A
Training:  18%|█▊        | 14/76 [00:24<01:35,  1.53s/it][A
Training:  20%|█▉        | 15/76 [00:24<01:09,  1.15s/it][A
Training:  21%|██        | 16/76 [00:24<00:51,  1.17it/s][A
Training:  22%|██▏       | 17/76 [00:30<02:10,  2.21s/it][A
Training:  24%|██▎       | 18/76 [00:30<01:33,  1.61s/it][A
Training:  25%|██▌       | 19/76 [00:30

Epoch: 43/88 - Loss: 2.7241 - Accuracy: 0.9663



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:05<00:50,  5.59s/it][A
 20%|██        | 2/10 [00:05<00:18,  2.36s/it][A
 30%|███       | 3/10 [00:06<00:10,  1.45s/it][A
 50%|█████     | 5/10 [00:10<00:09,  1.95s/it][A
 70%|███████   | 7/10 [00:11<00:03,  1.15s/it][A
100%|██████████| 10/10 [00:15<00:00,  1.55s/it][A
Epochs:  49%|████▉     | 43/88 [1:13:43<1:25:58, 114.64s/it]

Val Loss: 3.0521 - Val Accuracy: 0.9602



Training:   0%|          | 0/76 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/76 [00:06<07:49,  6.26s/it][A
Training:   3%|▎         | 2/76 [00:06<03:15,  2.64s/it][A
Training:   4%|▍         | 3/76 [00:06<01:48,  1.48s/it][A
Training:   5%|▌         | 4/76 [00:06<01:07,  1.07it/s][A
Training:   7%|▋         | 5/76 [00:11<02:50,  2.40s/it][A
Training:   8%|▊         | 6/76 [00:11<01:53,  1.62s/it][A
Training:   9%|▉         | 7/76 [00:11<01:18,  1.14s/it][A
Training:  11%|█         | 8/76 [00:11<00:56,  1.21it/s][A
Training:  12%|█▏        | 9/76 [00:16<02:23,  2.14s/it][A
Training:  14%|█▍        | 11/76 [00:17<01:16,  1.18s/it][A
Training:  17%|█▋        | 13/76 [00:22<01:46,  1.69s/it][A
Training:  21%|██        | 16/76 [00:22<00:55,  1.07it/s][A
Training:  22%|██▏       | 17/76 [00:27<01:38,  1.68s/it][A
Training:  24%|██▎       | 18/76 [00:27<01:20,  1.38s/it][A
Training:  25%|██▌       | 19/76 [00:27<01:02,  1.10s/it][A
Training:  28%|██▊       | 21/76 [00:32<0

Epoch: 44/88 - Loss: 2.6727 - Accuracy: 0.9648



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:05<00:46,  5.17s/it][A
 30%|███       | 3/10 [00:05<00:10,  1.47s/it][A
 50%|█████     | 5/10 [00:10<00:09,  1.91s/it][A
 70%|███████   | 7/10 [00:10<00:03,  1.13s/it][A
100%|██████████| 10/10 [00:14<00:00,  1.49s/it][A
Epochs:  50%|█████     | 44/88 [1:15:37<1:23:59, 114.53s/it]

Val Loss: 2.8569 - Val Accuracy: 0.9610



Training:   0%|          | 0/76 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/76 [00:06<07:53,  6.31s/it][A
Training:   3%|▎         | 2/76 [00:06<03:17,  2.66s/it][A
Training:   5%|▌         | 4/76 [00:06<01:14,  1.03s/it][A
Training:   8%|▊         | 6/76 [00:12<02:12,  1.89s/it][A
Training:  11%|█         | 8/76 [00:12<01:19,  1.16s/it][A
Training:  12%|█▏        | 9/76 [00:17<02:15,  2.02s/it][A
Training:  13%|█▎        | 10/76 [00:17<01:44,  1.59s/it][A
Training:  16%|█▌        | 12/76 [00:17<01:02,  1.03it/s][A
Training:  17%|█▋        | 13/76 [00:22<01:59,  1.90s/it][A
Training:  18%|█▊        | 14/76 [00:23<01:30,  1.47s/it][A
Training:  20%|█▉        | 15/76 [00:23<01:08,  1.12s/it][A
Training:  22%|██▏       | 17/76 [00:28<01:43,  1.75s/it][A
Training:  25%|██▌       | 19/76 [00:28<01:03,  1.12s/it][A
Training:  28%|██▊       | 21/76 [00:33<01:30,  1.65s/it][A
Training:  29%|██▉       | 22/76 [00:33<01:13,  1.35s/it][A
Training:  30%|███       | 23/76 [00:3

Epoch: 45/88 - Loss: 2.6460 - Accuracy: 0.9655



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:05<00:51,  5.68s/it][A
 20%|██        | 2/10 [00:06<00:20,  2.55s/it][A
 50%|█████     | 5/10 [00:10<00:08,  1.79s/it][A
 60%|██████    | 6/10 [00:11<00:05,  1.47s/it][A
 70%|███████   | 7/10 [00:11<00:03,  1.13s/it][A
 80%|████████  | 8/10 [00:11<00:01,  1.17it/s][A
100%|██████████| 10/10 [00:15<00:00,  1.50s/it][A
Epochs:  51%|█████     | 45/88 [1:17:34<1:22:36, 115.27s/it]

Val Loss: 2.9626 - Val Accuracy: 0.9607



Training:   0%|          | 0/76 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/76 [00:06<07:36,  6.09s/it][A
Training:   3%|▎         | 2/76 [00:06<03:34,  2.90s/it][A
Training:   4%|▍         | 3/76 [00:06<01:59,  1.63s/it][A
Training:   5%|▌         | 4/76 [00:07<01:14,  1.03s/it][A
Training:   7%|▋         | 5/76 [00:11<02:46,  2.34s/it][A
Training:   8%|▊         | 6/76 [00:12<02:04,  1.78s/it][A
Training:  11%|█         | 8/76 [00:12<01:03,  1.07it/s][A
Training:  12%|█▏        | 9/76 [00:17<02:08,  1.92s/it][A
Training:  13%|█▎        | 10/76 [00:17<01:41,  1.54s/it][A
Training:  16%|█▌        | 12/76 [00:17<00:57,  1.11it/s][A
Training:  17%|█▋        | 13/76 [00:22<01:49,  1.73s/it][A
Training:  18%|█▊        | 14/76 [00:22<01:30,  1.45s/it][A
Training:  20%|█▉        | 15/76 [00:23<01:08,  1.11s/it][A
Training:  21%|██        | 16/76 [00:23<00:50,  1.19it/s][A
Training:  22%|██▏       | 17/76 [00:26<01:33,  1.59s/it][A
Training:  24%|██▎       | 18/76 [00:27<

Epoch: 46/88 - Loss: 2.6345 - Accuracy: 0.9663



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:05<00:53,  5.98s/it][A
 20%|██        | 2/10 [00:06<00:21,  2.64s/it][A
 30%|███       | 3/10 [00:06<00:10,  1.49s/it][A
 40%|████      | 4/10 [00:06<00:05,  1.05it/s][A
 50%|█████     | 5/10 [00:11<00:12,  2.54s/it][A
 60%|██████    | 6/10 [00:12<00:06,  1.74s/it][A
 70%|███████   | 7/10 [00:12<00:03,  1.21s/it][A
100%|██████████| 10/10 [00:17<00:00,  1.72s/it][A
Epochs:  52%|█████▏    | 46/88 [1:19:26<1:20:04, 114.40s/it]

Val Loss: 3.0332 - Val Accuracy: 0.9616



Training:   0%|          | 0/76 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/76 [00:06<08:07,  6.50s/it][A
Training:   3%|▎         | 2/76 [00:06<03:33,  2.88s/it][A
Training:   5%|▌         | 4/76 [00:06<01:20,  1.12s/it][A
Training:   7%|▋         | 5/76 [00:12<02:56,  2.48s/it][A
Training:   8%|▊         | 6/76 [00:12<02:08,  1.84s/it][A
Training:  11%|█         | 8/76 [00:13<01:08,  1.01s/it][A
Training:  12%|█▏        | 9/76 [00:17<02:13,  2.00s/it][A
Training:  13%|█▎        | 10/76 [00:18<01:40,  1.52s/it][A
Training:  16%|█▌        | 12/76 [00:18<00:57,  1.12it/s][A
Training:  17%|█▋        | 13/76 [00:22<01:49,  1.74s/it][A
Training:  18%|█▊        | 14/76 [00:23<01:30,  1.45s/it][A
Training:  20%|█▉        | 15/76 [00:23<01:07,  1.11s/it][A
Training:  21%|██        | 16/76 [00:23<00:51,  1.18it/s][A
Training:  22%|██▏       | 17/76 [00:27<01:45,  1.78s/it][A
Training:  24%|██▎       | 18/76 [00:28<01:28,  1.52s/it][A
Training:  25%|██▌       | 19/76 [00:28

Epoch: 47/88 - Loss: 2.6036 - Accuracy: 0.9663



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:04<00:44,  4.94s/it][A
 20%|██        | 2/10 [00:05<00:17,  2.20s/it][A
 50%|█████     | 5/10 [00:09<00:08,  1.75s/it][A
 70%|███████   | 7/10 [00:10<00:03,  1.06s/it][A
100%|██████████| 10/10 [00:14<00:00,  1.40s/it][A
Epochs:  53%|█████▎    | 47/88 [1:21:15<1:17:01, 112.72s/it]

Val Loss: 2.7099 - Val Accuracy: 0.9605



Training:   0%|          | 0/76 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/76 [00:05<06:59,  5.59s/it][A
Training:   3%|▎         | 2/76 [00:05<03:02,  2.47s/it][A
Training:   5%|▌         | 4/76 [00:06<01:11,  1.00it/s][A
Training:   7%|▋         | 5/76 [00:10<02:24,  2.04s/it][A
Training:   8%|▊         | 6/76 [00:10<01:44,  1.49s/it][A
Training:   9%|▉         | 7/76 [00:10<01:15,  1.09s/it][A
Training:  11%|█         | 8/76 [00:11<00:54,  1.25it/s][A
Training:  12%|█▏        | 9/76 [00:15<02:00,  1.79s/it][A
Training:  13%|█▎        | 10/76 [00:15<01:28,  1.34s/it][A
Training:  16%|█▌        | 12/76 [00:15<00:51,  1.25it/s][A
Training:  17%|█▋        | 13/76 [00:20<01:47,  1.70s/it][A
Training:  20%|█▉        | 15/76 [00:20<01:02,  1.02s/it][A
Training:  22%|██▏       | 17/76 [00:24<01:23,  1.42s/it][A
Training:  24%|██▎       | 18/76 [00:24<01:07,  1.16s/it][A
Training:  25%|██▌       | 19/76 [00:24<00:52,  1.08it/s][A
Training:  26%|██▋       | 20/76 [00:25<

Epoch: 48/88 - Loss: 2.5305 - Accuracy: 0.9658



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:05<00:50,  5.58s/it][A
 20%|██        | 2/10 [00:05<00:19,  2.39s/it][A
 30%|███       | 3/10 [00:05<00:09,  1.37s/it][A
 40%|████      | 4/10 [00:06<00:05,  1.14it/s][A
 50%|█████     | 5/10 [00:10<00:10,  2.13s/it][A
 70%|███████   | 7/10 [00:10<00:03,  1.09s/it][A
100%|██████████| 10/10 [00:14<00:00,  1.47s/it][A
Epochs:  55%|█████▍    | 48/88 [1:23:10<1:15:29, 113.23s/it]

Val Loss: 2.8194 - Val Accuracy: 0.9607



Training:   0%|          | 0/76 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/76 [00:06<07:38,  6.12s/it][A
Training:   4%|▍         | 3/76 [00:06<01:59,  1.64s/it][A
Training:   7%|▋         | 5/76 [00:11<02:25,  2.04s/it][A
Training:   9%|▉         | 7/76 [00:11<01:23,  1.21s/it][A
Training:  12%|█▏        | 9/76 [00:16<01:51,  1.67s/it][A
Training:  14%|█▍        | 11/76 [00:16<01:11,  1.11s/it][A
Training:  17%|█▋        | 13/76 [00:21<01:38,  1.56s/it][A
Training:  20%|█▉        | 15/76 [00:21<01:05,  1.07s/it][A
Training:  21%|██        | 16/76 [00:21<00:53,  1.12it/s][A
Training:  22%|██▏       | 17/76 [00:26<01:44,  1.78s/it][A
Training:  24%|██▎       | 18/76 [00:26<01:21,  1.40s/it][A
Training:  25%|██▌       | 19/76 [00:26<01:02,  1.09s/it][A
Training:  26%|██▋       | 20/76 [00:26<00:47,  1.19it/s][A
Training:  28%|██▊       | 21/76 [00:31<01:44,  1.90s/it][A
Training:  29%|██▉       | 22/76 [00:31<01:15,  1.40s/it][A
Training:  32%|███▏      | 24/76 [00:

Epoch: 49/88 - Loss: 2.5501 - Accuracy: 0.9675



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:04<00:44,  4.96s/it][A
 20%|██        | 2/10 [00:05<00:17,  2.21s/it][A
 30%|███       | 3/10 [00:05<00:08,  1.27s/it][A
 50%|█████     | 5/10 [00:09<00:08,  1.75s/it][A
 70%|███████   | 7/10 [00:09<00:02,  1.01it/s][A
100%|██████████| 10/10 [00:13<00:00,  1.37s/it][A
Epochs:  56%|█████▌    | 49/88 [1:24:56<1:12:14, 111.15s/it]

Val Loss: 2.9855 - Val Accuracy: 0.9621



Training:   0%|          | 0/76 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/76 [00:05<07:10,  5.75s/it][A
Training:   4%|▍         | 3/76 [00:05<01:53,  1.55s/it][A
Training:   5%|▌         | 4/76 [00:06<01:17,  1.08s/it][A
Training:   7%|▋         | 5/76 [00:10<02:37,  2.21s/it][A
Training:   9%|▉         | 7/76 [00:10<01:20,  1.17s/it][A
Training:  11%|█         | 8/76 [00:11<01:04,  1.05it/s][A
Training:  12%|█▏        | 9/76 [00:15<02:09,  1.94s/it][A
Training:  14%|█▍        | 11/76 [00:15<01:13,  1.13s/it][A
Training:  17%|█▋        | 13/76 [00:20<01:38,  1.56s/it][A
Training:  20%|█▉        | 15/76 [00:20<01:03,  1.03s/it][A
Training:  21%|██        | 16/76 [00:20<00:51,  1.15it/s][A
Training:  22%|██▏       | 17/76 [00:25<01:43,  1.75s/it][A
Training:  24%|██▎       | 18/76 [00:25<01:18,  1.35s/it][A
Training:  25%|██▌       | 19/76 [00:25<01:00,  1.05s/it][A
Training:  26%|██▋       | 20/76 [00:25<00:44,  1.25it/s][A
Training:  28%|██▊       | 21/76 [00:30

Epoch: 50/88 - Loss: 2.5294 - Accuracy: 0.9666



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:05<00:48,  5.44s/it][A
 30%|███       | 3/10 [00:05<00:10,  1.47s/it][A
 50%|█████     | 5/10 [00:10<00:09,  1.86s/it][A
 70%|███████   | 7/10 [00:10<00:03,  1.11s/it][A
 80%|████████  | 8/10 [00:10<00:01,  1.14it/s][A
100%|██████████| 10/10 [00:13<00:00,  1.38s/it][A
Epochs:  57%|█████▋    | 50/88 [1:26:44<1:09:44, 110.11s/it]

Val Loss: 2.8548 - Val Accuracy: 0.9610



Training:   0%|          | 0/76 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/76 [00:05<07:27,  5.97s/it][A
Training:   4%|▍         | 3/76 [00:06<01:58,  1.62s/it][A
Training:   5%|▌         | 4/76 [00:06<01:19,  1.10s/it][A
Training:   7%|▋         | 5/76 [00:11<02:53,  2.44s/it][A
Training:   8%|▊         | 6/76 [00:11<02:00,  1.71s/it][A
Training:   9%|▉         | 7/76 [00:11<01:27,  1.27s/it][A
Training:  11%|█         | 8/76 [00:12<01:02,  1.09it/s][A
Training:  12%|█▏        | 9/76 [00:17<02:38,  2.37s/it][A
Training:  14%|█▍        | 11/76 [00:18<01:28,  1.37s/it][A
Training:  16%|█▌        | 12/76 [00:18<01:07,  1.06s/it][A
Training:  17%|█▋        | 13/76 [00:22<02:02,  1.95s/it][A
Training:  20%|█▉        | 15/76 [00:23<01:17,  1.27s/it][A
Training:  22%|██▏       | 17/76 [00:27<01:37,  1.64s/it][A
Training:  25%|██▌       | 19/76 [00:28<01:07,  1.18s/it][A
Training:  26%|██▋       | 20/76 [00:28<00:54,  1.03it/s][A
Training:  28%|██▊       | 21/76 [00:33<

Epoch: 51/88 - Loss: 2.6237 - Accuracy: 0.9655



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:05<00:52,  5.81s/it][A
 40%|████      | 4/10 [00:06<00:07,  1.24s/it][A
 50%|█████     | 5/10 [00:09<00:09,  1.89s/it][A
 70%|███████   | 7/10 [00:10<00:03,  1.08s/it][A
 80%|████████  | 8/10 [00:10<00:01,  1.08it/s][A
100%|██████████| 10/10 [00:14<00:00,  1.40s/it][A
Epochs:  58%|█████▊    | 51/88 [1:28:38<1:08:42, 111.41s/it]

Val Loss: 2.7868 - Val Accuracy: 0.9605



Training:   0%|          | 0/76 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/76 [00:05<07:25,  5.94s/it][A
Training:   3%|▎         | 2/76 [00:06<03:08,  2.55s/it][A
Training:   4%|▍         | 3/76 [00:06<01:46,  1.46s/it][A
Training:   5%|▌         | 4/76 [00:06<01:07,  1.06it/s][A
Training:   7%|▋         | 5/76 [00:11<02:59,  2.53s/it][A
Training:   9%|▉         | 7/76 [00:11<01:28,  1.28s/it][A
Training:  12%|█▏        | 9/76 [00:17<02:04,  1.85s/it][A
Training:  13%|█▎        | 10/76 [00:17<01:36,  1.46s/it][A
Training:  14%|█▍        | 11/76 [00:17<01:13,  1.13s/it][A
Training:  17%|█▋        | 13/76 [00:22<01:45,  1.67s/it][A
Training:  20%|█▉        | 15/76 [00:22<01:06,  1.08s/it][A
Training:  22%|██▏       | 17/76 [00:27<01:30,  1.54s/it][A
Training:  24%|██▎       | 18/76 [00:27<01:13,  1.26s/it][A
Training:  26%|██▋       | 20/76 [00:27<00:46,  1.20it/s][A
Training:  28%|██▊       | 21/76 [00:32<01:28,  1.61s/it][A
Training:  29%|██▉       | 22/76 [00:32

Epoch: 52/88 - Loss: 2.5815 - Accuracy: 0.9664



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:05<00:45,  5.00s/it][A
 20%|██        | 2/10 [00:05<00:17,  2.14s/it][A
 30%|███       | 3/10 [00:05<00:08,  1.23s/it][A
 40%|████      | 4/10 [00:05<00:04,  1.25it/s][A
 50%|█████     | 5/10 [00:09<00:10,  2.14s/it][A
 70%|███████   | 7/10 [00:10<00:03,  1.08s/it][A
100%|██████████| 10/10 [00:13<00:00,  1.37s/it][A
Epochs:  59%|█████▉    | 52/88 [1:30:32<1:07:15, 112.09s/it]

Val Loss: 2.9736 - Val Accuracy: 0.9610



Training:   0%|          | 0/76 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/76 [00:06<07:31,  6.01s/it][A
Training:   3%|▎         | 2/76 [00:06<03:11,  2.58s/it][A
Training:   5%|▌         | 4/76 [00:06<01:13,  1.02s/it][A
Training:   7%|▋         | 5/76 [00:11<02:36,  2.20s/it][A
Training:   9%|▉         | 7/76 [00:11<01:23,  1.21s/it][A
Training:  12%|█▏        | 9/76 [00:16<01:56,  1.75s/it][A
Training:  13%|█▎        | 10/76 [00:16<01:31,  1.38s/it][A
Training:  14%|█▍        | 11/76 [00:16<01:10,  1.08s/it][A
Training:  16%|█▌        | 12/76 [00:16<00:53,  1.20it/s][A
Training:  17%|█▋        | 13/76 [00:21<01:56,  1.85s/it][A
Training:  18%|█▊        | 14/76 [00:21<01:24,  1.37s/it][A
Training:  20%|█▉        | 15/76 [00:21<01:03,  1.03s/it][A
Training:  21%|██        | 16/76 [00:21<00:47,  1.28it/s][A
Training:  22%|██▏       | 17/76 [00:26<01:51,  1.89s/it][A
Training:  24%|██▎       | 18/76 [00:26<01:19,  1.37s/it][A
Training:  25%|██▌       | 19/76 [00:2

Epoch: 53/88 - Loss: 2.4530 - Accuracy: 0.9669



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:05<00:52,  5.78s/it][A
 20%|██        | 2/10 [00:05<00:19,  2.44s/it][A
 40%|████      | 4/10 [00:06<00:05,  1.05it/s][A
 60%|██████    | 6/10 [00:10<00:06,  1.51s/it][A
 80%|████████  | 8/10 [00:10<00:02,  1.03s/it][A
100%|██████████| 10/10 [00:14<00:00,  1.45s/it][A
Epochs:  60%|██████    | 53/88 [1:32:25<1:05:37, 112.50s/it]

Val Loss: 2.9516 - Val Accuracy: 0.9605



Training:   0%|          | 0/76 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/76 [00:05<07:09,  5.73s/it][A
Training:   4%|▍         | 3/76 [00:06<02:01,  1.67s/it][A
Training:   7%|▋         | 5/76 [00:10<02:23,  2.03s/it][A
Training:   8%|▊         | 6/76 [00:11<01:46,  1.52s/it][A
Training:   9%|▉         | 7/76 [00:11<01:20,  1.16s/it][A
Training:  11%|█         | 8/76 [00:11<00:58,  1.15it/s][A
Training:  12%|█▏        | 9/76 [00:16<02:10,  1.95s/it][A
Training:  13%|█▎        | 10/76 [00:16<01:34,  1.43s/it][A
Training:  14%|█▍        | 11/76 [00:16<01:14,  1.15s/it][A
Training:  16%|█▌        | 12/76 [00:16<00:54,  1.17it/s][A
Training:  17%|█▋        | 13/76 [00:22<02:15,  2.15s/it][A
Training:  20%|█▉        | 15/76 [00:23<01:24,  1.38s/it][A
Training:  22%|██▏       | 17/76 [00:27<01:39,  1.69s/it][A
Training:  24%|██▎       | 18/76 [00:27<01:18,  1.36s/it][A
Training:  25%|██▌       | 19/76 [00:28<01:17,  1.36s/it][A
Training:  28%|██▊       | 21/76 [00:32

Epoch: 54/88 - Loss: 2.4491 - Accuracy: 0.9668



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:05<00:45,  5.07s/it][A
 20%|██        | 2/10 [00:05<00:17,  2.16s/it][A
 30%|███       | 3/10 [00:05<00:08,  1.24s/it][A
 50%|█████     | 5/10 [00:09<00:08,  1.76s/it][A
 70%|███████   | 7/10 [00:09<00:02,  1.00it/s][A
100%|██████████| 10/10 [00:14<00:00,  1.42s/it][A
Epochs:  61%|██████▏   | 54/88 [1:34:19<1:04:01, 112.97s/it]

Val Loss: 2.9088 - Val Accuracy: 0.9594



Training:   0%|          | 0/76 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/76 [00:05<07:01,  5.62s/it][A
Training:   3%|▎         | 2/76 [00:05<03:01,  2.46s/it][A
Training:   4%|▍         | 3/76 [00:06<01:42,  1.40s/it][A
Training:   5%|▌         | 4/76 [00:06<01:05,  1.11it/s][A
Training:   7%|▋         | 5/76 [00:11<02:50,  2.40s/it][A
Training:   9%|▉         | 7/76 [00:11<01:26,  1.25s/it][A
Training:  11%|█         | 8/76 [00:11<01:05,  1.04it/s][A
Training:  12%|█▏        | 9/76 [00:16<02:15,  2.03s/it][A
Training:  13%|█▎        | 10/76 [00:16<01:38,  1.49s/it][A
Training:  14%|█▍        | 11/76 [00:17<01:20,  1.24s/it][A
Training:  16%|█▌        | 12/76 [00:17<00:58,  1.09it/s][A
Training:  17%|█▋        | 13/76 [00:21<01:53,  1.80s/it][A
Training:  18%|█▊        | 14/76 [00:21<01:26,  1.39s/it][A
Training:  20%|█▉        | 15/76 [00:22<01:13,  1.20s/it][A
Training:  22%|██▏       | 17/76 [00:25<01:25,  1.45s/it][A
Training:  24%|██▎       | 18/76 [00:26<

Epoch: 55/88 - Loss: 2.4261 - Accuracy: 0.9670



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:05<00:45,  5.07s/it][A
 20%|██        | 2/10 [00:05<00:17,  2.16s/it][A
 30%|███       | 3/10 [00:05<00:08,  1.25s/it][A
 50%|█████     | 5/10 [00:09<00:09,  1.83s/it][A
 80%|████████  | 8/10 [00:10<00:01,  1.17it/s][A
100%|██████████| 10/10 [00:13<00:00,  1.40s/it][A
Epochs:  62%|██████▎   | 55/88 [1:36:11<1:01:58, 112.67s/it]

Val Loss: 2.6557 - Val Accuracy: 0.9605



Training:   0%|          | 0/76 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/76 [00:05<07:17,  5.83s/it][A
Training:   3%|▎         | 2/76 [00:05<03:02,  2.46s/it][A
Training:   5%|▌         | 4/76 [00:06<01:08,  1.05it/s][A
Training:   8%|▊         | 6/76 [00:11<02:02,  1.75s/it][A
Training:  11%|█         | 8/76 [00:11<01:13,  1.08s/it][A
Training:  12%|█▏        | 9/76 [00:16<02:13,  1.99s/it][A
Training:  13%|█▎        | 10/76 [00:16<01:41,  1.55s/it][A
Training:  16%|█▌        | 12/76 [00:16<01:00,  1.06it/s][A
Training:  17%|█▋        | 13/76 [00:21<01:48,  1.72s/it][A
Training:  20%|█▉        | 15/76 [00:21<01:05,  1.07s/it][A
Training:  22%|██▏       | 17/76 [00:25<01:26,  1.46s/it][A
Training:  24%|██▎       | 18/76 [00:25<01:08,  1.19s/it][A
Training:  25%|██▌       | 19/76 [00:25<00:53,  1.06it/s][A
Training:  28%|██▊       | 21/76 [00:30<01:20,  1.47s/it][A
Training:  29%|██▉       | 22/76 [00:30<01:03,  1.17s/it][A
Training:  30%|███       | 23/76 [00:3

Epoch: 56/88 - Loss: 2.4929 - Accuracy: 0.9669



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:05<00:45,  5.03s/it][A
 20%|██        | 2/10 [00:05<00:18,  2.33s/it][A
 40%|████      | 4/10 [00:05<00:05,  1.10it/s][A
 50%|█████     | 5/10 [00:09<00:09,  1.84s/it][A
 60%|██████    | 6/10 [00:10<00:05,  1.45s/it][A
 80%|████████  | 8/10 [00:10<00:01,  1.23it/s][A
100%|██████████| 10/10 [00:13<00:00,  1.38s/it][A
Epochs:  64%|██████▎   | 56/88 [1:37:59<59:23, 111.37s/it]  

Val Loss: 2.7071 - Val Accuracy: 0.9600



Training:   0%|          | 0/76 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/76 [00:05<06:52,  5.50s/it][A
Training:   3%|▎         | 2/76 [00:05<02:57,  2.40s/it][A
Training:   4%|▍         | 3/76 [00:05<01:41,  1.39s/it][A
Training:   7%|▋         | 5/76 [00:10<02:15,  1.91s/it][A
Training:   8%|▊         | 6/76 [00:10<01:37,  1.40s/it][A
Training:   9%|▉         | 7/76 [00:10<01:13,  1.07s/it][A
Training:  12%|█▏        | 9/76 [00:15<01:51,  1.67s/it][A
Training:  14%|█▍        | 11/76 [00:15<01:08,  1.05s/it][A
Training:  17%|█▋        | 13/76 [00:20<01:32,  1.46s/it][A
Training:  21%|██        | 16/76 [00:20<00:50,  1.18it/s][A
Training:  22%|██▏       | 17/76 [00:25<01:30,  1.53s/it][A
Training:  24%|██▎       | 18/76 [00:25<01:12,  1.26s/it][A
Training:  26%|██▋       | 20/76 [00:25<00:46,  1.21it/s][A
Training:  28%|██▊       | 21/76 [00:30<01:27,  1.59s/it][A
Training:  30%|███       | 23/76 [00:30<00:55,  1.04s/it][A
Training:  32%|███▏      | 24/76 [00:30

Epoch: 57/88 - Loss: 2.3687 - Accuracy: 0.9680



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:05<00:47,  5.31s/it][A
 20%|██        | 2/10 [00:05<00:18,  2.30s/it][A
 30%|███       | 3/10 [00:05<00:09,  1.31s/it][A
 50%|█████     | 5/10 [00:09<00:08,  1.74s/it][A
 60%|██████    | 6/10 [00:09<00:05,  1.27s/it][A
 80%|████████  | 8/10 [00:10<00:01,  1.35it/s][A
100%|██████████| 10/10 [00:13<00:00,  1.38s/it][A
Epochs:  65%|██████▍   | 57/88 [1:39:47<56:56, 110.20s/it]

Val Loss: 2.9390 - Val Accuracy: 0.9605



Training:   0%|          | 0/76 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/76 [00:05<07:11,  5.75s/it][A
Training:   3%|▎         | 2/76 [00:05<03:00,  2.44s/it][A
Training:   5%|▌         | 4/76 [00:06<01:08,  1.05it/s][A
Training:   7%|▋         | 5/76 [00:11<02:36,  2.20s/it][A
Training:   8%|▊         | 6/76 [00:11<01:49,  1.56s/it][A
Training:   9%|▉         | 7/76 [00:11<01:19,  1.15s/it][A
Training:  11%|█         | 8/76 [00:11<00:57,  1.18it/s][A
Training:  12%|█▏        | 9/76 [00:15<02:03,  1.84s/it][A
Training:  13%|█▎        | 10/76 [00:15<01:27,  1.33s/it][A
Training:  14%|█▍        | 11/76 [00:16<01:14,  1.15s/it][A
Training:  17%|█▋        | 13/76 [00:20<01:30,  1.44s/it][A
Training:  18%|█▊        | 14/76 [00:20<01:10,  1.14s/it][A
Training:  20%|█▉        | 15/76 [00:20<00:59,  1.03it/s][A
Training:  22%|██▏       | 17/76 [00:24<01:22,  1.40s/it][A
Training:  24%|██▎       | 18/76 [00:25<01:08,  1.18s/it][A
Training:  25%|██▌       | 19/76 [00:25<

Epoch: 58/88 - Loss: 2.3893 - Accuracy: 0.9680



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:05<00:46,  5.13s/it][A
 20%|██        | 2/10 [00:05<00:17,  2.19s/it][A
 30%|███       | 3/10 [00:05<00:08,  1.24s/it][A
 40%|████      | 4/10 [00:05<00:04,  1.26it/s][A
 50%|█████     | 5/10 [00:09<00:09,  1.92s/it][A
 60%|██████    | 6/10 [00:09<00:05,  1.36s/it][A
 80%|████████  | 8/10 [00:09<00:01,  1.34it/s][A
100%|██████████| 10/10 [00:13<00:00,  1.35s/it][A
Epochs:  66%|██████▌   | 58/88 [1:41:33<54:28, 108.96s/it]

Val Loss: 2.7531 - Val Accuracy: 0.9600



Training:   0%|          | 0/76 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/76 [00:05<07:29,  5.99s/it][A
Training:   3%|▎         | 2/76 [00:06<03:08,  2.55s/it][A
Training:   4%|▍         | 3/76 [00:06<01:45,  1.44s/it][A
Training:   5%|▌         | 4/76 [00:06<01:06,  1.08it/s][A
Training:   7%|▋         | 5/76 [00:11<02:47,  2.36s/it][A
Training:   8%|▊         | 6/76 [00:11<01:52,  1.61s/it][A
Training:  12%|█▏        | 9/76 [00:15<01:39,  1.49s/it][A
Training:  14%|█▍        | 11/76 [00:15<01:02,  1.03it/s][A
Training:  17%|█▋        | 13/76 [00:20<01:25,  1.36s/it][A
Training:  20%|█▉        | 15/76 [00:20<00:57,  1.06it/s][A
Training:  22%|██▏       | 17/76 [00:24<01:20,  1.37s/it][A
Training:  24%|██▎       | 18/76 [00:24<01:06,  1.14s/it][A
Training:  25%|██▌       | 19/76 [00:25<00:53,  1.06it/s][A
Training:  26%|██▋       | 20/76 [00:25<00:42,  1.32it/s][A
Training:  28%|██▊       | 21/76 [00:29<01:28,  1.60s/it][A
Training:  30%|███       | 23/76 [00:29

Epoch: 59/88 - Loss: 2.3777 - Accuracy: 0.9680



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:04<00:44,  4.92s/it][A
 20%|██        | 2/10 [00:05<00:16,  2.11s/it][A
 30%|███       | 3/10 [00:05<00:08,  1.21s/it][A
 40%|████      | 4/10 [00:05<00:04,  1.26it/s][A
 50%|█████     | 5/10 [00:09<00:09,  1.94s/it][A
 60%|██████    | 6/10 [00:09<00:05,  1.32s/it][A
 70%|███████   | 7/10 [00:09<00:02,  1.08it/s][A
 80%|████████  | 8/10 [00:09<00:01,  1.48it/s][A
100%|██████████| 10/10 [00:13<00:00,  1.32s/it][A
Epochs:  67%|██████▋   | 59/88 [1:43:14<51:31, 106.60s/it]

Val Loss: 2.6683 - Val Accuracy: 0.9605



Training:   0%|          | 0/76 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/76 [00:05<06:45,  5.40s/it][A
Training:   3%|▎         | 2/76 [00:05<02:52,  2.34s/it][A
Training:   7%|▋         | 5/76 [00:10<02:06,  1.78s/it][A
Training:   8%|▊         | 6/76 [00:10<01:37,  1.39s/it][A
Training:   9%|▉         | 7/76 [00:10<01:13,  1.06s/it][A
Training:  12%|█▏        | 9/76 [00:14<01:39,  1.48s/it][A
Training:  13%|█▎        | 10/76 [00:15<01:19,  1.21s/it][A
Training:  16%|█▌        | 12/76 [00:15<00:47,  1.34it/s][A
Training:  17%|█▋        | 13/76 [00:19<01:35,  1.51s/it][A
Training:  18%|█▊        | 14/76 [00:19<01:16,  1.23s/it][A
Training:  20%|█▉        | 15/76 [00:19<00:57,  1.06it/s][A
Training:  22%|██▏       | 17/76 [00:23<01:20,  1.37s/it][A
Training:  24%|██▎       | 18/76 [00:24<01:09,  1.20s/it][A
Training:  26%|██▋       | 20/76 [00:24<00:42,  1.33it/s][A
Training:  28%|██▊       | 21/76 [00:28<01:17,  1.41s/it][A
Training:  29%|██▉       | 22/76 [00:2

Epoch: 60/88 - Loss: 2.3681 - Accuracy: 0.9682



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:04<00:44,  4.92s/it][A
 30%|███       | 3/10 [00:05<00:09,  1.33s/it][A
 40%|████      | 4/10 [00:05<00:05,  1.10it/s][A
 50%|█████     | 5/10 [00:09<00:10,  2.03s/it][A
 70%|███████   | 7/10 [00:09<00:03,  1.10s/it][A
100%|██████████| 10/10 [00:13<00:00,  1.34s/it][A
Epochs:  68%|██████▊   | 60/88 [1:44:56<49:04, 105.15s/it]

Val Loss: 2.6521 - Val Accuracy: 0.9605



Training:   0%|          | 0/76 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/76 [00:05<06:42,  5.37s/it][A
Training:   3%|▎         | 2/76 [00:05<02:52,  2.33s/it][A
Training:   4%|▍         | 3/76 [00:05<01:37,  1.33s/it][A
Training:   7%|▋         | 5/76 [00:10<02:07,  1.80s/it][A
Training:   8%|▊         | 6/76 [00:10<01:35,  1.37s/it][A
Training:  11%|█         | 8/76 [00:10<00:54,  1.26it/s][A
Training:  12%|█▏        | 9/76 [00:14<01:42,  1.53s/it][A
Training:  13%|█▎        | 10/76 [00:14<01:21,  1.23s/it][A
Training:  14%|█▍        | 11/76 [00:14<01:01,  1.07it/s][A
Training:  16%|█▌        | 12/76 [00:15<00:46,  1.37it/s][A
Training:  17%|█▋        | 13/76 [00:18<01:42,  1.63s/it][A
Training:  18%|█▊        | 14/76 [00:19<01:18,  1.26s/it][A
Training:  21%|██        | 16/76 [00:19<00:48,  1.23it/s][A
Training:  22%|██▏       | 17/76 [00:23<01:30,  1.53s/it][A
Training:  24%|██▎       | 18/76 [00:23<01:08,  1.18s/it][A
Training:  26%|██▋       | 20/76 [00:24

Epoch: 61/88 - Loss: 2.3874 - Accuracy: 0.9680



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:04<00:44,  4.96s/it][A
 20%|██        | 2/10 [00:05<00:16,  2.11s/it][A
 30%|███       | 3/10 [00:05<00:08,  1.24s/it][A
 40%|████      | 4/10 [00:05<00:04,  1.24it/s][A
 50%|█████     | 5/10 [00:09<00:09,  1.98s/it][A
 70%|███████   | 7/10 [00:09<00:03,  1.02s/it][A
 80%|████████  | 8/10 [00:09<00:01,  1.28it/s][A
100%|██████████| 10/10 [00:13<00:00,  1.35s/it][A
Epochs:  69%|██████▉   | 61/88 [1:46:37<46:49, 104.06s/it]

Val Loss: 2.6944 - Val Accuracy: 0.9610



Training:   0%|          | 0/76 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/76 [00:05<06:53,  5.51s/it][A
Training:   3%|▎         | 2/76 [00:05<02:53,  2.35s/it][A
Training:   4%|▍         | 3/76 [00:05<01:36,  1.32s/it][A
Training:   5%|▌         | 4/76 [00:05<01:02,  1.16it/s][A
Training:   7%|▋         | 5/76 [00:10<02:29,  2.10s/it][A
Training:   9%|▉         | 7/76 [00:10<01:13,  1.06s/it][A
Training:  12%|█▏        | 9/76 [00:14<01:46,  1.58s/it][A
Training:  13%|█▎        | 10/76 [00:15<01:23,  1.26s/it][A
Training:  14%|█▍        | 11/76 [00:15<01:03,  1.03it/s][A
Training:  17%|█▋        | 13/76 [00:19<01:36,  1.53s/it][A
Training:  18%|█▊        | 14/76 [00:20<01:15,  1.22s/it][A
Training:  20%|█▉        | 15/76 [00:20<00:58,  1.05it/s][A
Training:  22%|██▏       | 17/76 [00:24<01:24,  1.43s/it][A
Training:  24%|██▎       | 18/76 [00:24<01:05,  1.13s/it][A
Training:  25%|██▌       | 19/76 [00:24<00:51,  1.11it/s][A
Training:  28%|██▊       | 21/76 [00:29

Epoch: 62/88 - Loss: 2.3917 - Accuracy: 0.9690



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:05<00:46,  5.17s/it][A
 20%|██        | 2/10 [00:05<00:18,  2.30s/it][A
 30%|███       | 3/10 [00:05<00:09,  1.34s/it][A
 50%|█████     | 5/10 [00:09<00:08,  1.69s/it][A
 80%|████████  | 8/10 [00:09<00:01,  1.21it/s][A
100%|██████████| 10/10 [00:13<00:00,  1.36s/it][A
Epochs:  70%|███████   | 62/88 [1:48:24<45:25, 104.82s/it]

Val Loss: 2.7537 - Val Accuracy: 0.9605



Training:   0%|          | 0/76 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/76 [00:05<06:36,  5.29s/it][A
Training:   3%|▎         | 2/76 [00:05<02:47,  2.26s/it][A
Training:   5%|▌         | 4/76 [00:05<01:03,  1.13it/s][A
Training:   7%|▋         | 5/76 [00:09<02:14,  1.90s/it][A
Training:   9%|▉         | 7/76 [00:09<01:11,  1.03s/it][A
Training:  12%|█▏        | 9/76 [00:14<01:43,  1.55s/it][A
Training:  13%|█▎        | 10/76 [00:14<01:21,  1.23s/it][A
Training:  14%|█▍        | 11/76 [00:14<01:03,  1.03it/s][A
Training:  17%|█▋        | 13/76 [00:19<01:32,  1.46s/it][A
Training:  18%|█▊        | 14/76 [00:19<01:11,  1.16s/it][A
Training:  20%|█▉        | 15/76 [00:19<00:55,  1.09it/s][A
Training:  21%|██        | 16/76 [00:19<00:42,  1.41it/s][A
Training:  22%|██▏       | 17/76 [00:23<01:40,  1.70s/it][A
Training:  24%|██▎       | 18/76 [00:24<01:13,  1.27s/it][A
Training:  25%|██▌       | 19/76 [00:24<00:53,  1.06it/s][A
Training:  26%|██▋       | 20/76 [00:2

Epoch: 63/88 - Loss: 2.2975 - Accuracy: 0.9689



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:04<00:42,  4.76s/it][A
 20%|██        | 2/10 [00:04<00:16,  2.02s/it][A
 30%|███       | 3/10 [00:05<00:08,  1.19s/it][A
 50%|█████     | 5/10 [00:09<00:08,  1.70s/it][A
 60%|██████    | 6/10 [00:09<00:04,  1.25s/it][A
 70%|███████   | 7/10 [00:09<00:02,  1.08it/s][A
100%|██████████| 10/10 [00:13<00:00,  1.35s/it][A
Epochs:  72%|███████▏  | 63/88 [1:50:06<43:16, 103.87s/it]

Val Loss: 2.6984 - Val Accuracy: 0.9616



Training:   0%|          | 0/76 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/76 [00:05<06:24,  5.13s/it][A
Training:   3%|▎         | 2/76 [00:05<02:41,  2.18s/it][A
Training:   4%|▍         | 3/76 [00:05<01:32,  1.26s/it][A
Training:   7%|▋         | 5/76 [00:10<02:14,  1.90s/it][A
Training:   9%|▉         | 7/76 [00:10<01:13,  1.07s/it][A
Training:  12%|█▏        | 9/76 [00:15<01:45,  1.57s/it][A
Training:  13%|█▎        | 10/76 [00:15<01:23,  1.27s/it][A
Training:  14%|█▍        | 11/76 [00:15<01:04,  1.01it/s][A
Training:  17%|█▋        | 13/76 [00:19<01:33,  1.49s/it][A
Training:  18%|█▊        | 14/76 [00:19<01:13,  1.18s/it][A
Training:  21%|██        | 16/76 [00:20<00:45,  1.33it/s][A
Training:  22%|██▏       | 17/76 [00:24<01:33,  1.59s/it][A
Training:  24%|██▎       | 18/76 [00:24<01:12,  1.24s/it][A
Training:  25%|██▌       | 19/76 [00:24<00:55,  1.03it/s][A
Training:  28%|██▊       | 21/76 [00:29<01:22,  1.50s/it][A
Training:  30%|███       | 23/76 [00:2

Epoch: 64/88 - Loss: 2.3147 - Accuracy: 0.9679



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:05<00:45,  5.01s/it][A
 30%|███       | 3/10 [00:05<00:09,  1.34s/it][A
 50%|█████     | 5/10 [00:09<00:08,  1.72s/it][A
 60%|██████    | 6/10 [00:09<00:05,  1.32s/it][A
 70%|███████   | 7/10 [00:09<00:02,  1.02it/s][A
100%|██████████| 10/10 [00:13<00:00,  1.34s/it][A
Epochs:  73%|███████▎  | 64/88 [1:51:49<41:30, 103.77s/it]

Val Loss: 2.6365 - Val Accuracy: 0.9610



Training:   0%|          | 0/76 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/76 [00:05<06:34,  5.26s/it][A
Training:   3%|▎         | 2/76 [00:05<02:46,  2.25s/it][A
Training:   4%|▍         | 3/76 [00:05<01:35,  1.30s/it][A
Training:   5%|▌         | 4/76 [00:05<01:01,  1.18it/s][A
Training:   7%|▋         | 5/76 [00:10<02:32,  2.14s/it][A
Training:   8%|▊         | 6/76 [00:10<01:42,  1.46s/it][A
Training:   9%|▉         | 7/76 [00:10<01:10,  1.02s/it][A
Training:  11%|█         | 8/76 [00:10<00:50,  1.34it/s][A
Training:  12%|█▏        | 9/76 [00:14<02:06,  1.88s/it][A
Training:  14%|█▍        | 11/76 [00:15<01:08,  1.05s/it][A
Training:  17%|█▋        | 13/76 [00:19<01:36,  1.54s/it][A
Training:  18%|█▊        | 14/76 [00:19<01:15,  1.22s/it][A
Training:  20%|█▉        | 15/76 [00:20<00:59,  1.02it/s][A
Training:  21%|██        | 16/76 [00:20<00:45,  1.32it/s][A
Training:  22%|██▏       | 17/76 [00:24<01:38,  1.67s/it][A
Training:  24%|██▎       | 18/76 [00:24<0

Epoch: 65/88 - Loss: 2.3245 - Accuracy: 0.9684



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:04<00:44,  4.93s/it][A
 20%|██        | 2/10 [00:05<00:16,  2.10s/it][A
 40%|████      | 4/10 [00:05<00:04,  1.22it/s][A
 60%|██████    | 6/10 [00:09<00:05,  1.47s/it][A
100%|██████████| 10/10 [00:12<00:00,  1.29s/it][A
Epochs:  74%|███████▍  | 65/88 [1:53:32<39:39, 103.44s/it]

Val Loss: 2.4873 - Val Accuracy: 0.9616



Training:   0%|          | 0/76 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/76 [00:05<06:51,  5.49s/it][A
Training:   3%|▎         | 2/76 [00:05<02:55,  2.37s/it][A
Training:   4%|▍         | 3/76 [00:05<01:37,  1.34s/it][A
Training:   5%|▌         | 4/76 [00:05<01:01,  1.17it/s][A
Training:   7%|▋         | 5/76 [00:10<02:28,  2.08s/it][A
Training:   9%|▉         | 7/76 [00:10<01:13,  1.07s/it][A
Training:  11%|█         | 8/76 [00:10<00:57,  1.17it/s][A
Training:  12%|█▏        | 9/76 [00:14<01:57,  1.76s/it][A
Training:  13%|█▎        | 10/76 [00:14<01:25,  1.29s/it][A
Training:  14%|█▍        | 11/76 [00:15<01:04,  1.01it/s][A
Training:  16%|█▌        | 12/76 [00:15<00:49,  1.28it/s][A
Training:  17%|█▋        | 13/76 [00:19<01:50,  1.76s/it][A
Training:  18%|█▊        | 14/76 [00:19<01:19,  1.29s/it][A
Training:  20%|█▉        | 15/76 [00:20<01:01,  1.01s/it][A
Training:  21%|██        | 16/76 [00:20<00:44,  1.34it/s][A
Training:  22%|██▏       | 17/76 [00:24<

Epoch: 66/88 - Loss: 2.2954 - Accuracy: 0.9688



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:05<00:45,  5.08s/it][A
 30%|███       | 3/10 [00:05<00:09,  1.39s/it][A
 50%|█████     | 5/10 [00:09<00:08,  1.75s/it][A
 80%|████████  | 8/10 [00:09<00:01,  1.17it/s][A
100%|██████████| 10/10 [00:13<00:00,  1.31s/it][A
Epochs:  75%|███████▌  | 66/88 [1:55:14<37:49, 103.16s/it]

Val Loss: 2.7014 - Val Accuracy: 0.9610



Training:   0%|          | 0/76 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/76 [00:05<07:03,  5.64s/it][A
Training:   4%|▍         | 3/76 [00:05<01:50,  1.52s/it][A
Training:   7%|▋         | 5/76 [00:10<02:18,  1.95s/it][A
Training:   8%|▊         | 6/76 [00:10<01:42,  1.46s/it][A
Training:  11%|█         | 8/76 [00:10<00:57,  1.17it/s][A
Training:  12%|█▏        | 9/76 [00:15<01:56,  1.74s/it][A
Training:  13%|█▎        | 10/76 [00:15<01:27,  1.33s/it][A
Training:  14%|█▍        | 11/76 [00:15<01:06,  1.02s/it][A
Training:  16%|█▌        | 12/76 [00:15<00:50,  1.27it/s][A
Training:  17%|█▋        | 13/76 [00:20<01:52,  1.78s/it][A
Training:  18%|█▊        | 14/76 [00:20<01:20,  1.30s/it][A
Training:  20%|█▉        | 15/76 [00:20<00:58,  1.05it/s][A
Training:  22%|██▏       | 17/76 [00:24<01:29,  1.52s/it][A
Training:  24%|██▎       | 18/76 [00:24<01:08,  1.17s/it][A
Training:  26%|██▋       | 20/76 [00:24<00:40,  1.39it/s][A
Training:  28%|██▊       | 21/76 [00:2

Epoch: 67/88 - Loss: 2.3027 - Accuracy: 0.9682



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:04<00:43,  4.88s/it][A
 20%|██        | 2/10 [00:05<00:17,  2.18s/it][A
 30%|███       | 3/10 [00:05<00:08,  1.24s/it][A
 40%|████      | 4/10 [00:05<00:04,  1.21it/s][A
 50%|█████     | 5/10 [00:08<00:08,  1.71s/it][A
 60%|██████    | 6/10 [00:09<00:04,  1.25s/it][A
 80%|████████  | 8/10 [00:09<00:01,  1.51it/s][A
100%|██████████| 10/10 [00:12<00:00,  1.27s/it][A
Epochs:  76%|███████▌  | 67/88 [1:56:59<36:13, 103.48s/it]

Val Loss: 2.7191 - Val Accuracy: 0.9610



Training:   0%|          | 0/76 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/76 [00:05<07:06,  5.69s/it][A
Training:   4%|▍         | 3/76 [00:05<01:54,  1.56s/it][A
Training:   5%|▌         | 4/76 [00:06<01:16,  1.07s/it][A
Training:   7%|▋         | 5/76 [00:10<02:42,  2.29s/it][A
Training:   8%|▊         | 6/76 [00:10<01:52,  1.61s/it][A
Training:   9%|▉         | 7/76 [00:11<01:18,  1.13s/it][A
Training:  12%|█▏        | 9/76 [00:15<01:56,  1.73s/it][A
Training:  13%|█▎        | 10/76 [00:16<01:28,  1.34s/it][A
Training:  14%|█▍        | 11/76 [00:16<01:06,  1.02s/it][A
Training:  17%|█▋        | 13/76 [00:20<01:41,  1.61s/it][A
Training:  20%|█▉        | 15/76 [00:21<01:02,  1.03s/it][A
Training:  22%|██▏       | 17/76 [00:25<01:24,  1.43s/it][A
Training:  25%|██▌       | 19/76 [00:25<00:55,  1.03it/s][A
Training:  26%|██▋       | 20/76 [00:25<00:44,  1.25it/s][A
Training:  28%|██▊       | 21/76 [00:30<01:29,  1.62s/it][A
Training:  29%|██▉       | 22/76 [00:30

Epoch: 68/88 - Loss: 2.2203 - Accuracy: 0.9692



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:04<00:41,  4.62s/it][A
 20%|██        | 2/10 [00:04<00:16,  2.06s/it][A
 40%|████      | 4/10 [00:05<00:05,  1.20it/s][A
 50%|█████     | 5/10 [00:08<00:08,  1.69s/it][A
 60%|██████    | 6/10 [00:09<00:05,  1.33s/it][A
100%|██████████| 10/10 [00:12<00:00,  1.27s/it][A
Epochs:  77%|███████▋  | 68/88 [1:58:42<34:28, 103.41s/it]

Val Loss: 2.6131 - Val Accuracy: 0.9616



Training:   0%|          | 0/76 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/76 [00:05<06:18,  5.05s/it][A
Training:   3%|▎         | 2/76 [00:05<02:45,  2.23s/it][A
Training:   4%|▍         | 3/76 [00:05<01:32,  1.27s/it][A
Training:   5%|▌         | 4/76 [00:05<00:59,  1.22it/s][A
Training:   7%|▋         | 5/76 [00:10<02:32,  2.15s/it][A
Training:   8%|▊         | 6/76 [00:10<01:49,  1.57s/it][A
Training:   9%|▉         | 7/76 [00:10<01:16,  1.11s/it][A
Training:  11%|█         | 8/76 [00:10<00:53,  1.27it/s][A
Training:  12%|█▏        | 9/76 [00:14<02:03,  1.85s/it][A
Training:  13%|█▎        | 10/76 [00:15<01:31,  1.39s/it][A
Training:  16%|█▌        | 12/76 [00:15<00:49,  1.29it/s][A
Training:  17%|█▋        | 13/76 [00:19<01:44,  1.66s/it][A
Training:  18%|█▊        | 14/76 [00:20<01:22,  1.34s/it][A
Training:  20%|█▉        | 15/76 [00:20<01:01,  1.00s/it][A
Training:  22%|██▏       | 17/76 [00:24<01:27,  1.48s/it][A
Training:  24%|██▎       | 18/76 [00:24<0

Epoch: 69/88 - Loss: 2.2266 - Accuracy: 0.9698



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:04<00:40,  4.46s/it][A
 30%|███       | 3/10 [00:04<00:08,  1.20s/it][A
 40%|████      | 4/10 [00:04<00:05,  1.18it/s][A
 50%|█████     | 5/10 [00:08<00:09,  1.95s/it][A
 80%|████████  | 8/10 [00:09<00:01,  1.20it/s][A
100%|██████████| 10/10 [00:12<00:00,  1.27s/it][A
Epochs:  78%|███████▊  | 69/88 [2:00:24<32:39, 103.12s/it]

Val Loss: 2.5271 - Val Accuracy: 0.9610



Training:   0%|          | 0/76 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/76 [00:05<06:57,  5.57s/it][A
Training:   3%|▎         | 2/76 [00:05<02:57,  2.40s/it][A
Training:   4%|▍         | 3/76 [00:05<01:38,  1.35s/it][A
Training:   7%|▋         | 5/76 [00:10<02:12,  1.86s/it][A
Training:   9%|▉         | 7/76 [00:10<01:14,  1.08s/it][A
Training:  12%|█▏        | 9/76 [00:15<01:45,  1.58s/it][A
Training:  13%|█▎        | 10/76 [00:15<01:24,  1.28s/it][A
Training:  14%|█▍        | 11/76 [00:15<01:05,  1.00s/it][A
Training:  17%|█▋        | 13/76 [00:20<01:36,  1.53s/it][A
Training:  18%|█▊        | 14/76 [00:20<01:15,  1.21s/it][A
Training:  20%|█▉        | 15/76 [00:20<00:57,  1.06it/s][A
Training:  22%|██▏       | 17/76 [00:24<01:23,  1.42s/it][A
Training:  25%|██▌       | 19/76 [00:24<00:52,  1.08it/s][A
Training:  28%|██▊       | 21/76 [00:29<01:15,  1.37s/it][A
Training:  30%|███       | 23/76 [00:29<00:50,  1.04it/s][A
Training:  32%|███▏      | 24/76 [00:2

Epoch: 70/88 - Loss: 2.1997 - Accuracy: 0.9701



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:05<00:45,  5.10s/it][A
 20%|██        | 2/10 [00:05<00:17,  2.17s/it][A
 30%|███       | 3/10 [00:05<00:08,  1.26s/it][A
 40%|████      | 4/10 [00:05<00:04,  1.20it/s][A
 50%|█████     | 5/10 [00:09<00:09,  1.90s/it][A
 70%|███████   | 7/10 [00:09<00:03,  1.03s/it][A
100%|██████████| 10/10 [00:13<00:00,  1.32s/it][A
Epochs:  80%|███████▉  | 70/88 [2:02:07<30:52, 102.91s/it]

Val Loss: 2.6328 - Val Accuracy: 0.9610



Training:   0%|          | 0/76 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/76 [00:05<07:04,  5.67s/it][A
Training:   3%|▎         | 2/76 [00:05<02:58,  2.42s/it][A
Training:   5%|▌         | 4/76 [00:05<01:08,  1.06it/s][A
Training:   7%|▋         | 5/76 [00:10<02:24,  2.03s/it][A
Training:   8%|▊         | 6/76 [00:10<01:45,  1.51s/it][A
Training:  11%|█         | 8/76 [00:10<00:56,  1.20it/s][A
Training:  12%|█▏        | 9/76 [00:14<01:49,  1.64s/it][A
Training:  13%|█▎        | 10/76 [00:15<01:27,  1.33s/it][A
Training:  14%|█▍        | 11/76 [00:15<01:05,  1.01s/it][A
Training:  16%|█▌        | 12/76 [00:15<00:49,  1.30it/s][A
Training:  17%|█▋        | 13/76 [00:19<01:44,  1.65s/it][A
Training:  18%|█▊        | 14/76 [00:20<01:22,  1.33s/it][A
Training:  20%|█▉        | 15/76 [00:20<01:02,  1.03s/it][A
Training:  22%|██▏       | 17/76 [00:24<01:24,  1.43s/it][A
Training:  24%|██▎       | 18/76 [00:24<01:05,  1.13s/it][A
Training:  25%|██▌       | 19/76 [00:24

Epoch: 71/88 - Loss: 2.2500 - Accuracy: 0.9695



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:05<00:51,  5.78s/it][A
 20%|██        | 2/10 [00:05<00:19,  2.49s/it][A
 30%|███       | 3/10 [00:06<00:09,  1.40s/it][A
 50%|█████     | 5/10 [00:10<00:08,  1.76s/it][A
 70%|███████   | 7/10 [00:10<00:03,  1.02s/it][A
 80%|████████  | 8/10 [00:10<00:01,  1.24it/s][A
100%|██████████| 10/10 [00:14<00:00,  1.48s/it][A
Epochs:  81%|████████  | 71/88 [2:03:58<29:50, 105.35s/it]

Val Loss: 2.7234 - Val Accuracy: 0.9608



Training:   0%|          | 0/76 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/76 [00:05<07:17,  5.83s/it][A
Training:   3%|▎         | 2/76 [00:06<03:12,  2.60s/it][A
Training:   4%|▍         | 3/76 [00:06<01:51,  1.53s/it][A
Training:   5%|▌         | 4/76 [00:06<01:10,  1.02it/s][A
Training:   7%|▋         | 5/76 [00:10<02:27,  2.07s/it][A
Training:   8%|▊         | 6/76 [00:10<01:43,  1.48s/it][A
Training:   9%|▉         | 7/76 [00:11<01:11,  1.03s/it][A
Training:  11%|█         | 8/76 [00:11<00:50,  1.34it/s][A
Training:  12%|█▏        | 9/76 [00:15<02:05,  1.88s/it][A
Training:  13%|█▎        | 10/76 [00:16<01:38,  1.49s/it][A
Training:  14%|█▍        | 11/76 [00:16<01:09,  1.06s/it][A
Training:  17%|█▋        | 13/76 [00:20<01:36,  1.53s/it][A
Training:  18%|█▊        | 14/76 [00:20<01:19,  1.29s/it][A
Training:  21%|██        | 16/76 [00:21<00:46,  1.29it/s][A
Training:  22%|██▏       | 17/76 [00:24<01:27,  1.49s/it][A
Training:  24%|██▎       | 18/76 [00:25<0

Epoch: 72/88 - Loss: 2.1964 - Accuracy: 0.9698



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:04<00:41,  4.64s/it][A
 20%|██        | 2/10 [00:04<00:16,  2.10s/it][A
 40%|████      | 4/10 [00:05<00:05,  1.18it/s][A
 50%|█████     | 5/10 [00:09<00:09,  1.86s/it][A
 60%|██████    | 6/10 [00:09<00:05,  1.32s/it][A
100%|██████████| 10/10 [00:13<00:00,  1.34s/it][A
Epochs:  82%|████████▏ | 72/88 [2:05:44<28:09, 105.62s/it]

Val Loss: 2.6391 - Val Accuracy: 0.9610



Training:   0%|          | 0/76 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/76 [00:05<07:26,  5.96s/it][A
Training:   3%|▎         | 2/76 [00:06<03:05,  2.51s/it][A
Training:   5%|▌         | 4/76 [00:06<01:09,  1.03it/s][A
Training:   8%|▊         | 6/76 [00:10<01:51,  1.60s/it][A
Training:   9%|▉         | 7/76 [00:10<01:25,  1.24s/it][A
Training:  12%|█▏        | 9/76 [00:15<01:52,  1.67s/it][A
Training:  14%|█▍        | 11/76 [00:15<01:09,  1.07s/it][A
Training:  16%|█▌        | 12/76 [00:15<00:56,  1.14it/s][A
Training:  17%|█▋        | 13/76 [00:20<01:49,  1.74s/it][A
Training:  18%|█▊        | 14/76 [00:20<01:23,  1.35s/it][A
Training:  20%|█▉        | 15/76 [00:20<01:03,  1.04s/it][A
Training:  22%|██▏       | 17/76 [00:25<01:34,  1.61s/it][A
Training:  25%|██▌       | 19/76 [00:25<00:58,  1.02s/it][A
Training:  28%|██▊       | 21/76 [00:30<01:26,  1.56s/it][A
Training:  29%|██▉       | 22/76 [00:30<01:08,  1.28s/it][A
Training:  30%|███       | 23/76 [00:3

Epoch: 73/88 - Loss: 2.2301 - Accuracy: 0.9704



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:04<00:43,  4.82s/it][A
 20%|██        | 2/10 [00:05<00:17,  2.19s/it][A
 30%|███       | 3/10 [00:05<00:09,  1.30s/it][A
 40%|████      | 4/10 [00:05<00:05,  1.17it/s][A
 50%|█████     | 5/10 [00:09<00:09,  1.97s/it][A
 60%|██████    | 6/10 [00:09<00:05,  1.36s/it][A
 70%|███████   | 7/10 [00:09<00:02,  1.04it/s][A
100%|██████████| 10/10 [00:13<00:00,  1.38s/it][A
Epochs:  83%|████████▎ | 73/88 [2:07:31<26:31, 106.10s/it]

Val Loss: 2.7591 - Val Accuracy: 0.9610



Training:   0%|          | 0/76 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/76 [00:05<07:03,  5.65s/it][A
Training:   3%|▎         | 2/76 [00:05<02:57,  2.40s/it][A
Training:   5%|▌         | 4/76 [00:05<01:07,  1.07it/s][A
Training:   7%|▋         | 5/76 [00:10<02:31,  2.14s/it][A
Training:   8%|▊         | 6/76 [00:10<01:46,  1.52s/it][A
Training:   9%|▉         | 7/76 [00:11<01:17,  1.13s/it][A
Training:  12%|█▏        | 9/76 [00:15<01:47,  1.60s/it][A
Training:  13%|█▎        | 10/76 [00:15<01:21,  1.23s/it][A
Training:  14%|█▍        | 11/76 [00:15<01:07,  1.04s/it][A
Training:  16%|█▌        | 12/76 [00:16<00:51,  1.24it/s][A
Training:  17%|█▋        | 13/76 [00:20<01:49,  1.73s/it][A
Training:  18%|█▊        | 14/76 [00:20<01:19,  1.28s/it][A
Training:  20%|█▉        | 15/76 [00:20<01:02,  1.03s/it][A
Training:  22%|██▏       | 17/76 [00:25<01:32,  1.57s/it][A
Training:  25%|██▌       | 19/76 [00:26<01:02,  1.10s/it][A
Training:  26%|██▋       | 20/76 [00:26

Epoch: 74/88 - Loss: 2.1786 - Accuracy: 0.9706



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:05<00:48,  5.35s/it][A
 20%|██        | 2/10 [00:05<00:18,  2.28s/it][A
 30%|███       | 3/10 [00:05<00:09,  1.30s/it][A
 40%|████      | 4/10 [00:05<00:04,  1.20it/s][A
 50%|█████     | 5/10 [00:09<00:10,  2.06s/it][A
 80%|████████  | 8/10 [00:10<00:01,  1.19it/s][A
100%|██████████| 10/10 [00:13<00:00,  1.39s/it][A
Epochs:  84%|████████▍ | 74/88 [2:09:18<24:47, 106.28s/it]

Val Loss: 2.7947 - Val Accuracy: 0.9610



Training:   0%|          | 0/76 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/76 [00:05<07:24,  5.92s/it][A
Training:   4%|▍         | 3/76 [00:06<01:55,  1.59s/it][A
Training:   7%|▋         | 5/76 [00:10<02:16,  1.92s/it][A
Training:   9%|▉         | 7/76 [00:10<01:18,  1.14s/it][A
Training:  11%|█         | 8/76 [00:11<01:04,  1.05it/s][A
Training:  12%|█▏        | 9/76 [00:15<02:02,  1.82s/it][A
Training:  13%|█▎        | 10/76 [00:15<01:30,  1.37s/it][A
Training:  14%|█▍        | 11/76 [00:15<01:08,  1.06s/it][A
Training:  16%|█▌        | 12/76 [00:15<00:51,  1.24it/s][A
Training:  17%|█▋        | 13/76 [00:20<01:55,  1.83s/it][A
Training:  18%|█▊        | 14/76 [00:20<01:23,  1.34s/it][A
Training:  21%|██        | 16/76 [00:20<00:46,  1.29it/s][A
Training:  22%|██▏       | 17/76 [00:25<01:39,  1.69s/it][A
Training:  25%|██▌       | 19/76 [00:25<00:57,  1.02s/it][A
Training:  26%|██▋       | 20/76 [00:25<00:46,  1.21it/s][A
Training:  28%|██▊       | 21/76 [00:2

Epoch: 75/88 - Loss: 2.1325 - Accuracy: 0.9701



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:05<00:51,  5.72s/it][A
 20%|██        | 2/10 [00:05<00:19,  2.43s/it][A
 30%|███       | 3/10 [00:05<00:09,  1.38s/it][A
 50%|█████     | 5/10 [00:09<00:08,  1.67s/it][A
 80%|████████  | 8/10 [00:09<00:01,  1.28it/s][A
100%|██████████| 10/10 [00:13<00:00,  1.37s/it][A
Epochs:  85%|████████▌ | 75/88 [2:11:02<22:51, 105.53s/it]

Val Loss: 2.6962 - Val Accuracy: 0.9624



Training:   0%|          | 0/76 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/76 [00:05<06:41,  5.36s/it][A
Training:   3%|▎         | 2/76 [00:05<02:57,  2.40s/it][A
Training:   4%|▍         | 3/76 [00:05<01:40,  1.38s/it][A
Training:   5%|▌         | 4/76 [00:05<01:03,  1.13it/s][A
Training:   7%|▋         | 5/76 [00:10<02:23,  2.03s/it][A
Training:   8%|▊         | 6/76 [00:10<01:45,  1.51s/it][A
Training:  11%|█         | 8/76 [00:10<00:54,  1.25it/s][A
Training:  12%|█▏        | 9/76 [00:14<01:51,  1.67s/it][A
Training:  13%|█▎        | 10/76 [00:15<01:34,  1.42s/it][A
Training:  16%|█▌        | 12/76 [00:15<00:53,  1.19it/s][A
Training:  17%|█▋        | 13/76 [00:19<01:38,  1.56s/it][A
Training:  18%|█▊        | 14/76 [00:20<01:23,  1.35s/it][A
Training:  20%|█▉        | 15/76 [00:20<01:05,  1.07s/it][A
Training:  22%|██▏       | 17/76 [00:24<01:24,  1.44s/it][A
Training:  24%|██▎       | 18/76 [00:25<01:14,  1.28s/it][A
Training:  25%|██▌       | 19/76 [00:25<

Epoch: 76/88 - Loss: 2.2493 - Accuracy: 0.9700



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:05<00:44,  5.00s/it][A
 20%|██        | 2/10 [00:05<00:17,  2.14s/it][A
 30%|███       | 3/10 [00:05<00:08,  1.22s/it][A
 40%|████      | 4/10 [00:05<00:04,  1.22it/s][A
 50%|█████     | 5/10 [00:09<00:10,  2.01s/it][A
 60%|██████    | 6/10 [00:09<00:05,  1.40s/it][A
 70%|███████   | 7/10 [00:09<00:02,  1.01it/s][A
 80%|████████  | 8/10 [00:10<00:01,  1.40it/s][A
100%|██████████| 10/10 [00:13<00:00,  1.39s/it][A
Epochs:  86%|████████▋ | 76/88 [2:12:46<21:02, 105.20s/it]

Val Loss: 2.5438 - Val Accuracy: 0.9624



Training:   0%|          | 0/76 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/76 [00:05<07:11,  5.75s/it][A
Training:   3%|▎         | 2/76 [00:05<03:03,  2.48s/it][A
Training:   4%|▍         | 3/76 [00:06<01:42,  1.40s/it][A
Training:   7%|▋         | 5/76 [00:11<02:25,  2.04s/it][A
Training:   9%|▉         | 7/76 [00:11<01:20,  1.16s/it][A
Training:  11%|█         | 8/76 [00:11<01:05,  1.04it/s][A
Training:  12%|█▏        | 9/76 [00:16<02:09,  1.94s/it][A
Training:  14%|█▍        | 11/76 [00:16<01:14,  1.14s/it][A
Training:  17%|█▋        | 13/76 [00:21<01:43,  1.65s/it][A
Training:  18%|█▊        | 14/76 [00:21<01:26,  1.40s/it][A
Training:  21%|██        | 16/76 [00:22<00:54,  1.09it/s][A
Training:  22%|██▏       | 17/76 [00:26<01:36,  1.64s/it][A
Training:  24%|██▎       | 18/76 [00:26<01:19,  1.37s/it][A
Training:  25%|██▌       | 19/76 [00:27<01:01,  1.08s/it][A
Training:  26%|██▋       | 20/76 [00:27<00:47,  1.18it/s][A
Training:  28%|██▊       | 21/76 [00:31

Epoch: 77/88 - Loss: 2.1914 - Accuracy: 0.9705



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:04<00:44,  4.90s/it][A
 20%|██        | 2/10 [00:05<00:16,  2.09s/it][A
 40%|████      | 4/10 [00:05<00:04,  1.22it/s][A
 60%|██████    | 6/10 [00:09<00:05,  1.41s/it][A
100%|██████████| 10/10 [00:13<00:00,  1.31s/it][A
Epochs:  88%|████████▊ | 77/88 [2:14:31<19:17, 105.20s/it]

Val Loss: 2.7025 - Val Accuracy: 0.9624



Training:   0%|          | 0/76 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/76 [00:05<06:51,  5.49s/it][A
Training:   3%|▎         | 2/76 [00:05<02:52,  2.33s/it][A
Training:   4%|▍         | 3/76 [00:05<01:38,  1.35s/it][A
Training:   5%|▌         | 4/76 [00:06<01:05,  1.10it/s][A
Training:   7%|▋         | 5/76 [00:10<02:36,  2.20s/it][A
Training:   9%|▉         | 7/76 [00:10<01:17,  1.12s/it][A
Training:  12%|█▏        | 9/76 [00:15<01:49,  1.63s/it][A
Training:  13%|█▎        | 10/76 [00:15<01:25,  1.29s/it][A
Training:  14%|█▍        | 11/76 [00:15<01:07,  1.03s/it][A
Training:  16%|█▌        | 12/76 [00:15<00:52,  1.22it/s][A
Training:  17%|█▋        | 13/76 [00:20<01:47,  1.70s/it][A
Training:  20%|█▉        | 15/76 [00:20<01:00,  1.01it/s][A
Training:  21%|██        | 16/76 [00:20<00:48,  1.24it/s][A
Training:  22%|██▏       | 17/76 [00:24<01:40,  1.71s/it][A
Training:  25%|██▌       | 19/76 [00:24<00:58,  1.02s/it][A
Training:  26%|██▋       | 20/76 [00:25

Epoch: 78/88 - Loss: 2.1566 - Accuracy: 0.9698



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:04<00:43,  4.87s/it][A
 20%|██        | 2/10 [00:05<00:16,  2.09s/it][A
 40%|████      | 4/10 [00:05<00:04,  1.21it/s][A
 50%|█████     | 5/10 [00:09<00:08,  1.80s/it][A
 70%|███████   | 7/10 [00:09<00:02,  1.02it/s][A
100%|██████████| 10/10 [00:13<00:00,  1.31s/it][A
Epochs:  89%|████████▊ | 78/88 [2:16:14<17:25, 104.51s/it]

Val Loss: 2.4574 - Val Accuracy: 0.9619



Training:   0%|          | 0/76 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/76 [00:05<07:08,  5.72s/it][A
Training:   3%|▎         | 2/76 [00:05<02:59,  2.43s/it][A
Training:   5%|▌         | 4/76 [00:06<01:10,  1.02it/s][A
Training:   7%|▋         | 5/76 [00:10<02:29,  2.11s/it][A
Training:   8%|▊         | 6/76 [00:10<01:44,  1.49s/it][A
Training:   9%|▉         | 7/76 [00:11<01:15,  1.09s/it][A
Training:  11%|█         | 8/76 [00:11<00:54,  1.25it/s][A
Training:  12%|█▏        | 9/76 [00:15<02:07,  1.90s/it][A
Training:  14%|█▍        | 11/76 [00:15<01:07,  1.04s/it][A
Training:  17%|█▋        | 13/76 [00:20<01:40,  1.60s/it][A
Training:  20%|█▉        | 15/76 [00:20<01:03,  1.04s/it][A
Training:  21%|██        | 16/76 [00:20<00:51,  1.17it/s][A
Training:  22%|██▏       | 17/76 [00:25<01:38,  1.67s/it][A
Training:  24%|██▎       | 18/76 [00:25<01:14,  1.29s/it][A
Training:  26%|██▋       | 20/76 [00:25<00:44,  1.25it/s][A
Training:  28%|██▊       | 21/76 [00:29<

Epoch: 79/88 - Loss: 2.2106 - Accuracy: 0.9689



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:04<00:44,  4.92s/it][A
 20%|██        | 2/10 [00:05<00:17,  2.13s/it][A
 40%|████      | 4/10 [00:05<00:05,  1.20it/s][A
 50%|█████     | 5/10 [00:09<00:08,  1.77s/it][A
 60%|██████    | 6/10 [00:09<00:05,  1.27s/it][A
 70%|███████   | 7/10 [00:09<00:02,  1.05it/s][A
 80%|████████  | 8/10 [00:09<00:01,  1.44it/s][A
100%|██████████| 10/10 [00:13<00:00,  1.30s/it][A
Epochs:  90%|████████▉ | 79/88 [2:17:56<15:34, 103.80s/it]

Val Loss: 2.8601 - Val Accuracy: 0.9624



Training:   0%|          | 0/76 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/76 [00:05<06:49,  5.46s/it][A
Training:   3%|▎         | 2/76 [00:05<03:01,  2.45s/it][A
Training:   4%|▍         | 3/76 [00:05<01:43,  1.41s/it][A
Training:   5%|▌         | 4/76 [00:06<01:05,  1.10it/s][A
Training:   7%|▋         | 5/76 [00:10<02:32,  2.14s/it][A
Training:   8%|▊         | 6/76 [00:10<01:46,  1.52s/it][A
Training:   9%|▉         | 7/76 [00:10<01:13,  1.06s/it][A
Training:  11%|█         | 8/76 [00:11<00:53,  1.27it/s][A
Training:  12%|█▏        | 9/76 [00:15<02:05,  1.87s/it][A
Training:  14%|█▍        | 11/76 [00:15<01:06,  1.02s/it][A
Training:  17%|█▋        | 13/76 [00:20<01:37,  1.55s/it][A
Training:  18%|█▊        | 14/76 [00:20<01:17,  1.25s/it][A
Training:  20%|█▉        | 15/76 [00:20<00:59,  1.02it/s][A
Training:  22%|██▏       | 17/76 [00:24<01:28,  1.50s/it][A
Training:  24%|██▎       | 18/76 [00:25<01:08,  1.18s/it][A
Training:  25%|██▌       | 19/76 [00:25<0

Epoch: 80/88 - Loss: 2.1618 - Accuracy: 0.9698



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:05<00:45,  5.05s/it][A
 30%|███       | 3/10 [00:05<00:09,  1.35s/it][A
 50%|█████     | 5/10 [00:09<00:09,  1.83s/it][A
 70%|███████   | 7/10 [00:09<00:03,  1.08s/it][A
100%|██████████| 10/10 [00:13<00:00,  1.38s/it][A
Epochs:  91%|█████████ | 80/88 [2:19:40<13:50, 103.77s/it]

Val Loss: 2.5944 - Val Accuracy: 0.9630



Training:   0%|          | 0/76 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/76 [00:05<07:04,  5.66s/it][A
Training:   3%|▎         | 2/76 [00:05<03:02,  2.46s/it][A
Training:   5%|▌         | 4/76 [00:06<01:09,  1.04it/s][A
Training:   7%|▋         | 5/76 [00:10<02:29,  2.10s/it][A
Training:   8%|▊         | 6/76 [00:11<01:52,  1.60s/it][A
Training:   9%|▉         | 7/76 [00:11<01:20,  1.16s/it][A
Training:  11%|█         | 8/76 [00:11<00:57,  1.18it/s][A
Training:  12%|█▏        | 9/76 [00:15<02:00,  1.80s/it][A
Training:  13%|█▎        | 10/76 [00:15<01:30,  1.37s/it][A
Training:  16%|█▌        | 12/76 [00:15<00:48,  1.31it/s][A
Training:  17%|█▋        | 13/76 [00:20<01:41,  1.61s/it][A
Training:  18%|█▊        | 14/76 [00:20<01:24,  1.36s/it][A
Training:  21%|██        | 16/76 [00:20<00:48,  1.23it/s][A
Training:  22%|██▏       | 17/76 [00:24<01:31,  1.55s/it][A
Training:  24%|██▎       | 18/76 [00:25<01:14,  1.29s/it][A
Training:  26%|██▋       | 20/76 [00:25<

Epoch: 81/88 - Loss: 2.1340 - Accuracy: 0.9701



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:05<00:46,  5.15s/it][A
 20%|██        | 2/10 [00:05<00:17,  2.19s/it][A
 30%|███       | 3/10 [00:05<00:08,  1.25s/it][A
 50%|█████     | 5/10 [00:09<00:08,  1.79s/it][A
 70%|███████   | 7/10 [00:09<00:03,  1.02s/it][A
100%|██████████| 10/10 [00:13<00:00,  1.38s/it][A
Epochs:  92%|█████████▏| 81/88 [2:21:23<12:05, 103.66s/it]

Val Loss: 2.5460 - Val Accuracy: 0.9624



Training:   0%|          | 0/76 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/76 [00:05<07:07,  5.70s/it][A
Training:   3%|▎         | 2/76 [00:05<03:05,  2.51s/it][A
Training:   5%|▌         | 4/76 [00:06<01:09,  1.03it/s][A
Training:   7%|▋         | 5/76 [00:10<02:32,  2.15s/it][A
Training:   8%|▊         | 6/76 [00:11<01:47,  1.53s/it][A
Training:   9%|▉         | 7/76 [00:11<01:15,  1.10s/it][A
Training:  12%|█▏        | 9/76 [00:15<01:53,  1.69s/it][A
Training:  14%|█▍        | 11/76 [00:15<01:07,  1.04s/it][A
Training:  17%|█▋        | 13/76 [00:20<01:35,  1.51s/it][A
Training:  18%|█▊        | 14/76 [00:20<01:15,  1.22s/it][A
Training:  20%|█▉        | 15/76 [00:20<00:59,  1.03it/s][A
Training:  21%|██        | 16/76 [00:21<00:46,  1.28it/s][A
Training:  22%|██▏       | 17/76 [00:25<01:39,  1.69s/it][A
Training:  24%|██▎       | 18/76 [00:25<01:14,  1.28s/it][A
Training:  25%|██▌       | 19/76 [00:25<00:54,  1.05it/s][A
Training:  26%|██▋       | 20/76 [00:25

Epoch: 82/88 - Loss: 2.1511 - Accuracy: 0.9705



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:04<00:44,  4.94s/it][A
 20%|██        | 2/10 [00:05<00:17,  2.24s/it][A
 30%|███       | 3/10 [00:05<00:08,  1.27s/it][A
 50%|█████     | 5/10 [00:09<00:08,  1.69s/it][A
 60%|██████    | 6/10 [00:09<00:05,  1.28s/it][A
 70%|███████   | 7/10 [00:09<00:02,  1.06it/s][A
 90%|█████████ | 9/10 [00:13<00:01,  1.29s/it][A
100%|██████████| 10/10 [00:13<00:00,  1.36s/it][A
Epochs:  93%|█████████▎| 82/88 [2:23:07<10:21, 103.62s/it]

Val Loss: 2.6195 - Val Accuracy: 0.9624



Training:   0%|          | 0/76 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/76 [00:05<07:00,  5.60s/it][A
Training:   3%|▎         | 2/76 [00:05<02:56,  2.39s/it][A
Training:   4%|▍         | 3/76 [00:05<01:38,  1.35s/it][A
Training:   7%|▋         | 5/76 [00:10<02:14,  1.89s/it][A
Training:   8%|▊         | 6/76 [00:10<01:38,  1.41s/it][A
Training:  11%|█         | 8/76 [00:10<00:56,  1.21it/s][A
Training:  12%|█▏        | 9/76 [00:15<01:55,  1.72s/it][A
Training:  13%|█▎        | 10/76 [00:15<01:28,  1.34s/it][A
Training:  14%|█▍        | 11/76 [00:15<01:06,  1.03s/it][A
Training:  17%|█▋        | 13/76 [00:20<01:37,  1.55s/it][A
Training:  18%|█▊        | 14/76 [00:20<01:15,  1.21s/it][A
Training:  21%|██        | 16/76 [00:20<00:47,  1.26it/s][A
Training:  22%|██▏       | 17/76 [00:25<01:35,  1.62s/it][A
Training:  24%|██▎       | 18/76 [00:25<01:14,  1.28s/it][A
Training:  26%|██▋       | 20/76 [00:25<00:45,  1.23it/s][A
Training:  28%|██▊       | 21/76 [00:30

Epoch: 83/88 - Loss: 2.1193 - Accuracy: 0.9705



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:05<00:45,  5.03s/it][A
 20%|██        | 2/10 [00:05<00:17,  2.16s/it][A
 40%|████      | 4/10 [00:05<00:05,  1.19it/s][A
 60%|██████    | 6/10 [00:09<00:06,  1.52s/it][A
 80%|████████  | 8/10 [00:09<00:01,  1.07it/s][A
100%|██████████| 10/10 [00:13<00:00,  1.36s/it][A
Epochs:  94%|█████████▍| 83/88 [2:24:52<08:39, 103.90s/it]

Val Loss: 2.6120 - Val Accuracy: 0.9624



Training:   0%|          | 0/76 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/76 [00:05<06:46,  5.43s/it][A
Training:   3%|▎         | 2/76 [00:05<02:55,  2.38s/it][A
Training:   4%|▍         | 3/76 [00:05<01:38,  1.35s/it][A
Training:   5%|▌         | 4/76 [00:05<01:03,  1.13it/s][A
Training:   7%|▋         | 5/76 [00:10<02:31,  2.14s/it][A
Training:   8%|▊         | 6/76 [00:10<01:49,  1.56s/it][A
Training:  11%|█         | 8/76 [00:10<00:55,  1.22it/s][A
Training:  12%|█▏        | 9/76 [00:15<01:54,  1.71s/it][A
Training:  13%|█▎        | 10/76 [00:15<01:31,  1.38s/it][A
Training:  14%|█▍        | 11/76 [00:15<01:07,  1.04s/it][A
Training:  16%|█▌        | 12/76 [00:15<00:51,  1.25it/s][A
Training:  17%|█▋        | 13/76 [00:19<01:44,  1.66s/it][A
Training:  18%|█▊        | 14/76 [00:20<01:25,  1.37s/it][A
Training:  20%|█▉        | 15/76 [00:20<01:01,  1.00s/it][A
Training:  21%|██        | 16/76 [00:20<00:44,  1.35it/s][A
Training:  22%|██▏       | 17/76 [00:24<

Epoch: 84/88 - Loss: 2.1280 - Accuracy: 0.9703



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:05<00:45,  5.04s/it][A
 20%|██        | 2/10 [00:05<00:17,  2.23s/it][A
 30%|███       | 3/10 [00:05<00:09,  1.32s/it][A
 40%|████      | 4/10 [00:05<00:05,  1.15it/s][A
 50%|█████     | 5/10 [00:09<00:09,  1.92s/it][A
 60%|██████    | 6/10 [00:10<00:05,  1.44s/it][A
 80%|████████  | 8/10 [00:10<00:01,  1.32it/s][A
100%|██████████| 10/10 [00:13<00:00,  1.35s/it][A
Epochs:  95%|█████████▌| 84/88 [2:26:35<06:54, 103.67s/it]

Val Loss: 2.6426 - Val Accuracy: 0.9621



Training:   0%|          | 0/76 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/76 [00:05<06:55,  5.54s/it][A
Training:   3%|▎         | 2/76 [00:05<02:58,  2.41s/it][A
Training:   4%|▍         | 3/76 [00:06<01:44,  1.43s/it][A
Training:   5%|▌         | 4/76 [00:06<01:07,  1.07it/s][A
Training:   7%|▋         | 5/76 [00:10<02:36,  2.21s/it][A
Training:   8%|▊         | 6/76 [00:10<01:45,  1.51s/it][A
Training:   9%|▉         | 7/76 [00:11<01:14,  1.08s/it][A
Training:  11%|█         | 8/76 [00:11<00:52,  1.29it/s][A
Training:  12%|█▏        | 9/76 [00:15<02:17,  2.05s/it][A
Training:  14%|█▍        | 11/76 [00:16<01:11,  1.11s/it][A
Training:  16%|█▌        | 12/76 [00:16<00:55,  1.16it/s][A
Training:  17%|█▋        | 13/76 [00:20<01:54,  1.81s/it][A
Training:  18%|█▊        | 14/76 [00:20<01:25,  1.38s/it][A
Training:  20%|█▉        | 15/76 [00:21<01:03,  1.03s/it][A
Training:  21%|██        | 16/76 [00:21<00:48,  1.25it/s][A
Training:  22%|██▏       | 17/76 [00:25<0

Epoch: 85/88 - Loss: 2.1058 - Accuracy: 0.9707



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:04<00:44,  4.99s/it][A
 20%|██        | 2/10 [00:05<00:17,  2.16s/it][A
 30%|███       | 3/10 [00:05<00:08,  1.26s/it][A
 50%|█████     | 5/10 [00:09<00:08,  1.76s/it][A
 70%|███████   | 7/10 [00:09<00:02,  1.00it/s][A
100%|██████████| 10/10 [00:13<00:00,  1.37s/it][A
Epochs:  97%|█████████▋| 85/88 [2:28:19<05:11, 103.86s/it]

Val Loss: 2.6282 - Val Accuracy: 0.9630



Training:   0%|          | 0/76 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/76 [00:05<06:54,  5.53s/it][A
Training:   3%|▎         | 2/76 [00:05<02:57,  2.39s/it][A
Training:   5%|▌         | 4/76 [00:05<01:08,  1.06it/s][A
Training:   7%|▋         | 5/76 [00:10<02:32,  2.15s/it][A
Training:   8%|▊         | 6/76 [00:10<01:48,  1.55s/it][A
Training:   9%|▉         | 7/76 [00:11<01:17,  1.13s/it][A
Training:  12%|█▏        | 9/76 [00:15<01:49,  1.64s/it][A
Training:  13%|█▎        | 10/76 [00:15<01:23,  1.27s/it][A
Training:  16%|█▌        | 12/76 [00:15<00:49,  1.30it/s][A
Training:  17%|█▋        | 13/76 [00:20<01:46,  1.69s/it][A
Training:  18%|█▊        | 14/76 [00:20<01:21,  1.31s/it][A
Training:  21%|██        | 16/76 [00:20<00:48,  1.23it/s][A
Training:  22%|██▏       | 17/76 [00:25<01:40,  1.70s/it][A
Training:  24%|██▎       | 18/76 [00:25<01:16,  1.31s/it][A
Training:  25%|██▌       | 19/76 [00:25<00:57,  1.02s/it][A
Training:  28%|██▊       | 21/76 [00:30

Epoch: 86/88 - Loss: 2.0725 - Accuracy: 0.9707



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:05<00:48,  5.41s/it][A
 30%|███       | 3/10 [00:05<00:10,  1.52s/it][A
 40%|████      | 4/10 [00:05<00:06,  1.05s/it][A
 50%|█████     | 5/10 [00:10<00:11,  2.29s/it][A
 60%|██████    | 6/10 [00:10<00:06,  1.59s/it][A
 80%|████████  | 8/10 [00:11<00:01,  1.13it/s][A
100%|██████████| 10/10 [00:14<00:00,  1.49s/it][A
Epochs:  98%|█████████▊| 86/88 [2:30:11<03:32, 106.44s/it]

Val Loss: 2.4401 - Val Accuracy: 0.9626



Training:   0%|          | 0/76 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/76 [00:05<07:16,  5.82s/it][A
Training:   3%|▎         | 2/76 [00:05<03:03,  2.48s/it][A
Training:   4%|▍         | 3/76 [00:06<01:42,  1.41s/it][A
Training:   7%|▋         | 5/76 [00:11<02:26,  2.07s/it][A
Training:   8%|▊         | 6/76 [00:11<01:45,  1.51s/it][A
Training:  11%|█         | 8/76 [00:11<00:58,  1.15it/s][A
Training:  12%|█▏        | 9/76 [00:16<02:03,  1.84s/it][A
Training:  13%|█▎        | 10/76 [00:16<01:31,  1.39s/it][A
Training:  16%|█▌        | 12/76 [00:16<00:52,  1.21it/s][A
Training:  17%|█▋        | 13/76 [00:21<01:49,  1.74s/it][A
Training:  20%|█▉        | 15/76 [00:21<01:05,  1.07s/it][A
Training:  21%|██        | 16/76 [00:21<00:52,  1.15it/s][A
Training:  22%|██▏       | 17/76 [00:26<01:50,  1.87s/it][A
Training:  24%|██▎       | 18/76 [00:26<01:22,  1.43s/it][A
Training:  25%|██▌       | 19/76 [00:26<01:01,  1.07s/it][A
Training:  28%|██▊       | 21/76 [00:31

Epoch: 87/88 - Loss: 2.1108 - Accuracy: 0.9705



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:05<00:50,  5.56s/it][A
 20%|██        | 2/10 [00:05<00:18,  2.35s/it][A
 40%|████      | 4/10 [00:05<00:05,  1.09it/s][A
 60%|██████    | 6/10 [00:10<00:06,  1.57s/it][A
 70%|███████   | 7/10 [00:10<00:03,  1.21s/it][A
 80%|████████  | 8/10 [00:10<00:01,  1.08it/s][A
100%|██████████| 10/10 [00:14<00:00,  1.46s/it][A
Epochs:  99%|█████████▉| 87/88 [2:32:02<01:47, 107.55s/it]

Val Loss: 2.7225 - Val Accuracy: 0.9626



Training:   0%|          | 0/76 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/76 [00:05<07:22,  5.90s/it][A
Training:   3%|▎         | 2/76 [00:06<03:06,  2.52s/it][A
Training:   4%|▍         | 3/76 [00:06<01:45,  1.45s/it][A
Training:   5%|▌         | 4/76 [00:06<01:06,  1.09it/s][A
Training:   7%|▋         | 5/76 [00:11<02:47,  2.36s/it][A
Training:   8%|▊         | 6/76 [00:11<01:54,  1.63s/it][A
Training:   9%|▉         | 7/76 [00:11<01:20,  1.16s/it][A
Training:  11%|█         | 8/76 [00:11<00:58,  1.16it/s][A
Training:  12%|█▏        | 9/76 [00:16<02:08,  1.92s/it][A
Training:  14%|█▍        | 11/76 [00:16<01:10,  1.09s/it][A
Training:  16%|█▌        | 12/76 [00:16<00:53,  1.19it/s][A
Training:  17%|█▋        | 13/76 [00:21<02:01,  1.93s/it][A
Training:  20%|█▉        | 15/76 [00:21<01:08,  1.13s/it][A
Training:  21%|██        | 16/76 [00:21<00:53,  1.13it/s][A
Training:  22%|██▏       | 17/76 [00:26<01:51,  1.89s/it][A
Training:  24%|██▎       | 18/76 [00:26<0

Epoch: 88/88 - Loss: 2.0852 - Accuracy: 0.9717



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:06<01:01,  6.86s/it][A
 20%|██        | 2/10 [00:07<00:23,  2.94s/it][A
 30%|███       | 3/10 [00:07<00:11,  1.68s/it][A
 50%|█████     | 5/10 [00:12<00:10,  2.15s/it][A
 60%|██████    | 6/10 [00:12<00:06,  1.57s/it][A
100%|██████████| 10/10 [00:16<00:00,  1.69s/it][A
Epochs: 100%|██████████| 88/88 [2:33:58<00:00, 104.99s/it]


Val Loss: 2.4291 - Val Accuracy: 0.9626


[32m[I 2023-12-08 14:23:44,381][0m Trial 2 finished with value: 0.9626457095146179 and parameters: {'loss_learning_rate': 0.0008958261761009699, 'learning_rate': 1.5218716314145224e-05, 'weight_decay': 0.0049081536466633905, 'epsilon': 1.7968823637993475e-08, 'beta': 0.4, 'gamma': 0.5, 'batch_size': 186, 'epochs': 88}. Best is trial 0 with value: 0.9648317694664001.[0m


Learning rate for Loss: 0.0007864547818893396
Learning rate: 0.026672551860448212
Weight decay: 0.0004995203487508594
Epsilon: 2.215641865314564e-08
Beta: 0.4
Gamma: 0.8
Batch size: 193
Number of epochs: 35


Epochs:   0%|          | 0/35 [00:00<?, ?it/s]
Training:   0%|          | 0/73 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/73 [00:06<07:42,  6.42s/it][A
Training:   3%|▎         | 2/73 [00:06<03:24,  2.88s/it][A
Training:   5%|▌         | 4/73 [00:06<01:16,  1.12s/it][A
Training:   7%|▋         | 5/73 [00:12<02:53,  2.56s/it][A
Training:   8%|▊         | 6/73 [00:12<02:03,  1.85s/it][A
Training:  11%|█         | 8/73 [00:13<01:05,  1.02s/it][A
Training:  12%|█▏        | 9/73 [00:18<02:08,  2.00s/it][A
Training:  14%|█▎        | 10/73 [00:18<01:38,  1.57s/it][A
Training:  16%|█▋        | 12/73 [00:18<00:56,  1.09it/s][A
Training:  18%|█▊        | 13/73 [00:23<01:54,  1.91s/it][A
Training:  19%|█▉        | 14/73 [00:24<01:35,  1.61s/it][A
Training:  22%|██▏       | 16/73 [00:24<00:54,  1.04it/s][A
Training:  23%|██▎       | 17/73 [00:30<01:56,  2.08s/it][A
Training:  25%|██▍       | 18/73 [00:31<01:35,  1.73s/it][A
Training:  26%|██▌       | 19/73 [00:31<01:11,  1.32s/

Epoch: 1/35 - Loss: 654.3174 - Accuracy: 0.8801



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:05<00:50,  5.64s/it][A
 20%|██        | 2/10 [00:05<00:20,  2.51s/it][A
 30%|███       | 3/10 [00:06<00:10,  1.45s/it][A
 40%|████      | 4/10 [00:06<00:05,  1.05it/s][A
 50%|█████     | 5/10 [00:11<00:11,  2.35s/it][A
 70%|███████   | 7/10 [00:11<00:03,  1.23s/it][A
 80%|████████  | 8/10 [00:11<00:01,  1.07it/s][A
100%|██████████| 10/10 [00:15<00:00,  1.57s/it][A
Epochs:   3%|▎         | 1/35 [01:58<1:07:02, 118.32s/it]

Val Loss: 903.7855 - Val Accuracy: 0.9523



Training:   0%|          | 0/73 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/73 [00:06<07:57,  6.63s/it][A
Training:   3%|▎         | 2/73 [00:06<03:18,  2.80s/it][A
Training:   4%|▍         | 3/73 [00:06<01:49,  1.57s/it][A
Training:   5%|▌         | 4/73 [00:07<01:10,  1.02s/it][A
Training:   7%|▋         | 5/73 [00:12<03:01,  2.67s/it][A
Training:   8%|▊         | 6/73 [00:12<02:00,  1.80s/it][A
Training:  11%|█         | 8/73 [00:12<01:01,  1.06it/s][A
Training:  12%|█▏        | 9/73 [00:18<02:17,  2.16s/it][A
Training:  14%|█▎        | 10/73 [00:18<01:41,  1.61s/it][A
Training:  15%|█▌        | 11/73 [00:18<01:13,  1.19s/it][A
Training:  16%|█▋        | 12/73 [00:18<00:54,  1.12it/s][A
Training:  18%|█▊        | 13/73 [00:24<02:11,  2.18s/it][A
Training:  21%|██        | 15/73 [00:24<01:10,  1.22s/it][A
Training:  22%|██▏       | 16/73 [00:24<00:54,  1.06it/s][A
Training:  23%|██▎       | 17/73 [00:29<01:58,  2.12s/it][A
Training:  25%|██▍       | 18/73 [00:30<

Epoch: 2/35 - Loss: 1131.4542 - Accuracy: 0.9306



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:05<00:50,  5.64s/it][A
 20%|██        | 2/10 [00:05<00:19,  2.40s/it][A
 30%|███       | 3/10 [00:06<00:10,  1.53s/it][A
 40%|████      | 4/10 [00:06<00:05,  1.02it/s][A
 50%|█████     | 5/10 [00:11<00:11,  2.30s/it][A
 60%|██████    | 6/10 [00:11<00:06,  1.59s/it][A
 70%|███████   | 7/10 [00:11<00:03,  1.27s/it][A
100%|██████████| 10/10 [00:15<00:00,  1.59s/it][A
Epochs:   6%|▌         | 2/35 [03:55<1:04:44, 117.70s/it]

Val Loss: 1215.4076 - Val Accuracy: 0.9420



Training:   0%|          | 0/73 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/73 [00:06<07:52,  6.56s/it][A
Training:   3%|▎         | 2/73 [00:07<03:32,  2.99s/it][A
Training:   4%|▍         | 3/73 [00:07<01:59,  1.71s/it][A
Training:   5%|▌         | 4/73 [00:07<01:15,  1.10s/it][A
Training:   7%|▋         | 5/73 [00:12<02:52,  2.53s/it][A
Training:   8%|▊         | 6/73 [00:12<02:00,  1.80s/it][A
Training:  10%|▉         | 7/73 [00:12<01:22,  1.25s/it][A
Training:  12%|█▏        | 9/73 [00:18<02:02,  1.91s/it][A
Training:  14%|█▎        | 10/73 [00:18<01:35,  1.51s/it][A
Training:  15%|█▌        | 11/73 [00:18<01:10,  1.14s/it][A
Training:  18%|█▊        | 13/73 [00:23<01:46,  1.77s/it][A
Training:  19%|█▉        | 14/73 [00:24<01:23,  1.42s/it][A
Training:  21%|██        | 15/73 [00:24<01:03,  1.10s/it][A
Training:  23%|██▎       | 17/73 [00:29<01:34,  1.69s/it][A
Training:  25%|██▍       | 18/73 [00:29<01:14,  1.35s/it][A
Training:  27%|██▋       | 20/73 [00:29<

Epoch: 3/35 - Loss: 1488.2982 - Accuracy: 0.9396



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:06<00:55,  6.11s/it][A
 20%|██        | 2/10 [00:06<00:20,  2.62s/it][A
 30%|███       | 3/10 [00:06<00:10,  1.47s/it][A
 50%|█████     | 5/10 [00:11<00:10,  2.09s/it][A
 60%|██████    | 6/10 [00:11<00:06,  1.52s/it][A
 80%|████████  | 8/10 [00:11<00:01,  1.16it/s][A
100%|██████████| 10/10 [00:16<00:00,  1.63s/it][A
Epochs:   9%|▊         | 3/35 [05:54<1:02:59, 118.10s/it]

Val Loss: 1406.6609 - Val Accuracy: 0.9544



Training:   0%|          | 0/73 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/73 [00:06<07:57,  6.64s/it][A
Training:   3%|▎         | 2/73 [00:06<03:18,  2.79s/it][A
Training:   4%|▍         | 3/73 [00:06<01:51,  1.59s/it][A
Training:   5%|▌         | 4/73 [00:07<01:09,  1.01s/it][A
Training:   7%|▋         | 5/73 [00:12<03:08,  2.77s/it][A
Training:  10%|▉         | 7/73 [00:13<01:32,  1.40s/it][A
Training:  12%|█▏        | 9/73 [00:19<02:19,  2.18s/it][A
Training:  15%|█▌        | 11/73 [00:19<01:26,  1.39s/it][A
Training:  18%|█▊        | 13/73 [00:26<02:04,  2.08s/it][A
Training:  21%|██        | 15/73 [00:26<01:22,  1.42s/it][A
Training:  23%|██▎       | 17/73 [00:32<01:49,  1.96s/it][A
Training:  25%|██▍       | 18/73 [00:32<01:28,  1.61s/it][A
Training:  26%|██▌       | 19/73 [00:33<01:10,  1.30s/it][A
Training:  29%|██▉       | 21/73 [00:38<01:36,  1.86s/it][A
Training:  32%|███▏      | 23/73 [00:38<01:02,  1.26s/it][A
Training:  34%|███▍      | 25/73 [00:44

Epoch: 4/35 - Loss: 1495.4575 - Accuracy: 0.9379



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:05<00:51,  5.72s/it][A
 30%|███       | 3/10 [00:05<00:10,  1.54s/it][A
 40%|████      | 4/10 [00:06<00:06,  1.05s/it][A
 50%|█████     | 5/10 [00:10<00:11,  2.21s/it][A
 60%|██████    | 6/10 [00:10<00:06,  1.54s/it][A
 70%|███████   | 7/10 [00:10<00:03,  1.10s/it][A
 80%|████████  | 8/10 [00:10<00:01,  1.25it/s][A
100%|██████████| 10/10 [00:14<00:00,  1.49s/it][A
Epochs:  11%|█▏        | 4/35 [07:57<1:02:02, 120.08s/it]

Val Loss: 1631.3365 - Val Accuracy: 0.9513



Training:   0%|          | 0/73 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/73 [00:06<07:30,  6.26s/it][A
Training:   4%|▍         | 3/73 [00:06<01:56,  1.67s/it][A
Training:   5%|▌         | 4/73 [00:06<01:19,  1.15s/it][A
Training:   7%|▋         | 5/73 [00:11<02:53,  2.56s/it][A
Training:   8%|▊         | 6/73 [00:12<01:58,  1.77s/it][A
Training:  11%|█         | 8/73 [00:12<01:02,  1.05it/s][A
Training:  12%|█▏        | 9/73 [00:17<02:10,  2.05s/it][A
Training:  14%|█▎        | 10/73 [00:17<01:36,  1.53s/it][A
Training:  15%|█▌        | 11/73 [00:17<01:10,  1.14s/it][A
Training:  16%|█▋        | 12/73 [00:17<00:52,  1.17it/s][A
Training:  18%|█▊        | 13/73 [00:22<02:06,  2.10s/it][A
Training:  19%|█▉        | 14/73 [00:23<01:32,  1.56s/it][A
Training:  21%|██        | 15/73 [00:23<01:06,  1.15s/it][A
Training:  23%|██▎       | 17/73 [00:28<01:38,  1.76s/it][A
Training:  26%|██▌       | 19/73 [00:28<00:59,  1.09s/it][A
Training:  29%|██▉       | 21/73 [00:32

Epoch: 5/35 - Loss: 1513.8732 - Accuracy: 0.9459



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:06<00:56,  6.29s/it][A
 20%|██        | 2/10 [00:06<00:22,  2.78s/it][A
 40%|████      | 4/10 [00:06<00:06,  1.07s/it][A
 50%|█████     | 5/10 [00:11<00:11,  2.35s/it][A
 60%|██████    | 6/10 [00:12<00:06,  1.68s/it][A
 80%|████████  | 8/10 [00:12<00:01,  1.09it/s][A
100%|██████████| 10/10 [00:16<00:00,  1.69s/it][A
Epochs:  14%|█▍        | 5/35 [09:59<1:00:29, 121.00s/it]

Val Loss: 1740.9301 - Val Accuracy: 0.9549



Training:   0%|          | 0/73 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/73 [00:06<08:00,  6.67s/it][A
Training:   3%|▎         | 2/73 [00:07<03:44,  3.16s/it][A
Training:   5%|▌         | 4/73 [00:07<01:24,  1.22s/it][A
Training:   7%|▋         | 5/73 [00:13<02:57,  2.61s/it][A
Training:   8%|▊         | 6/73 [00:13<02:14,  2.01s/it][A
Training:  10%|▉         | 7/73 [00:14<01:36,  1.46s/it][A
Training:  11%|█         | 8/73 [00:14<01:08,  1.06s/it][A
Training:  12%|█▏        | 9/73 [00:19<02:37,  2.45s/it][A
Training:  14%|█▎        | 10/73 [00:20<01:55,  1.83s/it][A
Training:  15%|█▌        | 11/73 [00:20<01:25,  1.38s/it][A
Training:  16%|█▋        | 12/73 [00:20<01:02,  1.02s/it][A
Training:  18%|█▊        | 13/73 [00:26<02:18,  2.30s/it][A
Training:  21%|██        | 15/73 [00:26<01:14,  1.28s/it][A
Training:  22%|██▏       | 16/73 [00:26<01:00,  1.06s/it][A
Training:  23%|██▎       | 17/73 [00:31<01:57,  2.10s/it][A
Training:  25%|██▍       | 18/73 [00:31<

Epoch: 6/35 - Loss: 1856.3551 - Accuracy: 0.9447



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:05<00:50,  5.56s/it][A
 20%|██        | 2/10 [00:05<00:19,  2.43s/it][A
 30%|███       | 3/10 [00:06<00:10,  1.46s/it][A
 40%|████      | 4/10 [00:06<00:05,  1.06it/s][A
 50%|█████     | 5/10 [00:11<00:11,  2.31s/it][A
 70%|███████   | 7/10 [00:11<00:03,  1.17s/it][A
 80%|████████  | 8/10 [00:11<00:01,  1.11it/s][A
100%|██████████| 10/10 [00:15<00:00,  1.55s/it][A
Epochs:  17%|█▋        | 6/35 [12:04<59:07, 122.32s/it]  

Val Loss: 1750.0276 - Val Accuracy: 0.9409



Training:   0%|          | 0/73 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/73 [00:06<07:53,  6.58s/it][A
Training:   3%|▎         | 2/73 [00:06<03:18,  2.79s/it][A
Training:   4%|▍         | 3/73 [00:06<01:51,  1.59s/it][A
Training:   5%|▌         | 4/73 [00:07<01:10,  1.02s/it][A
Training:   7%|▋         | 5/73 [00:12<02:57,  2.61s/it][A
Training:   8%|▊         | 6/73 [00:12<01:59,  1.78s/it][A
Training:  11%|█         | 8/73 [00:12<01:02,  1.05it/s][A
Training:  12%|█▏        | 9/73 [00:17<02:07,  1.99s/it][A
Training:  14%|█▎        | 10/73 [00:17<01:33,  1.49s/it][A
Training:  15%|█▌        | 11/73 [00:18<01:08,  1.11s/it][A
Training:  16%|█▋        | 12/73 [00:18<00:50,  1.21it/s][A
Training:  18%|█▊        | 13/73 [00:22<01:59,  1.99s/it][A
Training:  19%|█▉        | 14/73 [00:23<01:25,  1.44s/it][A
Training:  22%|██▏       | 16/73 [00:23<00:46,  1.22it/s][A
Training:  23%|██▎       | 17/73 [00:27<01:36,  1.73s/it][A
Training:  25%|██▍       | 18/73 [00:27<

Epoch: 7/35 - Loss: 1831.4548 - Accuracy: 0.9462



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:05<00:47,  5.30s/it][A
 30%|███       | 3/10 [00:05<00:10,  1.45s/it][A
 40%|████      | 4/10 [00:05<00:06,  1.01s/it][A
 50%|█████     | 5/10 [00:10<00:10,  2.13s/it][A
 80%|████████  | 8/10 [00:10<00:01,  1.10it/s][A
100%|██████████| 10/10 [00:14<00:00,  1.43s/it][A
Epochs:  20%|██        | 7/35 [13:56<55:26, 118.80s/it]

Val Loss: 1476.1300 - Val Accuracy: 0.9461



Training:   0%|          | 0/73 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/73 [00:06<07:23,  6.16s/it][A
Training:   3%|▎         | 2/73 [00:06<03:06,  2.62s/it][A
Training:   4%|▍         | 3/73 [00:06<01:46,  1.53s/it][A
Training:   7%|▋         | 5/73 [00:12<02:30,  2.21s/it][A
Training:   8%|▊         | 6/73 [00:12<01:57,  1.75s/it][A
Training:  10%|▉         | 7/73 [00:12<01:24,  1.28s/it][A
Training:  12%|█▏        | 9/73 [00:17<01:51,  1.74s/it][A
Training:  14%|█▎        | 10/73 [00:18<01:34,  1.50s/it][A
Training:  16%|█▋        | 12/73 [00:18<00:55,  1.10it/s][A
Training:  18%|█▊        | 13/73 [00:21<01:31,  1.53s/it][A
Training:  19%|█▉        | 14/73 [00:22<01:18,  1.33s/it][A
Training:  21%|██        | 15/73 [00:22<00:58,  1.01s/it][A
Training:  23%|██▎       | 17/73 [00:26<01:20,  1.44s/it][A
Training:  25%|██▍       | 18/73 [00:27<01:11,  1.29s/it][A
Training:  26%|██▌       | 19/73 [00:27<00:54,  1.00s/it][A
Training:  27%|██▋       | 20/73 [00:27

Epoch: 8/35 - Loss: 1921.2600 - Accuracy: 0.9482



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:05<00:47,  5.25s/it][A
 20%|██        | 2/10 [00:05<00:17,  2.25s/it][A
 30%|███       | 3/10 [00:05<00:09,  1.33s/it][A
 50%|█████     | 5/10 [00:10<00:09,  1.84s/it][A
 70%|███████   | 7/10 [00:10<00:03,  1.06s/it][A
100%|██████████| 10/10 [00:14<00:00,  1.42s/it][A
Epochs:  23%|██▎       | 8/35 [15:48<52:34, 116.84s/it]

Val Loss: 2052.9810 - Val Accuracy: 0.9560



Training:   0%|          | 0/73 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/73 [00:05<07:06,  5.92s/it][A
Training:   3%|▎         | 2/73 [00:06<03:01,  2.55s/it][A
Training:   4%|▍         | 3/73 [00:06<01:41,  1.45s/it][A
Training:   5%|▌         | 4/73 [00:06<01:03,  1.09it/s][A
Training:   7%|▋         | 5/73 [00:11<02:47,  2.47s/it][A
Training:   8%|▊         | 6/73 [00:11<01:51,  1.67s/it][A
Training:  10%|▉         | 7/73 [00:11<01:17,  1.17s/it][A
Training:  11%|█         | 8/73 [00:11<00:54,  1.20it/s][A
Training:  12%|█▏        | 9/73 [00:17<02:19,  2.18s/it][A
Training:  15%|█▌        | 11/73 [00:17<01:13,  1.19s/it][A
Training:  18%|█▊        | 13/73 [00:22<01:42,  1.72s/it][A
Training:  19%|█▉        | 14/73 [00:22<01:19,  1.36s/it][A
Training:  21%|██        | 15/73 [00:22<01:01,  1.06s/it][A
Training:  22%|██▏       | 16/73 [00:22<00:47,  1.19it/s][A
Training:  23%|██▎       | 17/73 [00:28<01:56,  2.08s/it][A
Training:  26%|██▌       | 19/73 [00:28<0

Epoch: 9/35 - Loss: 1969.9285 - Accuracy: 0.9478



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:05<00:48,  5.43s/it][A
 20%|██        | 2/10 [00:05<00:18,  2.30s/it][A
 40%|████      | 4/10 [00:05<00:05,  1.11it/s][A
 60%|██████    | 6/10 [00:10<00:06,  1.51s/it][A
 70%|███████   | 7/10 [00:10<00:03,  1.16s/it][A
100%|██████████| 10/10 [00:14<00:00,  1.43s/it][A
Epochs:  26%|██▌       | 9/35 [17:40<49:57, 115.29s/it]

Val Loss: 2093.5776 - Val Accuracy: 0.9466



Training:   0%|          | 0/73 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/73 [00:05<07:07,  5.93s/it][A
Training:   3%|▎         | 2/73 [00:06<03:02,  2.57s/it][A
Training:   4%|▍         | 3/73 [00:06<01:43,  1.47s/it][A
Training:   5%|▌         | 4/73 [00:06<01:05,  1.06it/s][A
Training:   7%|▋         | 5/73 [00:10<02:32,  2.24s/it][A
Training:  10%|▉         | 7/73 [00:11<01:15,  1.14s/it][A
Training:  11%|█         | 8/73 [00:11<01:02,  1.04it/s][A
Training:  12%|█▏        | 9/73 [00:15<01:59,  1.86s/it][A
Training:  14%|█▎        | 10/73 [00:16<01:27,  1.39s/it][A
Training:  16%|█▋        | 12/73 [00:16<00:49,  1.24it/s][A
Training:  18%|█▊        | 13/73 [00:20<01:41,  1.69s/it][A
Training:  21%|██        | 15/73 [00:21<01:02,  1.07s/it][A
Training:  23%|██▎       | 17/73 [00:25<01:24,  1.51s/it][A
Training:  26%|██▌       | 19/73 [00:25<00:56,  1.05s/it][A
Training:  29%|██▉       | 21/73 [00:30<01:16,  1.47s/it][A
Training:  30%|███       | 22/73 [00:30<

Epoch: 10/35 - Loss: 1993.3033 - Accuracy: 0.9497



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:05<00:47,  5.33s/it][A
 30%|███       | 3/10 [00:05<00:10,  1.44s/it][A
 50%|█████     | 5/10 [00:09<00:09,  1.82s/it][A
 60%|██████    | 6/10 [00:10<00:05,  1.39s/it][A
 80%|████████  | 8/10 [00:10<00:01,  1.24it/s][A
100%|██████████| 10/10 [00:13<00:00,  1.39s/it][A
Epochs:  29%|██▊       | 10/35 [19:28<47:00, 112.82s/it]

Val Loss: 1732.4000 - Val Accuracy: 0.9539



Training:   0%|          | 0/73 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/73 [00:06<07:11,  5.99s/it][A
Training:   3%|▎         | 2/73 [00:06<02:59,  2.53s/it][A
Training:   4%|▍         | 3/73 [00:06<01:39,  1.42s/it][A
Training:   7%|▋         | 5/73 [00:10<02:07,  1.87s/it][A
Training:   8%|▊         | 6/73 [00:10<01:32,  1.37s/it][A
Training:  11%|█         | 8/73 [00:10<00:50,  1.28it/s][A
Training:  12%|█▏        | 9/73 [00:15<01:48,  1.69s/it][A
Training:  14%|█▎        | 10/73 [00:15<01:24,  1.34s/it][A
Training:  16%|█▋        | 12/73 [00:15<00:48,  1.25it/s][A
Training:  18%|█▊        | 13/73 [00:20<01:41,  1.69s/it][A
Training:  21%|██        | 15/73 [00:20<01:00,  1.04s/it][A
Training:  22%|██▏       | 16/73 [00:20<00:48,  1.17it/s][A
Training:  23%|██▎       | 17/73 [00:25<01:36,  1.73s/it][A
Training:  25%|██▍       | 18/73 [00:25<01:14,  1.36s/it][A
Training:  26%|██▌       | 19/73 [00:25<00:55,  1.03s/it][A
Training:  27%|██▋       | 20/73 [00:25

Epoch: 11/35 - Loss: 1946.4628 - Accuracy: 0.9509



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:05<00:46,  5.20s/it][A
 20%|██        | 2/10 [00:05<00:17,  2.25s/it][A
 30%|███       | 3/10 [00:05<00:09,  1.35s/it][A
 50%|█████     | 5/10 [00:09<00:08,  1.77s/it][A
 70%|███████   | 7/10 [00:10<00:03,  1.11s/it][A
100%|██████████| 10/10 [00:14<00:00,  1.42s/it][A
Epochs:  31%|███▏      | 11/35 [21:18<44:52, 112.17s/it]

Val Loss: 1783.1477 - Val Accuracy: 0.9513



Training:   0%|          | 0/73 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/73 [00:05<06:50,  5.71s/it][A
Training:   3%|▎         | 2/73 [00:06<03:10,  2.68s/it][A
Training:   4%|▍         | 3/73 [00:06<01:45,  1.51s/it][A
Training:   7%|▋         | 5/73 [00:10<02:12,  1.95s/it][A
Training:   8%|▊         | 6/73 [00:11<01:43,  1.54s/it][A
Training:  10%|▉         | 7/73 [00:11<01:14,  1.13s/it][A
Training:  11%|█         | 8/73 [00:11<00:54,  1.20it/s][A
Training:  12%|█▏        | 9/73 [00:15<01:57,  1.84s/it][A
Training:  14%|█▎        | 10/73 [00:16<01:31,  1.45s/it][A
Training:  15%|█▌        | 11/73 [00:16<01:05,  1.06s/it][A
Training:  18%|█▊        | 13/73 [00:21<01:36,  1.60s/it][A
Training:  19%|█▉        | 14/73 [00:21<01:18,  1.32s/it][A
Training:  22%|██▏       | 16/73 [00:21<00:46,  1.24it/s][A
Training:  23%|██▎       | 17/73 [00:26<01:37,  1.74s/it][A
Training:  25%|██▍       | 18/73 [00:26<01:16,  1.39s/it][A
Training:  26%|██▌       | 19/73 [00:27<

Epoch: 12/35 - Loss: 2070.4487 - Accuracy: 0.9510



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:05<00:52,  5.81s/it][A
 20%|██        | 2/10 [00:05<00:19,  2.47s/it][A
 30%|███       | 3/10 [00:06<00:10,  1.43s/it][A
 40%|████      | 4/10 [00:06<00:05,  1.07it/s][A
 50%|█████     | 5/10 [00:10<00:11,  2.22s/it][A
 70%|███████   | 7/10 [00:10<00:03,  1.13s/it][A
100%|██████████| 10/10 [00:14<00:00,  1.46s/it][A
Epochs:  34%|███▍      | 12/35 [23:13<43:16, 112.90s/it]

Val Loss: 2329.8237 - Val Accuracy: 0.9388



Training:   0%|          | 0/73 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/73 [00:05<06:46,  5.64s/it][A
Training:   3%|▎         | 2/73 [00:05<02:50,  2.40s/it][A
Training:   4%|▍         | 3/73 [00:05<01:35,  1.36s/it][A
Training:   7%|▋         | 5/73 [00:10<02:15,  1.99s/it][A
Training:   8%|▊         | 6/73 [00:11<01:38,  1.47s/it][A
Training:  10%|▉         | 7/73 [00:11<01:11,  1.08s/it][A
Training:  11%|█         | 8/73 [00:11<00:52,  1.24it/s][A
Training:  12%|█▏        | 9/73 [00:16<02:20,  2.19s/it][A
Training:  15%|█▌        | 11/73 [00:17<01:16,  1.24s/it][A
Training:  18%|█▊        | 13/73 [00:22<01:46,  1.78s/it][A
Training:  19%|█▉        | 14/73 [00:22<01:28,  1.51s/it][A
Training:  21%|██        | 15/73 [00:22<01:08,  1.19s/it][A
Training:  22%|██▏       | 16/73 [00:23<00:53,  1.07it/s][A
Training:  23%|██▎       | 17/73 [00:27<01:43,  1.85s/it][A
Training:  25%|██▍       | 18/73 [00:28<01:24,  1.53s/it][A
Training:  26%|██▌       | 19/73 [00:28<

Epoch: 13/35 - Loss: 2056.9670 - Accuracy: 0.9488



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:05<00:50,  5.58s/it][A
 30%|███       | 3/10 [00:05<00:10,  1.49s/it][A
 50%|█████     | 5/10 [00:09<00:09,  1.81s/it][A
 60%|██████    | 6/10 [00:10<00:05,  1.36s/it][A
 80%|████████  | 8/10 [00:10<00:01,  1.25it/s][A
100%|██████████| 10/10 [00:13<00:00,  1.39s/it][A
Epochs:  37%|███▋      | 13/35 [25:03<41:04, 112.01s/it]

Val Loss: 2178.6826 - Val Accuracy: 0.9606



Training:   0%|          | 0/73 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/73 [00:05<06:59,  5.83s/it][A
Training:   3%|▎         | 2/73 [00:05<02:55,  2.47s/it][A
Training:   5%|▌         | 4/73 [00:06<01:07,  1.02it/s][A
Training:   7%|▋         | 5/73 [00:11<02:29,  2.19s/it][A
Training:   8%|▊         | 6/73 [00:11<01:45,  1.57s/it][A
Training:  10%|▉         | 7/73 [00:11<01:15,  1.14s/it][A
Training:  12%|█▏        | 9/73 [00:16<01:49,  1.70s/it][A
Training:  14%|█▎        | 10/73 [00:16<01:22,  1.31s/it][A
Training:  15%|█▌        | 11/73 [00:16<01:01,  1.00it/s][A
Training:  16%|█▋        | 12/73 [00:16<00:45,  1.33it/s][A
Training:  18%|█▊        | 13/73 [00:21<01:54,  1.90s/it][A
Training:  19%|█▉        | 14/73 [00:21<01:22,  1.40s/it][A
Training:  22%|██▏       | 16/73 [00:21<00:45,  1.24it/s][A
Training:  23%|██▎       | 17/73 [00:26<01:42,  1.82s/it][A
Training:  26%|██▌       | 19/73 [00:26<00:59,  1.10s/it][A
Training:  27%|██▋       | 20/73 [00:26

Epoch: 14/35 - Loss: 1982.6068 - Accuracy: 0.9550



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:05<00:46,  5.16s/it][A
 20%|██        | 2/10 [00:05<00:17,  2.20s/it][A
 40%|████      | 4/10 [00:05<00:05,  1.13it/s][A
 50%|█████     | 5/10 [00:10<00:10,  2.01s/it][A
 60%|██████    | 6/10 [00:10<00:05,  1.43s/it][A
 80%|████████  | 8/10 [00:10<00:01,  1.26it/s][A
100%|██████████| 10/10 [00:13<00:00,  1.38s/it][A
Epochs:  40%|████      | 14/35 [26:50<38:39, 110.47s/it]

Val Loss: 2089.4868 - Val Accuracy: 0.9575



Training:   0%|          | 0/73 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/73 [00:05<06:49,  5.69s/it][A
Training:   3%|▎         | 2/73 [00:05<02:54,  2.46s/it][A
Training:   4%|▍         | 3/73 [00:06<01:39,  1.42s/it][A
Training:   5%|▌         | 4/73 [00:06<01:02,  1.10it/s][A
Training:   7%|▋         | 5/73 [00:10<02:34,  2.27s/it][A
Training:   8%|▊         | 6/73 [00:11<01:43,  1.54s/it][A
Training:  10%|▉         | 7/73 [00:11<01:10,  1.07s/it][A
Training:  11%|█         | 8/73 [00:11<00:49,  1.31it/s][A
Training:  12%|█▏        | 9/73 [00:16<02:10,  2.04s/it][A
Training:  14%|█▎        | 10/73 [00:16<01:32,  1.47s/it][A
Training:  15%|█▌        | 11/73 [00:16<01:05,  1.06s/it][A
Training:  18%|█▊        | 13/73 [00:21<01:44,  1.75s/it][A
Training:  19%|█▉        | 14/73 [00:21<01:20,  1.37s/it][A
Training:  22%|██▏       | 16/73 [00:21<00:48,  1.18it/s][A
Training:  23%|██▎       | 17/73 [00:27<01:41,  1.82s/it][A
Training:  25%|██▍       | 18/73 [00:27<0

Epoch: 15/35 - Loss: 2081.5022 - Accuracy: 0.9537



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:06<00:54,  6.00s/it][A
 30%|███       | 3/10 [00:06<00:11,  1.60s/it][A
 50%|█████     | 5/10 [00:10<00:10,  2.03s/it][A
 70%|███████   | 7/10 [00:11<00:03,  1.22s/it][A
 80%|████████  | 8/10 [00:11<00:01,  1.03it/s][A
100%|██████████| 10/10 [00:15<00:00,  1.52s/it][A
Epochs:  43%|████▎     | 15/35 [28:43<37:05, 111.29s/it]

Val Loss: 2599.9111 - Val Accuracy: 0.9404



Training:   0%|          | 0/73 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/73 [00:06<07:19,  6.11s/it][A
Training:   3%|▎         | 2/73 [00:06<03:03,  2.59s/it][A
Training:   5%|▌         | 4/73 [00:06<01:10,  1.02s/it][A
Training:   7%|▋         | 5/73 [00:11<02:33,  2.26s/it][A
Training:   8%|▊         | 6/73 [00:11<01:47,  1.61s/it][A
Training:  10%|▉         | 7/73 [00:11<01:16,  1.15s/it][A
Training:  12%|█▏        | 9/73 [00:16<01:51,  1.74s/it][A
Training:  15%|█▌        | 11/73 [00:16<01:08,  1.10s/it][A
Training:  18%|█▊        | 13/73 [00:21<01:32,  1.55s/it][A
Training:  19%|█▉        | 14/73 [00:21<01:14,  1.26s/it][A
Training:  21%|██        | 15/73 [00:21<01:00,  1.05s/it][A
Training:  23%|██▎       | 17/73 [00:26<01:28,  1.57s/it][A
Training:  25%|██▍       | 18/73 [00:26<01:09,  1.26s/it][A
Training:  26%|██▌       | 19/73 [00:27<00:55,  1.03s/it][A
Training:  29%|██▉       | 21/73 [00:31<01:20,  1.55s/it][A
Training:  32%|███▏      | 23/73 [00:32

Epoch: 16/35 - Loss: 2165.3030 - Accuracy: 0.9514



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:05<00:45,  5.04s/it][A
 20%|██        | 2/10 [00:05<00:17,  2.13s/it][A
 30%|███       | 3/10 [00:05<00:08,  1.21s/it][A
 50%|█████     | 5/10 [00:09<00:07,  1.60s/it][A
 60%|██████    | 6/10 [00:09<00:04,  1.17s/it][A
 80%|████████  | 8/10 [00:09<00:01,  1.49it/s][A
100%|██████████| 10/10 [00:12<00:00,  1.29s/it][A
Epochs:  46%|████▌     | 16/35 [30:29<34:43, 109.64s/it]

Val Loss: 2411.9722 - Val Accuracy: 0.9596



Training:   0%|          | 0/73 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/73 [00:05<07:07,  5.94s/it][A
Training:   3%|▎         | 2/73 [00:06<03:04,  2.60s/it][A
Training:   5%|▌         | 4/73 [00:06<01:10,  1.02s/it][A
Training:   7%|▋         | 5/73 [00:11<02:32,  2.25s/it][A
Training:  10%|▉         | 7/73 [00:11<01:22,  1.25s/it][A
Training:  11%|█         | 8/73 [00:11<01:03,  1.02it/s][A
Training:  12%|█▏        | 9/73 [00:16<02:04,  1.95s/it][A
Training:  14%|█▎        | 10/73 [00:16<01:31,  1.45s/it][A
Training:  15%|█▌        | 11/73 [00:16<01:06,  1.07s/it][A
Training:  16%|█▋        | 12/73 [00:16<00:48,  1.26it/s][A
Training:  18%|█▊        | 13/73 [00:21<02:02,  2.04s/it][A
Training:  21%|██        | 15/73 [00:22<01:07,  1.16s/it][A
Training:  23%|██▎       | 17/73 [00:27<01:39,  1.77s/it][A
Training:  26%|██▌       | 19/73 [00:27<01:02,  1.16s/it][A
Training:  27%|██▋       | 20/73 [00:27<00:50,  1.05it/s][A
Training:  29%|██▉       | 21/73 [00:32

Epoch: 17/35 - Loss: 2089.7632 - Accuracy: 0.9528



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:04<00:44,  4.89s/it][A
 20%|██        | 2/10 [00:05<00:17,  2.22s/it][A
 30%|███       | 3/10 [00:05<00:08,  1.26s/it][A
 50%|█████     | 5/10 [00:09<00:08,  1.77s/it][A
 60%|██████    | 6/10 [00:09<00:05,  1.31s/it][A
 80%|████████  | 8/10 [00:09<00:01,  1.34it/s][A
100%|██████████| 10/10 [00:13<00:00,  1.35s/it][A
Epochs:  49%|████▊     | 17/35 [32:17<32:43, 109.11s/it]

Val Loss: 2007.6285 - Val Accuracy: 0.9642



Training:   0%|          | 0/73 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/73 [00:05<07:07,  5.94s/it][A
Training:   3%|▎         | 2/73 [00:06<03:05,  2.61s/it][A
Training:   4%|▍         | 3/73 [00:06<01:44,  1.49s/it][A
Training:   5%|▌         | 4/73 [00:06<01:05,  1.06it/s][A
Training:   7%|▋         | 5/73 [00:11<02:40,  2.36s/it][A
Training:   8%|▊         | 6/73 [00:11<01:47,  1.61s/it][A
Training:  10%|▉         | 7/73 [00:11<01:16,  1.16s/it][A
Training:  11%|█         | 8/73 [00:11<00:54,  1.19it/s][A
Training:  12%|█▏        | 9/73 [00:16<02:07,  1.99s/it][A
Training:  14%|█▎        | 10/73 [00:16<01:35,  1.52s/it][A
Training:  15%|█▌        | 11/73 [00:17<01:07,  1.10s/it][A
Training:  16%|█▋        | 12/73 [00:17<00:49,  1.23it/s][A
Training:  18%|█▊        | 13/73 [00:21<01:52,  1.88s/it][A
Training:  19%|█▉        | 14/73 [00:21<01:25,  1.45s/it][A
Training:  21%|██        | 15/73 [00:22<01:00,  1.05s/it][A
Training:  23%|██▎       | 17/73 [00:26<0

Epoch: 18/35 - Loss: 2137.1013 - Accuracy: 0.9541



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:05<00:50,  5.57s/it][A
 20%|██        | 2/10 [00:05<00:19,  2.44s/it][A
 40%|████      | 4/10 [00:05<00:05,  1.04it/s][A
 50%|█████     | 5/10 [00:10<00:09,  1.92s/it][A
 60%|██████    | 6/10 [00:10<00:05,  1.40s/it][A
 80%|████████  | 8/10 [00:10<00:01,  1.29it/s][A
100%|██████████| 10/10 [00:14<00:00,  1.42s/it][A
Epochs:  51%|█████▏    | 18/35 [34:05<30:52, 108.96s/it]

Val Loss: 2119.0022 - Val Accuracy: 0.9606



Training:   0%|          | 0/73 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/73 [00:06<07:18,  6.08s/it][A
Training:   3%|▎         | 2/73 [00:06<03:10,  2.68s/it][A
Training:   5%|▌         | 4/73 [00:06<01:11,  1.04s/it][A
Training:   7%|▋         | 5/73 [00:11<02:32,  2.24s/it][A
Training:   8%|▊         | 6/73 [00:11<01:46,  1.58s/it][A
Training:  11%|█         | 8/73 [00:11<00:57,  1.14it/s][A
Training:  12%|█▏        | 9/73 [00:16<02:02,  1.92s/it][A
Training:  16%|█▋        | 12/73 [00:16<00:57,  1.05it/s][A
Training:  19%|█▉        | 14/73 [00:22<01:27,  1.49s/it][A
Training:  21%|██        | 15/73 [00:22<01:11,  1.23s/it][A
Training:  23%|██▎       | 17/73 [00:27<01:33,  1.66s/it][A
Training:  26%|██▌       | 19/73 [00:27<01:01,  1.14s/it][A
Training:  29%|██▉       | 21/73 [00:31<01:18,  1.52s/it][A
Training:  32%|███▏      | 23/73 [00:32<00:52,  1.06s/it][A
Training:  34%|███▍      | 25/73 [00:36<01:09,  1.45s/it][A
Training:  36%|███▌      | 26/73 [00:36

Epoch: 19/35 - Loss: 2070.9019 - Accuracy: 0.9536



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:05<00:46,  5.14s/it][A
 30%|███       | 3/10 [00:05<00:09,  1.39s/it][A
 50%|█████     | 5/10 [00:09<00:09,  1.82s/it][A
 70%|███████   | 7/10 [00:09<00:03,  1.07s/it][A
100%|██████████| 10/10 [00:13<00:00,  1.39s/it][A
Epochs:  54%|█████▍    | 19/35 [35:53<28:57, 108.58s/it]

Val Loss: 2267.5437 - Val Accuracy: 0.9642



Training:   0%|          | 0/73 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/73 [00:05<07:09,  5.96s/it][A
Training:   3%|▎         | 2/73 [00:06<03:04,  2.59s/it][A
Training:   4%|▍         | 3/73 [00:06<01:43,  1.48s/it][A
Training:   5%|▌         | 4/73 [00:06<01:04,  1.06it/s][A
Training:   7%|▋         | 5/73 [00:11<02:38,  2.34s/it][A
Training:  10%|▉         | 7/73 [00:11<01:18,  1.19s/it][A
Training:  11%|█         | 8/73 [00:11<00:59,  1.10it/s][A
Training:  12%|█▏        | 9/73 [00:16<02:13,  2.09s/it][A
Training:  15%|█▌        | 11/73 [00:16<01:14,  1.19s/it][A
Training:  18%|█▊        | 13/73 [00:21<01:38,  1.64s/it][A
Training:  19%|█▉        | 14/73 [00:21<01:20,  1.36s/it][A
Training:  21%|██        | 15/73 [00:22<01:02,  1.08s/it][A
Training:  22%|██▏       | 16/73 [00:22<00:47,  1.19it/s][A
Training:  23%|██▎       | 17/73 [00:26<01:42,  1.83s/it][A
Training:  25%|██▍       | 18/73 [00:27<01:17,  1.41s/it][A
Training:  26%|██▌       | 19/73 [00:27<

Epoch: 20/35 - Loss: 2031.2051 - Accuracy: 0.9542



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:05<00:47,  5.28s/it][A
 30%|███       | 3/10 [00:05<00:10,  1.51s/it][A
 50%|█████     | 5/10 [00:09<00:08,  1.79s/it][A
 60%|██████    | 6/10 [00:09<00:05,  1.37s/it][A
 70%|███████   | 7/10 [00:10<00:03,  1.06s/it][A
100%|██████████| 10/10 [00:13<00:00,  1.39s/it][A
Epochs:  57%|█████▋    | 20/35 [37:39<26:58, 107.91s/it]

Val Loss: 1981.0771 - Val Accuracy: 0.9617



Training:   0%|          | 0/73 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/73 [00:05<06:53,  5.74s/it][A
Training:   3%|▎         | 2/73 [00:05<02:58,  2.51s/it][A
Training:   4%|▍         | 3/73 [00:06<01:39,  1.43s/it][A
Training:   5%|▌         | 4/73 [00:06<01:04,  1.08it/s][A
Training:   7%|▋         | 5/73 [00:11<02:36,  2.30s/it][A
Training:  10%|▉         | 7/73 [00:11<01:17,  1.18s/it][A
Training:  12%|█▏        | 9/73 [00:16<01:48,  1.70s/it][A
Training:  14%|█▎        | 10/73 [00:16<01:23,  1.33s/it][A
Training:  15%|█▌        | 11/73 [00:16<01:07,  1.08s/it][A
Training:  16%|█▋        | 12/73 [00:16<00:50,  1.20it/s][A
Training:  18%|█▊        | 13/73 [00:21<01:48,  1.80s/it][A
Training:  19%|█▉        | 14/73 [00:21<01:18,  1.33s/it][A
Training:  21%|██        | 15/73 [00:21<01:00,  1.04s/it][A
Training:  23%|██▎       | 17/73 [00:26<01:30,  1.61s/it][A
Training:  25%|██▍       | 18/73 [00:26<01:11,  1.31s/it][A
Training:  26%|██▌       | 19/73 [00:26

Epoch: 21/35 - Loss: 1998.4358 - Accuracy: 0.9551



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:05<00:51,  5.70s/it][A
 20%|██        | 2/10 [00:05<00:19,  2.48s/it][A
 40%|████      | 4/10 [00:06<00:06,  1.05s/it][A
 50%|█████     | 5/10 [00:10<00:10,  2.13s/it][A
 60%|██████    | 6/10 [00:11<00:06,  1.58s/it][A
 70%|███████   | 7/10 [00:11<00:03,  1.14s/it][A
 80%|████████  | 8/10 [00:11<00:01,  1.15it/s][A
100%|██████████| 10/10 [00:15<00:00,  1.55s/it][A
Epochs:  60%|██████    | 21/35 [39:29<25:19, 108.57s/it]

Val Loss: 2427.9485 - Val Accuracy: 0.9580



Training:   0%|          | 0/73 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/73 [00:07<09:20,  7.79s/it][A
Training:   4%|▍         | 3/73 [00:07<02:25,  2.09s/it][A
Training:   7%|▋         | 5/73 [00:13<02:39,  2.35s/it][A
Training:   8%|▊         | 6/73 [00:13<01:57,  1.76s/it][A
Training:  10%|▉         | 7/73 [00:13<01:26,  1.31s/it][A
Training:  12%|█▏        | 9/73 [00:18<01:55,  1.81s/it][A
Training:  14%|█▎        | 10/73 [00:18<01:28,  1.41s/it][A
Training:  16%|█▋        | 12/73 [00:18<00:53,  1.15it/s][A
Training:  18%|█▊        | 13/73 [00:23<01:43,  1.73s/it][A
Training:  22%|██▏       | 16/73 [00:23<00:51,  1.11it/s][A
Training:  23%|██▎       | 17/73 [00:28<01:37,  1.74s/it][A
Training:  25%|██▍       | 18/73 [00:28<01:16,  1.40s/it][A
Training:  26%|██▌       | 19/73 [00:29<01:00,  1.12s/it][A
Training:  27%|██▋       | 20/73 [00:29<00:46,  1.15it/s][A
Training:  29%|██▉       | 21/73 [00:33<01:33,  1.79s/it][A
Training:  30%|███       | 22/73 [00:3

Epoch: 22/35 - Loss: 2048.4651 - Accuracy: 0.9547



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:05<00:49,  5.51s/it][A
 20%|██        | 2/10 [00:05<00:18,  2.34s/it][A
 30%|███       | 3/10 [00:05<00:09,  1.32s/it][A
 50%|█████     | 5/10 [00:10<00:08,  1.78s/it][A
 60%|██████    | 6/10 [00:10<00:05,  1.34s/it][A
 80%|████████  | 8/10 [00:10<00:01,  1.32it/s][A
100%|██████████| 10/10 [00:14<00:00,  1.42s/it][A
Epochs:  63%|██████▎   | 22/35 [41:18<23:30, 108.49s/it]

Val Loss: 2836.9922 - Val Accuracy: 0.9585



Training:   0%|          | 0/73 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/73 [00:05<07:00,  5.85s/it][A
Training:   3%|▎         | 2/73 [00:06<02:58,  2.51s/it][A
Training:   4%|▍         | 3/73 [00:06<01:41,  1.45s/it][A
Training:   5%|▌         | 4/73 [00:06<01:05,  1.06it/s][A
Training:   7%|▋         | 5/73 [00:11<02:36,  2.31s/it][A
Training:   8%|▊         | 6/73 [00:11<01:50,  1.66s/it][A
Training:  10%|▉         | 7/73 [00:11<01:16,  1.15s/it][A
Training:  11%|█         | 8/73 [00:11<00:53,  1.22it/s][A
Training:  12%|█▏        | 9/73 [00:15<02:01,  1.89s/it][A
Training:  14%|█▎        | 10/73 [00:16<01:35,  1.51s/it][A
Training:  15%|█▌        | 11/73 [00:16<01:07,  1.08s/it][A
Training:  16%|█▋        | 12/73 [00:16<00:48,  1.26it/s][A
Training:  18%|█▊        | 13/73 [00:20<01:47,  1.79s/it][A
Training:  19%|█▉        | 14/73 [00:21<01:26,  1.46s/it][A
Training:  21%|██        | 15/73 [00:21<01:01,  1.06s/it][A
Training:  22%|██▏       | 16/73 [00:22<0

Epoch: 23/35 - Loss: 2179.6819 - Accuracy: 0.9528



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:05<00:49,  5.50s/it][A
 20%|██        | 2/10 [00:05<00:19,  2.42s/it][A
 30%|███       | 3/10 [00:05<00:09,  1.38s/it][A
 50%|█████     | 5/10 [00:10<00:09,  1.85s/it][A
 60%|██████    | 6/10 [00:10<00:05,  1.40s/it][A
 80%|████████  | 8/10 [00:10<00:01,  1.26it/s][A
100%|██████████| 10/10 [00:14<00:00,  1.48s/it][A
Epochs:  66%|██████▌   | 23/35 [43:07<21:46, 108.84s/it]

Val Loss: 2809.0176 - Val Accuracy: 0.9679



Training:   0%|          | 0/73 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/73 [00:06<07:27,  6.22s/it][A
Training:   3%|▎         | 2/73 [00:06<03:07,  2.64s/it][A
Training:   5%|▌         | 4/73 [00:06<01:10,  1.02s/it][A
Training:   7%|▋         | 5/73 [00:11<02:40,  2.36s/it][A
Training:   8%|▊         | 6/73 [00:11<01:52,  1.68s/it][A
Training:  10%|▉         | 7/73 [00:12<01:19,  1.21s/it][A
Training:  12%|█▏        | 9/73 [00:16<01:53,  1.77s/it][A
Training:  15%|█▌        | 11/73 [00:17<01:09,  1.12s/it][A
Training:  18%|█▊        | 13/73 [00:22<01:38,  1.65s/it][A
Training:  21%|██        | 15/73 [00:22<01:05,  1.14s/it][A
Training:  22%|██▏       | 16/73 [00:22<00:53,  1.06it/s][A
Training:  23%|██▎       | 17/73 [00:27<01:40,  1.79s/it][A
Training:  26%|██▌       | 19/73 [00:28<01:04,  1.19s/it][A
Training:  29%|██▉       | 21/73 [00:32<01:22,  1.58s/it][A
Training:  30%|███       | 22/73 [00:32<01:07,  1.32s/it][A
Training:  32%|███▏      | 23/73 [00:33

Epoch: 24/35 - Loss: 2216.1218 - Accuracy: 0.9576



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:05<00:50,  5.57s/it][A
 20%|██        | 2/10 [00:05<00:18,  2.36s/it][A
 30%|███       | 3/10 [00:05<00:09,  1.34s/it][A
 50%|█████     | 5/10 [00:10<00:09,  1.88s/it][A
 70%|███████   | 7/10 [00:10<00:03,  1.09s/it][A
 80%|████████  | 8/10 [00:10<00:01,  1.17it/s][A
100%|██████████| 10/10 [00:14<00:00,  1.47s/it][A
Epochs:  69%|██████▊   | 24/35 [44:58<20:01, 109.23s/it]

Val Loss: 2542.2942 - Val Accuracy: 0.9606



Training:   0%|          | 0/73 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/73 [00:06<07:41,  6.41s/it][A
Training:   3%|▎         | 2/73 [00:06<03:11,  2.70s/it][A
Training:   5%|▌         | 4/73 [00:06<01:12,  1.05s/it][A
Training:   7%|▋         | 5/73 [00:12<02:44,  2.42s/it][A
Training:   8%|▊         | 6/73 [00:12<01:54,  1.71s/it][A
Training:  11%|█         | 8/73 [00:12<01:02,  1.04it/s][A
Training:  12%|█▏        | 9/73 [00:17<02:05,  1.97s/it][A
Training:  15%|█▌        | 11/73 [00:17<01:13,  1.19s/it][A
Training:  16%|█▋        | 12/73 [00:17<00:58,  1.05it/s][A
Training:  18%|█▊        | 13/73 [00:22<01:58,  1.97s/it][A
Training:  19%|█▉        | 14/73 [00:23<01:27,  1.49s/it][A
Training:  21%|██        | 15/73 [00:23<01:06,  1.14s/it][A
Training:  22%|██▏       | 16/73 [00:23<00:49,  1.15it/s][A
Training:  23%|██▎       | 17/73 [00:28<01:51,  1.99s/it][A
Training:  25%|██▍       | 18/73 [00:28<01:21,  1.49s/it][A
Training:  27%|██▋       | 20/73 [00:28

Epoch: 25/35 - Loss: 2262.3823 - Accuracy: 0.9570



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:05<00:50,  5.57s/it][A
 20%|██        | 2/10 [00:05<00:19,  2.38s/it][A
 30%|███       | 3/10 [00:05<00:09,  1.36s/it][A
 40%|████      | 4/10 [00:06<00:05,  1.14it/s][A
 50%|█████     | 5/10 [00:11<00:12,  2.57s/it][A
 70%|███████   | 7/10 [00:11<00:03,  1.30s/it][A
100%|██████████| 10/10 [00:15<00:00,  1.59s/it][A
Epochs:  71%|███████▏  | 25/35 [46:52<18:28, 110.83s/it]

Val Loss: 2555.9900 - Val Accuracy: 0.9482



Training:   0%|          | 0/73 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/73 [00:06<07:22,  6.14s/it][A
Training:   4%|▍         | 3/73 [00:06<01:55,  1.64s/it][A
Training:   7%|▋         | 5/73 [00:11<02:31,  2.23s/it][A
Training:  10%|▉         | 7/73 [00:12<01:27,  1.32s/it][A
Training:  12%|█▏        | 9/73 [00:17<01:58,  1.85s/it][A
Training:  14%|█▎        | 10/73 [00:17<01:32,  1.48s/it][A
Training:  16%|█▋        | 12/73 [00:17<00:57,  1.06it/s][A
Training:  18%|█▊        | 13/73 [00:22<01:49,  1.82s/it][A
Training:  19%|█▉        | 14/73 [00:22<01:24,  1.44s/it][A
Training:  21%|██        | 15/73 [00:23<01:04,  1.11s/it][A
Training:  23%|██▎       | 17/73 [00:27<01:32,  1.65s/it][A
Training:  25%|██▍       | 18/73 [00:28<01:12,  1.31s/it][A
Training:  27%|██▋       | 20/73 [00:28<00:43,  1.23it/s][A
Training:  29%|██▉       | 21/73 [00:32<01:27,  1.69s/it][A
Training:  32%|███▏      | 23/73 [00:33<00:52,  1.06s/it][A
Training:  34%|███▍      | 25/73 [00:

Epoch: 26/35 - Loss: 1937.7565 - Accuracy: 0.9570



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:05<00:52,  5.83s/it][A
 20%|██        | 2/10 [00:05<00:19,  2.47s/it][A
 30%|███       | 3/10 [00:06<00:09,  1.40s/it][A
 40%|████      | 4/10 [00:06<00:05,  1.06it/s][A
 50%|█████     | 5/10 [00:10<00:11,  2.29s/it][A
 70%|███████   | 7/10 [00:11<00:03,  1.16s/it][A
 80%|████████  | 8/10 [00:11<00:01,  1.12it/s][A
 90%|█████████ | 9/10 [00:16<00:01,  1.95s/it][A
100%|██████████| 10/10 [00:16<00:00,  1.65s/it][A
Epochs:  74%|███████▍  | 26/35 [48:49<16:52, 112.53s/it]

Val Loss: 2379.3684 - Val Accuracy: 0.9518



Training:   0%|          | 0/73 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/73 [00:07<08:29,  7.07s/it][A
Training:   3%|▎         | 2/73 [00:07<03:38,  3.08s/it][A
Training:   4%|▍         | 3/73 [00:07<02:03,  1.77s/it][A
Training:   5%|▌         | 4/73 [00:07<01:19,  1.15s/it][A
Training:   7%|▋         | 5/73 [00:12<02:44,  2.42s/it][A
Training:   8%|▊         | 6/73 [00:12<01:58,  1.77s/it][A
Training:  10%|▉         | 7/73 [00:13<01:21,  1.23s/it][A
Training:  12%|█▏        | 9/73 [00:17<01:52,  1.76s/it][A
Training:  14%|█▎        | 10/73 [00:18<01:30,  1.44s/it][A
Training:  15%|█▌        | 11/73 [00:18<01:07,  1.09s/it][A
Training:  16%|█▋        | 12/73 [00:18<00:50,  1.22it/s][A
Training:  18%|█▊        | 13/73 [00:23<01:53,  1.90s/it][A
Training:  19%|█▉        | 14/73 [00:23<01:25,  1.45s/it][A
Training:  22%|██▏       | 16/73 [00:23<00:46,  1.21it/s][A
Training:  23%|██▎       | 17/73 [00:28<01:37,  1.74s/it][A
Training:  25%|██▍       | 18/73 [00:28<

Epoch: 27/35 - Loss: 2001.0745 - Accuracy: 0.9593



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:05<00:46,  5.16s/it][A
 20%|██        | 2/10 [00:05<00:17,  2.23s/it][A
 40%|████      | 4/10 [00:05<00:05,  1.13it/s][A
 50%|█████     | 5/10 [00:09<00:09,  1.98s/it][A
 70%|███████   | 7/10 [00:10<00:03,  1.10s/it][A
100%|██████████| 10/10 [00:14<00:00,  1.40s/it][A
Epochs:  77%|███████▋  | 27/35 [50:36<14:46, 110.87s/it]

Val Loss: 2247.8469 - Val Accuracy: 0.9378



Training:   0%|          | 0/73 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/73 [00:05<06:50,  5.71s/it][A
Training:   3%|▎         | 2/73 [00:05<02:52,  2.44s/it][A
Training:   4%|▍         | 3/73 [00:06<01:38,  1.40s/it][A
Training:   7%|▋         | 5/73 [00:10<02:13,  1.96s/it][A
Training:   8%|▊         | 6/73 [00:11<01:39,  1.49s/it][A
Training:  11%|█         | 8/73 [00:11<00:55,  1.18it/s][A
Training:  12%|█▏        | 9/73 [00:16<01:55,  1.80s/it][A
Training:  14%|█▎        | 10/73 [00:16<01:27,  1.39s/it][A
Training:  16%|█▋        | 12/73 [00:16<00:51,  1.18it/s][A
Training:  18%|█▊        | 13/73 [00:20<01:39,  1.66s/it][A
Training:  19%|█▉        | 14/73 [00:21<01:20,  1.37s/it][A
Training:  21%|██        | 15/73 [00:21<01:00,  1.04s/it][A
Training:  23%|██▎       | 17/73 [00:25<01:24,  1.51s/it][A
Training:  25%|██▍       | 18/73 [00:26<01:11,  1.30s/it][A
Training:  26%|██▌       | 19/73 [00:26<00:54,  1.01s/it][A
Training:  27%|██▋       | 20/73 [00:26

Epoch: 28/35 - Loss: 2053.7454 - Accuracy: 0.9570



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:05<00:49,  5.46s/it][A
 30%|███       | 3/10 [00:05<00:10,  1.45s/it][A
 50%|█████     | 5/10 [00:10<00:09,  1.93s/it][A
 60%|██████    | 6/10 [00:10<00:05,  1.47s/it][A
 70%|███████   | 7/10 [00:10<00:03,  1.09s/it][A
100%|██████████| 10/10 [00:14<00:00,  1.49s/it][A
Epochs:  80%|████████  | 28/35 [52:24<12:51, 110.20s/it]

Val Loss: 2717.2651 - Val Accuracy: 0.9575



Training:   0%|          | 0/73 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/73 [00:06<08:22,  6.98s/it][A
Training:   3%|▎         | 2/73 [00:07<03:34,  3.03s/it][A
Training:   4%|▍         | 3/73 [00:07<02:05,  1.80s/it][A
Training:   5%|▌         | 4/73 [00:07<01:22,  1.20s/it][A
Training:   7%|▋         | 5/73 [00:12<02:54,  2.57s/it][A
Training:   8%|▊         | 6/73 [00:13<01:57,  1.75s/it][A
Training:  10%|▉         | 7/73 [00:13<01:22,  1.25s/it][A
Training:  12%|█▏        | 9/73 [00:17<01:54,  1.79s/it][A
Training:  15%|█▌        | 11/73 [00:18<01:07,  1.10s/it][A
Training:  16%|█▋        | 12/73 [00:18<00:53,  1.13it/s][A
Training:  18%|█▊        | 13/73 [00:23<01:49,  1.83s/it][A
Training:  19%|█▉        | 14/73 [00:23<01:23,  1.41s/it][A
Training:  21%|██        | 15/73 [00:23<01:02,  1.07s/it][A
Training:  22%|██▏       | 16/73 [00:23<00:46,  1.22it/s][A
Training:  23%|██▎       | 17/73 [00:28<01:42,  1.84s/it][A
Training:  25%|██▍       | 18/73 [00:28<

Epoch: 29/35 - Loss: 2245.0713 - Accuracy: 0.9558



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:05<00:48,  5.41s/it][A
 30%|███       | 3/10 [00:05<00:10,  1.45s/it][A
 50%|█████     | 5/10 [00:10<00:09,  1.91s/it][A
 80%|████████  | 8/10 [00:10<00:01,  1.08it/s][A
100%|██████████| 10/10 [00:14<00:00,  1.43s/it][A
Epochs:  83%|████████▎ | 29/35 [54:11<10:54, 109.02s/it]

Val Loss: 2328.7991 - Val Accuracy: 0.9451



Training:   0%|          | 0/73 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/73 [00:05<06:55,  5.77s/it][A
Training:   3%|▎         | 2/73 [00:05<02:54,  2.46s/it][A
Training:   4%|▍         | 3/73 [00:06<01:39,  1.42s/it][A
Training:   5%|▌         | 4/73 [00:06<01:02,  1.10it/s][A
Training:   7%|▋         | 5/73 [00:11<02:37,  2.31s/it][A
Training:   8%|▊         | 6/73 [00:11<01:48,  1.62s/it][A
Training:  10%|▉         | 7/73 [00:11<01:16,  1.16s/it][A
Training:  11%|█         | 8/73 [00:11<00:55,  1.18it/s][A
Training:  12%|█▏        | 9/73 [00:16<02:10,  2.03s/it][A
Training:  14%|█▎        | 10/73 [00:16<01:40,  1.60s/it][A
Training:  15%|█▌        | 11/73 [00:17<01:15,  1.21s/it][A
Training:  16%|█▋        | 12/73 [00:17<00:55,  1.11it/s][A
Training:  18%|█▊        | 13/73 [00:22<02:13,  2.22s/it][A
Training:  19%|█▉        | 14/73 [00:23<01:38,  1.68s/it][A
Training:  21%|██        | 15/73 [00:23<01:10,  1.21s/it][A
Training:  22%|██▏       | 16/73 [00:23<0

Epoch: 30/35 - Loss: 2376.8196 - Accuracy: 0.9559



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:06<00:57,  6.40s/it][A
 30%|███       | 3/10 [00:06<00:12,  1.73s/it][A
 40%|████      | 4/10 [00:06<00:07,  1.20s/it][A
 50%|█████     | 5/10 [00:12<00:13,  2.65s/it][A
 60%|██████    | 6/10 [00:12<00:07,  1.83s/it][A
 70%|███████   | 7/10 [00:12<00:03,  1.31s/it][A
 80%|████████  | 8/10 [00:12<00:01,  1.05it/s][A
100%|██████████| 10/10 [00:17<00:00,  1.74s/it][A
Epochs:  86%|████████▌ | 30/35 [56:11<09:21, 112.36s/it]

Val Loss: 2366.3193 - Val Accuracy: 0.9637



Training:   0%|          | 0/73 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/73 [00:06<08:10,  6.81s/it][A
Training:   3%|▎         | 2/73 [00:06<03:26,  2.90s/it][A
Training:   4%|▍         | 3/73 [00:07<01:54,  1.64s/it][A
Training:   5%|▌         | 4/73 [00:07<01:12,  1.05s/it][A
Training:   7%|▋         | 5/73 [00:12<02:58,  2.62s/it][A
Training:   8%|▊         | 6/73 [00:12<01:58,  1.76s/it][A
Training:  11%|█         | 8/73 [00:13<01:01,  1.05it/s][A
Training:  12%|█▏        | 9/73 [00:17<02:07,  1.98s/it][A
Training:  15%|█▌        | 11/73 [00:18<01:12,  1.17s/it][A
Training:  18%|█▊        | 13/73 [00:23<01:41,  1.68s/it][A
Training:  21%|██        | 15/73 [00:23<01:05,  1.13s/it][A
Training:  23%|██▎       | 17/73 [00:28<01:25,  1.53s/it][A
Training:  26%|██▌       | 19/73 [00:28<00:57,  1.06s/it][A
Training:  29%|██▉       | 21/73 [00:32<01:15,  1.46s/it][A
Training:  30%|███       | 22/73 [00:32<01:02,  1.22s/it][A
Training:  32%|███▏      | 23/73 [00:33<

Epoch: 31/35 - Loss: 2267.4897 - Accuracy: 0.9565



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:05<00:48,  5.34s/it][A
 20%|██        | 2/10 [00:05<00:18,  2.34s/it][A
 30%|███       | 3/10 [00:05<00:09,  1.32s/it][A
 50%|█████     | 5/10 [00:10<00:09,  1.83s/it][A
 70%|███████   | 7/10 [00:10<00:03,  1.04s/it][A
100%|██████████| 10/10 [00:14<00:00,  1.41s/it][A
Epochs:  89%|████████▊ | 31/35 [57:58<07:22, 110.73s/it]

Val Loss: 2301.4294 - Val Accuracy: 0.9523



Training:   0%|          | 0/73 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/73 [00:06<07:14,  6.03s/it][A
Training:   3%|▎         | 2/73 [00:06<03:01,  2.56s/it][A
Training:   4%|▍         | 3/73 [00:06<01:41,  1.44s/it][A
Training:   5%|▌         | 4/73 [00:06<01:04,  1.07it/s][A
Training:   7%|▋         | 5/73 [00:11<02:37,  2.32s/it][A
Training:   8%|▊         | 6/73 [00:11<01:45,  1.57s/it][A
Training:  11%|█         | 8/73 [00:11<00:54,  1.20it/s][A
Training:  12%|█▏        | 9/73 [00:16<02:02,  1.92s/it][A
Training:  15%|█▌        | 11/73 [00:16<01:11,  1.15s/it][A
Training:  16%|█▋        | 12/73 [00:16<00:56,  1.07it/s][A
Training:  18%|█▊        | 13/73 [00:21<01:51,  1.86s/it][A
Training:  19%|█▉        | 14/73 [00:21<01:22,  1.40s/it][A
Training:  21%|██        | 15/73 [00:21<01:02,  1.07s/it][A
Training:  22%|██▏       | 16/73 [00:21<00:45,  1.25it/s][A
Training:  23%|██▎       | 17/73 [00:26<01:44,  1.87s/it][A
Training:  26%|██▌       | 19/73 [00:26<

Epoch: 32/35 - Loss: 2094.0020 - Accuracy: 0.9576



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:05<00:49,  5.45s/it][A
 40%|████      | 4/10 [00:05<00:06,  1.07s/it][A
 60%|██████    | 6/10 [00:09<00:06,  1.56s/it][A
 80%|████████  | 8/10 [00:10<00:01,  1.01it/s][A
100%|██████████| 10/10 [00:14<00:00,  1.41s/it][A
Epochs:  91%|█████████▏| 32/35 [59:44<05:28, 109.36s/it]

Val Loss: 2551.3220 - Val Accuracy: 0.9648



Training:   0%|          | 0/73 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/73 [00:05<07:04,  5.89s/it][A
Training:   3%|▎         | 2/73 [00:06<02:58,  2.51s/it][A
Training:   4%|▍         | 3/73 [00:06<01:42,  1.46s/it][A
Training:   5%|▌         | 4/73 [00:06<01:05,  1.05it/s][A
Training:   7%|▋         | 5/73 [00:11<02:44,  2.43s/it][A
Training:   8%|▊         | 6/73 [00:11<01:50,  1.65s/it][A
Training:  10%|▉         | 7/73 [00:11<01:16,  1.17s/it][A
Training:  11%|█         | 8/73 [00:11<00:54,  1.20it/s][A
Training:  12%|█▏        | 9/73 [00:16<02:09,  2.02s/it][A
Training:  15%|█▌        | 11/73 [00:16<01:07,  1.10s/it][A
Training:  18%|█▊        | 13/73 [00:21<01:39,  1.65s/it][A
Training:  19%|█▉        | 14/73 [00:21<01:17,  1.32s/it][A
Training:  22%|██▏       | 16/73 [00:21<00:47,  1.19it/s][A
Training:  23%|██▎       | 17/73 [00:26<01:30,  1.62s/it][A
Training:  26%|██▌       | 19/73 [00:26<00:55,  1.03s/it][A
Training:  29%|██▉       | 21/73 [00:30<0

Epoch: 33/35 - Loss: 2240.1868 - Accuracy: 0.9615



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:05<00:50,  5.59s/it][A
 20%|██        | 2/10 [00:05<00:19,  2.38s/it][A
 40%|████      | 4/10 [00:05<00:05,  1.09it/s][A
 60%|██████    | 6/10 [00:10<00:06,  1.66s/it][A
 70%|███████   | 7/10 [00:10<00:03,  1.28s/it][A
 80%|████████  | 8/10 [00:11<00:01,  1.01it/s][A
100%|██████████| 10/10 [00:15<00:00,  1.56s/it][A
Epochs:  94%|█████████▍| 33/35 [1:01:33<03:38, 109.34s/it]

Val Loss: 2496.8940 - Val Accuracy: 0.9383



Training:   0%|          | 0/73 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/73 [00:06<08:20,  6.95s/it][A
Training:   3%|▎         | 2/73 [00:07<03:30,  2.97s/it][A
Training:   4%|▍         | 3/73 [00:07<01:59,  1.71s/it][A
Training:   5%|▌         | 4/73 [00:07<01:14,  1.08s/it][A
Training:   7%|▋         | 5/73 [00:12<02:58,  2.63s/it][A
Training:   8%|▊         | 6/73 [00:13<02:04,  1.86s/it][A
Training:  10%|▉         | 7/73 [00:13<01:25,  1.30s/it][A
Training:  12%|█▏        | 9/73 [00:18<02:02,  1.91s/it][A
Training:  14%|█▎        | 10/73 [00:19<01:38,  1.57s/it][A
Training:  15%|█▌        | 11/73 [00:19<01:14,  1.20s/it][A
Training:  18%|█▊        | 13/73 [00:24<01:46,  1.77s/it][A
Training:  19%|█▉        | 14/73 [00:24<01:24,  1.44s/it][A
Training:  21%|██        | 15/73 [00:24<01:04,  1.11s/it][A
Training:  23%|██▎       | 17/73 [00:29<01:33,  1.67s/it][A
Training:  25%|██▍       | 18/73 [00:30<01:15,  1.37s/it][A
Training:  26%|██▌       | 19/73 [00:30<

Epoch: 34/35 - Loss: 2262.2268 - Accuracy: 0.9582



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:05<00:50,  5.65s/it][A
 20%|██        | 2/10 [00:05<00:19,  2.42s/it][A
 30%|███       | 3/10 [00:06<00:09,  1.40s/it][A
 50%|█████     | 5/10 [00:11<00:10,  2.07s/it][A
 60%|██████    | 6/10 [00:11<00:06,  1.51s/it][A
 80%|████████  | 8/10 [00:11<00:01,  1.17it/s][A
100%|██████████| 10/10 [00:15<00:00,  1.57s/it][A
Epochs:  97%|█████████▋| 34/35 [1:03:33<01:52, 112.59s/it]

Val Loss: 2520.9011 - Val Accuracy: 0.9658



Training:   0%|          | 0/73 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/73 [00:06<08:14,  6.87s/it][A
Training:   4%|▍         | 3/73 [00:07<02:08,  1.83s/it][A
Training:   5%|▌         | 4/73 [00:07<01:25,  1.24s/it][A
Training:   7%|▋         | 5/73 [00:12<02:57,  2.61s/it][A
Training:  10%|▉         | 7/73 [00:12<01:32,  1.40s/it][A
Training:  12%|█▏        | 9/73 [00:18<02:08,  2.00s/it][A
Training:  14%|█▎        | 10/73 [00:18<01:39,  1.58s/it][A
Training:  16%|█▋        | 12/73 [00:18<00:59,  1.02it/s][A
Training:  18%|█▊        | 13/73 [00:23<01:52,  1.88s/it][A
Training:  19%|█▉        | 14/73 [00:24<01:27,  1.48s/it][A
Training:  21%|██        | 15/73 [00:24<01:05,  1.13s/it][A
Training:  23%|██▎       | 17/73 [00:28<01:33,  1.67s/it][A
Training:  26%|██▌       | 19/73 [00:29<00:58,  1.08s/it][A
Training:  29%|██▉       | 21/73 [00:34<01:22,  1.58s/it][A
Training:  32%|███▏      | 23/73 [00:34<00:54,  1.08s/it][A
Training:  33%|███▎      | 24/73 [00:3

Epoch: 35/35 - Loss: 2367.1531 - Accuracy: 0.9579



  0%|          | 0/10 [00:00<?, ?it/s][A
 10%|█         | 1/10 [00:05<00:47,  5.32s/it][A
 30%|███       | 3/10 [00:05<00:10,  1.46s/it][A
 40%|████      | 4/10 [00:05<00:05,  1.00it/s][A
 50%|█████     | 5/10 [00:10<00:10,  2.14s/it][A
 80%|████████  | 8/10 [00:10<00:01,  1.10it/s][A
100%|██████████| 10/10 [00:14<00:00,  1.43s/it][A
Epochs: 100%|██████████| 35/35 [1:05:28<00:00, 112.24s/it]


Val Loss: 2810.1382 - Val Accuracy: 0.9466


[32m[I 2023-12-08 15:29:13,989][0m Trial 3 finished with value: 0.9466322064399719 and parameters: {'loss_learning_rate': 0.0007864547818893396, 'learning_rate': 0.026672551860448212, 'weight_decay': 0.0004995203487508594, 'epsilon': 2.215641865314564e-08, 'beta': 0.4, 'gamma': 0.8, 'batch_size': 193, 'epochs': 35}. Best is trial 0 with value: 0.9648317694664001.[0m


Learning rate for Loss: 0.0042754188900381235
Learning rate: 0.004531367393603924
Weight decay: 0.00046837344629150696
Epsilon: 2.3522348716547854e-09
Beta: 0.4
Gamma: 0.4
Batch size: 209
Number of epochs: 49


Epochs:   0%|          | 0/49 [00:00<?, ?it/s]
Training:   0%|          | 0/67 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/67 [00:06<07:00,  6.37s/it][A
Training:   3%|▎         | 2/67 [00:06<03:06,  2.88s/it][A
Training:   4%|▍         | 3/67 [00:06<01:43,  1.61s/it][A
Training:   6%|▌         | 4/67 [00:07<01:05,  1.05s/it][A
Training:   7%|▋         | 5/67 [00:12<02:32,  2.45s/it][A
Training:   9%|▉         | 6/67 [00:12<01:45,  1.74s/it][A
Training:  10%|█         | 7/67 [00:12<01:12,  1.20s/it][A
Training:  12%|█▏        | 8/67 [00:12<00:50,  1.16it/s][A
Training:  13%|█▎        | 9/67 [00:17<01:56,  2.02s/it][A
Training:  15%|█▍        | 10/67 [00:17<01:23,  1.46s/it][A
Training:  18%|█▊        | 12/67 [00:17<00:47,  1.15it/s][A
Training:  19%|█▉        | 13/67 [00:22<01:40,  1.85s/it][A
Training:  21%|██        | 14/67 [00:22<01:15,  1.43s/it][A
Training:  24%|██▍       | 16/67 [00:22<00:43,  1.18it/s][A
Training:  25%|██▌       | 17/67 [00:26<01:19,  1.59s/it

Epoch: 1/49 - Loss: 24.1722 - Accuracy: 0.8950



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:05<00:44,  5.62s/it][A
 33%|███▎      | 3/9 [00:05<00:09,  1.56s/it][A
 44%|████▍     | 4/9 [00:06<00:05,  1.07s/it][A
 56%|█████▌    | 5/9 [00:10<00:09,  2.27s/it][A
 78%|███████▊  | 7/9 [00:10<00:02,  1.20s/it][A
 89%|████████▉ | 8/9 [00:10<00:00,  1.09it/s][A
100%|██████████| 9/9 [00:12<00:00,  1.38s/it][A
Epochs:   2%|▏         | 1/49 [01:44<1:23:56, 104.94s/it]

Val Loss: 28.2238 - Val Accuracy: 0.9442



Training:   0%|          | 0/67 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/67 [00:06<06:51,  6.23s/it][A
Training:   3%|▎         | 2/67 [00:06<03:09,  2.91s/it][A
Training:   4%|▍         | 3/67 [00:06<01:44,  1.63s/it][A
Training:   6%|▌         | 4/67 [00:07<01:05,  1.03s/it][A
Training:   7%|▋         | 5/67 [00:11<02:24,  2.33s/it][A
Training:   9%|▉         | 6/67 [00:12<01:44,  1.71s/it][A
Training:  12%|█▏        | 8/67 [00:12<00:53,  1.11it/s][A
Training:  13%|█▎        | 9/67 [00:17<01:49,  1.89s/it][A
Training:  15%|█▍        | 10/67 [00:17<01:27,  1.54s/it][A
Training:  16%|█▋        | 11/67 [00:17<01:04,  1.15s/it][A
Training:  18%|█▊        | 12/67 [00:17<00:47,  1.15it/s][A
Training:  19%|█▉        | 13/67 [00:22<01:45,  1.96s/it][A
Training:  21%|██        | 14/67 [00:22<01:18,  1.48s/it][A
Training:  24%|██▍       | 16/67 [00:22<00:42,  1.20it/s][A
Training:  25%|██▌       | 17/67 [00:26<01:17,  1.55s/it][A
Training:  27%|██▋       | 18/67 [00:27<

Epoch: 2/49 - Loss: 31.3945 - Accuracy: 0.9448



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:06<00:54,  6.80s/it][A
 22%|██▏       | 2/9 [00:06<00:20,  2.91s/it][A
 33%|███▎      | 3/9 [00:07<00:09,  1.65s/it][A
 44%|████▍     | 4/9 [00:07<00:05,  1.07s/it][A
 56%|█████▌    | 5/9 [00:13<00:11,  2.76s/it][A
 78%|███████▊  | 7/9 [00:13<00:02,  1.40s/it][A
 89%|████████▉ | 8/9 [00:13<00:01,  1.06s/it][A
100%|██████████| 9/9 [00:15<00:00,  1.67s/it][A
Epochs:   4%|▍         | 2/49 [03:36<1:25:18, 108.90s/it]

Val Loss: 33.4816 - Val Accuracy: 0.9468



Training:   0%|          | 0/67 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/67 [00:07<08:30,  7.73s/it][A
Training:   4%|▍         | 3/67 [00:08<02:15,  2.12s/it][A
Training:   6%|▌         | 4/67 [00:08<01:31,  1.45s/it][A
Training:   7%|▋         | 5/67 [00:14<03:01,  2.93s/it][A
Training:   9%|▉         | 6/67 [00:14<02:14,  2.21s/it][A
Training:  10%|█         | 7/67 [00:15<01:36,  1.61s/it][A
Training:  12%|█▏        | 8/67 [00:15<01:09,  1.18s/it][A
Training:  13%|█▎        | 9/67 [00:21<02:35,  2.68s/it][A
Training:  15%|█▍        | 10/67 [00:22<02:01,  2.13s/it][A
Training:  16%|█▋        | 11/67 [00:22<01:25,  1.52s/it][A
Training:  18%|█▊        | 12/67 [00:22<01:00,  1.11s/it][A
Training:  19%|█▉        | 13/67 [00:27<02:07,  2.35s/it][A
Training:  21%|██        | 14/67 [00:28<01:37,  1.85s/it][A
Training:  24%|██▍       | 16/67 [00:28<00:52,  1.02s/it][A
Training:  25%|██▌       | 17/67 [00:33<01:33,  1.87s/it][A
Training:  27%|██▋       | 18/67 [00:34<

Epoch: 3/49 - Loss: 38.1326 - Accuracy: 0.9494



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:06<00:51,  6.38s/it][A
 33%|███▎      | 3/9 [00:06<00:10,  1.71s/it][A
 56%|█████▌    | 5/9 [00:12<00:09,  2.29s/it][A
 78%|███████▊  | 7/9 [00:12<00:02,  1.34s/it][A
100%|██████████| 9/9 [00:14<00:00,  1.56s/it][A
Epochs:   6%|▌         | 3/49 [05:37<1:27:32, 114.18s/it]

Val Loss: 51.2696 - Val Accuracy: 0.9493



Training:   0%|          | 0/67 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/67 [00:07<07:44,  7.04s/it][A
Training:   3%|▎         | 2/67 [00:07<03:16,  3.02s/it][A
Training:   4%|▍         | 3/67 [00:07<01:48,  1.70s/it][A
Training:   6%|▌         | 4/67 [00:07<01:07,  1.08s/it][A
Training:   7%|▋         | 5/67 [00:14<03:09,  3.06s/it][A
Training:   9%|▉         | 6/67 [00:14<02:05,  2.05s/it][A
Training:  12%|█▏        | 8/67 [00:14<01:08,  1.16s/it][A
Training:  13%|█▎        | 9/67 [00:20<02:10,  2.26s/it][A
Training:  16%|█▋        | 11/67 [00:20<01:14,  1.33s/it][A
Training:  18%|█▊        | 12/67 [00:20<00:57,  1.05s/it][A
Training:  19%|█▉        | 13/67 [00:24<01:44,  1.94s/it][A
Training:  22%|██▏       | 15/67 [00:25<01:00,  1.17s/it][A
Training:  24%|██▍       | 16/67 [00:25<00:51,  1.00s/it][A
Training:  25%|██▌       | 17/67 [00:30<01:38,  1.97s/it][A
Training:  28%|██▊       | 19/67 [00:30<00:56,  1.18s/it][A
Training:  30%|██▉       | 20/67 [00:30<

Epoch: 4/49 - Loss: 41.2169 - Accuracy: 0.9549



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:06<00:52,  6.51s/it][A
 22%|██▏       | 2/9 [00:06<00:19,  2.80s/it][A
 33%|███▎      | 3/9 [00:06<00:09,  1.60s/it][A
 44%|████▍     | 4/9 [00:07<00:05,  1.02s/it][A
 56%|█████▌    | 5/9 [00:11<00:09,  2.35s/it][A
 78%|███████▊  | 7/9 [00:12<00:02,  1.27s/it][A
 89%|████████▉ | 8/9 [00:12<00:00,  1.04it/s][A
100%|██████████| 9/9 [00:13<00:00,  1.50s/it][A
Epochs:   8%|▊         | 4/49 [07:35<1:27:01, 116.04s/it]

Val Loss: 42.1096 - Val Accuracy: 0.9603



Training:   0%|          | 0/67 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/67 [00:06<07:06,  6.46s/it][A
Training:   3%|▎         | 2/67 [00:06<03:01,  2.79s/it][A
Training:   4%|▍         | 3/67 [00:06<01:41,  1.58s/it][A
Training:   6%|▌         | 4/67 [00:07<01:05,  1.05s/it][A
Training:   7%|▋         | 5/67 [00:12<02:38,  2.55s/it][A
Training:   9%|▉         | 6/67 [00:12<01:45,  1.73s/it][A
Training:  10%|█         | 7/67 [00:12<01:12,  1.20s/it][A
Training:  12%|█▏        | 8/67 [00:12<00:52,  1.12it/s][A
Training:  13%|█▎        | 9/67 [00:17<01:58,  2.04s/it][A
Training:  16%|█▋        | 11/67 [00:17<01:02,  1.11s/it][A
Training:  19%|█▉        | 13/67 [00:21<01:23,  1.54s/it][A
Training:  22%|██▏       | 15/67 [00:21<00:52,  1.00s/it][A
Training:  24%|██▍       | 16/67 [00:22<00:43,  1.18it/s][A
Training:  25%|██▌       | 17/67 [00:27<01:32,  1.84s/it][A
Training:  28%|██▊       | 19/67 [00:27<00:54,  1.14s/it][A
Training:  30%|██▉       | 20/67 [00:27<0

Epoch: 5/49 - Loss: 46.3817 - Accuracy: 0.9510



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:06<00:50,  6.30s/it][A
 22%|██▏       | 2/9 [00:06<00:18,  2.71s/it][A
 33%|███▎      | 3/9 [00:06<00:09,  1.61s/it][A
 56%|█████▌    | 5/9 [00:13<00:10,  2.52s/it][A
 67%|██████▋   | 6/9 [00:13<00:05,  1.85s/it][A
 78%|███████▊  | 7/9 [00:13<00:02,  1.41s/it][A
 89%|████████▉ | 8/9 [00:13<00:01,  1.06s/it][A
100%|██████████| 9/9 [00:15<00:00,  1.72s/it][A
Epochs:  10%|█         | 5/49 [09:31<1:24:58, 115.86s/it]

Val Loss: 64.6048 - Val Accuracy: 0.9441



Training:   0%|          | 0/67 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/67 [00:08<09:31,  8.66s/it][A
Training:   3%|▎         | 2/67 [00:08<04:03,  3.75s/it][A
Training:   4%|▍         | 3/67 [00:09<02:20,  2.19s/it][A
Training:   6%|▌         | 4/67 [00:09<01:35,  1.52s/it][A
Training:   7%|▋         | 5/67 [00:15<02:57,  2.86s/it][A
Training:  10%|█         | 7/67 [00:15<01:31,  1.53s/it][A
Training:  12%|█▏        | 8/67 [00:15<01:08,  1.16s/it][A
Training:  13%|█▎        | 9/67 [00:20<02:13,  2.30s/it][A
Training:  16%|█▋        | 11/67 [00:21<01:17,  1.38s/it][A
Training:  18%|█▊        | 12/67 [00:21<00:59,  1.08s/it][A
Training:  19%|█▉        | 13/67 [00:26<01:59,  2.21s/it][A
Training:  21%|██        | 14/67 [00:27<01:27,  1.66s/it][A
Training:  24%|██▍       | 16/67 [00:27<00:49,  1.03it/s][A
Training:  25%|██▌       | 17/67 [00:33<01:45,  2.12s/it][A
Training:  27%|██▋       | 18/67 [00:33<01:19,  1.62s/it][A
Training:  28%|██▊       | 19/67 [00:33<

Epoch: 6/49 - Loss: 48.4394 - Accuracy: 0.9561



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:05<00:45,  5.73s/it][A
 22%|██▏       | 2/9 [00:06<00:17,  2.57s/it][A
 56%|█████▌    | 5/9 [00:10<00:07,  1.85s/it][A
 67%|██████▋   | 6/9 [00:11<00:04,  1.50s/it][A
100%|██████████| 9/9 [00:12<00:00,  1.35s/it][A
Epochs:  12%|█▏        | 6/49 [11:33<1:24:24, 117.78s/it]

Val Loss: 60.0227 - Val Accuracy: 0.9503



Training:   0%|          | 0/67 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/67 [00:06<07:01,  6.39s/it][A
Training:   3%|▎         | 2/67 [00:06<02:55,  2.70s/it][A
Training:   4%|▍         | 3/67 [00:06<01:39,  1.55s/it][A
Training:   6%|▌         | 4/67 [00:06<01:03,  1.01s/it][A
Training:   7%|▋         | 5/67 [00:11<02:29,  2.41s/it][A
Training:   9%|▉         | 6/67 [00:11<01:40,  1.65s/it][A
Training:  12%|█▏        | 8/67 [00:12<00:52,  1.12it/s][A
Training:  13%|█▎        | 9/67 [00:16<01:49,  1.89s/it][A
Training:  15%|█▍        | 10/67 [00:17<01:22,  1.44s/it][A
Training:  16%|█▋        | 11/67 [00:17<01:00,  1.08s/it][A
Training:  19%|█▉        | 13/67 [00:21<01:25,  1.57s/it][A
Training:  21%|██        | 14/67 [00:22<01:10,  1.33s/it][A
Training:  22%|██▏       | 15/67 [00:22<00:54,  1.05s/it][A
Training:  24%|██▍       | 16/67 [00:22<00:42,  1.20it/s][A
Training:  25%|██▌       | 17/67 [00:27<01:35,  1.92s/it][A
Training:  27%|██▋       | 18/67 [00:28<

Epoch: 7/49 - Loss: 50.0748 - Accuracy: 0.9562



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:06<00:51,  6.49s/it][A
 22%|██▏       | 2/9 [00:06<00:19,  2.78s/it][A
 33%|███▎      | 3/9 [00:06<00:09,  1.56s/it][A
 44%|████▍     | 4/9 [00:06<00:05,  1.01s/it][A
 56%|█████▌    | 5/9 [00:11<00:09,  2.31s/it][A
 78%|███████▊  | 7/9 [00:11<00:02,  1.17s/it][A
100%|██████████| 9/9 [00:13<00:00,  1.46s/it][A
Epochs:  14%|█▍        | 7/49 [13:23<1:20:47, 115.42s/it]

Val Loss: 65.6245 - Val Accuracy: 0.9433



Training:   0%|          | 0/67 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/67 [00:06<07:18,  6.64s/it][A
Training:   3%|▎         | 2/67 [00:07<03:20,  3.09s/it][A
Training:   4%|▍         | 3/67 [00:07<01:50,  1.73s/it][A
Training:   6%|▌         | 4/67 [00:07<01:09,  1.10s/it][A
Training:   7%|▋         | 5/67 [00:12<02:29,  2.41s/it][A
Training:   9%|▉         | 6/67 [00:13<01:54,  1.88s/it][A
Training:  10%|█         | 7/67 [00:13<01:18,  1.30s/it][A
Training:  12%|█▏        | 8/67 [00:13<00:55,  1.06it/s][A
Training:  13%|█▎        | 9/67 [00:17<01:59,  2.05s/it][A
Training:  15%|█▍        | 10/67 [00:18<01:33,  1.65s/it][A
Training:  16%|█▋        | 11/67 [00:18<01:05,  1.17s/it][A
Training:  18%|█▊        | 12/67 [00:18<00:46,  1.18it/s][A
Training:  19%|█▉        | 13/67 [00:23<01:49,  2.02s/it][A
Training:  21%|██        | 14/67 [00:24<01:32,  1.75s/it][A
Training:  22%|██▏       | 15/67 [00:25<01:09,  1.34s/it][A
Training:  24%|██▍       | 16/67 [00:25<0

Epoch: 8/49 - Loss: 53.3017 - Accuracy: 0.9544



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:07<01:01,  7.71s/it][A
 22%|██▏       | 2/9 [00:08<00:24,  3.44s/it][A
 33%|███▎      | 3/9 [00:08<00:11,  1.99s/it][A
 44%|████▍     | 4/9 [00:08<00:06,  1.25s/it][A
 56%|█████▌    | 5/9 [00:13<00:11,  2.75s/it][A
 67%|██████▋   | 6/9 [00:14<00:05,  1.87s/it][A
 89%|████████▉ | 8/9 [00:14<00:00,  1.02it/s][A
100%|██████████| 9/9 [00:16<00:00,  1.83s/it][A
Epochs:  16%|█▋        | 8/49 [15:44<1:24:26, 123.57s/it]

Val Loss: 71.3270 - Val Accuracy: 0.9355



Training:   0%|          | 0/67 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/67 [00:08<09:42,  8.82s/it][A
Training:   3%|▎         | 2/67 [00:08<04:02,  3.73s/it][A
Training:   4%|▍         | 3/67 [00:09<02:15,  2.11s/it][A
Training:   6%|▌         | 4/67 [00:09<01:25,  1.36s/it][A
Training:   7%|▋         | 5/67 [00:15<03:18,  3.20s/it][A
Training:   9%|▉         | 6/67 [00:16<02:12,  2.18s/it][A
Training:  10%|█         | 7/67 [00:16<01:30,  1.50s/it][A
Training:  12%|█▏        | 8/67 [00:16<01:05,  1.11s/it][A
Training:  13%|█▎        | 9/67 [00:21<02:23,  2.47s/it][A
Training:  15%|█▍        | 10/67 [00:21<01:39,  1.74s/it][A
Training:  16%|█▋        | 11/67 [00:22<01:09,  1.25s/it][A
Training:  18%|█▊        | 12/67 [00:22<00:50,  1.10it/s][A
Training:  19%|█▉        | 13/67 [00:27<02:04,  2.31s/it][A
Training:  21%|██        | 14/67 [00:27<01:27,  1.66s/it][A
Training:  22%|██▏       | 15/67 [00:28<01:02,  1.20s/it][A
Training:  24%|██▍       | 16/67 [00:28<0

Epoch: 9/49 - Loss: 51.9774 - Accuracy: 0.9529



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:05<00:44,  5.58s/it][A
 22%|██▏       | 2/9 [00:05<00:16,  2.39s/it][A
 33%|███▎      | 3/9 [00:05<00:08,  1.37s/it][A
 56%|█████▌    | 5/9 [00:10<00:07,  1.87s/it][A
 89%|████████▉ | 8/9 [00:10<00:00,  1.15it/s][A
100%|██████████| 9/9 [00:12<00:00,  1.35s/it][A
Epochs:  18%|█▊        | 9/49 [17:34<1:19:34, 119.36s/it]

Val Loss: 58.0212 - Val Accuracy: 0.9551



Training:   0%|          | 0/67 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/67 [00:06<06:36,  6.00s/it][A
Training:   3%|▎         | 2/67 [00:06<02:47,  2.57s/it][A
Training:   4%|▍         | 3/67 [00:06<01:35,  1.49s/it][A
Training:   7%|▋         | 5/67 [00:11<02:13,  2.16s/it][A
Training:   9%|▉         | 6/67 [00:11<01:35,  1.57s/it][A
Training:  12%|█▏        | 8/67 [00:12<00:53,  1.11it/s][A
Training:  13%|█▎        | 9/67 [00:16<01:45,  1.83s/it][A
Training:  16%|█▋        | 11/67 [00:16<01:02,  1.11s/it][A
Training:  18%|█▊        | 12/67 [00:17<00:48,  1.12it/s][A
Training:  19%|█▉        | 13/67 [00:22<01:48,  2.00s/it][A
Training:  22%|██▏       | 15/67 [00:22<01:03,  1.21s/it][A
Training:  25%|██▌       | 17/67 [00:27<01:23,  1.67s/it][A
Training:  27%|██▋       | 18/67 [00:27<01:06,  1.35s/it][A
Training:  28%|██▊       | 19/67 [00:28<00:54,  1.14s/it][A
Training:  30%|██▉       | 20/67 [00:28<00:42,  1.11it/s][A
Training:  31%|███▏      | 21/67 [00:32

Epoch: 10/49 - Loss: 55.5335 - Accuracy: 0.9583



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:05<00:42,  5.29s/it][A
 22%|██▏       | 2/9 [00:05<00:15,  2.25s/it][A
 44%|████▍     | 4/9 [00:05<00:04,  1.12it/s][A
 56%|█████▌    | 5/9 [00:10<00:08,  2.14s/it][A
 78%|███████▊  | 7/9 [00:10<00:02,  1.17s/it][A
100%|██████████| 9/9 [00:12<00:00,  1.36s/it][A
Epochs:  20%|██        | 10/49 [19:18<1:14:31, 114.64s/it]

Val Loss: 69.3006 - Val Accuracy: 0.9496



Training:   0%|          | 0/67 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/67 [00:06<07:03,  6.41s/it][A
Training:   3%|▎         | 2/67 [00:06<02:56,  2.72s/it][A
Training:   6%|▌         | 4/67 [00:06<01:06,  1.05s/it][A
Training:   7%|▋         | 5/67 [00:11<02:22,  2.29s/it][A
Training:  10%|█         | 7/67 [00:11<01:14,  1.24s/it][A
Training:  13%|█▎        | 9/67 [00:16<01:42,  1.76s/it][A
Training:  15%|█▍        | 10/67 [00:17<01:19,  1.39s/it][A
Training:  16%|█▋        | 11/67 [00:17<01:00,  1.09s/it][A
Training:  18%|█▊        | 12/67 [00:17<00:47,  1.16it/s][A
Training:  19%|█▉        | 13/67 [00:22<01:51,  2.07s/it][A
Training:  21%|██        | 14/67 [00:22<01:21,  1.53s/it][A
Training:  22%|██▏       | 15/67 [00:22<00:58,  1.13s/it][A
Training:  25%|██▌       | 17/67 [00:27<01:25,  1.71s/it][A
Training:  27%|██▋       | 18/67 [00:28<01:08,  1.40s/it][A
Training:  28%|██▊       | 19/67 [00:28<00:51,  1.08s/it][A
Training:  30%|██▉       | 20/67 [00:2

Epoch: 11/49 - Loss: 54.9575 - Accuracy: 0.9565



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:05<00:42,  5.29s/it][A
 22%|██▏       | 2/9 [00:05<00:15,  2.26s/it][A
 44%|████▍     | 4/9 [00:05<00:04,  1.13it/s][A
 56%|█████▌    | 5/9 [00:10<00:08,  2.07s/it][A
 67%|██████▋   | 6/9 [00:10<00:04,  1.47s/it][A
 89%|████████▉ | 8/9 [00:10<00:00,  1.23it/s][A
100%|██████████| 9/9 [00:11<00:00,  1.32s/it][A
Epochs:  22%|██▏       | 11/49 [21:03<1:10:39, 111.56s/it]

Val Loss: 69.1777 - Val Accuracy: 0.9515



Training:   0%|          | 0/67 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/67 [00:05<05:59,  5.45s/it][A
Training:   3%|▎         | 2/67 [00:05<02:36,  2.41s/it][A
Training:   4%|▍         | 3/67 [00:05<01:27,  1.36s/it][A
Training:   7%|▋         | 5/67 [00:10<01:58,  1.90s/it][A
Training:  10%|█         | 7/67 [00:10<01:05,  1.09s/it][A
Training:  12%|█▏        | 8/67 [00:10<00:51,  1.15it/s][A
Training:  13%|█▎        | 9/67 [00:16<01:58,  2.05s/it][A
Training:  15%|█▍        | 10/67 [00:16<01:28,  1.56s/it][A
Training:  16%|█▋        | 11/67 [00:16<01:05,  1.18s/it][A
Training:  18%|█▊        | 12/67 [00:16<00:48,  1.12it/s][A
Training:  19%|█▉        | 13/67 [00:21<01:48,  2.01s/it][A
Training:  21%|██        | 14/67 [00:21<01:17,  1.47s/it][A
Training:  22%|██▏       | 15/67 [00:21<00:55,  1.07s/it][A
Training:  24%|██▍       | 16/67 [00:22<00:40,  1.27it/s][A
Training:  25%|██▌       | 17/67 [00:26<01:33,  1.88s/it][A
Training:  27%|██▋       | 18/67 [00:26

Epoch: 12/49 - Loss: 53.4651 - Accuracy: 0.9573



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:05<00:44,  5.56s/it][A
 22%|██▏       | 2/9 [00:05<00:16,  2.35s/it][A
 44%|████▍     | 4/9 [00:05<00:04,  1.09it/s][A
 67%|██████▋   | 6/9 [00:10<00:04,  1.65s/it][A
 89%|████████▉ | 8/9 [00:10<00:01,  1.01s/it][A
100%|██████████| 9/9 [00:12<00:00,  1.34s/it][A
Epochs:  24%|██▍       | 12/49 [22:46<1:07:15, 109.07s/it]

Val Loss: 67.5125 - Val Accuracy: 0.9561



Training:   0%|          | 0/67 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/67 [00:05<06:06,  5.55s/it][A
Training:   3%|▎         | 2/67 [00:06<02:47,  2.58s/it][A
Training:   6%|▌         | 4/67 [00:06<01:03,  1.01s/it][A
Training:   7%|▋         | 5/67 [00:10<02:12,  2.13s/it][A
Training:   9%|▉         | 6/67 [00:11<01:38,  1.62s/it][A
Training:  12%|█▏        | 8/67 [00:11<00:53,  1.11it/s][A
Training:  13%|█▎        | 9/67 [00:16<01:45,  1.82s/it][A
Training:  15%|█▍        | 10/67 [00:16<01:23,  1.47s/it][A
Training:  18%|█▊        | 12/67 [00:16<00:51,  1.07it/s][A
Training:  19%|█▉        | 13/67 [00:21<01:29,  1.66s/it][A
Training:  21%|██        | 14/67 [00:21<01:13,  1.38s/it][A
Training:  24%|██▍       | 16/67 [00:21<00:42,  1.21it/s][A
Training:  25%|██▌       | 17/67 [00:25<01:17,  1.55s/it][A
Training:  27%|██▋       | 18/67 [00:26<01:06,  1.37s/it][A
Training:  30%|██▉       | 20/67 [00:26<00:39,  1.18it/s][A
Training:  31%|███▏      | 21/67 [00:30

Epoch: 13/49 - Loss: 57.4691 - Accuracy: 0.9605



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:05<00:42,  5.33s/it][A
 22%|██▏       | 2/9 [00:05<00:15,  2.28s/it][A
 33%|███▎      | 3/9 [00:05<00:07,  1.30s/it][A
 44%|████▍     | 4/9 [00:05<00:04,  1.17it/s][A
 56%|█████▌    | 5/9 [00:10<00:08,  2.15s/it][A
 78%|███████▊  | 7/9 [00:10<00:02,  1.09s/it][A
100%|██████████| 9/9 [00:11<00:00,  1.29s/it][A
Epochs:  27%|██▋       | 13/49 [24:29<1:04:15, 107.11s/it]

Val Loss: 69.9809 - Val Accuracy: 0.9511



Training:   0%|          | 0/67 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/67 [00:05<06:14,  5.67s/it][A
Training:   3%|▎         | 2/67 [00:05<02:43,  2.51s/it][A
Training:   6%|▌         | 4/67 [00:06<01:04,  1.03s/it][A
Training:   7%|▋         | 5/67 [00:11<02:17,  2.22s/it][A
Training:   9%|▉         | 6/67 [00:11<01:37,  1.60s/it][A
Training:  10%|█         | 7/67 [00:11<01:09,  1.15s/it][A
Training:  12%|█▏        | 8/67 [00:11<00:50,  1.16it/s][A
Training:  13%|█▎        | 9/67 [00:16<01:57,  2.03s/it][A
Training:  15%|█▍        | 10/67 [00:16<01:26,  1.51s/it][A
Training:  16%|█▋        | 11/67 [00:16<01:01,  1.09s/it][A
Training:  18%|█▊        | 12/67 [00:17<00:45,  1.20it/s][A
Training:  19%|█▉        | 13/67 [00:21<01:48,  2.00s/it][A
Training:  21%|██        | 14/67 [00:22<01:17,  1.47s/it][A
Training:  24%|██▍       | 16/67 [00:22<00:47,  1.08it/s][A
Training:  25%|██▌       | 17/67 [00:27<01:30,  1.80s/it][A
Training:  27%|██▋       | 18/67 [00:27<

Epoch: 14/49 - Loss: 53.9876 - Accuracy: 0.9573



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:05<00:42,  5.30s/it][A
 22%|██▏       | 2/9 [00:05<00:17,  2.44s/it][A
 33%|███▎      | 3/9 [00:05<00:08,  1.39s/it][A
 44%|████▍     | 4/9 [00:06<00:04,  1.10it/s][A
 56%|█████▌    | 5/9 [00:10<00:08,  2.03s/it][A
 67%|██████▋   | 6/9 [00:10<00:04,  1.50s/it][A
 89%|████████▉ | 8/9 [00:10<00:00,  1.25it/s][A
100%|██████████| 9/9 [00:11<00:00,  1.28s/it][A
Epochs:  29%|██▊       | 14/49 [26:10<1:01:28, 105.39s/it]

Val Loss: 49.1556 - Val Accuracy: 0.9614



Training:   0%|          | 0/67 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/67 [00:05<06:12,  5.64s/it][A
Training:   3%|▎         | 2/67 [00:05<02:37,  2.42s/it][A
Training:   4%|▍         | 3/67 [00:06<01:30,  1.41s/it][A
Training:   6%|▌         | 4/67 [00:06<00:56,  1.12it/s][A
Training:   7%|▋         | 5/67 [00:11<02:25,  2.34s/it][A
Training:   9%|▉         | 6/67 [00:11<01:36,  1.58s/it][A
Training:  12%|█▏        | 8/67 [00:11<00:50,  1.16it/s][A
Training:  13%|█▎        | 9/67 [00:16<01:52,  1.94s/it][A
Training:  15%|█▍        | 10/67 [00:16<01:22,  1.45s/it][A
Training:  16%|█▋        | 11/67 [00:16<01:00,  1.08s/it][A
Training:  18%|█▊        | 12/67 [00:16<00:44,  1.25it/s][A
Training:  19%|█▉        | 13/67 [00:21<01:50,  2.04s/it][A
Training:  22%|██▏       | 15/67 [00:22<01:00,  1.15s/it][A
Training:  25%|██▌       | 17/67 [00:26<01:23,  1.67s/it][A
Training:  27%|██▋       | 18/67 [00:27<01:05,  1.33s/it][A
Training:  30%|██▉       | 20/67 [00:27<

Epoch: 15/49 - Loss: 54.3468 - Accuracy: 0.9593



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:05<00:42,  5.36s/it][A
 22%|██▏       | 2/9 [00:05<00:16,  2.31s/it][A
 44%|████▍     | 4/9 [00:05<00:04,  1.09it/s][A
 56%|█████▌    | 5/9 [00:10<00:08,  2.08s/it][A
 78%|███████▊  | 7/9 [00:10<00:02,  1.13s/it][A
100%|██████████| 9/9 [00:11<00:00,  1.30s/it][A
Epochs:  31%|███       | 15/49 [27:52<59:05, 104.28s/it]  

Val Loss: 65.1629 - Val Accuracy: 0.9553



Training:   0%|          | 0/67 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/67 [00:05<06:34,  5.98s/it][A
Training:   4%|▍         | 3/67 [00:06<01:45,  1.64s/it][A
Training:   6%|▌         | 4/67 [00:06<01:10,  1.12s/it][A
Training:   7%|▋         | 5/67 [00:11<02:32,  2.46s/it][A
Training:  10%|█         | 7/67 [00:11<01:21,  1.35s/it][A
Training:  12%|█▏        | 8/67 [00:12<01:02,  1.05s/it][A
Training:  13%|█▎        | 9/67 [00:17<02:03,  2.12s/it][A
Training:  16%|█▋        | 11/67 [00:17<01:09,  1.24s/it][A
Training:  18%|█▊        | 12/67 [00:17<00:53,  1.02it/s][A
Training:  19%|█▉        | 13/67 [00:22<01:45,  1.96s/it][A
Training:  21%|██        | 14/67 [00:22<01:17,  1.47s/it][A
Training:  22%|██▏       | 15/67 [00:22<00:57,  1.10s/it][A
Training:  24%|██▍       | 16/67 [00:22<00:42,  1.19it/s][A
Training:  25%|██▌       | 17/67 [00:28<01:46,  2.12s/it][A
Training:  27%|██▋       | 18/67 [00:28<01:15,  1.54s/it][A
Training:  28%|██▊       | 19/67 [00:28

Epoch: 16/49 - Loss: 56.4367 - Accuracy: 0.9588



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:05<00:44,  5.51s/it][A
 22%|██▏       | 2/9 [00:05<00:16,  2.39s/it][A
 44%|████▍     | 4/9 [00:05<00:04,  1.06it/s][A
 56%|█████▌    | 5/9 [00:10<00:07,  2.00s/it][A
 89%|████████▉ | 8/9 [00:10<00:00,  1.13it/s][A
100%|██████████| 9/9 [00:11<00:00,  1.29s/it][A
Epochs:  33%|███▎      | 16/49 [29:35<57:08, 103.89s/it]

Val Loss: 64.5783 - Val Accuracy: 0.9499



Training:   0%|          | 0/67 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/67 [00:06<07:13,  6.57s/it][A
Training:   4%|▍         | 3/67 [00:06<01:52,  1.75s/it][A
Training:   7%|▋         | 5/67 [00:12<02:18,  2.24s/it][A
Training:   9%|▉         | 6/67 [00:12<01:42,  1.67s/it][A
Training:  10%|█         | 7/67 [00:12<01:15,  1.25s/it][A
Training:  12%|█▏        | 8/67 [00:12<00:54,  1.07it/s][A
Training:  13%|█▎        | 9/67 [00:17<01:57,  2.03s/it][A
Training:  16%|█▋        | 11/67 [00:17<01:03,  1.14s/it][A
Training:  19%|█▉        | 13/67 [00:22<01:30,  1.68s/it][A
Training:  21%|██        | 14/67 [00:22<01:11,  1.35s/it][A
Training:  22%|██▏       | 15/67 [00:22<00:54,  1.06s/it][A
Training:  24%|██▍       | 16/67 [00:22<00:41,  1.22it/s][A
Training:  25%|██▌       | 17/67 [00:28<01:42,  2.05s/it][A
Training:  28%|██▊       | 19/67 [00:28<00:58,  1.22s/it][A
Training:  30%|██▉       | 20/67 [00:28<00:45,  1.03it/s][A
Training:  31%|███▏      | 21/67 [00:33

Epoch: 17/49 - Loss: 57.2122 - Accuracy: 0.9607



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:05<00:44,  5.62s/it][A
 22%|██▏       | 2/9 [00:05<00:16,  2.38s/it][A
 44%|████▍     | 4/9 [00:05<00:04,  1.08it/s][A
 67%|██████▋   | 6/9 [00:09<00:04,  1.45s/it][A
 89%|████████▉ | 8/9 [00:10<00:00,  1.10it/s][A
100%|██████████| 9/9 [00:11<00:00,  1.28s/it][A
Epochs:  35%|███▍      | 17/49 [31:17<55:10, 103.45s/it]

Val Loss: 68.2442 - Val Accuracy: 0.9578



Training:   0%|          | 0/67 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/67 [00:05<06:23,  5.80s/it][A
Training:   3%|▎         | 2/67 [00:06<02:55,  2.70s/it][A
Training:   6%|▌         | 4/67 [00:06<01:07,  1.08s/it][A
Training:   7%|▋         | 5/67 [00:11<02:16,  2.20s/it][A
Training:   9%|▉         | 6/67 [00:11<01:45,  1.73s/it][A
Training:  12%|█▏        | 8/67 [00:12<00:55,  1.06it/s][A
Training:  13%|█▎        | 9/67 [00:16<01:44,  1.81s/it][A
Training:  15%|█▍        | 10/67 [00:17<01:26,  1.52s/it][A
Training:  18%|█▊        | 12/67 [00:17<00:50,  1.09it/s][A
Training:  19%|█▉        | 13/67 [00:22<01:36,  1.79s/it][A
Training:  21%|██        | 14/67 [00:22<01:19,  1.50s/it][A
Training:  22%|██▏       | 15/67 [00:22<00:59,  1.15s/it][A
Training:  24%|██▍       | 16/67 [00:22<00:44,  1.15it/s][A
Training:  25%|██▌       | 17/67 [00:27<01:34,  1.88s/it][A
Training:  27%|██▋       | 18/67 [00:27<01:12,  1.47s/it][A
Training:  30%|██▉       | 20/67 [00:27

Epoch: 18/49 - Loss: 55.5701 - Accuracy: 0.9597



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:05<00:45,  5.74s/it][A
 22%|██▏       | 2/9 [00:05<00:17,  2.45s/it][A
 33%|███▎      | 3/9 [00:06<00:08,  1.40s/it][A
 56%|█████▌    | 5/9 [00:10<00:07,  1.79s/it][A
 78%|███████▊  | 7/9 [00:10<00:02,  1.02s/it][A
100%|██████████| 9/9 [00:11<00:00,  1.31s/it][A
Epochs:  37%|███▋      | 18/49 [32:59<53:13, 103.02s/it]

Val Loss: 90.0401 - Val Accuracy: 0.9404



Training:   0%|          | 0/67 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/67 [00:06<06:49,  6.21s/it][A
Training:   4%|▍         | 3/67 [00:06<01:48,  1.69s/it][A
Training:   7%|▋         | 5/67 [00:11<02:13,  2.16s/it][A
Training:   9%|▉         | 6/67 [00:11<01:38,  1.61s/it][A
Training:  10%|█         | 7/67 [00:11<01:11,  1.19s/it][A
Training:  12%|█▏        | 8/67 [00:11<00:52,  1.12it/s][A
Training:  13%|█▎        | 9/67 [00:16<01:58,  2.05s/it][A
Training:  15%|█▍        | 10/67 [00:16<01:24,  1.48s/it][A
Training:  16%|█▋        | 11/67 [00:17<01:00,  1.08s/it][A
Training:  18%|█▊        | 12/67 [00:17<00:44,  1.25it/s][A
Training:  19%|█▉        | 13/67 [00:22<01:52,  2.08s/it][A
Training:  21%|██        | 14/67 [00:22<01:21,  1.55s/it][A
Training:  22%|██▏       | 15/67 [00:22<00:58,  1.12s/it][A
Training:  24%|██▍       | 16/67 [00:22<00:41,  1.22it/s][A
Training:  25%|██▌       | 17/67 [00:27<01:40,  2.01s/it][A
Training:  27%|██▋       | 18/67 [00:27

Epoch: 19/49 - Loss: 57.4345 - Accuracy: 0.9599



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:05<00:41,  5.22s/it][A
 22%|██▏       | 2/9 [00:05<00:16,  2.29s/it][A
 44%|████▍     | 4/9 [00:05<00:04,  1.10it/s][A
 56%|█████▌    | 5/9 [00:09<00:07,  1.94s/it][A
 67%|██████▋   | 6/9 [00:09<00:04,  1.38s/it][A
 89%|████████▉ | 8/9 [00:10<00:00,  1.30it/s][A
100%|██████████| 9/9 [00:11<00:00,  1.26s/it][A
Epochs:  39%|███▉      | 19/49 [34:42<51:25, 102.85s/it]

Val Loss: 63.8559 - Val Accuracy: 0.9455



Training:   0%|          | 0/67 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/67 [00:05<06:35,  5.99s/it][A
Training:   3%|▎         | 2/67 [00:06<02:55,  2.70s/it][A
Training:   6%|▌         | 4/67 [00:06<01:07,  1.06s/it][A
Training:   7%|▋         | 5/67 [00:11<02:16,  2.19s/it][A
Training:   9%|▉         | 6/67 [00:11<01:40,  1.65s/it][A
Training:  12%|█▏        | 8/67 [00:11<00:53,  1.10it/s][A
Training:  13%|█▎        | 9/67 [00:16<01:52,  1.94s/it][A
Training:  15%|█▍        | 10/67 [00:16<01:23,  1.47s/it][A
Training:  18%|█▊        | 12/67 [00:17<00:47,  1.16it/s][A
Training:  19%|█▉        | 13/67 [00:22<01:38,  1.82s/it][A
Training:  21%|██        | 14/67 [00:22<01:17,  1.45s/it][A
Training:  24%|██▍       | 16/67 [00:22<00:44,  1.14it/s][A
Training:  25%|██▌       | 17/67 [00:27<01:29,  1.79s/it][A
Training:  27%|██▋       | 18/67 [00:27<01:09,  1.42s/it][A
Training:  28%|██▊       | 19/67 [00:27<00:51,  1.08s/it][A
Training:  31%|███▏      | 21/67 [00:32

Epoch: 20/49 - Loss: 59.1700 - Accuracy: 0.9613



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:05<00:43,  5.46s/it][A
 22%|██▏       | 2/9 [00:05<00:16,  2.32s/it][A
 44%|████▍     | 4/9 [00:05<00:04,  1.09it/s][A
 56%|█████▌    | 5/9 [00:10<00:07,  1.95s/it][A
 67%|██████▋   | 6/9 [00:10<00:04,  1.41s/it][A
 78%|███████▊  | 7/9 [00:10<00:02,  1.01s/it][A
100%|██████████| 9/9 [00:11<00:00,  1.32s/it][A
Epochs:  41%|████      | 20/49 [36:25<49:41, 102.80s/it]

Val Loss: 74.5620 - Val Accuracy: 0.9546



Training:   0%|          | 0/67 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/67 [00:07<07:57,  7.24s/it][A
Training:   3%|▎         | 2/67 [00:07<03:18,  3.05s/it][A
Training:   4%|▍         | 3/67 [00:07<01:58,  1.85s/it][A
Training:   6%|▌         | 4/67 [00:07<01:13,  1.16s/it][A
Training:   7%|▋         | 5/67 [00:12<02:40,  2.58s/it][A
Training:   9%|▉         | 6/67 [00:13<01:47,  1.76s/it][A
Training:  10%|█         | 7/67 [00:13<01:22,  1.38s/it][A
Training:  12%|█▏        | 8/67 [00:13<00:59,  1.00s/it][A
Training:  13%|█▎        | 9/67 [00:20<02:34,  2.66s/it][A
Training:  15%|█▍        | 10/67 [00:20<01:49,  1.92s/it][A
Training:  16%|█▋        | 11/67 [00:20<01:19,  1.41s/it][A
Training:  18%|█▊        | 12/67 [00:21<00:57,  1.05s/it][A
Training:  19%|█▉        | 13/67 [00:28<02:41,  2.99s/it][A
Training:  21%|██        | 14/67 [00:28<01:57,  2.21s/it][A
Training:  22%|██▏       | 15/67 [00:29<01:28,  1.70s/it][A
Training:  24%|██▍       | 16/67 [00:29<0

Epoch: 21/49 - Loss: 55.4010 - Accuracy: 0.9603



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:07<01:01,  7.73s/it][A
 22%|██▏       | 2/9 [00:08<00:23,  3.34s/it][A
 33%|███▎      | 3/9 [00:08<00:11,  1.89s/it][A
 44%|████▍     | 4/9 [00:08<00:05,  1.18s/it][A
 56%|█████▌    | 5/9 [00:14<00:11,  2.95s/it][A
 67%|██████▋   | 6/9 [00:14<00:06,  2.02s/it][A
 78%|███████▊  | 7/9 [00:14<00:02,  1.45s/it][A
 89%|████████▉ | 8/9 [00:15<00:01,  1.06s/it][A
100%|██████████| 9/9 [00:16<00:00,  1.88s/it][A
Epochs:  43%|████▎     | 21/49 [38:41<52:42, 112.96s/it]

Val Loss: 83.7041 - Val Accuracy: 0.9594



Training:   0%|          | 0/67 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/67 [00:08<09:33,  8.70s/it][A
Training:   4%|▍         | 3/67 [00:08<02:27,  2.31s/it][A
Training:   7%|▋         | 5/67 [00:15<03:02,  2.94s/it][A
Training:   9%|▉         | 6/67 [00:16<02:15,  2.23s/it][A
Training:  10%|█         | 7/67 [00:16<01:40,  1.67s/it][A
Training:  12%|█▏        | 8/67 [00:16<01:14,  1.27s/it][A
Training:  13%|█▎        | 9/67 [00:23<02:44,  2.84s/it][A
Training:  15%|█▍        | 10/67 [00:23<01:59,  2.09s/it][A
Training:  16%|█▋        | 11/67 [00:23<01:24,  1.52s/it][A
Training:  18%|█▊        | 12/67 [00:24<01:03,  1.16s/it][A
Training:  19%|█▉        | 13/67 [00:30<02:24,  2.67s/it][A
Training:  21%|██        | 14/67 [00:30<01:41,  1.91s/it][A
Training:  22%|██▏       | 15/67 [00:30<01:11,  1.38s/it][A
Training:  25%|██▌       | 17/67 [00:37<01:57,  2.35s/it][A
Training:  27%|██▋       | 18/67 [00:37<01:29,  1.82s/it][A
Training:  28%|██▊       | 19/67 [00:38

Epoch: 22/49 - Loss: 55.5453 - Accuracy: 0.9597



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:04<00:39,  4.89s/it][A
 33%|███▎      | 3/9 [00:05<00:08,  1.35s/it][A
 44%|████▍     | 4/9 [00:05<00:04,  1.06it/s][A
 56%|█████▌    | 5/9 [00:09<00:08,  2.12s/it][A
 67%|██████▋   | 6/9 [00:09<00:04,  1.50s/it][A
 89%|████████▉ | 8/9 [00:10<00:00,  1.23it/s][A
100%|██████████| 9/9 [00:11<00:00,  1.27s/it][A
Epochs:  45%|████▍     | 22/49 [40:37<51:16, 113.95s/it]

Val Loss: 90.5727 - Val Accuracy: 0.9535



Training:   0%|          | 0/67 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/67 [00:05<06:04,  5.52s/it][A
Training:   4%|▍         | 3/67 [00:05<01:35,  1.49s/it][A
Training:   7%|▋         | 5/67 [00:11<02:12,  2.14s/it][A
Training:  10%|█         | 7/67 [00:11<01:16,  1.27s/it][A
Training:  13%|█▎        | 9/67 [00:16<01:43,  1.78s/it][A
Training:  16%|█▋        | 11/67 [00:16<01:06,  1.19s/it][A
Training:  19%|█▉        | 13/67 [00:22<01:31,  1.70s/it][A
Training:  22%|██▏       | 15/67 [00:22<01:01,  1.19s/it][A
Training:  25%|██▌       | 17/67 [00:27<01:22,  1.64s/it][A
Training:  28%|██▊       | 19/67 [00:27<00:55,  1.15s/it][A
Training:  31%|███▏      | 21/67 [00:33<01:15,  1.64s/it][A
Training:  34%|███▍      | 23/67 [00:33<00:51,  1.16s/it][A
Training:  37%|███▋      | 25/67 [00:38<01:03,  1.51s/it][A
Training:  40%|████      | 27/67 [00:38<00:43,  1.08s/it][A
Training:  43%|████▎     | 29/67 [00:42<00:55,  1.47s/it][A
Training:  46%|████▋     | 31/67 [00:

Epoch: 23/49 - Loss: 58.8869 - Accuracy: 0.9613



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:04<00:38,  4.86s/it][A
 22%|██▏       | 2/9 [00:05<00:14,  2.09s/it][A
 33%|███▎      | 3/9 [00:05<00:07,  1.20s/it][A
 44%|████▍     | 4/9 [00:05<00:03,  1.30it/s][A
 56%|█████▌    | 5/9 [00:09<00:08,  2.10s/it][A
 78%|███████▊  | 7/9 [00:09<00:02,  1.06s/it][A
100%|██████████| 9/9 [00:11<00:00,  1.26s/it][A
Epochs:  47%|████▋     | 23/49 [42:20<47:56, 110.65s/it]

Val Loss: 68.1763 - Val Accuracy: 0.9530



Training:   0%|          | 0/67 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/67 [00:05<06:00,  5.46s/it][A
Training:   3%|▎         | 2/67 [00:05<02:33,  2.37s/it][A
Training:   4%|▍         | 3/67 [00:05<01:26,  1.35s/it][A
Training:   6%|▌         | 4/67 [00:05<00:55,  1.14it/s][A
Training:   7%|▋         | 5/67 [00:10<02:22,  2.29s/it][A
Training:   9%|▉         | 6/67 [00:11<01:40,  1.64s/it][A
Training:  12%|█▏        | 8/67 [00:11<00:52,  1.12it/s][A
Training:  13%|█▎        | 9/67 [00:16<01:52,  1.93s/it][A
Training:  15%|█▍        | 10/67 [00:16<01:24,  1.49s/it][A
Training:  16%|█▋        | 11/67 [00:16<01:02,  1.12s/it][A
Training:  19%|█▉        | 13/67 [00:21<01:31,  1.70s/it][A
Training:  21%|██        | 14/67 [00:22<01:14,  1.40s/it][A
Training:  22%|██▏       | 15/67 [00:22<00:55,  1.07s/it][A
Training:  24%|██▍       | 16/67 [00:22<00:45,  1.13it/s][A
Training:  25%|██▌       | 17/67 [00:26<01:32,  1.85s/it][A
Training:  27%|██▋       | 18/67 [00:27<

Epoch: 24/49 - Loss: 61.3767 - Accuracy: 0.9600



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:04<00:36,  4.57s/it][A
 22%|██▏       | 2/9 [00:04<00:14,  2.06s/it][A
 33%|███▎      | 3/9 [00:05<00:07,  1.19s/it][A
 44%|████▍     | 4/9 [00:05<00:04,  1.24it/s][A
 56%|█████▌    | 5/9 [00:09<00:08,  2.01s/it][A
 78%|███████▊  | 7/9 [00:09<00:02,  1.03s/it][A
100%|██████████| 9/9 [00:11<00:00,  1.24s/it][A
Epochs:  49%|████▉     | 24/49 [44:03<45:05, 108.23s/it]

Val Loss: 84.1397 - Val Accuracy: 0.9471



Training:   0%|          | 0/67 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/67 [00:05<05:50,  5.31s/it][A
Training:   3%|▎         | 2/67 [00:05<02:40,  2.47s/it][A
Training:   6%|▌         | 4/67 [00:05<01:00,  1.04it/s][A
Training:   7%|▋         | 5/67 [00:11<02:24,  2.32s/it][A
Training:   9%|▉         | 6/67 [00:11<01:40,  1.65s/it][A
Training:  10%|█         | 7/67 [00:11<01:11,  1.19s/it][A
Training:  13%|█▎        | 9/67 [00:16<01:47,  1.85s/it][A
Training:  16%|█▋        | 11/67 [00:16<01:03,  1.14s/it][A
Training:  18%|█▊        | 12/67 [00:17<00:50,  1.10it/s][A
Training:  19%|█▉        | 13/67 [00:22<01:45,  1.95s/it][A
Training:  21%|██        | 14/67 [00:22<01:19,  1.49s/it][A
Training:  22%|██▏       | 15/67 [00:22<00:58,  1.12s/it][A
Training:  24%|██▍       | 16/67 [00:22<00:43,  1.18it/s][A
Training:  25%|██▌       | 17/67 [00:27<01:42,  2.04s/it][A
Training:  28%|██▊       | 19/67 [00:27<00:55,  1.16s/it][A
Training:  31%|███▏      | 21/67 [00:33

Epoch: 25/49 - Loss: 58.2212 - Accuracy: 0.9607



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:05<00:40,  5.11s/it][A
 22%|██▏       | 2/9 [00:05<00:15,  2.16s/it][A
 44%|████▍     | 4/9 [00:05<00:04,  1.16it/s][A
 56%|█████▌    | 5/9 [00:10<00:08,  2.04s/it][A
 78%|███████▊  | 7/9 [00:10<00:02,  1.11s/it][A
100%|██████████| 9/9 [00:11<00:00,  1.28s/it][A
Epochs:  51%|█████     | 25/49 [45:45<42:34, 106.45s/it]

Val Loss: 83.2673 - Val Accuracy: 0.9578



Training:   0%|          | 0/67 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/67 [00:05<06:00,  5.46s/it][A
Training:   3%|▎         | 2/67 [00:05<02:34,  2.37s/it][A
Training:   4%|▍         | 3/67 [00:05<01:26,  1.34s/it][A
Training:   6%|▌         | 4/67 [00:05<00:55,  1.14it/s][A
Training:   7%|▋         | 5/67 [00:11<02:32,  2.45s/it][A
Training:   9%|▉         | 6/67 [00:11<01:42,  1.68s/it][A
Training:  10%|█         | 7/67 [00:11<01:10,  1.17s/it][A
Training:  13%|█▎        | 9/67 [00:16<01:43,  1.79s/it][A
Training:  15%|█▍        | 10/67 [00:16<01:19,  1.40s/it][A
Training:  18%|█▊        | 12/67 [00:16<00:46,  1.17it/s][A
Training:  19%|█▉        | 13/67 [00:21<01:32,  1.72s/it][A
Training:  21%|██        | 14/67 [00:21<01:15,  1.42s/it][A
Training:  24%|██▍       | 16/67 [00:22<00:46,  1.09it/s][A
Training:  25%|██▌       | 17/67 [00:26<01:27,  1.74s/it][A
Training:  27%|██▋       | 18/67 [00:27<01:10,  1.44s/it][A
Training:  30%|██▉       | 20/67 [00:27<

Epoch: 26/49 - Loss: 63.4229 - Accuracy: 0.9588



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:04<00:38,  4.81s/it][A
 33%|███▎      | 3/9 [00:04<00:07,  1.30s/it][A
 44%|████▍     | 4/9 [00:05<00:04,  1.09it/s][A
 56%|█████▌    | 5/9 [00:10<00:08,  2.23s/it][A
 67%|██████▋   | 6/9 [00:10<00:04,  1.55s/it][A
 89%|████████▉ | 8/9 [00:10<00:00,  1.19it/s][A
100%|██████████| 9/9 [00:11<00:00,  1.27s/it][A
Epochs:  53%|█████▎    | 26/49 [47:27<40:18, 105.17s/it]

Val Loss: 69.7783 - Val Accuracy: 0.9520



Training:   0%|          | 0/67 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/67 [00:05<06:24,  5.83s/it][A
Training:   3%|▎         | 2/67 [00:05<02:40,  2.47s/it][A
Training:   4%|▍         | 3/67 [00:06<01:29,  1.39s/it][A
Training:   6%|▌         | 4/67 [00:06<00:57,  1.11it/s][A
Training:   7%|▋         | 5/67 [00:11<02:38,  2.56s/it][A
Training:  10%|█         | 7/67 [00:11<01:17,  1.28s/it][A
Training:  13%|█▎        | 9/67 [00:17<01:50,  1.90s/it][A
Training:  15%|█▍        | 10/67 [00:17<01:25,  1.50s/it][A
Training:  16%|█▋        | 11/67 [00:17<01:05,  1.16s/it][A
Training:  18%|█▊        | 12/67 [00:17<00:48,  1.13it/s][A
Training:  19%|█▉        | 13/67 [00:22<01:46,  1.97s/it][A
Training:  22%|██▏       | 15/67 [00:22<00:59,  1.14s/it][A
Training:  25%|██▌       | 17/67 [00:28<01:29,  1.79s/it][A
Training:  27%|██▋       | 18/67 [00:28<01:10,  1.43s/it][A
Training:  28%|██▊       | 19/67 [00:28<00:53,  1.12s/it][A
Training:  30%|██▉       | 20/67 [00:28

Epoch: 27/49 - Loss: 60.5172 - Accuracy: 0.9614



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:04<00:38,  4.77s/it][A
 22%|██▏       | 2/9 [00:05<00:14,  2.11s/it][A
 33%|███▎      | 3/9 [00:05<00:07,  1.22s/it][A
 56%|█████▌    | 5/9 [00:09<00:07,  1.87s/it][A
 78%|███████▊  | 7/9 [00:10<00:02,  1.08s/it][A
100%|██████████| 9/9 [00:11<00:00,  1.27s/it][A
Epochs:  55%|█████▌    | 27/49 [49:13<38:37, 105.35s/it]

Val Loss: 60.4441 - Val Accuracy: 0.9515



Training:   0%|          | 0/67 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/67 [00:05<06:32,  5.95s/it][A
Training:   3%|▎         | 2/67 [00:06<02:47,  2.58s/it][A
Training:   4%|▍         | 3/67 [00:06<01:33,  1.46s/it][A
Training:   6%|▌         | 4/67 [00:06<00:58,  1.07it/s][A
Training:   7%|▋         | 5/67 [00:11<02:36,  2.52s/it][A
Training:   9%|▉         | 6/67 [00:12<01:48,  1.77s/it][A
Training:  10%|█         | 7/67 [00:12<01:15,  1.26s/it][A
Training:  12%|█▏        | 8/67 [00:12<00:54,  1.08it/s][A
Training:  13%|█▎        | 9/67 [00:17<02:05,  2.17s/it][A
Training:  15%|█▍        | 10/67 [00:17<01:31,  1.60s/it][A
Training:  16%|█▋        | 11/67 [00:17<01:04,  1.15s/it][A
Training:  19%|█▉        | 13/67 [00:22<01:33,  1.74s/it][A
Training:  21%|██        | 14/67 [00:23<01:15,  1.42s/it][A
Training:  22%|██▏       | 15/67 [00:23<00:55,  1.07s/it][A
Training:  24%|██▍       | 16/67 [00:23<00:41,  1.23it/s][A
Training:  25%|██▌       | 17/67 [00:28<0

Epoch: 28/49 - Loss: 61.6703 - Accuracy: 0.9632



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:05<00:41,  5.20s/it][A
 22%|██▏       | 2/9 [00:05<00:15,  2.22s/it][A
 33%|███▎      | 3/9 [00:05<00:07,  1.26s/it][A
 56%|█████▌    | 5/9 [00:10<00:07,  1.86s/it][A
 78%|███████▊  | 7/9 [00:10<00:02,  1.05s/it][A
100%|██████████| 9/9 [00:11<00:00,  1.26s/it][A
Epochs:  57%|█████▋    | 28/49 [50:57<36:41, 104.81s/it]

Val Loss: 74.9643 - Val Accuracy: 0.9509



Training:   0%|          | 0/67 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/67 [00:06<06:48,  6.19s/it][A
Training:   3%|▎         | 2/67 [00:06<02:51,  2.64s/it][A
Training:   4%|▍         | 3/67 [00:06<01:35,  1.49s/it][A
Training:   6%|▌         | 4/67 [00:06<01:00,  1.04it/s][A
Training:   7%|▋         | 5/67 [00:11<02:35,  2.50s/it][A
Training:   9%|▉         | 6/67 [00:12<01:44,  1.71s/it][A
Training:  10%|█         | 7/67 [00:12<01:12,  1.20s/it][A
Training:  12%|█▏        | 8/67 [00:12<00:50,  1.16it/s][A
Training:  13%|█▎        | 9/67 [00:17<02:09,  2.22s/it][A
Training:  15%|█▍        | 10/67 [00:17<01:29,  1.57s/it][A
Training:  18%|█▊        | 12/67 [00:17<00:49,  1.12it/s][A
Training:  19%|█▉        | 13/67 [00:22<01:42,  1.90s/it][A
Training:  21%|██        | 14/67 [00:23<01:17,  1.46s/it][A
Training:  24%|██▍       | 16/67 [00:23<00:44,  1.14it/s][A
Training:  25%|██▌       | 17/67 [00:28<01:38,  1.96s/it][A
Training:  27%|██▋       | 18/67 [00:28<0

Epoch: 29/49 - Loss: 60.2576 - Accuracy: 0.9629



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:05<00:47,  5.95s/it][A
 22%|██▏       | 2/9 [00:06<00:17,  2.53s/it][A
 33%|███▎      | 3/9 [00:06<00:08,  1.48s/it][A
 44%|████▍     | 4/9 [00:06<00:04,  1.03it/s][A
 56%|█████▌    | 5/9 [00:10<00:08,  2.21s/it][A
 78%|███████▊  | 7/9 [00:11<00:02,  1.12s/it][A
100%|██████████| 9/9 [00:12<00:00,  1.37s/it][A
Epochs:  59%|█████▉    | 29/49 [52:45<35:19, 105.99s/it]

Val Loss: 93.0681 - Val Accuracy: 0.9551



Training:   0%|          | 0/67 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/67 [00:06<07:10,  6.52s/it][A
Training:   3%|▎         | 2/67 [00:06<02:59,  2.75s/it][A
Training:   6%|▌         | 4/67 [00:06<01:07,  1.07s/it][A
Training:   7%|▋         | 5/67 [00:12<02:34,  2.49s/it][A
Training:  10%|█         | 7/67 [00:12<01:23,  1.39s/it][A
Training:  13%|█▎        | 9/67 [00:18<01:51,  1.92s/it][A
Training:  15%|█▍        | 10/67 [00:18<01:32,  1.62s/it][A
Training:  16%|█▋        | 11/67 [00:19<01:13,  1.31s/it][A
Training:  19%|█▉        | 13/67 [00:24<01:37,  1.80s/it][A
Training:  21%|██        | 14/67 [00:24<01:21,  1.54s/it][A
Training:  22%|██▏       | 15/67 [00:25<01:04,  1.24s/it][A
Training:  24%|██▍       | 16/67 [00:25<00:49,  1.03it/s][A
Training:  25%|██▌       | 17/67 [00:30<01:39,  1.99s/it][A
Training:  27%|██▋       | 18/67 [00:30<01:15,  1.54s/it][A
Training:  28%|██▊       | 19/67 [00:30<00:59,  1.24s/it][A
Training:  31%|███▏      | 21/67 [00:3

Epoch: 30/49 - Loss: 60.6040 - Accuracy: 0.9638



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:05<00:46,  5.84s/it][A
 22%|██▏       | 2/9 [00:05<00:17,  2.47s/it][A
 33%|███▎      | 3/9 [00:06<00:08,  1.39s/it][A
 56%|█████▌    | 5/9 [00:10<00:07,  1.87s/it][A
 78%|███████▊  | 7/9 [00:10<00:02,  1.06s/it][A
100%|██████████| 9/9 [00:11<00:00,  1.31s/it][A
Epochs:  61%|██████    | 30/49 [54:34<33:46, 106.67s/it]

Val Loss: 103.6198 - Val Accuracy: 0.9515



Training:   0%|          | 0/67 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/67 [00:06<06:50,  6.22s/it][A
Training:   3%|▎         | 2/67 [00:06<02:51,  2.64s/it][A
Training:   4%|▍         | 3/67 [00:06<01:37,  1.52s/it][A
Training:   6%|▌         | 4/67 [00:06<01:03,  1.00s/it][A
Training:   7%|▋         | 5/67 [00:11<02:31,  2.44s/it][A
Training:  10%|█         | 7/67 [00:11<01:14,  1.24s/it][A
Training:  13%|█▎        | 9/67 [00:17<01:47,  1.85s/it][A
Training:  15%|█▍        | 10/67 [00:17<01:22,  1.45s/it][A
Training:  18%|█▊        | 12/67 [00:17<00:49,  1.11it/s][A
Training:  19%|█▉        | 13/67 [00:22<01:36,  1.79s/it][A
Training:  21%|██        | 14/67 [00:22<01:13,  1.39s/it][A
Training:  24%|██▍       | 16/67 [00:22<00:43,  1.18it/s][A
Training:  25%|██▌       | 17/67 [00:27<01:32,  1.85s/it][A
Training:  27%|██▋       | 18/67 [00:28<01:10,  1.43s/it][A
Training:  30%|██▉       | 20/67 [00:28<00:41,  1.14it/s][A
Training:  31%|███▏      | 21/67 [00:32

Epoch: 31/49 - Loss: 66.0538 - Accuracy: 0.9631



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:05<00:43,  5.49s/it][A
 22%|██▏       | 2/9 [00:05<00:16,  2.32s/it][A
 33%|███▎      | 3/9 [00:05<00:08,  1.34s/it][A
 44%|████▍     | 4/9 [00:05<00:04,  1.17it/s][A
 56%|█████▌    | 5/9 [00:10<00:08,  2.09s/it][A
 67%|██████▋   | 6/9 [00:10<00:04,  1.42s/it][A
 78%|███████▊  | 7/9 [00:10<00:02,  1.01s/it][A
100%|██████████| 9/9 [00:11<00:00,  1.28s/it][A
Epochs:  63%|██████▎   | 31/49 [56:17<31:42, 105.69s/it]

Val Loss: 94.8034 - Val Accuracy: 0.9515



Training:   0%|          | 0/67 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/67 [00:05<06:33,  5.96s/it][A
Training:   4%|▍         | 3/67 [00:06<01:43,  1.62s/it][A
Training:   6%|▌         | 4/67 [00:06<01:10,  1.12s/it][A
Training:   7%|▋         | 5/67 [00:11<02:35,  2.51s/it][A
Training:   9%|▉         | 6/67 [00:11<01:46,  1.75s/it][A
Training:  10%|█         | 7/67 [00:11<01:15,  1.26s/it][A
Training:  12%|█▏        | 8/67 [00:12<00:54,  1.08it/s][A
Training:  13%|█▎        | 9/67 [00:17<02:04,  2.15s/it][A
Training:  15%|█▍        | 10/67 [00:17<01:28,  1.55s/it][A
Training:  18%|█▊        | 12/67 [00:17<00:47,  1.15it/s][A
Training:  19%|█▉        | 13/67 [00:22<01:43,  1.92s/it][A
Training:  21%|██        | 14/67 [00:22<01:17,  1.46s/it][A
Training:  22%|██▏       | 15/67 [00:22<00:57,  1.11s/it][A
Training:  24%|██▍       | 16/67 [00:23<00:43,  1.18it/s][A
Training:  25%|██▌       | 17/67 [00:27<01:36,  1.93s/it][A
Training:  27%|██▋       | 18/67 [00:27<

Epoch: 32/49 - Loss: 65.4914 - Accuracy: 0.9599



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:05<00:46,  5.82s/it][A
 22%|██▏       | 2/9 [00:05<00:17,  2.48s/it][A
 33%|███▎      | 3/9 [00:06<00:08,  1.42s/it][A
 44%|████▍     | 4/9 [00:06<00:04,  1.09it/s][A
 56%|█████▌    | 5/9 [00:10<00:08,  2.13s/it][A
 78%|███████▊  | 7/9 [00:10<00:02,  1.08s/it][A
100%|██████████| 9/9 [00:11<00:00,  1.31s/it][A
Epochs:  65%|██████▌   | 32/49 [58:01<29:44, 104.99s/it]

Val Loss: 84.4037 - Val Accuracy: 0.9521



Training:   0%|          | 0/67 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/67 [00:05<06:23,  5.80s/it][A
Training:   3%|▎         | 2/67 [00:06<02:45,  2.55s/it][A
Training:   4%|▍         | 3/67 [00:06<01:42,  1.61s/it][A
Training:   7%|▋         | 5/67 [00:11<02:12,  2.13s/it][A
Training:  10%|█         | 7/67 [00:12<01:16,  1.28s/it][A
Training:  12%|█▏        | 8/67 [00:12<01:00,  1.02s/it][A
Training:  13%|█▎        | 9/67 [00:17<01:57,  2.03s/it][A
Training:  15%|█▍        | 10/67 [00:17<01:26,  1.52s/it][A
Training:  18%|█▊        | 12/67 [00:17<00:48,  1.12it/s][A
Training:  19%|█▉        | 13/67 [00:22<01:44,  1.93s/it][A
Training:  21%|██        | 14/67 [00:22<01:18,  1.48s/it][A
Training:  22%|██▏       | 15/67 [00:23<00:57,  1.11s/it][A
Training:  24%|██▍       | 16/67 [00:23<00:42,  1.19it/s][A
Training:  25%|██▌       | 17/67 [00:28<01:46,  2.13s/it][A
Training:  27%|██▋       | 18/67 [00:28<01:16,  1.56s/it][A
Training:  28%|██▊       | 19/67 [00:28

Epoch: 33/49 - Loss: 59.3673 - Accuracy: 0.9631



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:05<00:45,  5.63s/it][A
 22%|██▏       | 2/9 [00:06<00:17,  2.53s/it][A
 44%|████▍     | 4/9 [00:06<00:05,  1.00s/it][A
 56%|█████▌    | 5/9 [00:10<00:07,  1.95s/it][A
 67%|██████▋   | 6/9 [00:10<00:04,  1.44s/it][A
 89%|████████▉ | 8/9 [00:10<00:00,  1.26it/s][A
100%|██████████| 9/9 [00:11<00:00,  1.30s/it][A
Epochs:  67%|██████▋   | 33/49 [59:46<27:59, 105.00s/it]

Val Loss: 75.2201 - Val Accuracy: 0.9597



Training:   0%|          | 0/67 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/67 [00:06<06:52,  6.25s/it][A
Training:   3%|▎         | 2/67 [00:06<02:52,  2.66s/it][A
Training:   6%|▌         | 4/67 [00:06<01:05,  1.04s/it][A
Training:   7%|▋         | 5/67 [00:11<02:27,  2.38s/it][A
Training:   9%|▉         | 6/67 [00:12<01:43,  1.70s/it][A
Training:  12%|█▏        | 8/67 [00:12<00:55,  1.07it/s][A
Training:  13%|█▎        | 9/67 [00:17<01:55,  2.00s/it][A
Training:  15%|█▍        | 10/67 [00:17<01:28,  1.55s/it][A
Training:  16%|█▋        | 11/67 [00:17<01:05,  1.16s/it][A
Training:  18%|█▊        | 12/67 [00:17<00:48,  1.14it/s][A
Training:  19%|█▉        | 13/67 [00:22<01:47,  1.99s/it][A
Training:  21%|██        | 14/67 [00:23<01:19,  1.50s/it][A
Training:  22%|██▏       | 15/67 [00:23<00:57,  1.11s/it][A
Training:  24%|██▍       | 16/67 [00:23<00:41,  1.23it/s][A
Training:  25%|██▌       | 17/67 [00:27<01:38,  1.96s/it][A
Training:  27%|██▋       | 18/67 [00:28

Epoch: 34/49 - Loss: 58.2651 - Accuracy: 0.9612



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:05<00:43,  5.39s/it][A
 22%|██▏       | 2/9 [00:05<00:16,  2.38s/it][A
 33%|███▎      | 3/9 [00:05<00:08,  1.36s/it][A
 44%|████▍     | 4/9 [00:05<00:04,  1.12it/s][A
 56%|█████▌    | 5/9 [00:10<00:08,  2.06s/it][A
 78%|███████▊  | 7/9 [00:10<00:02,  1.04s/it][A
 89%|████████▉ | 8/9 [00:10<00:00,  1.26it/s][A
100%|██████████| 9/9 [00:11<00:00,  1.27s/it][A
Epochs:  69%|██████▉   | 34/49 [1:01:28<26:05, 104.36s/it]

Val Loss: 77.1452 - Val Accuracy: 0.9479



Training:   0%|          | 0/67 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/67 [00:06<06:53,  6.27s/it][A
Training:   3%|▎         | 2/67 [00:06<02:54,  2.69s/it][A
Training:   4%|▍         | 3/67 [00:06<01:39,  1.55s/it][A
Training:   6%|▌         | 4/67 [00:06<01:03,  1.00s/it][A
Training:   7%|▋         | 5/67 [00:12<02:36,  2.52s/it][A
Training:  10%|█         | 7/67 [00:12<01:16,  1.28s/it][A
Training:  12%|█▏        | 8/67 [00:12<00:59,  1.00s/it][A
Training:  13%|█▎        | 9/67 [00:17<02:05,  2.16s/it][A
Training:  15%|█▍        | 10/67 [00:17<01:30,  1.59s/it][A
Training:  18%|█▊        | 12/67 [00:18<00:53,  1.03it/s][A
Training:  19%|█▉        | 13/67 [00:23<01:45,  1.95s/it][A
Training:  22%|██▏       | 15/67 [00:23<01:01,  1.18s/it][A
Training:  24%|██▍       | 16/67 [00:23<00:49,  1.02it/s][A
Training:  25%|██▌       | 17/67 [00:28<01:36,  1.94s/it][A
Training:  27%|██▋       | 18/67 [00:28<01:12,  1.48s/it][A
Training:  28%|██▊       | 19/67 [00:28<

Epoch: 35/49 - Loss: 62.0854 - Accuracy: 0.9640



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:05<00:44,  5.53s/it][A
 33%|███▎      | 3/9 [00:05<00:08,  1.49s/it][A
 56%|█████▌    | 5/9 [00:09<00:07,  1.81s/it][A
 78%|███████▊  | 7/9 [00:10<00:02,  1.08s/it][A
100%|██████████| 9/9 [00:11<00:00,  1.26s/it][A
Epochs:  71%|███████▏  | 35/49 [1:03:12<24:17, 104.12s/it]

Val Loss: 78.7032 - Val Accuracy: 0.9576



Training:   0%|          | 0/67 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/67 [00:06<06:40,  6.06s/it][A
Training:   3%|▎         | 2/67 [00:06<02:59,  2.77s/it][A
Training:   4%|▍         | 3/67 [00:06<01:40,  1.57s/it][A
Training:   6%|▌         | 4/67 [00:06<01:03,  1.01s/it][A
Training:   7%|▋         | 5/67 [00:12<02:44,  2.65s/it][A
Training:   9%|▉         | 6/67 [00:12<01:53,  1.87s/it][A
Training:  12%|█▏        | 8/67 [00:12<00:57,  1.02it/s][A
Training:  13%|█▎        | 9/67 [00:18<02:00,  2.08s/it][A
Training:  15%|█▍        | 10/67 [00:18<01:33,  1.63s/it][A
Training:  18%|█▊        | 12/67 [00:18<00:52,  1.04it/s][A
Training:  19%|█▉        | 13/67 [00:23<01:45,  1.96s/it][A
Training:  21%|██        | 14/67 [00:24<01:27,  1.65s/it][A
Training:  24%|██▍       | 16/67 [00:24<00:50,  1.01it/s][A
Training:  25%|██▌       | 17/67 [00:29<01:38,  1.97s/it][A
Training:  27%|██▋       | 18/67 [00:30<01:20,  1.64s/it][A
Training:  28%|██▊       | 19/67 [00:30<

Epoch: 36/49 - Loss: 64.6700 - Accuracy: 0.9613



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:05<00:46,  5.77s/it][A
 33%|███▎      | 3/9 [00:05<00:09,  1.55s/it][A
 56%|█████▌    | 5/9 [00:10<00:07,  1.89s/it][A
100%|██████████| 9/9 [00:11<00:00,  1.30s/it][A
Epochs:  73%|███████▎  | 36/49 [1:05:00<22:48, 105.27s/it]

Val Loss: 80.6029 - Val Accuracy: 0.9393



Training:   0%|          | 0/67 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/67 [00:06<07:04,  6.44s/it][A
Training:   3%|▎         | 2/67 [00:06<02:56,  2.72s/it][A
Training:   6%|▌         | 4/67 [00:06<01:06,  1.05s/it][A
Training:   7%|▋         | 5/67 [00:12<02:27,  2.37s/it][A
Training:  10%|█         | 7/67 [00:12<01:17,  1.30s/it][A
Training:  13%|█▎        | 9/67 [00:17<01:46,  1.84s/it][A
Training:  15%|█▍        | 10/67 [00:17<01:23,  1.47s/it][A
Training:  16%|█▋        | 11/67 [00:17<01:04,  1.15s/it][A
Training:  18%|█▊        | 12/67 [00:17<00:49,  1.11it/s][A
Training:  19%|█▉        | 13/67 [00:22<01:47,  2.00s/it][A
Training:  21%|██        | 14/67 [00:23<01:18,  1.48s/it][A
Training:  22%|██▏       | 15/67 [00:23<00:57,  1.10s/it][A
Training:  25%|██▌       | 17/67 [00:28<01:26,  1.73s/it][A
Training:  27%|██▋       | 18/67 [00:28<01:06,  1.35s/it][A
Training:  28%|██▊       | 19/67 [00:28<00:50,  1.05s/it][A
Training:  30%|██▉       | 20/67 [00:2

Epoch: 37/49 - Loss: 61.8942 - Accuracy: 0.9625



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:05<00:46,  5.75s/it][A
 22%|██▏       | 2/9 [00:05<00:17,  2.43s/it][A
 33%|███▎      | 3/9 [00:05<00:08,  1.37s/it][A
 44%|████▍     | 4/9 [00:06<00:04,  1.14it/s][A
 56%|█████▌    | 5/9 [00:10<00:08,  2.00s/it][A
 78%|███████▊  | 7/9 [00:10<00:02,  1.02s/it][A
100%|██████████| 9/9 [00:11<00:00,  1.28s/it][A
Epochs:  76%|███████▌  | 37/49 [1:06:43<20:55, 104.62s/it]

Val Loss: 71.6146 - Val Accuracy: 0.9558



Training:   0%|          | 0/67 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/67 [00:06<06:49,  6.21s/it][A
Training:   3%|▎         | 2/67 [00:06<02:51,  2.63s/it][A
Training:   4%|▍         | 3/67 [00:06<01:37,  1.52s/it][A
Training:   6%|▌         | 4/67 [00:06<01:00,  1.03it/s][A
Training:   7%|▋         | 5/67 [00:11<02:31,  2.44s/it][A
Training:   9%|▉         | 6/67 [00:11<01:41,  1.66s/it][A
Training:  10%|█         | 7/67 [00:12<01:11,  1.19s/it][A
Training:  12%|█▏        | 8/67 [00:12<00:50,  1.16it/s][A
Training:  13%|█▎        | 9/67 [00:17<02:03,  2.12s/it][A
Training:  15%|█▍        | 10/67 [00:17<01:26,  1.52s/it][A
Training:  16%|█▋        | 11/67 [00:17<01:05,  1.18s/it][A
Training:  18%|█▊        | 12/67 [00:17<00:46,  1.17it/s][A
Training:  19%|█▉        | 13/67 [00:22<01:48,  2.00s/it][A
Training:  21%|██        | 14/67 [00:22<01:15,  1.43s/it][A
Training:  22%|██▏       | 15/67 [00:22<00:54,  1.06s/it][A
Training:  24%|██▍       | 16/67 [00:22<0

Epoch: 38/49 - Loss: 60.1382 - Accuracy: 0.9627



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:05<00:45,  5.64s/it][A
 22%|██▏       | 2/9 [00:05<00:16,  2.40s/it][A
 44%|████▍     | 4/9 [00:05<00:04,  1.04it/s][A
 56%|█████▌    | 5/9 [00:09<00:07,  1.85s/it][A
 78%|███████▊  | 7/9 [00:09<00:02,  1.01s/it][A
100%|██████████| 9/9 [00:11<00:00,  1.27s/it][A
Epochs:  78%|███████▊  | 38/49 [1:08:26<19:04, 104.05s/it]

Val Loss: 84.7407 - Val Accuracy: 0.9536



Training:   0%|          | 0/67 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/67 [00:06<07:02,  6.39s/it][A
Training:   3%|▎         | 2/67 [00:06<02:55,  2.71s/it][A
Training:   4%|▍         | 3/67 [00:06<01:39,  1.55s/it][A
Training:   6%|▌         | 4/67 [00:06<01:03,  1.00s/it][A
Training:   7%|▋         | 5/67 [00:11<02:34,  2.49s/it][A
Training:   9%|▉         | 6/67 [00:12<01:42,  1.68s/it][A
Training:  12%|█▏        | 8/67 [00:12<00:52,  1.13it/s][A
Training:  13%|█▎        | 9/67 [00:17<01:58,  2.05s/it][A
Training:  15%|█▍        | 10/67 [00:17<01:28,  1.55s/it][A
Training:  16%|█▋        | 11/67 [00:17<01:05,  1.17s/it][A
Training:  18%|█▊        | 12/67 [00:18<00:48,  1.13it/s][A
Training:  19%|█▉        | 13/67 [00:22<01:45,  1.95s/it][A
Training:  21%|██        | 14/67 [00:23<01:17,  1.46s/it][A
Training:  22%|██▏       | 15/67 [00:23<00:55,  1.07s/it][A
Training:  25%|██▌       | 17/67 [00:28<01:29,  1.79s/it][A
Training:  27%|██▋       | 18/67 [00:28<

Epoch: 39/49 - Loss: 59.9255 - Accuracy: 0.9619



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:05<00:45,  5.71s/it][A
 22%|██▏       | 2/9 [00:05<00:17,  2.44s/it][A
 33%|███▎      | 3/9 [00:06<00:08,  1.39s/it][A
 44%|████▍     | 4/9 [00:06<00:04,  1.13it/s][A
 56%|█████▌    | 5/9 [00:10<00:08,  2.05s/it][A
 67%|██████▋   | 6/9 [00:10<00:04,  1.47s/it][A
 89%|████████▉ | 8/9 [00:10<00:00,  1.28it/s][A
100%|██████████| 9/9 [00:11<00:00,  1.32s/it][A
Epochs:  80%|███████▉  | 39/49 [1:10:12<17:28, 104.81s/it]

Val Loss: 94.4497 - Val Accuracy: 0.9573



Training:   0%|          | 0/67 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/67 [00:06<07:23,  6.72s/it][A
Training:   3%|▎         | 2/67 [00:06<03:04,  2.84s/it][A
Training:   4%|▍         | 3/67 [00:06<01:42,  1.59s/it][A
Training:   7%|▋         | 5/67 [00:12<02:19,  2.25s/it][A
Training:   9%|▉         | 6/67 [00:12<01:42,  1.68s/it][A
Training:  10%|█         | 7/67 [00:12<01:14,  1.24s/it][A
Training:  13%|█▎        | 9/67 [00:18<01:51,  1.92s/it][A
Training:  15%|█▍        | 10/67 [00:18<01:24,  1.48s/it][A
Training:  16%|█▋        | 11/67 [00:18<01:04,  1.15s/it][A
Training:  19%|█▉        | 13/67 [00:24<01:37,  1.80s/it][A
Training:  21%|██        | 14/67 [00:24<01:16,  1.44s/it][A
Training:  22%|██▏       | 15/67 [00:24<00:57,  1.11s/it][A
Training:  25%|██▌       | 17/67 [00:29<01:26,  1.72s/it][A
Training:  27%|██▋       | 18/67 [00:29<01:06,  1.36s/it][A
Training:  30%|██▉       | 20/67 [00:29<00:40,  1.17it/s][A
Training:  31%|███▏      | 21/67 [00:34

Epoch: 40/49 - Loss: 64.1702 - Accuracy: 0.9623



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:05<00:43,  5.50s/it][A
 22%|██▏       | 2/9 [00:05<00:16,  2.33s/it][A
 33%|███▎      | 3/9 [00:05<00:08,  1.34s/it][A
 44%|████▍     | 4/9 [00:05<00:04,  1.17it/s][A
 56%|█████▌    | 5/9 [00:09<00:07,  1.95s/it][A
 78%|███████▊  | 7/9 [00:09<00:02,  1.01s/it][A
100%|██████████| 9/9 [00:11<00:00,  1.26s/it][A
Epochs:  82%|████████▏ | 40/49 [1:11:58<15:45, 105.01s/it]

Val Loss: 82.6106 - Val Accuracy: 0.9610



Training:   0%|          | 0/67 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/67 [00:06<06:56,  6.31s/it][A
Training:   3%|▎         | 2/67 [00:06<03:02,  2.81s/it][A
Training:   6%|▌         | 4/67 [00:06<01:08,  1.08s/it][A
Training:   7%|▋         | 5/67 [00:12<02:27,  2.39s/it][A
Training:   9%|▉         | 6/67 [00:12<01:45,  1.73s/it][A
Training:  10%|█         | 7/67 [00:12<01:14,  1.24s/it][A
Training:  12%|█▏        | 8/67 [00:12<00:54,  1.09it/s][A
Training:  13%|█▎        | 9/67 [00:17<01:57,  2.02s/it][A
Training:  15%|█▍        | 10/67 [00:17<01:30,  1.59s/it][A
Training:  18%|█▊        | 12/67 [00:17<00:49,  1.12it/s][A
Training:  19%|█▉        | 13/67 [00:22<01:40,  1.86s/it][A
Training:  21%|██        | 14/67 [00:23<01:22,  1.55s/it][A
Training:  22%|██▏       | 15/67 [00:23<01:01,  1.18s/it][A
Training:  25%|██▌       | 17/67 [00:28<01:23,  1.66s/it][A
Training:  27%|██▋       | 18/67 [00:28<01:06,  1.35s/it][A
Training:  30%|██▉       | 20/67 [00:28<

Epoch: 41/49 - Loss: 63.8027 - Accuracy: 0.9630



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:05<00:45,  5.70s/it][A
 33%|███▎      | 3/9 [00:05<00:09,  1.53s/it][A
 44%|████▍     | 4/9 [00:05<00:05,  1.04s/it][A
 56%|█████▌    | 5/9 [00:10<00:08,  2.10s/it][A
 78%|███████▊  | 7/9 [00:10<00:02,  1.11s/it][A
100%|██████████| 9/9 [00:11<00:00,  1.32s/it][A
Epochs:  84%|████████▎ | 41/49 [1:13:41<13:55, 104.42s/it]

Val Loss: 80.8512 - Val Accuracy: 0.9551



Training:   0%|          | 0/67 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/67 [00:06<06:54,  6.28s/it][A
Training:   3%|▎         | 2/67 [00:06<02:54,  2.68s/it][A
Training:   6%|▌         | 4/67 [00:06<01:05,  1.04s/it][A
Training:   7%|▋         | 5/67 [00:12<02:34,  2.50s/it][A
Training:   9%|▉         | 6/67 [00:12<01:49,  1.80s/it][A
Training:  12%|█▏        | 8/67 [00:12<00:58,  1.01it/s][A
Training:  13%|█▎        | 9/67 [00:17<01:59,  2.05s/it][A
Training:  15%|█▍        | 10/67 [00:18<01:28,  1.56s/it][A
Training:  16%|█▋        | 11/67 [00:18<01:05,  1.17s/it][A
Training:  18%|█▊        | 12/67 [00:18<00:49,  1.12it/s][A
Training:  19%|█▉        | 13/67 [00:23<01:51,  2.07s/it][A
Training:  22%|██▏       | 15/67 [00:23<01:01,  1.18s/it][A
Training:  24%|██▍       | 16/67 [00:23<00:46,  1.09it/s][A
Training:  25%|██▌       | 17/67 [00:28<01:39,  1.99s/it][A
Training:  28%|██▊       | 19/67 [00:28<00:56,  1.18s/it][A
Training:  31%|███▏      | 21/67 [00:33

Epoch: 42/49 - Loss: 60.3503 - Accuracy: 0.9631



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:05<00:46,  5.82s/it][A
 22%|██▏       | 2/9 [00:06<00:17,  2.50s/it][A
 44%|████▍     | 4/9 [00:06<00:04,  1.02it/s][A
 56%|█████▌    | 5/9 [00:10<00:08,  2.10s/it][A
 67%|██████▋   | 6/9 [00:11<00:04,  1.53s/it][A
 89%|████████▉ | 8/9 [00:11<00:00,  1.18it/s][A
100%|██████████| 9/9 [00:12<00:00,  1.40s/it][A
Epochs:  86%|████████▌ | 42/49 [1:15:26<12:12, 104.67s/it]

Val Loss: 95.3572 - Val Accuracy: 0.9265



Training:   0%|          | 0/67 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/67 [00:07<07:45,  7.05s/it][A
Training:   3%|▎         | 2/67 [00:07<03:13,  2.97s/it][A
Training:   4%|▍         | 3/67 [00:07<01:46,  1.67s/it][A
Training:   7%|▋         | 5/67 [00:13<02:25,  2.35s/it][A
Training:   9%|▉         | 6/67 [00:13<01:46,  1.75s/it][A
Training:  12%|█▏        | 8/67 [00:13<00:58,  1.01it/s][A
Training:  13%|█▎        | 9/67 [00:18<01:57,  2.02s/it][A
Training:  15%|█▍        | 10/67 [00:18<01:27,  1.53s/it][A
Training:  16%|█▋        | 11/67 [00:18<01:04,  1.15s/it][A
Training:  18%|█▊        | 12/67 [00:19<00:47,  1.16it/s][A
Training:  19%|█▉        | 13/67 [00:24<01:57,  2.17s/it][A
Training:  22%|██▏       | 15/67 [00:24<01:04,  1.23s/it][A
Training:  24%|██▍       | 16/67 [00:24<00:49,  1.04it/s][A
Training:  25%|██▌       | 17/67 [00:30<01:44,  2.10s/it][A
Training:  28%|██▊       | 19/67 [00:30<01:00,  1.26s/it][A
Training:  30%|██▉       | 20/67 [00:30

Epoch: 43/49 - Loss: 64.3828 - Accuracy: 0.9601



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:05<00:44,  5.56s/it][A
 33%|███▎      | 3/9 [00:05<00:08,  1.49s/it][A
 56%|█████▌    | 5/9 [00:10<00:07,  1.84s/it][A
 67%|██████▋   | 6/9 [00:10<00:04,  1.40s/it][A
 89%|████████▉ | 8/9 [00:10<00:00,  1.22it/s][A
100%|██████████| 9/9 [00:11<00:00,  1.30s/it][A
Epochs:  88%|████████▊ | 43/49 [1:17:13<10:32, 105.36s/it]

Val Loss: 90.6679 - Val Accuracy: 0.9437



Training:   0%|          | 0/67 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/67 [00:06<06:48,  6.18s/it][A
Training:   3%|▎         | 2/67 [00:06<02:54,  2.69s/it][A
Training:   4%|▍         | 3/67 [00:06<01:43,  1.61s/it][A
Training:   7%|▋         | 5/67 [00:11<02:08,  2.08s/it][A
Training:   9%|▉         | 6/67 [00:11<01:34,  1.54s/it][A
Training:  10%|█         | 7/67 [00:12<01:11,  1.20s/it][A
Training:  12%|█▏        | 8/67 [00:12<00:51,  1.14it/s][A
Training:  13%|█▎        | 9/67 [00:17<01:59,  2.06s/it][A
Training:  15%|█▍        | 10/67 [00:17<01:26,  1.51s/it][A
Training:  18%|█▊        | 12/67 [00:17<00:46,  1.17it/s][A
Training:  19%|█▉        | 13/67 [00:22<01:43,  1.92s/it][A
Training:  21%|██        | 14/67 [00:22<01:16,  1.45s/it][A
Training:  22%|██▏       | 15/67 [00:22<00:56,  1.09s/it][A
Training:  25%|██▌       | 17/67 [00:28<01:26,  1.73s/it][A
Training:  28%|██▊       | 19/67 [00:28<00:54,  1.13s/it][A
Training:  30%|██▉       | 20/67 [00:28<

Epoch: 44/49 - Loss: 61.1453 - Accuracy: 0.9631



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:05<00:42,  5.34s/it][A
 33%|███▎      | 3/9 [00:05<00:08,  1.45s/it][A
 44%|████▍     | 4/9 [00:05<00:04,  1.02it/s][A
 56%|█████▌    | 5/9 [00:10<00:08,  2.13s/it][A
 67%|██████▋   | 6/9 [00:10<00:04,  1.49s/it][A
 89%|████████▉ | 8/9 [00:10<00:00,  1.24it/s][A
100%|██████████| 9/9 [00:11<00:00,  1.30s/it][A
Epochs:  90%|████████▉ | 44/49 [1:18:56<08:43, 104.73s/it]

Val Loss: 79.0447 - Val Accuracy: 0.9471



Training:   0%|          | 0/67 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/67 [00:06<07:13,  6.57s/it][A
Training:   3%|▎         | 2/67 [00:06<03:00,  2.78s/it][A
Training:   6%|▌         | 4/67 [00:06<01:07,  1.08s/it][A
Training:   7%|▋         | 5/67 [00:12<02:28,  2.39s/it][A
Training:  10%|█         | 7/67 [00:12<01:18,  1.30s/it][A
Training:  13%|█▎        | 9/67 [00:17<01:47,  1.86s/it][A
Training:  15%|█▍        | 10/67 [00:17<01:24,  1.48s/it][A
Training:  16%|█▋        | 11/67 [00:17<01:04,  1.15s/it][A
Training:  19%|█▉        | 13/67 [00:23<01:35,  1.78s/it][A
Training:  21%|██        | 14/67 [00:23<01:14,  1.41s/it][A
Training:  22%|██▏       | 15/67 [00:23<00:58,  1.12s/it][A
Training:  24%|██▍       | 16/67 [00:23<00:44,  1.15it/s][A
Training:  25%|██▌       | 17/67 [00:28<01:31,  1.83s/it][A
Training:  28%|██▊       | 19/67 [00:28<00:52,  1.09s/it][A
Training:  31%|███▏      | 21/67 [00:32<01:07,  1.46s/it][A
Training:  34%|███▍      | 23/67 [00:3

Epoch: 45/49 - Loss: 63.7223 - Accuracy: 0.9618



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:06<00:48,  6.04s/it][A
 33%|███▎      | 3/9 [00:06<00:09,  1.66s/it][A
 44%|████▍     | 4/9 [00:06<00:05,  1.14s/it][A
 56%|█████▌    | 5/9 [00:11<00:09,  2.34s/it][A
 67%|██████▋   | 6/9 [00:11<00:04,  1.62s/it][A
 78%|███████▊  | 7/9 [00:11<00:02,  1.17s/it][A
100%|██████████| 9/9 [00:12<00:00,  1.43s/it][A
Epochs:  92%|█████████▏| 45/49 [1:20:46<07:04, 106.24s/it]

Val Loss: 79.0339 - Val Accuracy: 0.9614



Training:   0%|          | 0/67 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/67 [00:06<07:11,  6.54s/it][A
Training:   4%|▍         | 3/67 [00:06<01:52,  1.75s/it][A
Training:   6%|▌         | 4/67 [00:06<01:16,  1.21s/it][A
Training:   7%|▋         | 5/67 [00:12<02:47,  2.70s/it][A
Training:  10%|█         | 7/67 [00:12<01:26,  1.45s/it][A
Training:  12%|█▏        | 8/67 [00:12<01:05,  1.11s/it][A
Training:  13%|█▎        | 9/67 [00:18<02:06,  2.19s/it][A
Training:  15%|█▍        | 10/67 [00:18<01:37,  1.71s/it][A
Training:  16%|█▋        | 11/67 [00:18<01:11,  1.28s/it][A
Training:  19%|█▉        | 13/67 [00:23<01:35,  1.77s/it][A
Training:  21%|██        | 14/67 [00:24<01:21,  1.54s/it][A
Training:  24%|██▍       | 16/67 [00:24<00:47,  1.07it/s][A
Training:  25%|██▌       | 17/67 [00:29<01:27,  1.76s/it][A
Training:  27%|██▋       | 18/67 [00:29<01:14,  1.52s/it][A
Training:  30%|██▉       | 20/67 [00:29<00:43,  1.09it/s][A
Training:  31%|███▏      | 21/67 [00:33

Epoch: 46/49 - Loss: 61.0099 - Accuracy: 0.9634



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:05<00:40,  5.12s/it][A
 22%|██▏       | 2/9 [00:05<00:15,  2.19s/it][A
 44%|████▍     | 4/9 [00:05<00:04,  1.17it/s][A
 56%|█████▌    | 5/9 [00:10<00:08,  2.07s/it][A
 67%|██████▋   | 6/9 [00:10<00:04,  1.50s/it][A
100%|██████████| 9/9 [00:11<00:00,  1.30s/it][A
Epochs:  94%|█████████▍| 46/49 [1:22:31<05:17, 105.94s/it]

Val Loss: 83.6325 - Val Accuracy: 0.9613



Training:   0%|          | 0/67 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/67 [00:06<06:59,  6.36s/it][A
Training:   3%|▎         | 2/67 [00:06<02:57,  2.73s/it][A
Training:   4%|▍         | 3/67 [00:06<01:38,  1.55s/it][A
Training:   7%|▋         | 5/67 [00:12<02:21,  2.28s/it][A
Training:  10%|█         | 7/67 [00:12<01:17,  1.29s/it][A
Training:  13%|█▎        | 9/67 [00:17<01:47,  1.85s/it][A
Training:  15%|█▍        | 10/67 [00:18<01:23,  1.47s/it][A
Training:  16%|█▋        | 11/67 [00:18<01:05,  1.17s/it][A
Training:  18%|█▊        | 12/67 [00:18<00:50,  1.09it/s][A
Training:  19%|█▉        | 13/67 [00:23<01:50,  2.04s/it][A
Training:  22%|██▏       | 15/67 [00:23<01:01,  1.18s/it][A
Training:  25%|██▌       | 17/67 [00:28<01:26,  1.73s/it][A
Training:  28%|██▊       | 19/67 [00:29<00:54,  1.14s/it][A
Training:  30%|██▉       | 20/67 [00:29<00:44,  1.07it/s][A
Training:  31%|███▏      | 21/67 [00:33<01:14,  1.61s/it][A
Training:  33%|███▎      | 22/67 [00:3

Epoch: 47/49 - Loss: 62.9366 - Accuracy: 0.9656



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:05<00:43,  5.45s/it][A
 22%|██▏       | 2/9 [00:05<00:16,  2.33s/it][A
 44%|████▍     | 4/9 [00:05<00:04,  1.08it/s][A
 56%|█████▌    | 5/9 [00:10<00:08,  2.13s/it][A
 67%|██████▋   | 6/9 [00:10<00:04,  1.51s/it][A
 89%|████████▉ | 8/9 [00:10<00:00,  1.20it/s][A
100%|██████████| 9/9 [00:12<00:00,  1.36s/it][A
Epochs:  96%|█████████▌| 47/49 [1:24:19<03:32, 106.41s/it]

Val Loss: 77.8801 - Val Accuracy: 0.9588



Training:   0%|          | 0/67 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/67 [00:06<07:18,  6.65s/it][A
Training:   3%|▎         | 2/67 [00:07<03:12,  2.97s/it][A
Training:   6%|▌         | 4/67 [00:07<01:14,  1.18s/it][A
Training:   7%|▋         | 5/67 [00:12<02:26,  2.37s/it][A
Training:   9%|▉         | 6/67 [00:12<01:48,  1.78s/it][A
Training:  10%|█         | 7/67 [00:12<01:17,  1.29s/it][A
Training:  12%|█▏        | 8/67 [00:13<00:58,  1.01it/s][A
Training:  13%|█▎        | 9/67 [00:18<02:05,  2.17s/it][A
Training:  15%|█▍        | 10/67 [00:18<01:35,  1.67s/it][A
Training:  16%|█▋        | 11/67 [00:18<01:07,  1.21s/it][A
Training:  18%|█▊        | 12/67 [00:18<00:48,  1.14it/s][A
Training:  19%|█▉        | 13/67 [00:23<01:56,  2.15s/it][A
Training:  21%|██        | 14/67 [00:24<01:23,  1.57s/it][A
Training:  24%|██▍       | 16/67 [00:24<00:47,  1.07it/s][A
Training:  25%|██▌       | 17/67 [00:29<01:33,  1.88s/it][A
Training:  27%|██▋       | 18/67 [00:29<

Epoch: 48/49 - Loss: 71.0470 - Accuracy: 0.9653



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:06<00:51,  6.38s/it][A
 22%|██▏       | 2/9 [00:06<00:19,  2.75s/it][A
 33%|███▎      | 3/9 [00:06<00:09,  1.60s/it][A
 44%|████▍     | 4/9 [00:06<00:05,  1.03s/it][A
 56%|█████▌    | 5/9 [00:13<00:11,  2.94s/it][A
 67%|██████▋   | 6/9 [00:13<00:06,  2.08s/it][A
 78%|███████▊  | 7/9 [00:13<00:02,  1.44s/it][A
 89%|████████▉ | 8/9 [00:14<00:01,  1.06s/it][A
100%|██████████| 9/9 [00:15<00:00,  1.74s/it][A
Epochs:  98%|█████████▊| 48/49 [1:26:11<01:48, 108.05s/it]

Val Loss: 73.3180 - Val Accuracy: 0.9573



Training:   0%|          | 0/67 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/67 [00:07<07:50,  7.13s/it][A
Training:   3%|▎         | 2/67 [00:07<03:18,  3.06s/it][A
Training:   4%|▍         | 3/67 [00:07<01:50,  1.72s/it][A
Training:   6%|▌         | 4/67 [00:07<01:09,  1.11s/it][A
Training:   7%|▋         | 5/67 [00:13<02:45,  2.66s/it][A
Training:   9%|▉         | 6/67 [00:13<01:54,  1.87s/it][A
Training:  10%|█         | 7/67 [00:13<01:18,  1.30s/it][A
Training:  12%|█▏        | 8/67 [00:13<00:55,  1.06it/s][A
Training:  13%|█▎        | 9/67 [00:18<02:05,  2.16s/it][A
Training:  15%|█▍        | 10/67 [00:18<01:26,  1.52s/it][A
Training:  16%|█▋        | 11/67 [00:19<01:07,  1.20s/it][A
Training:  19%|█▉        | 13/67 [00:23<01:35,  1.76s/it][A
Training:  21%|██        | 14/67 [00:24<01:12,  1.37s/it][A
Training:  22%|██▏       | 15/67 [00:24<00:55,  1.06s/it][A
Training:  25%|██▌       | 17/67 [00:28<01:18,  1.57s/it][A
Training:  27%|██▋       | 18/67 [00:29<0

Epoch: 49/49 - Loss: 66.1872 - Accuracy: 0.9632



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:05<00:41,  5.22s/it][A
 22%|██▏       | 2/9 [00:05<00:15,  2.24s/it][A
 33%|███▎      | 3/9 [00:05<00:07,  1.28s/it][A
 56%|█████▌    | 5/9 [00:10<00:07,  1.94s/it][A
 78%|███████▊  | 7/9 [00:10<00:02,  1.11s/it][A
 89%|████████▉ | 8/9 [00:10<00:00,  1.11it/s][A
100%|██████████| 9/9 [00:12<00:00,  1.36s/it][A
Epochs: 100%|██████████| 49/49 [1:27:59<00:00, 107.74s/it]


Val Loss: 79.1341 - Val Accuracy: 0.9578


[32m[I 2023-12-08 16:57:13,935][0m Trial 4 finished with value: 0.9578335285186768 and parameters: {'loss_learning_rate': 0.0042754188900381235, 'learning_rate': 0.004531367393603924, 'weight_decay': 0.00046837344629150696, 'epsilon': 2.3522348716547854e-09, 'beta': 0.4, 'gamma': 0.4, 'batch_size': 209, 'epochs': 49}. Best is trial 0 with value: 0.9648317694664001.[0m



Study statistics: 
  Number of finished trials:  5
  Number of pruned trials:  0
  Number of complete trials:  5


In [27]:
study = optuna.create_study(direction='maximize',
                            study_name='triplet-arcface-12-8-mean-vit-study',
                            storage='sqlite:///study5.db',
                            load_if_exists=True)
study.optimize(objective, n_trials=15)

pruned_trials = study.get_trials(deepcopy=False, states=[TrialState.PRUNED])
complete_trials = study.get_trials(deepcopy=False, states=[TrialState.COMPLETE])

# Display the study statistics
print("\nStudy statistics: ")
print("  Number of finished trials: ", len(study.trials))
print("  Number of pruned trials: ", len(pruned_trials))
print("  Number of complete trials: ", len(complete_trials))

[32m[I 2023-12-08 16:57:14,363][0m Using an existing study with name 'triplet-arcface-12-8-mean-vit-study' instead of creating a new one.[0m


Learning rate for Loss: 0.006357172795546919
Learning rate: 0.0030186512218183703
Weight decay: 0.00014382598191632886
Epsilon: 4.5825840133117526e-08
Beta: 0.1
Gamma: 0.2
Batch size: 195
Number of epochs: 18


Epochs:   0%|          | 0/18 [00:00<?, ?it/s]
Training:   0%|          | 0/72 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/72 [00:06<07:12,  6.09s/it][A
Training:   3%|▎         | 2/72 [00:06<03:04,  2.64s/it][A
Training:   4%|▍         | 3/72 [00:06<01:43,  1.50s/it][A
Training:   7%|▋         | 5/72 [00:11<02:19,  2.09s/it][A
Training:   8%|▊         | 6/72 [00:11<01:41,  1.54s/it][A
Training:  10%|▉         | 7/72 [00:11<01:13,  1.13s/it][A
Training:  11%|█         | 8/72 [00:12<00:54,  1.18it/s][A
Training:  12%|█▎        | 9/72 [00:16<02:03,  1.96s/it][A
Training:  15%|█▌        | 11/72 [00:16<01:08,  1.12s/it][A
Training:  18%|█▊        | 13/72 [00:21<01:37,  1.65s/it][A
Training:  19%|█▉        | 14/72 [00:21<01:16,  1.31s/it][A
Training:  22%|██▏       | 16/72 [00:22<00:46,  1.20it/s][A
Training:  24%|██▎       | 17/72 [00:26<01:28,  1.61s/it][A
Training:  26%|██▋       | 19/72 [00:26<00:54,  1.02s/it][A
Training:  29%|██▉       | 21/72 [00:31<01:13,  1.45s/i

Epoch: 1/18 - Loss: 4.0021 - Accuracy: 0.9062



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:04<00:37,  4.70s/it][A
 22%|██▏       | 2/9 [00:04<00:14,  2.08s/it][A
 33%|███▎      | 3/9 [00:05<00:07,  1.20s/it][A
 44%|████▍     | 4/9 [00:05<00:03,  1.26it/s][A
 56%|█████▌    | 5/9 [00:09<00:08,  2.07s/it][A
 78%|███████▊  | 7/9 [00:09<00:02,  1.06s/it][A
100%|██████████| 9/9 [00:13<00:00,  1.50s/it][A
Epochs:   6%|▌         | 1/18 [01:46<30:15, 106.79s/it]

Val Loss: 3.7703 - Val Accuracy: 0.9507



Training:   0%|          | 0/72 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/72 [00:06<07:11,  6.07s/it][A
Training:   3%|▎         | 2/72 [00:06<02:59,  2.57s/it][A
Training:   6%|▌         | 4/72 [00:06<01:08,  1.01s/it][A
Training:   7%|▋         | 5/72 [00:11<02:31,  2.26s/it][A
Training:   8%|▊         | 6/72 [00:11<01:45,  1.61s/it][A
Training:  11%|█         | 8/72 [00:11<00:57,  1.11it/s][A
Training:  12%|█▎        | 9/72 [00:16<01:57,  1.86s/it][A
Training:  14%|█▍        | 10/72 [00:16<01:26,  1.40s/it][A
Training:  15%|█▌        | 11/72 [00:16<01:03,  1.05s/it][A
Training:  17%|█▋        | 12/72 [00:16<00:48,  1.25it/s][A
Training:  18%|█▊        | 13/72 [00:21<01:47,  1.83s/it][A
Training:  21%|██        | 15/72 [00:21<00:58,  1.03s/it][A
Training:  24%|██▎       | 17/72 [00:25<01:21,  1.47s/it][A
Training:  26%|██▋       | 19/72 [00:25<00:52,  1.01it/s][A
Training:  29%|██▉       | 21/72 [00:30<01:15,  1.49s/it][A
Training:  31%|███       | 22/72 [00:31

Epoch: 2/18 - Loss: 4.2724 - Accuracy: 0.9487



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:05<00:43,  5.44s/it][A
 22%|██▏       | 2/9 [00:05<00:16,  2.31s/it][A
 33%|███▎      | 3/9 [00:05<00:07,  1.31s/it][A
 56%|█████▌    | 5/9 [00:10<00:07,  1.90s/it][A
 67%|██████▋   | 6/9 [00:10<00:04,  1.40s/it][A
 78%|███████▊  | 7/9 [00:10<00:02,  1.04s/it][A
100%|██████████| 9/9 [00:14<00:00,  1.62s/it][A
Epochs:  11%|█         | 2/18 [03:36<28:57, 108.62s/it]

Val Loss: 5.3780 - Val Accuracy: 0.9558



Training:   0%|          | 0/72 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/72 [00:06<07:19,  6.19s/it][A
Training:   4%|▍         | 3/72 [00:06<01:57,  1.70s/it][A
Training:   6%|▌         | 4/72 [00:06<01:19,  1.17s/it][A
Training:   7%|▋         | 5/72 [00:11<02:47,  2.50s/it][A
Training:  10%|▉         | 7/72 [00:12<01:27,  1.34s/it][A
Training:  11%|█         | 8/72 [00:12<01:06,  1.04s/it][A
Training:  12%|█▎        | 9/72 [00:17<02:09,  2.06s/it][A
Training:  15%|█▌        | 11/72 [00:17<01:13,  1.20s/it][A
Training:  17%|█▋        | 12/72 [00:17<00:56,  1.06it/s][A
Training:  18%|█▊        | 13/72 [00:21<01:51,  1.89s/it][A
Training:  21%|██        | 15/72 [00:22<01:03,  1.12s/it][A
Training:  22%|██▏       | 16/72 [00:22<00:49,  1.12it/s][A
Training:  24%|██▎       | 17/72 [00:26<01:38,  1.79s/it][A
Training:  25%|██▌       | 18/72 [00:26<01:12,  1.35s/it][A
Training:  28%|██▊       | 20/72 [00:27<00:42,  1.21it/s][A
Training:  29%|██▉       | 21/72 [00:31

Epoch: 3/18 - Loss: 4.9016 - Accuracy: 0.9542



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:05<00:41,  5.15s/it][A
 22%|██▏       | 2/9 [00:05<00:15,  2.19s/it][A
 33%|███▎      | 3/9 [00:05<00:07,  1.25s/it][A
 44%|████▍     | 4/9 [00:05<00:04,  1.21it/s][A
 56%|█████▌    | 5/9 [00:09<00:08,  2.10s/it][A
 67%|██████▋   | 6/9 [00:10<00:04,  1.43s/it][A
 78%|███████▊  | 7/9 [00:10<00:02,  1.01s/it][A
100%|██████████| 9/9 [00:13<00:00,  1.55s/it][A
Epochs:  17%|█▋        | 3/18 [05:25<27:12, 108.80s/it]

Val Loss: 6.1887 - Val Accuracy: 0.9547



Training:   0%|          | 0/72 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/72 [00:06<07:17,  6.17s/it][A
Training:   3%|▎         | 2/72 [00:06<03:01,  2.60s/it][A
Training:   4%|▍         | 3/72 [00:06<01:41,  1.48s/it][A
Training:   6%|▌         | 4/72 [00:06<01:04,  1.06it/s][A
Training:   7%|▋         | 5/72 [00:11<02:39,  2.39s/it][A
Training:  10%|▉         | 7/72 [00:11<01:19,  1.22s/it][A
Training:  11%|█         | 8/72 [00:11<00:59,  1.08it/s][A
Training:  12%|█▎        | 9/72 [00:16<02:08,  2.04s/it][A
Training:  14%|█▍        | 10/72 [00:16<01:33,  1.50s/it][A
Training:  15%|█▌        | 11/72 [00:17<01:07,  1.11s/it][A
Training:  17%|█▋        | 12/72 [00:17<00:49,  1.21it/s][A
Training:  18%|█▊        | 13/72 [00:21<01:47,  1.82s/it][A
Training:  21%|██        | 15/72 [00:21<00:58,  1.02s/it][A
Training:  24%|██▎       | 17/72 [00:25<01:22,  1.50s/it][A
Training:  25%|██▌       | 18/72 [00:26<01:04,  1.20s/it][A
Training:  26%|██▋       | 19/72 [00:26<

Epoch: 4/18 - Loss: 5.3633 - Accuracy: 0.9555



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:05<00:42,  5.26s/it][A
 22%|██▏       | 2/9 [00:05<00:15,  2.25s/it][A
 33%|███▎      | 3/9 [00:05<00:07,  1.28s/it][A
 44%|████▍     | 4/9 [00:05<00:04,  1.20it/s][A
 56%|█████▌    | 5/9 [00:10<00:08,  2.10s/it][A
 67%|██████▋   | 6/9 [00:10<00:04,  1.42s/it][A
 78%|███████▊  | 7/9 [00:10<00:02,  1.00s/it][A
 89%|████████▉ | 8/9 [00:10<00:00,  1.38it/s][A
100%|██████████| 9/9 [00:14<00:00,  1.57s/it][A
Epochs:  22%|██▏       | 4/18 [07:13<25:17, 108.38s/it]

Val Loss: 5.7009 - Val Accuracy: 0.9599



Training:   0%|          | 0/72 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/72 [00:06<07:26,  6.29s/it][A
Training:   3%|▎         | 2/72 [00:06<03:07,  2.68s/it][A
Training:   6%|▌         | 4/72 [00:06<01:11,  1.05s/it][A
Training:   7%|▋         | 5/72 [00:11<02:30,  2.24s/it][A
Training:   8%|▊         | 6/72 [00:11<01:45,  1.59s/it][A
Training:  10%|▉         | 7/72 [00:11<01:14,  1.15s/it][A
Training:  11%|█         | 8/72 [00:11<00:53,  1.19it/s][A
Training:  12%|█▎        | 9/72 [00:16<02:07,  2.02s/it][A
Training:  15%|█▌        | 11/72 [00:16<01:07,  1.11s/it][A
Training:  18%|█▊        | 13/72 [00:20<01:28,  1.50s/it][A
Training:  21%|██        | 15/72 [00:21<00:55,  1.02it/s][A
Training:  24%|██▎       | 17/72 [00:26<01:23,  1.51s/it][A
Training:  26%|██▋       | 19/72 [00:26<00:55,  1.04s/it][A
Training:  28%|██▊       | 20/72 [00:26<00:44,  1.16it/s][A
Training:  29%|██▉       | 21/72 [00:31<01:28,  1.74s/it][A
Training:  32%|███▏      | 23/72 [00:31<

Epoch: 5/18 - Loss: 5.5485 - Accuracy: 0.9590



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:05<00:40,  5.10s/it][A
 22%|██▏       | 2/9 [00:05<00:15,  2.20s/it][A
 44%|████▍     | 4/9 [00:05<00:04,  1.11it/s][A
 56%|█████▌    | 5/9 [00:09<00:07,  1.98s/it][A
 78%|███████▊  | 7/9 [00:10<00:02,  1.09s/it][A
 89%|████████▉ | 8/9 [00:10<00:00,  1.16it/s][A
100%|██████████| 9/9 [00:13<00:00,  1.54s/it][A
Epochs:  28%|██▊       | 5/18 [09:00<23:22, 107.90s/it]

Val Loss: 5.6083 - Val Accuracy: 0.9575



Training:   0%|          | 0/72 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/72 [00:05<06:47,  5.73s/it][A
Training:   3%|▎         | 2/72 [00:05<02:52,  2.46s/it][A
Training:   4%|▍         | 3/72 [00:06<01:36,  1.40s/it][A
Training:   6%|▌         | 4/72 [00:06<01:00,  1.13it/s][A
Training:   7%|▋         | 5/72 [00:11<02:37,  2.36s/it][A
Training:  10%|▉         | 7/72 [00:11<01:17,  1.19s/it][A
Training:  11%|█         | 8/72 [00:11<00:58,  1.10it/s][A
Training:  12%|█▎        | 9/72 [00:15<01:59,  1.90s/it][A
Training:  15%|█▌        | 11/72 [00:16<01:06,  1.10s/it][A
Training:  17%|█▋        | 12/72 [00:16<00:51,  1.16it/s][A
Training:  18%|█▊        | 13/72 [00:20<01:40,  1.70s/it][A
Training:  19%|█▉        | 14/72 [00:20<01:17,  1.33s/it][A
Training:  22%|██▏       | 16/72 [00:20<00:43,  1.27it/s][A
Training:  24%|██▎       | 17/72 [00:25<01:37,  1.77s/it][A
Training:  26%|██▋       | 19/72 [00:25<00:57,  1.08s/it][A
Training:  29%|██▉       | 21/72 [00:30<

Epoch: 6/18 - Loss: 6.1029 - Accuracy: 0.9571



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:05<00:40,  5.10s/it][A
 22%|██▏       | 2/9 [00:05<00:15,  2.19s/it][A
 33%|███▎      | 3/9 [00:05<00:07,  1.28s/it][A
 56%|█████▌    | 5/9 [00:09<00:07,  1.83s/it][A
 67%|██████▋   | 6/9 [00:10<00:03,  1.33s/it][A
 78%|███████▊  | 7/9 [00:10<00:01,  1.01it/s][A
100%|██████████| 9/9 [00:13<00:00,  1.55s/it][A
Epochs:  33%|███▎      | 6/18 [10:47<21:31, 107.60s/it]

Val Loss: 6.6179 - Val Accuracy: 0.9529



Training:   0%|          | 0/72 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/72 [00:05<06:49,  5.77s/it][A
Training:   4%|▍         | 3/72 [00:06<01:55,  1.68s/it][A
Training:   6%|▌         | 4/72 [00:06<01:18,  1.16s/it][A
Training:   7%|▋         | 5/72 [00:11<02:38,  2.37s/it][A
Training:   8%|▊         | 6/72 [00:11<01:48,  1.65s/it][A
Training:  10%|▉         | 7/72 [00:11<01:19,  1.22s/it][A
Training:  12%|█▎        | 9/72 [00:15<01:41,  1.62s/it][A
Training:  14%|█▍        | 10/72 [00:15<01:17,  1.24s/it][A
Training:  15%|█▌        | 11/72 [00:16<01:03,  1.04s/it][A
Training:  18%|█▊        | 13/72 [00:20<01:27,  1.49s/it][A
Training:  21%|██        | 15/72 [00:21<01:01,  1.08s/it][A
Training:  24%|██▎       | 17/72 [00:25<01:19,  1.45s/it][A
Training:  25%|██▌       | 18/72 [00:25<01:03,  1.18s/it][A
Training:  26%|██▋       | 19/72 [00:26<01:00,  1.13s/it][A
Training:  29%|██▉       | 21/72 [00:30<01:14,  1.47s/it][A
Training:  31%|███       | 22/72 [00:30

Epoch: 7/18 - Loss: 6.6822 - Accuracy: 0.9600



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:05<00:42,  5.31s/it][A
 22%|██▏       | 2/9 [00:05<00:15,  2.25s/it][A
 33%|███▎      | 3/9 [00:05<00:07,  1.31s/it][A
 56%|█████▌    | 5/9 [00:10<00:07,  1.83s/it][A
 78%|███████▊  | 7/9 [00:10<00:02,  1.07s/it][A
 89%|████████▉ | 8/9 [00:10<00:00,  1.16it/s][A
100%|██████████| 9/9 [00:13<00:00,  1.54s/it][A
Epochs:  39%|███▉      | 7/18 [12:35<19:44, 107.68s/it]

Val Loss: 9.0213 - Val Accuracy: 0.9581



Training:   0%|          | 0/72 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/72 [00:05<06:47,  5.75s/it][A
Training:   3%|▎         | 2/72 [00:06<02:57,  2.53s/it][A
Training:   4%|▍         | 3/72 [00:06<01:39,  1.45s/it][A
Training:   6%|▌         | 4/72 [00:06<01:04,  1.05it/s][A
Training:   7%|▋         | 5/72 [00:11<02:34,  2.30s/it][A
Training:   8%|▊         | 6/72 [00:11<01:45,  1.60s/it][A
Training:  10%|▉         | 7/72 [00:11<01:12,  1.12s/it][A
Training:  11%|█         | 8/72 [00:11<00:51,  1.24it/s][A
Training:  12%|█▎        | 9/72 [00:15<01:57,  1.86s/it][A
Training:  15%|█▌        | 11/72 [00:15<01:02,  1.02s/it][A
Training:  18%|█▊        | 13/72 [00:20<01:30,  1.53s/it][A
Training:  21%|██        | 15/72 [00:20<00:56,  1.01it/s][A
Training:  22%|██▏       | 16/72 [00:20<00:45,  1.23it/s][A
Training:  24%|██▎       | 17/72 [00:25<01:38,  1.79s/it][A
Training:  26%|██▋       | 19/72 [00:25<00:58,  1.11s/it][A
Training:  29%|██▉       | 21/72 [00:30<0

Epoch: 8/18 - Loss: 6.8199 - Accuracy: 0.9599



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:05<00:44,  5.50s/it][A
 33%|███▎      | 3/9 [00:05<00:09,  1.54s/it][A
 44%|████▍     | 4/9 [00:05<00:05,  1.05s/it][A
 56%|█████▌    | 5/9 [00:10<00:08,  2.12s/it][A
 67%|██████▋   | 6/9 [00:10<00:04,  1.48s/it][A
 89%|████████▉ | 8/9 [00:10<00:00,  1.25it/s][A
100%|██████████| 9/9 [00:14<00:00,  1.58s/it][A
Epochs:  44%|████▍     | 8/18 [14:21<17:53, 107.34s/it]

Val Loss: 7.2801 - Val Accuracy: 0.9576



Training:   0%|          | 0/72 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/72 [00:05<06:55,  5.85s/it][A
Training:   4%|▍         | 3/72 [00:06<01:51,  1.62s/it][A
Training:   7%|▋         | 5/72 [00:11<02:19,  2.08s/it][A
Training:   8%|▊         | 6/72 [00:11<01:43,  1.57s/it][A
Training:  10%|▉         | 7/72 [00:11<01:22,  1.26s/it][A
Training:  12%|█▎        | 9/72 [00:15<01:37,  1.55s/it][A
Training:  14%|█▍        | 10/72 [00:15<01:14,  1.20s/it][A
Training:  15%|█▌        | 11/72 [00:16<01:02,  1.03s/it][A
Training:  17%|█▋        | 12/72 [00:16<00:48,  1.25it/s][A
Training:  18%|█▊        | 13/72 [00:20<01:44,  1.78s/it][A
Training:  19%|█▉        | 14/72 [00:20<01:16,  1.31s/it][A
Training:  21%|██        | 15/72 [00:21<01:00,  1.07s/it][A
Training:  24%|██▎       | 17/72 [00:26<01:32,  1.68s/it][A
Training:  25%|██▌       | 18/72 [00:26<01:10,  1.31s/it][A
Training:  26%|██▋       | 19/72 [00:26<00:55,  1.04s/it][A
Training:  29%|██▉       | 21/72 [00:3

Epoch: 9/18 - Loss: 6.5397 - Accuracy: 0.9586



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:05<00:43,  5.39s/it][A
 22%|██▏       | 2/9 [00:05<00:16,  2.30s/it][A
 33%|███▎      | 3/9 [00:05<00:07,  1.30s/it][A
 56%|█████▌    | 5/9 [00:10<00:07,  1.82s/it][A
 78%|███████▊  | 7/9 [00:10<00:02,  1.04s/it][A
 89%|████████▉ | 8/9 [00:10<00:00,  1.23it/s][A
100%|██████████| 9/9 [00:14<00:00,  1.56s/it][A
Epochs:  50%|█████     | 9/18 [16:09<16:07, 107.54s/it]

Val Loss: 8.6312 - Val Accuracy: 0.9427



Training:   0%|          | 0/72 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/72 [00:05<06:46,  5.72s/it][A
Training:   3%|▎         | 2/72 [00:06<02:57,  2.53s/it][A
Training:   6%|▌         | 4/72 [00:06<01:08,  1.01s/it][A
Training:   7%|▋         | 5/72 [00:11<02:26,  2.19s/it][A
Training:   8%|▊         | 6/72 [00:11<01:43,  1.56s/it][A
Training:  11%|█         | 8/72 [00:11<00:55,  1.16it/s][A
Training:  12%|█▎        | 9/72 [00:15<01:51,  1.78s/it][A
Training:  14%|█▍        | 10/72 [00:15<01:23,  1.35s/it][A
Training:  15%|█▌        | 11/72 [00:16<01:02,  1.02s/it][A
Training:  18%|█▊        | 13/72 [00:21<01:39,  1.68s/it][A
Training:  22%|██▏       | 16/72 [00:21<00:49,  1.12it/s][A
Training:  24%|██▎       | 17/72 [00:25<01:27,  1.59s/it][A
Training:  26%|██▋       | 19/72 [00:26<00:56,  1.06s/it][A
Training:  28%|██▊       | 20/72 [00:26<00:45,  1.15it/s][A
Training:  29%|██▉       | 21/72 [00:31<01:31,  1.80s/it][A
Training:  32%|███▏      | 23/72 [00:31

Epoch: 10/18 - Loss: 6.9586 - Accuracy: 0.9602



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:05<00:43,  5.49s/it][A
 22%|██▏       | 2/9 [00:05<00:16,  2.41s/it][A
 33%|███▎      | 3/9 [00:05<00:08,  1.40s/it][A
 44%|████▍     | 4/9 [00:06<00:04,  1.13it/s][A
 56%|█████▌    | 5/9 [00:10<00:08,  2.09s/it][A
 78%|███████▊  | 7/9 [00:10<00:02,  1.06s/it][A
 89%|████████▉ | 8/9 [00:10<00:00,  1.24it/s][A
100%|██████████| 9/9 [00:13<00:00,  1.55s/it][A
Epochs:  56%|█████▌    | 10/18 [17:57<14:21, 107.68s/it]

Val Loss: 8.0305 - Val Accuracy: 0.9604



Training:   0%|          | 0/72 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/72 [00:06<07:11,  6.08s/it][A
Training:   3%|▎         | 2/72 [00:06<03:13,  2.77s/it][A
Training:   6%|▌         | 4/72 [00:06<01:13,  1.08s/it][A
Training:   7%|▋         | 5/72 [00:10<02:16,  2.04s/it][A
Training:   8%|▊         | 6/72 [00:11<01:41,  1.53s/it][A
Training:  10%|▉         | 7/72 [00:11<01:12,  1.11s/it][A
Training:  12%|█▎        | 9/72 [00:15<01:36,  1.54s/it][A
Training:  14%|█▍        | 10/72 [00:16<01:22,  1.33s/it][A
Training:  15%|█▌        | 11/72 [00:16<01:05,  1.08s/it][A
Training:  17%|█▋        | 12/72 [00:16<00:49,  1.22it/s][A
Training:  18%|█▊        | 13/72 [00:20<01:42,  1.73s/it][A
Training:  19%|█▉        | 14/72 [00:21<01:26,  1.48s/it][A
Training:  21%|██        | 15/72 [00:21<01:03,  1.11s/it][A
Training:  24%|██▎       | 17/72 [00:26<01:26,  1.58s/it][A
Training:  25%|██▌       | 18/72 [00:26<01:11,  1.33s/it][A
Training:  26%|██▋       | 19/72 [00:26

Epoch: 11/18 - Loss: 7.2357 - Accuracy: 0.9608



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:04<00:39,  4.89s/it][A
 22%|██▏       | 2/9 [00:05<00:15,  2.17s/it][A
 33%|███▎      | 3/9 [00:05<00:07,  1.30s/it][A
 44%|████▍     | 4/9 [00:05<00:04,  1.10it/s][A
 56%|█████▌    | 5/9 [00:09<00:07,  1.88s/it][A
 67%|██████▋   | 6/9 [00:09<00:04,  1.37s/it][A
 78%|███████▊  | 7/9 [00:10<00:02,  1.03s/it][A
100%|██████████| 9/9 [00:13<00:00,  1.47s/it][A
Epochs:  61%|██████    | 11/18 [19:43<12:30, 107.16s/it]

Val Loss: 8.8606 - Val Accuracy: 0.9558



Training:   0%|          | 0/72 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/72 [00:05<06:41,  5.66s/it][A
Training:   3%|▎         | 2/72 [00:06<02:57,  2.53s/it][A
Training:   6%|▌         | 4/72 [00:06<01:08,  1.00s/it][A
Training:   7%|▋         | 5/72 [00:10<02:10,  1.94s/it][A
Training:  10%|▉         | 7/72 [00:10<01:10,  1.09s/it][A
Training:  12%|█▎        | 9/72 [00:15<01:38,  1.57s/it][A
Training:  14%|█▍        | 10/72 [00:15<01:21,  1.31s/it][A
Training:  17%|█▋        | 12/72 [00:15<00:51,  1.17it/s][A
Training:  18%|█▊        | 13/72 [00:20<01:34,  1.60s/it][A
Training:  19%|█▉        | 14/72 [00:20<01:20,  1.38s/it][A
Training:  22%|██▏       | 16/72 [00:20<00:48,  1.16it/s][A
Training:  24%|██▎       | 17/72 [00:24<01:24,  1.54s/it][A
Training:  25%|██▌       | 18/72 [00:25<01:13,  1.35s/it][A
Training:  26%|██▋       | 19/72 [00:25<00:55,  1.04s/it][A
Training:  28%|██▊       | 20/72 [00:25<00:41,  1.25it/s][A
Training:  29%|██▉       | 21/72 [00:2

Epoch: 12/18 - Loss: 7.1589 - Accuracy: 0.9611



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:05<00:39,  5.00s/it][A
 22%|██▏       | 2/9 [00:05<00:15,  2.15s/it][A
 44%|████▍     | 4/9 [00:05<00:04,  1.17it/s][A
 56%|█████▌    | 5/9 [00:09<00:07,  1.92s/it][A
 78%|███████▊  | 7/9 [00:09<00:02,  1.08s/it][A
100%|██████████| 9/9 [00:13<00:00,  1.52s/it][A
Epochs:  67%|██████▋   | 12/18 [21:26<10:35, 105.91s/it]

Val Loss: 8.5924 - Val Accuracy: 0.9565



Training:   0%|          | 0/72 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/72 [00:05<06:52,  5.80s/it][A
Training:   3%|▎         | 2/72 [00:05<02:53,  2.48s/it][A
Training:   4%|▍         | 3/72 [00:06<01:37,  1.42s/it][A
Training:   6%|▌         | 4/72 [00:06<01:01,  1.11it/s][A
Training:   7%|▋         | 5/72 [00:10<02:24,  2.15s/it][A
Training:   8%|▊         | 6/72 [00:10<01:39,  1.51s/it][A
Training:  10%|▉         | 7/72 [00:11<01:09,  1.07s/it][A
Training:  11%|█         | 8/72 [00:11<00:48,  1.31it/s][A
Training:  12%|█▎        | 9/72 [00:15<01:56,  1.85s/it][A
Training:  15%|█▌        | 11/72 [00:15<01:01,  1.00s/it][A
Training:  17%|█▋        | 12/72 [00:15<00:49,  1.22it/s][A
Training:  18%|█▊        | 13/72 [00:20<01:50,  1.88s/it][A
Training:  19%|█▉        | 14/72 [00:20<01:20,  1.40s/it][A
Training:  22%|██▏       | 16/72 [00:20<00:46,  1.20it/s][A
Training:  24%|██▎       | 17/72 [00:25<01:30,  1.64s/it][A
Training:  25%|██▌       | 18/72 [00:25<0

Epoch: 13/18 - Loss: 7.5982 - Accuracy: 0.9619



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:04<00:39,  4.92s/it][A
 22%|██▏       | 2/9 [00:05<00:14,  2.10s/it][A
 33%|███▎      | 3/9 [00:05<00:07,  1.20s/it][A
 44%|████▍     | 4/9 [00:05<00:03,  1.29it/s][A
 56%|█████▌    | 5/9 [00:09<00:08,  2.04s/it][A
 67%|██████▋   | 6/9 [00:09<00:04,  1.39s/it][A
 89%|████████▉ | 8/9 [00:09<00:00,  1.35it/s][A
100%|██████████| 9/9 [00:13<00:00,  1.47s/it][A
Epochs:  72%|███████▏  | 13/18 [23:08<08:43, 104.64s/it]

Val Loss: 8.2537 - Val Accuracy: 0.9587



Training:   0%|          | 0/72 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/72 [00:05<06:35,  5.57s/it][A
Training:   3%|▎         | 2/72 [00:05<02:53,  2.47s/it][A
Training:   6%|▌         | 4/72 [00:06<01:05,  1.04it/s][A
Training:   7%|▋         | 5/72 [00:09<02:07,  1.90s/it][A
Training:   8%|▊         | 6/72 [00:10<01:33,  1.41s/it][A
Training:  11%|█         | 8/72 [00:10<00:50,  1.27it/s][A
Training:  12%|█▎        | 9/72 [00:14<01:47,  1.71s/it][A
Training:  14%|█▍        | 10/72 [00:15<01:23,  1.34s/it][A
Training:  17%|█▋        | 12/72 [00:15<00:47,  1.25it/s][A
Training:  18%|█▊        | 13/72 [00:19<01:34,  1.60s/it][A
Training:  19%|█▉        | 14/72 [00:20<01:17,  1.34s/it][A
Training:  21%|██        | 15/72 [00:20<00:58,  1.03s/it][A
Training:  22%|██▏       | 16/72 [00:20<00:43,  1.27it/s][A
Training:  24%|██▎       | 17/72 [00:24<01:33,  1.70s/it][A
Training:  25%|██▌       | 18/72 [00:24<01:12,  1.35s/it][A
Training:  28%|██▊       | 20/72 [00:25

Epoch: 14/18 - Loss: 7.4947 - Accuracy: 0.9666



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:05<00:40,  5.04s/it][A
 22%|██▏       | 2/9 [00:05<00:15,  2.20s/it][A
 44%|████▍     | 4/9 [00:05<00:04,  1.15it/s][A
 56%|█████▌    | 5/9 [00:09<00:07,  1.88s/it][A
 67%|██████▋   | 6/9 [00:09<00:04,  1.44s/it][A
100%|██████████| 9/9 [00:13<00:00,  1.50s/it][A
Epochs:  78%|███████▊  | 14/18 [24:50<06:55, 103.91s/it]

Val Loss: 7.9037 - Val Accuracy: 0.9661



Training:   0%|          | 0/72 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/72 [00:05<06:46,  5.72s/it][A
Training:   3%|▎         | 2/72 [00:05<02:51,  2.45s/it][A
Training:   4%|▍         | 3/72 [00:06<01:37,  1.41s/it][A
Training:   6%|▌         | 4/72 [00:06<01:02,  1.09it/s][A
Training:   7%|▋         | 5/72 [00:10<02:11,  1.96s/it][A
Training:   8%|▊         | 6/72 [00:10<01:28,  1.34s/it][A
Training:  10%|▉         | 7/72 [00:10<01:01,  1.06it/s][A
Training:  12%|█▎        | 9/72 [00:14<01:37,  1.54s/it][A
Training:  14%|█▍        | 10/72 [00:14<01:12,  1.17s/it][A
Training:  15%|█▌        | 11/72 [00:15<00:57,  1.07it/s][A
Training:  18%|█▊        | 13/72 [00:19<01:29,  1.52s/it][A
Training:  19%|█▉        | 14/72 [00:19<01:08,  1.19s/it][A
Training:  21%|██        | 15/72 [00:20<00:57,  1.01s/it][A
Training:  24%|██▎       | 17/72 [00:24<01:18,  1.43s/it][A
Training:  25%|██▌       | 18/72 [00:24<01:02,  1.16s/it][A
Training:  26%|██▋       | 19/72 [00:24<

Epoch: 15/18 - Loss: 7.2562 - Accuracy: 0.9635



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:05<00:42,  5.25s/it][A
 22%|██▏       | 2/9 [00:05<00:15,  2.24s/it][A
 33%|███▎      | 3/9 [00:05<00:07,  1.27s/it][A
 56%|█████▌    | 5/9 [00:10<00:07,  1.83s/it][A
 67%|██████▋   | 6/9 [00:10<00:04,  1.34s/it][A
 78%|███████▊  | 7/9 [00:10<00:02,  1.02s/it][A
 89%|████████▉ | 8/9 [00:10<00:00,  1.29it/s][A
100%|██████████| 9/9 [00:14<00:00,  1.56s/it][A
Epochs:  83%|████████▎ | 15/18 [26:34<05:11, 103.76s/it]

Val Loss: 9.2205 - Val Accuracy: 0.9552



Training:   0%|          | 0/72 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/72 [00:05<06:54,  5.84s/it][A
Training:   3%|▎         | 2/72 [00:06<02:58,  2.56s/it][A
Training:   4%|▍         | 3/72 [00:06<01:39,  1.44s/it][A
Training:   7%|▋         | 5/72 [00:10<02:02,  1.83s/it][A
Training:  10%|▉         | 7/72 [00:10<01:07,  1.05s/it][A
Training:  12%|█▎        | 9/72 [00:15<01:45,  1.67s/it][A
Training:  15%|█▌        | 11/72 [00:16<01:06,  1.09s/it][A
Training:  18%|█▊        | 13/72 [00:20<01:32,  1.56s/it][A
Training:  19%|█▉        | 14/72 [00:21<01:14,  1.28s/it][A
Training:  22%|██▏       | 16/72 [00:21<00:47,  1.18it/s][A
Training:  24%|██▎       | 17/72 [00:26<01:33,  1.71s/it][A
Training:  26%|██▋       | 19/72 [00:26<00:58,  1.11s/it][A
Training:  29%|██▉       | 21/72 [00:31<01:17,  1.52s/it][A
Training:  31%|███       | 22/72 [00:31<01:02,  1.25s/it][A
Training:  32%|███▏      | 23/72 [00:31<00:48,  1.00it/s][A
Training:  33%|███▎      | 24/72 [00:3

Epoch: 16/18 - Loss: 7.0276 - Accuracy: 0.9614



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:05<00:44,  5.61s/it][A
 33%|███▎      | 3/9 [00:05<00:09,  1.51s/it][A
 44%|████▍     | 4/9 [00:05<00:05,  1.04s/it][A
 56%|█████▌    | 5/9 [00:10<00:08,  2.18s/it][A
 67%|██████▋   | 6/9 [00:10<00:04,  1.54s/it][A
 78%|███████▊  | 7/9 [00:10<00:02,  1.12s/it][A
100%|██████████| 9/9 [00:14<00:00,  1.63s/it][A
Epochs:  89%|████████▉ | 16/18 [28:24<03:31, 105.57s/it]

Val Loss: 9.6724 - Val Accuracy: 0.9575



Training:   0%|          | 0/72 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/72 [00:05<06:51,  5.79s/it][A
Training:   4%|▍         | 3/72 [00:06<01:54,  1.66s/it][A
Training:   7%|▋         | 5/72 [00:10<02:07,  1.91s/it][A
Training:   8%|▊         | 6/72 [00:10<01:34,  1.44s/it][A
Training:  10%|▉         | 7/72 [00:11<01:16,  1.18s/it][A
Training:  12%|█▎        | 9/72 [00:15<01:41,  1.61s/it][A
Training:  14%|█▍        | 10/72 [00:16<01:23,  1.35s/it][A
Training:  15%|█▌        | 11/72 [00:16<01:10,  1.16s/it][A
Training:  17%|█▋        | 12/72 [00:16<00:55,  1.09it/s][A
Training:  18%|█▊        | 13/72 [00:20<01:42,  1.74s/it][A
Training:  19%|█▉        | 14/72 [00:21<01:17,  1.34s/it][A
Training:  21%|██        | 15/72 [00:21<01:06,  1.17s/it][A
Training:  24%|██▎       | 17/72 [00:25<01:24,  1.53s/it][A
Training:  25%|██▌       | 18/72 [00:26<01:13,  1.35s/it][A
Training:  26%|██▋       | 19/72 [00:26<00:57,  1.08s/it][A
Training:  28%|██▊       | 20/72 [00:2

Epoch: 17/18 - Loss: 7.4348 - Accuracy: 0.9648



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:05<00:44,  5.52s/it][A
 22%|██▏       | 2/9 [00:05<00:17,  2.44s/it][A
 33%|███▎      | 3/9 [00:05<00:08,  1.39s/it][A
 56%|█████▌    | 5/9 [00:10<00:07,  1.85s/it][A
 67%|██████▋   | 6/9 [00:10<00:04,  1.48s/it][A
 89%|████████▉ | 8/9 [00:11<00:00,  1.18it/s][A
100%|██████████| 9/9 [00:14<00:00,  1.64s/it][A
Epochs:  94%|█████████▍| 17/18 [30:15<01:47, 107.30s/it]

Val Loss: 9.8277 - Val Accuracy: 0.9593



Training:   0%|          | 0/72 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/72 [00:05<06:42,  5.67s/it][A
Training:   3%|▎         | 2/72 [00:05<02:51,  2.45s/it][A
Training:   4%|▍         | 3/72 [00:06<01:36,  1.40s/it][A
Training:   6%|▌         | 4/72 [00:06<01:01,  1.10it/s][A
Training:   7%|▋         | 5/72 [00:10<02:34,  2.30s/it][A
Training:  10%|▉         | 7/72 [00:11<01:17,  1.19s/it][A
Training:  11%|█         | 8/72 [00:11<00:58,  1.09it/s][A
Training:  12%|█▎        | 9/72 [00:16<02:06,  2.00s/it][A
Training:  14%|█▍        | 10/72 [00:16<01:37,  1.57s/it][A
Training:  15%|█▌        | 11/72 [00:16<01:11,  1.17s/it][A
Training:  18%|█▊        | 13/72 [00:21<01:38,  1.66s/it][A
Training:  19%|█▉        | 14/72 [00:21<01:20,  1.40s/it][A
Training:  21%|██        | 15/72 [00:22<01:01,  1.08s/it][A
Training:  22%|██▏       | 16/72 [00:22<00:46,  1.21it/s][A
Training:  24%|██▎       | 17/72 [00:26<01:37,  1.77s/it][A
Training:  25%|██▌       | 18/72 [00:27<

Epoch: 18/18 - Loss: 7.3214 - Accuracy: 0.9626



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:05<00:46,  5.82s/it][A
 22%|██▏       | 2/9 [00:05<00:17,  2.47s/it][A
 33%|███▎      | 3/9 [00:06<00:08,  1.39s/it][A
 56%|█████▌    | 5/9 [00:10<00:07,  1.98s/it][A
 78%|███████▊  | 7/9 [00:11<00:02,  1.13s/it][A
100%|██████████| 9/9 [00:15<00:00,  1.67s/it][A
Epochs: 100%|██████████| 18/18 [32:06<00:00, 107.02s/it]


Val Loss: 9.9139 - Val Accuracy: 0.9519


[32m[I 2023-12-08 17:29:21,786][0m Trial 5 finished with value: 0.9518904089927673 and parameters: {'loss_learning_rate': 0.006357172795546919, 'learning_rate': 0.0030186512218183703, 'weight_decay': 0.00014382598191632886, 'epsilon': 4.5825840133117526e-08, 'beta': 0.1, 'gamma': 0.2, 'batch_size': 195, 'epochs': 18}. Best is trial 0 with value: 0.9648317694664001.[0m


Learning rate for Loss: 0.004792079263999562
Learning rate: 0.052626173193851586
Weight decay: 0.002616766302224421
Epsilon: 2.150952378136892e-08
Beta: 0.30000000000000004
Gamma: 0.7000000000000001
Batch size: 234
Number of epochs: 43


Epochs:   0%|          | 0/43 [00:00<?, ?it/s]
Training:   0%|          | 0/60 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/60 [00:06<06:12,  6.31s/it][A
Training:   3%|▎         | 2/60 [00:06<02:36,  2.70s/it][A
Training:   5%|▌         | 3/60 [00:06<01:29,  1.57s/it][A
Training:   8%|▊         | 5/60 [00:12<02:10,  2.36s/it][A
Training:  10%|█         | 6/60 [00:12<01:32,  1.72s/it][A
Training:  12%|█▏        | 7/60 [00:12<01:07,  1.28s/it][A
Training:  13%|█▎        | 8/60 [00:13<00:49,  1.05it/s][A
Training:  15%|█▌        | 9/60 [00:18<01:51,  2.20s/it][A
Training:  18%|█▊        | 11/60 [00:18<01:01,  1.25s/it][A
Training:  22%|██▏       | 13/60 [00:24<01:29,  1.90s/it][A
Training:  23%|██▎       | 14/60 [00:24<01:09,  1.51s/it][A
Training:  27%|██▋       | 16/60 [00:24<00:41,  1.05it/s][A
Training:  28%|██▊       | 17/60 [00:30<01:26,  2.00s/it][A
Training:  30%|███       | 18/60 [00:30<01:05,  1.57s/it][A
Training:  32%|███▏      | 19/60 [00:30<00:49,  1.20s/i

Epoch: 1/43 - Loss: 1552.2384 - Accuracy: 0.8782



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:06<00:44,  6.36s/it][A
 25%|██▌       | 2/8 [00:06<00:16,  2.69s/it][A
 38%|███▊      | 3/8 [00:06<00:07,  1.53s/it][A
 50%|█████     | 4/8 [00:06<00:03,  1.03it/s][A
 62%|██████▎   | 5/8 [00:11<00:06,  2.33s/it][A
100%|██████████| 8/8 [00:11<00:00,  1.47s/it][A
Epochs:   0%|          | 0/43 [01:45<?, ?it/s]


Val Loss: 2045.6267 - Val Accuracy: 0.9199


[32m[I 2023-12-08 17:31:08,172][0m Trial 6 pruned. [0m


Learning rate for Loss: 0.0008199807649343463
Learning rate: 1.1594582448067271e-05
Weight decay: 0.00875827181161662
Epsilon: 2.1574968844225627e-09
Beta: 0.30000000000000004
Gamma: 0.30000000000000004
Batch size: 155
Number of epochs: 86


Epochs:   0%|          | 0/86 [00:00<?, ?it/s]
Training:   0%|          | 0/91 [00:00<?, ?it/s][A
Training:   1%|          | 1/91 [00:04<06:43,  4.49s/it][A
Training:   3%|▎         | 3/91 [00:04<01:47,  1.22s/it][A
Training:   4%|▍         | 4/91 [00:04<01:13,  1.19it/s][A
Training:   5%|▌         | 5/91 [00:08<02:30,  1.75s/it][A
Training:   8%|▊         | 7/91 [00:08<01:18,  1.07it/s][A
Training:  10%|▉         | 9/91 [00:12<01:45,  1.29s/it][A
Training:  11%|█         | 10/91 [00:12<01:23,  1.03s/it][A
Training:  12%|█▏        | 11/91 [00:12<01:05,  1.23it/s][A
Training:  14%|█▍        | 13/91 [00:15<01:33,  1.20s/it][A
Training:  15%|█▌        | 14/91 [00:16<01:17,  1.00s/it][A
Training:  16%|█▋        | 15/91 [00:16<00:59,  1.27it/s][A
Training:  18%|█▊        | 16/91 [00:16<00:45,  1.64it/s][A
Training:  19%|█▊        | 17/91 [00:19<01:37,  1.32s/it][A
Training:  20%|█▉        | 18/91 [00:20<01:16,  1.05s/it][A
Training:  22%|██▏       | 20/91 [00:20<00:43,  1.63i

Epoch: 1/86 - Loss: 13.9893 - Accuracy: 0.5153



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:04<00:46,  4.27s/it][A
 25%|██▌       | 3/12 [00:04<00:10,  1.19s/it][A
 33%|███▎      | 4/12 [00:04<00:06,  1.23it/s][A
 42%|████▏     | 5/12 [00:07<00:11,  1.64s/it][A
 50%|█████     | 6/12 [00:08<00:07,  1.17s/it][A
 67%|██████▋   | 8/12 [00:08<00:02,  1.58it/s][A
 75%|███████▌  | 9/12 [00:11<00:03,  1.32s/it][A
100%|██████████| 12/12 [00:11<00:00,  1.02it/s][A
Epochs:   0%|          | 0/86 [01:41<?, ?it/s]
[32m[I 2023-12-08 17:32:50,133][0m Trial 7 pruned. [0m


Val Loss: 13.0763 - Val Accuracy: 0.5603
Learning rate for Loss: 0.0003173435090099667
Learning rate: 0.005742256225983083
Weight decay: 0.002526663240403206
Epsilon: 9.894853741566392e-09
Beta: 0.6
Gamma: 0.30000000000000004
Batch size: 236
Number of epochs: 86


Epochs:   0%|          | 0/86 [00:00<?, ?it/s]
Training:   0%|          | 0/60 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/60 [00:06<05:58,  6.07s/it][A
Training:   3%|▎         | 2/60 [00:06<02:34,  2.67s/it][A
Training:   7%|▋         | 4/60 [00:06<00:58,  1.04s/it][A
Training:   8%|▊         | 5/60 [00:11<02:12,  2.41s/it][A
Training:  12%|█▏        | 7/60 [00:12<01:10,  1.34s/it][A
Training:  13%|█▎        | 8/60 [00:12<00:56,  1.08s/it][A
Training:  15%|█▌        | 9/60 [00:17<01:51,  2.18s/it][A
Training:  18%|█▊        | 11/60 [00:17<01:02,  1.28s/it][A
Training:  20%|██        | 12/60 [00:18<00:52,  1.09s/it][A
Training:  22%|██▏       | 13/60 [00:23<01:38,  2.10s/it][A
Training:  23%|██▎       | 14/60 [00:23<01:13,  1.60s/it][A
Training:  25%|██▌       | 15/60 [00:23<00:53,  1.19s/it][A
Training:  27%|██▋       | 16/60 [00:24<00:47,  1.07s/it][A
Training:  28%|██▊       | 17/60 [00:29<01:32,  2.15s/it][A
Training:  30%|███       | 18/60 [00:29<01:10,  1.67s/

Epoch: 1/86 - Loss: 42.5583 - Accuracy: 0.8726



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:06<00:43,  6.20s/it][A
 25%|██▌       | 2/8 [00:06<00:16,  2.71s/it][A
 50%|█████     | 4/8 [00:06<00:04,  1.05s/it][A
 62%|██████▎   | 5/8 [00:11<00:06,  2.24s/it][A
100%|██████████| 8/8 [00:12<00:00,  1.50s/it][A
Epochs:   0%|          | 0/86 [01:40<?, ?it/s]
[32m[I 2023-12-08 17:34:31,272][0m Trial 8 pruned. [0m


Val Loss: 66.9433 - Val Accuracy: 0.9214
Learning rate for Loss: 0.0001778030429749886
Learning rate: 0.001724236805793263
Weight decay: 0.00028529889321951747
Epsilon: 1.4780077810240457e-09
Beta: 0.8
Gamma: 0.5
Batch size: 293
Number of epochs: 11


Epochs:   0%|          | 0/11 [00:00<?, ?it/s]
Training:   0%|          | 0/48 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/48 [00:07<06:01,  7.70s/it][A
Training:   4%|▍         | 2/48 [00:07<02:31,  3.30s/it][A
Training:   6%|▋         | 3/48 [00:08<01:22,  1.84s/it][A
Training:   8%|▊         | 4/48 [00:08<00:50,  1.16s/it][A
Training:  10%|█         | 5/48 [00:15<02:23,  3.33s/it][A
Training:  12%|█▎        | 6/48 [00:15<01:34,  2.25s/it][A
Training:  15%|█▍        | 7/48 [00:15<01:03,  1.55s/it][A
Training:  19%|█▉        | 9/48 [00:22<01:38,  2.52s/it][A
Training:  21%|██        | 10/48 [00:22<01:13,  1.93s/it][A
Training:  23%|██▎       | 11/48 [00:23<00:53,  1.46s/it][A
Training:  27%|██▋       | 13/48 [00:30<01:21,  2.33s/it][A
Training:  29%|██▉       | 14/48 [00:30<01:01,  1.82s/it][A
Training:  31%|███▏      | 15/48 [00:30<00:46,  1.40s/it][A
Training:  35%|███▌      | 17/48 [00:37<01:09,  2.24s/it][A
Training:  38%|███▊      | 18/48 [00:37<00:53,  1.78s/i

Epoch: 1/11 - Loss: 13.7309 - Accuracy: 0.8971



  0%|          | 0/6 [00:00<?, ?it/s][A
 17%|█▋        | 1/6 [00:07<00:37,  7.57s/it][A
 33%|███▎      | 2/6 [00:07<00:12,  3.18s/it][A
 67%|██████▋   | 4/6 [00:07<00:02,  1.26s/it][A
100%|██████████| 6/6 [00:13<00:00,  2.30s/it][A
Epochs:   9%|▉         | 1/11 [01:41<16:53, 101.37s/it]

Val Loss: 9.5863 - Val Accuracy: 0.9548



Training:   0%|          | 0/48 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/48 [00:07<05:30,  7.03s/it][A
Training:   4%|▍         | 2/48 [00:07<02:18,  3.01s/it][A
Training:   6%|▋         | 3/48 [00:07<01:16,  1.70s/it][A
Training:   8%|▊         | 4/48 [00:07<00:54,  1.25s/it][A
Training:  10%|█         | 5/48 [00:14<02:17,  3.20s/it][A
Training:  12%|█▎        | 6/48 [00:14<01:30,  2.15s/it][A
Training:  15%|█▍        | 7/48 [00:14<01:00,  1.48s/it][A
Training:  17%|█▋        | 8/48 [00:15<00:44,  1.12s/it][A
Training:  19%|█▉        | 9/48 [00:22<01:54,  2.93s/it][A
Training:  21%|██        | 10/48 [00:22<01:18,  2.07s/it][A
Training:  23%|██▎       | 11/48 [00:22<00:54,  1.47s/it][A
Training:  25%|██▌       | 12/48 [00:22<00:39,  1.09s/it][A
Training:  27%|██▋       | 13/48 [00:29<01:37,  2.79s/it][A
Training:  29%|██▉       | 14/48 [00:29<01:08,  2.02s/it][A
Training:  31%|███▏      | 15/48 [00:29<00:47,  1.44s/it][A
Training:  33%|███▎      | 16/48 [00:30<0

Epoch: 2/11 - Loss: 9.9179 - Accuracy: 0.9558



  0%|          | 0/6 [00:00<?, ?it/s][A
 17%|█▋        | 1/6 [00:07<00:36,  7.36s/it][A
 50%|█████     | 3/6 [00:07<00:06,  2.09s/it][A
100%|██████████| 6/6 [00:13<00:00,  2.23s/it][A
Epochs:  18%|█▊        | 2/11 [03:22<15:11, 101.27s/it]

Val Loss: 9.6912 - Val Accuracy: 0.9593



Training:   0%|          | 0/48 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/48 [00:07<06:08,  7.84s/it][A
Training:   4%|▍         | 2/48 [00:08<02:36,  3.41s/it][A
Training:   6%|▋         | 3/48 [00:08<01:26,  1.92s/it][A
Training:   8%|▊         | 4/48 [00:08<00:52,  1.20s/it][A
Training:  10%|█         | 5/48 [00:14<02:15,  3.14s/it][A
Training:  12%|█▎        | 6/48 [00:15<01:30,  2.15s/it][A
Training:  17%|█▋        | 8/48 [00:15<00:45,  1.13s/it][A
Training:  19%|█▉        | 9/48 [00:22<01:42,  2.63s/it][A
Training:  21%|██        | 10/48 [00:22<01:15,  1.98s/it][A
Training:  23%|██▎       | 11/48 [00:22<00:53,  1.46s/it][A
Training:  27%|██▋       | 13/48 [00:29<01:24,  2.41s/it][A
Training:  29%|██▉       | 14/48 [00:30<01:04,  1.89s/it][A
Training:  31%|███▏      | 15/48 [00:30<00:47,  1.44s/it][A
Training:  35%|███▌      | 17/48 [00:37<01:10,  2.29s/it][A
Training:  38%|███▊      | 18/48 [00:37<00:54,  1.82s/it][A
Training:  42%|████▏     | 20/48 [00:37<

Epoch: 3/11 - Loss: 9.7220 - Accuracy: 0.9598



  0%|          | 0/6 [00:00<?, ?it/s][A
 17%|█▋        | 1/6 [00:07<00:37,  7.42s/it][A
 33%|███▎      | 2/6 [00:07<00:12,  3.14s/it][A
 50%|█████     | 3/6 [00:07<00:05,  1.76s/it][A
100%|██████████| 6/6 [00:13<00:00,  2.17s/it][A
Epochs:  27%|██▋       | 3/11 [05:03<13:30, 101.28s/it]

Val Loss: 9.7566 - Val Accuracy: 0.9593



Training:   0%|          | 0/48 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/48 [00:07<06:12,  7.93s/it][A
Training:   4%|▍         | 2/48 [00:08<02:34,  3.36s/it][A
Training:   6%|▋         | 3/48 [00:08<01:25,  1.89s/it][A
Training:   8%|▊         | 4/48 [00:08<00:52,  1.20s/it][A
Training:  10%|█         | 5/48 [00:15<02:18,  3.21s/it][A
Training:  12%|█▎        | 6/48 [00:15<01:32,  2.21s/it][A
Training:  15%|█▍        | 7/48 [00:15<01:03,  1.55s/it][A
Training:  17%|█▋        | 8/48 [00:15<00:43,  1.09s/it][A
Training:  19%|█▉        | 9/48 [00:22<01:49,  2.80s/it][A
Training:  21%|██        | 10/48 [00:22<01:21,  2.16s/it][A
Training:  23%|██▎       | 11/48 [00:23<00:56,  1.54s/it][A
Training:  27%|██▋       | 13/48 [00:29<01:22,  2.37s/it][A
Training:  29%|██▉       | 14/48 [00:30<01:07,  1.99s/it][A
Training:  31%|███▏      | 15/48 [00:30<00:49,  1.51s/it][A
Training:  33%|███▎      | 16/48 [00:30<00:36,  1.13s/it][A
Training:  35%|███▌      | 17/48 [00:37<0

Epoch: 4/11 - Loss: 10.0501 - Accuracy: 0.9627



  0%|          | 0/6 [00:00<?, ?it/s][A
 17%|█▋        | 1/6 [00:07<00:37,  7.50s/it][A
 33%|███▎      | 2/6 [00:07<00:12,  3.17s/it][A
 50%|█████     | 3/6 [00:07<00:05,  1.83s/it][A
 67%|██████▋   | 4/6 [00:08<00:02,  1.18s/it][A
100%|██████████| 6/6 [00:13<00:00,  2.22s/it][A
Epochs:  36%|███▋      | 4/11 [06:46<11:51, 101.70s/it]

Val Loss: 11.0184 - Val Accuracy: 0.9564



Training:   0%|          | 0/48 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/48 [00:08<06:41,  8.53s/it][A
Training:   6%|▋         | 3/48 [00:08<01:43,  2.30s/it][A
Training:   8%|▊         | 4/48 [00:08<01:08,  1.55s/it][A
Training:  10%|█         | 5/48 [00:15<02:23,  3.34s/it][A
Training:  12%|█▎        | 6/48 [00:16<01:38,  2.34s/it][A
Training:  15%|█▍        | 7/48 [00:16<01:08,  1.67s/it][A
Training:  17%|█▋        | 8/48 [00:16<00:48,  1.21s/it][A
Training:  19%|█▉        | 9/48 [00:23<01:53,  2.90s/it][A
Training:  23%|██▎       | 11/48 [00:23<00:58,  1.58s/it][A
Training:  27%|██▋       | 13/48 [00:30<01:23,  2.39s/it][A
Training:  31%|███▏      | 15/48 [00:30<00:52,  1.58s/it][A
Training:  33%|███▎      | 16/48 [00:31<00:41,  1.28s/it][A
Training:  35%|███▌      | 17/48 [00:37<01:17,  2.50s/it][A
Training:  40%|███▉      | 19/48 [00:38<00:46,  1.61s/it][A
Training:  42%|████▏     | 20/48 [00:38<00:36,  1.30s/it][A
Training:  44%|████▍     | 21/48 [00:44<

Epoch: 5/11 - Loss: 10.0221 - Accuracy: 0.9574



  0%|          | 0/6 [00:00<?, ?it/s][A
 17%|█▋        | 1/6 [00:07<00:35,  7.15s/it][A
 33%|███▎      | 2/6 [00:07<00:12,  3.11s/it][A
 67%|██████▋   | 4/6 [00:07<00:02,  1.21s/it][A
 83%|████████▎ | 5/6 [00:12<00:02,  2.42s/it][A
100%|██████████| 6/6 [00:13<00:00,  2.18s/it][A
Epochs:  45%|████▌     | 5/11 [08:28<10:12, 102.05s/it]

Val Loss: 11.0866 - Val Accuracy: 0.9485



Training:   0%|          | 0/48 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/48 [00:07<06:12,  7.93s/it][A
Training:   4%|▍         | 2/48 [00:08<02:33,  3.34s/it][A
Training:   6%|▋         | 3/48 [00:08<01:25,  1.91s/it][A
Training:   8%|▊         | 4/48 [00:08<00:55,  1.27s/it][A
Training:  10%|█         | 5/48 [00:15<02:23,  3.33s/it][A
Training:  15%|█▍        | 7/48 [00:15<01:09,  1.70s/it][A
Training:  19%|█▉        | 9/48 [00:22<01:35,  2.44s/it][A
Training:  21%|██        | 10/48 [00:22<01:13,  1.93s/it][A
Training:  25%|██▌       | 12/48 [00:23<00:42,  1.19s/it][A
Training:  27%|██▋       | 13/48 [00:29<01:23,  2.37s/it][A
Training:  29%|██▉       | 14/48 [00:29<01:04,  1.89s/it][A
Training:  31%|███▏      | 15/48 [00:30<00:47,  1.44s/it][A
Training:  33%|███▎      | 16/48 [00:30<00:34,  1.09s/it][A
Training:  35%|███▌      | 17/48 [00:36<01:19,  2.56s/it][A
Training:  38%|███▊      | 18/48 [00:37<01:02,  2.07s/it][A
Training:  40%|███▉      | 19/48 [00:37

Epoch: 6/11 - Loss: 10.4996 - Accuracy: 0.9596



  0%|          | 0/6 [00:00<?, ?it/s][A
 17%|█▋        | 1/6 [00:06<00:34,  6.99s/it][A
 33%|███▎      | 2/6 [00:07<00:12,  3.04s/it][A
 67%|██████▋   | 4/6 [00:07<00:02,  1.18s/it][A
100%|██████████| 6/6 [00:12<00:00,  2.11s/it][A
Epochs:  55%|█████▍    | 6/11 [10:08<08:26, 101.28s/it]

Val Loss: 12.6936 - Val Accuracy: 0.9577



Training:   0%|          | 0/48 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/48 [00:08<06:31,  8.34s/it][A
Training:   4%|▍         | 2/48 [00:08<02:42,  3.52s/it][A
Training:   6%|▋         | 3/48 [00:08<01:28,  1.96s/it][A
Training:   8%|▊         | 4/48 [00:08<00:55,  1.26s/it][A
Training:  10%|█         | 5/48 [00:15<02:24,  3.36s/it][A
Training:  12%|█▎        | 6/48 [00:16<01:35,  2.28s/it][A
Training:  15%|█▍        | 7/48 [00:16<01:04,  1.58s/it][A
Training:  17%|█▋        | 8/48 [00:16<00:45,  1.14s/it][A
Training:  19%|█▉        | 9/48 [00:23<01:54,  2.93s/it][A
Training:  23%|██▎       | 11/48 [00:23<00:58,  1.59s/it][A
Training:  25%|██▌       | 12/48 [00:23<00:43,  1.22s/it][A
Training:  27%|██▋       | 13/48 [00:30<01:35,  2.73s/it][A
Training:  29%|██▉       | 14/48 [00:30<01:09,  2.04s/it][A
Training:  31%|███▏      | 15/48 [00:30<00:49,  1.51s/it][A
Training:  33%|███▎      | 16/48 [00:31<00:36,  1.13s/it][A
Training:  35%|███▌      | 17/48 [00:38<0

Epoch: 7/11 - Loss: 10.9517 - Accuracy: 0.9604



  0%|          | 0/6 [00:00<?, ?it/s][A
 17%|█▋        | 1/6 [00:06<00:34,  6.91s/it][A
 50%|█████     | 3/6 [00:07<00:05,  1.87s/it][A
 83%|████████▎ | 5/6 [00:12<00:02,  2.33s/it][A
100%|██████████| 6/6 [00:12<00:00,  2.15s/it][A
Epochs:  64%|██████▎   | 7/11 [11:50<06:46, 101.55s/it]

Val Loss: 13.5205 - Val Accuracy: 0.9587



Training:   0%|          | 0/48 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/48 [00:07<06:11,  7.90s/it][A
Training:   4%|▍         | 2/48 [00:08<02:40,  3.49s/it][A
Training:   6%|▋         | 3/48 [00:08<01:28,  1.96s/it][A
Training:   8%|▊         | 4/48 [00:08<00:54,  1.24s/it][A
Training:  10%|█         | 5/48 [00:15<02:22,  3.31s/it][A
Training:  12%|█▎        | 6/48 [00:15<01:35,  2.29s/it][A
Training:  15%|█▍        | 7/48 [00:15<01:04,  1.57s/it][A
Training:  19%|█▉        | 9/48 [00:22<01:36,  2.47s/it][A
Training:  21%|██        | 10/48 [00:22<01:11,  1.88s/it][A
Training:  23%|██▎       | 11/48 [00:23<00:52,  1.41s/it][A
Training:  27%|██▋       | 13/48 [00:30<01:22,  2.36s/it][A
Training:  29%|██▉       | 14/48 [00:30<01:02,  1.85s/it][A
Training:  31%|███▏      | 15/48 [00:30<00:46,  1.42s/it][A
Training:  35%|███▌      | 17/48 [00:37<01:08,  2.22s/it][A
Training:  38%|███▊      | 18/48 [00:37<00:54,  1.80s/it][A
Training:  40%|███▉      | 19/48 [00:37<

Epoch: 8/11 - Loss: 11.6040 - Accuracy: 0.9613



  0%|          | 0/6 [00:00<?, ?it/s][A
 17%|█▋        | 1/6 [00:06<00:33,  6.73s/it][A
 33%|███▎      | 2/6 [00:06<00:11,  2.85s/it][A
 67%|██████▋   | 4/6 [00:07<00:02,  1.11s/it][A
100%|██████████| 6/6 [00:12<00:00,  2.16s/it][A
Epochs:  73%|███████▎  | 8/11 [13:32<05:05, 101.68s/it]

Val Loss: 13.7245 - Val Accuracy: 0.9610



Training:   0%|          | 0/48 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/48 [00:07<06:15,  7.99s/it][A
Training:   4%|▍         | 2/48 [00:08<02:34,  3.36s/it][A
Training:   6%|▋         | 3/48 [00:08<01:25,  1.90s/it][A
Training:   8%|▊         | 4/48 [00:08<00:53,  1.22s/it][A
Training:  10%|█         | 5/48 [00:15<02:19,  3.24s/it][A
Training:  12%|█▎        | 6/48 [00:15<01:33,  2.22s/it][A
Training:  17%|█▋        | 8/48 [00:15<00:47,  1.19s/it][A
Training:  19%|█▉        | 9/48 [00:22<01:43,  2.65s/it][A
Training:  21%|██        | 10/48 [00:22<01:15,  1.98s/it][A
Training:  25%|██▌       | 12/48 [00:22<00:41,  1.16s/it][A
Training:  27%|██▋       | 13/48 [00:29<01:29,  2.55s/it][A
Training:  29%|██▉       | 14/48 [00:30<01:06,  1.96s/it][A
Training:  31%|███▏      | 15/48 [00:30<00:48,  1.47s/it][A
Training:  33%|███▎      | 16/48 [00:30<00:35,  1.11s/it][A
Training:  35%|███▌      | 17/48 [00:36<01:21,  2.63s/it][A
Training:  38%|███▊      | 18/48 [00:37<

Epoch: 9/11 - Loss: 12.5121 - Accuracy: 0.9548



  0%|          | 0/6 [00:00<?, ?it/s][A
 17%|█▋        | 1/6 [00:06<00:34,  6.81s/it][A
 33%|███▎      | 2/6 [00:06<00:11,  2.86s/it][A
 50%|█████     | 3/6 [00:07<00:04,  1.61s/it][A
 67%|██████▋   | 4/6 [00:07<00:02,  1.02s/it][A
100%|██████████| 6/6 [00:12<00:00,  2.16s/it][A
Epochs:  82%|████████▏ | 9/11 [15:14<03:23, 101.78s/it]

Val Loss: 13.9430 - Val Accuracy: 0.9564



Training:   0%|          | 0/48 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/48 [00:08<06:43,  8.58s/it][A
Training:   4%|▍         | 2/48 [00:09<02:55,  3.82s/it][A
Training:   6%|▋         | 3/48 [00:09<01:35,  2.13s/it][A
Training:   8%|▊         | 4/48 [00:09<00:58,  1.33s/it][A
Training:  10%|█         | 5/48 [00:18<02:54,  4.07s/it][A
Training:  12%|█▎        | 6/48 [00:19<02:05,  2.99s/it][A
Training:  17%|█▋        | 8/48 [00:19<01:02,  1.57s/it][A
Training:  19%|█▉        | 9/48 [00:27<02:10,  3.34s/it][A
Training:  21%|██        | 10/48 [00:28<01:38,  2.58s/it][A
Training:  25%|██▌       | 12/48 [00:28<00:53,  1.49s/it][A
Training:  27%|██▋       | 13/48 [00:35<01:40,  2.88s/it][A
Training:  29%|██▉       | 14/48 [00:36<01:17,  2.27s/it][A
Training:  33%|███▎      | 16/48 [00:36<00:43,  1.37s/it][A
Training:  35%|███▌      | 17/48 [00:43<01:23,  2.68s/it][A
Training:  38%|███▊      | 18/48 [00:44<01:04,  2.14s/it][A
Training:  42%|████▏     | 20/48 [00:44<

Epoch: 10/11 - Loss: 11.9473 - Accuracy: 0.9655



  0%|          | 0/6 [00:00<?, ?it/s][A
 17%|█▋        | 1/6 [00:07<00:36,  7.34s/it][A
 33%|███▎      | 2/6 [00:07<00:12,  3.08s/it][A
 67%|██████▋   | 4/6 [00:07<00:02,  1.20s/it][A
100%|██████████| 6/6 [00:13<00:00,  2.31s/it][A
Epochs:  91%|█████████ | 10/11 [17:05<01:44, 104.67s/it]

Val Loss: 13.6562 - Val Accuracy: 0.9553



Training:   0%|          | 0/48 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/48 [00:08<06:52,  8.78s/it][A
Training:   4%|▍         | 2/48 [00:09<02:52,  3.75s/it][A
Training:   6%|▋         | 3/48 [00:09<01:34,  2.10s/it][A
Training:  10%|█         | 5/48 [00:16<02:03,  2.88s/it][A
Training:  12%|█▎        | 6/48 [00:16<01:31,  2.17s/it][A
Training:  17%|█▋        | 8/48 [00:16<00:48,  1.22s/it][A
Training:  19%|█▉        | 9/48 [00:23<01:42,  2.62s/it][A
Training:  21%|██        | 10/48 [00:24<01:20,  2.11s/it][A
Training:  23%|██▎       | 11/48 [00:24<00:58,  1.59s/it][A
Training:  25%|██▌       | 12/48 [00:24<00:42,  1.18s/it][A
Training:  27%|██▋       | 13/48 [00:31<01:36,  2.76s/it][A
Training:  29%|██▉       | 14/48 [00:32<01:14,  2.18s/it][A
Training:  33%|███▎      | 16/48 [00:32<00:39,  1.23s/it][A
Training:  35%|███▌      | 17/48 [00:39<01:20,  2.60s/it][A
Training:  38%|███▊      | 18/48 [00:39<01:01,  2.06s/it][A
Training:  40%|███▉      | 19/48 [00:39

Epoch: 11/11 - Loss: 12.6749 - Accuracy: 0.9638



  0%|          | 0/6 [00:00<?, ?it/s][A
 17%|█▋        | 1/6 [00:07<00:37,  7.50s/it][A
 33%|███▎      | 2/6 [00:07<00:13,  3.30s/it][A
 50%|█████     | 3/6 [00:08<00:05,  1.89s/it][A
100%|██████████| 6/6 [00:13<00:00,  2.31s/it][A
Epochs: 100%|██████████| 11/11 [18:52<00:00, 102.91s/it]


Val Loss: 14.7946 - Val Accuracy: 0.9422


[32m[I 2023-12-08 17:53:24,166][0m Trial 9 finished with value: 0.942152202129364 and parameters: {'loss_learning_rate': 0.0001778030429749886, 'learning_rate': 0.001724236805793263, 'weight_decay': 0.00028529889321951747, 'epsilon': 1.4780077810240457e-09, 'beta': 0.8, 'gamma': 0.5, 'batch_size': 293, 'epochs': 11}. Best is trial 0 with value: 0.9648317694664001.[0m


Learning rate for Loss: 0.0022227970010410235
Learning rate: 0.00011114133406906028
Weight decay: 0.0012654121241573045
Epsilon: 1.0085253202150492e-09
Beta: 1.0
Gamma: 1.0
Batch size: 62
Number of epochs: 68


Epochs:   0%|          | 0/68 [00:00<?, ?it/s]
Training:   0%|          | 0/226 [00:00<?, ?it/s][A
Training:   0%|          | 1/226 [00:02<07:54,  2.11s/it][A
Training:   1%|▏         | 3/226 [00:02<02:13,  1.67it/s][A
Training:   2%|▏         | 5/226 [00:03<02:27,  1.49it/s][A
Training:   3%|▎         | 7/226 [00:03<01:29,  2.46it/s][A
Training:   4%|▍         | 9/226 [00:05<02:01,  1.78it/s][A
Training:   5%|▍         | 11/226 [00:05<01:23,  2.57it/s][A
Training:   6%|▌         | 13/226 [00:07<01:45,  2.01it/s][A
Training:   7%|▋         | 16/226 [00:07<01:03,  3.29it/s][A
Training:   8%|▊         | 18/226 [00:08<01:30,  2.30it/s][A
Training:   9%|▉         | 21/226 [00:10<01:42,  2.01it/s][A
Training:  10%|█         | 23/226 [00:10<01:17,  2.63it/s][A
Training:  11%|█         | 25/226 [00:12<01:37,  2.06it/s][A
Training:  12%|█▏        | 27/226 [00:12<01:12,  2.74it/s][A
Training:  13%|█▎        | 29/226 [00:13<01:32,  2.13it/s][A
Training:  15%|█▍        | 33/226 [00

Epoch: 1/68 - Loss: 23.2720 - Accuracy: 0.8649



  0%|          | 0/29 [00:00<?, ?it/s][A
  3%|▎         | 1/29 [00:01<00:51,  1.84s/it][A
  7%|▋         | 2/29 [00:02<00:24,  1.12it/s][A
 17%|█▋        | 5/29 [00:03<00:12,  1.90it/s][A
 21%|██        | 6/29 [00:03<00:11,  2.06it/s][A
 31%|███       | 9/29 [00:04<00:08,  2.39it/s][A
 34%|███▍      | 10/29 [00:05<00:07,  2.39it/s][A
 41%|████▏     | 12/29 [00:05<00:04,  3.48it/s][A
 45%|████▍     | 13/29 [00:06<00:07,  2.28it/s][A
 48%|████▊     | 14/29 [00:06<00:06,  2.49it/s][A
 55%|█████▌    | 16/29 [00:06<00:03,  3.73it/s][A
 59%|█████▊    | 17/29 [00:07<00:05,  2.20it/s][A
 62%|██████▏   | 18/29 [00:07<00:04,  2.52it/s][A
 69%|██████▉   | 20/29 [00:08<00:02,  3.86it/s][A
 72%|███████▏  | 21/29 [00:09<00:03,  2.28it/s][A
 76%|███████▌  | 22/29 [00:09<00:02,  2.35it/s][A
 86%|████████▌ | 25/29 [00:10<00:01,  2.63it/s][A
100%|██████████| 29/29 [00:10<00:00,  2.66it/s][A
Epochs:   0%|          | 0/68 [01:43<?, ?it/s]
[32m[I 2023-12-08 17:55:08,807][0m Trial 10 pr

Val Loss: 12.9893 - Val Accuracy: 0.9394
Learning rate for Loss: 0.0016533229994379524
Learning rate: 1.7419597116507105e-05
Weight decay: 0.005957082182471941
Epsilon: 4.839346938366986e-09
Beta: 0.2
Gamma: 0.7000000000000001
Batch size: 143
Number of epochs: 67


Epochs:   0%|          | 0/67 [00:00<?, ?it/s]
Training:   0%|          | 0/98 [00:00<?, ?it/s][A
Training:   1%|          | 1/98 [00:04<06:47,  4.20s/it][A
Training:   2%|▏         | 2/98 [00:04<02:51,  1.79s/it][A
Training:   3%|▎         | 3/98 [00:04<01:37,  1.03s/it][A
Training:   5%|▌         | 5/98 [00:08<02:21,  1.52s/it][A
Training:   6%|▌         | 6/98 [00:08<01:44,  1.13s/it][A
Training:   8%|▊         | 8/98 [00:08<00:59,  1.52it/s][A
Training:   9%|▉         | 9/98 [00:12<02:00,  1.35s/it][A
Training:  11%|█         | 11/98 [00:12<01:11,  1.22it/s][A
Training:  13%|█▎        | 13/98 [00:15<01:40,  1.19s/it][A
Training:  15%|█▌        | 15/98 [00:15<01:06,  1.24it/s][A
Training:  17%|█▋        | 17/98 [00:19<01:29,  1.10s/it][A
Training:  19%|█▉        | 19/98 [00:19<01:00,  1.30it/s][A
Training:  21%|██▏       | 21/98 [00:22<01:20,  1.05s/it][A
Training:  22%|██▏       | 22/98 [00:23<01:09,  1.09it/s][A
Training:  24%|██▍       | 24/98 [00:23<00:46,  1.60it

Epoch: 1/67 - Loss: 21.9563 - Accuracy: 0.6028



  0%|          | 0/13 [00:00<?, ?it/s][A
  8%|▊         | 1/13 [00:04<00:48,  4.02s/it][A
 15%|█▌        | 2/13 [00:04<00:18,  1.73s/it][A
 23%|██▎       | 3/13 [00:04<00:09,  1.01it/s][A
 38%|███▊      | 5/13 [00:07<00:10,  1.33s/it][A
 46%|████▌     | 6/13 [00:07<00:06,  1.02it/s][A
 54%|█████▍    | 7/13 [00:07<00:04,  1.37it/s][A
 62%|██████▏   | 8/13 [00:07<00:02,  1.83it/s][A
 69%|██████▉   | 9/13 [00:10<00:04,  1.24s/it][A
100%|██████████| 13/13 [00:11<00:00,  1.15it/s][A
Epochs:   0%|          | 0/67 [01:43<?, ?it/s]
[32m[I 2023-12-08 17:56:52,793][0m Trial 11 pruned. [0m


Val Loss: 18.3335 - Val Accuracy: 0.7227
Learning rate for Loss: 0.0004535126843030028
Learning rate: 0.00015103059926292156
Weight decay: 0.0011148955173299832
Epsilon: 6.052679797212322e-08
Beta: 0.1
Gamma: 0.6
Batch size: 279
Number of epochs: 99


Epochs:   0%|          | 0/99 [00:00<?, ?it/s]
Training:   0%|          | 0/51 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/51 [00:07<06:39,  7.98s/it][A
Training:   4%|▍         | 2/51 [00:08<02:48,  3.45s/it][A
Training:   6%|▌         | 3/51 [00:08<01:39,  2.07s/it][A
Training:  10%|▉         | 5/51 [00:15<02:06,  2.75s/it][A
Training:  12%|█▏        | 6/51 [00:15<01:31,  2.04s/it][A
Training:  14%|█▎        | 7/51 [00:16<01:11,  1.63s/it][A
Training:  18%|█▊        | 9/51 [00:22<01:40,  2.39s/it][A
Training:  20%|█▉        | 10/51 [00:22<01:15,  1.85s/it][A
Training:  22%|██▏       | 11/51 [00:23<01:01,  1.54s/it][A
Training:  24%|██▎       | 12/51 [00:23<00:44,  1.15s/it][A
Training:  25%|██▌       | 13/51 [00:30<01:39,  2.62s/it][A
Training:  27%|██▋       | 14/51 [00:30<01:13,  1.98s/it][A
Training:  29%|██▉       | 15/51 [00:31<00:56,  1.57s/it][A
Training:  31%|███▏      | 16/51 [00:31<00:40,  1.16s/it][A
Training:  33%|███▎      | 17/51 [00:37<01:33,  2.75s/

Epoch: 1/99 - Loss: 11.1655 - Accuracy: 0.8366



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:07<00:42,  7.15s/it][A
 29%|██▊       | 2/7 [00:07<00:15,  3.04s/it][A
 43%|████▎     | 3/7 [00:07<00:06,  1.72s/it][A
 71%|███████▏  | 5/7 [00:12<00:04,  2.30s/it][A
100%|██████████| 7/7 [00:13<00:00,  1.91s/it][A
Epochs:   0%|          | 0/99 [01:47<?, ?it/s]
[32m[I 2023-12-08 17:58:41,264][0m Trial 12 pruned. [0m


Val Loss: 5.5010 - Val Accuracy: 0.9322
Learning rate for Loss: 0.0016497647090660487
Learning rate: 0.00017578913403869465
Weight decay: 0.0006675163553006042
Epsilon: 1.755368853591293e-08
Beta: 0.7000000000000001
Gamma: 0.9
Batch size: 243
Number of epochs: 63


Epochs:   0%|          | 0/63 [00:00<?, ?it/s]
Training:   0%|          | 0/58 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/58 [00:06<06:09,  6.48s/it][A
Training:   3%|▎         | 2/58 [00:07<02:47,  2.99s/it][A
Training:   5%|▌         | 3/58 [00:07<01:35,  1.73s/it][A
Training:   9%|▊         | 5/58 [00:13<02:09,  2.44s/it][A
Training:  10%|█         | 6/58 [00:13<01:40,  1.93s/it][A
Training:  12%|█▏        | 7/58 [00:14<01:11,  1.41s/it][A
Training:  16%|█▌        | 9/58 [00:19<01:35,  1.95s/it][A
Training:  17%|█▋        | 10/58 [00:20<01:22,  1.73s/it][A
Training:  19%|█▉        | 11/58 [00:20<01:01,  1.31s/it][A
Training:  22%|██▏       | 13/58 [00:25<01:23,  1.87s/it][A
Training:  24%|██▍       | 14/58 [00:26<01:13,  1.68s/it][A
Training:  28%|██▊       | 16/58 [00:26<00:43,  1.03s/it][A
Training:  29%|██▉       | 17/58 [00:32<01:23,  2.04s/it][A
Training:  31%|███       | 18/58 [00:33<01:11,  1.79s/it][A
Training:  33%|███▎      | 19/58 [00:33<00:54,  1.40s/

Epoch: 1/63 - Loss: 23.1463 - Accuracy: 0.7930



  0%|          | 0/8 [00:00<?, ?it/s][A
 12%|█▎        | 1/8 [00:06<00:42,  6.09s/it][A
 25%|██▌       | 2/8 [00:06<00:16,  2.69s/it][A
 50%|█████     | 4/8 [00:06<00:04,  1.05s/it][A
 62%|██████▎   | 5/8 [00:11<00:07,  2.34s/it][A
 75%|███████▌  | 6/8 [00:12<00:03,  1.71s/it][A
100%|██████████| 8/8 [00:12<00:00,  1.54s/it][A
Epochs:   0%|          | 0/63 [01:51<?, ?it/s]
[32m[I 2023-12-08 18:00:33,413][0m Trial 13 pruned. [0m


Val Loss: 13.6321 - Val Accuracy: 0.9318
Learning rate for Loss: 0.0001045606317460309
Learning rate: 4.336281088315565e-05
Weight decay: 0.00159704810203426
Epsilon: 4.070376153578847e-09
Beta: 0.2
Gamma: 0.5
Batch size: 137
Number of epochs: 32


Epochs:   0%|          | 0/32 [00:00<?, ?it/s]
Training:   0%|          | 0/102 [00:00<?, ?it/s][A
Training:   1%|          | 1/102 [00:04<07:37,  4.53s/it][A
Training:   2%|▏         | 2/102 [00:04<03:12,  1.93s/it][A
Training:   4%|▍         | 4/102 [00:04<01:14,  1.32it/s][A
Training:   6%|▌         | 6/102 [00:08<02:10,  1.36s/it][A
Training:   9%|▉         | 9/102 [00:12<02:05,  1.35s/it][A
Training:  10%|▉         | 10/102 [00:12<01:42,  1.11s/it][A
Training:  11%|█         | 11/102 [00:13<01:21,  1.11it/s][A
Training:  12%|█▏        | 12/102 [00:13<01:04,  1.40it/s][A
Training:  13%|█▎        | 13/102 [00:16<02:02,  1.37s/it][A
Training:  15%|█▍        | 15/102 [00:16<01:12,  1.20it/s][A
Training:  16%|█▌        | 16/102 [00:16<00:57,  1.49it/s][A
Training:  17%|█▋        | 17/102 [00:20<01:58,  1.40s/it][A
Training:  19%|█▊        | 19/102 [00:20<01:09,  1.19it/s][A
Training:  21%|██        | 21/102 [00:24<01:38,  1.22s/it][A
Training:  24%|██▎       | 24/102 [00

Epoch: 1/32 - Loss: 14.3615 - Accuracy: 0.7203



  0%|          | 0/13 [00:00<?, ?it/s][A
  8%|▊         | 1/13 [00:03<00:44,  3.69s/it][A
 23%|██▎       | 3/13 [00:03<00:10,  1.04s/it][A
 38%|███▊      | 5/13 [00:06<00:10,  1.29s/it][A
 46%|████▌     | 6/13 [00:07<00:06,  1.03it/s][A
 54%|█████▍    | 7/13 [00:07<00:04,  1.29it/s][A
 69%|██████▉   | 9/13 [00:10<00:04,  1.08s/it][A
 85%|████████▍ | 11/13 [00:10<00:01,  1.36it/s][A
100%|██████████| 13/13 [00:12<00:00,  1.02it/s][A
Epochs:   0%|          | 0/32 [01:50<?, ?it/s]


Val Loss: 10.1629 - Val Accuracy: 0.8829


[32m[I 2023-12-08 18:02:24,384][0m Trial 14 pruned. [0m


Learning rate for Loss: 0.00953499792102873
Learning rate: 0.0004893954558618118
Weight decay: 0.004977508654911263
Epsilon: 8.634793963388647e-08
Beta: 0.5
Gamma: 0.6
Batch size: 165
Number of epochs: 56


Epochs:   0%|          | 0/56 [00:00<?, ?it/s]
Training:   0%|          | 0/85 [00:00<?, ?it/s][A
Training:   1%|          | 1/85 [00:05<07:21,  5.26s/it][A
Training:   2%|▏         | 2/85 [00:05<03:06,  2.24s/it][A
Training:   5%|▍         | 4/85 [00:05<01:11,  1.14it/s][A
Training:   6%|▌         | 5/85 [00:10<02:44,  2.05s/it][A
Training:   8%|▊         | 7/85 [00:10<01:26,  1.11s/it][A
Training:  11%|█         | 9/85 [00:14<01:55,  1.52s/it][A
Training:  13%|█▎        | 11/85 [00:14<01:13,  1.01it/s][A
Training:  15%|█▌        | 13/85 [00:19<01:42,  1.43s/it][A
Training:  16%|█▋        | 14/85 [00:19<01:23,  1.18s/it][A
Training:  18%|█▊        | 15/85 [00:19<01:06,  1.06it/s][A
Training:  19%|█▉        | 16/85 [00:19<00:51,  1.33it/s][A
Training:  20%|██        | 17/85 [00:23<01:50,  1.62s/it][A
Training:  21%|██        | 18/85 [00:23<01:22,  1.22s/it][A
Training:  24%|██▎       | 20/85 [00:24<00:46,  1.39it/s][A
Training:  25%|██▍       | 21/85 [00:28<01:42,  1.60s

Epoch: 1/56 - Loss: 9.4553 - Accuracy: 0.9004



  0%|          | 0/11 [00:00<?, ?it/s][A
  9%|▉         | 1/11 [00:04<00:45,  4.55s/it][A
 27%|██▋       | 3/11 [00:04<00:09,  1.24s/it][A
 36%|███▋      | 4/11 [00:04<00:05,  1.17it/s][A
 45%|████▌     | 5/11 [00:08<00:10,  1.81s/it][A
 55%|█████▍    | 6/11 [00:08<00:06,  1.27s/it][A
 64%|██████▎   | 7/11 [00:08<00:03,  1.10it/s][A
 73%|███████▎  | 8/11 [00:09<00:02,  1.48it/s][A
 82%|████████▏ | 9/11 [00:12<00:03,  1.61s/it][A
100%|██████████| 11/11 [00:13<00:00,  1.19s/it][A
Epochs:   2%|▏         | 1/56 [01:48<1:39:28, 108.52s/it]

Val Loss: 5.1366 - Val Accuracy: 0.9572



Training:   0%|          | 0/85 [00:00<?, ?it/s][A
Training:   1%|          | 1/85 [00:05<07:45,  5.54s/it][A
Training:   2%|▏         | 2/85 [00:05<03:18,  2.39s/it][A
Training:   4%|▎         | 3/85 [00:05<01:52,  1.38s/it][A
Training:   5%|▍         | 4/85 [00:06<01:11,  1.13it/s][A
Training:   6%|▌         | 5/85 [00:10<02:43,  2.04s/it][A
Training:   7%|▋         | 6/85 [00:10<01:49,  1.39s/it][A
Training:   8%|▊         | 7/85 [00:10<01:16,  1.02it/s][A
Training:  11%|█         | 9/85 [00:14<01:59,  1.57s/it][A
Training:  12%|█▏        | 10/85 [00:14<01:30,  1.20s/it][A
Training:  13%|█▎        | 11/85 [00:15<01:08,  1.07it/s][A
Training:  14%|█▍        | 12/85 [00:15<00:51,  1.42it/s][A
Training:  15%|█▌        | 13/85 [00:19<02:00,  1.67s/it][A
Training:  16%|█▋        | 14/85 [00:19<01:26,  1.22s/it][A
Training:  18%|█▊        | 15/85 [00:19<01:03,  1.10it/s][A
Training:  19%|█▉        | 16/85 [00:19<00:46,  1.48it/s][A
Training:  20%|██        | 17/85 [00:23<

Epoch: 2/56 - Loss: 4.9227 - Accuracy: 0.9558



  0%|          | 0/11 [00:00<?, ?it/s][A
  9%|▉         | 1/11 [00:04<00:45,  4.59s/it][A
 18%|█▊        | 2/11 [00:04<00:18,  2.02s/it][A
 27%|██▋       | 3/11 [00:04<00:09,  1.15s/it][A
 45%|████▌     | 5/11 [00:08<00:09,  1.61s/it][A
 64%|██████▎   | 7/11 [00:08<00:03,  1.09it/s][A
 82%|████████▏ | 9/11 [00:12<00:02,  1.26s/it][A
100%|██████████| 11/11 [00:13<00:00,  1.19s/it][A
Epochs:   4%|▎         | 2/56 [03:38<1:38:24, 109.34s/it]

Val Loss: 4.6242 - Val Accuracy: 0.9568



Training:   0%|          | 0/85 [00:00<?, ?it/s][A
Training:   1%|          | 1/85 [00:05<07:27,  5.32s/it][A
Training:   4%|▎         | 3/85 [00:05<01:56,  1.42s/it][A
Training:   6%|▌         | 5/85 [00:10<02:29,  1.87s/it][A
Training:   8%|▊         | 7/85 [00:10<01:26,  1.11s/it][A
Training:   9%|▉         | 8/85 [00:10<01:07,  1.13it/s][A
Training:  11%|█         | 9/85 [00:14<02:13,  1.75s/it][A
Training:  12%|█▏        | 10/85 [00:14<01:39,  1.33s/it][A
Training:  13%|█▎        | 11/85 [00:14<01:15,  1.01s/it][A
Training:  15%|█▌        | 13/85 [00:19<01:45,  1.46s/it][A
Training:  19%|█▉        | 16/85 [00:19<00:53,  1.28it/s][A
Training:  20%|██        | 17/85 [00:23<01:35,  1.41s/it][A
Training:  22%|██▏       | 19/85 [00:23<01:02,  1.06it/s][A
Training:  25%|██▍       | 21/85 [00:27<01:20,  1.26s/it][A
Training:  27%|██▋       | 23/85 [00:27<00:54,  1.14it/s][A
Training:  29%|██▉       | 25/85 [00:31<01:12,  1.21s/it][A
Training:  33%|███▎      | 28/85 [00:3

Epoch: 3/56 - Loss: 3.8825 - Accuracy: 0.9628



  0%|          | 0/11 [00:00<?, ?it/s][A
  9%|▉         | 1/11 [00:04<00:45,  4.51s/it][A
 36%|███▋      | 4/11 [00:04<00:06,  1.13it/s][A
 55%|█████▍    | 6/11 [00:08<00:06,  1.34s/it][A
 73%|███████▎  | 8/11 [00:08<00:02,  1.17it/s][A
100%|██████████| 11/11 [00:12<00:00,  1.10s/it][A
Epochs:   5%|▌         | 3/56 [05:22<1:34:19, 106.79s/it]

Val Loss: 4.0661 - Val Accuracy: 0.9637



Training:   0%|          | 0/85 [00:00<?, ?it/s][A
Training:   1%|          | 1/85 [00:05<07:01,  5.02s/it][A
Training:   4%|▎         | 3/85 [00:05<01:50,  1.35s/it][A
Training:   6%|▌         | 5/85 [00:09<02:20,  1.76s/it][A
Training:   8%|▊         | 7/85 [00:09<01:20,  1.03s/it][A
Training:  11%|█         | 9/85 [00:13<01:48,  1.42s/it][A
Training:  13%|█▎        | 11/85 [00:13<01:10,  1.06it/s][A
Training:  15%|█▌        | 13/85 [00:17<01:34,  1.31s/it][A
Training:  16%|█▋        | 14/85 [00:18<01:17,  1.08s/it][A
Training:  19%|█▉        | 16/85 [00:18<00:50,  1.37it/s][A
Training:  20%|██        | 17/85 [00:21<01:25,  1.25s/it][A
Training:  22%|██▏       | 19/85 [00:21<00:53,  1.23it/s][A
Training:  24%|██▎       | 20/85 [00:21<00:43,  1.49it/s][A
Training:  25%|██▍       | 21/85 [00:25<01:27,  1.37s/it][A
Training:  26%|██▌       | 22/85 [00:25<01:08,  1.08s/it][A
Training:  27%|██▋       | 23/85 [00:25<00:51,  1.20it/s][A
Training:  29%|██▉       | 25/85 [00:

Epoch: 4/56 - Loss: 3.5410 - Accuracy: 0.9640



  0%|          | 0/11 [00:00<?, ?it/s][A
  9%|▉         | 1/11 [00:05<00:53,  5.32s/it][A
 18%|█▊        | 2/11 [00:05<00:21,  2.34s/it][A
 27%|██▋       | 3/11 [00:05<00:10,  1.35s/it][A
 45%|████▌     | 5/11 [00:09<00:09,  1.62s/it][A
 55%|█████▍    | 6/11 [00:09<00:06,  1.23s/it][A
 82%|████████▏ | 9/11 [00:13<00:02,  1.22s/it][A
100%|██████████| 11/11 [00:14<00:00,  1.28s/it][A
Epochs:   7%|▋         | 4/56 [07:05<1:31:26, 105.51s/it]

Val Loss: 3.7237 - Val Accuracy: 0.9539



Training:   0%|          | 0/85 [00:00<?, ?it/s][A
Training:   1%|          | 1/85 [00:06<09:08,  6.53s/it][A
Training:   2%|▏         | 2/85 [00:06<03:52,  2.80s/it][A
Training:   4%|▎         | 3/85 [00:07<02:15,  1.65s/it][A
Training:   5%|▍         | 4/85 [00:07<01:29,  1.10s/it][A
Training:   6%|▌         | 5/85 [00:12<03:24,  2.56s/it][A
Training:   7%|▋         | 6/85 [00:12<02:17,  1.74s/it][A
Training:   8%|▊         | 7/85 [00:12<01:34,  1.22s/it][A
Training:   9%|▉         | 8/85 [00:12<01:09,  1.10it/s][A
Training:  11%|█         | 9/85 [00:18<02:48,  2.22s/it][A
Training:  12%|█▏        | 10/85 [00:18<01:57,  1.57s/it][A
Training:  13%|█▎        | 11/85 [00:18<01:24,  1.14s/it][A
Training:  14%|█▍        | 12/85 [00:18<01:01,  1.18it/s][A
Training:  15%|█▌        | 13/85 [00:23<02:20,  1.96s/it][A
Training:  16%|█▋        | 14/85 [00:23<01:40,  1.41s/it][A
Training:  18%|█▊        | 15/85 [00:23<01:11,  1.02s/it][A
Training:  19%|█▉        | 16/85 [00:23<0

Epoch: 5/56 - Loss: 3.4093 - Accuracy: 0.9651



  0%|          | 0/11 [00:00<?, ?it/s][A
  9%|▉         | 1/11 [00:04<00:48,  4.88s/it][A
 18%|█▊        | 2/11 [00:05<00:18,  2.09s/it][A
 27%|██▋       | 3/11 [00:05<00:09,  1.18s/it][A
 45%|████▌     | 5/11 [00:09<00:09,  1.62s/it][A
 64%|██████▎   | 7/11 [00:09<00:03,  1.09it/s][A
 73%|███████▎  | 8/11 [00:09<00:02,  1.36it/s][A
 82%|████████▏ | 9/11 [00:12<00:02,  1.39s/it][A
100%|██████████| 11/11 [00:12<00:00,  1.17s/it][A
Epochs:   9%|▉         | 5/56 [08:58<1:31:46, 107.96s/it]

Val Loss: 4.2435 - Val Accuracy: 0.9550



Training:   0%|          | 0/85 [00:00<?, ?it/s][A
Training:   1%|          | 1/85 [00:05<07:11,  5.14s/it][A
Training:   4%|▎         | 3/85 [00:05<01:53,  1.38s/it][A
Training:   6%|▌         | 5/85 [00:09<02:22,  1.78s/it][A
Training:   8%|▊         | 7/85 [00:09<01:22,  1.05s/it][A
Training:   9%|▉         | 8/85 [00:09<01:04,  1.19it/s][A
Training:  11%|█         | 9/85 [00:13<02:01,  1.60s/it][A
Training:  13%|█▎        | 11/85 [00:13<01:12,  1.02it/s][A
Training:  14%|█▍        | 12/85 [00:14<00:57,  1.28it/s][A
Training:  15%|█▌        | 13/85 [00:17<01:44,  1.45s/it][A
Training:  16%|█▋        | 14/85 [00:17<01:18,  1.11s/it][A
Training:  18%|█▊        | 15/85 [00:17<01:00,  1.15it/s][A
Training:  20%|██        | 17/85 [00:21<01:29,  1.32s/it][A
Training:  21%|██        | 18/85 [00:21<01:11,  1.07s/it][A
Training:  22%|██▏       | 19/85 [00:22<00:58,  1.13it/s][A
Training:  25%|██▍       | 21/85 [00:26<01:23,  1.30s/it][A
Training:  26%|██▌       | 22/85 [00:2

Epoch: 6/56 - Loss: 3.2302 - Accuracy: 0.9666



  0%|          | 0/11 [00:00<?, ?it/s][A
  9%|▉         | 1/11 [00:04<00:45,  4.59s/it][A
 27%|██▋       | 3/11 [00:04<00:09,  1.23s/it][A
 45%|████▌     | 5/11 [00:08<00:09,  1.57s/it][A
 55%|█████▍    | 6/11 [00:08<00:05,  1.18s/it][A
 64%|██████▎   | 7/11 [00:08<00:03,  1.13it/s][A
 82%|████████▏ | 9/11 [00:12<00:02,  1.22s/it][A
100%|██████████| 11/11 [00:12<00:00,  1.13s/it][A
Epochs:  11%|█         | 6/56 [10:42<1:28:55, 106.72s/it]

Val Loss: 4.0795 - Val Accuracy: 0.9587



Training:   0%|          | 0/85 [00:00<?, ?it/s][A
Training:   1%|          | 1/85 [00:05<07:05,  5.07s/it][A
Training:   4%|▎         | 3/85 [00:05<01:51,  1.36s/it][A
Training:   6%|▌         | 5/85 [00:10<02:32,  1.90s/it][A
Training:   9%|▉         | 8/85 [00:10<01:11,  1.08it/s][A
Training:  12%|█▏        | 10/85 [00:13<01:33,  1.25s/it][A
Training:  15%|█▌        | 13/85 [00:17<01:30,  1.26s/it][A
Training:  16%|█▋        | 14/85 [00:18<01:18,  1.11s/it][A
Training:  18%|█▊        | 15/85 [00:18<01:04,  1.08it/s][A
Training:  19%|█▉        | 16/85 [00:18<00:51,  1.34it/s][A
Training:  20%|██        | 17/85 [00:22<01:38,  1.45s/it][A
Training:  21%|██        | 18/85 [00:22<01:19,  1.18s/it][A
Training:  24%|██▎       | 20/85 [00:22<00:46,  1.39it/s][A
Training:  25%|██▍       | 21/85 [00:25<01:24,  1.32s/it][A
Training:  26%|██▌       | 22/85 [00:26<01:12,  1.15s/it][A
Training:  27%|██▋       | 23/85 [00:26<00:55,  1.12it/s][A
Training:  28%|██▊       | 24/85 [00

Epoch: 7/56 - Loss: 3.2331 - Accuracy: 0.9680



  0%|          | 0/11 [00:00<?, ?it/s][A
  9%|▉         | 1/11 [00:04<00:46,  4.67s/it][A
 18%|█▊        | 2/11 [00:04<00:17,  1.99s/it][A
 27%|██▋       | 3/11 [00:04<00:09,  1.14s/it][A
 36%|███▋      | 4/11 [00:05<00:05,  1.36it/s][A
 45%|████▌     | 5/11 [00:08<00:10,  1.67s/it][A
 73%|███████▎  | 8/11 [00:08<00:02,  1.47it/s][A
100%|██████████| 11/11 [00:12<00:00,  1.10s/it][A
Epochs:  12%|█▎        | 7/56 [12:25<1:26:12, 105.56s/it]

Val Loss: 3.7672 - Val Accuracy: 0.9609



Training:   0%|          | 0/85 [00:00<?, ?it/s][A
Training:   1%|          | 1/85 [00:05<07:28,  5.34s/it][A
Training:   2%|▏         | 2/85 [00:05<03:09,  2.29s/it][A
Training:   4%|▎         | 3/85 [00:05<01:48,  1.32s/it][A
Training:   5%|▍         | 4/85 [00:05<01:08,  1.18it/s][A
Training:   6%|▌         | 5/85 [00:09<02:38,  1.98s/it][A
Training:   7%|▋         | 6/85 [00:09<01:46,  1.34s/it][A
Training:   9%|▉         | 8/85 [00:10<00:55,  1.39it/s][A
Training:  11%|█         | 9/85 [00:13<01:55,  1.52s/it][A
Training:  13%|█▎        | 11/85 [00:14<01:07,  1.10it/s][A
Training:  15%|█▌        | 13/85 [00:18<01:35,  1.33s/it][A
Training:  18%|█▊        | 15/85 [00:18<01:02,  1.12it/s][A
Training:  19%|█▉        | 16/85 [00:18<00:50,  1.36it/s][A
Training:  20%|██        | 17/85 [00:22<01:36,  1.42s/it][A
Training:  22%|██▏       | 19/85 [00:22<01:00,  1.10it/s][A
Training:  25%|██▍       | 21/85 [00:26<01:23,  1.31s/it][A
Training:  26%|██▌       | 22/85 [00:26<

Epoch: 8/56 - Loss: 3.1454 - Accuracy: 0.9683



  0%|          | 0/11 [00:00<?, ?it/s][A
  9%|▉         | 1/11 [00:04<00:44,  4.41s/it][A
 18%|█▊        | 2/11 [00:04<00:17,  1.91s/it][A
 36%|███▋      | 4/11 [00:04<00:05,  1.33it/s][A
 45%|████▌     | 5/11 [00:08<00:09,  1.61s/it][A
 55%|█████▍    | 6/11 [00:08<00:05,  1.19s/it][A
 73%|███████▎  | 8/11 [00:08<00:01,  1.50it/s][A
 82%|████████▏ | 9/11 [00:11<00:02,  1.34s/it][A
100%|██████████| 11/11 [00:12<00:00,  1.13s/it][A
Epochs:  14%|█▍        | 8/56 [14:09<1:24:10, 105.21s/it]

Val Loss: 3.7659 - Val Accuracy: 0.9573



Training:   0%|          | 0/85 [00:00<?, ?it/s][A
Training:   1%|          | 1/85 [00:05<07:01,  5.02s/it][A
Training:   4%|▎         | 3/85 [00:05<01:53,  1.38s/it][A
Training:   6%|▌         | 5/85 [00:08<02:05,  1.56s/it][A
Training:   7%|▋         | 6/85 [00:08<01:34,  1.19s/it][A
Training:   8%|▊         | 7/85 [00:09<01:09,  1.12it/s][A
Training:   9%|▉         | 8/85 [00:09<00:52,  1.46it/s][A
Training:  11%|█         | 9/85 [00:12<01:58,  1.56s/it][A
Training:  12%|█▏        | 10/85 [00:13<01:31,  1.22s/it][A
Training:  13%|█▎        | 11/85 [00:13<01:06,  1.12it/s][A
Training:  14%|█▍        | 12/85 [00:13<00:51,  1.41it/s][A
Training:  15%|█▌        | 13/85 [00:16<01:45,  1.47s/it][A
Training:  16%|█▋        | 14/85 [00:17<01:26,  1.21s/it][A
Training:  18%|█▊        | 15/85 [00:17<01:02,  1.12it/s][A
Training:  19%|█▉        | 16/85 [00:17<00:47,  1.45it/s][A
Training:  20%|██        | 17/85 [00:21<01:35,  1.41s/it][A
Training:  21%|██        | 18/85 [00:21

Epoch: 9/56 - Loss: 3.2035 - Accuracy: 0.9687



  0%|          | 0/11 [00:00<?, ?it/s][A
  9%|▉         | 1/11 [00:04<00:45,  4.53s/it][A
 27%|██▋       | 3/11 [00:04<00:10,  1.26s/it][A
 45%|████▌     | 5/11 [00:08<00:09,  1.52s/it][A
 64%|██████▎   | 7/11 [00:08<00:04,  1.00s/it][A
 73%|███████▎  | 8/11 [00:09<00:02,  1.25it/s][A
 82%|████████▏ | 9/11 [00:11<00:02,  1.29s/it][A
100%|██████████| 11/11 [00:12<00:00,  1.12s/it][A
Epochs:  16%|█▌        | 9/56 [15:51<1:21:34, 104.15s/it]

Val Loss: 3.6764 - Val Accuracy: 0.9666



Training:   0%|          | 0/85 [00:00<?, ?it/s][A
Training:   1%|          | 1/85 [00:04<06:49,  4.87s/it][A
Training:   4%|▎         | 3/85 [00:05<01:47,  1.31s/it][A
Training:   6%|▌         | 5/85 [00:09<02:20,  1.75s/it][A
Training:   7%|▋         | 6/85 [00:09<01:43,  1.32s/it][A
Training:   8%|▊         | 7/85 [00:09<01:17,  1.01it/s][A
Training:  11%|█         | 9/85 [00:13<01:49,  1.45s/it][A
Training:  13%|█▎        | 11/85 [00:13<01:08,  1.09it/s][A
Training:  15%|█▌        | 13/85 [00:17<01:29,  1.24s/it][A
Training:  18%|█▊        | 15/85 [00:17<00:58,  1.19it/s][A
Training:  20%|██        | 17/85 [00:21<01:22,  1.22s/it][A
Training:  21%|██        | 18/85 [00:21<01:08,  1.02s/it][A
Training:  22%|██▏       | 19/85 [00:21<00:55,  1.20it/s][A
Training:  24%|██▎       | 20/85 [00:21<00:43,  1.51it/s][A
Training:  25%|██▍       | 21/85 [00:25<01:32,  1.45s/it][A
Training:  27%|██▋       | 23/85 [00:25<00:54,  1.14it/s][A
Training:  29%|██▉       | 25/85 [00:3

Epoch: 10/56 - Loss: 3.1631 - Accuracy: 0.9689



  0%|          | 0/11 [00:00<?, ?it/s][A
  9%|▉         | 1/11 [00:04<00:43,  4.39s/it][A
 27%|██▋       | 3/11 [00:04<00:09,  1.19s/it][A
 45%|████▌     | 5/11 [00:08<00:09,  1.57s/it][A
 73%|███████▎  | 8/11 [00:08<00:02,  1.30it/s][A
100%|██████████| 11/11 [00:12<00:00,  1.11s/it][A
Epochs:  18%|█▊        | 10/56 [17:33<1:19:18, 103.45s/it]

Val Loss: 3.4500 - Val Accuracy: 0.9663



Training:   0%|          | 0/85 [00:00<?, ?it/s][A
Training:   1%|          | 1/85 [00:04<06:26,  4.60s/it][A
Training:   2%|▏         | 2/85 [00:04<02:53,  2.09s/it][A
Training:   5%|▍         | 4/85 [00:05<01:07,  1.21it/s][A
Training:   6%|▌         | 5/85 [00:08<02:13,  1.67s/it][A
Training:   7%|▋         | 6/85 [00:09<01:41,  1.29s/it][A
Training:   8%|▊         | 7/85 [00:09<01:12,  1.08it/s][A
Training:   9%|▉         | 8/85 [00:09<00:53,  1.45it/s][A
Training:  11%|█         | 9/85 [00:12<02:01,  1.59s/it][A
Training:  12%|█▏        | 10/85 [00:13<01:31,  1.22s/it][A
Training:  14%|█▍        | 12/85 [00:13<00:49,  1.47it/s][A
Training:  15%|█▌        | 13/85 [00:16<01:39,  1.38s/it][A
Training:  16%|█▋        | 14/85 [00:17<01:16,  1.08s/it][A
Training:  18%|█▊        | 15/85 [00:17<00:57,  1.21it/s][A
Training:  19%|█▉        | 16/85 [00:17<00:43,  1.58it/s][A
Training:  20%|██        | 17/85 [00:21<01:41,  1.50s/it][A
Training:  21%|██        | 18/85 [00:21<

Epoch: 11/56 - Loss: 3.2174 - Accuracy: 0.9697



  0%|          | 0/11 [00:00<?, ?it/s][A
  9%|▉         | 1/11 [00:04<00:42,  4.28s/it][A
 18%|█▊        | 2/11 [00:04<00:17,  1.94s/it][A
 27%|██▋       | 3/11 [00:04<00:08,  1.12s/it][A
 45%|████▌     | 5/11 [00:08<00:08,  1.49s/it][A
 64%|██████▎   | 7/11 [00:08<00:03,  1.13it/s][A
 82%|████████▏ | 9/11 [00:11<00:02,  1.17s/it][A
100%|██████████| 11/11 [00:12<00:00,  1.09s/it][A
Epochs:  20%|█▉        | 11/56 [19:15<1:17:13, 102.97s/it]

Val Loss: 3.9433 - Val Accuracy: 0.9608



Training:   0%|          | 0/85 [00:00<?, ?it/s][A
Training:   1%|          | 1/85 [00:05<07:03,  5.04s/it][A
Training:   4%|▎         | 3/85 [00:05<01:50,  1.35s/it][A
Training:   6%|▌         | 5/85 [00:09<02:23,  1.80s/it][A
Training:   8%|▊         | 7/85 [00:09<01:23,  1.07s/it][A
Training:   9%|▉         | 8/85 [00:09<01:06,  1.16it/s][A
Training:  11%|█         | 9/85 [00:13<01:54,  1.50s/it][A
Training:  13%|█▎        | 11/85 [00:13<01:07,  1.09it/s][A
Training:  15%|█▌        | 13/85 [00:17<01:33,  1.30s/it][A
Training:  16%|█▋        | 14/85 [00:17<01:15,  1.07s/it][A
Training:  18%|█▊        | 15/85 [00:17<01:00,  1.15it/s][A
Training:  20%|██        | 17/85 [00:21<01:26,  1.27s/it][A
Training:  21%|██        | 18/85 [00:21<01:08,  1.03s/it][A
Training:  22%|██▏       | 19/85 [00:21<00:54,  1.22it/s][A
Training:  24%|██▎       | 20/85 [00:22<00:43,  1.51it/s][A
Training:  25%|██▍       | 21/85 [00:25<01:32,  1.44s/it][A
Training:  26%|██▌       | 22/85 [00:2

Epoch: 12/56 - Loss: 2.9845 - Accuracy: 0.9703



  0%|          | 0/11 [00:00<?, ?it/s][A
  9%|▉         | 1/11 [00:04<00:49,  4.93s/it][A
 27%|██▋       | 3/11 [00:05<00:10,  1.32s/it][A
 45%|████▌     | 5/11 [00:08<00:09,  1.64s/it][A
 55%|█████▍    | 6/11 [00:09<00:06,  1.23s/it][A
 73%|███████▎  | 8/11 [00:09<00:02,  1.38it/s][A
100%|██████████| 11/11 [00:12<00:00,  1.14s/it][A
Epochs:  21%|██▏       | 12/56 [20:58<1:15:27, 102.90s/it]

Val Loss: 3.9973 - Val Accuracy: 0.9583



Training:   0%|          | 0/85 [00:00<?, ?it/s][A
Training:   1%|          | 1/85 [00:05<07:02,  5.03s/it][A
Training:   2%|▏         | 2/85 [00:05<02:56,  2.13s/it][A
Training:   4%|▎         | 3/85 [00:05<01:40,  1.23s/it][A
Training:   6%|▌         | 5/85 [00:09<02:10,  1.63s/it][A
Training:   7%|▋         | 6/85 [00:09<01:36,  1.22s/it][A
Training:   8%|▊         | 7/85 [00:09<01:10,  1.10it/s][A
Training:  11%|█         | 9/85 [00:13<01:47,  1.41s/it][A
Training:  12%|█▏        | 10/85 [00:13<01:23,  1.11s/it][A
Training:  14%|█▍        | 12/85 [00:13<00:50,  1.45it/s][A
Training:  15%|█▌        | 13/85 [00:17<01:45,  1.46s/it][A
Training:  16%|█▋        | 14/85 [00:18<01:20,  1.13s/it][A
Training:  20%|██        | 17/85 [00:22<01:24,  1.25s/it][A
Training:  21%|██        | 18/85 [00:22<01:09,  1.03s/it][A
Training:  24%|██▎       | 20/85 [00:22<00:44,  1.46it/s][A
Training:  25%|██▍       | 21/85 [00:26<01:26,  1.36s/it][A
Training:  26%|██▌       | 22/85 [00:26

Epoch: 13/56 - Loss: 3.0535 - Accuracy: 0.9697



  0%|          | 0/11 [00:00<?, ?it/s][A
  9%|▉         | 1/11 [00:04<00:46,  4.61s/it][A
 18%|█▊        | 2/11 [00:04<00:17,  1.96s/it][A
 27%|██▋       | 3/11 [00:04<00:08,  1.11s/it][A
 45%|████▌     | 5/11 [00:08<00:08,  1.46s/it][A
 55%|█████▍    | 6/11 [00:08<00:05,  1.08s/it][A
 73%|███████▎  | 8/11 [00:08<00:01,  1.62it/s][A
 82%|████████▏ | 9/11 [00:11<00:02,  1.31s/it][A
100%|██████████| 11/11 [00:12<00:00,  1.11s/it][A
Epochs:  23%|██▎       | 13/56 [22:40<1:13:31, 102.59s/it]

Val Loss: 3.9716 - Val Accuracy: 0.9689



Training:   0%|          | 0/85 [00:00<?, ?it/s][A
Training:   1%|          | 1/85 [00:04<06:36,  4.72s/it][A
Training:   2%|▏         | 2/85 [00:04<02:46,  2.01s/it][A
Training:   5%|▍         | 4/85 [00:04<01:03,  1.27it/s][A
Training:   7%|▋         | 6/85 [00:09<01:48,  1.37s/it][A
Training:   8%|▊         | 7/85 [00:09<01:22,  1.06s/it][A
Training:  11%|█         | 9/85 [00:13<01:51,  1.47s/it][A
Training:  12%|█▏        | 10/85 [00:13<01:30,  1.20s/it][A
Training:  13%|█▎        | 11/85 [00:13<01:09,  1.07it/s][A
Training:  14%|█▍        | 12/85 [00:13<00:53,  1.36it/s][A
Training:  15%|█▌        | 13/85 [00:17<01:54,  1.59s/it][A
Training:  16%|█▋        | 14/85 [00:17<01:24,  1.18s/it][A
Training:  18%|█▊        | 15/85 [00:17<01:01,  1.13it/s][A
Training:  19%|█▉        | 16/85 [00:18<00:50,  1.37it/s][A
Training:  20%|██        | 17/85 [00:21<01:45,  1.54s/it][A
Training:  21%|██        | 18/85 [00:21<01:15,  1.12s/it][A
Training:  22%|██▏       | 19/85 [00:2

Epoch: 14/56 - Loss: 2.9985 - Accuracy: 0.9691



  0%|          | 0/11 [00:00<?, ?it/s][A
  9%|▉         | 1/11 [00:04<00:41,  4.16s/it][A
 27%|██▋       | 3/11 [00:04<00:08,  1.12s/it][A
 45%|████▌     | 5/11 [00:08<00:09,  1.52s/it][A
 55%|█████▍    | 6/11 [00:08<00:05,  1.14s/it][A
 64%|██████▎   | 7/11 [00:08<00:03,  1.16it/s][A
100%|██████████| 11/11 [00:11<00:00,  1.07s/it][A
Epochs:  25%|██▌       | 14/56 [24:22<1:11:47, 102.56s/it]

Val Loss: 3.7384 - Val Accuracy: 0.9600



Training:   0%|          | 0/85 [00:00<?, ?it/s][A
Training:   1%|          | 1/85 [00:04<06:35,  4.71s/it][A
Training:   2%|▏         | 2/85 [00:04<02:49,  2.05s/it][A
Training:   4%|▎         | 3/85 [00:05<01:35,  1.16s/it][A
Training:   5%|▍         | 4/85 [00:05<01:01,  1.32it/s][A
Training:   6%|▌         | 5/85 [00:09<02:33,  1.92s/it][A
Training:   7%|▋         | 6/85 [00:09<01:46,  1.35s/it][A
Training:   9%|▉         | 8/85 [00:09<00:56,  1.37it/s][A
Training:  11%|█         | 9/85 [00:13<01:57,  1.55s/it][A
Training:  12%|█▏        | 10/85 [00:13<01:33,  1.25s/it][A
Training:  14%|█▍        | 12/85 [00:14<00:54,  1.35it/s][A
Training:  15%|█▌        | 13/85 [00:17<01:39,  1.39s/it][A
Training:  16%|█▋        | 14/85 [00:18<01:27,  1.23s/it][A
Training:  18%|█▊        | 15/85 [00:18<01:05,  1.07it/s][A
Training:  19%|█▉        | 16/85 [00:18<00:49,  1.38it/s][A
Training:  20%|██        | 17/85 [00:21<01:37,  1.44s/it][A
Training:  21%|██        | 18/85 [00:22<

Epoch: 15/56 - Loss: 3.1162 - Accuracy: 0.9688



  0%|          | 0/11 [00:00<?, ?it/s][A
  9%|▉         | 1/11 [00:04<00:40,  4.06s/it][A
 18%|█▊        | 2/11 [00:04<00:17,  1.89s/it][A
 27%|██▋       | 3/11 [00:04<00:08,  1.08s/it][A
 45%|████▌     | 5/11 [00:07<00:08,  1.39s/it][A
 55%|█████▍    | 6/11 [00:08<00:05,  1.19s/it][A
 82%|████████▏ | 9/11 [00:11<00:02,  1.05s/it][A
100%|██████████| 11/11 [00:11<00:00,  1.08s/it][A
Epochs:  27%|██▋       | 15/56 [26:03<1:09:48, 102.16s/it]

Val Loss: 3.6848 - Val Accuracy: 0.9572



Training:   0%|          | 0/85 [00:00<?, ?it/s][A
Training:   1%|          | 1/85 [00:05<07:02,  5.04s/it][A
Training:   2%|▏         | 2/85 [00:05<03:01,  2.19s/it][A
Training:   5%|▍         | 4/85 [00:05<01:10,  1.14it/s][A
Training:   6%|▌         | 5/85 [00:09<02:27,  1.84s/it][A
Training:   7%|▋         | 6/85 [00:09<01:44,  1.33s/it][A
Training:   9%|▉         | 8/85 [00:09<00:57,  1.35it/s][A
Training:  11%|█         | 9/85 [00:13<02:01,  1.60s/it][A
Training:  13%|█▎        | 11/85 [00:14<01:10,  1.04it/s][A
Training:  15%|█▌        | 13/85 [00:18<01:36,  1.34s/it][A
Training:  16%|█▋        | 14/85 [00:18<01:17,  1.10s/it][A
Training:  18%|█▊        | 15/85 [00:18<01:00,  1.15it/s][A
Training:  20%|██        | 17/85 [00:22<01:29,  1.31s/it][A
Training:  21%|██        | 18/85 [00:22<01:09,  1.04s/it][A
Training:  22%|██▏       | 19/85 [00:22<00:54,  1.22it/s][A
Training:  25%|██▍       | 21/85 [00:26<01:23,  1.31s/it][A
Training:  26%|██▌       | 22/85 [00:26

Epoch: 16/56 - Loss: 3.0910 - Accuracy: 0.9696



  0%|          | 0/11 [00:00<?, ?it/s][A
  9%|▉         | 1/11 [00:04<00:42,  4.26s/it][A
 18%|█▊        | 2/11 [00:04<00:16,  1.84s/it][A
 27%|██▋       | 3/11 [00:04<00:08,  1.10s/it][A
 45%|████▌     | 5/11 [00:08<00:09,  1.52s/it][A
 64%|██████▎   | 7/11 [00:08<00:03,  1.14it/s][A
100%|██████████| 11/11 [00:11<00:00,  1.08s/it][A
Epochs:  29%|██▊       | 16/56 [27:45<1:08:03, 102.09s/it]

Val Loss: 3.7903 - Val Accuracy: 0.9648



Training:   0%|          | 0/85 [00:00<?, ?it/s][A
Training:   1%|          | 1/85 [00:04<06:40,  4.77s/it][A
Training:   2%|▏         | 2/85 [00:04<02:50,  2.06s/it][A
Training:   4%|▎         | 3/85 [00:05<01:36,  1.18s/it][A
Training:   5%|▍         | 4/85 [00:05<01:02,  1.29it/s][A
Training:   6%|▌         | 5/85 [00:09<02:35,  1.94s/it][A
Training:   7%|▋         | 6/85 [00:09<01:45,  1.34s/it][A
Training:   8%|▊         | 7/85 [00:09<01:16,  1.01it/s][A
Training:  11%|█         | 9/85 [00:13<01:52,  1.48s/it][A
Training:  12%|█▏        | 10/85 [00:13<01:25,  1.13s/it][A
Training:  14%|█▍        | 12/85 [00:13<00:50,  1.46it/s][A
Training:  15%|█▌        | 13/85 [00:17<01:41,  1.41s/it][A
Training:  18%|█▊        | 15/85 [00:17<01:02,  1.12it/s][A
Training:  19%|█▉        | 16/85 [00:18<00:50,  1.36it/s][A
Training:  20%|██        | 17/85 [00:21<01:39,  1.46s/it][A
Training:  21%|██        | 18/85 [00:22<01:14,  1.12s/it][A
Training:  24%|██▎       | 20/85 [00:22<

Epoch: 17/56 - Loss: 3.0979 - Accuracy: 0.9696



  0%|          | 0/11 [00:00<?, ?it/s][A
  9%|▉         | 1/11 [00:04<00:44,  4.50s/it][A
 18%|█▊        | 2/11 [00:04<00:17,  1.94s/it][A
 36%|███▋      | 4/11 [00:04<00:05,  1.27it/s][A
 45%|████▌     | 5/11 [00:08<00:09,  1.55s/it][A
 55%|█████▍    | 6/11 [00:08<00:05,  1.18s/it][A
 82%|████████▏ | 9/11 [00:11<00:02,  1.08s/it][A
100%|██████████| 11/11 [00:11<00:00,  1.09s/it][A
Epochs:  30%|███       | 17/56 [29:27<1:06:12, 101.86s/it]

Val Loss: 4.4741 - Val Accuracy: 0.9550



Training:   0%|          | 0/85 [00:00<?, ?it/s][A
Training:   1%|          | 1/85 [00:04<06:55,  4.94s/it][A
Training:   2%|▏         | 2/85 [00:05<03:02,  2.20s/it][A
Training:   5%|▍         | 4/85 [00:05<01:08,  1.17it/s][A
Training:   7%|▋         | 6/85 [00:09<01:55,  1.47s/it][A
Training:   9%|▉         | 8/85 [00:09<01:11,  1.08it/s][A
Training:  11%|█         | 9/85 [00:13<02:00,  1.58s/it][A
Training:  13%|█▎        | 11/85 [00:14<01:15,  1.02s/it][A
Training:  14%|█▍        | 12/85 [00:14<01:01,  1.19it/s][A
Training:  15%|█▌        | 13/85 [00:17<01:48,  1.51s/it][A
Training:  16%|█▋        | 14/85 [00:18<01:24,  1.19s/it][A
Training:  19%|█▉        | 16/85 [00:18<00:50,  1.37it/s][A
Training:  20%|██        | 17/85 [00:22<01:40,  1.48s/it][A
Training:  22%|██▏       | 19/85 [00:22<01:00,  1.09it/s][A
Training:  24%|██▎       | 20/85 [00:22<00:48,  1.34it/s][A
Training:  25%|██▍       | 21/85 [00:26<01:34,  1.47s/it][A
Training:  26%|██▌       | 22/85 [00:2

Epoch: 18/56 - Loss: 3.1852 - Accuracy: 0.9690



  0%|          | 0/11 [00:00<?, ?it/s][A
  9%|▉         | 1/11 [00:04<00:42,  4.26s/it][A
 18%|█▊        | 2/11 [00:04<00:16,  1.88s/it][A
 36%|███▋      | 4/11 [00:04<00:05,  1.34it/s][A
 45%|████▌     | 5/11 [00:07<00:08,  1.48s/it][A
 55%|█████▍    | 6/11 [00:08<00:05,  1.12s/it][A
 64%|██████▎   | 7/11 [00:08<00:03,  1.22it/s][A
 82%|████████▏ | 9/11 [00:11<00:02,  1.13s/it][A
100%|██████████| 11/11 [00:11<00:00,  1.07s/it][A
Epochs:  32%|███▏      | 18/56 [31:09<1:04:34, 101.97s/it]

Val Loss: 4.0388 - Val Accuracy: 0.9586



Training:   0%|          | 0/85 [00:00<?, ?it/s][A
Training:   1%|          | 1/85 [00:05<07:10,  5.13s/it][A
Training:   4%|▎         | 3/85 [00:05<01:53,  1.39s/it][A
Training:   6%|▌         | 5/85 [00:09<02:22,  1.78s/it][A
Training:   8%|▊         | 7/85 [00:09<01:21,  1.05s/it][A
Training:  11%|█         | 9/85 [00:13<01:50,  1.46s/it][A
Training:  13%|█▎        | 11/85 [00:14<01:11,  1.03it/s][A
Training:  15%|█▌        | 13/85 [00:18<01:37,  1.35s/it][A
Training:  18%|█▊        | 15/85 [00:18<01:05,  1.06it/s][A
Training:  20%|██        | 17/85 [00:22<01:27,  1.29s/it][A
Training:  24%|██▎       | 20/85 [00:22<00:51,  1.26it/s][A
Training:  26%|██▌       | 22/85 [00:26<01:11,  1.13s/it][A
Training:  27%|██▋       | 23/85 [00:26<00:59,  1.04it/s][A
Training:  29%|██▉       | 25/85 [00:30<01:13,  1.22s/it][A
Training:  32%|███▏      | 27/85 [00:30<00:49,  1.16it/s][A
Training:  34%|███▍      | 29/85 [00:34<01:07,  1.21s/it][A
Training:  36%|███▋      | 31/85 [00:

Epoch: 19/56 - Loss: 3.0047 - Accuracy: 0.9703



  0%|          | 0/11 [00:00<?, ?it/s][A
  9%|▉         | 1/11 [00:04<00:40,  4.07s/it][A
 18%|█▊        | 2/11 [00:04<00:15,  1.76s/it][A
 27%|██▋       | 3/11 [00:04<00:08,  1.01s/it][A
 36%|███▋      | 4/11 [00:04<00:04,  1.50it/s][A
 45%|████▌     | 5/11 [00:08<00:10,  1.73s/it][A
 55%|█████▍    | 6/11 [00:08<00:05,  1.18s/it][A
100%|██████████| 11/11 [00:12<00:00,  1.11s/it][A
Epochs:  34%|███▍      | 19/56 [32:52<1:03:02, 102.22s/it]

Val Loss: 3.9499 - Val Accuracy: 0.9657



Training:   0%|          | 0/85 [00:00<?, ?it/s][A
Training:   1%|          | 1/85 [00:04<06:29,  4.64s/it][A
Training:   2%|▏         | 2/85 [00:05<02:58,  2.16s/it][A
Training:   5%|▍         | 4/85 [00:05<01:08,  1.18it/s][A
Training:   6%|▌         | 5/85 [00:09<02:25,  1.82s/it][A
Training:   7%|▋         | 6/85 [00:09<01:43,  1.31s/it][A
Training:   8%|▊         | 7/85 [00:09<01:14,  1.05it/s][A
Training:  11%|█         | 9/85 [00:13<01:53,  1.49s/it][A
Training:  12%|█▏        | 10/85 [00:13<01:26,  1.15s/it][A
Training:  14%|█▍        | 12/85 [00:14<00:51,  1.41it/s][A
Training:  15%|█▌        | 13/85 [00:17<01:42,  1.43s/it][A
Training:  16%|█▋        | 14/85 [00:18<01:19,  1.11s/it][A
Training:  19%|█▉        | 16/85 [00:18<00:47,  1.47it/s][A
Training:  20%|██        | 17/85 [00:22<01:36,  1.42s/it][A
Training:  21%|██        | 18/85 [00:22<01:14,  1.11s/it][A
Training:  22%|██▏       | 19/85 [00:22<00:56,  1.18it/s][A
Training:  24%|██▎       | 20/85 [00:22

Epoch: 20/56 - Loss: 2.9199 - Accuracy: 0.9722



  0%|          | 0/11 [00:00<?, ?it/s][A
  9%|▉         | 1/11 [00:04<00:44,  4.44s/it][A
 18%|█▊        | 2/11 [00:04<00:17,  1.92s/it][A
 36%|███▋      | 4/11 [00:04<00:05,  1.31it/s][A
 45%|████▌     | 5/11 [00:08<00:10,  1.70s/it][A
 55%|█████▍    | 6/11 [00:08<00:06,  1.27s/it][A
 73%|███████▎  | 8/11 [00:08<00:02,  1.41it/s][A
 82%|████████▏ | 9/11 [00:11<00:02,  1.29s/it][A
100%|██████████| 11/11 [00:12<00:00,  1.13s/it][A
Epochs:  36%|███▌      | 20/56 [34:34<1:01:22, 102.28s/it]

Val Loss: 3.7054 - Val Accuracy: 0.9584



Training:   0%|          | 0/85 [00:00<?, ?it/s][A
Training:   1%|          | 1/85 [00:04<06:53,  4.93s/it][A
Training:   2%|▏         | 2/85 [00:05<02:55,  2.12s/it][A
Training:   4%|▎         | 3/85 [00:05<01:41,  1.24s/it][A
Training:   5%|▍         | 4/85 [00:05<01:05,  1.24it/s][A
Training:   6%|▌         | 5/85 [00:09<02:33,  1.92s/it][A
Training:   7%|▋         | 6/85 [00:09<01:44,  1.33s/it][A
Training:   8%|▊         | 7/85 [00:09<01:20,  1.03s/it][A
Training:  11%|█         | 9/85 [00:13<01:51,  1.46s/it][A
Training:  13%|█▎        | 11/85 [00:14<01:10,  1.05it/s][A
Training:  14%|█▍        | 12/85 [00:14<00:56,  1.30it/s][A
Training:  15%|█▌        | 13/85 [00:18<01:49,  1.53s/it][A
Training:  18%|█▊        | 15/85 [00:18<01:08,  1.02it/s][A
Training:  20%|██        | 17/85 [00:22<01:25,  1.26s/it][A
Training:  21%|██        | 18/85 [00:22<01:08,  1.02s/it][A
Training:  22%|██▏       | 19/85 [00:22<00:55,  1.20it/s][A
Training:  25%|██▍       | 21/85 [00:26<

Epoch: 21/56 - Loss: 2.9102 - Accuracy: 0.9729



  0%|          | 0/11 [00:00<?, ?it/s][A
  9%|▉         | 1/11 [00:04<00:41,  4.16s/it][A
 18%|█▊        | 2/11 [00:04<00:16,  1.83s/it][A
 36%|███▋      | 4/11 [00:04<00:05,  1.37it/s][A
 45%|████▌     | 5/11 [00:08<00:09,  1.62s/it][A
 64%|██████▎   | 7/11 [00:08<00:03,  1.11it/s][A
100%|██████████| 11/11 [00:11<00:00,  1.07s/it][A
Epochs:  38%|███▊      | 21/56 [36:16<59:31, 102.05s/it]  

Val Loss: 3.8008 - Val Accuracy: 0.9615



Training:   0%|          | 0/85 [00:00<?, ?it/s][A
Training:   1%|          | 1/85 [00:04<06:49,  4.88s/it][A
Training:   2%|▏         | 2/85 [00:04<02:51,  2.07s/it][A
Training:   6%|▌         | 5/85 [00:09<02:07,  1.59s/it][A
Training:   8%|▊         | 7/85 [00:09<01:15,  1.03it/s][A
Training:  11%|█         | 9/85 [00:13<01:51,  1.46s/it][A
Training:  12%|█▏        | 10/85 [00:14<01:28,  1.18s/it][A
Training:  14%|█▍        | 12/85 [00:14<00:55,  1.31it/s][A
Training:  16%|█▋        | 14/85 [00:18<01:23,  1.18s/it][A
Training:  19%|█▉        | 16/85 [00:18<00:55,  1.24it/s][A
Training:  21%|██        | 18/85 [00:21<01:12,  1.08s/it][A
Training:  24%|██▎       | 20/85 [00:21<00:49,  1.32it/s][A
Training:  26%|██▌       | 22/85 [00:25<01:13,  1.17s/it][A
Training:  28%|██▊       | 24/85 [00:25<00:50,  1.21it/s][A
Training:  31%|███       | 26/85 [00:30<01:11,  1.20s/it][A
Training:  33%|███▎      | 28/85 [00:30<00:49,  1.16it/s][A
Training:  34%|███▍      | 29/85 [00:

Epoch: 22/56 - Loss: 2.9200 - Accuracy: 0.9716



  0%|          | 0/11 [00:00<?, ?it/s][A
  9%|▉         | 1/11 [00:04<00:40,  4.02s/it][A
 27%|██▋       | 3/11 [00:04<00:08,  1.12s/it][A
 36%|███▋      | 4/11 [00:04<00:05,  1.28it/s][A
 45%|████▌     | 5/11 [00:08<00:10,  1.72s/it][A
 64%|██████▎   | 7/11 [00:08<00:03,  1.08it/s][A
 82%|████████▏ | 9/11 [00:11<00:02,  1.22s/it][A
100%|██████████| 11/11 [00:11<00:00,  1.07s/it][A
Epochs:  39%|███▉      | 22/56 [37:55<57:26, 101.37s/it]

Val Loss: 3.7351 - Val Accuracy: 0.9663



Training:   0%|          | 0/85 [00:00<?, ?it/s][A
Training:   1%|          | 1/85 [00:04<06:45,  4.83s/it][A
Training:   2%|▏         | 2/85 [00:05<03:03,  2.21s/it][A
Training:   5%|▍         | 4/85 [00:05<01:10,  1.15it/s][A
Training:   6%|▌         | 5/85 [00:09<02:25,  1.82s/it][A
Training:   7%|▋         | 6/85 [00:09<01:46,  1.35s/it][A
Training:   8%|▊         | 7/85 [00:09<01:17,  1.00it/s][A
Training:  11%|█         | 9/85 [00:13<01:52,  1.48s/it][A
Training:  12%|█▏        | 10/85 [00:14<01:28,  1.18s/it][A
Training:  14%|█▍        | 12/85 [00:14<00:52,  1.39it/s][A
Training:  15%|█▌        | 13/85 [00:18<01:44,  1.45s/it][A
Training:  16%|█▋        | 14/85 [00:18<01:20,  1.13s/it][A
Training:  18%|█▊        | 15/85 [00:18<01:00,  1.16it/s][A
Training:  19%|█▉        | 16/85 [00:18<00:45,  1.50it/s][A
Training:  20%|██        | 17/85 [00:22<01:40,  1.48s/it][A
Training:  21%|██        | 18/85 [00:22<01:13,  1.09s/it][A
Training:  22%|██▏       | 19/85 [00:22

Epoch: 23/56 - Loss: 2.9621 - Accuracy: 0.9700



  0%|          | 0/11 [00:00<?, ?it/s][A
  9%|▉         | 1/11 [00:03<00:39,  3.92s/it][A
 27%|██▋       | 3/11 [00:04<00:08,  1.08s/it][A
 36%|███▋      | 4/11 [00:04<00:05,  1.31it/s][A
 45%|████▌     | 5/11 [00:07<00:09,  1.66s/it][A
 64%|██████▎   | 7/11 [00:07<00:03,  1.14it/s][A
100%|██████████| 11/11 [00:11<00:00,  1.06s/it][A
Epochs:  41%|████      | 23/56 [39:38<55:53, 101.62s/it]

Val Loss: 3.8218 - Val Accuracy: 0.9619



Training:   0%|          | 0/85 [00:00<?, ?it/s][A
Training:   1%|          | 1/85 [00:04<06:47,  4.85s/it][A
Training:   2%|▏         | 2/85 [00:05<02:58,  2.15s/it][A
Training:   6%|▌         | 5/85 [00:09<02:12,  1.66s/it][A
Training:   7%|▋         | 6/85 [00:09<01:40,  1.27s/it][A
Training:   9%|▉         | 8/85 [00:09<00:58,  1.31it/s][A
Training:  11%|█         | 9/85 [00:13<01:58,  1.56s/it][A
Training:  12%|█▏        | 10/85 [00:14<01:31,  1.22s/it][A
Training:  13%|█▎        | 11/85 [00:14<01:08,  1.07it/s][A
Training:  14%|█▍        | 12/85 [00:14<00:52,  1.40it/s][A
Training:  15%|█▌        | 13/85 [00:18<01:49,  1.52s/it][A
Training:  18%|█▊        | 15/85 [00:18<01:01,  1.14it/s][A
Training:  20%|██        | 17/85 [00:22<01:27,  1.29s/it][A
Training:  22%|██▏       | 19/85 [00:22<00:57,  1.15it/s][A
Training:  25%|██▍       | 21/85 [00:26<01:17,  1.22s/it][A
Training:  27%|██▋       | 23/85 [00:26<00:52,  1.18it/s][A
Training:  29%|██▉       | 25/85 [00:2

Epoch: 24/56 - Loss: 2.9673 - Accuracy: 0.9710



  0%|          | 0/11 [00:00<?, ?it/s][A
  9%|▉         | 1/11 [00:03<00:37,  3.80s/it][A
 18%|█▊        | 2/11 [00:03<00:14,  1.66s/it][A
 36%|███▋      | 4/11 [00:04<00:04,  1.51it/s][A
 45%|████▌     | 5/11 [00:07<00:08,  1.48s/it][A
 55%|█████▍    | 6/11 [00:07<00:05,  1.10s/it][A
 64%|██████▎   | 7/11 [00:07<00:03,  1.22it/s][A
 82%|████████▏ | 9/11 [00:10<00:02,  1.16s/it][A
100%|██████████| 11/11 [00:11<00:00,  1.03s/it][A
Epochs:  43%|████▎     | 24/56 [41:19<54:08, 101.52s/it]

Val Loss: 4.0196 - Val Accuracy: 0.9600



Training:   0%|          | 0/85 [00:00<?, ?it/s][A
Training:   1%|          | 1/85 [00:05<07:00,  5.00s/it][A
Training:   2%|▏         | 2/85 [00:05<03:00,  2.17s/it][A
Training:   4%|▎         | 3/85 [00:05<01:42,  1.25s/it][A
Training:   5%|▍         | 4/85 [00:05<01:04,  1.26it/s][A
Training:   6%|▌         | 5/85 [00:09<02:35,  1.94s/it][A
Training:   7%|▋         | 6/85 [00:09<01:46,  1.34s/it][A
Training:   8%|▊         | 7/85 [00:09<01:15,  1.03it/s][A
Training:  11%|█         | 9/85 [00:13<01:51,  1.47s/it][A
Training:  12%|█▏        | 10/85 [00:13<01:24,  1.12s/it][A
Training:  13%|█▎        | 11/85 [00:14<01:03,  1.17it/s][A
Training:  15%|█▌        | 13/85 [00:17<01:31,  1.27s/it][A
Training:  16%|█▋        | 14/85 [00:17<01:10,  1.00it/s][A
Training:  19%|█▉        | 16/85 [00:17<00:43,  1.58it/s][A
Training:  20%|██        | 17/85 [00:21<01:33,  1.38s/it][A
Training:  21%|██        | 18/85 [00:22<01:12,  1.09s/it][A
Training:  22%|██▏       | 19/85 [00:22<

Epoch: 25/56 - Loss: 2.8887 - Accuracy: 0.9728



  0%|          | 0/11 [00:00<?, ?it/s][A
  9%|▉         | 1/11 [00:04<00:43,  4.33s/it][A
 27%|██▋       | 3/11 [00:04<00:09,  1.20s/it][A
 45%|████▌     | 5/11 [00:07<00:08,  1.43s/it][A
 55%|█████▍    | 6/11 [00:08<00:05,  1.14s/it][A
 73%|███████▎  | 8/11 [00:08<00:02,  1.46it/s][A
 82%|████████▏ | 9/11 [00:11<00:02,  1.25s/it][A
100%|██████████| 11/11 [00:11<00:00,  1.09s/it][A
Epochs:  45%|████▍     | 25/56 [43:00<52:25, 101.48s/it]

Val Loss: 3.9572 - Val Accuracy: 0.9584



Training:   0%|          | 0/85 [00:00<?, ?it/s][A
Training:   1%|          | 1/85 [00:04<06:44,  4.82s/it][A
Training:   2%|▏         | 2/85 [00:05<03:14,  2.34s/it][A
Training:   4%|▎         | 3/85 [00:05<01:50,  1.34s/it][A
Training:   6%|▌         | 5/85 [00:08<02:03,  1.55s/it][A
Training:   7%|▋         | 6/85 [00:09<01:46,  1.35s/it][A
Training:   8%|▊         | 7/85 [00:10<01:17,  1.00it/s][A
Training:  11%|█         | 9/85 [00:13<01:39,  1.31s/it][A
Training:  12%|█▏        | 10/85 [00:14<01:26,  1.16s/it][A
Training:  14%|█▍        | 12/85 [00:14<00:52,  1.39it/s][A
Training:  15%|█▌        | 13/85 [00:17<01:27,  1.22s/it][A
Training:  16%|█▋        | 14/85 [00:17<01:19,  1.13s/it][A
Training:  18%|█▊        | 15/85 [00:18<01:00,  1.16it/s][A
Training:  20%|██        | 17/85 [00:21<01:18,  1.16s/it][A
Training:  21%|██        | 18/85 [00:22<01:17,  1.15s/it][A
Training:  22%|██▏       | 19/85 [00:22<01:00,  1.10it/s][A
Training:  24%|██▎       | 20/85 [00:22

Epoch: 26/56 - Loss: 2.8681 - Accuracy: 0.9721



  0%|          | 0/11 [00:00<?, ?it/s][A
  9%|▉         | 1/11 [00:04<00:43,  4.38s/it][A
 27%|██▋       | 3/11 [00:04<00:09,  1.24s/it][A
 45%|████▌     | 5/11 [00:08<00:10,  1.67s/it][A
 55%|█████▍    | 6/11 [00:08<00:06,  1.27s/it][A
 64%|██████▎   | 7/11 [00:09<00:03,  1.05it/s][A
 82%|████████▏ | 9/11 [00:13<00:02,  1.39s/it][A
100%|██████████| 11/11 [00:13<00:00,  1.21s/it][A
Epochs:  46%|████▋     | 26/56 [44:44<51:00, 102.03s/it]

Val Loss: 3.6048 - Val Accuracy: 0.9589



Training:   0%|          | 0/85 [00:00<?, ?it/s][A
Training:   1%|          | 1/85 [00:06<08:51,  6.33s/it][A
Training:   2%|▏         | 2/85 [00:06<03:46,  2.73s/it][A
Training:   4%|▎         | 3/85 [00:06<02:06,  1.54s/it][A
Training:   6%|▌         | 5/85 [00:12<03:00,  2.25s/it][A
Training:   7%|▋         | 6/85 [00:12<02:10,  1.65s/it][A
Training:   8%|▊         | 7/85 [00:12<01:35,  1.23s/it][A
Training:   9%|▉         | 8/85 [00:12<01:11,  1.07it/s][A
Training:  11%|█         | 9/85 [00:17<02:37,  2.07s/it][A
Training:  12%|█▏        | 10/85 [00:18<02:01,  1.62s/it][A
Training:  13%|█▎        | 11/85 [00:18<01:27,  1.18s/it][A
Training:  14%|█▍        | 12/85 [00:18<01:03,  1.15it/s][A
Training:  15%|█▌        | 13/85 [00:22<02:16,  1.89s/it][A
Training:  16%|█▋        | 14/85 [00:23<01:44,  1.47s/it][A
Training:  18%|█▊        | 15/85 [00:23<01:14,  1.07s/it][A
Training:  20%|██        | 17/85 [00:27<01:49,  1.61s/it][A
Training:  21%|██        | 18/85 [00:27<

Epoch: 27/56 - Loss: 2.9867 - Accuracy: 0.9725



  0%|          | 0/11 [00:00<?, ?it/s][A
  9%|▉         | 1/11 [00:04<00:41,  4.14s/it][A
 27%|██▋       | 3/11 [00:04<00:09,  1.13s/it][A
 45%|████▌     | 5/11 [00:07<00:08,  1.45s/it][A
 64%|██████▎   | 7/11 [00:07<00:03,  1.17it/s][A
100%|██████████| 11/11 [00:11<00:00,  1.07s/it][A
Epochs:  48%|████▊     | 27/56 [46:37<51:00, 105.54s/it]

Val Loss: 4.0816 - Val Accuracy: 0.9644



Training:   0%|          | 0/85 [00:00<?, ?it/s][A
Training:   1%|          | 1/85 [00:04<06:49,  4.88s/it][A
Training:   2%|▏         | 2/85 [00:05<03:04,  2.22s/it][A
Training:   4%|▎         | 3/85 [00:05<01:43,  1.27s/it][A
Training:   6%|▌         | 5/85 [00:09<02:13,  1.67s/it][A
Training:   7%|▋         | 6/85 [00:09<01:38,  1.25s/it][A
Training:   8%|▊         | 7/85 [00:09<01:13,  1.06it/s][A
Training:  11%|█         | 9/85 [00:13<01:48,  1.43s/it][A
Training:  12%|█▏        | 10/85 [00:14<01:29,  1.19s/it][A
Training:  14%|█▍        | 12/85 [00:14<00:52,  1.38it/s][A
Training:  15%|█▌        | 13/85 [00:17<01:36,  1.34s/it][A
Training:  16%|█▋        | 14/85 [00:18<01:21,  1.15s/it][A
Training:  19%|█▉        | 16/85 [00:18<00:48,  1.42it/s][A
Training:  20%|██        | 17/85 [00:21<01:26,  1.27s/it][A
Training:  21%|██        | 18/85 [00:22<01:14,  1.10s/it][A
Training:  22%|██▏       | 19/85 [00:22<00:56,  1.17it/s][A
Training:  24%|██▎       | 20/85 [00:22

Epoch: 28/56 - Loss: 2.7939 - Accuracy: 0.9720



  0%|          | 0/11 [00:00<?, ?it/s][A
  9%|▉         | 1/11 [00:04<00:47,  4.73s/it][A
 18%|█▊        | 2/11 [00:04<00:18,  2.01s/it][A
 36%|███▋      | 4/11 [00:04<00:05,  1.28it/s][A
 55%|█████▍    | 6/11 [00:08<00:05,  1.18s/it][A
 73%|███████▎  | 8/11 [00:08<00:02,  1.35it/s][A
100%|██████████| 11/11 [00:11<00:00,  1.06s/it][A
Epochs:  50%|█████     | 28/56 [48:19<48:41, 104.32s/it]

Val Loss: 4.5304 - Val Accuracy: 0.9485



Training:   0%|          | 0/85 [00:00<?, ?it/s][A
Training:   1%|          | 1/85 [00:04<06:38,  4.75s/it][A
Training:   4%|▎         | 3/85 [00:04<01:46,  1.29s/it][A
Training:   6%|▌         | 5/85 [00:09<02:19,  1.74s/it][A
Training:   8%|▊         | 7/85 [00:09<01:21,  1.04s/it][A
Training:   9%|▉         | 8/85 [00:09<01:03,  1.20it/s][A
Training:  11%|█         | 9/85 [00:13<02:04,  1.64s/it][A
Training:  12%|█▏        | 10/85 [00:13<01:32,  1.24s/it][A
Training:  13%|█▎        | 11/85 [00:13<01:09,  1.07it/s][A
Training:  15%|█▌        | 13/85 [00:17<01:41,  1.41s/it][A
Training:  16%|█▋        | 14/85 [00:18<01:18,  1.10s/it][A
Training:  19%|█▉        | 16/85 [00:18<00:46,  1.47it/s][A
Training:  20%|██        | 17/85 [00:21<01:32,  1.36s/it][A
Training:  22%|██▏       | 19/85 [00:22<00:56,  1.16it/s][A
Training:  25%|██▍       | 21/85 [00:26<01:23,  1.31s/it][A
Training:  27%|██▋       | 23/85 [00:26<00:55,  1.13it/s][A
Training:  29%|██▉       | 25/85 [00:3

Epoch: 29/56 - Loss: 3.0232 - Accuracy: 0.9726



  0%|          | 0/11 [00:00<?, ?it/s][A
  9%|▉         | 1/11 [00:04<00:47,  4.70s/it][A
 36%|███▋      | 4/11 [00:04<00:06,  1.08it/s][A
 55%|█████▍    | 6/11 [00:08<00:06,  1.25s/it][A
 82%|████████▏ | 9/11 [00:11<00:02,  1.25s/it][A
100%|██████████| 11/11 [00:12<00:00,  1.11s/it][A
Epochs:  52%|█████▏    | 29/56 [50:03<46:53, 104.22s/it]

Val Loss: 3.7206 - Val Accuracy: 0.9631



Training:   0%|          | 0/85 [00:00<?, ?it/s][A
Training:   1%|          | 1/85 [00:05<07:15,  5.18s/it][A
Training:   4%|▎         | 3/85 [00:05<01:53,  1.39s/it][A
Training:   6%|▌         | 5/85 [00:09<02:26,  1.83s/it][A
Training:   7%|▋         | 6/85 [00:09<01:48,  1.38s/it][A
Training:   8%|▊         | 7/85 [00:10<01:20,  1.03s/it][A
Training:  11%|█         | 9/85 [00:14<01:56,  1.53s/it][A
Training:  13%|█▎        | 11/85 [00:14<01:11,  1.04it/s][A
Training:  14%|█▍        | 12/85 [00:14<00:56,  1.29it/s][A
Training:  15%|█▌        | 13/85 [00:18<01:52,  1.56s/it][A
Training:  16%|█▋        | 14/85 [00:18<01:26,  1.21s/it][A
Training:  18%|█▊        | 15/85 [00:19<01:04,  1.08it/s][A
Training:  20%|██        | 17/85 [00:22<01:26,  1.27s/it][A
Training:  21%|██        | 18/85 [00:22<01:08,  1.02s/it][A
Training:  24%|██▎       | 20/85 [00:23<00:45,  1.44it/s][A
Training:  25%|██▍       | 21/85 [00:26<01:27,  1.36s/it][A
Training:  27%|██▋       | 23/85 [00:2

Epoch: 30/56 - Loss: 2.9840 - Accuracy: 0.9716



  0%|          | 0/11 [00:00<?, ?it/s][A
  9%|▉         | 1/11 [00:06<01:08,  6.86s/it][A
 18%|█▊        | 2/11 [00:07<00:26,  2.94s/it][A
 36%|███▋      | 4/11 [00:07<00:08,  1.15s/it][A
 45%|████▌     | 5/11 [00:11<00:13,  2.26s/it][A
 64%|██████▎   | 7/11 [00:12<00:05,  1.26s/it][A
 73%|███████▎  | 8/11 [00:12<00:02,  1.02it/s][A
 82%|████████▏ | 9/11 [00:16<00:03,  1.90s/it][A
 91%|█████████ | 10/11 [00:17<00:01,  1.43s/it][A
100%|██████████| 11/11 [00:17<00:00,  1.58s/it][A
Epochs:  54%|█████▎    | 30/56 [52:14<48:43, 112.45s/it]

Val Loss: 3.6398 - Val Accuracy: 0.9622



Training:   0%|          | 0/85 [00:00<?, ?it/s][A
Training:   1%|          | 1/85 [00:07<10:23,  7.42s/it][A
Training:   2%|▏         | 2/85 [00:07<04:27,  3.22s/it][A
Training:   4%|▎         | 3/85 [00:07<02:31,  1.85s/it][A
Training:   5%|▍         | 4/85 [00:08<01:39,  1.23s/it][A
Training:   6%|▌         | 5/85 [00:13<03:45,  2.82s/it][A
Training:   7%|▋         | 6/85 [00:14<02:49,  2.15s/it][A
Training:   8%|▊         | 7/85 [00:14<01:58,  1.52s/it][A
Training:   9%|▉         | 8/85 [00:15<01:23,  1.09s/it][A
Training:  11%|█         | 9/85 [00:20<02:56,  2.33s/it][A
Training:  12%|█▏        | 10/85 [00:20<02:19,  1.87s/it][A
Training:  13%|█▎        | 11/85 [00:21<01:40,  1.35s/it][A
Training:  15%|█▌        | 13/85 [00:26<02:14,  1.86s/it][A
Training:  16%|█▋        | 14/85 [00:27<01:57,  1.66s/it][A
Training:  18%|█▊        | 15/85 [00:27<01:27,  1.25s/it][A
Training:  19%|█▉        | 16/85 [00:27<01:06,  1.04it/s][A
Training:  20%|██        | 17/85 [00:32<0

Epoch: 31/56 - Loss: 2.8839 - Accuracy: 0.9726



  0%|          | 0/11 [00:00<?, ?it/s][A
  9%|▉         | 1/11 [00:06<01:07,  6.76s/it][A
 18%|█▊        | 2/11 [00:06<00:25,  2.86s/it][A
 27%|██▋       | 3/11 [00:07<00:13,  1.65s/it][A
 36%|███▋      | 4/11 [00:07<00:08,  1.17s/it][A
 45%|████▌     | 5/11 [00:12<00:14,  2.37s/it][A
 55%|█████▍    | 6/11 [00:12<00:08,  1.64s/it][A
 64%|██████▎   | 7/11 [00:12<00:04,  1.15s/it][A
 73%|███████▎  | 8/11 [00:12<00:02,  1.17it/s][A
 82%|████████▏ | 9/11 [00:16<00:03,  1.92s/it][A
100%|██████████| 11/11 [00:17<00:00,  1.56s/it][A
Epochs:  55%|█████▌    | 31/56 [54:42<51:13, 122.93s/it]

Val Loss: 4.0470 - Val Accuracy: 0.9620



Training:   0%|          | 0/85 [00:00<?, ?it/s][A
Training:   1%|          | 1/85 [00:07<10:42,  7.64s/it][A
Training:   2%|▏         | 2/85 [00:07<04:31,  3.27s/it][A
Training:   4%|▎         | 3/85 [00:07<02:29,  1.83s/it][A
Training:   6%|▌         | 5/85 [00:13<03:12,  2.41s/it][A
Training:   7%|▋         | 6/85 [00:14<02:23,  1.82s/it][A
Training:   8%|▊         | 7/85 [00:14<01:43,  1.33s/it][A
Training:   9%|▉         | 8/85 [00:14<01:17,  1.00s/it][A
Training:  11%|█         | 9/85 [00:19<02:59,  2.36s/it][A
Training:  12%|█▏        | 10/85 [00:20<02:11,  1.76s/it][A
Training:  13%|█▎        | 11/85 [00:20<01:36,  1.30s/it][A
Training:  14%|█▍        | 12/85 [00:20<01:11,  1.02it/s][A
Training:  15%|█▌        | 13/85 [00:26<02:46,  2.31s/it][A
Training:  16%|█▋        | 14/85 [00:26<01:57,  1.66s/it][A
Training:  19%|█▉        | 16/85 [00:26<01:06,  1.04it/s][A
Training:  20%|██        | 17/85 [00:31<02:19,  2.05s/it][A
Training:  21%|██        | 18/85 [00:32<

Epoch: 32/56 - Loss: 2.9266 - Accuracy: 0.9729



  0%|          | 0/11 [00:00<?, ?it/s][A
  9%|▉         | 1/11 [00:06<01:03,  6.33s/it][A
 18%|█▊        | 2/11 [00:06<00:24,  2.77s/it][A
 27%|██▋       | 3/11 [00:06<00:12,  1.58s/it][A
 36%|███▋      | 4/11 [00:06<00:07,  1.03s/it][A
 45%|████▌     | 5/11 [00:11<00:14,  2.39s/it][A
 55%|█████▍    | 6/11 [00:11<00:08,  1.65s/it][A
 64%|██████▎   | 7/11 [00:12<00:04,  1.18s/it][A
 73%|███████▎  | 8/11 [00:12<00:02,  1.17it/s][A
 82%|████████▏ | 9/11 [00:16<00:03,  1.91s/it][A
100%|██████████| 11/11 [00:17<00:00,  1.55s/it][A
Epochs:  57%|█████▋    | 32/56 [57:10<52:12, 130.53s/it]

Val Loss: 3.9127 - Val Accuracy: 0.9620



Training:   0%|          | 0/85 [00:00<?, ?it/s][A
Training:   1%|          | 1/85 [00:07<10:13,  7.30s/it][A
Training:   2%|▏         | 2/85 [00:07<04:30,  3.26s/it][A
Training:   4%|▎         | 3/85 [00:07<02:34,  1.88s/it][A
Training:   5%|▍         | 4/85 [00:08<01:37,  1.21s/it][A
Training:   6%|▌         | 5/85 [00:13<03:41,  2.77s/it][A
Training:   7%|▋         | 6/85 [00:13<02:30,  1.91s/it][A
Training:   8%|▊         | 7/85 [00:14<01:43,  1.33s/it][A
Training:   9%|▉         | 8/85 [00:14<01:12,  1.06it/s][A
Training:  11%|█         | 9/85 [00:19<03:07,  2.46s/it][A
Training:  12%|█▏        | 10/85 [00:20<02:21,  1.88s/it][A
Training:  13%|█▎        | 11/85 [00:20<01:42,  1.38s/it][A
Training:  14%|█▍        | 12/85 [00:21<01:14,  1.02s/it][A
Training:  15%|█▌        | 13/85 [00:26<02:45,  2.30s/it][A
Training:  16%|█▋        | 14/85 [00:26<02:07,  1.79s/it][A
Training:  18%|█▊        | 15/85 [00:27<01:32,  1.33s/it][A
Training:  19%|█▉        | 16/85 [00:27<0

Epoch: 33/56 - Loss: 2.8696 - Accuracy: 0.9729



  0%|          | 0/11 [00:00<?, ?it/s][A
  9%|▉         | 1/11 [00:06<01:03,  6.39s/it][A
 18%|█▊        | 2/11 [00:06<00:24,  2.70s/it][A
 27%|██▋       | 3/11 [00:06<00:12,  1.53s/it][A
 36%|███▋      | 4/11 [00:06<00:06,  1.02it/s][A
 45%|████▌     | 5/11 [00:12<00:15,  2.62s/it][A
 55%|█████▍    | 6/11 [00:12<00:08,  1.77s/it][A
 64%|██████▎   | 7/11 [00:12<00:04,  1.24s/it][A
 73%|███████▎  | 8/11 [00:12<00:02,  1.11it/s][A
 82%|████████▏ | 9/11 [00:17<00:03,  1.97s/it][A
 91%|█████████ | 10/11 [00:17<00:01,  1.41s/it][A
100%|██████████| 11/11 [00:17<00:00,  1.59s/it][A
Epochs:  59%|█████▉    | 33/56 [59:39<52:09, 136.06s/it]

Val Loss: 4.0563 - Val Accuracy: 0.9646



Training:   0%|          | 0/85 [00:00<?, ?it/s][A
Training:   1%|          | 1/85 [00:07<10:10,  7.27s/it][A
Training:   2%|▏         | 2/85 [00:07<04:33,  3.29s/it][A
Training:   4%|▎         | 3/85 [00:08<02:35,  1.89s/it][A
Training:   5%|▍         | 4/85 [00:08<01:37,  1.20s/it][A
Training:   6%|▌         | 5/85 [00:13<03:36,  2.71s/it][A
Training:   7%|▋         | 6/85 [00:13<02:29,  1.89s/it][A
Training:   9%|▉         | 8/85 [00:13<01:16,  1.01it/s][A
Training:  11%|█         | 9/85 [00:20<03:01,  2.38s/it][A
Training:  12%|█▏        | 10/85 [00:20<02:13,  1.77s/it][A
Training:  14%|█▍        | 12/85 [00:20<01:15,  1.03s/it][A
Training:  15%|█▌        | 13/85 [00:26<02:36,  2.17s/it][A
Training:  16%|█▋        | 14/85 [00:26<01:57,  1.66s/it][A
Training:  19%|█▉        | 16/85 [00:26<01:11,  1.03s/it][A
Training:  20%|██        | 17/85 [00:32<02:20,  2.06s/it][A
Training:  21%|██        | 18/85 [00:32<01:47,  1.60s/it][A
Training:  22%|██▏       | 19/85 [00:32<

Epoch: 34/56 - Loss: 2.8982 - Accuracy: 0.9730



  0%|          | 0/11 [00:00<?, ?it/s][A
  9%|▉         | 1/11 [00:06<01:02,  6.26s/it][A
 18%|█▊        | 2/11 [00:06<00:25,  2.78s/it][A
 27%|██▋       | 3/11 [00:06<00:12,  1.58s/it][A
 45%|████▌     | 5/11 [00:11<00:12,  2.07s/it][A
 55%|█████▍    | 6/11 [00:11<00:07,  1.57s/it][A
 64%|██████▎   | 7/11 [00:12<00:04,  1.17s/it][A
 73%|███████▎  | 8/11 [00:12<00:02,  1.15it/s][A
 82%|████████▏ | 9/11 [00:16<00:03,  1.92s/it][A
 91%|█████████ | 10/11 [00:16<00:01,  1.39s/it][A
100%|██████████| 11/11 [00:17<00:00,  1.57s/it][A
Epochs:  61%|██████    | 34/56 [1:02:08<51:18, 139.92s/it]

Val Loss: 4.1892 - Val Accuracy: 0.9653



Training:   0%|          | 0/85 [00:00<?, ?it/s][A
Training:   1%|          | 1/85 [00:07<10:02,  7.17s/it][A
Training:   2%|▏         | 2/85 [00:07<04:16,  3.10s/it][A
Training:   4%|▎         | 3/85 [00:07<02:27,  1.80s/it][A
Training:   5%|▍         | 4/85 [00:07<01:33,  1.15s/it][A
Training:   6%|▌         | 5/85 [00:13<03:41,  2.77s/it][A
Training:   7%|▋         | 6/85 [00:13<02:29,  1.90s/it][A
Training:   8%|▊         | 7/85 [00:13<01:43,  1.33s/it][A
Training:   9%|▉         | 8/85 [00:14<01:13,  1.04it/s][A
Training:  11%|█         | 9/85 [00:19<03:09,  2.49s/it][A
Training:  12%|█▏        | 10/85 [00:20<02:12,  1.77s/it][A
Training:  13%|█▎        | 11/85 [00:20<01:34,  1.28s/it][A
Training:  14%|█▍        | 12/85 [00:20<01:09,  1.06it/s][A
Training:  15%|█▌        | 13/85 [00:25<02:49,  2.36s/it][A
Training:  16%|█▋        | 14/85 [00:26<01:59,  1.69s/it][A
Training:  18%|█▊        | 15/85 [00:26<01:32,  1.32s/it][A
Training:  19%|█▉        | 16/85 [00:26<0

Epoch: 35/56 - Loss: 2.9129 - Accuracy: 0.9720



  0%|          | 0/11 [00:00<?, ?it/s][A
  9%|▉         | 1/11 [00:06<01:05,  6.58s/it][A
 18%|█▊        | 2/11 [00:06<00:25,  2.81s/it][A
 27%|██▋       | 3/11 [00:07<00:13,  1.64s/it][A
 36%|███▋      | 4/11 [00:07<00:07,  1.08s/it][A
 45%|████▌     | 5/11 [00:12<00:15,  2.52s/it][A
 55%|█████▍    | 6/11 [00:12<00:08,  1.73s/it][A
 64%|██████▎   | 7/11 [00:12<00:05,  1.25s/it][A
 73%|███████▎  | 8/11 [00:12<00:02,  1.11it/s][A
 82%|████████▏ | 9/11 [00:17<00:03,  1.93s/it][A
 91%|█████████ | 10/11 [00:17<00:01,  1.38s/it][A
100%|██████████| 11/11 [00:17<00:00,  1.60s/it][A
Epochs:  62%|██████▎   | 35/56 [1:04:37<49:56, 142.67s/it]

Val Loss: 3.6672 - Val Accuracy: 0.9611



Training:   0%|          | 0/85 [00:00<?, ?it/s][A
Training:   1%|          | 1/85 [00:07<10:42,  7.64s/it][A
Training:   2%|▏         | 2/85 [00:07<04:29,  3.25s/it][A
Training:   4%|▎         | 3/85 [00:08<02:33,  1.87s/it][A
Training:   5%|▍         | 4/85 [00:08<01:39,  1.23s/it][A
Training:   6%|▌         | 5/85 [00:14<04:02,  3.04s/it][A
Training:   7%|▋         | 6/85 [00:14<02:43,  2.07s/it][A
Training:   9%|▉         | 8/85 [00:14<01:25,  1.11s/it][A
Training:  11%|█         | 9/85 [00:20<02:57,  2.34s/it][A
Training:  12%|█▏        | 10/85 [00:21<02:11,  1.76s/it][A
Training:  14%|█▍        | 12/85 [00:21<01:14,  1.02s/it][A
Training:  15%|█▌        | 13/85 [00:27<02:43,  2.26s/it][A
Training:  16%|█▋        | 14/85 [00:27<02:03,  1.74s/it][A
Training:  18%|█▊        | 15/85 [00:27<01:33,  1.33s/it][A
Training:  19%|█▉        | 16/85 [00:27<01:08,  1.00it/s][A
Training:  20%|██        | 17/85 [00:33<02:28,  2.18s/it][A
Training:  21%|██        | 18/85 [00:33<

Epoch: 36/56 - Loss: 2.9795 - Accuracy: 0.9725



  0%|          | 0/11 [00:00<?, ?it/s][A
  9%|▉         | 1/11 [00:06<01:08,  6.84s/it][A
 18%|█▊        | 2/11 [00:07<00:26,  2.94s/it][A
 36%|███▋      | 4/11 [00:07<00:08,  1.16s/it][A
 45%|████▌     | 5/11 [00:12<00:13,  2.31s/it][A
 55%|█████▍    | 6/11 [00:12<00:08,  1.64s/it][A
 64%|██████▎   | 7/11 [00:12<00:04,  1.17s/it][A
 82%|████████▏ | 9/11 [00:16<00:03,  1.70s/it][A
 91%|█████████ | 10/11 [00:17<00:01,  1.32s/it][A
100%|██████████| 11/11 [00:17<00:00,  1.59s/it][A
Epochs:  64%|██████▍   | 36/56 [1:07:07<48:14, 144.70s/it]

Val Loss: 4.1775 - Val Accuracy: 0.9584



Training:   0%|          | 0/85 [00:00<?, ?it/s][A
Training:   1%|          | 1/85 [00:07<10:36,  7.57s/it][A
Training:   2%|▏         | 2/85 [00:07<04:26,  3.21s/it][A
Training:   4%|▎         | 3/85 [00:07<02:28,  1.81s/it][A
Training:   5%|▍         | 4/85 [00:08<01:34,  1.17s/it][A
Training:   6%|▌         | 5/85 [00:13<03:49,  2.87s/it][A
Training:   7%|▋         | 6/85 [00:14<02:35,  1.97s/it][A
Training:   8%|▊         | 7/85 [00:14<01:51,  1.43s/it][A
Training:   9%|▉         | 8/85 [00:14<01:20,  1.04s/it][A
Training:  11%|█         | 9/85 [00:20<03:05,  2.45s/it][A
Training:  12%|█▏        | 10/85 [00:20<02:11,  1.75s/it][A
Training:  13%|█▎        | 11/85 [00:20<01:41,  1.38s/it][A
Training:  14%|█▍        | 12/85 [00:21<01:13,  1.00s/it][A
Training:  15%|█▌        | 13/85 [00:26<02:42,  2.25s/it][A
Training:  16%|█▋        | 14/85 [00:26<01:56,  1.64s/it][A
Training:  18%|█▊        | 15/85 [00:27<01:33,  1.34s/it][A
Training:  19%|█▉        | 16/85 [00:27<0

Epoch: 37/56 - Loss: 2.9712 - Accuracy: 0.9727



  0%|          | 0/11 [00:00<?, ?it/s][A
  9%|▉         | 1/11 [00:06<01:03,  6.30s/it][A
 18%|█▊        | 2/11 [00:06<00:25,  2.86s/it][A
 27%|██▋       | 3/11 [00:06<00:13,  1.63s/it][A
 36%|███▋      | 4/11 [00:07<00:07,  1.08s/it][A
 45%|████▌     | 5/11 [00:11<00:13,  2.33s/it][A
 55%|█████▍    | 6/11 [00:12<00:08,  1.73s/it][A
 64%|██████▎   | 7/11 [00:12<00:04,  1.20s/it][A
 73%|███████▎  | 8/11 [00:12<00:02,  1.15it/s][A
 82%|████████▏ | 9/11 [00:16<00:03,  1.73s/it][A
 91%|█████████ | 10/11 [00:16<00:01,  1.45s/it][A
100%|██████████| 11/11 [00:17<00:00,  1.58s/it][A
Epochs:  66%|██████▌   | 37/56 [1:09:35<46:12, 145.94s/it]

Val Loss: 4.6882 - Val Accuracy: 0.9598



Training:   0%|          | 0/85 [00:00<?, ?it/s][A
Training:   1%|          | 1/85 [00:07<10:21,  7.40s/it][A
Training:   2%|▏         | 2/85 [00:07<04:21,  3.14s/it][A
Training:   4%|▎         | 3/85 [00:07<02:29,  1.82s/it][A
Training:   5%|▍         | 4/85 [00:08<01:35,  1.18s/it][A
Training:   6%|▌         | 5/85 [00:13<03:33,  2.66s/it][A
Training:   7%|▋         | 6/85 [00:13<02:26,  1.85s/it][A
Training:   8%|▊         | 7/85 [00:13<01:43,  1.33s/it][A
Training:   9%|▉         | 8/85 [00:13<01:13,  1.04it/s][A
Training:  11%|█         | 9/85 [00:19<03:11,  2.52s/it][A
Training:  12%|█▏        | 10/85 [00:20<02:15,  1.80s/it][A
Training:  13%|█▎        | 11/85 [00:20<01:38,  1.33s/it][A
Training:  14%|█▍        | 12/85 [00:20<01:13,  1.01s/it][A
Training:  15%|█▌        | 13/85 [00:25<02:43,  2.27s/it][A
Training:  16%|█▋        | 14/85 [00:26<01:56,  1.64s/it][A
Training:  18%|█▊        | 15/85 [00:26<01:25,  1.23s/it][A
Training:  20%|██        | 17/85 [00:31<0

Epoch: 38/56 - Loss: 2.8748 - Accuracy: 0.9724



  0%|          | 0/11 [00:00<?, ?it/s][A
  9%|▉         | 1/11 [00:06<01:08,  6.82s/it][A
 36%|███▋      | 4/11 [00:07<00:09,  1.37s/it][A
 45%|████▌     | 5/11 [00:12<00:14,  2.41s/it][A
 64%|██████▎   | 7/11 [00:12<00:05,  1.37s/it][A
 73%|███████▎  | 8/11 [00:12<00:03,  1.07s/it][A
 82%|████████▏ | 9/11 [00:17<00:04,  2.03s/it][A
100%|██████████| 11/11 [00:17<00:00,  1.62s/it][A
Epochs:  68%|██████▊   | 38/56 [1:12:06<44:10, 147.26s/it]

Val Loss: 3.5041 - Val Accuracy: 0.9703



Training:   0%|          | 0/85 [00:00<?, ?it/s][A
Training:   1%|          | 1/85 [00:08<11:35,  8.28s/it][A
Training:   2%|▏         | 2/85 [00:08<04:50,  3.50s/it][A
Training:   4%|▎         | 3/85 [00:08<02:43,  2.00s/it][A
Training:   5%|▍         | 4/85 [00:08<01:45,  1.30s/it][A
Training:   6%|▌         | 5/85 [00:14<03:54,  2.93s/it][A
Training:   7%|▋         | 6/85 [00:14<02:40,  2.03s/it][A
Training:   8%|▊         | 7/85 [00:15<01:51,  1.42s/it][A
Training:   9%|▉         | 8/85 [00:15<01:19,  1.04s/it][A
Training:  11%|█         | 9/85 [00:20<03:04,  2.43s/it][A
Training:  12%|█▏        | 10/85 [00:21<02:10,  1.74s/it][A
Training:  13%|█▎        | 11/85 [00:21<01:32,  1.25s/it][A
Training:  14%|█▍        | 12/85 [00:21<01:07,  1.08it/s][A
Training:  15%|█▌        | 13/85 [00:26<02:34,  2.15s/it][A
Training:  16%|█▋        | 14/85 [00:26<01:49,  1.55s/it][A
Training:  18%|█▊        | 15/85 [00:26<01:20,  1.15s/it][A
Training:  19%|█▉        | 16/85 [00:27<0

Epoch: 39/56 - Loss: 2.9608 - Accuracy: 0.9723



  0%|          | 0/11 [00:00<?, ?it/s][A
  9%|▉         | 1/11 [00:06<01:04,  6.48s/it][A
 36%|███▋      | 4/11 [00:06<00:08,  1.26s/it][A
 55%|█████▍    | 6/11 [00:12<00:09,  1.90s/it][A
 64%|██████▎   | 7/11 [00:12<00:05,  1.48s/it][A
 82%|████████▏ | 9/11 [00:16<00:03,  1.81s/it][A
 91%|█████████ | 10/11 [00:17<00:01,  1.45s/it][A
100%|██████████| 11/11 [00:17<00:00,  1.59s/it][A
Epochs:  70%|██████▉   | 39/56 [1:14:36<41:58, 148.13s/it]

Val Loss: 4.1122 - Val Accuracy: 0.9555



Training:   0%|          | 0/85 [00:00<?, ?it/s][A
Training:   1%|          | 1/85 [00:07<10:23,  7.43s/it][A
Training:   2%|▏         | 2/85 [00:07<04:25,  3.20s/it][A
Training:   4%|▎         | 3/85 [00:07<02:27,  1.80s/it][A
Training:   5%|▍         | 4/85 [00:08<01:35,  1.18s/it][A
Training:   6%|▌         | 5/85 [00:13<03:48,  2.86s/it][A
Training:   7%|▋         | 6/85 [00:14<02:37,  2.00s/it][A
Training:   8%|▊         | 7/85 [00:14<01:59,  1.54s/it][A
Training:  11%|█         | 9/85 [00:20<02:35,  2.05s/it][A
Training:  12%|█▏        | 10/85 [00:20<02:04,  1.66s/it][A
Training:  13%|█▎        | 11/85 [00:21<01:46,  1.44s/it][A
Training:  14%|█▍        | 12/85 [00:21<01:18,  1.08s/it][A
Training:  15%|█▌        | 13/85 [00:25<02:21,  1.96s/it][A
Training:  16%|█▋        | 14/85 [00:26<01:59,  1.68s/it][A
Training:  18%|█▊        | 15/85 [00:26<01:27,  1.25s/it][A
Training:  19%|█▉        | 16/85 [00:27<01:05,  1.06it/s][A
Training:  20%|██        | 17/85 [00:31<

Epoch: 40/56 - Loss: 2.9194 - Accuracy: 0.9717



  0%|          | 0/11 [00:00<?, ?it/s][A
  9%|▉         | 1/11 [00:07<01:10,  7.08s/it][A
 18%|█▊        | 2/11 [00:07<00:26,  2.98s/it][A
 36%|███▋      | 4/11 [00:07<00:08,  1.16s/it][A
 45%|████▌     | 5/11 [00:13<00:15,  2.59s/it][A
 55%|█████▍    | 6/11 [00:13<00:09,  1.85s/it][A
 64%|██████▎   | 7/11 [00:13<00:05,  1.32s/it][A
 73%|███████▎  | 8/11 [00:13<00:02,  1.03it/s][A
 82%|████████▏ | 9/11 [00:17<00:03,  1.90s/it][A
 91%|█████████ | 10/11 [00:17<00:01,  1.39s/it][A
100%|██████████| 11/11 [00:18<00:00,  1.65s/it][A
Epochs:  71%|███████▏  | 40/56 [1:17:03<39:26, 147.90s/it]

Val Loss: 4.4347 - Val Accuracy: 0.9600



Training:   0%|          | 0/85 [00:00<?, ?it/s][A
Training:   1%|          | 1/85 [00:08<11:22,  8.13s/it][A
Training:   2%|▏         | 2/85 [00:08<04:44,  3.43s/it][A
Training:   4%|▎         | 3/85 [00:08<02:39,  1.95s/it][A
Training:   5%|▍         | 4/85 [00:08<01:42,  1.27s/it][A
Training:   6%|▌         | 5/85 [00:14<03:55,  2.94s/it][A
Training:   7%|▋         | 6/85 [00:14<02:36,  1.99s/it][A
Training:   8%|▊         | 7/85 [00:14<01:48,  1.39s/it][A
Training:   9%|▉         | 8/85 [00:15<01:17,  1.00s/it][A
Training:  11%|█         | 9/85 [00:20<03:07,  2.47s/it][A
Training:  12%|█▏        | 10/85 [00:20<02:12,  1.77s/it][A
Training:  13%|█▎        | 11/85 [00:21<01:35,  1.29s/it][A
Training:  15%|█▌        | 13/85 [00:26<02:14,  1.87s/it][A
Training:  16%|█▋        | 14/85 [00:26<01:42,  1.44s/it][A
Training:  18%|█▊        | 15/85 [00:26<01:18,  1.12s/it][A
Training:  19%|█▉        | 16/85 [00:26<01:00,  1.15it/s][A
Training:  20%|██        | 17/85 [00:31<0

Epoch: 41/56 - Loss: 3.0411 - Accuracy: 0.9713



  0%|          | 0/11 [00:00<?, ?it/s][A
  9%|▉         | 1/11 [00:06<01:04,  6.50s/it][A
 18%|█▊        | 2/11 [00:06<00:26,  2.93s/it][A
 27%|██▋       | 3/11 [00:07<00:13,  1.65s/it][A
 36%|███▋      | 4/11 [00:07<00:07,  1.06s/it][A
 45%|████▌     | 5/11 [00:12<00:14,  2.44s/it][A
 55%|█████▍    | 6/11 [00:12<00:08,  1.76s/it][A
 64%|██████▎   | 7/11 [00:12<00:04,  1.24s/it][A
 82%|████████▏ | 9/11 [00:16<00:03,  1.60s/it][A
100%|██████████| 11/11 [00:17<00:00,  1.61s/it][A
Epochs:  73%|███████▎  | 41/56 [1:19:33<37:07, 148.49s/it]

Val Loss: 3.5563 - Val Accuracy: 0.9648



Training:   0%|          | 0/85 [00:00<?, ?it/s][A
Training:   1%|          | 1/85 [00:07<09:58,  7.12s/it][A
Training:   4%|▎         | 3/85 [00:07<02:46,  2.03s/it][A
Training:   5%|▍         | 4/85 [00:07<01:52,  1.39s/it][A
Training:   6%|▌         | 5/85 [00:13<03:41,  2.77s/it][A
Training:   7%|▋         | 6/85 [00:13<02:31,  1.92s/it][A
Training:   8%|▊         | 7/85 [00:13<01:53,  1.46s/it][A
Training:  11%|█         | 9/85 [00:19<02:40,  2.11s/it][A
Training:  12%|█▏        | 10/85 [00:19<02:02,  1.63s/it][A
Training:  13%|█▎        | 11/85 [00:20<01:32,  1.26s/it][A
Training:  14%|█▍        | 12/85 [00:20<01:10,  1.03it/s][A
Training:  15%|█▌        | 13/85 [00:24<02:20,  1.95s/it][A
Training:  18%|█▊        | 15/85 [00:24<01:20,  1.15s/it][A
Training:  19%|█▉        | 16/85 [00:25<01:03,  1.09it/s][A
Training:  20%|██        | 17/85 [00:30<02:19,  2.05s/it][A
Training:  21%|██        | 18/85 [00:30<01:44,  1.56s/it][A
Training:  24%|██▎       | 20/85 [00:31

Epoch: 42/56 - Loss: 2.9692 - Accuracy: 0.9715



  0%|          | 0/11 [00:00<?, ?it/s][A
  9%|▉         | 1/11 [00:07<01:13,  7.37s/it][A
 18%|█▊        | 2/11 [00:07<00:28,  3.17s/it][A
 27%|██▋       | 3/11 [00:07<00:14,  1.86s/it][A
 36%|███▋      | 4/11 [00:08<00:08,  1.24s/it][A
 45%|████▌     | 5/11 [00:13<00:16,  2.74s/it][A
 64%|██████▎   | 7/11 [00:13<00:05,  1.42s/it][A
 73%|███████▎  | 8/11 [00:14<00:03,  1.09s/it][A
 82%|████████▏ | 9/11 [00:18<00:04,  2.08s/it][A
 91%|█████████ | 10/11 [00:18<00:01,  1.54s/it][A
100%|██████████| 11/11 [00:19<00:00,  1.75s/it][A
Epochs:  75%|███████▌  | 42/56 [1:22:05<34:53, 149.54s/it]

Val Loss: 4.0064 - Val Accuracy: 0.9619



Training:   0%|          | 0/85 [00:00<?, ?it/s][A
Training:   1%|          | 1/85 [00:07<10:57,  7.82s/it][A
Training:   2%|▏         | 2/85 [00:08<04:53,  3.54s/it][A
Training:   4%|▎         | 3/85 [00:08<02:45,  2.01s/it][A
Training:   5%|▍         | 4/85 [00:08<01:44,  1.29s/it][A
Training:   6%|▌         | 5/85 [00:14<03:55,  2.94s/it][A
Training:   7%|▋         | 6/85 [00:14<02:39,  2.02s/it][A
Training:   8%|▊         | 7/85 [00:15<01:52,  1.44s/it][A
Training:   9%|▉         | 8/85 [00:15<01:20,  1.05s/it][A
Training:  11%|█         | 9/85 [00:20<02:58,  2.35s/it][A
Training:  12%|█▏        | 10/85 [00:20<02:06,  1.69s/it][A
Training:  13%|█▎        | 11/85 [00:21<01:50,  1.49s/it][A
Training:  14%|█▍        | 12/85 [00:21<01:18,  1.07s/it][A
Training:  15%|█▌        | 13/85 [00:26<02:39,  2.21s/it][A
Training:  16%|█▋        | 14/85 [00:26<01:55,  1.63s/it][A
Training:  18%|█▊        | 15/85 [00:27<01:35,  1.37s/it][A
Training:  20%|██        | 17/85 [00:33<0

Epoch: 43/56 - Loss: 2.9196 - Accuracy: 0.9741



  0%|          | 0/11 [00:00<?, ?it/s][A
  9%|▉         | 1/11 [00:06<01:07,  6.77s/it][A
 18%|█▊        | 2/11 [00:07<00:26,  2.93s/it][A
 27%|██▋       | 3/11 [00:07<00:13,  1.73s/it][A
 36%|███▋      | 4/11 [00:07<00:07,  1.14s/it][A
 45%|████▌     | 5/11 [00:12<00:14,  2.36s/it][A
 64%|██████▎   | 7/11 [00:12<00:05,  1.30s/it][A
 73%|███████▎  | 8/11 [00:12<00:03,  1.03s/it][A
100%|██████████| 11/11 [00:17<00:00,  1.57s/it][A
Epochs:  77%|███████▋  | 43/56 [1:24:42<32:53, 151.81s/it]

Val Loss: 3.6295 - Val Accuracy: 0.9633



Training:   0%|          | 0/85 [00:00<?, ?it/s][A
Training:   1%|          | 1/85 [00:08<11:39,  8.33s/it][A
Training:   2%|▏         | 2/85 [00:08<04:55,  3.56s/it][A
Training:   4%|▎         | 3/85 [00:08<02:50,  2.08s/it][A
Training:   6%|▌         | 5/85 [00:14<03:29,  2.62s/it][A
Training:   9%|▉         | 8/85 [00:15<01:33,  1.21s/it][A
Training:  11%|█         | 9/85 [00:20<02:39,  2.10s/it][A
Training:  12%|█▏        | 10/85 [00:20<02:03,  1.64s/it][A
Training:  13%|█▎        | 11/85 [00:20<01:33,  1.26s/it][A
Training:  14%|█▍        | 12/85 [00:20<01:10,  1.03it/s][A
Training:  15%|█▌        | 13/85 [00:26<02:35,  2.16s/it][A
Training:  16%|█▋        | 14/85 [00:26<01:53,  1.60s/it][A
Training:  18%|█▊        | 15/85 [00:26<01:24,  1.21s/it][A
Training:  19%|█▉        | 16/85 [00:26<01:02,  1.10it/s][A
Training:  20%|██        | 17/85 [00:32<02:31,  2.23s/it][A
Training:  21%|██        | 18/85 [00:32<01:48,  1.62s/it][A
Training:  22%|██▏       | 19/85 [00:3

Epoch: 44/56 - Loss: 2.9230 - Accuracy: 0.9720



  0%|          | 0/11 [00:00<?, ?it/s][A
  9%|▉         | 1/11 [00:06<01:08,  6.90s/it][A
 18%|█▊        | 2/11 [00:07<00:29,  3.23s/it][A
 36%|███▋      | 4/11 [00:07<00:08,  1.24s/it][A
 45%|████▌     | 5/11 [00:12<00:13,  2.29s/it][A
 55%|█████▍    | 6/11 [00:12<00:08,  1.66s/it][A
 64%|██████▎   | 7/11 [00:12<00:04,  1.22s/it][A
 73%|███████▎  | 8/11 [00:13<00:02,  1.09it/s][A
 82%|████████▏ | 9/11 [00:17<00:04,  2.04s/it][A
 91%|█████████ | 10/11 [00:17<00:01,  1.48s/it][A
100%|██████████| 11/11 [00:18<00:00,  1.65s/it][A
Epochs:  79%|███████▊  | 44/56 [1:27:15<30:24, 152.04s/it]

Val Loss: 4.0984 - Val Accuracy: 0.9616



Training:   0%|          | 0/85 [00:00<?, ?it/s][A
Training:   1%|          | 1/85 [00:07<09:57,  7.12s/it][A
Training:   2%|▏         | 2/85 [00:07<04:44,  3.42s/it][A
Training:   4%|▎         | 3/85 [00:08<02:37,  1.92s/it][A
Training:   5%|▍         | 4/85 [00:08<01:40,  1.24s/it][A
Training:   6%|▌         | 5/85 [00:13<03:33,  2.67s/it][A
Training:   7%|▋         | 6/85 [00:13<02:25,  1.84s/it][A
Training:   8%|▊         | 7/85 [00:13<01:41,  1.30s/it][A
Training:   9%|▉         | 8/85 [00:14<01:19,  1.03s/it][A
Training:  11%|█         | 9/85 [00:19<03:03,  2.41s/it][A
Training:  12%|█▏        | 10/85 [00:20<02:10,  1.75s/it][A
Training:  13%|█▎        | 11/85 [00:20<01:35,  1.29s/it][A
Training:  14%|█▍        | 12/85 [00:20<01:16,  1.05s/it][A
Training:  15%|█▌        | 13/85 [00:26<02:45,  2.30s/it][A
Training:  16%|█▋        | 14/85 [00:26<01:59,  1.68s/it][A
Training:  18%|█▊        | 15/85 [00:26<01:26,  1.24s/it][A
Training:  19%|█▉        | 16/85 [00:26<0

Epoch: 45/56 - Loss: 2.9315 - Accuracy: 0.9713



  0%|          | 0/11 [00:00<?, ?it/s][A
  9%|▉         | 1/11 [00:06<01:04,  6.49s/it][A
 18%|█▊        | 2/11 [00:06<00:25,  2.79s/it][A
 27%|██▋       | 3/11 [00:06<00:12,  1.58s/it][A
 45%|████▌     | 5/11 [00:11<00:12,  2.08s/it][A
 55%|█████▍    | 6/11 [00:11<00:07,  1.55s/it][A
 64%|██████▎   | 7/11 [00:12<00:04,  1.21s/it][A
 82%|████████▏ | 9/11 [00:16<00:03,  1.57s/it][A
100%|██████████| 11/11 [00:16<00:00,  1.54s/it][A


Val Loss: 4.6141 - Val Accuracy: 0.9598


Epochs:  80%|████████  | 45/56 [1:29:46<27:49, 151.76s/it]
Training:   0%|          | 0/85 [00:00<?, ?it/s][A
Training:   1%|          | 1/85 [00:06<09:42,  6.94s/it][A
Training:   2%|▏         | 2/85 [00:07<04:05,  2.95s/it][A
Training:   4%|▎         | 3/85 [00:07<02:17,  1.68s/it][A
Training:   5%|▍         | 4/85 [00:07<01:26,  1.07s/it][A
Training:   6%|▌         | 5/85 [00:13<04:02,  3.03s/it][A
Training:   7%|▋         | 6/85 [00:14<02:41,  2.04s/it][A
Training:   8%|▊         | 7/85 [00:14<01:50,  1.42s/it][A
Training:   9%|▉         | 8/85 [00:14<01:17,  1.00s/it][A
Training:  11%|█         | 9/85 [00:19<02:48,  2.22s/it][A
Training:  12%|█▏        | 10/85 [00:19<02:00,  1.61s/it][A
Training:  13%|█▎        | 11/85 [00:19<01:28,  1.20s/it][A
Training:  14%|█▍        | 12/85 [00:19<01:05,  1.12it/s][A
Training:  15%|█▌        | 13/85 [00:25<02:39,  2.22s/it][A
Training:  16%|█▋        | 14/85 [00:25<01:54,  1.61s/it][A
Training:  18%|█▊        | 15/85 [00:25<01:2

Epoch: 46/56 - Loss: 3.0744 - Accuracy: 0.9708



  0%|          | 0/11 [00:00<?, ?it/s][A
  9%|▉         | 1/11 [00:06<01:01,  6.18s/it][A
 18%|█▊        | 2/11 [00:06<00:23,  2.65s/it][A
 27%|██▋       | 3/11 [00:06<00:11,  1.50s/it][A
 36%|███▋      | 4/11 [00:06<00:07,  1.07s/it][A
 45%|████▌     | 5/11 [00:11<00:14,  2.50s/it][A
 64%|██████▎   | 7/11 [00:12<00:05,  1.28s/it][A
 82%|████████▏ | 9/11 [00:16<00:03,  1.70s/it][A
100%|██████████| 11/11 [00:16<00:00,  1.55s/it][A
Epochs:  82%|████████▏ | 46/56 [1:32:14<25:07, 150.80s/it]

Val Loss: 3.6405 - Val Accuracy: 0.9657



Training:   0%|          | 0/85 [00:00<?, ?it/s][A
Training:   1%|          | 1/85 [00:06<09:33,  6.83s/it][A
Training:   2%|▏         | 2/85 [00:07<04:21,  3.15s/it][A
Training:   4%|▎         | 3/85 [00:07<02:27,  1.80s/it][A
Training:   5%|▍         | 4/85 [00:07<01:36,  1.19s/it][A
Training:   6%|▌         | 5/85 [00:12<03:19,  2.49s/it][A
Training:   7%|▋         | 6/85 [00:13<02:41,  2.04s/it][A
Training:   8%|▊         | 7/85 [00:14<01:53,  1.45s/it][A
Training:   9%|▉         | 8/85 [00:14<01:21,  1.05s/it][A
Training:  11%|█         | 9/85 [00:18<02:32,  2.01s/it][A
Training:  12%|█▏        | 10/85 [00:18<01:56,  1.56s/it][A
Training:  13%|█▎        | 11/85 [00:19<01:31,  1.23s/it][A
Training:  14%|█▍        | 12/85 [00:19<01:05,  1.12it/s][A
Training:  15%|█▌        | 13/85 [00:24<02:24,  2.01s/it][A
Training:  16%|█▋        | 14/85 [00:25<02:04,  1.75s/it][A
Training:  18%|█▊        | 15/85 [00:25<01:32,  1.32s/it][A
Training:  19%|█▉        | 16/85 [00:25<0

Epoch: 47/56 - Loss: 2.9823 - Accuracy: 0.9737



  0%|          | 0/11 [00:00<?, ?it/s][A
  9%|▉         | 1/11 [00:06<01:07,  6.74s/it][A
 18%|█▊        | 2/11 [00:06<00:25,  2.88s/it][A
 27%|██▋       | 3/11 [00:07<00:13,  1.70s/it][A
 45%|████▌     | 5/11 [00:11<00:12,  2.07s/it][A
 55%|█████▍    | 6/11 [00:12<00:07,  1.51s/it][A
 73%|███████▎  | 8/11 [00:12<00:02,  1.18it/s][A
 82%|████████▏ | 9/11 [00:16<00:03,  1.70s/it][A
 91%|█████████ | 10/11 [00:16<00:01,  1.31s/it][A
100%|██████████| 11/11 [00:17<00:00,  1.55s/it][A
Epochs:  84%|████████▍ | 47/56 [1:34:42<22:29, 149.95s/it]

Val Loss: 3.9680 - Val Accuracy: 0.9605



Training:   0%|          | 0/85 [00:00<?, ?it/s][A
Training:   1%|          | 1/85 [00:07<10:11,  7.28s/it][A
Training:   2%|▏         | 2/85 [00:07<04:23,  3.18s/it][A
Training:   4%|▎         | 3/85 [00:07<02:32,  1.85s/it][A
Training:   5%|▍         | 4/85 [00:07<01:35,  1.17s/it][A
Training:   6%|▌         | 5/85 [00:13<03:47,  2.84s/it][A
Training:   7%|▋         | 6/85 [00:13<02:32,  1.93s/it][A
Training:   8%|▊         | 7/85 [00:14<01:47,  1.37s/it][A
Training:   9%|▉         | 8/85 [00:14<01:15,  1.02it/s][A
Training:  11%|█         | 9/85 [00:19<02:53,  2.29s/it][A
Training:  12%|█▏        | 10/85 [00:19<02:02,  1.64s/it][A
Training:  13%|█▎        | 11/85 [00:19<01:28,  1.19s/it][A
Training:  14%|█▍        | 12/85 [00:20<01:04,  1.14it/s][A
Training:  15%|█▌        | 13/85 [00:25<02:44,  2.28s/it][A
Training:  16%|█▋        | 14/85 [00:25<01:56,  1.63s/it][A
Training:  18%|█▊        | 15/85 [00:25<01:23,  1.19s/it][A
Training:  19%|█▉        | 16/85 [00:25<0

Epoch: 48/56 - Loss: 2.8723 - Accuracy: 0.9738



  0%|          | 0/11 [00:00<?, ?it/s][A
  9%|▉         | 1/11 [00:06<01:04,  6.43s/it][A
 18%|█▊        | 2/11 [00:06<00:24,  2.76s/it][A
 27%|██▋       | 3/11 [00:06<00:12,  1.58s/it][A
 36%|███▋      | 4/11 [00:07<00:07,  1.06s/it][A
 45%|████▌     | 5/11 [00:11<00:14,  2.45s/it][A
 55%|█████▍    | 6/11 [00:12<00:08,  1.67s/it][A
 73%|███████▎  | 8/11 [00:12<00:02,  1.13it/s][A
 82%|████████▏ | 9/11 [00:16<00:03,  1.78s/it][A
 91%|█████████ | 10/11 [00:16<00:01,  1.33s/it][A
100%|██████████| 11/11 [00:17<00:00,  1.57s/it][A
Epochs:  86%|████████▌ | 48/56 [1:37:12<19:58, 149.78s/it]

Val Loss: 4.2671 - Val Accuracy: 0.9618



Training:   0%|          | 0/85 [00:00<?, ?it/s][A
Training:   1%|          | 1/85 [00:07<10:46,  7.70s/it][A
Training:   2%|▏         | 2/85 [00:07<04:28,  3.24s/it][A
Training:   4%|▎         | 3/85 [00:07<02:30,  1.83s/it][A
Training:   5%|▍         | 4/85 [00:08<01:38,  1.21s/it][A
Training:   6%|▌         | 5/85 [00:13<03:41,  2.77s/it][A
Training:   8%|▊         | 7/85 [00:13<01:49,  1.40s/it][A
Training:  11%|█         | 9/85 [00:19<02:32,  2.01s/it][A
Training:  12%|█▏        | 10/85 [00:19<01:59,  1.59s/it][A
Training:  13%|█▎        | 11/85 [00:20<01:33,  1.26s/it][A
Training:  14%|█▍        | 12/85 [00:20<01:12,  1.01it/s][A
Training:  15%|█▌        | 13/85 [00:25<02:40,  2.22s/it][A
Training:  16%|█▋        | 14/85 [00:25<01:56,  1.63s/it][A
Training:  18%|█▊        | 15/85 [00:26<01:27,  1.25s/it][A
Training:  19%|█▉        | 16/85 [00:26<01:06,  1.04it/s][A
Training:  20%|██        | 17/85 [00:32<02:36,  2.30s/it][A
Training:  21%|██        | 18/85 [00:32

Epoch: 49/56 - Loss: 2.9855 - Accuracy: 0.9745



  0%|          | 0/11 [00:00<?, ?it/s][A
  9%|▉         | 1/11 [00:06<01:02,  6.28s/it][A
 18%|█▊        | 2/11 [00:06<00:24,  2.67s/it][A
 27%|██▋       | 3/11 [00:06<00:12,  1.51s/it][A
 36%|███▋      | 4/11 [00:06<00:06,  1.01it/s][A
 45%|████▌     | 5/11 [00:12<00:15,  2.58s/it][A
 55%|█████▍    | 6/11 [00:12<00:08,  1.76s/it][A
 64%|██████▎   | 7/11 [00:12<00:04,  1.25s/it][A
 73%|███████▎  | 8/11 [00:12<00:02,  1.09it/s][A
 82%|████████▏ | 9/11 [00:17<00:04,  2.06s/it][A
 91%|█████████ | 10/11 [00:17<00:01,  1.52s/it][A
100%|██████████| 11/11 [00:18<00:00,  1.64s/it][A
Epochs:  88%|████████▊ | 49/56 [1:39:43<17:31, 150.21s/it]

Val Loss: 4.1908 - Val Accuracy: 0.9589



Training:   0%|          | 0/85 [00:00<?, ?it/s][A
Training:   1%|          | 1/85 [00:06<09:38,  6.89s/it][A
Training:   2%|▏         | 2/85 [00:07<04:24,  3.19s/it][A
Training:   5%|▍         | 4/85 [00:07<01:43,  1.28s/it][A
Training:   6%|▌         | 5/85 [00:13<03:33,  2.67s/it][A
Training:   7%|▋         | 6/85 [00:13<02:29,  1.89s/it][A
Training:   8%|▊         | 7/85 [00:13<01:47,  1.38s/it][A
Training:   9%|▉         | 8/85 [00:14<01:22,  1.07s/it][A
Training:  11%|█         | 9/85 [00:19<03:00,  2.37s/it][A
Training:  12%|█▏        | 10/85 [00:19<02:07,  1.70s/it][A
Training:  14%|█▍        | 12/85 [00:20<01:11,  1.02it/s][A
Training:  15%|█▌        | 13/85 [00:25<02:30,  2.09s/it][A
Training:  16%|█▋        | 14/85 [00:25<01:52,  1.59s/it][A
Training:  18%|█▊        | 15/85 [00:25<01:24,  1.21s/it][A
Training:  19%|█▉        | 16/85 [00:26<01:04,  1.08it/s][A
Training:  20%|██        | 17/85 [00:31<02:25,  2.13s/it][A
Training:  21%|██        | 18/85 [00:31<

Epoch: 50/56 - Loss: 2.9900 - Accuracy: 0.9711



  0%|          | 0/11 [00:00<?, ?it/s][A
  9%|▉         | 1/11 [00:06<01:05,  6.57s/it][A
 18%|█▊        | 2/11 [00:06<00:24,  2.78s/it][A
 27%|██▋       | 3/11 [00:06<00:12,  1.59s/it][A
 36%|███▋      | 4/11 [00:07<00:07,  1.05s/it][A
 45%|████▌     | 5/11 [00:11<00:14,  2.34s/it][A
 64%|██████▎   | 7/11 [00:11<00:04,  1.18s/it][A
 82%|████████▏ | 9/11 [00:16<00:03,  1.76s/it][A
 91%|█████████ | 10/11 [00:17<00:01,  1.39s/it][A
100%|██████████| 11/11 [00:17<00:00,  1.59s/it][A
Epochs:  89%|████████▉ | 50/56 [1:42:14<15:02, 150.39s/it]

Val Loss: 4.3825 - Val Accuracy: 0.9624



Training:   0%|          | 0/85 [00:00<?, ?it/s][A
Training:   1%|          | 1/85 [00:07<10:23,  7.42s/it][A
Training:   2%|▏         | 2/85 [00:07<04:23,  3.18s/it][A
Training:   4%|▎         | 3/85 [00:07<02:27,  1.80s/it][A
Training:   5%|▍         | 4/85 [00:07<01:33,  1.15s/it][A
Training:   6%|▌         | 5/85 [00:13<03:45,  2.82s/it][A
Training:   7%|▋         | 6/85 [00:13<02:30,  1.91s/it][A
Training:   9%|▉         | 8/85 [00:13<01:16,  1.00it/s][A
Training:  11%|█         | 9/85 [00:19<02:47,  2.21s/it][A
Training:  13%|█▎        | 11/85 [00:19<01:37,  1.32s/it][A
Training:  14%|█▍        | 12/85 [00:20<01:17,  1.06s/it][A
Training:  15%|█▌        | 13/85 [00:25<02:36,  2.17s/it][A
Training:  16%|█▋        | 14/85 [00:25<01:57,  1.65s/it][A
Training:  18%|█▊        | 15/85 [00:25<01:27,  1.25s/it][A
Training:  19%|█▉        | 16/85 [00:26<01:08,  1.01it/s][A
Training:  20%|██        | 17/85 [00:31<02:29,  2.20s/it][A
Training:  21%|██        | 18/85 [00:31<

Epoch: 51/56 - Loss: 2.8342 - Accuracy: 0.9732



  0%|          | 0/11 [00:00<?, ?it/s][A
  9%|▉         | 1/11 [00:06<01:08,  6.83s/it][A
 18%|█▊        | 2/11 [00:07<00:26,  2.93s/it][A
 27%|██▋       | 3/11 [00:07<00:13,  1.69s/it][A
 36%|███▋      | 4/11 [00:07<00:07,  1.11s/it][A
 45%|████▌     | 5/11 [00:12<00:15,  2.57s/it][A
 55%|█████▍    | 6/11 [00:12<00:08,  1.77s/it][A
 64%|██████▎   | 7/11 [00:13<00:05,  1.25s/it][A
 82%|████████▏ | 9/11 [00:17<00:03,  1.74s/it][A
100%|██████████| 11/11 [00:18<00:00,  1.64s/it][A
Epochs:  91%|█████████ | 51/56 [1:44:43<12:29, 149.97s/it]

Val Loss: 3.9667 - Val Accuracy: 0.9612



Training:   0%|          | 0/85 [00:00<?, ?it/s][A
Training:   1%|          | 1/85 [00:07<10:02,  7.17s/it][A
Training:   2%|▏         | 2/85 [00:07<04:19,  3.13s/it][A
Training:   4%|▎         | 3/85 [00:07<02:23,  1.75s/it][A
Training:   5%|▍         | 4/85 [00:07<01:29,  1.11s/it][A
Training:   6%|▌         | 5/85 [00:13<03:41,  2.77s/it][A
Training:   7%|▋         | 6/85 [00:14<02:43,  2.07s/it][A
Training:   8%|▊         | 7/85 [00:14<01:54,  1.47s/it][A
Training:   9%|▉         | 8/85 [00:14<01:30,  1.17s/it][A
Training:  11%|█         | 9/85 [00:19<02:48,  2.22s/it][A
Training:  12%|█▏        | 10/85 [00:19<02:06,  1.68s/it][A
Training:  13%|█▎        | 11/85 [00:20<01:29,  1.21s/it][A
Training:  14%|█▍        | 12/85 [00:20<01:11,  1.02it/s][A
Training:  15%|█▌        | 13/85 [00:25<02:30,  2.09s/it][A
Training:  16%|█▋        | 14/85 [00:25<01:58,  1.67s/it][A
Training:  18%|█▊        | 15/85 [00:25<01:24,  1.21s/it][A
Training:  19%|█▉        | 16/85 [00:26<0

Epoch: 52/56 - Loss: 2.8229 - Accuracy: 0.9743



  0%|          | 0/11 [00:00<?, ?it/s][A
  9%|▉         | 1/11 [00:06<01:07,  6.76s/it][A
 18%|█▊        | 2/11 [00:06<00:26,  2.91s/it][A
 27%|██▋       | 3/11 [00:07<00:13,  1.64s/it][A
 45%|████▌     | 5/11 [00:12<00:12,  2.10s/it][A
 55%|█████▍    | 6/11 [00:12<00:07,  1.57s/it][A
 64%|██████▎   | 7/11 [00:12<00:04,  1.17s/it][A
 73%|███████▎  | 8/11 [00:12<00:02,  1.15it/s][A
 82%|████████▏ | 9/11 [00:17<00:03,  1.98s/it][A
 91%|█████████ | 10/11 [00:17<00:01,  1.45s/it][A
100%|██████████| 11/11 [00:17<00:00,  1.62s/it][A
Epochs:  93%|█████████▎| 52/56 [1:47:12<09:58, 149.63s/it]

Val Loss: 3.9527 - Val Accuracy: 0.9589



Training:   0%|          | 0/85 [00:00<?, ?it/s][A
Training:   1%|          | 1/85 [00:07<10:38,  7.60s/it][A
Training:   2%|▏         | 2/85 [00:07<04:31,  3.27s/it][A
Training:   4%|▎         | 3/85 [00:08<02:33,  1.87s/it][A
Training:   5%|▍         | 4/85 [00:08<01:40,  1.24s/it][A
Training:   6%|▌         | 5/85 [00:14<03:56,  2.95s/it][A
Training:   7%|▋         | 6/85 [00:14<02:40,  2.03s/it][A
Training:   8%|▊         | 7/85 [00:14<01:51,  1.44s/it][A
Training:  11%|█         | 9/85 [00:20<02:43,  2.15s/it][A
Training:  12%|█▏        | 10/85 [00:20<02:06,  1.69s/it][A
Training:  13%|█▎        | 11/85 [00:21<01:33,  1.27s/it][A
Training:  14%|█▍        | 12/85 [00:21<01:10,  1.04it/s][A
Training:  15%|█▌        | 13/85 [00:26<02:31,  2.11s/it][A
Training:  16%|█▋        | 14/85 [00:27<02:03,  1.74s/it][A
Training:  18%|█▊        | 15/85 [00:27<01:31,  1.30s/it][A
Training:  19%|█▉        | 16/85 [00:27<01:07,  1.02it/s][A
Training:  20%|██        | 17/85 [00:32<

Epoch: 53/56 - Loss: 2.8425 - Accuracy: 0.9738



  0%|          | 0/11 [00:00<?, ?it/s][A
  9%|▉         | 1/11 [00:06<01:05,  6.53s/it][A
 18%|█▊        | 2/11 [00:06<00:25,  2.79s/it][A
 36%|███▋      | 4/11 [00:06<00:07,  1.08s/it][A
 45%|████▌     | 5/11 [00:12<00:14,  2.36s/it][A
 55%|█████▍    | 6/11 [00:12<00:08,  1.70s/it][A
 64%|██████▎   | 7/11 [00:12<00:04,  1.23s/it][A
 73%|███████▎  | 8/11 [00:12<00:02,  1.09it/s][A
 82%|████████▏ | 9/11 [00:17<00:04,  2.07s/it][A
100%|██████████| 11/11 [00:17<00:00,  1.61s/it][A
Epochs:  95%|█████████▍| 53/56 [1:49:45<07:31, 150.62s/it]

Val Loss: 3.9203 - Val Accuracy: 0.9616



Training:   0%|          | 0/85 [00:00<?, ?it/s][A
Training:   1%|          | 1/85 [00:07<10:29,  7.49s/it][A
Training:   2%|▏         | 2/85 [00:07<04:21,  3.15s/it][A
Training:   4%|▎         | 3/85 [00:08<02:51,  2.09s/it][A
Training:   5%|▍         | 4/85 [00:08<01:47,  1.32s/it][A
Training:   6%|▌         | 5/85 [00:14<03:46,  2.83s/it][A
Training:   7%|▋         | 6/85 [00:14<02:39,  2.02s/it][A
Training:   8%|▊         | 7/85 [00:14<01:55,  1.47s/it][A
Training:   9%|▉         | 8/85 [00:15<01:22,  1.07s/it][A
Training:  11%|█         | 9/85 [00:20<02:55,  2.30s/it][A
Training:  12%|█▏        | 10/85 [00:20<02:12,  1.77s/it][A
Training:  13%|█▎        | 11/85 [00:20<01:36,  1.30s/it][A
Training:  14%|█▍        | 12/85 [00:21<01:10,  1.03it/s][A
Training:  15%|█▌        | 13/85 [00:26<02:46,  2.32s/it][A
Training:  16%|█▋        | 14/85 [00:26<01:59,  1.68s/it][A
Training:  18%|█▊        | 15/85 [00:27<01:27,  1.25s/it][A
Training:  19%|█▉        | 16/85 [00:27<0

Epoch: 54/56 - Loss: 3.0639 - Accuracy: 0.9727



  0%|          | 0/11 [00:00<?, ?it/s][A
  9%|▉         | 1/11 [00:06<01:08,  6.81s/it][A
 18%|█▊        | 2/11 [00:07<00:27,  3.07s/it][A
 27%|██▋       | 3/11 [00:07<00:14,  1.76s/it][A
 36%|███▋      | 4/11 [00:07<00:08,  1.18s/it][A
 45%|████▌     | 5/11 [00:13<00:16,  2.72s/it][A
 55%|█████▍    | 6/11 [00:13<00:09,  1.89s/it][A
 73%|███████▎  | 8/11 [00:13<00:03,  1.01s/it][A
 82%|████████▏ | 9/11 [00:18<00:04,  2.10s/it][A
100%|██████████| 11/11 [00:19<00:00,  1.75s/it][A
Epochs:  96%|█████████▋| 54/56 [1:52:19<05:03, 151.75s/it]

Val Loss: 4.1202 - Val Accuracy: 0.9631



Training:   0%|          | 0/85 [00:00<?, ?it/s][A
Training:   1%|          | 1/85 [00:07<10:51,  7.75s/it][A
Training:   2%|▏         | 2/85 [00:07<04:34,  3.30s/it][A
Training:   5%|▍         | 4/85 [00:08<01:44,  1.29s/it][A
Training:   6%|▌         | 5/85 [00:14<03:47,  2.84s/it][A
Training:   8%|▊         | 7/85 [00:14<02:00,  1.55s/it][A
Training:   9%|▉         | 8/85 [00:14<01:32,  1.20s/it][A
Training:  11%|█         | 9/85 [00:20<02:56,  2.32s/it][A
Training:  12%|█▏        | 10/85 [00:20<02:11,  1.75s/it][A
Training:  13%|█▎        | 11/85 [00:20<01:37,  1.31s/it][A
Training:  14%|█▍        | 12/85 [00:20<01:11,  1.02it/s][A
Training:  15%|█▌        | 13/85 [00:25<02:32,  2.12s/it][A
Training:  16%|█▋        | 14/85 [00:26<01:53,  1.60s/it][A
Training:  18%|█▊        | 15/85 [00:26<01:26,  1.23s/it][A
Training:  19%|█▉        | 16/85 [00:26<01:03,  1.09it/s][A
Training:  20%|██        | 17/85 [00:32<02:43,  2.41s/it][A
Training:  21%|██        | 18/85 [00:32

Epoch: 55/56 - Loss: 2.9909 - Accuracy: 0.9736



  0%|          | 0/11 [00:00<?, ?it/s][A
  9%|▉         | 1/11 [00:06<01:07,  6.77s/it][A
 18%|█▊        | 2/11 [00:07<00:26,  2.98s/it][A
 27%|██▋       | 3/11 [00:07<00:13,  1.70s/it][A
 36%|███▋      | 4/11 [00:07<00:07,  1.07s/it][A
 45%|████▌     | 5/11 [00:12<00:15,  2.51s/it][A
 55%|█████▍    | 6/11 [00:12<00:08,  1.70s/it][A
 64%|██████▎   | 7/11 [00:12<00:04,  1.20s/it][A
 73%|███████▎  | 8/11 [00:12<00:02,  1.14it/s][A
 82%|████████▏ | 9/11 [00:17<00:04,  2.15s/it][A
 91%|█████████ | 10/11 [00:18<00:01,  1.53s/it][A
100%|██████████| 11/11 [00:18<00:00,  1.68s/it][A
Epochs:  98%|█████████▊| 55/56 [1:54:49<02:31, 151.19s/it]

Val Loss: 4.3545 - Val Accuracy: 0.9606



Training:   0%|          | 0/85 [00:00<?, ?it/s][A
Training:   1%|          | 1/85 [00:07<10:35,  7.57s/it][A
Training:   2%|▏         | 2/85 [00:07<04:27,  3.22s/it][A
Training:   4%|▎         | 3/85 [00:08<02:42,  1.98s/it][A
Training:   5%|▍         | 4/85 [00:08<01:41,  1.25s/it][A
Training:   6%|▌         | 5/85 [00:14<03:50,  2.88s/it][A
Training:   7%|▋         | 6/85 [00:14<02:35,  1.97s/it][A
Training:   8%|▊         | 7/85 [00:14<01:48,  1.39s/it][A
Training:   9%|▉         | 8/85 [00:14<01:19,  1.03s/it][A
Training:  11%|█         | 9/85 [00:20<03:05,  2.44s/it][A
Training:  12%|█▏        | 10/85 [00:20<02:10,  1.74s/it][A
Training:  13%|█▎        | 11/85 [00:20<01:34,  1.28s/it][A
Training:  15%|█▌        | 13/85 [00:25<02:13,  1.86s/it][A
Training:  16%|█▋        | 14/85 [00:26<01:43,  1.45s/it][A
Training:  18%|█▊        | 15/85 [00:26<01:23,  1.19s/it][A
Training:  19%|█▉        | 16/85 [00:26<01:04,  1.07it/s][A
Training:  20%|██        | 17/85 [00:31<0

Epoch: 56/56 - Loss: 2.9942 - Accuracy: 0.9724



  0%|          | 0/11 [00:00<?, ?it/s][A
  9%|▉         | 1/11 [00:06<01:04,  6.43s/it][A
 18%|█▊        | 2/11 [00:07<00:27,  3.02s/it][A
 27%|██▋       | 3/11 [00:07<00:13,  1.73s/it][A
 36%|███▋      | 4/11 [00:07<00:07,  1.14s/it][A
 45%|████▌     | 5/11 [00:12<00:14,  2.49s/it][A
 55%|█████▍    | 6/11 [00:12<00:09,  1.80s/it][A
 64%|██████▎   | 7/11 [00:13<00:05,  1.27s/it][A
 73%|███████▎  | 8/11 [00:13<00:02,  1.09it/s][A
 82%|████████▏ | 9/11 [00:17<00:04,  2.05s/it][A
 91%|█████████ | 10/11 [00:17<00:01,  1.49s/it][A
100%|██████████| 11/11 [00:18<00:00,  1.67s/it][A
Epochs: 100%|██████████| 56/56 [1:57:20<00:00, 125.72s/it]


Val Loss: 3.8741 - Val Accuracy: 0.9649
Saving best model...


[32m[I 2023-12-08 19:59:45,885][0m Trial 15 finished with value: 0.9649122357368469 and parameters: {'loss_learning_rate': 0.00953499792102873, 'learning_rate': 0.0004893954558618118, 'weight_decay': 0.004977508654911263, 'epsilon': 8.634793963388647e-08, 'beta': 0.5, 'gamma': 0.6, 'batch_size': 165, 'epochs': 56}. Best is trial 15 with value: 0.9649122357368469.[0m


Learning rate for Loss: 0.009182383596361456
Learning rate: 0.0005227903627863731
Weight decay: 0.00022533397273366494
Epsilon: 8.488395942056724e-08
Beta: 1.0
Gamma: 0.7000000000000001
Batch size: 107
Number of epochs: 55


Epochs:   0%|          | 0/55 [00:00<?, ?it/s]
Training:   0%|          | 0/131 [00:00<?, ?it/s][A
Training:   1%|          | 1/131 [00:05<11:55,  5.51s/it][A
Training:   2%|▏         | 2/131 [00:05<05:07,  2.38s/it][A
Training:   2%|▏         | 3/131 [00:05<02:57,  1.39s/it][A
Training:   3%|▎         | 4/131 [00:06<01:56,  1.09it/s][A
Training:   4%|▍         | 5/131 [00:09<03:49,  1.82s/it][A
Training:   5%|▍         | 6/131 [00:09<02:36,  1.25s/it][A
Training:   5%|▌         | 7/131 [00:09<01:49,  1.14it/s][A
Training:   6%|▌         | 8/131 [00:10<01:23,  1.47it/s][A
Training:   7%|▋         | 9/131 [00:13<03:26,  1.69s/it][A
Training:   8%|▊         | 10/131 [00:14<02:26,  1.21s/it][A
Training:   8%|▊         | 11/131 [00:14<01:47,  1.11it/s][A
Training:   9%|▉         | 12/131 [00:14<01:18,  1.52it/s][A
Training:  10%|▉         | 13/131 [00:17<03:01,  1.53s/it][A
Training:  11%|█▏        | 15/131 [00:18<01:40,  1.15it/s][A
Training:  12%|█▏        | 16/131 [00:18<

Epoch: 1/55 - Loss: 13.1483 - Accuracy: 0.9099



  0%|          | 0/17 [00:00<?, ?it/s][A
  6%|▌         | 1/17 [00:04<01:14,  4.67s/it][A
 18%|█▊        | 3/17 [00:04<00:18,  1.30s/it][A
 24%|██▎       | 4/17 [00:05<00:11,  1.10it/s][A
 29%|██▉       | 5/17 [00:08<00:21,  1.79s/it][A
 41%|████      | 7/17 [00:08<00:09,  1.04it/s][A
 53%|█████▎    | 9/17 [00:12<00:10,  1.29s/it][A
 59%|█████▉    | 10/17 [00:12<00:07,  1.03s/it][A
 71%|███████   | 12/17 [00:12<00:03,  1.54it/s][A
 76%|███████▋  | 13/17 [00:16<00:05,  1.26s/it][A
100%|██████████| 17/17 [00:17<00:00,  1.00s/it][A
Epochs:   2%|▏         | 1/55 [02:30<2:15:37, 150.69s/it]

Val Loss: 8.6590 - Val Accuracy: 0.9552



Training:   0%|          | 0/131 [00:00<?, ?it/s][A
Training:   1%|          | 1/131 [00:05<11:22,  5.25s/it][A
Training:   2%|▏         | 2/131 [00:05<04:51,  2.26s/it][A
Training:   2%|▏         | 3/131 [00:05<02:45,  1.29s/it][A
Training:   3%|▎         | 4/131 [00:05<01:47,  1.18it/s][A
Training:   4%|▍         | 5/131 [00:09<04:00,  1.91s/it][A
Training:   5%|▍         | 6/131 [00:09<02:57,  1.42s/it][A
Training:   5%|▌         | 7/131 [00:10<02:04,  1.00s/it][A
Training:   6%|▌         | 8/131 [00:10<01:28,  1.39it/s][A
Training:   7%|▋         | 9/131 [00:13<03:07,  1.54s/it][A
Training:   8%|▊         | 10/131 [00:14<02:50,  1.41s/it][A
Training:   8%|▊         | 11/131 [00:14<02:01,  1.01s/it][A
Training:   9%|▉         | 12/131 [00:14<01:29,  1.32it/s][A
Training:  10%|▉         | 13/131 [00:17<02:44,  1.40s/it][A
Training:  11%|█         | 14/131 [00:19<02:36,  1.34s/it][A
Training:  11%|█▏        | 15/131 [00:19<01:55,  1.00it/s][A
Training:  12%|█▏        

Epoch: 2/55 - Loss: 7.3800 - Accuracy: 0.9590



  0%|          | 0/17 [00:00<?, ?it/s][A
  6%|▌         | 1/17 [00:04<01:14,  4.65s/it][A
 12%|█▏        | 2/17 [00:05<00:35,  2.35s/it][A
 18%|█▊        | 3/17 [00:05<00:18,  1.36s/it][A
 24%|██▎       | 4/17 [00:05<00:11,  1.16it/s][A
 29%|██▉       | 5/17 [00:08<00:18,  1.53s/it][A
 35%|███▌      | 6/17 [00:09<00:14,  1.34s/it][A
 47%|████▋     | 8/17 [00:09<00:06,  1.39it/s][A
 53%|█████▎    | 9/17 [00:12<00:09,  1.22s/it][A
 59%|█████▉    | 10/17 [00:13<00:08,  1.16s/it][A
 65%|██████▍   | 11/17 [00:13<00:05,  1.13it/s][A
 71%|███████   | 12/17 [00:13<00:03,  1.50it/s][A
 76%|███████▋  | 13/17 [00:16<00:05,  1.26s/it][A
 82%|████████▏ | 14/17 [00:16<00:03,  1.04s/it][A
 94%|█████████▍| 16/17 [00:16<00:00,  1.67it/s][A
100%|██████████| 17/17 [00:17<00:00,  1.03s/it][A
Epochs:   4%|▎         | 2/55 [05:07<2:16:20, 154.34s/it]

Val Loss: 7.5207 - Val Accuracy: 0.9600



Training:   0%|          | 0/131 [00:00<?, ?it/s][A
Training:   1%|          | 1/131 [00:05<12:23,  5.72s/it][A
Training:   2%|▏         | 2/131 [00:05<05:14,  2.44s/it][A
Training:   2%|▏         | 3/131 [00:06<03:05,  1.45s/it][A
Training:   3%|▎         | 4/131 [00:06<01:58,  1.07it/s][A
Training:   4%|▍         | 5/131 [00:09<03:54,  1.86s/it][A
Training:   5%|▍         | 6/131 [00:09<02:40,  1.29s/it][A
Training:   5%|▌         | 7/131 [00:10<02:06,  1.02s/it][A
Training:   6%|▌         | 8/131 [00:10<01:32,  1.33it/s][A
Training:   7%|▋         | 9/131 [00:14<03:20,  1.64s/it][A
Training:   8%|▊         | 10/131 [00:14<02:25,  1.20s/it][A
Training:   8%|▊         | 11/131 [00:14<01:47,  1.12it/s][A
Training:   9%|▉         | 12/131 [00:14<01:24,  1.40it/s][A
Training:  10%|▉         | 13/131 [00:18<03:07,  1.59s/it][A
Training:  11%|█         | 14/131 [00:18<02:15,  1.16s/it][A
Training:  11%|█▏        | 15/131 [00:18<01:37,  1.19it/s][A
Training:  12%|█▏        

Epoch: 3/55 - Loss: 6.6121 - Accuracy: 0.9612



  0%|          | 0/17 [00:00<?, ?it/s][A
  6%|▌         | 1/17 [00:04<01:17,  4.87s/it][A
 24%|██▎       | 4/17 [00:05<00:12,  1.03it/s][A
 29%|██▉       | 5/17 [00:08<00:19,  1.66s/it][A
 35%|███▌      | 6/17 [00:08<00:14,  1.31s/it][A
 41%|████      | 7/17 [00:09<00:09,  1.02it/s][A
 47%|████▋     | 8/17 [00:09<00:06,  1.38it/s][A
 53%|█████▎    | 9/17 [00:12<00:11,  1.44s/it][A
 59%|█████▉    | 10/17 [00:13<00:08,  1.20s/it][A
 71%|███████   | 12/17 [00:13<00:03,  1.43it/s][A
 76%|███████▋  | 13/17 [00:16<00:05,  1.35s/it][A
 82%|████████▏ | 14/17 [00:16<00:03,  1.03s/it][A
 88%|████████▊ | 15/17 [00:16<00:01,  1.28it/s][A
 94%|█████████▍| 16/17 [00:16<00:00,  1.66it/s][A
100%|██████████| 17/17 [00:17<00:00,  1.05s/it][A
Epochs:   5%|▌         | 3/55 [07:38<2:12:31, 152.91s/it]

Val Loss: 7.0540 - Val Accuracy: 0.9640



Training:   0%|          | 0/131 [00:00<?, ?it/s][A
Training:   1%|          | 1/131 [00:05<11:39,  5.38s/it][A
Training:   2%|▏         | 2/131 [00:05<04:55,  2.29s/it][A
Training:   2%|▏         | 3/131 [00:05<02:48,  1.32s/it][A
Training:   3%|▎         | 4/131 [00:05<01:54,  1.11it/s][A
Training:   4%|▍         | 5/131 [00:09<03:55,  1.87s/it][A
Training:   5%|▍         | 6/131 [00:10<03:00,  1.45s/it][A
Training:   5%|▌         | 7/131 [00:10<02:07,  1.03s/it][A
Training:   6%|▌         | 8/131 [00:10<01:36,  1.28it/s][A
Training:   7%|▋         | 9/131 [00:14<03:29,  1.72s/it][A
Training:   8%|▊         | 10/131 [00:14<02:44,  1.36s/it][A
Training:   8%|▊         | 11/131 [00:15<01:59,  1.00it/s][A
Training:  10%|▉         | 13/131 [00:19<02:53,  1.47s/it][A
Training:  11%|█         | 14/131 [00:19<02:28,  1.27s/it][A
Training:  11%|█▏        | 15/131 [00:19<01:53,  1.02it/s][A
Training:  12%|█▏        | 16/131 [00:20<01:27,  1.32it/s][A
Training:  13%|█▎        

Epoch: 4/55 - Loss: 6.2868 - Accuracy: 0.9629



  0%|          | 0/17 [00:00<?, ?it/s][A
  6%|▌         | 1/17 [00:04<01:10,  4.38s/it][A
 12%|█▏        | 2/17 [00:04<00:28,  1.91s/it][A
 24%|██▎       | 4/17 [00:04<00:10,  1.24it/s][A
 29%|██▉       | 5/17 [00:07<00:17,  1.49s/it][A
 41%|████      | 7/17 [00:08<00:08,  1.11it/s][A
 47%|████▋     | 8/17 [00:08<00:06,  1.38it/s][A
 53%|█████▎    | 9/17 [00:11<00:10,  1.32s/it][A
 65%|██████▍   | 11/17 [00:12<00:05,  1.16it/s][A
 71%|███████   | 12/17 [00:12<00:03,  1.40it/s][A
 76%|███████▋  | 13/17 [00:14<00:04,  1.22s/it][A
 82%|████████▏ | 14/17 [00:15<00:02,  1.04it/s][A
 88%|████████▊ | 15/17 [00:15<00:01,  1.36it/s][A
 94%|█████████▍| 16/17 [00:15<00:00,  1.45it/s][A
100%|██████████| 17/17 [00:16<00:00,  1.04it/s][A
Epochs:   7%|▋         | 4/55 [10:14<2:10:58, 154.09s/it]

Val Loss: 6.8935 - Val Accuracy: 0.9658



Training:   0%|          | 0/131 [00:00<?, ?it/s][A
Training:   1%|          | 1/131 [00:05<11:55,  5.50s/it][A
Training:   2%|▏         | 2/131 [00:05<05:02,  2.35s/it][A
Training:   2%|▏         | 3/131 [00:05<02:53,  1.36s/it][A
Training:   3%|▎         | 4/131 [00:05<01:52,  1.13it/s][A
Training:   4%|▍         | 5/131 [00:09<03:56,  1.88s/it][A
Training:   5%|▍         | 6/131 [00:09<02:43,  1.31s/it][A
Training:   5%|▌         | 7/131 [00:09<01:54,  1.08it/s][A
Training:   7%|▋         | 9/131 [00:13<02:50,  1.39s/it][A
Training:   8%|▊         | 10/131 [00:13<02:08,  1.06s/it][A
Training:   8%|▊         | 11/131 [00:14<01:39,  1.21it/s][A
Training:   9%|▉         | 12/131 [00:14<01:16,  1.56it/s][A
Training:  10%|▉         | 13/131 [00:17<03:00,  1.53s/it][A
Training:  11%|█         | 14/131 [00:18<02:11,  1.12s/it][A
Training:  12%|█▏        | 16/131 [00:18<01:16,  1.51it/s][A
Training:  13%|█▎        | 17/131 [00:22<02:52,  1.51s/it][A
Training:  15%|█▍       

Epoch: 5/55 - Loss: 6.1831 - Accuracy: 0.9630



  0%|          | 0/17 [00:00<?, ?it/s][A
  6%|▌         | 1/17 [00:04<01:15,  4.71s/it][A
 12%|█▏        | 2/17 [00:04<00:30,  2.05s/it][A
 18%|█▊        | 3/17 [00:05<00:16,  1.21s/it][A
 24%|██▎       | 4/17 [00:05<00:10,  1.24it/s][A
 29%|██▉       | 5/17 [00:08<00:20,  1.70s/it][A
 41%|████      | 7/17 [00:08<00:08,  1.15it/s][A
 47%|████▋     | 8/17 [00:08<00:06,  1.47it/s][A
 53%|█████▎    | 9/17 [00:12<00:12,  1.59s/it][A
 71%|███████   | 12/17 [00:13<00:03,  1.29it/s][A
 76%|███████▋  | 13/17 [00:16<00:05,  1.28s/it][A
 82%|████████▏ | 14/17 [00:16<00:03,  1.02s/it][A
 94%|█████████▍| 16/17 [00:16<00:00,  1.55it/s][A
100%|██████████| 17/17 [00:17<00:00,  1.03s/it][A
Epochs:   9%|▉         | 5/55 [12:48<2:08:11, 153.82s/it]

Val Loss: 7.8945 - Val Accuracy: 0.9658



Training:   0%|          | 0/131 [00:00<?, ?it/s][A
Training:   1%|          | 1/131 [00:05<11:57,  5.52s/it][A
Training:   2%|▏         | 2/131 [00:06<05:39,  2.63s/it][A
Training:   2%|▏         | 3/131 [00:06<03:11,  1.50s/it][A
Training:   3%|▎         | 4/131 [00:06<02:02,  1.04it/s][A
Training:   4%|▍         | 5/131 [00:09<03:48,  1.82s/it][A
Training:   5%|▍         | 6/131 [00:10<03:06,  1.49s/it][A
Training:   6%|▌         | 8/131 [00:10<01:42,  1.20it/s][A
Training:   7%|▋         | 9/131 [00:14<03:06,  1.53s/it][A
Training:   8%|▊         | 10/131 [00:14<02:32,  1.26s/it][A
Training:   8%|▊         | 11/131 [00:15<01:54,  1.05it/s][A
Training:   9%|▉         | 12/131 [00:15<01:29,  1.33it/s][A
Training:  10%|▉         | 13/131 [00:19<03:06,  1.58s/it][A
Training:  11%|█         | 14/131 [00:19<02:34,  1.32s/it][A
Training:  11%|█▏        | 15/131 [00:19<01:51,  1.04it/s][A
Training:  12%|█▏        | 16/131 [00:20<01:26,  1.33it/s][A
Training:  13%|█▎       

Epoch: 6/55 - Loss: 6.3381 - Accuracy: 0.9657



  0%|          | 0/17 [00:00<?, ?it/s][A
  6%|▌         | 1/17 [00:05<01:20,  5.02s/it][A
 12%|█▏        | 2/17 [00:05<00:32,  2.16s/it][A
 24%|██▎       | 4/17 [00:05<00:11,  1.14it/s][A
 29%|██▉       | 5/17 [00:08<00:20,  1.67s/it][A
 35%|███▌      | 6/17 [00:09<00:13,  1.24s/it][A
 41%|████      | 7/17 [00:09<00:09,  1.11it/s][A
 47%|████▋     | 8/17 [00:09<00:06,  1.47it/s][A
 53%|█████▎    | 9/17 [00:12<00:10,  1.37s/it][A
 59%|█████▉    | 10/17 [00:12<00:06,  1.01it/s][A
 71%|███████   | 12/17 [00:12<00:02,  1.71it/s][A
 76%|███████▋  | 13/17 [00:15<00:04,  1.25s/it][A
 88%|████████▊ | 15/17 [00:16<00:01,  1.32it/s][A
 94%|█████████▍| 16/17 [00:16<00:00,  1.49it/s][A
100%|██████████| 17/17 [00:17<00:00,  1.04s/it][A
Epochs:  11%|█         | 6/55 [15:25<2:06:39, 155.08s/it]

Val Loss: 7.2766 - Val Accuracy: 0.9618



Training:   0%|          | 0/131 [00:00<?, ?it/s][A
Training:   1%|          | 1/131 [00:05<11:36,  5.36s/it][A
Training:   2%|▏         | 2/131 [00:05<05:24,  2.52s/it][A
Training:   2%|▏         | 3/131 [00:06<03:02,  1.43s/it][A
Training:   3%|▎         | 4/131 [00:06<01:58,  1.08it/s][A
Training:   4%|▍         | 5/131 [00:09<03:48,  1.81s/it][A
Training:   5%|▍         | 6/131 [00:10<03:23,  1.63s/it][A
Training:   5%|▌         | 7/131 [00:10<02:20,  1.13s/it][A
Training:   6%|▌         | 8/131 [00:11<01:41,  1.22it/s][A
Training:   7%|▋         | 9/131 [00:13<02:55,  1.44s/it][A
Training:   8%|▊         | 10/131 [00:15<02:54,  1.44s/it][A
Training:   8%|▊         | 11/131 [00:15<02:04,  1.04s/it][A
Training:   9%|▉         | 12/131 [00:15<01:31,  1.30it/s][A
Training:  10%|▉         | 13/131 [00:18<02:48,  1.43s/it][A
Training:  11%|█         | 14/131 [00:19<02:45,  1.42s/it][A
Training:  11%|█▏        | 15/131 [00:20<01:59,  1.03s/it][A
Training:  12%|█▏        

Epoch: 7/55 - Loss: 6.1809 - Accuracy: 0.9667



  0%|          | 0/17 [00:00<?, ?it/s][A
  6%|▌         | 1/17 [00:04<01:17,  4.83s/it][A
 12%|█▏        | 2/17 [00:04<00:30,  2.06s/it][A
 18%|█▊        | 3/17 [00:05<00:16,  1.17s/it][A
 24%|██▎       | 4/17 [00:05<00:10,  1.29it/s][A
 29%|██▉       | 5/17 [00:08<00:19,  1.65s/it][A
 35%|███▌      | 6/17 [00:08<00:12,  1.13s/it][A
 41%|████      | 7/17 [00:08<00:08,  1.25it/s][A
 47%|████▋     | 8/17 [00:08<00:05,  1.63it/s][A
 53%|█████▎    | 9/17 [00:11<00:10,  1.37s/it][A
 59%|█████▉    | 10/17 [00:12<00:06,  1.00it/s][A
 71%|███████   | 12/17 [00:12<00:02,  1.76it/s][A
 76%|███████▋  | 13/17 [00:15<00:05,  1.29s/it][A
 82%|████████▏ | 14/17 [00:15<00:02,  1.02it/s][A
 94%|█████████▍| 16/17 [00:15<00:00,  1.68it/s][A
100%|██████████| 17/17 [00:17<00:00,  1.01s/it][A
Epochs:  13%|█▎        | 7/55 [18:02<2:04:36, 155.76s/it]

Val Loss: 7.0909 - Val Accuracy: 0.9613



Training:   0%|          | 0/131 [00:00<?, ?it/s][A
Training:   1%|          | 1/131 [00:05<12:02,  5.55s/it][A
Training:   2%|▏         | 2/131 [00:05<05:24,  2.51s/it][A
Training:   2%|▏         | 3/131 [00:06<03:09,  1.48s/it][A
Training:   3%|▎         | 4/131 [00:06<02:04,  1.02it/s][A
Training:   4%|▍         | 5/131 [00:09<03:50,  1.83s/it][A
Training:   5%|▍         | 6/131 [00:10<02:44,  1.32s/it][A
Training:   5%|▌         | 7/131 [00:10<01:54,  1.08it/s][A
Training:   6%|▌         | 8/131 [00:10<01:25,  1.43it/s][A
Training:   7%|▋         | 9/131 [00:14<03:18,  1.63s/it][A
Training:   8%|▊         | 10/131 [00:14<02:22,  1.18s/it][A
Training:   8%|▊         | 11/131 [00:14<01:46,  1.13it/s][A
Training:   9%|▉         | 12/131 [00:14<01:18,  1.52it/s][A
Training:  10%|▉         | 13/131 [00:18<03:09,  1.60s/it][A
Training:  11%|█         | 14/131 [00:18<02:17,  1.17s/it][A
Training:  11%|█▏        | 15/131 [00:18<01:40,  1.16it/s][A
Training:  12%|█▏        

Epoch: 8/55 - Loss: 5.9391 - Accuracy: 0.9675



  0%|          | 0/17 [00:00<?, ?it/s][A
  6%|▌         | 1/17 [00:04<01:12,  4.56s/it][A
 12%|█▏        | 2/17 [00:04<00:30,  2.01s/it][A
 18%|█▊        | 3/17 [00:04<00:16,  1.15s/it][A
 24%|██▎       | 4/17 [00:05<00:09,  1.34it/s][A
 29%|██▉       | 5/17 [00:08<00:18,  1.56s/it][A
 41%|████      | 7/17 [00:08<00:08,  1.17it/s][A
 47%|████▋     | 8/17 [00:08<00:05,  1.51it/s][A
 53%|█████▎    | 9/17 [00:11<00:10,  1.35s/it][A
 59%|█████▉    | 10/17 [00:11<00:07,  1.02s/it][A
 65%|██████▍   | 11/17 [00:11<00:04,  1.31it/s][A
 71%|███████   | 12/17 [00:12<00:02,  1.75it/s][A
 76%|███████▋  | 13/17 [00:15<00:05,  1.30s/it][A
 82%|████████▏ | 14/17 [00:15<00:03,  1.08s/it][A
 88%|████████▊ | 15/17 [00:15<00:01,  1.22it/s][A
 94%|█████████▍| 16/17 [00:16<00:00,  1.61it/s][A
100%|██████████| 17/17 [00:16<00:00,  1.04it/s][A
Epochs:  15%|█▍        | 8/55 [20:32<2:00:35, 153.96s/it]

Val Loss: 7.3328 - Val Accuracy: 0.9658



Training:   0%|          | 0/131 [00:00<?, ?it/s][A
Training:   1%|          | 1/131 [00:05<11:04,  5.11s/it][A
Training:   2%|▏         | 2/131 [00:05<04:47,  2.23s/it][A
Training:   2%|▏         | 3/131 [00:05<02:45,  1.29s/it][A
Training:   3%|▎         | 4/131 [00:05<01:49,  1.16it/s][A
Training:   4%|▍         | 5/131 [00:09<03:52,  1.85s/it][A
Training:   5%|▍         | 6/131 [00:09<02:43,  1.31s/it][A
Training:   5%|▌         | 7/131 [00:09<01:56,  1.07it/s][A
Training:   7%|▋         | 9/131 [00:13<02:43,  1.34s/it][A
Training:   8%|▊         | 10/131 [00:13<02:07,  1.05s/it][A
Training:   8%|▊         | 11/131 [00:13<01:47,  1.12it/s][A
Training:   9%|▉         | 12/131 [00:14<01:24,  1.42it/s][A
Training:  10%|▉         | 13/131 [00:17<02:53,  1.47s/it][A
Training:  11%|█         | 14/131 [00:17<02:16,  1.16s/it][A
Training:  11%|█▏        | 15/131 [00:18<01:44,  1.11it/s][A
Training:  12%|█▏        | 16/131 [00:18<01:18,  1.47it/s][A
Training:  13%|█▎       

Epoch: 9/55 - Loss: 6.0479 - Accuracy: 0.9667



  0%|          | 0/17 [00:00<?, ?it/s][A
  6%|▌         | 1/17 [00:04<01:17,  4.82s/it][A
 12%|█▏        | 2/17 [00:04<00:30,  2.05s/it][A
 18%|█▊        | 3/17 [00:05<00:16,  1.16s/it][A
 24%|██▎       | 4/17 [00:05<00:09,  1.32it/s][A
 29%|██▉       | 5/17 [00:08<00:20,  1.68s/it][A
 35%|███▌      | 6/17 [00:08<00:12,  1.15s/it][A
 41%|████      | 7/17 [00:08<00:08,  1.21it/s][A
 47%|████▋     | 8/17 [00:08<00:05,  1.59it/s][A
 53%|█████▎    | 9/17 [00:12<00:11,  1.49s/it][A
 59%|█████▉    | 10/17 [00:12<00:07,  1.09s/it][A
 65%|██████▍   | 11/17 [00:12<00:04,  1.26it/s][A
 71%|███████   | 12/17 [00:12<00:02,  1.69it/s][A
 76%|███████▋  | 13/17 [00:16<00:05,  1.43s/it][A
 82%|████████▏ | 14/17 [00:16<00:03,  1.04s/it][A
 88%|████████▊ | 15/17 [00:16<00:01,  1.28it/s][A
 94%|█████████▍| 16/17 [00:16<00:00,  1.69it/s][A
100%|██████████| 17/17 [00:17<00:00,  1.03s/it][A
Epochs:  16%|█▋        | 9/55 [23:03<1:57:14, 152.93s/it]

Val Loss: 7.0884 - Val Accuracy: 0.9613



Training:   0%|          | 0/131 [00:00<?, ?it/s][A
Training:   1%|          | 1/131 [00:06<13:10,  6.08s/it][A
Training:   2%|▏         | 2/131 [00:06<05:39,  2.64s/it][A
Training:   2%|▏         | 3/131 [00:06<03:11,  1.49s/it][A
Training:   3%|▎         | 4/131 [00:06<02:04,  1.02it/s][A
Training:   4%|▍         | 5/131 [00:11<04:41,  2.23s/it][A
Training:   5%|▍         | 6/131 [00:11<03:13,  1.55s/it][A
Training:   5%|▌         | 7/131 [00:11<02:16,  1.10s/it][A
Training:   7%|▋         | 9/131 [00:15<03:15,  1.60s/it][A
Training:   8%|▊         | 11/131 [00:16<02:05,  1.05s/it][A
Training:   9%|▉         | 12/131 [00:16<01:40,  1.19it/s][A
Training:  10%|▉         | 13/131 [00:19<02:50,  1.44s/it][A
Training:  11%|█         | 14/131 [00:20<02:13,  1.14s/it][A
Training:  11%|█▏        | 15/131 [00:20<02:03,  1.07s/it][A
Training:  12%|█▏        | 16/131 [00:21<01:33,  1.23it/s][A
Training:  13%|█▎        | 17/131 [00:23<02:38,  1.39s/it][A
Training:  14%|█▎       

Epoch: 10/55 - Loss: 5.9342 - Accuracy: 0.9673



  0%|          | 0/17 [00:00<?, ?it/s][A
  6%|▌         | 1/17 [00:04<01:12,  4.55s/it][A
 12%|█▏        | 2/17 [00:04<00:29,  1.96s/it][A
 18%|█▊        | 3/17 [00:05<00:19,  1.40s/it][A
 24%|██▎       | 4/17 [00:05<00:11,  1.11it/s][A
 29%|██▉       | 5/17 [00:08<00:18,  1.54s/it][A
 35%|███▌      | 6/17 [00:08<00:11,  1.06s/it][A
 41%|████      | 7/17 [00:09<00:09,  1.08it/s][A
 53%|█████▎    | 9/17 [00:11<00:08,  1.12s/it][A
 59%|█████▉    | 10/17 [00:11<00:06,  1.16it/s][A
 65%|██████▍   | 11/17 [00:13<00:05,  1.05it/s][A
 71%|███████   | 12/17 [00:13<00:03,  1.37it/s][A
 76%|███████▋  | 13/17 [00:15<00:04,  1.14s/it][A
 82%|████████▏ | 14/17 [00:15<00:02,  1.19it/s][A
 88%|████████▊ | 15/17 [00:16<00:01,  1.08it/s][A
100%|██████████| 17/17 [00:16<00:00,  1.00it/s][A
Epochs:  18%|█▊        | 10/55 [25:34<1:54:21, 152.48s/it]

Val Loss: 7.4264 - Val Accuracy: 0.9624



Training:   0%|          | 0/131 [00:00<?, ?it/s][A
Training:   1%|          | 1/131 [00:05<11:20,  5.23s/it][A
Training:   2%|▏         | 2/131 [00:05<04:58,  2.31s/it][A
Training:   2%|▏         | 3/131 [00:05<02:54,  1.36s/it][A
Training:   3%|▎         | 4/131 [00:05<01:50,  1.15it/s][A
Training:   4%|▍         | 5/131 [00:09<03:53,  1.85s/it][A
Training:   5%|▍         | 6/131 [00:09<02:39,  1.28s/it][A
Training:   5%|▌         | 7/131 [00:09<01:53,  1.09it/s][A
Training:   6%|▌         | 8/131 [00:09<01:21,  1.50it/s][A
Training:   7%|▋         | 9/131 [00:13<03:18,  1.62s/it][A
Training:   8%|▊         | 10/131 [00:13<02:21,  1.17s/it][A
Training:   8%|▊         | 11/131 [00:14<01:48,  1.10it/s][A
Training:   9%|▉         | 12/131 [00:14<01:18,  1.51it/s][A
Training:  10%|▉         | 13/131 [00:17<03:07,  1.59s/it][A
Training:  11%|█         | 14/131 [00:18<02:15,  1.16s/it][A
Training:  11%|█▏        | 15/131 [00:18<01:41,  1.14it/s][A
Training:  12%|█▏        

Epoch: 11/55 - Loss: 6.1992 - Accuracy: 0.9680



  0%|          | 0/17 [00:00<?, ?it/s][A
  6%|▌         | 1/17 [00:04<01:13,  4.62s/it][A
 12%|█▏        | 2/17 [00:04<00:30,  2.01s/it][A
 18%|█▊        | 3/17 [00:04<00:16,  1.15s/it][A
 24%|██▎       | 4/17 [00:05<00:10,  1.21it/s][A
 29%|██▉       | 5/17 [00:08<00:20,  1.68s/it][A
 35%|███▌      | 6/17 [00:08<00:12,  1.18s/it][A
 53%|█████▎    | 9/17 [00:12<00:09,  1.17s/it][A
 59%|█████▉    | 10/17 [00:12<00:06,  1.06it/s][A
 65%|██████▍   | 11/17 [00:12<00:04,  1.31it/s][A
 71%|███████   | 12/17 [00:12<00:03,  1.66it/s][A
 76%|███████▋  | 13/17 [00:15<00:05,  1.30s/it][A
 82%|████████▏ | 14/17 [00:16<00:02,  1.02it/s][A
 88%|████████▊ | 15/17 [00:16<00:01,  1.36it/s][A
100%|██████████| 17/17 [00:16<00:00,  1.00it/s][A
Epochs:  20%|██        | 11/55 [28:02<1:50:39, 150.90s/it]

Val Loss: 7.5599 - Val Accuracy: 0.9652



Training:   0%|          | 0/131 [00:00<?, ?it/s][A
Training:   1%|          | 1/131 [00:04<10:38,  4.91s/it][A
Training:   2%|▏         | 2/131 [00:05<04:36,  2.14s/it][A
Training:   2%|▏         | 3/131 [00:05<02:39,  1.24s/it][A
Training:   4%|▍         | 5/131 [00:09<03:26,  1.64s/it][A
Training:   5%|▍         | 6/131 [00:09<02:33,  1.23s/it][A
Training:   5%|▌         | 7/131 [00:09<01:55,  1.07it/s][A
Training:   6%|▌         | 8/131 [00:09<01:28,  1.39it/s][A
Training:   7%|▋         | 9/131 [00:13<03:02,  1.50s/it][A
Training:   8%|▊         | 10/131 [00:13<02:12,  1.09s/it][A
Training:   8%|▊         | 11/131 [00:13<01:38,  1.21it/s][A
Training:   9%|▉         | 12/131 [00:13<01:13,  1.63it/s][A
Training:  10%|▉         | 13/131 [00:17<02:55,  1.48s/it][A
Training:  11%|█▏        | 15/131 [00:17<01:37,  1.19it/s][A
Training:  12%|█▏        | 16/131 [00:17<01:22,  1.40it/s][A
Training:  13%|█▎        | 17/131 [00:21<02:48,  1.48s/it][A
Training:  14%|█▎       

Epoch: 12/55 - Loss: 6.2716 - Accuracy: 0.9681



  0%|          | 0/17 [00:00<?, ?it/s][A
  6%|▌         | 1/17 [00:04<01:19,  4.94s/it][A
 12%|█▏        | 2/17 [00:05<00:32,  2.15s/it][A
 18%|█▊        | 3/17 [00:05<00:17,  1.28s/it][A
 24%|██▎       | 4/17 [00:05<00:10,  1.19it/s][A
 29%|██▉       | 5/17 [00:08<00:17,  1.49s/it][A
 35%|███▌      | 6/17 [00:08<00:11,  1.04s/it][A
 41%|████      | 7/17 [00:08<00:07,  1.32it/s][A
 53%|█████▎    | 9/17 [00:11<00:09,  1.22s/it][A
 59%|█████▉    | 10/17 [00:12<00:06,  1.07it/s][A
 65%|██████▍   | 11/17 [00:12<00:04,  1.39it/s][A
 76%|███████▋  | 13/17 [00:15<00:04,  1.11s/it][A
 82%|████████▏ | 14/17 [00:15<00:02,  1.15it/s][A
 88%|████████▊ | 15/17 [00:15<00:01,  1.46it/s][A
100%|██████████| 17/17 [00:16<00:00,  1.01it/s][A
Epochs:  22%|██▏       | 12/55 [30:29<1:47:21, 149.80s/it]

Val Loss: 6.3751 - Val Accuracy: 0.9630



Training:   0%|          | 0/131 [00:00<?, ?it/s][A
Training:   1%|          | 1/131 [00:04<09:46,  4.51s/it][A
Training:   2%|▏         | 2/131 [00:05<04:45,  2.21s/it][A
Training:   2%|▏         | 3/131 [00:05<02:44,  1.28s/it][A
Training:   4%|▍         | 5/131 [00:08<03:10,  1.52s/it][A
Training:   5%|▍         | 6/131 [00:09<02:43,  1.31s/it][A
Training:   5%|▌         | 7/131 [00:09<02:00,  1.03it/s][A
Training:   6%|▌         | 8/131 [00:09<01:29,  1.38it/s][A
Training:   7%|▋         | 9/131 [00:12<02:50,  1.40s/it][A
Training:   8%|▊         | 10/131 [00:13<02:29,  1.24s/it][A
Training:   8%|▊         | 11/131 [00:13<01:52,  1.07it/s][A
Training:   9%|▉         | 12/131 [00:14<01:23,  1.42it/s][A
Training:  10%|▉         | 13/131 [00:16<02:38,  1.34s/it][A
Training:  11%|█         | 14/131 [00:17<02:26,  1.25s/it][A
Training:  11%|█▏        | 15/131 [00:18<01:48,  1.07it/s][A
Training:  12%|█▏        | 16/131 [00:18<01:21,  1.41it/s][A
Training:  13%|█▎       

Epoch: 13/55 - Loss: 6.2711 - Accuracy: 0.9684



  0%|          | 0/17 [00:00<?, ?it/s][A
  6%|▌         | 1/17 [00:04<01:17,  4.83s/it][A
 12%|█▏        | 2/17 [00:04<00:31,  2.07s/it][A
 18%|█▊        | 3/17 [00:05<00:16,  1.19s/it][A
 24%|██▎       | 4/17 [00:05<00:10,  1.24it/s][A
 29%|██▉       | 5/17 [00:08<00:20,  1.68s/it][A
 35%|███▌      | 6/17 [00:08<00:12,  1.17s/it][A
 53%|█████▎    | 9/17 [00:12<00:09,  1.13s/it][A
 59%|█████▉    | 10/17 [00:12<00:06,  1.08it/s][A
 65%|██████▍   | 11/17 [00:12<00:04,  1.35it/s][A
 71%|███████   | 12/17 [00:12<00:02,  1.69it/s][A
 76%|███████▋  | 13/17 [00:15<00:04,  1.19s/it][A
 88%|████████▊ | 15/17 [00:15<00:01,  1.42it/s][A
100%|██████████| 17/17 [00:16<00:00,  1.02it/s][A
Epochs:  24%|██▎       | 13/55 [32:56<1:44:20, 149.06s/it]

Val Loss: 8.5767 - Val Accuracy: 0.9618



Training:   0%|          | 0/131 [00:00<?, ?it/s][A
Training:   1%|          | 1/131 [00:04<10:28,  4.83s/it][A
Training:   2%|▏         | 2/131 [00:05<04:28,  2.08s/it][A
Training:   2%|▏         | 3/131 [00:05<02:51,  1.34s/it][A
Training:   3%|▎         | 4/131 [00:05<01:50,  1.15it/s][A
Training:   4%|▍         | 5/131 [00:08<03:34,  1.71s/it][A
Training:   5%|▍         | 6/131 [00:09<02:35,  1.24s/it][A
Training:   5%|▌         | 7/131 [00:09<01:54,  1.08it/s][A
Training:   6%|▌         | 8/131 [00:09<01:25,  1.44it/s][A
Training:   7%|▋         | 9/131 [00:12<03:03,  1.50s/it][A
Training:   8%|▊         | 10/131 [00:13<02:13,  1.10s/it][A
Training:   8%|▊         | 11/131 [00:13<01:55,  1.04it/s][A
Training:   9%|▉         | 12/131 [00:13<01:26,  1.38it/s][A
Training:  10%|▉         | 13/131 [00:17<02:51,  1.45s/it][A
Training:  11%|█         | 14/131 [00:17<02:03,  1.06s/it][A
Training:  11%|█▏        | 15/131 [00:17<01:51,  1.04it/s][A
Training:  12%|█▏        

Epoch: 14/55 - Loss: 6.1686 - Accuracy: 0.9668



  0%|          | 0/17 [00:00<?, ?it/s][A
  6%|▌         | 1/17 [00:04<01:16,  4.78s/it][A
 12%|█▏        | 2/17 [00:04<00:31,  2.08s/it][A
 18%|█▊        | 3/17 [00:05<00:16,  1.21s/it][A
 24%|██▎       | 4/17 [00:05<00:10,  1.29it/s][A
 29%|██▉       | 5/17 [00:08<00:20,  1.67s/it][A
 41%|████      | 7/17 [00:08<00:08,  1.17it/s][A
 47%|████▋     | 8/17 [00:08<00:05,  1.51it/s][A
 53%|█████▎    | 9/17 [00:11<00:10,  1.33s/it][A
 59%|█████▉    | 10/17 [00:12<00:07,  1.01s/it][A
 65%|██████▍   | 11/17 [00:12<00:04,  1.29it/s][A
 71%|███████   | 12/17 [00:12<00:03,  1.66it/s][A
 76%|███████▋  | 13/17 [00:15<00:05,  1.33s/it][A
 88%|████████▊ | 15/17 [00:15<00:01,  1.29it/s][A
 94%|█████████▍| 16/17 [00:15<00:00,  1.64it/s][A
100%|██████████| 17/17 [00:16<00:00,  1.03it/s][A
Epochs:  25%|██▌       | 14/55 [35:24<1:41:34, 148.65s/it]

Val Loss: 7.8083 - Val Accuracy: 0.9669



Training:   0%|          | 0/131 [00:00<?, ?it/s][A
Training:   1%|          | 1/131 [00:04<10:13,  4.72s/it][A
Training:   2%|▏         | 2/131 [00:05<04:56,  2.30s/it][A
Training:   2%|▏         | 3/131 [00:05<02:46,  1.30s/it][A
Training:   3%|▎         | 4/131 [00:05<01:47,  1.18it/s][A
Training:   4%|▍         | 5/131 [00:09<03:51,  1.83s/it][A
Training:   5%|▍         | 6/131 [00:09<02:50,  1.36s/it][A
Training:   5%|▌         | 7/131 [00:09<01:59,  1.03it/s][A
Training:   6%|▌         | 8/131 [00:09<01:25,  1.44it/s][A
Training:   7%|▋         | 9/131 [00:13<03:12,  1.58s/it][A
Training:   8%|▊         | 10/131 [00:13<02:28,  1.22s/it][A
Training:   8%|▊         | 11/131 [00:13<01:45,  1.14it/s][A
Training:   9%|▉         | 12/131 [00:14<01:16,  1.55it/s][A
Training:  10%|▉         | 13/131 [00:17<02:56,  1.50s/it][A
Training:  11%|█         | 14/131 [00:17<02:17,  1.18s/it][A
Training:  11%|█▏        | 15/131 [00:18<01:41,  1.15it/s][A
Training:  13%|█▎        

Epoch: 15/55 - Loss: 6.1602 - Accuracy: 0.9688



  0%|          | 0/17 [00:00<?, ?it/s][A
  6%|▌         | 1/17 [00:04<01:16,  4.78s/it][A
 12%|█▏        | 2/17 [00:05<00:31,  2.10s/it][A
 18%|█▊        | 3/17 [00:05<00:16,  1.21s/it][A
 29%|██▉       | 5/17 [00:08<00:17,  1.46s/it][A
 41%|████      | 7/17 [00:08<00:08,  1.19it/s][A
 47%|████▋     | 8/17 [00:08<00:06,  1.48it/s][A
 53%|█████▎    | 9/17 [00:11<00:10,  1.31s/it][A
 59%|█████▉    | 10/17 [00:12<00:06,  1.00it/s][A
 65%|██████▍   | 11/17 [00:12<00:04,  1.30it/s][A
 71%|███████   | 12/17 [00:12<00:03,  1.66it/s][A
 76%|███████▋  | 13/17 [00:15<00:05,  1.31s/it][A
 82%|████████▏ | 14/17 [00:15<00:02,  1.03it/s][A
 94%|█████████▍| 16/17 [00:15<00:00,  1.73it/s][A
100%|██████████| 17/17 [00:16<00:00,  1.02it/s][A
Epochs:  27%|██▋       | 15/55 [37:50<1:38:38, 147.96s/it]

Val Loss: 9.2498 - Val Accuracy: 0.9707



Training:   0%|          | 0/131 [00:00<?, ?it/s][A
Training:   1%|          | 1/131 [00:05<11:05,  5.12s/it][A
Training:   2%|▏         | 2/131 [00:05<04:46,  2.22s/it][A
Training:   2%|▏         | 3/131 [00:05<02:41,  1.26s/it][A
Training:   3%|▎         | 4/131 [00:05<01:45,  1.20it/s][A
Training:   4%|▍         | 5/131 [00:09<03:45,  1.79s/it][A
Training:   5%|▌         | 7/131 [00:09<01:54,  1.08it/s][A
Training:   7%|▋         | 9/131 [00:13<02:47,  1.37s/it][A
Training:   8%|▊         | 10/131 [00:13<02:14,  1.11s/it][A
Training:   8%|▊         | 11/131 [00:13<01:43,  1.15it/s][A
Training:   9%|▉         | 12/131 [00:13<01:20,  1.49it/s][A
Training:  10%|▉         | 13/131 [00:17<02:55,  1.49s/it][A
Training:  11%|█         | 14/131 [00:17<02:08,  1.10s/it][A
Training:  11%|█▏        | 15/131 [00:17<01:35,  1.22it/s][A
Training:  13%|█▎        | 17/131 [00:21<02:27,  1.29s/it][A
Training:  14%|█▎        | 18/131 [00:21<01:55,  1.02s/it][A
Training:  15%|█▍      

Epoch: 16/55 - Loss: 6.4181 - Accuracy: 0.9671



  0%|          | 0/17 [00:00<?, ?it/s][A
  6%|▌         | 1/17 [00:04<01:13,  4.58s/it][A
 12%|█▏        | 2/17 [00:04<00:31,  2.07s/it][A
 18%|█▊        | 3/17 [00:05<00:17,  1.24s/it][A
 24%|██▎       | 4/17 [00:05<00:10,  1.21it/s][A
 29%|██▉       | 5/17 [00:08<00:18,  1.58s/it][A
 35%|███▌      | 6/17 [00:08<00:12,  1.15s/it][A
 41%|████      | 7/17 [00:08<00:08,  1.19it/s][A
 47%|████▋     | 8/17 [00:08<00:05,  1.60it/s][A
 53%|█████▎    | 9/17 [00:11<00:10,  1.32s/it][A
 59%|█████▉    | 10/17 [00:12<00:07,  1.00s/it][A
 65%|██████▍   | 11/17 [00:12<00:04,  1.22it/s][A
 76%|███████▋  | 13/17 [00:15<00:04,  1.09s/it][A
 82%|████████▏ | 14/17 [00:15<00:02,  1.02it/s][A
 88%|████████▊ | 15/17 [00:16<00:01,  1.31it/s][A
100%|██████████| 17/17 [00:16<00:00,  1.03it/s][A
Epochs:  29%|██▉       | 16/55 [40:17<1:35:57, 147.62s/it]

Val Loss: 8.1856 - Val Accuracy: 0.9618



Training:   0%|          | 0/131 [00:00<?, ?it/s][A
Training:   1%|          | 1/131 [00:04<10:34,  4.88s/it][A
Training:   2%|▏         | 2/131 [00:05<04:45,  2.21s/it][A
Training:   3%|▎         | 4/131 [00:05<01:51,  1.14it/s][A
Training:   4%|▍         | 5/131 [00:08<03:29,  1.66s/it][A
Training:   5%|▍         | 6/131 [00:09<02:46,  1.33s/it][A
Training:   6%|▌         | 8/131 [00:09<01:33,  1.31it/s][A
Training:   7%|▋         | 9/131 [00:13<02:55,  1.44s/it][A
Training:   8%|▊         | 10/131 [00:13<02:14,  1.11s/it][A
Training:   8%|▊         | 11/131 [00:13<01:41,  1.18it/s][A
Training:   9%|▉         | 12/131 [00:14<01:37,  1.22it/s][A
Training:  10%|▉         | 13/131 [00:17<02:44,  1.39s/it][A
Training:  11%|█         | 14/131 [00:17<02:05,  1.07s/it][A
Training:  11%|█▏        | 15/131 [00:17<01:32,  1.25it/s][A
Training:  12%|█▏        | 16/131 [00:18<01:44,  1.11it/s][A
Training:  13%|█▎        | 17/131 [00:20<02:27,  1.29s/it][A
Training:  14%|█▎      

Epoch: 17/55 - Loss: 6.4000 - Accuracy: 0.9690



  0%|          | 0/17 [00:00<?, ?it/s][A
  6%|▌         | 1/17 [00:03<00:48,  3.04s/it][A
 12%|█▏        | 2/17 [00:03<00:19,  1.33s/it][A
 24%|██▎       | 4/17 [00:03<00:07,  1.79it/s][A
 29%|██▉       | 5/17 [00:05<00:12,  1.05s/it][A
 35%|███▌      | 6/17 [00:05<00:08,  1.26it/s][A
 41%|████      | 7/17 [00:05<00:05,  1.71it/s][A
 53%|█████▎    | 9/17 [00:08<00:06,  1.19it/s][A
 59%|█████▉    | 10/17 [00:08<00:04,  1.50it/s][A
 65%|██████▍   | 11/17 [00:08<00:03,  1.74it/s][A
 76%|███████▋  | 13/17 [00:10<00:03,  1.27it/s][A
 82%|████████▏ | 14/17 [00:10<00:01,  1.53it/s][A
 88%|████████▊ | 15/17 [00:11<00:01,  1.88it/s][A
100%|██████████| 17/17 [00:11<00:00,  1.47it/s][A
Epochs:  31%|███       | 17/55 [42:09<1:26:37, 136.78s/it]

Val Loss: 7.7698 - Val Accuracy: 0.9634



Training:   0%|          | 0/131 [00:00<?, ?it/s][A
Training:   1%|          | 1/131 [00:03<07:45,  3.58s/it][A
Training:   2%|▏         | 3/131 [00:03<02:05,  1.02it/s][A
Training:   4%|▍         | 5/131 [00:06<02:24,  1.14s/it][A
Training:   5%|▍         | 6/131 [00:06<01:49,  1.14it/s][A
Training:   6%|▌         | 8/131 [00:06<01:04,  1.90it/s][A
Training:   7%|▋         | 9/131 [00:08<01:57,  1.04it/s][A
Training:   8%|▊         | 10/131 [00:09<01:38,  1.23it/s][A
Training:   8%|▊         | 11/131 [00:09<01:15,  1.59it/s][A
Training:  10%|▉         | 13/131 [00:11<01:39,  1.19it/s][A
Training:  11%|█         | 14/131 [00:12<01:34,  1.23it/s][A
Training:  12%|█▏        | 16/131 [00:12<00:58,  1.98it/s][A
Training:  13%|█▎        | 17/131 [00:14<01:40,  1.14it/s][A
Training:  14%|█▎        | 18/131 [00:15<01:31,  1.23it/s][A
Training:  16%|█▌        | 21/131 [00:17<01:22,  1.33it/s][A
Training:  17%|█▋        | 22/131 [00:18<01:19,  1.38it/s][A
Training:  18%|█▊     

Epoch: 18/55 - Loss: 6.5629 - Accuracy: 0.9690



  0%|          | 0/17 [00:00<?, ?it/s][A
  6%|▌         | 1/17 [00:03<00:49,  3.11s/it][A
 12%|█▏        | 2/17 [00:03<00:20,  1.35s/it][A
 24%|██▎       | 4/17 [00:03<00:07,  1.81it/s][A
 29%|██▉       | 5/17 [00:05<00:13,  1.09s/it][A
 41%|████      | 7/17 [00:05<00:06,  1.65it/s][A
 53%|█████▎    | 9/17 [00:08<00:06,  1.20it/s][A
 59%|█████▉    | 10/17 [00:08<00:04,  1.48it/s][A
 71%|███████   | 12/17 [00:08<00:02,  2.31it/s][A
 82%|████████▏ | 14/17 [00:10<00:02,  1.39it/s][A
100%|██████████| 17/17 [00:11<00:00,  1.47it/s][A
Epochs:  33%|███▎      | 18/55 [43:52<1:18:09, 126.74s/it]

Val Loss: 9.1242 - Val Accuracy: 0.9596



Training:   0%|          | 0/131 [00:00<?, ?it/s][A
Training:   1%|          | 1/131 [00:03<07:12,  3.33s/it][A
Training:   2%|▏         | 3/131 [00:03<02:01,  1.06it/s][A
Training:   4%|▍         | 5/131 [00:06<02:27,  1.17s/it][A
Training:   5%|▍         | 6/131 [00:06<01:51,  1.12it/s][A
Training:   5%|▌         | 7/131 [00:06<01:24,  1.48it/s][A
Training:   6%|▌         | 8/131 [00:06<01:05,  1.89it/s][A
Training:   7%|▋         | 9/131 [00:09<02:15,  1.11s/it][A
Training:   8%|▊         | 11/131 [00:09<01:16,  1.57it/s][A
Training:   9%|▉         | 12/131 [00:09<01:00,  1.96it/s][A
Training:  10%|▉         | 13/131 [00:11<01:57,  1.00it/s][A
Training:  11%|█         | 14/131 [00:12<01:29,  1.30it/s][A
Training:  11%|█▏        | 15/131 [00:12<01:08,  1.69it/s][A
Training:  12%|█▏        | 16/131 [00:12<00:52,  2.18it/s][A
Training:  13%|█▎        | 17/131 [00:14<01:51,  1.03it/s][A
Training:  14%|█▎        | 18/131 [00:14<01:29,  1.26it/s][A
Training:  15%|█▍      

Epoch: 19/55 - Loss: 7.0547 - Accuracy: 0.9674



  0%|          | 0/17 [00:00<?, ?it/s][A
  6%|▌         | 1/17 [00:02<00:47,  2.94s/it][A
 12%|█▏        | 2/17 [00:03<00:19,  1.29s/it][A
 24%|██▎       | 4/17 [00:03<00:07,  1.84it/s][A
 29%|██▉       | 5/17 [00:05<00:13,  1.09s/it][A
 35%|███▌      | 6/17 [00:05<00:09,  1.19it/s][A
 47%|████▋     | 8/17 [00:06<00:04,  2.05it/s][A
 53%|█████▎    | 9/17 [00:08<00:06,  1.14it/s][A
 59%|█████▉    | 10/17 [00:08<00:05,  1.32it/s][A
 71%|███████   | 12/17 [00:08<00:02,  2.08it/s][A
 76%|███████▋  | 13/17 [00:10<00:03,  1.17it/s][A
 82%|████████▏ | 14/17 [00:11<00:02,  1.44it/s][A
 94%|█████████▍| 16/17 [00:11<00:00,  2.32it/s][A
100%|██████████| 17/17 [00:11<00:00,  1.47it/s][A
Epochs:  35%|███▍      | 19/55 [45:34<1:11:33, 119.25s/it]

Val Loss: 7.9818 - Val Accuracy: 0.9618



Training:   0%|          | 0/131 [00:00<?, ?it/s][A
Training:   1%|          | 1/131 [00:03<07:32,  3.48s/it][A
Training:   2%|▏         | 2/131 [00:03<03:12,  1.50s/it][A
Training:   4%|▍         | 5/131 [00:06<02:14,  1.07s/it][A
Training:   5%|▌         | 7/131 [00:06<01:23,  1.49it/s][A
Training:   7%|▋         | 9/131 [00:09<01:52,  1.09it/s][A
Training:   8%|▊         | 11/131 [00:09<01:18,  1.53it/s][A
Training:  10%|▉         | 13/131 [00:12<01:43,  1.14it/s][A
Training:  11%|█▏        | 15/131 [00:12<01:16,  1.51it/s][A
Training:  12%|█▏        | 16/131 [00:12<01:04,  1.78it/s][A
Training:  13%|█▎        | 17/131 [00:15<01:50,  1.03it/s][A
Training:  15%|█▍        | 19/131 [00:15<01:14,  1.51it/s][A
Training:  15%|█▌        | 20/131 [00:15<01:00,  1.82it/s][A
Training:  16%|█▌        | 21/131 [00:18<01:48,  1.01it/s][A
Training:  18%|█▊        | 23/131 [00:18<01:08,  1.59it/s][A
Training:  19%|█▉        | 25/131 [00:20<01:31,  1.16it/s][A
Training:  21%|██    

Epoch: 20/55 - Loss: 6.4267 - Accuracy: 0.9684



  0%|          | 0/17 [00:00<?, ?it/s][A
  6%|▌         | 1/17 [00:03<00:50,  3.17s/it][A
 12%|█▏        | 2/17 [00:03<00:20,  1.37s/it][A
 24%|██▎       | 4/17 [00:03<00:07,  1.72it/s][A
 29%|██▉       | 5/17 [00:05<00:13,  1.10s/it][A
 35%|███▌      | 6/17 [00:05<00:08,  1.26it/s][A
 41%|████      | 7/17 [00:05<00:05,  1.71it/s][A
 53%|█████▎    | 9/17 [00:08<00:07,  1.12it/s][A
 59%|█████▉    | 10/17 [00:08<00:04,  1.44it/s][A
 65%|██████▍   | 11/17 [00:08<00:03,  1.84it/s][A
 71%|███████   | 12/17 [00:08<00:02,  2.33it/s][A
 76%|███████▋  | 13/17 [00:10<00:03,  1.12it/s][A
 94%|█████████▍| 16/17 [00:11<00:00,  2.23it/s][A
100%|██████████| 17/17 [00:11<00:00,  1.45it/s][A
Epochs:  36%|███▋      | 20/55 [47:16<1:06:29, 113.98s/it]

Val Loss: 8.1979 - Val Accuracy: 0.9658



Training:   0%|          | 0/131 [00:00<?, ?it/s][A
Training:   1%|          | 1/131 [00:03<07:30,  3.46s/it][A
Training:   2%|▏         | 3/131 [00:03<02:01,  1.05it/s][A
Training:   3%|▎         | 4/131 [00:03<01:23,  1.52it/s][A
Training:   4%|▍         | 5/131 [00:06<02:40,  1.28s/it][A
Training:   5%|▌         | 7/131 [00:06<01:24,  1.47it/s][A
Training:   7%|▋         | 9/131 [00:09<01:56,  1.04it/s][A
Training:   8%|▊         | 11/131 [00:09<01:16,  1.58it/s][A
Training:  10%|▉         | 13/131 [00:11<01:42,  1.15it/s][A
Training:  11%|█▏        | 15/131 [00:11<01:09,  1.66it/s][A
Training:  13%|█▎        | 17/131 [00:15<01:44,  1.09it/s][A
Training:  15%|█▌        | 20/131 [00:15<01:01,  1.79it/s][A
Training:  17%|█▋        | 22/131 [00:17<01:23,  1.30it/s][A
Training:  18%|█▊        | 24/131 [00:18<01:01,  1.74it/s][A
Training:  20%|█▉        | 26/131 [00:20<01:21,  1.29it/s][A
Training:  22%|██▏       | 29/131 [00:23<01:20,  1.27it/s][A
Training:  24%|██▎    

Epoch: 21/55 - Loss: 6.3127 - Accuracy: 0.9697



  0%|          | 0/17 [00:00<?, ?it/s][A
  6%|▌         | 1/17 [00:03<00:49,  3.10s/it][A
 18%|█▊        | 3/17 [00:03<00:12,  1.16it/s][A
 24%|██▎       | 4/17 [00:03<00:07,  1.67it/s][A
 29%|██▉       | 5/17 [00:05<00:14,  1.18s/it][A
 41%|████      | 7/17 [00:05<00:06,  1.56it/s][A
 47%|████▋     | 8/17 [00:06<00:04,  1.95it/s][A
 53%|█████▎    | 9/17 [00:08<00:07,  1.05it/s][A
 59%|█████▉    | 10/17 [00:08<00:05,  1.37it/s][A
 71%|███████   | 12/17 [00:08<00:02,  2.23it/s][A
 76%|███████▋  | 13/17 [00:10<00:03,  1.23it/s][A
 82%|████████▏ | 14/17 [00:10<00:01,  1.57it/s][A
 88%|████████▊ | 15/17 [00:10<00:01,  1.94it/s][A
 94%|█████████▍| 16/17 [00:10<00:00,  2.33it/s][A
100%|██████████| 17/17 [00:11<00:00,  1.50it/s][A
Epochs:  38%|███▊      | 21/55 [48:57<1:02:26, 110.20s/it]

Val Loss: 8.9113 - Val Accuracy: 0.9608



Training:   0%|          | 0/131 [00:00<?, ?it/s][A
Training:   1%|          | 1/131 [00:03<07:34,  3.50s/it][A
Training:   3%|▎         | 4/131 [00:03<01:28,  1.44it/s][A
Training:   5%|▍         | 6/131 [00:06<02:05,  1.01s/it][A
Training:   6%|▌         | 8/131 [00:06<01:18,  1.56it/s][A
Training:   8%|▊         | 10/131 [00:09<01:50,  1.09it/s][A
Training:  10%|▉         | 13/131 [00:12<01:51,  1.06it/s][A
Training:  12%|█▏        | 16/131 [00:12<01:09,  1.66it/s][A
Training:  14%|█▎        | 18/131 [00:15<01:32,  1.22it/s][A
Training:  15%|█▌        | 20/131 [00:15<01:07,  1.64it/s][A
Training:  17%|█▋        | 22/131 [00:18<01:28,  1.23it/s][A
Training:  18%|█▊        | 24/131 [00:18<01:03,  1.69it/s][A
Training:  20%|█▉        | 26/131 [00:20<01:21,  1.28it/s][A
Training:  21%|██▏       | 28/131 [00:20<00:58,  1.77it/s][A
Training:  23%|██▎       | 30/131 [00:23<01:17,  1.30it/s][A
Training:  25%|██▌       | 33/131 [00:25<01:17,  1.27it/s][A
Training:  27%|██▋  

Epoch: 22/55 - Loss: 6.5156 - Accuracy: 0.9687



  0%|          | 0/17 [00:00<?, ?it/s][A
  6%|▌         | 1/17 [00:03<00:52,  3.25s/it][A
 12%|█▏        | 2/17 [00:03<00:21,  1.42s/it][A
 18%|█▊        | 3/17 [00:03<00:11,  1.22it/s][A
 29%|██▉       | 5/17 [00:05<00:11,  1.03it/s][A
 35%|███▌      | 6/17 [00:05<00:08,  1.37it/s][A
 47%|████▋     | 8/17 [00:05<00:03,  2.36it/s][A
 53%|█████▎    | 9/17 [00:08<00:07,  1.11it/s][A
 65%|██████▍   | 11/17 [00:08<00:03,  1.75it/s][A
 71%|███████   | 12/17 [00:08<00:02,  2.13it/s][A
 76%|███████▋  | 13/17 [00:10<00:03,  1.11it/s][A
100%|██████████| 17/17 [00:11<00:00,  1.46it/s][A
Epochs:  40%|████      | 22/55 [50:39<59:09, 107.56s/it]  

Val Loss: 8.2416 - Val Accuracy: 0.9602



Training:   0%|          | 0/131 [00:00<?, ?it/s][A
Training:   1%|          | 1/131 [00:03<07:06,  3.28s/it][A
Training:   2%|▏         | 2/131 [00:03<03:04,  1.43s/it][A
Training:   2%|▏         | 3/131 [00:03<01:52,  1.13it/s][A
Training:   4%|▍         | 5/131 [00:06<02:12,  1.05s/it][A
Training:   5%|▍         | 6/131 [00:06<01:37,  1.28it/s][A
Training:   5%|▌         | 7/131 [00:06<01:20,  1.53it/s][A
Training:   7%|▋         | 9/131 [00:08<01:48,  1.12it/s][A
Training:   8%|▊         | 10/131 [00:08<01:25,  1.41it/s][A
Training:   8%|▊         | 11/131 [00:09<01:14,  1.61it/s][A
Training:   9%|▉         | 12/131 [00:09<00:58,  2.02it/s][A
Training:  10%|▉         | 13/131 [00:11<01:50,  1.06it/s][A
Training:  11%|█         | 14/131 [00:12<01:36,  1.21it/s][A
Training:  11%|█▏        | 15/131 [00:12<01:12,  1.61it/s][A
Training:  12%|█▏        | 16/131 [00:12<00:57,  2.02it/s][A
Training:  13%|█▎        | 17/131 [00:14<01:50,  1.03it/s][A
Training:  14%|█▎      

Epoch: 23/55 - Loss: 6.5895 - Accuracy: 0.9697



  0%|          | 0/17 [00:00<?, ?it/s][A
  6%|▌         | 1/17 [00:03<00:48,  3.03s/it][A
 24%|██▎       | 4/17 [00:03<00:07,  1.66it/s][A
 35%|███▌      | 6/17 [00:05<00:09,  1.13it/s][A
 47%|████▋     | 8/17 [00:05<00:05,  1.74it/s][A
 59%|█████▉    | 10/17 [00:08<00:05,  1.25it/s][A
 65%|██████▍   | 11/17 [00:08<00:03,  1.51it/s][A
 76%|███████▋  | 13/17 [00:10<00:03,  1.28it/s][A
 82%|████████▏ | 14/17 [00:10<00:02,  1.38it/s][A
100%|██████████| 17/17 [00:11<00:00,  1.51it/s][A
Epochs:  42%|████▏     | 23/55 [52:20<56:26, 105.82s/it]

Val Loss: 8.5793 - Val Accuracy: 0.9667



Training:   0%|          | 0/131 [00:00<?, ?it/s][A
Training:   1%|          | 1/131 [00:03<07:13,  3.34s/it][A
Training:   2%|▏         | 2/131 [00:03<03:10,  1.48s/it][A
Training:   3%|▎         | 4/131 [00:03<01:15,  1.67it/s][A
Training:   4%|▍         | 5/131 [00:06<02:31,  1.20s/it][A
Training:   6%|▌         | 8/131 [00:06<01:07,  1.82it/s][A
Training:   7%|▋         | 9/131 [00:09<02:00,  1.01it/s][A
Training:   8%|▊         | 11/131 [00:09<01:17,  1.55it/s][A
Training:  10%|▉         | 13/131 [00:11<01:47,  1.09it/s][A
Training:  11%|█         | 14/131 [00:12<01:28,  1.32it/s][A
Training:  11%|█▏        | 15/131 [00:12<01:11,  1.62it/s][A
Training:  12%|█▏        | 16/131 [00:12<00:57,  2.01it/s][A
Training:  13%|█▎        | 17/131 [00:14<01:55,  1.01s/it][A
Training:  15%|█▌        | 20/131 [00:14<00:55,  1.99it/s][A
Training:  17%|█▋        | 22/131 [00:17<01:24,  1.28it/s][A
Training:  18%|█▊        | 23/131 [00:17<01:10,  1.53it/s][A
Training:  19%|█▉     

Epoch: 24/55 - Loss: 6.6306 - Accuracy: 0.9698



  0%|          | 0/17 [00:00<?, ?it/s][A
  6%|▌         | 1/17 [00:03<00:48,  3.01s/it][A
 12%|█▏        | 2/17 [00:03<00:19,  1.31s/it][A
 24%|██▎       | 4/17 [00:03<00:06,  1.91it/s][A
 35%|███▌      | 6/17 [00:05<00:09,  1.17it/s][A
 41%|████      | 7/17 [00:05<00:06,  1.50it/s][A
 53%|█████▎    | 9/17 [00:08<00:07,  1.12it/s][A
 65%|██████▍   | 11/17 [00:08<00:03,  1.67it/s][A
 76%|███████▋  | 13/17 [00:10<00:03,  1.29it/s][A
 88%|████████▊ | 15/17 [00:10<00:01,  1.74it/s][A
100%|██████████| 17/17 [00:11<00:00,  1.46it/s][A
Epochs:  44%|████▎     | 24/55 [54:02<54:06, 104.73s/it]

Val Loss: 7.7475 - Val Accuracy: 0.9585



Training:   0%|          | 0/131 [00:00<?, ?it/s][A
Training:   1%|          | 1/131 [00:03<06:57,  3.21s/it][A
Training:   2%|▏         | 3/131 [00:03<01:59,  1.07it/s][A
Training:   4%|▍         | 5/131 [00:05<02:17,  1.09s/it][A
Training:   5%|▍         | 6/131 [00:06<01:44,  1.20it/s][A
Training:   5%|▌         | 7/131 [00:06<01:23,  1.49it/s][A
Training:   7%|▋         | 9/131 [00:08<01:53,  1.08it/s][A
Training:   8%|▊         | 10/131 [00:08<01:28,  1.37it/s][A
Training:   8%|▊         | 11/131 [00:09<01:17,  1.55it/s][A
Training:  10%|▉         | 13/131 [00:11<01:39,  1.19it/s][A
Training:  11%|█         | 14/131 [00:11<01:21,  1.43it/s][A
Training:  11%|█▏        | 15/131 [00:12<01:17,  1.50it/s][A
Training:  13%|█▎        | 17/131 [00:14<01:38,  1.16it/s][A
Training:  14%|█▎        | 18/131 [00:14<01:18,  1.43it/s][A
Training:  15%|█▍        | 19/131 [00:14<01:03,  1.76it/s][A
Training:  15%|█▌        | 20/131 [00:15<00:49,  2.22it/s][A
Training:  16%|█▌     

Epoch: 25/55 - Loss: 6.8161 - Accuracy: 0.9690



  0%|          | 0/17 [00:00<?, ?it/s][A
  6%|▌         | 1/17 [00:02<00:46,  2.91s/it][A
 18%|█▊        | 3/17 [00:03<00:12,  1.16it/s][A
 24%|██▎       | 4/17 [00:03<00:07,  1.67it/s][A
 29%|██▉       | 5/17 [00:05<00:12,  1.08s/it][A
 35%|███▌      | 6/17 [00:05<00:08,  1.25it/s][A
 41%|████      | 7/17 [00:05<00:06,  1.63it/s][A
 53%|█████▎    | 9/17 [00:07<00:06,  1.23it/s][A
 59%|█████▉    | 10/17 [00:08<00:04,  1.51it/s][A
 65%|██████▍   | 11/17 [00:08<00:03,  1.81it/s][A
 76%|███████▋  | 13/17 [00:10<00:03,  1.32it/s][A
 82%|████████▏ | 14/17 [00:10<00:01,  1.62it/s][A
 88%|████████▊ | 15/17 [00:10<00:01,  1.92it/s][A
100%|██████████| 17/17 [00:11<00:00,  1.51it/s][A
Epochs:  45%|████▌     | 25/55 [55:44<51:55, 103.85s/it]

Val Loss: 8.0002 - Val Accuracy: 0.9617



Training:   0%|          | 0/131 [00:00<?, ?it/s][A
Training:   1%|          | 1/131 [00:03<07:18,  3.38s/it][A
Training:   2%|▏         | 2/131 [00:03<03:09,  1.47s/it][A
Training:   3%|▎         | 4/131 [00:03<01:14,  1.71it/s][A
Training:   5%|▍         | 6/131 [00:06<02:01,  1.03it/s][A
Training:   7%|▋         | 9/131 [00:08<01:47,  1.13it/s][A
Training:   8%|▊         | 10/131 [00:09<01:34,  1.28it/s][A
Training:   9%|▉         | 12/131 [00:09<01:02,  1.89it/s][A
Training:  10%|▉         | 13/131 [00:11<01:47,  1.10it/s][A
Training:  11%|█         | 14/131 [00:11<01:27,  1.34it/s][A
Training:  11%|█▏        | 15/131 [00:12<01:11,  1.62it/s][A
Training:  13%|█▎        | 17/131 [00:14<01:39,  1.15it/s][A
Training:  15%|█▍        | 19/131 [00:14<01:09,  1.61it/s][A
Training:  16%|█▌        | 21/131 [00:17<01:32,  1.19it/s][A
Training:  17%|█▋        | 22/131 [00:17<01:15,  1.44it/s][A
Training:  18%|█▊        | 23/131 [00:17<01:01,  1.74it/s][A
Training:  19%|█▉    

Epoch: 26/55 - Loss: 6.2630 - Accuracy: 0.9714



  0%|          | 0/17 [00:00<?, ?it/s][A
  6%|▌         | 1/17 [00:03<00:48,  3.00s/it][A
 12%|█▏        | 2/17 [00:03<00:19,  1.31s/it][A
 18%|█▊        | 3/17 [00:03<00:10,  1.31it/s][A
 29%|██▉       | 5/17 [00:05<00:11,  1.03it/s][A
 35%|███▌      | 6/17 [00:05<00:07,  1.38it/s][A
 41%|████      | 7/17 [00:05<00:05,  1.80it/s][A
 53%|█████▎    | 9/17 [00:07<00:06,  1.24it/s][A
 59%|█████▉    | 10/17 [00:08<00:04,  1.57it/s][A
 71%|███████   | 12/17 [00:08<00:02,  2.43it/s][A
 76%|███████▋  | 13/17 [00:10<00:03,  1.16it/s][A
 88%|████████▊ | 15/17 [00:10<00:01,  1.81it/s][A
100%|██████████| 17/17 [00:11<00:00,  1.48it/s][A
Epochs:  47%|████▋     | 26/55 [57:26<49:57, 103.35s/it]

Val Loss: 7.8768 - Val Accuracy: 0.9663



Training:   0%|          | 0/131 [00:00<?, ?it/s][A
Training:   1%|          | 1/131 [00:03<07:20,  3.39s/it][A
Training:   2%|▏         | 2/131 [00:03<03:13,  1.50s/it][A
Training:   2%|▏         | 3/131 [00:03<01:59,  1.07it/s][A
Training:   4%|▍         | 5/131 [00:06<02:23,  1.14s/it][A
Training:   5%|▍         | 6/131 [00:06<01:48,  1.15it/s][A
Training:   5%|▌         | 7/131 [00:06<01:23,  1.48it/s][A
Training:   6%|▌         | 8/131 [00:06<01:03,  1.95it/s][A
Training:   7%|▋         | 9/131 [00:09<02:06,  1.03s/it][A
Training:   8%|▊         | 10/131 [00:09<01:32,  1.30it/s][A
Training:   8%|▊         | 11/131 [00:09<01:10,  1.71it/s][A
Training:  10%|▉         | 13/131 [00:12<01:49,  1.07it/s][A
Training:  11%|█         | 14/131 [00:12<01:27,  1.33it/s][A
Training:  12%|█▏        | 16/131 [00:12<00:55,  2.07it/s][A
Training:  13%|█▎        | 17/131 [00:15<01:46,  1.07it/s][A
Training:  14%|█▎        | 18/131 [00:15<01:24,  1.33it/s][A
Training:  15%|█▌       

Epoch: 27/55 - Loss: 6.5533 - Accuracy: 0.9696



  0%|          | 0/17 [00:00<?, ?it/s][A
  6%|▌         | 1/17 [00:03<00:47,  3.00s/it][A
 12%|█▏        | 2/17 [00:03<00:19,  1.29s/it][A
 18%|█▊        | 3/17 [00:03<00:10,  1.32it/s][A
 24%|██▎       | 4/17 [00:03<00:06,  1.99it/s][A
 29%|██▉       | 5/17 [00:05<00:13,  1.09s/it][A
 35%|███▌      | 6/17 [00:05<00:08,  1.23it/s][A
 47%|████▋     | 8/17 [00:05<00:03,  2.28it/s][A
 53%|█████▎    | 9/17 [00:08<00:07,  1.12it/s][A
 59%|█████▉    | 10/17 [00:08<00:04,  1.41it/s][A
 76%|███████▋  | 13/17 [00:10<00:03,  1.33it/s][A
 82%|████████▏ | 14/17 [00:10<00:01,  1.60it/s][A
100%|██████████| 17/17 [00:11<00:00,  1.50it/s][A
Epochs:  49%|████▉     | 27/55 [59:09<48:04, 103.00s/it]

Val Loss: 8.6358 - Val Accuracy: 0.9591



Training:   0%|          | 0/131 [00:00<?, ?it/s][A
Training:   1%|          | 1/131 [00:03<08:00,  3.69s/it][A
Training:   2%|▏         | 3/131 [00:03<02:10,  1.02s/it][A
Training:   4%|▍         | 5/131 [00:06<02:32,  1.21s/it][A
Training:   5%|▌         | 7/131 [00:06<01:29,  1.38it/s][A
Training:   7%|▋         | 9/131 [00:09<02:00,  1.02it/s][A
Training:   8%|▊         | 11/131 [00:09<01:19,  1.52it/s][A
Training:  10%|▉         | 13/131 [00:12<01:45,  1.12it/s][A
Training:  11%|█         | 14/131 [00:12<01:27,  1.34it/s][A
Training:  13%|█▎        | 17/131 [00:15<01:36,  1.18it/s][A
Training:  15%|█▍        | 19/131 [00:15<01:10,  1.60it/s][A
Training:  16%|█▌        | 21/131 [00:18<01:28,  1.25it/s][A
Training:  18%|█▊        | 23/131 [00:18<01:02,  1.74it/s][A
Training:  19%|█▉        | 25/131 [00:20<01:23,  1.27it/s][A
Training:  21%|██▏       | 28/131 [00:20<00:51,  2.02it/s][A
Training:  23%|██▎       | 30/131 [00:23<01:14,  1.35it/s][A
Training:  25%|██▌   

Epoch: 28/55 - Loss: 7.0508 - Accuracy: 0.9692



  0%|          | 0/17 [00:00<?, ?it/s][A
  6%|▌         | 1/17 [00:03<00:52,  3.27s/it][A
 18%|█▊        | 3/17 [00:03<00:12,  1.12it/s][A
 24%|██▎       | 4/17 [00:03<00:08,  1.57it/s][A
 29%|██▉       | 5/17 [00:05<00:13,  1.11s/it][A
 41%|████      | 7/17 [00:05<00:06,  1.61it/s][A
 53%|█████▎    | 9/17 [00:08<00:06,  1.21it/s][A
 65%|██████▍   | 11/17 [00:08<00:03,  1.66it/s][A
 76%|███████▋  | 13/17 [00:10<00:03,  1.27it/s][A
 88%|████████▊ | 15/17 [00:10<00:01,  1.79it/s][A
100%|██████████| 17/17 [00:11<00:00,  1.47it/s][A
Epochs:  51%|█████     | 28/55 [1:00:50<46:11, 102.63s/it]

Val Loss: 8.9019 - Val Accuracy: 0.9629



Training:   0%|          | 0/131 [00:00<?, ?it/s][A
Training:   1%|          | 1/131 [00:03<07:15,  3.35s/it][A
Training:   2%|▏         | 2/131 [00:03<03:17,  1.53s/it][A
Training:   2%|▏         | 3/131 [00:03<01:54,  1.12it/s][A
Training:   3%|▎         | 4/131 [00:03<01:13,  1.72it/s][A
Training:   4%|▍         | 5/131 [00:06<02:30,  1.19s/it][A
Training:   5%|▍         | 6/131 [00:06<01:49,  1.14it/s][A
Training:   5%|▌         | 7/131 [00:06<01:18,  1.59it/s][A
Training:   7%|▋         | 9/131 [00:08<01:50,  1.11it/s][A
Training:   8%|▊         | 10/131 [00:09<01:35,  1.27it/s][A
Training:   9%|▉         | 12/131 [00:09<00:58,  2.05it/s][A
Training:  10%|▉         | 13/131 [00:11<01:45,  1.12it/s][A
Training:  11%|█         | 14/131 [00:12<01:30,  1.29it/s][A
Training:  11%|█▏        | 15/131 [00:12<01:09,  1.67it/s][A
Training:  13%|█▎        | 17/131 [00:14<01:38,  1.16it/s][A
Training:  14%|█▎        | 18/131 [00:15<01:24,  1.33it/s][A
Training:  15%|█▌       

Epoch: 29/55 - Loss: 6.8360 - Accuracy: 0.9710



  0%|          | 0/17 [00:00<?, ?it/s][A
  6%|▌         | 1/17 [00:03<00:50,  3.15s/it][A
 18%|█▊        | 3/17 [00:03<00:12,  1.11it/s][A
 29%|██▉       | 5/17 [00:05<00:12,  1.02s/it][A
 41%|████      | 7/17 [00:05<00:06,  1.59it/s][A
 53%|█████▎    | 9/17 [00:08<00:06,  1.17it/s][A
 65%|██████▍   | 11/17 [00:08<00:03,  1.68it/s][A
 76%|███████▋  | 13/17 [00:10<00:03,  1.29it/s][A
 88%|████████▊ | 15/17 [00:11<00:01,  1.77it/s][A
100%|██████████| 17/17 [00:11<00:00,  1.46it/s][A
Epochs:  53%|█████▎    | 29/55 [1:02:32<44:23, 102.46s/it]

Val Loss: 7.8011 - Val Accuracy: 0.9629



Training:   0%|          | 0/131 [00:00<?, ?it/s][A
Training:   1%|          | 1/131 [00:03<07:24,  3.42s/it][A
Training:   2%|▏         | 2/131 [00:03<03:09,  1.47s/it][A
Training:   3%|▎         | 4/131 [00:03<01:16,  1.66it/s][A
Training:   4%|▍         | 5/131 [00:06<02:28,  1.18s/it][A
Training:   5%|▌         | 7/131 [00:06<01:21,  1.52it/s][A
Training:   7%|▋         | 9/131 [00:09<01:58,  1.03it/s][A
Training:   8%|▊         | 11/131 [00:09<01:17,  1.54it/s][A
Training:   9%|▉         | 12/131 [00:09<01:04,  1.85it/s][A
Training:  10%|▉         | 13/131 [00:12<01:58,  1.00s/it][A
Training:  11%|█         | 14/131 [00:12<01:31,  1.28it/s][A
Training:  12%|█▏        | 16/131 [00:12<00:56,  2.04it/s][A
Training:  13%|█▎        | 17/131 [00:14<01:50,  1.03it/s][A
Training:  14%|█▎        | 18/131 [00:15<01:25,  1.32it/s][A
Training:  15%|█▌        | 20/131 [00:15<00:51,  2.14it/s][A
Training:  17%|█▋        | 22/131 [00:17<01:20,  1.35it/s][A
Training:  18%|█▊     

Epoch: 30/55 - Loss: 6.5869 - Accuracy: 0.9703



  0%|          | 0/17 [00:00<?, ?it/s][A
  6%|▌         | 1/17 [00:03<00:50,  3.19s/it][A
 12%|█▏        | 2/17 [00:03<00:20,  1.38s/it][A
 18%|█▊        | 3/17 [00:03<00:11,  1.24it/s][A
 24%|██▎       | 4/17 [00:03<00:06,  1.89it/s][A
 29%|██▉       | 5/17 [00:05<00:13,  1.10s/it][A
 47%|████▋     | 8/17 [00:05<00:04,  2.17it/s][A
 59%|█████▉    | 10/17 [00:08<00:05,  1.37it/s][A
 76%|███████▋  | 13/17 [00:10<00:03,  1.30it/s][A
 88%|████████▊ | 15/17 [00:10<00:01,  1.79it/s][A
100%|██████████| 17/17 [00:11<00:00,  1.48it/s][A
Epochs:  55%|█████▍    | 30/55 [1:04:14<42:34, 102.20s/it]

Val Loss: 9.0554 - Val Accuracy: 0.9607



Training:   0%|          | 0/131 [00:00<?, ?it/s][A
Training:   1%|          | 1/131 [00:03<07:26,  3.43s/it][A
Training:   3%|▎         | 4/131 [00:03<01:27,  1.46it/s][A
Training:   5%|▍         | 6/131 [00:06<02:06,  1.01s/it][A
Training:   6%|▌         | 8/131 [00:06<01:20,  1.53it/s][A
Training:   7%|▋         | 9/131 [00:09<02:08,  1.05s/it][A
Training:   9%|▉         | 12/131 [00:09<01:08,  1.73it/s][A
Training:  10%|▉         | 13/131 [00:11<01:54,  1.03it/s][A
Training:  11%|█         | 14/131 [00:12<01:32,  1.26it/s][A
Training:  11%|█▏        | 15/131 [00:12<01:13,  1.57it/s][A
Training:  12%|█▏        | 16/131 [00:12<00:58,  1.97it/s][A
Training:  13%|█▎        | 17/131 [00:14<01:51,  1.02it/s][A
Training:  15%|█▍        | 19/131 [00:14<01:06,  1.69it/s][A
Training:  16%|█▌        | 21/131 [00:17<01:31,  1.20it/s][A
Training:  17%|█▋        | 22/131 [00:17<01:14,  1.47it/s][A
Training:  19%|█▉        | 25/131 [00:19<01:20,  1.32it/s][A
Training:  21%|██    

Epoch: 31/55 - Loss: 6.6915 - Accuracy: 0.9694



  0%|          | 0/17 [00:00<?, ?it/s][A
  6%|▌         | 1/17 [00:03<00:49,  3.10s/it][A
 12%|█▏        | 2/17 [00:03<00:20,  1.34s/it][A
 29%|██▉       | 5/17 [00:05<00:11,  1.04it/s][A
 35%|███▌      | 6/17 [00:05<00:08,  1.34it/s][A
 53%|█████▎    | 9/17 [00:08<00:06,  1.29it/s][A
 65%|██████▍   | 11/17 [00:08<00:03,  1.86it/s][A
 76%|███████▋  | 13/17 [00:10<00:02,  1.36it/s][A
100%|██████████| 17/17 [00:11<00:00,  1.50it/s][A
Epochs:  56%|█████▋    | 31/55 [1:05:56<40:50, 102.09s/it]

Val Loss: 8.4962 - Val Accuracy: 0.9656



Training:   0%|          | 0/131 [00:00<?, ?it/s][A
Training:   1%|          | 1/131 [00:03<07:08,  3.30s/it][A
Training:   2%|▏         | 2/131 [00:03<03:18,  1.54s/it][A
Training:   3%|▎         | 4/131 [00:03<01:17,  1.63it/s][A
Training:   4%|▍         | 5/131 [00:06<02:21,  1.12s/it][A
Training:   5%|▍         | 6/131 [00:06<01:51,  1.12it/s][A
Training:   6%|▌         | 8/131 [00:06<01:02,  1.96it/s][A
Training:   7%|▋         | 9/131 [00:08<01:57,  1.04it/s][A
Training:   8%|▊         | 10/131 [00:09<01:34,  1.28it/s][A
Training:   9%|▉         | 12/131 [00:09<00:56,  2.12it/s][A
Training:  10%|▉         | 13/131 [00:11<01:57,  1.01it/s][A
Training:  11%|█▏        | 15/131 [00:12<01:13,  1.57it/s][A
Training:  12%|█▏        | 16/131 [00:12<00:59,  1.92it/s][A
Training:  13%|█▎        | 17/131 [00:14<01:43,  1.10it/s][A
Training:  14%|█▎        | 18/131 [00:14<01:19,  1.43it/s][A
Training:  15%|█▍        | 19/131 [00:14<01:04,  1.74it/s][A
Training:  15%|█▌      

Epoch: 32/55 - Loss: 6.3600 - Accuracy: 0.9693



  0%|          | 0/17 [00:00<?, ?it/s][A
  6%|▌         | 1/17 [00:02<00:46,  2.88s/it][A
 18%|█▊        | 3/17 [00:03<00:12,  1.15it/s][A
 24%|██▎       | 4/17 [00:03<00:07,  1.65it/s][A
 29%|██▉       | 5/17 [00:05<00:13,  1.10s/it][A
 35%|███▌      | 6/17 [00:05<00:08,  1.22it/s][A
 41%|████      | 7/17 [00:05<00:06,  1.55it/s][A
 53%|█████▎    | 9/17 [00:08<00:06,  1.16it/s][A
 59%|█████▉    | 10/17 [00:08<00:04,  1.46it/s][A
 71%|███████   | 12/17 [00:08<00:02,  2.29it/s][A
 76%|███████▋  | 13/17 [00:10<00:03,  1.21it/s][A
 82%|████████▏ | 14/17 [00:10<00:02,  1.48it/s][A
 94%|█████████▍| 16/17 [00:11<00:00,  2.29it/s][A
100%|██████████| 17/17 [00:11<00:00,  1.48it/s][A
Epochs:  58%|█████▊    | 32/55 [1:07:38<39:06, 102.04s/it]

Val Loss: 9.1131 - Val Accuracy: 0.9645



Training:   0%|          | 0/131 [00:00<?, ?it/s][A
Training:   1%|          | 1/131 [00:03<07:23,  3.41s/it][A
Training:   2%|▏         | 3/131 [00:03<02:03,  1.04it/s][A
Training:   4%|▍         | 5/131 [00:06<02:21,  1.12s/it][A
Training:   5%|▌         | 7/131 [00:06<01:26,  1.44it/s][A
Training:   6%|▌         | 8/131 [00:06<01:08,  1.79it/s][A
Training:   7%|▋         | 9/131 [00:09<02:08,  1.05s/it][A
Training:   8%|▊         | 11/131 [00:09<01:18,  1.53it/s][A
Training:  10%|▉         | 13/131 [00:11<01:49,  1.08it/s][A
Training:  11%|█         | 14/131 [00:12<01:27,  1.33it/s][A
Training:  13%|█▎        | 17/131 [00:14<01:34,  1.21it/s][A
Training:  15%|█▍        | 19/131 [00:14<01:05,  1.71it/s][A
Training:  16%|█▌        | 21/131 [00:17<01:25,  1.29it/s][A
Training:  18%|█▊        | 23/131 [00:17<01:00,  1.80it/s][A
Training:  19%|█▉        | 25/131 [00:19<01:18,  1.36it/s][A
Training:  21%|██        | 27/131 [00:19<00:55,  1.87it/s][A
Training:  22%|██▏    

Epoch: 33/55 - Loss: 6.4819 - Accuracy: 0.9702



  0%|          | 0/17 [00:00<?, ?it/s][A
  6%|▌         | 1/17 [00:03<00:48,  3.05s/it][A
 12%|█▏        | 2/17 [00:03<00:20,  1.40s/it][A
 18%|█▊        | 3/17 [00:03<00:12,  1.15it/s][A
 24%|██▎       | 4/17 [00:03<00:07,  1.74it/s][A
 29%|██▉       | 5/17 [00:05<00:13,  1.08s/it][A
 41%|████      | 7/17 [00:06<00:06,  1.56it/s][A
 53%|█████▎    | 9/17 [00:08<00:06,  1.19it/s][A
 65%|██████▍   | 11/17 [00:08<00:03,  1.73it/s][A
 76%|███████▋  | 13/17 [00:10<00:03,  1.33it/s][A
 88%|████████▊ | 15/17 [00:10<00:01,  1.85it/s][A
100%|██████████| 17/17 [00:11<00:00,  1.46it/s][A
Epochs:  60%|██████    | 33/55 [1:09:20<37:22, 101.93s/it]

Val Loss: 8.6943 - Val Accuracy: 0.9641



Training:   0%|          | 0/131 [00:00<?, ?it/s][A
Training:   1%|          | 1/131 [00:03<06:57,  3.21s/it][A
Training:   2%|▏         | 2/131 [00:03<03:05,  1.44s/it][A
Training:   3%|▎         | 4/131 [00:03<01:13,  1.73it/s][A
Training:   4%|▍         | 5/131 [00:06<02:26,  1.17s/it][A
Training:   5%|▌         | 7/131 [00:06<01:24,  1.47it/s][A
Training:   7%|▋         | 9/131 [00:08<01:48,  1.12it/s][A
Training:   8%|▊         | 10/131 [00:08<01:31,  1.32it/s][A
Training:   8%|▊         | 11/131 [00:09<01:12,  1.66it/s][A
Training:  10%|▉         | 13/131 [00:11<01:43,  1.14it/s][A
Training:  11%|█         | 14/131 [00:11<01:22,  1.42it/s][A
Training:  11%|█▏        | 15/131 [00:11<01:06,  1.75it/s][A
Training:  13%|█▎        | 17/131 [00:14<01:35,  1.20it/s][A
Training:  14%|█▎        | 18/131 [00:14<01:16,  1.49it/s][A
Training:  15%|█▍        | 19/131 [00:14<01:01,  1.82it/s][A
Training:  16%|█▌        | 21/131 [00:17<01:29,  1.23it/s][A
Training:  18%|█▊     

Epoch: 34/55 - Loss: 6.4916 - Accuracy: 0.9715



  0%|          | 0/17 [00:00<?, ?it/s][A
  6%|▌         | 1/17 [00:03<00:49,  3.11s/it][A
 12%|█▏        | 2/17 [00:03<00:20,  1.37s/it][A
 29%|██▉       | 5/17 [00:05<00:11,  1.05it/s][A
 35%|███▌      | 6/17 [00:05<00:08,  1.31it/s][A
 47%|████▋     | 8/17 [00:05<00:04,  2.13it/s][A
 53%|█████▎    | 9/17 [00:08<00:07,  1.11it/s][A
 59%|█████▉    | 10/17 [00:08<00:05,  1.39it/s][A
 76%|███████▋  | 13/17 [00:10<00:02,  1.35it/s][A
 82%|████████▏ | 14/17 [00:10<00:01,  1.62it/s][A
100%|██████████| 17/17 [00:11<00:00,  1.47it/s][A
Epochs:  62%|██████▏   | 34/55 [1:11:00<35:32, 101.56s/it]

Val Loss: 9.3214 - Val Accuracy: 0.9619



Training:   0%|          | 0/131 [00:00<?, ?it/s][A
Training:   1%|          | 1/131 [00:03<07:11,  3.32s/it][A
Training:   2%|▏         | 3/131 [00:03<01:55,  1.11it/s][A
Training:   4%|▍         | 5/131 [00:06<02:21,  1.12s/it][A
Training:   6%|▌         | 8/131 [00:06<01:09,  1.77it/s][A
Training:   8%|▊         | 10/131 [00:08<01:36,  1.25it/s][A
Training:   9%|▉         | 12/131 [00:09<01:10,  1.69it/s][A
Training:  10%|▉         | 13/131 [00:11<01:50,  1.07it/s][A
Training:  11%|█         | 14/131 [00:11<01:29,  1.31it/s][A
Training:  11%|█▏        | 15/131 [00:11<01:10,  1.64it/s][A
Training:  12%|█▏        | 16/131 [00:11<00:55,  2.07it/s][A
Training:  13%|█▎        | 17/131 [00:14<01:51,  1.02it/s][A
Training:  14%|█▎        | 18/131 [00:14<01:24,  1.34it/s][A
Training:  15%|█▌        | 20/131 [00:14<00:52,  2.12it/s][A
Training:  16%|█▌        | 21/131 [00:16<01:35,  1.15it/s][A
Training:  18%|█▊        | 24/131 [00:16<00:50,  2.11it/s][A
Training:  19%|█▉   

Epoch: 35/55 - Loss: 6.3723 - Accuracy: 0.9715



  0%|          | 0/17 [00:00<?, ?it/s][A
  6%|▌         | 1/17 [00:03<00:50,  3.14s/it][A
 18%|█▊        | 3/17 [00:03<00:12,  1.16it/s][A
 29%|██▉       | 5/17 [00:05<00:12,  1.06s/it][A
 53%|█████▎    | 9/17 [00:08<00:06,  1.26it/s][A
 59%|█████▉    | 10/17 [00:08<00:04,  1.48it/s][A
 76%|███████▋  | 13/17 [00:10<00:02,  1.37it/s][A
 88%|████████▊ | 15/17 [00:10<00:01,  1.86it/s][A
100%|██████████| 17/17 [00:11<00:00,  1.48it/s][A
Epochs:  64%|██████▎   | 35/55 [1:12:41<33:49, 101.46s/it]

Val Loss: 9.2142 - Val Accuracy: 0.9536



Training:   0%|          | 0/131 [00:00<?, ?it/s][A
Training:   1%|          | 1/131 [00:03<07:15,  3.35s/it][A
Training:   2%|▏         | 2/131 [00:03<03:07,  1.45s/it][A
Training:   2%|▏         | 3/131 [00:03<01:47,  1.19it/s][A
Training:   3%|▎         | 4/131 [00:03<01:11,  1.77it/s][A
Training:   4%|▍         | 5/131 [00:06<02:42,  1.29s/it][A
Training:   6%|▌         | 8/131 [00:06<01:05,  1.87it/s][A
Training:   8%|▊         | 10/131 [00:09<01:41,  1.19it/s][A
Training:   8%|▊         | 11/131 [00:09<01:22,  1.45it/s][A
Training:  10%|▉         | 13/131 [00:11<01:46,  1.11it/s][A
Training:  11%|█         | 14/131 [00:12<01:28,  1.33it/s][A
Training:  11%|█▏        | 15/131 [00:12<01:10,  1.64it/s][A
Training:  12%|█▏        | 16/131 [00:12<00:55,  2.06it/s][A
Training:  13%|█▎        | 17/131 [00:14<01:51,  1.03it/s][A
Training:  14%|█▎        | 18/131 [00:14<01:26,  1.31it/s][A
Training:  15%|█▌        | 20/131 [00:14<00:50,  2.22it/s][A
Training:  16%|█▌     

Epoch: 36/55 - Loss: 6.5503 - Accuracy: 0.9699



  0%|          | 0/17 [00:00<?, ?it/s][A
  6%|▌         | 1/17 [00:03<00:48,  3.01s/it][A
 12%|█▏        | 2/17 [00:03<00:19,  1.33s/it][A
 18%|█▊        | 3/17 [00:03<00:11,  1.27it/s][A
 29%|██▉       | 5/17 [00:05<00:11,  1.07it/s][A
 41%|████      | 7/17 [00:05<00:05,  1.69it/s][A
 47%|████▋     | 8/17 [00:05<00:04,  2.09it/s][A
 53%|█████▎    | 9/17 [00:07<00:07,  1.11it/s][A
 65%|██████▍   | 11/17 [00:08<00:03,  1.63it/s][A
 76%|███████▋  | 13/17 [00:10<00:03,  1.27it/s][A
 88%|████████▊ | 15/17 [00:10<00:01,  1.72it/s][A
100%|██████████| 17/17 [00:11<00:00,  1.50it/s][A
Epochs:  65%|██████▌   | 36/55 [1:14:24<32:12, 101.71s/it]

Val Loss: 9.7125 - Val Accuracy: 0.9651



Training:   0%|          | 0/131 [00:00<?, ?it/s][A
Training:   1%|          | 1/131 [00:03<07:09,  3.31s/it][A
Training:   2%|▏         | 3/131 [00:03<01:57,  1.09it/s][A
Training:   4%|▍         | 5/131 [00:06<02:22,  1.13s/it][A
Training:   5%|▌         | 7/131 [00:06<01:25,  1.46it/s][A
Training:   6%|▌         | 8/131 [00:06<01:08,  1.81it/s][A
Training:   7%|▋         | 9/131 [00:08<02:02,  1.01s/it][A
Training:   8%|▊         | 11/131 [00:08<01:13,  1.63it/s][A
Training:  10%|▉         | 13/131 [00:11<01:45,  1.12it/s][A
Training:  11%|█▏        | 15/131 [00:11<01:10,  1.65it/s][A
Training:  13%|█▎        | 17/131 [00:14<01:33,  1.22it/s][A
Training:  15%|█▍        | 19/131 [00:14<01:04,  1.75it/s][A
Training:  16%|█▌        | 21/131 [00:16<01:25,  1.28it/s][A
Training:  18%|█▊        | 24/131 [00:16<00:51,  2.07it/s][A
Training:  20%|█▉        | 26/131 [00:19<01:11,  1.47it/s][A
Training:  21%|██▏       | 28/131 [00:19<00:51,  1.98it/s][A
Training:  23%|██▎    

Epoch: 37/55 - Loss: 6.4187 - Accuracy: 0.9714



  0%|          | 0/17 [00:00<?, ?it/s][A
  6%|▌         | 1/17 [00:03<00:51,  3.23s/it][A
 18%|█▊        | 3/17 [00:03<00:12,  1.13it/s][A
 29%|██▉       | 5/17 [00:05<00:12,  1.03s/it][A
 41%|████      | 7/17 [00:05<00:06,  1.61it/s][A
 53%|█████▎    | 9/17 [00:08<00:06,  1.22it/s][A
 59%|█████▉    | 10/17 [00:08<00:04,  1.48it/s][A
 71%|███████   | 12/17 [00:08<00:02,  2.20it/s][A
 76%|███████▋  | 13/17 [00:10<00:03,  1.22it/s][A
 82%|████████▏ | 14/17 [00:10<00:02,  1.48it/s][A
100%|██████████| 17/17 [00:11<00:00,  1.49it/s][A
Epochs:  67%|██████▋   | 37/55 [1:16:05<30:29, 101.61s/it]

Val Loss: 9.7612 - Val Accuracy: 0.9629



Training:   0%|          | 0/131 [00:00<?, ?it/s][A
Training:   1%|          | 1/131 [00:03<07:08,  3.30s/it][A
Training:   2%|▏         | 2/131 [00:03<03:08,  1.46s/it][A
Training:   3%|▎         | 4/131 [00:03<01:13,  1.72it/s][A
Training:   5%|▍         | 6/131 [00:06<02:00,  1.04it/s][A
Training:   5%|▌         | 7/131 [00:06<01:32,  1.34it/s][A
Training:   7%|▋         | 9/131 [00:08<01:45,  1.16it/s][A
Training:   8%|▊         | 10/131 [00:09<01:37,  1.23it/s][A
Training:   9%|▉         | 12/131 [00:09<01:02,  1.91it/s][A
Training:  10%|▉         | 13/131 [00:11<01:37,  1.21it/s][A
Training:  11%|█         | 14/131 [00:11<01:27,  1.33it/s][A
Training:  12%|█▏        | 16/131 [00:11<00:53,  2.15it/s][A
Training:  13%|█▎        | 17/131 [00:14<01:39,  1.14it/s][A
Training:  14%|█▎        | 18/131 [00:14<01:21,  1.38it/s][A
Training:  15%|█▌        | 20/131 [00:14<00:51,  2.15it/s][A
Training:  16%|█▌        | 21/131 [00:16<01:28,  1.25it/s][A
Training:  17%|█▋     

Epoch: 38/55 - Loss: 6.4311 - Accuracy: 0.9718



  0%|          | 0/17 [00:00<?, ?it/s][A
  6%|▌         | 1/17 [00:02<00:46,  2.93s/it][A
 12%|█▏        | 2/17 [00:03<00:19,  1.29s/it][A
 24%|██▎       | 4/17 [00:03<00:06,  1.93it/s][A
 29%|██▉       | 5/17 [00:05<00:12,  1.02s/it][A
 35%|███▌      | 6/17 [00:05<00:08,  1.24it/s][A
 47%|████▋     | 8/17 [00:05<00:04,  2.15it/s][A
 53%|█████▎    | 9/17 [00:07<00:07,  1.14it/s][A
 59%|█████▉    | 10/17 [00:08<00:05,  1.33it/s][A
 65%|██████▍   | 11/17 [00:08<00:03,  1.68it/s][A
 76%|███████▋  | 13/17 [00:10<00:03,  1.30it/s][A
 82%|████████▏ | 14/17 [00:10<00:01,  1.51it/s][A
100%|██████████| 17/17 [00:11<00:00,  1.51it/s][A
Epochs:  69%|██████▉   | 38/55 [1:17:47<28:48, 101.66s/it]

Val Loss: 8.2936 - Val Accuracy: 0.9603



Training:   0%|          | 0/131 [00:00<?, ?it/s][A
Training:   1%|          | 1/131 [00:03<07:21,  3.40s/it][A
Training:   2%|▏         | 2/131 [00:03<03:11,  1.48s/it][A
Training:   2%|▏         | 3/131 [00:03<01:51,  1.15it/s][A
Training:   3%|▎         | 4/131 [00:03<01:12,  1.76it/s][A
Training:   4%|▍         | 5/131 [00:06<02:31,  1.21s/it][A
Training:   5%|▌         | 7/131 [00:06<01:17,  1.60it/s][A
Training:   7%|▋         | 9/131 [00:08<01:50,  1.11it/s][A
Training:   8%|▊         | 11/131 [00:09<01:11,  1.68it/s][A
Training:   9%|▉         | 12/131 [00:09<00:58,  2.03it/s][A
Training:  10%|▉         | 13/131 [00:11<01:53,  1.04it/s][A
Training:  12%|█▏        | 16/131 [00:11<00:57,  2.00it/s][A
Training:  14%|█▎        | 18/131 [00:13<01:18,  1.44it/s][A
Training:  16%|█▌        | 21/131 [00:16<01:22,  1.34it/s][A
Training:  18%|█▊        | 23/131 [00:16<00:59,  1.81it/s][A
Training:  19%|█▉        | 25/131 [00:18<01:19,  1.33it/s][A
Training:  21%|██      

Epoch: 39/55 - Loss: 6.7292 - Accuracy: 0.9708



  0%|          | 0/17 [00:00<?, ?it/s][A
  6%|▌         | 1/17 [00:03<00:49,  3.12s/it][A
 12%|█▏        | 2/17 [00:03<00:20,  1.38s/it][A
 24%|██▎       | 4/17 [00:03<00:07,  1.74it/s][A
 29%|██▉       | 5/17 [00:05<00:12,  1.07s/it][A
 35%|███▌      | 6/17 [00:05<00:08,  1.29it/s][A
 47%|████▋     | 8/17 [00:05<00:04,  2.21it/s][A
 53%|█████▎    | 9/17 [00:08<00:07,  1.12it/s][A
 71%|███████   | 12/17 [00:08<00:02,  2.14it/s][A
 76%|███████▋  | 13/17 [00:10<00:03,  1.15it/s][A
100%|██████████| 17/17 [00:11<00:00,  1.46it/s][A
Epochs:  71%|███████   | 39/55 [1:19:29<27:08, 101.76s/it]

Val Loss: 8.1732 - Val Accuracy: 0.9596



Training:   0%|          | 0/131 [00:00<?, ?it/s][A
Training:   1%|          | 1/131 [00:03<07:59,  3.69s/it][A
Training:   2%|▏         | 3/131 [00:03<02:08,  1.01s/it][A
Training:   4%|▍         | 5/131 [00:06<02:23,  1.14s/it][A
Training:   5%|▍         | 6/131 [00:06<01:49,  1.14it/s][A
Training:   6%|▌         | 8/131 [00:06<01:08,  1.80it/s][A
Training:   7%|▋         | 9/131 [00:09<02:01,  1.00it/s][A
Training:   9%|▉         | 12/131 [00:09<01:06,  1.78it/s][A
Training:  10%|▉         | 13/131 [00:12<01:50,  1.07it/s][A
Training:  12%|█▏        | 16/131 [00:12<01:04,  1.79it/s][A
Training:  13%|█▎        | 17/131 [00:14<01:34,  1.20it/s][A
Training:  15%|█▌        | 20/131 [00:14<00:58,  1.90it/s][A
Training:  16%|█▌        | 21/131 [00:17<01:29,  1.23it/s][A
Training:  18%|█▊        | 23/131 [00:17<01:00,  1.77it/s][A
Training:  18%|█▊        | 24/131 [00:17<00:51,  2.09it/s][A
Training:  19%|█▉        | 25/131 [00:19<01:30,  1.17it/s][A
Training:  21%|██     

Epoch: 40/55 - Loss: 6.7266 - Accuracy: 0.9721



  0%|          | 0/17 [00:00<?, ?it/s][A
  6%|▌         | 1/17 [00:02<00:47,  2.99s/it][A
 18%|█▊        | 3/17 [00:03<00:11,  1.18it/s][A
 29%|██▉       | 5/17 [00:05<00:12,  1.03s/it][A
 47%|████▋     | 8/17 [00:05<00:04,  1.93it/s][A
 53%|█████▎    | 9/17 [00:08<00:07,  1.11it/s][A
 65%|██████▍   | 11/17 [00:08<00:03,  1.67it/s][A
 76%|███████▋  | 13/17 [00:10<00:03,  1.26it/s][A
100%|██████████| 17/17 [00:11<00:00,  1.47it/s][A
Epochs:  73%|███████▎  | 40/55 [1:21:10<25:25, 101.68s/it]

Val Loss: 9.3834 - Val Accuracy: 0.9629



Training:   0%|          | 0/131 [00:00<?, ?it/s][A
Training:   1%|          | 1/131 [00:03<07:49,  3.61s/it][A
Training:   2%|▏         | 3/131 [00:03<02:06,  1.01it/s][A
Training:   4%|▍         | 5/131 [00:06<02:18,  1.10s/it][A
Training:   5%|▍         | 6/131 [00:06<01:45,  1.18it/s][A
Training:   6%|▌         | 8/131 [00:06<01:03,  1.95it/s][A
Training:   7%|▋         | 9/131 [00:09<02:01,  1.00it/s][A
Training:   8%|▊         | 11/131 [00:09<01:14,  1.61it/s][A
Training:  10%|▉         | 13/131 [00:11<01:41,  1.16it/s][A
Training:  11%|█▏        | 15/131 [00:11<01:08,  1.69it/s][A
Training:  13%|█▎        | 17/131 [00:14<01:27,  1.30it/s][A
Training:  15%|█▍        | 19/131 [00:14<01:01,  1.83it/s][A
Training:  16%|█▌        | 21/131 [00:16<01:24,  1.30it/s][A
Training:  17%|█▋        | 22/131 [00:16<01:10,  1.54it/s][A
Training:  18%|█▊        | 24/131 [00:17<00:47,  2.23it/s][A
Training:  19%|█▉        | 25/131 [00:19<01:30,  1.18it/s][A
Training:  21%|██▏    

Epoch: 41/55 - Loss: 7.1456 - Accuracy: 0.9709



  0%|          | 0/17 [00:00<?, ?it/s][A
  6%|▌         | 1/17 [00:03<00:49,  3.09s/it][A
 12%|█▏        | 2/17 [00:03<00:20,  1.34s/it][A
 18%|█▊        | 3/17 [00:03<00:10,  1.28it/s][A
 24%|██▎       | 4/17 [00:03<00:06,  1.89it/s][A
 29%|██▉       | 5/17 [00:05<00:13,  1.15s/it][A
 35%|███▌      | 6/17 [00:05<00:08,  1.25it/s][A
 53%|█████▎    | 9/17 [00:08<00:06,  1.27it/s][A
 59%|█████▉    | 10/17 [00:08<00:04,  1.49it/s][A
 76%|███████▋  | 13/17 [00:10<00:02,  1.34it/s][A
 88%|████████▊ | 15/17 [00:11<00:01,  1.89it/s][A
100%|██████████| 17/17 [00:11<00:00,  1.44it/s][A
Epochs:  75%|███████▍  | 41/55 [1:22:52<23:44, 101.77s/it]

Val Loss: 9.4720 - Val Accuracy: 0.9574



Training:   0%|          | 0/131 [00:00<?, ?it/s][A
Training:   1%|          | 1/131 [00:03<06:57,  3.21s/it][A
Training:   2%|▏         | 3/131 [00:03<01:52,  1.14it/s][A
Training:   4%|▍         | 5/131 [00:06<02:20,  1.12s/it][A
Training:   5%|▍         | 6/131 [00:06<01:48,  1.16it/s][A
Training:   5%|▌         | 7/131 [00:06<01:21,  1.53it/s][A
Training:   7%|▋         | 9/131 [00:08<01:53,  1.08it/s][A
Training:   9%|▉         | 12/131 [00:08<00:59,  2.02it/s][A
Training:  11%|█         | 14/131 [00:11<01:23,  1.40it/s][A
Training:  12%|█▏        | 16/131 [00:11<00:58,  1.97it/s][A
Training:  14%|█▎        | 18/131 [00:13<01:22,  1.36it/s][A
Training:  15%|█▍        | 19/131 [00:14<01:09,  1.61it/s][A
Training:  16%|█▌        | 21/131 [00:16<01:29,  1.23it/s][A
Training:  18%|█▊        | 23/131 [00:16<01:00,  1.77it/s][A
Training:  18%|█▊        | 24/131 [00:16<00:51,  2.07it/s][A
Training:  19%|█▉        | 25/131 [00:19<01:42,  1.03it/s][A
Training:  21%|██▏    

Epoch: 42/55 - Loss: 7.1359 - Accuracy: 0.9698



  0%|          | 0/17 [00:00<?, ?it/s][A
  6%|▌         | 1/17 [00:02<00:44,  2.80s/it][A
 12%|█▏        | 2/17 [00:03<00:19,  1.28s/it][A
 24%|██▎       | 4/17 [00:03<00:06,  1.95it/s][A
 29%|██▉       | 5/17 [00:05<00:12,  1.07s/it][A
 41%|████      | 7/17 [00:05<00:05,  1.68it/s][A
 53%|█████▎    | 9/17 [00:08<00:07,  1.13it/s][A
 65%|██████▍   | 11/17 [00:08<00:03,  1.69it/s][A
 76%|███████▋  | 13/17 [00:10<00:03,  1.27it/s][A
100%|██████████| 17/17 [00:11<00:00,  1.47it/s][A
Epochs:  76%|███████▋  | 42/55 [1:24:33<22:00, 101.55s/it]

Val Loss: 8.6587 - Val Accuracy: 0.9656



Training:   0%|          | 0/131 [00:00<?, ?it/s][A
Training:   1%|          | 1/131 [00:02<06:12,  2.87s/it][A
Training:   2%|▏         | 2/131 [00:03<02:44,  1.28s/it][A
Training:   2%|▏         | 3/131 [00:03<01:43,  1.23it/s][A
Training:   4%|▍         | 5/131 [00:05<02:18,  1.10s/it][A
Training:   5%|▌         | 7/131 [00:06<01:25,  1.45it/s][A
Training:   7%|▋         | 9/131 [00:08<01:47,  1.14it/s][A
Training:   8%|▊         | 10/131 [00:08<01:26,  1.41it/s][A
Training:   8%|▊         | 11/131 [00:09<01:13,  1.63it/s][A
Training:  10%|▉         | 13/131 [00:11<01:30,  1.30it/s][A
Training:  11%|█▏        | 15/131 [00:11<01:03,  1.83it/s][A
Training:  13%|█▎        | 17/131 [00:13<01:29,  1.27it/s][A
Training:  15%|█▍        | 19/131 [00:13<01:01,  1.83it/s][A
Training:  16%|█▌        | 21/131 [00:16<01:25,  1.28it/s][A
Training:  18%|█▊        | 23/131 [00:16<01:01,  1.77it/s][A
Training:  18%|█▊        | 24/131 [00:16<00:51,  2.08it/s][A
Training:  19%|█▉     

Epoch: 43/55 - Loss: 6.8355 - Accuracy: 0.9713



  0%|          | 0/17 [00:00<?, ?it/s][A
  6%|▌         | 1/17 [00:03<00:49,  3.06s/it][A
 12%|█▏        | 2/17 [00:03<00:20,  1.33s/it][A
 18%|█▊        | 3/17 [00:03<00:11,  1.25it/s][A
 24%|██▎       | 4/17 [00:03<00:06,  1.88it/s][A
 29%|██▉       | 5/17 [00:05<00:13,  1.14s/it][A
 41%|████      | 7/17 [00:05<00:05,  1.69it/s][A
 53%|█████▎    | 9/17 [00:08<00:06,  1.17it/s][A
 65%|██████▍   | 11/17 [00:08<00:03,  1.78it/s][A
 76%|███████▋  | 13/17 [00:10<00:03,  1.28it/s][A
100%|██████████| 17/17 [00:11<00:00,  1.49it/s][A
Epochs:  78%|███████▊  | 43/55 [1:26:15<20:19, 101.60s/it]

Val Loss: 10.7311 - Val Accuracy: 0.9624



Training:   0%|          | 0/131 [00:00<?, ?it/s][A
Training:   1%|          | 1/131 [00:03<06:46,  3.12s/it][A
Training:   2%|▏         | 2/131 [00:03<03:14,  1.51s/it][A
Training:   3%|▎         | 4/131 [00:03<01:18,  1.63it/s][A
Training:   4%|▍         | 5/131 [00:05<02:22,  1.13s/it][A
Training:   5%|▍         | 6/131 [00:06<01:50,  1.13it/s][A
Training:   7%|▋         | 9/131 [00:08<01:36,  1.26it/s][A
Training:   8%|▊         | 10/131 [00:08<01:27,  1.38it/s][A
Training:  10%|▉         | 13/131 [00:10<01:19,  1.48it/s][A
Training:  11%|█         | 14/131 [00:11<01:17,  1.52it/s][A
Training:  13%|█▎        | 17/131 [00:13<01:15,  1.51it/s][A
Training:  14%|█▎        | 18/131 [00:14<01:17,  1.46it/s][A
Training:  15%|█▍        | 19/131 [00:14<01:04,  1.74it/s][A
Training:  16%|█▌        | 21/131 [00:16<01:22,  1.34it/s][A
Training:  17%|█▋        | 22/131 [00:17<01:18,  1.39it/s][A
Training:  18%|█▊        | 24/131 [00:17<00:51,  2.09it/s][A
Training:  19%|█▉     

Epoch: 44/55 - Loss: 7.0270 - Accuracy: 0.9708



  0%|          | 0/17 [00:00<?, ?it/s][A
  6%|▌         | 1/17 [00:03<00:49,  3.10s/it][A
 12%|█▏        | 2/17 [00:03<00:22,  1.50s/it][A
 24%|██▎       | 4/17 [00:03<00:08,  1.61it/s][A
 29%|██▉       | 5/17 [00:05<00:11,  1.00it/s][A
 35%|███▌      | 6/17 [00:05<00:08,  1.26it/s][A
 41%|████      | 7/17 [00:05<00:05,  1.70it/s][A
 53%|█████▎    | 9/17 [00:08<00:06,  1.21it/s][A
 59%|█████▉    | 10/17 [00:08<00:04,  1.47it/s][A
 71%|███████   | 12/17 [00:08<00:02,  2.31it/s][A
 76%|███████▋  | 13/17 [00:10<00:03,  1.21it/s][A
100%|██████████| 17/17 [00:11<00:00,  1.48it/s][A
Epochs:  80%|████████  | 44/55 [1:27:57<18:39, 101.81s/it]

Val Loss: 8.6082 - Val Accuracy: 0.9629



Training:   0%|          | 0/131 [00:00<?, ?it/s][A
Training:   1%|          | 1/131 [00:03<07:03,  3.26s/it][A
Training:   2%|▏         | 3/131 [00:03<01:55,  1.11it/s][A
Training:   3%|▎         | 4/131 [00:03<01:20,  1.58it/s][A
Training:   4%|▍         | 5/131 [00:05<02:31,  1.20s/it][A
Training:   5%|▌         | 7/131 [00:05<01:19,  1.56it/s][A
Training:   7%|▋         | 9/131 [00:08<01:46,  1.15it/s][A
Training:   8%|▊         | 11/131 [00:08<01:08,  1.75it/s][A
Training:  10%|▉         | 13/131 [00:11<01:34,  1.24it/s][A
Training:  11%|█▏        | 15/131 [00:11<01:05,  1.77it/s][A
Training:  12%|█▏        | 16/131 [00:11<00:54,  2.09it/s][A
Training:  13%|█▎        | 17/131 [00:13<01:45,  1.08it/s][A
Training:  14%|█▎        | 18/131 [00:14<01:25,  1.33it/s][A
Training:  15%|█▌        | 20/131 [00:14<00:53,  2.08it/s][A
Training:  16%|█▌        | 21/131 [00:16<01:38,  1.12it/s][A
Training:  17%|█▋        | 22/131 [00:16<01:16,  1.42it/s][A
Training:  18%|█▊     

Epoch: 45/55 - Loss: 6.6309 - Accuracy: 0.9708



  0%|          | 0/17 [00:00<?, ?it/s][A
  6%|▌         | 1/17 [00:02<00:46,  2.93s/it][A
 12%|█▏        | 2/17 [00:03<00:19,  1.32s/it][A
 29%|██▉       | 5/17 [00:05<00:11,  1.08it/s][A
 35%|███▌      | 6/17 [00:05<00:08,  1.32it/s][A
 53%|█████▎    | 9/17 [00:08<00:06,  1.24it/s][A
 65%|██████▍   | 11/17 [00:08<00:03,  1.79it/s][A
 76%|███████▋  | 13/17 [00:10<00:02,  1.37it/s][A
 88%|████████▊ | 15/17 [00:10<00:01,  1.90it/s][A
100%|██████████| 17/17 [00:11<00:00,  1.50it/s][A
Epochs:  82%|████████▏ | 45/55 [1:29:38<16:54, 101.46s/it]

Val Loss: 10.1072 - Val Accuracy: 0.9629



Training:   0%|          | 0/131 [00:00<?, ?it/s][A
Training:   1%|          | 1/131 [00:03<07:34,  3.50s/it][A
Training:   2%|▏         | 3/131 [00:03<02:00,  1.06it/s][A
Training:   4%|▍         | 5/131 [00:06<02:23,  1.14s/it][A
Training:   6%|▌         | 8/131 [00:06<01:09,  1.77it/s][A
Training:   8%|▊         | 10/131 [00:08<01:33,  1.30it/s][A
Training:   9%|▉         | 12/131 [00:08<01:04,  1.86it/s][A
Training:  11%|█         | 14/131 [00:11<01:34,  1.24it/s][A
Training:  13%|█▎        | 17/131 [00:14<01:37,  1.17it/s][A
Training:  16%|█▌        | 21/131 [00:16<01:20,  1.37it/s][A
Training:  18%|█▊        | 23/131 [00:16<01:01,  1.76it/s][A
Training:  18%|█▊        | 24/131 [00:16<00:53,  1.99it/s][A
Training:  19%|█▉        | 25/131 [00:19<01:26,  1.22it/s][A
Training:  21%|██        | 27/131 [00:19<00:59,  1.76it/s][A
Training:  22%|██▏       | 29/131 [00:22<01:23,  1.23it/s][A
Training:  24%|██▎       | 31/131 [00:22<00:58,  1.71it/s][A
Training:  25%|██▌  

Epoch: 46/55 - Loss: 6.6217 - Accuracy: 0.9714



  0%|          | 0/17 [00:00<?, ?it/s][A
  6%|▌         | 1/17 [00:03<00:50,  3.14s/it][A
 18%|█▊        | 3/17 [00:03<00:11,  1.17it/s][A
 29%|██▉       | 5/17 [00:05<00:12,  1.06s/it][A
 35%|███▌      | 6/17 [00:05<00:08,  1.25it/s][A
 47%|████▋     | 8/17 [00:05<00:04,  2.08it/s][A
 59%|█████▉    | 10/17 [00:08<00:04,  1.41it/s][A
 71%|███████   | 12/17 [00:08<00:02,  2.07it/s][A
 76%|███████▋  | 13/17 [00:10<00:03,  1.19it/s][A
 88%|████████▊ | 15/17 [00:10<00:01,  1.81it/s][A
100%|██████████| 17/17 [00:11<00:00,  1.51it/s][A
Epochs:  84%|████████▎ | 46/55 [1:31:19<15:12, 101.37s/it]

Val Loss: 9.1281 - Val Accuracy: 0.9628



Training:   0%|          | 0/131 [00:00<?, ?it/s][A
Training:   1%|          | 1/131 [00:03<07:25,  3.43s/it][A
Training:   2%|▏         | 2/131 [00:03<03:12,  1.49s/it][A
Training:   4%|▍         | 5/131 [00:05<01:58,  1.06it/s][A
Training:   5%|▍         | 6/131 [00:05<01:31,  1.36it/s][A
Training:   6%|▌         | 8/131 [00:05<00:55,  2.21it/s][A
Training:   7%|▋         | 9/131 [00:08<01:44,  1.17it/s][A
Training:   8%|▊         | 10/131 [00:08<01:24,  1.43it/s][A
Training:   8%|▊         | 11/131 [00:08<01:06,  1.82it/s][A
Training:   9%|▉         | 12/131 [00:08<00:52,  2.29it/s][A
Training:  10%|▉         | 13/131 [00:10<01:51,  1.06it/s][A
Training:  11%|█         | 14/131 [00:11<01:30,  1.29it/s][A
Training:  11%|█▏        | 15/131 [00:11<01:07,  1.72it/s][A
Training:  12%|█▏        | 16/131 [00:11<00:52,  2.18it/s][A
Training:  13%|█▎        | 17/131 [00:13<01:52,  1.01it/s][A
Training:  14%|█▎        | 18/131 [00:14<01:33,  1.21it/s][A
Training:  15%|█▌     

Epoch: 47/55 - Loss: 6.7996 - Accuracy: 0.9720



  0%|          | 0/17 [00:00<?, ?it/s][A
  6%|▌         | 1/17 [00:03<00:48,  3.04s/it][A
 12%|█▏        | 2/17 [00:03<00:20,  1.35s/it][A
 24%|██▎       | 4/17 [00:03<00:06,  1.87it/s][A
 35%|███▌      | 6/17 [00:05<00:09,  1.18it/s][A
 53%|█████▎    | 9/17 [00:07<00:06,  1.27it/s][A
 59%|█████▉    | 10/17 [00:08<00:04,  1.51it/s][A
 76%|███████▋  | 13/17 [00:10<00:02,  1.41it/s][A
 82%|████████▏ | 14/17 [00:10<00:01,  1.66it/s][A
100%|██████████| 17/17 [00:11<00:00,  1.53it/s][A
Epochs:  85%|████████▌ | 47/55 [1:33:00<13:28, 101.06s/it]

Val Loss: 9.1587 - Val Accuracy: 0.9636



Training:   0%|          | 0/131 [00:00<?, ?it/s][A
Training:   1%|          | 1/131 [00:03<07:14,  3.35s/it][A
Training:   2%|▏         | 3/131 [00:03<01:55,  1.10it/s][A
Training:   4%|▍         | 5/131 [00:05<02:10,  1.04s/it][A
Training:   5%|▌         | 7/131 [00:05<01:17,  1.60it/s][A
Training:   7%|▋         | 9/131 [00:08<01:40,  1.22it/s][A
Training:   8%|▊         | 10/131 [00:08<01:21,  1.49it/s][A
Training:  10%|▉         | 13/131 [00:10<01:25,  1.37it/s][A
Training:  11%|█         | 14/131 [00:10<01:16,  1.54it/s][A
Training:  12%|█▏        | 16/131 [00:11<00:53,  2.16it/s][A
Training:  13%|█▎        | 17/131 [00:13<01:40,  1.14it/s][A
Training:  14%|█▎        | 18/131 [00:13<01:23,  1.36it/s][A
Training:  15%|█▌        | 20/131 [00:14<00:53,  2.07it/s][A
Training:  16%|█▌        | 21/131 [00:16<01:34,  1.17it/s][A
Training:  17%|█▋        | 22/131 [00:16<01:15,  1.45it/s][A
Training:  19%|█▉        | 25/131 [00:18<01:18,  1.34it/s][A
Training:  20%|█▉    

Epoch: 48/55 - Loss: 6.7896 - Accuracy: 0.9715



  0%|          | 0/17 [00:00<?, ?it/s][A
  6%|▌         | 1/17 [00:03<00:52,  3.27s/it][A
 18%|█▊        | 3/17 [00:03<00:12,  1.10it/s][A
 29%|██▉       | 5/17 [00:05<00:12,  1.06s/it][A
 35%|███▌      | 6/17 [00:06<00:08,  1.22it/s][A
 41%|████      | 7/17 [00:06<00:06,  1.60it/s][A
 47%|████▋     | 8/17 [00:06<00:04,  2.08it/s][A
 53%|█████▎    | 9/17 [00:08<00:07,  1.09it/s][A
 59%|█████▉    | 10/17 [00:08<00:04,  1.47it/s][A
 76%|███████▋  | 13/17 [00:10<00:02,  1.41it/s][A
100%|██████████| 17/17 [00:11<00:00,  1.49it/s][A
Epochs:  87%|████████▋ | 48/55 [1:34:40<11:46, 100.97s/it]

Val Loss: 9.4783 - Val Accuracy: 0.9624



Training:   0%|          | 0/131 [00:00<?, ?it/s][A
Training:   1%|          | 1/131 [00:03<06:46,  3.13s/it][A
Training:   2%|▏         | 2/131 [00:03<02:59,  1.39s/it][A
Training:   3%|▎         | 4/131 [00:03<01:12,  1.74it/s][A
Training:   4%|▍         | 5/131 [00:05<02:09,  1.03s/it][A
Training:   5%|▍         | 6/131 [00:05<01:35,  1.31it/s][A
Training:   5%|▌         | 7/131 [00:05<01:11,  1.73it/s][A
Training:   6%|▌         | 8/131 [00:06<00:55,  2.21it/s][A
Training:   7%|▋         | 9/131 [00:08<01:53,  1.08it/s][A
Training:   8%|▊         | 10/131 [00:08<01:25,  1.41it/s][A
Training:   8%|▊         | 11/131 [00:08<01:05,  1.84it/s][A
Training:   9%|▉         | 12/131 [00:08<00:49,  2.43it/s][A
Training:  10%|▉         | 13/131 [00:10<01:47,  1.10it/s][A
Training:  11%|█         | 14/131 [00:11<01:31,  1.28it/s][A
Training:  12%|█▏        | 16/131 [00:11<00:51,  2.22it/s][A
Training:  13%|█▎        | 17/131 [00:13<01:50,  1.03it/s][A
Training:  14%|█▎       

Epoch: 49/55 - Loss: 6.8405 - Accuracy: 0.9716



  0%|          | 0/17 [00:00<?, ?it/s][A
  6%|▌         | 1/17 [00:03<00:48,  3.02s/it][A
 12%|█▏        | 2/17 [00:03<00:20,  1.40s/it][A
 29%|██▉       | 5/17 [00:05<00:10,  1.10it/s][A
 35%|███▌      | 6/17 [00:05<00:08,  1.30it/s][A
 53%|█████▎    | 9/17 [00:07<00:05,  1.44it/s][A
 59%|█████▉    | 10/17 [00:08<00:04,  1.56it/s][A
 65%|██████▍   | 11/17 [00:08<00:03,  1.92it/s][A
 76%|███████▋  | 13/17 [00:10<00:02,  1.42it/s][A
 82%|████████▏ | 14/17 [00:10<00:01,  1.57it/s][A
100%|██████████| 17/17 [00:11<00:00,  1.53it/s][A
Epochs:  89%|████████▉ | 49/55 [1:36:22<10:07, 101.17s/it]

Val Loss: 9.3015 - Val Accuracy: 0.9630



Training:   0%|          | 0/131 [00:00<?, ?it/s][A
Training:   1%|          | 1/131 [00:03<07:01,  3.25s/it][A
Training:   2%|▏         | 3/131 [00:03<01:52,  1.13it/s][A
Training:   4%|▍         | 5/131 [00:05<02:10,  1.04s/it][A
Training:   5%|▌         | 7/131 [00:05<01:18,  1.59it/s][A
Training:   7%|▋         | 9/131 [00:08<01:44,  1.17it/s][A
Training:   8%|▊         | 10/131 [00:08<01:24,  1.43it/s][A
Training:   8%|▊         | 11/131 [00:08<01:07,  1.78it/s][A
Training:   9%|▉         | 12/131 [00:08<00:53,  2.22it/s][A
Training:  10%|▉         | 13/131 [00:11<01:53,  1.04it/s][A
Training:  11%|█▏        | 15/131 [00:11<01:08,  1.69it/s][A
Training:  13%|█▎        | 17/131 [00:13<01:36,  1.18it/s][A
Training:  14%|█▎        | 18/131 [00:13<01:18,  1.44it/s][A
Training:  16%|█▌        | 21/131 [00:16<01:20,  1.37it/s][A
Training:  17%|█▋        | 22/131 [00:16<01:10,  1.54it/s][A
Training:  19%|█▉        | 25/131 [00:18<01:14,  1.42it/s][A
Training:  20%|█▉    

Epoch: 50/55 - Loss: 6.8859 - Accuracy: 0.9712



  0%|          | 0/17 [00:00<?, ?it/s][A
  6%|▌         | 1/17 [00:03<00:53,  3.35s/it][A
 18%|█▊        | 3/17 [00:03<00:12,  1.08it/s][A
 29%|██▉       | 5/17 [00:05<00:11,  1.03it/s][A
 41%|████      | 7/17 [00:05<00:05,  1.69it/s][A
 53%|█████▎    | 9/17 [00:07<00:06,  1.27it/s][A
 59%|█████▉    | 10/17 [00:08<00:04,  1.48it/s][A
 71%|███████   | 12/17 [00:08<00:02,  2.22it/s][A
 76%|███████▋  | 13/17 [00:10<00:03,  1.26it/s][A
 82%|████████▏ | 14/17 [00:10<00:01,  1.55it/s][A
 94%|█████████▍| 16/17 [00:10<00:00,  2.43it/s][A
100%|██████████| 17/17 [00:11<00:00,  1.53it/s][A
Epochs:  91%|█████████ | 50/55 [1:38:04<08:27, 101.50s/it]

Val Loss: 10.9451 - Val Accuracy: 0.9584



Training:   0%|          | 0/131 [00:00<?, ?it/s][A
Training:   1%|          | 1/131 [00:02<05:40,  2.62s/it][A
Training:   2%|▏         | 2/131 [00:02<02:46,  1.29s/it][A
Training:   2%|▏         | 3/131 [00:03<01:37,  1.32it/s][A
Training:   3%|▎         | 4/131 [00:03<01:03,  2.01it/s][A
Training:   4%|▍         | 5/131 [00:05<02:03,  1.02it/s][A
Training:   5%|▍         | 6/131 [00:05<01:34,  1.32it/s][A
Training:   6%|▌         | 8/131 [00:05<00:54,  2.27it/s][A
Training:   7%|▋         | 9/131 [00:07<01:45,  1.16it/s][A
Training:   8%|▊         | 10/131 [00:08<01:36,  1.25it/s][A
Training:   9%|▉         | 12/131 [00:08<00:57,  2.06it/s][A
Training:  10%|▉         | 13/131 [00:10<01:39,  1.18it/s][A
Training:  11%|█         | 14/131 [00:11<01:31,  1.27it/s][A
Training:  12%|█▏        | 16/131 [00:11<00:55,  2.09it/s][A
Training:  13%|█▎        | 17/131 [00:13<01:31,  1.24it/s][A
Training:  14%|█▎        | 18/131 [00:13<01:27,  1.29it/s][A
Training:  15%|█▌       

Epoch: 51/55 - Loss: 6.9420 - Accuracy: 0.9711



  0%|          | 0/17 [00:00<?, ?it/s][A
  6%|▌         | 1/17 [00:02<00:47,  2.99s/it][A
 18%|█▊        | 3/17 [00:03<00:11,  1.19it/s][A
 29%|██▉       | 5/17 [00:05<00:11,  1.02it/s][A
 41%|████      | 7/17 [00:05<00:06,  1.66it/s][A
 53%|█████▎    | 9/17 [00:07<00:06,  1.22it/s][A
 65%|██████▍   | 11/17 [00:08<00:03,  1.78it/s][A
 76%|███████▋  | 13/17 [00:10<00:02,  1.34it/s][A
 88%|████████▊ | 15/17 [00:10<00:01,  1.87it/s][A
100%|██████████| 17/17 [00:11<00:00,  1.53it/s][A
Epochs:  93%|█████████▎| 51/55 [1:39:46<06:46, 101.57s/it]

Val Loss: 9.2788 - Val Accuracy: 0.9647



Training:   0%|          | 0/131 [00:00<?, ?it/s][A
Training:   1%|          | 1/131 [00:03<06:39,  3.07s/it][A
Training:   2%|▏         | 3/131 [00:03<01:47,  1.19it/s][A
Training:   4%|▍         | 5/131 [00:05<02:11,  1.05s/it][A
Training:   5%|▌         | 7/131 [00:05<01:20,  1.55it/s][A
Training:   7%|▋         | 9/131 [00:08<01:48,  1.13it/s][A
Training:   8%|▊         | 10/131 [00:08<01:30,  1.34it/s][A
Training:   8%|▊         | 11/131 [00:08<01:11,  1.67it/s][A
Training:  10%|▉         | 13/131 [00:11<01:38,  1.20it/s][A
Training:  11%|█▏        | 15/131 [00:11<01:05,  1.78it/s][A
Training:  13%|█▎        | 17/131 [00:13<01:30,  1.27it/s][A
Training:  15%|█▍        | 19/131 [00:13<01:01,  1.81it/s][A
Training:  16%|█▌        | 21/131 [00:16<01:30,  1.22it/s][A
Training:  18%|█▊        | 23/131 [00:16<01:03,  1.70it/s][A
Training:  19%|█▉        | 25/131 [00:19<01:26,  1.22it/s][A
Training:  21%|██        | 27/131 [00:19<01:00,  1.71it/s][A
Training:  22%|██▏   

Epoch: 52/55 - Loss: 6.7408 - Accuracy: 0.9737



  0%|          | 0/17 [00:00<?, ?it/s][A
  6%|▌         | 1/17 [00:02<00:44,  2.81s/it][A
 12%|█▏        | 2/17 [00:02<00:18,  1.23s/it][A
 24%|██▎       | 4/17 [00:03<00:06,  1.97it/s][A
 29%|██▉       | 5/17 [00:05<00:12,  1.03s/it][A
 41%|████      | 7/17 [00:05<00:06,  1.63it/s][A
 53%|█████▎    | 9/17 [00:07<00:06,  1.23it/s][A
 65%|██████▍   | 11/17 [00:07<00:03,  1.86it/s][A
 71%|███████   | 12/17 [00:08<00:02,  2.21it/s][A
 76%|███████▋  | 13/17 [00:10<00:03,  1.24it/s][A
 88%|████████▊ | 15/17 [00:10<00:01,  1.89it/s][A
100%|██████████| 17/17 [00:10<00:00,  1.58it/s][A
Epochs:  95%|█████████▍| 52/55 [1:41:27<05:04, 101.56s/it]

Val Loss: 8.7346 - Val Accuracy: 0.9624



Training:   0%|          | 0/131 [00:00<?, ?it/s][A
Training:   1%|          | 1/131 [00:03<06:51,  3.17s/it][A
Training:   2%|▏         | 2/131 [00:03<02:58,  1.39s/it][A
Training:   2%|▏         | 3/131 [00:03<01:44,  1.22it/s][A
Training:   4%|▍         | 5/131 [00:06<02:23,  1.14s/it][A
Training:   6%|▌         | 8/131 [00:06<01:06,  1.86it/s][A
Training:   8%|▊         | 10/131 [00:09<01:39,  1.21it/s][A
Training:   8%|▊         | 11/131 [00:09<01:22,  1.46it/s][A
Training:  10%|▉         | 13/131 [00:11<01:42,  1.15it/s][A
Training:  11%|█▏        | 15/131 [00:11<01:11,  1.63it/s][A
Training:  13%|█▎        | 17/131 [00:14<01:31,  1.25it/s][A
Training:  14%|█▎        | 18/131 [00:14<01:15,  1.49it/s][A
Training:  15%|█▍        | 19/131 [00:14<01:05,  1.72it/s][A
Training:  16%|█▌        | 21/131 [00:16<01:28,  1.24it/s][A
Training:  18%|█▊        | 23/131 [00:17<01:03,  1.70it/s][A
Training:  18%|█▊        | 24/131 [00:17<00:52,  2.03it/s][A
Training:  19%|█▉    

Epoch: 53/55 - Loss: 7.1111 - Accuracy: 0.9709



  0%|          | 0/17 [00:00<?, ?it/s][A
  6%|▌         | 1/17 [00:02<00:46,  2.88s/it][A
 12%|█▏        | 2/17 [00:02<00:18,  1.25s/it][A
 24%|██▎       | 4/17 [00:03<00:06,  1.97it/s][A
 29%|██▉       | 5/17 [00:05<00:12,  1.04s/it][A
 35%|███▌      | 6/17 [00:05<00:08,  1.32it/s][A
 53%|█████▎    | 9/17 [00:07<00:06,  1.30it/s][A
 65%|██████▍   | 11/17 [00:07<00:03,  1.90it/s][A
 76%|███████▋  | 13/17 [00:10<00:02,  1.43it/s][A
100%|██████████| 17/17 [00:10<00:00,  1.59it/s][A
Epochs:  96%|█████████▋| 53/55 [1:43:08<03:22, 101.36s/it]

Val Loss: 9.9744 - Val Accuracy: 0.9584



Training:   0%|          | 0/131 [00:00<?, ?it/s][A
Training:   1%|          | 1/131 [00:03<07:02,  3.25s/it][A
Training:   3%|▎         | 4/131 [00:03<01:26,  1.47it/s][A
Training:   4%|▍         | 5/131 [00:06<02:31,  1.20s/it][A
Training:   5%|▍         | 6/131 [00:06<01:52,  1.12it/s][A
Training:   5%|▌         | 7/131 [00:06<01:24,  1.47it/s][A
Training:   7%|▋         | 9/131 [00:08<01:55,  1.06it/s][A
Training:   8%|▊         | 11/131 [00:09<01:12,  1.66it/s][A
Training:  10%|▉         | 13/131 [00:11<01:40,  1.17it/s][A
Training:  11%|█         | 14/131 [00:11<01:21,  1.43it/s][A
Training:  11%|█▏        | 15/131 [00:11<01:05,  1.76it/s][A
Training:  13%|█▎        | 17/131 [00:14<01:36,  1.18it/s][A
Training:  15%|█▌        | 20/131 [00:14<00:53,  2.07it/s][A
Training:  17%|█▋        | 22/131 [00:17<01:19,  1.37it/s][A
Training:  19%|█▉        | 25/131 [00:19<01:22,  1.28it/s][A
Training:  20%|█▉        | 26/131 [00:19<01:13,  1.43it/s][A
Training:  21%|██▏    

Epoch: 54/55 - Loss: 7.4406 - Accuracy: 0.9704



  0%|          | 0/17 [00:00<?, ?it/s][A
  6%|▌         | 1/17 [00:02<00:47,  2.98s/it][A
 24%|██▎       | 4/17 [00:03<00:07,  1.69it/s][A
 35%|███▌      | 6/17 [00:05<00:09,  1.15it/s][A
 47%|████▋     | 8/17 [00:05<00:05,  1.78it/s][A
 59%|█████▉    | 10/17 [00:08<00:05,  1.29it/s][A
 71%|███████   | 12/17 [00:08<00:02,  1.87it/s][A
 82%|████████▏ | 14/17 [00:10<00:02,  1.43it/s][A
100%|██████████| 17/17 [00:10<00:00,  1.56it/s][A
Epochs:  98%|█████████▊| 54/55 [1:44:50<01:41, 101.30s/it]

Val Loss: 9.3067 - Val Accuracy: 0.9606



Training:   0%|          | 0/131 [00:00<?, ?it/s][A
Training:   1%|          | 1/131 [00:03<06:48,  3.14s/it][A
Training:   2%|▏         | 3/131 [00:03<01:50,  1.16it/s][A
Training:   4%|▍         | 5/131 [00:05<02:19,  1.10s/it][A
Training:   5%|▍         | 6/131 [00:06<01:47,  1.16it/s][A
Training:   5%|▌         | 7/131 [00:06<01:22,  1.51it/s][A
Training:   7%|▋         | 9/131 [00:08<01:46,  1.15it/s][A
Training:   8%|▊         | 10/131 [00:08<01:25,  1.42it/s][A
Training:   9%|▉         | 12/131 [00:08<00:52,  2.28it/s][A
Training:  10%|▉         | 13/131 [00:11<01:47,  1.10it/s][A
Training:  11%|█         | 14/131 [00:11<01:30,  1.29it/s][A
Training:  12%|█▏        | 16/131 [00:11<00:55,  2.07it/s][A
Training:  13%|█▎        | 17/131 [00:14<01:46,  1.07it/s][A
Training:  14%|█▎        | 18/131 [00:14<01:23,  1.36it/s][A
Training:  15%|█▌        | 20/131 [00:14<00:50,  2.20it/s][A
Training:  17%|█▋        | 22/131 [00:17<01:29,  1.22it/s][A
Training:  18%|█▊     

Epoch: 55/55 - Loss: 6.7315 - Accuracy: 0.9720



  0%|          | 0/17 [00:00<?, ?it/s][A
  6%|▌         | 1/17 [00:03<00:49,  3.10s/it][A
 12%|█▏        | 2/17 [00:03<00:20,  1.35s/it][A
 29%|██▉       | 5/17 [00:05<00:11,  1.04it/s][A
 47%|████▋     | 8/17 [00:05<00:04,  2.03it/s][A
 59%|█████▉    | 10/17 [00:08<00:05,  1.40it/s][A
 76%|███████▋  | 13/17 [00:10<00:02,  1.40it/s][A
100%|██████████| 17/17 [00:10<00:00,  1.56it/s][A
Epochs: 100%|██████████| 55/55 [1:46:31<00:00, 116.21s/it]


Val Loss: 8.3335 - Val Accuracy: 0.9602


[32m[I 2023-12-08 21:46:18,545][0m Trial 16 finished with value: 0.960151195526123 and parameters: {'loss_learning_rate': 0.009182383596361456, 'learning_rate': 0.0005227903627863731, 'weight_decay': 0.00022533397273366494, 'epsilon': 8.488395942056724e-08, 'beta': 1.0, 'gamma': 0.7000000000000001, 'batch_size': 107, 'epochs': 55}. Best is trial 15 with value: 0.9649122357368469.[0m


Learning rate for Loss: 0.008447568694221697
Learning rate: 0.000633457353251843
Weight decay: 0.001876909923779263
Epsilon: 9.402328890865692e-08
Beta: 0.8
Gamma: 0.9
Batch size: 266
Number of epochs: 37


Epochs:   0%|          | 0/37 [00:00<?, ?it/s]
Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:07<06:25,  7.41s/it][A
Training:   6%|▌         | 3/53 [00:07<01:39,  1.99s/it][A
Training:   8%|▊         | 4/53 [00:07<01:05,  1.34s/it][A
Training:   9%|▉         | 5/53 [00:14<02:23,  2.98s/it][A
Training:  11%|█▏        | 6/53 [00:14<01:38,  2.10s/it][A
Training:  13%|█▎        | 7/53 [00:14<01:09,  1.50s/it][A
Training:  17%|█▋        | 9/53 [00:20<01:38,  2.23s/it][A
Training:  19%|█▉        | 10/53 [00:20<01:16,  1.78s/it][A
Training:  21%|██        | 11/53 [00:21<00:55,  1.33s/it][A
Training:  25%|██▍       | 13/53 [00:27<01:25,  2.14s/it][A
Training:  26%|██▋       | 14/53 [00:27<01:06,  1.70s/it][A
Training:  28%|██▊       | 15/53 [00:27<00:49,  1.31s/it][A
Training:  32%|███▏      | 17/53 [00:34<01:13,  2.04s/it][A
Training:  36%|███▌      | 19/53 [00:34<00:46,  1.38s/it][A
Training:  40%|███▉      | 21/53 [00:40<01:04,  2.00s/

Epoch: 1/37 - Loss: 16.3506 - Accuracy: 0.8776



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:06<00:38,  6.50s/it][A
 29%|██▊       | 2/7 [00:06<00:13,  2.75s/it][A
 57%|█████▋    | 4/7 [00:06<00:03,  1.08s/it][A
 71%|███████▏  | 5/7 [00:11<00:04,  2.33s/it][A
 86%|████████▌ | 6/7 [00:12<00:01,  1.65s/it][A
100%|██████████| 7/7 [00:12<00:00,  1.76s/it][A
Epochs:   3%|▎         | 1/37 [01:43<1:02:17, 103.83s/it]

Val Loss: 8.0060 - Val Accuracy: 0.9545



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:07<06:36,  7.63s/it][A
Training:   4%|▍         | 2/53 [00:07<02:45,  3.24s/it][A
Training:   6%|▌         | 3/53 [00:07<01:31,  1.82s/it][A
Training:   8%|▊         | 4/53 [00:08<00:56,  1.16s/it][A
Training:   9%|▉         | 5/53 [00:14<02:22,  2.96s/it][A
Training:  11%|█▏        | 6/53 [00:14<01:33,  2.00s/it][A
Training:  15%|█▌        | 8/53 [00:14<00:47,  1.06s/it][A
Training:  17%|█▋        | 9/53 [00:21<01:50,  2.52s/it][A
Training:  19%|█▉        | 10/53 [00:21<01:21,  1.90s/it][A
Training:  21%|██        | 11/53 [00:21<01:00,  1.44s/it][A
Training:  23%|██▎       | 12/53 [00:21<00:44,  1.08s/it][A
Training:  25%|██▍       | 13/53 [00:27<01:38,  2.46s/it][A
Training:  26%|██▋       | 14/53 [00:27<01:09,  1.77s/it][A
Training:  30%|███       | 16/53 [00:27<00:36,  1.00it/s][A
Training:  32%|███▏      | 17/53 [00:34<01:23,  2.33s/it][A
Training:  34%|███▍      | 18/53 [00:34<

Epoch: 2/37 - Loss: 7.3917 - Accuracy: 0.9577



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:06<00:37,  6.24s/it][A
 29%|██▊       | 2/7 [00:06<00:13,  2.70s/it][A
 43%|████▎     | 3/7 [00:06<00:06,  1.51s/it][A
 71%|███████▏  | 5/7 [00:11<00:04,  2.09s/it][A
100%|██████████| 7/7 [00:12<00:00,  1.72s/it][A
Epochs:   5%|▌         | 2/37 [03:27<1:00:35, 103.88s/it]

Val Loss: 7.2965 - Val Accuracy: 0.9604



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:07<06:40,  7.71s/it][A
Training:   6%|▌         | 3/53 [00:07<01:43,  2.08s/it][A
Training:   9%|▉         | 5/53 [00:14<02:06,  2.64s/it][A
Training:  11%|█▏        | 6/53 [00:14<01:33,  2.00s/it][A
Training:  13%|█▎        | 7/53 [00:14<01:08,  1.48s/it][A
Training:  15%|█▌        | 8/53 [00:14<00:49,  1.10s/it][A
Training:  17%|█▋        | 9/53 [00:20<01:52,  2.57s/it][A
Training:  19%|█▉        | 10/53 [00:21<01:19,  1.86s/it][A
Training:  21%|██        | 11/53 [00:21<00:56,  1.35s/it][A
Training:  23%|██▎       | 12/53 [00:21<00:40,  1.02it/s][A
Training:  25%|██▍       | 13/53 [00:27<01:40,  2.51s/it][A
Training:  26%|██▋       | 14/53 [00:28<01:15,  1.93s/it][A
Training:  28%|██▊       | 15/53 [00:28<00:53,  1.41s/it][A
Training:  32%|███▏      | 17/53 [00:34<01:18,  2.17s/it][A
Training:  34%|███▍      | 18/53 [00:34<00:59,  1.70s/it][A
Training:  38%|███▊      | 20/53 [00:34

Epoch: 3/37 - Loss: 6.2495 - Accuracy: 0.9624



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:06<00:40,  6.77s/it][A
 29%|██▊       | 2/7 [00:06<00:14,  2.86s/it][A
 57%|█████▋    | 4/7 [00:07<00:03,  1.12s/it][A
 71%|███████▏  | 5/7 [00:12<00:04,  2.38s/it][A
100%|██████████| 7/7 [00:12<00:00,  1.80s/it][A
Epochs:   8%|▊         | 3/37 [05:11<58:43, 103.64s/it]  

Val Loss: 6.2676 - Val Accuracy: 0.9573



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:07<06:20,  7.32s/it][A
Training:   4%|▍         | 2/53 [00:07<02:42,  3.18s/it][A
Training:   6%|▌         | 3/53 [00:07<01:30,  1.82s/it][A
Training:   8%|▊         | 4/53 [00:07<00:57,  1.17s/it][A
Training:   9%|▉         | 5/53 [00:14<02:22,  2.97s/it][A
Training:  11%|█▏        | 6/53 [00:14<01:36,  2.05s/it][A
Training:  13%|█▎        | 7/53 [00:14<01:08,  1.50s/it][A
Training:  15%|█▌        | 8/53 [00:14<00:47,  1.07s/it][A
Training:  17%|█▋        | 9/53 [00:20<01:52,  2.57s/it][A
Training:  19%|█▉        | 10/53 [00:20<01:18,  1.82s/it][A
Training:  21%|██        | 11/53 [00:21<01:00,  1.45s/it][A
Training:  23%|██▎       | 12/53 [00:21<00:43,  1.06s/it][A
Training:  25%|██▍       | 13/53 [00:27<01:40,  2.51s/it][A
Training:  28%|██▊       | 15/53 [00:28<00:56,  1.48s/it][A
Training:  30%|███       | 16/53 [00:28<00:42,  1.14s/it][A
Training:  32%|███▏      | 17/53 [00:34<0

Epoch: 4/37 - Loss: 5.7437 - Accuracy: 0.9642



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:06<00:39,  6.62s/it][A
 29%|██▊       | 2/7 [00:06<00:14,  2.84s/it][A
 57%|█████▋    | 4/7 [00:06<00:03,  1.11s/it][A
 71%|███████▏  | 5/7 [00:12<00:04,  2.45s/it][A
100%|██████████| 7/7 [00:12<00:00,  1.82s/it][A
Epochs:  11%|█         | 4/37 [06:54<56:52, 103.42s/it]

Val Loss: 5.9611 - Val Accuracy: 0.9626



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:08<06:56,  8.01s/it][A
Training:   4%|▍         | 2/53 [00:08<02:51,  3.37s/it][A
Training:   6%|▌         | 3/53 [00:08<01:34,  1.88s/it][A
Training:   9%|▉         | 5/53 [00:14<02:02,  2.56s/it][A
Training:  11%|█▏        | 6/53 [00:14<01:28,  1.89s/it][A
Training:  15%|█▌        | 8/53 [00:14<00:48,  1.07s/it][A
Training:  17%|█▋        | 9/53 [00:21<01:45,  2.40s/it][A
Training:  19%|█▉        | 10/53 [00:21<01:17,  1.81s/it][A
Training:  23%|██▎       | 12/53 [00:21<00:44,  1.08s/it][A
Training:  25%|██▍       | 13/53 [00:28<01:34,  2.36s/it][A
Training:  28%|██▊       | 15/53 [00:28<00:54,  1.45s/it][A
Training:  30%|███       | 16/53 [00:28<00:42,  1.16s/it][A
Training:  32%|███▏      | 17/53 [00:35<01:28,  2.46s/it][A
Training:  34%|███▍      | 18/53 [00:35<01:05,  1.86s/it][A
Training:  36%|███▌      | 19/53 [00:35<00:47,  1.39s/it][A
Training:  40%|███▉      | 21/53 [00:41

Epoch: 5/37 - Loss: 5.3301 - Accuracy: 0.9653



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:06<00:39,  6.54s/it][A
 29%|██▊       | 2/7 [00:06<00:13,  2.77s/it][A
 43%|████▎     | 3/7 [00:06<00:06,  1.55s/it][A
 57%|█████▋    | 4/7 [00:06<00:02,  1.00it/s][A
 71%|███████▏  | 5/7 [00:12<00:05,  2.56s/it][A
100%|██████████| 7/7 [00:12<00:00,  1.80s/it][A
Epochs:  14%|█▎        | 5/37 [08:38<55:17, 103.67s/it]

Val Loss: 5.7441 - Val Accuracy: 0.9615



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:07<06:26,  7.43s/it][A
Training:   4%|▍         | 2/53 [00:07<02:48,  3.31s/it][A
Training:   6%|▌         | 3/53 [00:08<01:35,  1.92s/it][A
Training:   8%|▊         | 4/53 [00:08<00:59,  1.22s/it][A
Training:   9%|▉         | 5/53 [00:13<02:14,  2.81s/it][A
Training:  11%|█▏        | 6/53 [00:14<01:36,  2.05s/it][A
Training:  13%|█▎        | 7/53 [00:14<01:09,  1.51s/it][A
Training:  15%|█▌        | 8/53 [00:15<00:48,  1.08s/it][A
Training:  17%|█▋        | 9/53 [00:20<01:53,  2.58s/it][A
Training:  19%|█▉        | 10/53 [00:21<01:22,  1.92s/it][A
Training:  21%|██        | 11/53 [00:22<01:04,  1.54s/it][A
Training:  23%|██▎       | 12/53 [00:22<00:45,  1.10s/it][A
Training:  25%|██▍       | 13/53 [00:27<01:37,  2.43s/it][A
Training:  26%|██▋       | 14/53 [00:28<01:17,  1.98s/it][A
Training:  28%|██▊       | 15/53 [00:28<00:55,  1.45s/it][A
Training:  30%|███       | 16/53 [00:28<0

Epoch: 6/37 - Loss: 5.1881 - Accuracy: 0.9671



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:06<00:40,  6.81s/it][A
 29%|██▊       | 2/7 [00:07<00:14,  2.92s/it][A
 43%|████▎     | 3/7 [00:07<00:06,  1.65s/it][A
 57%|█████▋    | 4/7 [00:07<00:03,  1.04s/it][A
 71%|███████▏  | 5/7 [00:12<00:05,  2.55s/it][A
100%|██████████| 7/7 [00:12<00:00,  1.84s/it][A
Epochs:  16%|█▌        | 6/37 [10:22<53:40, 103.87s/it]

Val Loss: 5.7624 - Val Accuracy: 0.9627



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:07<06:31,  7.53s/it][A
Training:   4%|▍         | 2/53 [00:07<02:43,  3.22s/it][A
Training:   6%|▌         | 3/53 [00:07<01:31,  1.84s/it][A
Training:   9%|▉         | 5/53 [00:14<02:07,  2.65s/it][A
Training:  11%|█▏        | 6/53 [00:14<01:31,  1.95s/it][A
Training:  15%|█▌        | 8/53 [00:14<00:49,  1.11s/it][A
Training:  17%|█▋        | 9/53 [00:21<01:43,  2.36s/it][A
Training:  19%|█▉        | 10/53 [00:21<01:18,  1.83s/it][A
Training:  21%|██        | 11/53 [00:21<00:57,  1.37s/it][A
Training:  23%|██▎       | 12/53 [00:21<00:42,  1.03s/it][A
Training:  25%|██▍       | 13/53 [00:27<01:40,  2.51s/it][A
Training:  26%|██▋       | 14/53 [00:28<01:12,  1.87s/it][A
Training:  28%|██▊       | 15/53 [00:28<00:52,  1.38s/it][A
Training:  30%|███       | 16/53 [00:28<00:37,  1.00s/it][A
Training:  32%|███▏      | 17/53 [00:34<01:29,  2.50s/it][A
Training:  34%|███▍      | 18/53 [00:35

Epoch: 7/37 - Loss: 4.8593 - Accuracy: 0.9672



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:06<00:40,  6.82s/it][A
 43%|████▎     | 3/7 [00:06<00:07,  1.83s/it][A
 71%|███████▏  | 5/7 [00:12<00:04,  2.30s/it][A
100%|██████████| 7/7 [00:12<00:00,  1.82s/it][A
Epochs:  19%|█▉        | 7/37 [12:06<52:00, 104.02s/it]

Val Loss: 6.8508 - Val Accuracy: 0.9556



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:07<06:20,  7.32s/it][A
Training:   6%|▌         | 3/53 [00:07<01:38,  1.97s/it][A
Training:   9%|▉         | 5/53 [00:14<02:09,  2.69s/it][A
Training:  13%|█▎        | 7/53 [00:14<01:13,  1.60s/it][A
Training:  17%|█▋        | 9/53 [00:20<01:37,  2.22s/it][A
Training:  21%|██        | 11/53 [00:21<01:02,  1.49s/it][A
Training:  25%|██▍       | 13/53 [00:27<01:23,  2.09s/it][A
Training:  28%|██▊       | 15/53 [00:28<00:55,  1.47s/it][A
Training:  30%|███       | 16/53 [00:28<00:44,  1.22s/it][A
Training:  32%|███▏      | 17/53 [00:34<01:25,  2.36s/it][A
Training:  34%|███▍      | 18/53 [00:35<01:04,  1.84s/it][A
Training:  36%|███▌      | 19/53 [00:35<00:47,  1.41s/it][A
Training:  38%|███▊      | 20/53 [00:35<00:35,  1.07s/it][A
Training:  40%|███▉      | 21/53 [00:41<01:20,  2.50s/it][A
Training:  42%|████▏     | 22/53 [00:41<00:57,  1.85s/it][A
Training:  45%|████▌     | 24/53 [00:

Epoch: 8/37 - Loss: 4.9530 - Accuracy: 0.9673



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:06<00:40,  6.81s/it][A
 29%|██▊       | 2/7 [00:07<00:15,  3.02s/it][A
 57%|█████▋    | 4/7 [00:07<00:03,  1.19s/it][A
 71%|███████▏  | 5/7 [00:12<00:04,  2.33s/it][A
100%|██████████| 7/7 [00:12<00:00,  1.82s/it][A
Epochs:  22%|██▏       | 8/37 [13:50<50:13, 103.92s/it]

Val Loss: 6.1687 - Val Accuracy: 0.9687



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:07<06:41,  7.71s/it][A
Training:   4%|▍         | 2/53 [00:08<02:51,  3.37s/it][A
Training:   8%|▊         | 4/53 [00:08<01:04,  1.32s/it][A
Training:   9%|▉         | 5/53 [00:14<02:17,  2.87s/it][A
Training:  11%|█▏        | 6/53 [00:15<01:41,  2.16s/it][A
Training:  15%|█▌        | 8/53 [00:15<00:53,  1.18s/it][A
Training:  17%|█▋        | 9/53 [00:21<01:46,  2.42s/it][A
Training:  19%|█▉        | 10/53 [00:21<01:21,  1.89s/it][A
Training:  21%|██        | 11/53 [00:22<00:59,  1.43s/it][A
Training:  23%|██▎       | 12/53 [00:22<00:43,  1.06s/it][A
Training:  25%|██▍       | 13/53 [00:28<01:43,  2.60s/it][A
Training:  26%|██▋       | 14/53 [00:28<01:13,  1.89s/it][A
Training:  30%|███       | 16/53 [00:28<00:39,  1.07s/it][A
Training:  32%|███▏      | 17/53 [00:35<01:24,  2.34s/it][A
Training:  34%|███▍      | 18/53 [00:35<01:02,  1.80s/it][A
Training:  36%|███▌      | 19/53 [00:35

Epoch: 9/37 - Loss: 4.9170 - Accuracy: 0.9688



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:06<00:40,  6.74s/it][A
 43%|████▎     | 3/7 [00:06<00:07,  1.80s/it][A
 71%|███████▏  | 5/7 [00:12<00:04,  2.30s/it][A
100%|██████████| 7/7 [00:12<00:00,  1.83s/it][A
Epochs:  24%|██▍       | 9/37 [15:34<48:30, 103.93s/it]

Val Loss: 5.3337 - Val Accuracy: 0.9684



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:07<06:48,  7.85s/it][A
Training:   4%|▍         | 2/53 [00:08<02:53,  3.39s/it][A
Training:   6%|▌         | 3/53 [00:08<01:35,  1.91s/it][A
Training:   8%|▊         | 4/53 [00:08<00:58,  1.20s/it][A
Training:   9%|▉         | 5/53 [00:14<02:27,  3.07s/it][A
Training:  11%|█▏        | 6/53 [00:14<01:36,  2.06s/it][A
Training:  15%|█▌        | 8/53 [00:15<00:49,  1.10s/it][A
Training:  17%|█▋        | 9/53 [00:21<01:49,  2.49s/it][A
Training:  21%|██        | 11/53 [00:21<01:01,  1.46s/it][A
Training:  25%|██▍       | 13/53 [00:27<01:23,  2.10s/it][A
Training:  26%|██▋       | 14/53 [00:28<01:08,  1.75s/it][A
Training:  28%|██▊       | 15/53 [00:28<00:52,  1.37s/it][A
Training:  30%|███       | 16/53 [00:28<00:40,  1.09s/it][A
Training:  32%|███▏      | 17/53 [00:34<01:26,  2.41s/it][A
Training:  34%|███▍      | 18/53 [00:35<01:04,  1.85s/it][A
Training:  36%|███▌      | 19/53 [00:35<

Epoch: 10/37 - Loss: 4.7845 - Accuracy: 0.9669



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:06<00:38,  6.34s/it][A
 29%|██▊       | 2/7 [00:06<00:13,  2.75s/it][A
 43%|████▎     | 3/7 [00:06<00:06,  1.54s/it][A
 57%|█████▋    | 4/7 [00:06<00:02,  1.01it/s][A
 71%|███████▏  | 5/7 [00:12<00:05,  2.51s/it][A
100%|██████████| 7/7 [00:12<00:00,  1.77s/it][A
Epochs:  27%|██▋       | 10/37 [17:17<46:40, 103.72s/it]

Val Loss: 5.7220 - Val Accuracy: 0.9601



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:07<06:35,  7.60s/it][A
Training:   4%|▍         | 2/53 [00:07<02:46,  3.26s/it][A
Training:   6%|▌         | 3/53 [00:07<01:32,  1.85s/it][A
Training:   9%|▉         | 5/53 [00:14<02:05,  2.62s/it][A
Training:  11%|█▏        | 6/53 [00:14<01:29,  1.90s/it][A
Training:  13%|█▎        | 7/53 [00:14<01:04,  1.40s/it][A
Training:  15%|█▌        | 8/53 [00:14<00:46,  1.04s/it][A
Training:  17%|█▋        | 9/53 [00:20<01:50,  2.51s/it][A
Training:  19%|█▉        | 10/53 [00:21<01:21,  1.90s/it][A
Training:  21%|██        | 11/53 [00:21<00:58,  1.39s/it][A
Training:  23%|██▎       | 12/53 [00:21<00:42,  1.04s/it][A
Training:  25%|██▍       | 13/53 [00:27<01:36,  2.42s/it][A
Training:  26%|██▋       | 14/53 [00:28<01:14,  1.90s/it][A
Training:  28%|██▊       | 15/53 [00:28<00:53,  1.41s/it][A
Training:  32%|███▏      | 17/53 [00:34<01:15,  2.08s/it][A
Training:  34%|███▍      | 18/53 [00:35<

Epoch: 11/37 - Loss: 4.8409 - Accuracy: 0.9669



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:06<00:40,  6.82s/it][A
 29%|██▊       | 2/7 [00:06<00:14,  2.89s/it][A
 43%|████▎     | 3/7 [00:07<00:06,  1.62s/it][A
 71%|███████▏  | 5/7 [00:12<00:04,  2.34s/it][A
100%|██████████| 7/7 [00:13<00:00,  1.88s/it][A
Epochs:  30%|██▉       | 11/37 [19:01<44:54, 103.63s/it]

Val Loss: 5.4307 - Val Accuracy: 0.9663



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:07<06:38,  7.67s/it][A
Training:   6%|▌         | 3/53 [00:07<01:42,  2.05s/it][A
Training:   8%|▊         | 4/53 [00:07<01:07,  1.38s/it][A
Training:   9%|▉         | 5/53 [00:14<02:28,  3.09s/it][A
Training:  11%|█▏        | 6/53 [00:14<01:42,  2.18s/it][A
Training:  15%|█▌        | 8/53 [00:14<00:52,  1.17s/it][A
Training:  17%|█▋        | 9/53 [00:21<01:51,  2.54s/it][A
Training:  19%|█▉        | 10/53 [00:21<01:21,  1.90s/it][A
Training:  21%|██        | 11/53 [00:21<01:00,  1.43s/it][A
Training:  23%|██▎       | 12/53 [00:21<00:43,  1.06s/it][A
Training:  25%|██▍       | 13/53 [00:27<01:40,  2.51s/it][A
Training:  26%|██▋       | 14/53 [00:28<01:13,  1.89s/it][A
Training:  28%|██▊       | 15/53 [00:28<00:52,  1.38s/it][A
Training:  32%|███▏      | 17/53 [00:34<01:19,  2.21s/it][A
Training:  34%|███▍      | 18/53 [00:35<01:01,  1.75s/it][A
Training:  38%|███▊      | 20/53 [00:35

Epoch: 12/37 - Loss: 4.7646 - Accuracy: 0.9691



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:07<00:42,  7.05s/it][A
 29%|██▊       | 2/7 [00:07<00:15,  3.05s/it][A
 43%|████▎     | 3/7 [00:07<00:06,  1.71s/it][A
 71%|███████▏  | 5/7 [00:12<00:04,  2.26s/it][A
100%|██████████| 7/7 [00:13<00:00,  1.91s/it][A
Epochs:  32%|███▏      | 12/37 [20:45<43:14, 103.79s/it]

Val Loss: 5.2295 - Val Accuracy: 0.9562



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:07<06:39,  7.69s/it][A
Training:   4%|▍         | 2/53 [00:07<02:47,  3.28s/it][A
Training:   6%|▌         | 3/53 [00:08<01:34,  1.90s/it][A
Training:   8%|▊         | 4/53 [00:08<00:58,  1.20s/it][A
Training:   9%|▉         | 5/53 [00:14<02:29,  3.11s/it][A
Training:  11%|█▏        | 6/53 [00:14<01:38,  2.09s/it][A
Training:  13%|█▎        | 7/53 [00:15<01:11,  1.56s/it][A
Training:  17%|█▋        | 9/53 [00:21<01:41,  2.30s/it][A
Training:  19%|█▉        | 10/53 [00:21<01:15,  1.76s/it][A
Training:  21%|██        | 11/53 [00:22<00:57,  1.37s/it][A
Training:  23%|██▎       | 12/53 [00:22<00:41,  1.02s/it][A
Training:  25%|██▍       | 13/53 [00:28<01:40,  2.51s/it][A
Training:  26%|██▋       | 14/53 [00:28<01:11,  1.84s/it][A
Training:  28%|██▊       | 15/53 [00:28<00:53,  1.40s/it][A
Training:  32%|███▏      | 17/53 [00:35<01:18,  2.17s/it][A
Training:  36%|███▌      | 19/53 [00:35<

Epoch: 13/37 - Loss: 4.5934 - Accuracy: 0.9716



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:07<00:43,  7.20s/it][A
 29%|██▊       | 2/7 [00:07<00:15,  3.05s/it][A
 57%|█████▋    | 4/7 [00:07<00:03,  1.19s/it][A
 71%|███████▏  | 5/7 [00:12<00:04,  2.48s/it][A
100%|██████████| 7/7 [00:13<00:00,  1.88s/it][A
Epochs:  35%|███▌      | 13/37 [22:28<41:28, 103.68s/it]

Val Loss: 6.2012 - Val Accuracy: 0.9619



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:08<07:05,  8.18s/it][A
Training:   6%|▌         | 3/53 [00:08<01:49,  2.19s/it][A
Training:   8%|▊         | 4/53 [00:08<01:11,  1.47s/it][A
Training:   9%|▉         | 5/53 [00:14<02:27,  3.08s/it][A
Training:  11%|█▏        | 6/53 [00:15<01:43,  2.20s/it][A
Training:  15%|█▌        | 8/53 [00:15<00:54,  1.21s/it][A
Training:  17%|█▋        | 9/53 [00:21<01:45,  2.41s/it][A
Training:  19%|█▉        | 10/53 [00:22<01:25,  1.98s/it][A
Training:  21%|██        | 11/53 [00:22<01:01,  1.47s/it][A
Training:  23%|██▎       | 12/53 [00:22<00:44,  1.09s/it][A
Training:  25%|██▍       | 13/53 [00:28<01:35,  2.39s/it][A
Training:  26%|██▋       | 14/53 [00:28<01:17,  1.98s/it][A
Training:  28%|██▊       | 15/53 [00:29<00:54,  1.44s/it][A
Training:  32%|███▏      | 17/53 [00:34<01:13,  2.03s/it][A
Training:  34%|███▍      | 18/53 [00:35<00:59,  1.69s/it][A
Training:  38%|███▊      | 20/53 [00:35

Epoch: 14/37 - Loss: 4.8296 - Accuracy: 0.9688



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:06<00:40,  6.79s/it][A
 29%|██▊       | 2/7 [00:06<00:14,  2.85s/it][A
 57%|█████▋    | 4/7 [00:07<00:03,  1.14s/it][A
 71%|███████▏  | 5/7 [00:12<00:04,  2.45s/it][A
100%|██████████| 7/7 [00:12<00:00,  1.85s/it][A
Epochs:  38%|███▊      | 14/37 [24:11<39:36, 103.34s/it]

Val Loss: 6.9354 - Val Accuracy: 0.9609



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:07<06:53,  7.95s/it][A
Training:   4%|▍         | 2/53 [00:08<02:52,  3.39s/it][A
Training:   6%|▌         | 3/53 [00:08<01:36,  1.93s/it][A
Training:   9%|▉         | 5/53 [00:15<02:10,  2.73s/it][A
Training:  11%|█▏        | 6/53 [00:15<01:33,  2.00s/it][A
Training:  13%|█▎        | 7/53 [00:15<01:06,  1.44s/it][A
Training:  17%|█▋        | 9/53 [00:21<01:36,  2.20s/it][A
Training:  19%|█▉        | 10/53 [00:21<01:13,  1.71s/it][A
Training:  21%|██        | 11/53 [00:21<00:55,  1.33s/it][A
Training:  23%|██▎       | 12/53 [00:22<00:41,  1.00s/it][A
Training:  25%|██▍       | 13/53 [00:28<01:39,  2.50s/it][A
Training:  26%|██▋       | 14/53 [00:28<01:11,  1.83s/it][A
Training:  28%|██▊       | 15/53 [00:29<00:54,  1.44s/it][A
Training:  32%|███▏      | 17/53 [00:34<01:15,  2.09s/it][A
Training:  34%|███▍      | 18/53 [00:34<00:56,  1.60s/it][A
Training:  36%|███▌      | 19/53 [00:35

Epoch: 15/37 - Loss: 4.7165 - Accuracy: 0.9693



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:07<00:42,  7.08s/it][A
 29%|██▊       | 2/7 [00:07<00:14,  2.99s/it][A
 43%|████▎     | 3/7 [00:07<00:06,  1.67s/it][A
 71%|███████▏  | 5/7 [00:12<00:04,  2.25s/it][A
100%|██████████| 7/7 [00:12<00:00,  1.86s/it][A
Epochs:  41%|████      | 15/37 [25:55<37:56, 103.49s/it]

Val Loss: 5.9960 - Val Accuracy: 0.9623



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:07<06:27,  7.46s/it][A
Training:   4%|▍         | 2/53 [00:07<02:48,  3.30s/it][A
Training:   6%|▌         | 3/53 [00:07<01:32,  1.85s/it][A
Training:   9%|▉         | 5/53 [00:14<02:03,  2.57s/it][A
Training:  11%|█▏        | 6/53 [00:14<01:29,  1.90s/it][A
Training:  13%|█▎        | 7/53 [00:14<01:06,  1.45s/it][A
Training:  15%|█▌        | 8/53 [00:14<00:47,  1.06s/it][A
Training:  17%|█▋        | 9/53 [00:21<01:53,  2.57s/it][A
Training:  19%|█▉        | 10/53 [00:21<01:19,  1.86s/it][A
Training:  21%|██        | 11/53 [00:21<00:56,  1.35s/it][A
Training:  25%|██▍       | 13/53 [00:28<01:30,  2.27s/it][A
Training:  26%|██▋       | 14/53 [00:28<01:07,  1.73s/it][A
Training:  28%|██▊       | 15/53 [00:28<00:49,  1.31s/it][A
Training:  30%|███       | 16/53 [00:28<00:36,  1.02it/s][A
Training:  32%|███▏      | 17/53 [00:34<01:22,  2.30s/it][A
Training:  34%|███▍      | 18/53 [00:34<

Epoch: 16/37 - Loss: 4.7216 - Accuracy: 0.9707



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:06<00:41,  6.91s/it][A
 29%|██▊       | 2/7 [00:07<00:14,  2.91s/it][A
 43%|████▎     | 3/7 [00:07<00:06,  1.64s/it][A
 57%|█████▋    | 4/7 [00:07<00:03,  1.04s/it][A
 71%|███████▏  | 5/7 [00:12<00:05,  2.61s/it][A
100%|██████████| 7/7 [00:13<00:00,  1.87s/it][A
Epochs:  43%|████▎     | 16/37 [27:38<36:13, 103.50s/it]

Val Loss: 5.6051 - Val Accuracy: 0.9652



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:07<06:51,  7.91s/it][A
Training:   4%|▍         | 2/53 [00:08<02:50,  3.34s/it][A
Training:   8%|▊         | 4/53 [00:08<01:03,  1.29s/it][A
Training:   9%|▉         | 5/53 [00:14<02:22,  2.98s/it][A
Training:  11%|█▏        | 6/53 [00:15<01:39,  2.12s/it][A
Training:  15%|█▌        | 8/53 [00:15<00:52,  1.17s/it][A
Training:  17%|█▋        | 9/53 [00:21<01:47,  2.43s/it][A
Training:  19%|█▉        | 10/53 [00:21<01:18,  1.84s/it][A
Training:  23%|██▎       | 12/53 [00:21<00:44,  1.08s/it][A
Training:  25%|██▍       | 13/53 [00:28<01:31,  2.28s/it][A
Training:  28%|██▊       | 15/53 [00:28<00:53,  1.40s/it][A
Training:  32%|███▏      | 17/53 [00:34<01:10,  1.97s/it][A
Training:  36%|███▌      | 19/53 [00:34<00:44,  1.32s/it][A
Training:  38%|███▊      | 20/53 [00:34<00:35,  1.08s/it][A
Training:  40%|███▉      | 21/53 [00:40<01:12,  2.27s/it][A
Training:  42%|████▏     | 22/53 [00:41

Epoch: 17/37 - Loss: 4.5085 - Accuracy: 0.9718



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:06<00:39,  6.61s/it][A
 29%|██▊       | 2/7 [00:06<00:14,  2.90s/it][A
 43%|████▎     | 3/7 [00:07<00:06,  1.67s/it][A
 57%|█████▋    | 4/7 [00:07<00:03,  1.10s/it][A
 71%|███████▏  | 5/7 [00:12<00:05,  2.57s/it][A
100%|██████████| 7/7 [00:12<00:00,  1.85s/it][A
Epochs:  46%|████▌     | 17/37 [29:22<34:31, 103.57s/it]

Val Loss: 5.7761 - Val Accuracy: 0.9631



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:07<06:44,  7.78s/it][A
Training:   4%|▍         | 2/53 [00:07<02:47,  3.28s/it][A
Training:   8%|▊         | 4/53 [00:08<01:02,  1.28s/it][A
Training:   9%|▉         | 5/53 [00:14<02:22,  2.97s/it][A
Training:  13%|█▎        | 7/53 [00:14<01:14,  1.61s/it][A
Training:  17%|█▋        | 9/53 [00:21<01:41,  2.31s/it][A
Training:  19%|█▉        | 10/53 [00:21<01:19,  1.84s/it][A
Training:  23%|██▎       | 12/53 [00:22<00:47,  1.17s/it][A
Training:  25%|██▍       | 13/53 [00:27<01:24,  2.12s/it][A
Training:  26%|██▋       | 14/53 [00:27<01:04,  1.65s/it][A
Training:  30%|███       | 16/53 [00:28<00:37,  1.03s/it][A
Training:  32%|███▏      | 17/53 [00:34<01:18,  2.19s/it][A
Training:  34%|███▍      | 18/53 [00:34<00:59,  1.69s/it][A
Training:  36%|███▌      | 19/53 [00:34<00:43,  1.29s/it][A
Training:  38%|███▊      | 20/53 [00:34<00:32,  1.02it/s][A
Training:  40%|███▉      | 21/53 [00:4

Epoch: 18/37 - Loss: 4.7459 - Accuracy: 0.9694



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:07<00:43,  7.21s/it][A
 29%|██▊       | 2/7 [00:07<00:15,  3.06s/it][A
 43%|████▎     | 3/7 [00:07<00:07,  1.76s/it][A
 71%|███████▏  | 5/7 [00:13<00:04,  2.37s/it][A
100%|██████████| 7/7 [00:13<00:00,  1.95s/it][A
Epochs:  49%|████▊     | 18/37 [31:06<32:50, 103.73s/it]

Val Loss: 5.6977 - Val Accuracy: 0.9650



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:07<06:33,  7.57s/it][A
Training:   4%|▍         | 2/53 [00:07<02:42,  3.18s/it][A
Training:   6%|▌         | 3/53 [00:07<01:28,  1.78s/it][A
Training:   9%|▉         | 5/53 [00:14<02:04,  2.60s/it][A
Training:  11%|█▏        | 6/53 [00:14<01:31,  1.95s/it][A
Training:  15%|█▌        | 8/53 [00:14<00:49,  1.11s/it][A
Training:  17%|█▋        | 9/53 [00:20<01:39,  2.26s/it][A
Training:  19%|█▉        | 10/53 [00:20<01:15,  1.75s/it][A
Training:  23%|██▎       | 12/53 [00:21<00:43,  1.05s/it][A
Training:  25%|██▍       | 13/53 [00:26<01:22,  2.07s/it][A
Training:  26%|██▋       | 14/53 [00:27<01:07,  1.72s/it][A
Training:  28%|██▊       | 15/53 [00:27<00:50,  1.32s/it][A
Training:  32%|███▏      | 17/53 [00:32<01:08,  1.89s/it][A
Training:  34%|███▍      | 18/53 [00:33<00:57,  1.65s/it][A
Training:  38%|███▊      | 20/53 [00:33<00:33,  1.02s/it][A
Training:  40%|███▉      | 21/53 [00:39

Epoch: 19/37 - Loss: 4.7097 - Accuracy: 0.9700



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:07<00:42,  7.01s/it][A
 43%|████▎     | 3/7 [00:07<00:07,  1.87s/it][A
 71%|███████▏  | 5/7 [00:12<00:04,  2.34s/it][A
100%|██████████| 7/7 [00:12<00:00,  1.85s/it][A
Epochs:  51%|█████▏    | 19/37 [32:49<31:04, 103.59s/it]

Val Loss: 5.4550 - Val Accuracy: 0.9629



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:07<06:39,  7.67s/it][A
Training:   4%|▍         | 2/53 [00:07<02:47,  3.29s/it][A
Training:   6%|▌         | 3/53 [00:08<01:34,  1.89s/it][A
Training:   8%|▊         | 4/53 [00:08<00:59,  1.21s/it][A
Training:   9%|▉         | 5/53 [00:14<02:28,  3.09s/it][A
Training:  13%|█▎        | 7/53 [00:14<01:11,  1.56s/it][A
Training:  15%|█▌        | 8/53 [00:15<00:55,  1.23s/it][A
Training:  17%|█▋        | 9/53 [00:20<01:46,  2.41s/it][A
Training:  19%|█▉        | 10/53 [00:20<01:15,  1.77s/it][A
Training:  21%|██        | 11/53 [00:20<00:54,  1.29s/it][A
Training:  23%|██▎       | 12/53 [00:21<00:38,  1.06it/s][A
Training:  25%|██▍       | 13/53 [00:27<01:40,  2.52s/it][A
Training:  26%|██▋       | 14/53 [00:27<01:10,  1.81s/it][A
Training:  28%|██▊       | 15/53 [00:27<00:49,  1.31s/it][A
Training:  30%|███       | 16/53 [00:27<00:35,  1.05it/s][A
Training:  32%|███▏      | 17/53 [00:33<

Epoch: 20/37 - Loss: 4.3511 - Accuracy: 0.9715



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:06<00:40,  6.68s/it][A
 29%|██▊       | 2/7 [00:06<00:14,  2.89s/it][A
 43%|████▎     | 3/7 [00:07<00:06,  1.62s/it][A
 57%|█████▋    | 4/7 [00:07<00:03,  1.13s/it][A
 71%|███████▏  | 5/7 [00:12<00:05,  2.61s/it][A
100%|██████████| 7/7 [00:12<00:00,  1.85s/it][A
Epochs:  54%|█████▍    | 20/37 [34:33<29:20, 103.55s/it]

Val Loss: 6.0414 - Val Accuracy: 0.9600



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:07<06:47,  7.84s/it][A
Training:   4%|▍         | 2/53 [00:07<02:49,  3.32s/it][A
Training:   6%|▌         | 3/53 [00:08<01:33,  1.88s/it][A
Training:   8%|▊         | 4/53 [00:08<00:59,  1.21s/it][A
Training:   9%|▉         | 5/53 [00:14<02:20,  2.92s/it][A
Training:  13%|█▎        | 7/53 [00:14<01:08,  1.48s/it][A
Training:  17%|█▋        | 9/53 [00:20<01:33,  2.13s/it][A
Training:  21%|██        | 11/53 [00:20<00:57,  1.38s/it][A
Training:  23%|██▎       | 12/53 [00:20<00:45,  1.11s/it][A
Training:  25%|██▍       | 13/53 [00:27<01:31,  2.29s/it][A
Training:  26%|██▋       | 14/53 [00:27<01:08,  1.75s/it][A
Training:  28%|██▊       | 15/53 [00:27<00:49,  1.32s/it][A
Training:  30%|███       | 16/53 [00:27<00:36,  1.01it/s][A
Training:  32%|███▏      | 17/53 [00:33<01:27,  2.42s/it][A
Training:  34%|███▍      | 18/53 [00:33<01:01,  1.77s/it][A
Training:  36%|███▌      | 19/53 [00:33

Epoch: 21/37 - Loss: 4.5727 - Accuracy: 0.9715



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:06<00:41,  6.92s/it][A
 29%|██▊       | 2/7 [00:07<00:14,  2.96s/it][A
 57%|█████▋    | 4/7 [00:07<00:03,  1.18s/it][A
 71%|███████▏  | 5/7 [00:12<00:04,  2.42s/it][A
 86%|████████▌ | 6/7 [00:12<00:01,  1.75s/it][A
100%|██████████| 7/7 [00:13<00:00,  1.86s/it][A
Epochs:  57%|█████▋    | 21/37 [36:15<27:31, 103.22s/it]

Val Loss: 5.8825 - Val Accuracy: 0.9632



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:07<06:45,  7.79s/it][A
Training:   4%|▍         | 2/53 [00:08<02:51,  3.37s/it][A
Training:   6%|▌         | 3/53 [00:08<01:36,  1.92s/it][A
Training:   8%|▊         | 4/53 [00:08<00:59,  1.21s/it][A
Training:   9%|▉         | 5/53 [00:13<02:11,  2.74s/it][A
Training:  11%|█▏        | 6/53 [00:13<01:27,  1.85s/it][A
Training:  15%|█▌        | 8/53 [00:14<00:44,  1.02it/s][A
Training:  17%|█▋        | 9/53 [00:20<01:45,  2.40s/it][A
Training:  21%|██        | 11/53 [00:20<01:00,  1.44s/it][A
Training:  23%|██▎       | 12/53 [00:20<00:46,  1.13s/it][A
Training:  25%|██▍       | 13/53 [00:26<01:33,  2.34s/it][A
Training:  28%|██▊       | 15/53 [00:27<00:53,  1.40s/it][A
Training:  32%|███▏      | 17/53 [00:33<01:12,  2.03s/it][A
Training:  34%|███▍      | 18/53 [00:33<00:57,  1.65s/it][A
Training:  36%|███▌      | 19/53 [00:33<00:44,  1.30s/it][A
Training:  38%|███▊      | 20/53 [00:33<

Epoch: 22/37 - Loss: 4.5909 - Accuracy: 0.9694



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:07<00:42,  7.02s/it][A
 43%|████▎     | 3/7 [00:07<00:07,  1.87s/it][A
 71%|███████▏  | 5/7 [00:12<00:04,  2.32s/it][A
100%|██████████| 7/7 [00:13<00:00,  1.86s/it][A
Epochs:  59%|█████▉    | 22/37 [37:58<25:48, 103.21s/it]

Val Loss: 6.2281 - Val Accuracy: 0.9574



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:07<06:45,  7.80s/it][A
Training:   6%|▌         | 3/53 [00:08<01:45,  2.10s/it][A
Training:   8%|▊         | 4/53 [00:08<01:09,  1.42s/it][A
Training:   9%|▉         | 5/53 [00:13<02:14,  2.80s/it][A
Training:  11%|█▏        | 6/53 [00:13<01:31,  1.94s/it][A
Training:  13%|█▎        | 7/53 [00:14<01:03,  1.39s/it][A
Training:  15%|█▌        | 8/53 [00:14<00:45,  1.01s/it][A
Training:  17%|█▋        | 9/53 [00:20<01:54,  2.60s/it][A
Training:  19%|█▉        | 10/53 [00:20<01:21,  1.90s/it][A
Training:  21%|██        | 11/53 [00:20<00:57,  1.36s/it][A
Training:  25%|██▍       | 13/53 [00:26<01:23,  2.08s/it][A
Training:  26%|██▋       | 14/53 [00:26<01:02,  1.60s/it][A
Training:  28%|██▊       | 15/53 [00:27<00:47,  1.25s/it][A
Training:  32%|███▏      | 17/53 [00:33<01:14,  2.07s/it][A
Training:  34%|███▍      | 18/53 [00:33<00:57,  1.64s/it][A
Training:  36%|███▌      | 19/53 [00:33<

Epoch: 23/37 - Loss: 4.4925 - Accuracy: 0.9715



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:07<00:42,  7.05s/it][A
 29%|██▊       | 2/7 [00:07<00:14,  2.99s/it][A
 43%|████▎     | 3/7 [00:07<00:06,  1.68s/it][A
 71%|███████▏  | 5/7 [00:12<00:04,  2.32s/it][A
100%|██████████| 7/7 [00:13<00:00,  1.90s/it][A
Epochs:  62%|██████▏   | 23/37 [39:43<24:10, 103.64s/it]

Val Loss: 6.4570 - Val Accuracy: 0.9636



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:06<05:44,  6.63s/it][A
Training:   4%|▍         | 2/53 [00:06<02:25,  2.85s/it][A
Training:   6%|▌         | 3/53 [00:07<01:21,  1.62s/it][A
Training:   8%|▊         | 4/53 [00:07<00:50,  1.03s/it][A
Training:   9%|▉         | 5/53 [00:13<02:20,  2.92s/it][A
Training:  11%|█▏        | 6/53 [00:13<01:32,  1.96s/it][A
Training:  15%|█▌        | 8/53 [00:13<00:46,  1.04s/it][A
Training:  17%|█▋        | 9/53 [00:19<01:38,  2.25s/it][A
Training:  19%|█▉        | 10/53 [00:19<01:13,  1.71s/it][A
Training:  23%|██▎       | 12/53 [00:19<00:42,  1.03s/it][A
Training:  25%|██▍       | 13/53 [00:25<01:27,  2.19s/it][A
Training:  26%|██▋       | 14/53 [00:26<01:06,  1.71s/it][A
Training:  30%|███       | 16/53 [00:26<00:38,  1.04s/it][A
Training:  32%|███▏      | 17/53 [00:32<01:20,  2.24s/it][A
Training:  34%|███▍      | 18/53 [00:33<01:03,  1.81s/it][A
Training:  36%|███▌      | 19/53 [00:33<

Epoch: 24/37 - Loss: 4.6619 - Accuracy: 0.9724



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:06<00:41,  6.91s/it][A
 29%|██▊       | 2/7 [00:07<00:14,  2.91s/it][A
 43%|████▎     | 3/7 [00:07<00:06,  1.70s/it][A
 57%|█████▋    | 4/7 [00:07<00:03,  1.12s/it][A
 71%|███████▏  | 5/7 [00:12<00:05,  2.51s/it][A
100%|██████████| 7/7 [00:12<00:00,  1.83s/it][A
Epochs:  65%|██████▍   | 24/37 [41:26<22:25, 103.52s/it]

Val Loss: 6.0406 - Val Accuracy: 0.9628



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:06<05:38,  6.51s/it][A
Training:   4%|▍         | 2/53 [00:06<02:20,  2.76s/it][A
Training:   6%|▌         | 3/53 [00:06<01:17,  1.55s/it][A
Training:   8%|▊         | 4/53 [00:06<00:48,  1.02it/s][A
Training:   9%|▉         | 5/53 [00:13<02:19,  2.91s/it][A
Training:  13%|█▎        | 7/53 [00:13<01:07,  1.47s/it][A
Training:  15%|█▌        | 8/53 [00:13<00:49,  1.11s/it][A
Training:  17%|█▋        | 9/53 [00:19<01:49,  2.49s/it][A
Training:  19%|█▉        | 10/53 [00:19<01:17,  1.81s/it][A
Training:  23%|██▎       | 12/53 [00:19<00:42,  1.04s/it][A
Training:  25%|██▍       | 13/53 [00:26<01:32,  2.31s/it][A
Training:  26%|██▋       | 14/53 [00:26<01:08,  1.75s/it][A
Training:  28%|██▊       | 15/53 [00:26<00:49,  1.31s/it][A
Training:  30%|███       | 16/53 [00:26<00:36,  1.03it/s][A
Training:  32%|███▏      | 17/53 [00:32<01:27,  2.43s/it][A
Training:  34%|███▍      | 18/53 [00:32<

Epoch: 25/37 - Loss: 4.6325 - Accuracy: 0.9701



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:06<00:41,  6.95s/it][A
 29%|██▊       | 2/7 [00:07<00:15,  3.13s/it][A
 57%|█████▋    | 4/7 [00:07<00:03,  1.26s/it][A
 71%|███████▏  | 5/7 [00:12<00:04,  2.32s/it][A
100%|██████████| 7/7 [00:12<00:00,  1.84s/it][A
Epochs:  68%|██████▊   | 25/37 [43:09<20:40, 103.34s/it]

Val Loss: 6.2867 - Val Accuracy: 0.9589



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:07<06:09,  7.10s/it][A
Training:   4%|▍         | 2/53 [00:07<02:34,  3.03s/it][A
Training:   8%|▊         | 4/53 [00:07<00:58,  1.19s/it][A
Training:   9%|▉         | 5/53 [00:13<02:03,  2.58s/it][A
Training:  13%|█▎        | 7/53 [00:13<01:04,  1.40s/it][A
Training:  15%|█▌        | 8/53 [00:13<00:52,  1.16s/it][A
Training:  17%|█▋        | 9/53 [00:19<01:40,  2.29s/it][A
Training:  19%|█▉        | 10/53 [00:19<01:13,  1.70s/it][A
Training:  21%|██        | 11/53 [00:19<00:52,  1.25s/it][A
Training:  23%|██▎       | 12/53 [00:19<00:43,  1.06s/it][A
Training:  25%|██▍       | 13/53 [00:25<01:36,  2.41s/it][A
Training:  26%|██▋       | 14/53 [00:26<01:12,  1.87s/it][A
Training:  28%|██▊       | 15/53 [00:26<00:52,  1.38s/it][A
Training:  30%|███       | 16/53 [00:26<00:38,  1.03s/it][A
Training:  32%|███▏      | 17/53 [00:32<01:23,  2.32s/it][A
Training:  34%|███▍      | 18/53 [00:32

Epoch: 26/37 - Loss: 4.3094 - Accuracy: 0.9713



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:06<00:41,  6.94s/it][A
 43%|████▎     | 3/7 [00:07<00:07,  1.86s/it][A
 71%|███████▏  | 5/7 [00:12<00:04,  2.18s/it][A
100%|██████████| 7/7 [00:12<00:00,  1.76s/it][A
Epochs:  70%|███████   | 26/37 [44:51<18:52, 102.98s/it]

Val Loss: 5.6438 - Val Accuracy: 0.9642



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:07<06:15,  7.22s/it][A
Training:   4%|▍         | 2/53 [00:07<02:43,  3.20s/it][A
Training:   6%|▌         | 3/53 [00:07<01:32,  1.85s/it][A
Training:   9%|▉         | 5/53 [00:13<01:55,  2.42s/it][A
Training:  11%|█▏        | 6/53 [00:13<01:23,  1.78s/it][A
Training:  13%|█▎        | 7/53 [00:13<00:59,  1.29s/it][A
Training:  15%|█▌        | 8/53 [00:14<00:46,  1.02s/it][A
Training:  17%|█▋        | 9/53 [00:19<01:45,  2.40s/it][A
Training:  19%|█▉        | 10/53 [00:20<01:16,  1.77s/it][A
Training:  21%|██        | 11/53 [00:20<00:53,  1.28s/it][A
Training:  23%|██▎       | 12/53 [00:20<00:38,  1.06it/s][A
Training:  25%|██▍       | 13/53 [00:26<01:38,  2.45s/it][A
Training:  26%|██▋       | 14/53 [00:26<01:09,  1.78s/it][A
Training:  30%|███       | 16/53 [00:27<00:39,  1.06s/it][A
Training:  32%|███▏      | 17/53 [00:33<01:21,  2.26s/it][A
Training:  34%|███▍      | 18/53 [00:33<

Epoch: 27/37 - Loss: 4.4326 - Accuracy: 0.9720



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:06<00:37,  6.24s/it][A
 29%|██▊       | 2/7 [00:06<00:13,  2.79s/it][A
 57%|█████▋    | 4/7 [00:06<00:03,  1.08s/it][A
 71%|███████▏  | 5/7 [00:11<00:04,  2.10s/it][A
100%|██████████| 7/7 [00:11<00:00,  1.65s/it][A
Epochs:  73%|███████▎  | 27/37 [46:34<17:07, 102.79s/it]

Val Loss: 6.0636 - Val Accuracy: 0.9616



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:07<06:26,  7.43s/it][A
Training:   4%|▍         | 2/53 [00:07<02:42,  3.18s/it][A
Training:   6%|▌         | 3/53 [00:07<01:32,  1.85s/it][A
Training:   8%|▊         | 4/53 [00:08<00:56,  1.16s/it][A
Training:   9%|▉         | 5/53 [00:13<02:16,  2.84s/it][A
Training:  11%|█▏        | 6/53 [00:14<01:30,  1.93s/it][A
Training:  13%|█▎        | 7/53 [00:14<01:02,  1.35s/it][A
Training:  15%|█▌        | 8/53 [00:14<00:43,  1.04it/s][A
Training:  17%|█▋        | 9/53 [00:20<01:53,  2.57s/it][A
Training:  19%|█▉        | 10/53 [00:20<01:19,  1.84s/it][A
Training:  21%|██        | 11/53 [00:20<00:57,  1.38s/it][A
Training:  23%|██▎       | 12/53 [00:21<00:40,  1.00it/s][A
Training:  25%|██▍       | 13/53 [00:26<01:33,  2.34s/it][A
Training:  26%|██▋       | 14/53 [00:26<01:08,  1.76s/it][A
Training:  28%|██▊       | 15/53 [00:27<00:51,  1.36s/it][A
Training:  30%|███       | 16/53 [00:27<0

Epoch: 28/37 - Loss: 4.7454 - Accuracy: 0.9711



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:06<00:40,  6.67s/it][A
 43%|████▎     | 3/7 [00:06<00:07,  1.78s/it][A
 71%|███████▏  | 5/7 [00:11<00:04,  2.16s/it][A
100%|██████████| 7/7 [00:12<00:00,  1.74s/it][A
Epochs:  76%|███████▌  | 28/37 [48:16<15:23, 102.58s/it]

Val Loss: 6.4358 - Val Accuracy: 0.9604



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:07<06:16,  7.24s/it][A
Training:   4%|▍         | 2/53 [00:07<02:38,  3.10s/it][A
Training:   6%|▌         | 3/53 [00:07<01:28,  1.77s/it][A
Training:   8%|▊         | 4/53 [00:07<00:57,  1.17s/it][A
Training:   9%|▉         | 5/53 [00:13<02:15,  2.83s/it][A
Training:  11%|█▏        | 6/53 [00:13<01:30,  1.93s/it][A
Training:  13%|█▎        | 7/53 [00:13<01:01,  1.34s/it][A
Training:  15%|█▌        | 8/53 [00:14<00:42,  1.05it/s][A
Training:  17%|█▋        | 9/53 [00:20<02:02,  2.79s/it][A
Training:  19%|█▉        | 10/53 [00:21<01:24,  1.97s/it][A
Training:  21%|██        | 11/53 [00:21<00:58,  1.40s/it][A
Training:  25%|██▍       | 13/53 [00:27<01:26,  2.15s/it][A
Training:  26%|██▋       | 14/53 [00:27<01:04,  1.65s/it][A
Training:  28%|██▊       | 15/53 [00:27<00:47,  1.25s/it][A
Training:  30%|███       | 16/53 [00:27<00:34,  1.06it/s][A
Training:  32%|███▏      | 17/53 [00:33<0

Epoch: 29/37 - Loss: 4.6304 - Accuracy: 0.9720



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:05<00:34,  5.81s/it][A
 29%|██▊       | 2/7 [00:06<00:12,  2.57s/it][A
 43%|████▎     | 3/7 [00:06<00:05,  1.45s/it][A
 57%|█████▋    | 4/7 [00:06<00:02,  1.08it/s][A
 71%|███████▏  | 5/7 [00:11<00:04,  2.36s/it][A
100%|██████████| 7/7 [00:11<00:00,  1.67s/it][A
Epochs:  78%|███████▊  | 29/37 [49:58<13:40, 102.54s/it]

Val Loss: 5.2325 - Val Accuracy: 0.9648



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:07<06:05,  7.03s/it][A
Training:   4%|▍         | 2/53 [00:07<02:31,  2.97s/it][A
Training:   6%|▌         | 3/53 [00:07<01:23,  1.66s/it][A
Training:   9%|▉         | 5/53 [00:13<02:02,  2.56s/it][A
Training:  11%|█▏        | 6/53 [00:13<01:27,  1.86s/it][A
Training:  13%|█▎        | 7/53 [00:13<01:01,  1.35s/it][A
Training:  15%|█▌        | 8/53 [00:14<00:44,  1.02it/s][A
Training:  17%|█▋        | 9/53 [00:20<01:51,  2.53s/it][A
Training:  21%|██        | 11/53 [00:20<00:59,  1.41s/it][A
Training:  25%|██▍       | 13/53 [00:26<01:22,  2.07s/it][A
Training:  28%|██▊       | 15/53 [00:26<00:51,  1.35s/it][A
Training:  32%|███▏      | 17/53 [00:33<01:11,  1.99s/it][A
Training:  34%|███▍      | 18/53 [00:33<00:57,  1.65s/it][A
Training:  36%|███▌      | 19/53 [00:33<00:44,  1.31s/it][A
Training:  38%|███▊      | 20/53 [00:33<00:34,  1.05s/it][A
Training:  40%|███▉      | 21/53 [00:40<

Epoch: 30/37 - Loss: 4.5955 - Accuracy: 0.9724



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:05<00:35,  5.88s/it][A
 43%|████▎     | 3/7 [00:06<00:06,  1.58s/it][A
 71%|███████▏  | 5/7 [00:11<00:04,  2.19s/it][A
100%|██████████| 7/7 [00:11<00:00,  1.70s/it][A
Epochs:  81%|████████  | 30/37 [51:41<11:57, 102.47s/it]

Val Loss: 6.3154 - Val Accuracy: 0.9601



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:07<06:16,  7.23s/it][A
Training:   4%|▍         | 2/53 [00:07<02:38,  3.11s/it][A
Training:   6%|▌         | 3/53 [00:07<01:28,  1.76s/it][A
Training:   8%|▊         | 4/53 [00:07<00:55,  1.14s/it][A
Training:   9%|▉         | 5/53 [00:14<02:22,  2.96s/it][A
Training:  13%|█▎        | 7/53 [00:14<01:09,  1.52s/it][A
Training:  15%|█▌        | 8/53 [00:14<00:52,  1.17s/it][A
Training:  17%|█▋        | 9/53 [00:20<01:47,  2.45s/it][A
Training:  19%|█▉        | 10/53 [00:20<01:18,  1.81s/it][A
Training:  23%|██▎       | 12/53 [00:20<00:43,  1.05s/it][A
Training:  25%|██▍       | 13/53 [00:27<01:33,  2.34s/it][A
Training:  26%|██▋       | 14/53 [00:27<01:08,  1.77s/it][A
Training:  28%|██▊       | 15/53 [00:27<00:50,  1.34s/it][A
Training:  30%|███       | 16/53 [00:27<00:37,  1.01s/it][A
Training:  32%|███▏      | 17/53 [00:33<01:27,  2.43s/it][A
Training:  34%|███▍      | 18/53 [00:33<

Epoch: 31/37 - Loss: 4.6075 - Accuracy: 0.9737



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:06<00:39,  6.54s/it][A
 43%|████▎     | 3/7 [00:06<00:07,  1.77s/it][A
 57%|█████▋    | 4/7 [00:06<00:03,  1.21s/it][A
 71%|███████▏  | 5/7 [00:12<00:05,  2.55s/it][A
100%|██████████| 7/7 [00:12<00:00,  1.78s/it][A
Epochs:  84%|████████▍ | 31/37 [53:23<10:15, 102.58s/it]

Val Loss: 5.0939 - Val Accuracy: 0.9608



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:07<06:16,  7.25s/it][A
Training:   4%|▍         | 2/53 [00:07<02:37,  3.08s/it][A
Training:   8%|▊         | 4/53 [00:07<00:58,  1.20s/it][A
Training:   9%|▉         | 5/53 [00:13<02:11,  2.74s/it][A
Training:  11%|█▏        | 6/53 [00:13<01:31,  1.95s/it][A
Training:  13%|█▎        | 7/53 [00:14<01:04,  1.40s/it][A
Training:  17%|█▋        | 9/53 [00:19<01:32,  2.11s/it][A
Training:  19%|█▉        | 10/53 [00:20<01:09,  1.63s/it][A
Training:  21%|██        | 11/53 [00:20<00:52,  1.26s/it][A
Training:  23%|██▎       | 12/53 [00:20<00:39,  1.03it/s][A
Training:  25%|██▍       | 13/53 [00:26<01:31,  2.30s/it][A
Training:  26%|██▋       | 14/53 [00:26<01:11,  1.84s/it][A
Training:  28%|██▊       | 15/53 [00:27<00:51,  1.36s/it][A
Training:  30%|███       | 16/53 [00:27<00:37,  1.01s/it][A
Training:  32%|███▏      | 17/53 [00:32<01:25,  2.36s/it][A
Training:  34%|███▍      | 18/53 [00:33

Epoch: 32/37 - Loss: 4.3466 - Accuracy: 0.9714



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:07<00:43,  7.31s/it][A
 43%|████▎     | 3/7 [00:07<00:07,  1.95s/it][A
 71%|███████▏  | 5/7 [00:12<00:04,  2.30s/it][A
100%|██████████| 7/7 [00:13<00:00,  1.86s/it][A
Epochs:  86%|████████▋ | 32/37 [55:06<08:33, 102.67s/it]

Val Loss: 5.7878 - Val Accuracy: 0.9642



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:07<06:20,  7.32s/it][A
Training:   4%|▍         | 2/53 [00:07<02:37,  3.10s/it][A
Training:   8%|▊         | 4/53 [00:07<00:59,  1.21s/it][A
Training:   9%|▉         | 5/53 [00:13<02:08,  2.68s/it][A
Training:  13%|█▎        | 7/53 [00:13<01:08,  1.48s/it][A
Training:  15%|█▌        | 8/53 [00:14<00:53,  1.18s/it][A
Training:  17%|█▋        | 9/53 [00:20<01:49,  2.48s/it][A
Training:  19%|█▉        | 10/53 [00:20<01:18,  1.83s/it][A
Training:  21%|██        | 11/53 [00:20<00:56,  1.35s/it][A
Training:  23%|██▎       | 12/53 [00:20<00:45,  1.11s/it][A
Training:  25%|██▍       | 13/53 [00:27<01:45,  2.63s/it][A
Training:  26%|██▋       | 14/53 [00:27<01:14,  1.90s/it][A
Training:  28%|██▊       | 15/53 [00:27<00:52,  1.38s/it][A
Training:  30%|███       | 16/53 [00:27<00:38,  1.03s/it][A
Training:  32%|███▏      | 17/53 [00:34<01:37,  2.71s/it][A
Training:  34%|███▍      | 18/53 [00:34

Epoch: 33/37 - Loss: 4.5322 - Accuracy: 0.9732



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:06<00:40,  6.70s/it][A
 43%|████▎     | 3/7 [00:06<00:07,  1.82s/it][A
 57%|█████▋    | 4/7 [00:07<00:03,  1.22s/it][A
 71%|███████▏  | 5/7 [00:12<00:05,  2.52s/it][A
100%|██████████| 7/7 [00:12<00:00,  1.79s/it][A
Epochs:  89%|████████▉ | 33/37 [56:49<06:51, 102.84s/it]

Val Loss: 5.6955 - Val Accuracy: 0.9631



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:07<06:30,  7.51s/it][A
Training:   4%|▍         | 2/53 [00:07<02:50,  3.34s/it][A
Training:   6%|▌         | 3/53 [00:08<01:34,  1.90s/it][A
Training:   9%|▉         | 5/53 [00:14<02:02,  2.56s/it][A
Training:  11%|█▏        | 6/53 [00:14<01:30,  1.93s/it][A
Training:  15%|█▌        | 8/53 [00:14<00:48,  1.09s/it][A
Training:  17%|█▋        | 9/53 [00:20<01:42,  2.34s/it][A
Training:  19%|█▉        | 10/53 [00:21<01:17,  1.79s/it][A
Training:  23%|██▎       | 12/53 [00:21<00:43,  1.06s/it][A
Training:  25%|██▍       | 13/53 [00:27<01:29,  2.23s/it][A
Training:  26%|██▋       | 14/53 [00:27<01:08,  1.77s/it][A
Training:  28%|██▊       | 15/53 [00:27<00:51,  1.35s/it][A
Training:  30%|███       | 16/53 [00:28<00:38,  1.03s/it][A
Training:  32%|███▏      | 17/53 [00:34<01:28,  2.46s/it][A
Training:  34%|███▍      | 18/53 [00:34<01:06,  1.89s/it][A
Training:  36%|███▌      | 19/53 [00:34

Epoch: 34/37 - Loss: 4.4432 - Accuracy: 0.9723



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:06<00:38,  6.44s/it][A
 29%|██▊       | 2/7 [00:06<00:13,  2.72s/it][A
 57%|█████▋    | 4/7 [00:06<00:03,  1.05s/it][A
100%|██████████| 7/7 [00:12<00:00,  1.75s/it][A
Epochs:  92%|█████████▏| 34/37 [58:32<05:08, 102.70s/it]

Val Loss: 5.3592 - Val Accuracy: 0.9706



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:07<06:25,  7.42s/it][A
Training:   4%|▍         | 2/53 [00:07<02:41,  3.17s/it][A
Training:   6%|▌         | 3/53 [00:07<01:30,  1.81s/it][A
Training:   8%|▊         | 4/53 [00:08<00:57,  1.18s/it][A
Training:   9%|▉         | 5/53 [00:14<02:26,  3.05s/it][A
Training:  11%|█▏        | 6/53 [00:14<01:36,  2.05s/it][A
Training:  13%|█▎        | 7/53 [00:14<01:07,  1.46s/it][A
Training:  15%|█▌        | 8/53 [00:14<00:46,  1.03s/it][A
Training:  17%|█▋        | 9/53 [00:21<01:58,  2.70s/it][A
Training:  19%|█▉        | 10/53 [00:21<01:22,  1.91s/it][A
Training:  21%|██        | 11/53 [00:21<00:56,  1.36s/it][A
Training:  25%|██▍       | 13/53 [00:28<01:32,  2.31s/it][A
Training:  26%|██▋       | 14/53 [00:28<01:09,  1.78s/it][A
Training:  28%|██▊       | 15/53 [00:28<00:51,  1.36s/it][A
Training:  32%|███▏      | 17/53 [00:34<01:15,  2.11s/it][A
Training:  34%|███▍      | 18/53 [00:35<0

Epoch: 35/37 - Loss: 4.5397 - Accuracy: 0.9724



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:06<00:37,  6.17s/it][A
 29%|██▊       | 2/7 [00:06<00:13,  2.70s/it][A
 57%|█████▋    | 4/7 [00:06<00:03,  1.06s/it][A
 71%|███████▏  | 5/7 [00:11<00:04,  2.37s/it][A
100%|██████████| 7/7 [00:12<00:00,  1.76s/it][A
Epochs:  95%|█████████▍| 35/37 [1:00:15<03:25, 102.73s/it]

Val Loss: 5.9319 - Val Accuracy: 0.9652



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:07<06:15,  7.22s/it][A
Training:   6%|▌         | 3/53 [00:07<01:36,  1.94s/it][A
Training:   8%|▊         | 4/53 [00:07<01:04,  1.32s/it][A
Training:   9%|▉         | 5/53 [00:14<02:26,  3.05s/it][A
Training:  11%|█▏        | 6/53 [00:14<01:40,  2.13s/it][A
Training:  13%|█▎        | 7/53 [00:14<01:10,  1.52s/it][A
Training:  15%|█▌        | 8/53 [00:14<00:50,  1.13s/it][A
Training:  17%|█▋        | 9/53 [00:20<01:56,  2.64s/it][A
Training:  21%|██        | 11/53 [00:20<01:00,  1.44s/it][A
Training:  23%|██▎       | 12/53 [00:21<00:47,  1.15s/it][A
Training:  25%|██▍       | 13/53 [00:27<01:42,  2.55s/it][A
Training:  26%|██▋       | 14/53 [00:27<01:14,  1.92s/it][A
Training:  28%|██▊       | 15/53 [00:28<00:54,  1.45s/it][A
Training:  32%|███▏      | 17/53 [00:34<01:17,  2.16s/it][A
Training:  34%|███▍      | 18/53 [00:34<00:59,  1.69s/it][A
Training:  36%|███▌      | 19/53 [00:34<

Epoch: 36/37 - Loss: 4.5077 - Accuracy: 0.9718



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:06<00:37,  6.33s/it][A
 29%|██▊       | 2/7 [00:06<00:14,  2.84s/it][A
 43%|████▎     | 3/7 [00:06<00:06,  1.62s/it][A
 57%|█████▋    | 4/7 [00:07<00:03,  1.03s/it][A
 71%|███████▏  | 5/7 [00:12<00:05,  2.54s/it][A
100%|██████████| 7/7 [00:12<00:00,  1.80s/it][A
Epochs:  97%|█████████▋| 36/37 [1:01:57<01:42, 102.61s/it]

Val Loss: 5.7450 - Val Accuracy: 0.9629



Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:07<06:13,  7.18s/it][A
Training:   4%|▍         | 2/53 [00:07<02:39,  3.13s/it][A
Training:   6%|▌         | 3/53 [00:07<01:28,  1.77s/it][A
Training:   8%|▊         | 4/53 [00:07<00:54,  1.11s/it][A
Training:   9%|▉         | 5/53 [00:14<02:30,  3.13s/it][A
Training:  11%|█▏        | 6/53 [00:14<01:39,  2.11s/it][A
Training:  15%|█▌        | 8/53 [00:14<00:49,  1.11s/it][A
Training:  17%|█▋        | 9/53 [00:21<01:51,  2.53s/it][A
Training:  19%|█▉        | 10/53 [00:21<01:20,  1.88s/it][A
Training:  21%|██        | 11/53 [00:21<00:59,  1.42s/it][A
Training:  23%|██▎       | 12/53 [00:21<00:44,  1.07s/it][A
Training:  25%|██▍       | 13/53 [00:27<01:41,  2.54s/it][A
Training:  26%|██▋       | 14/53 [00:28<01:11,  1.84s/it][A
Training:  28%|██▊       | 15/53 [00:28<00:52,  1.39s/it][A
Training:  32%|███▏      | 17/53 [00:34<01:17,  2.14s/it][A
Training:  34%|███▍      | 18/53 [00:34<

Epoch: 37/37 - Loss: 4.5444 - Accuracy: 0.9729



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:06<00:39,  6.56s/it][A
 29%|██▊       | 2/7 [00:06<00:13,  2.80s/it][A
 57%|█████▋    | 4/7 [00:06<00:03,  1.10s/it][A
 71%|███████▏  | 5/7 [00:12<00:04,  2.36s/it][A
100%|██████████| 7/7 [00:12<00:00,  1.76s/it][A
Epochs: 100%|██████████| 37/37 [1:03:39<00:00, 103.24s/it]


Val Loss: 5.6440 - Val Accuracy: 0.9676
Saving best model...


[32m[I 2023-12-08 22:49:59,147][0m Trial 17 finished with value: 0.9676252007484436 and parameters: {'loss_learning_rate': 0.008447568694221697, 'learning_rate': 0.000633457353251843, 'weight_decay': 0.001876909923779263, 'epsilon': 9.402328890865692e-08, 'beta': 0.8, 'gamma': 0.9, 'batch_size': 266, 'epochs': 37}. Best is trial 17 with value: 0.9676252007484436.[0m


Learning rate for Loss: 0.00962637196816694
Learning rate: 0.00046344113311681204
Weight decay: 0.00919395544531611
Epsilon: 3.5390578711303653e-08
Beta: 0.8
Gamma: 1.0
Batch size: 267
Number of epochs: 54


Epochs:   0%|          | 0/54 [00:00<?, ?it/s]
Training:   0%|          | 0/53 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/53 [00:07<06:44,  7.77s/it][A
Training:   4%|▍         | 2/53 [00:07<02:47,  3.29s/it][A
Training:   6%|▌         | 3/53 [00:08<01:33,  1.86s/it][A
Training:   8%|▊         | 4/53 [00:08<00:57,  1.17s/it][A
Training:   9%|▉         | 5/53 [00:14<02:20,  2.92s/it][A
Training:  11%|█▏        | 6/53 [00:14<01:32,  1.97s/it][A
Training:  13%|█▎        | 7/53 [00:14<01:07,  1.46s/it][A
Training:  15%|█▌        | 8/53 [00:14<00:47,  1.05s/it][A
Training:  17%|█▋        | 9/53 [00:21<01:56,  2.65s/it][A
Training:  21%|██        | 11/53 [00:21<01:02,  1.48s/it][A
Training:  23%|██▎       | 12/53 [00:21<00:47,  1.16s/it][A
Training:  25%|██▍       | 13/53 [00:27<01:39,  2.49s/it][A
Training:  26%|██▋       | 14/53 [00:27<01:11,  1.84s/it][A
Training:  28%|██▊       | 15/53 [00:28<00:53,  1.42s/it][A
Training:  32%|███▏      | 17/53 [00:34<01:17,  2.16s/it

Epoch: 1/54 - Loss: 17.8151 - Accuracy: 0.8645



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:06<00:41,  6.88s/it][A
 43%|████▎     | 3/7 [00:07<00:07,  1.91s/it][A
 71%|███████▏  | 5/7 [00:12<00:04,  2.16s/it][A
100%|██████████| 7/7 [00:12<00:00,  1.77s/it][A
Epochs:   0%|          | 0/54 [01:41<?, ?it/s]
[32m[I 2023-12-08 22:51:41,456][0m Trial 18 pruned. [0m


Val Loss: 8.8661 - Val Accuracy: 0.9486
Learning rate for Loss: 0.0026095667746146318
Learning rate: 0.0007654254891103729
Weight decay: 0.0018147852099258965
Epsilon: 8.897455126188771e-08
Beta: 0.8
Gamma: 0.9
Batch size: 172
Number of epochs: 42


Epochs:   0%|          | 0/42 [00:00<?, ?it/s]
Training:   0%|          | 0/82 [00:00<?, ?it/s][A
Training:   1%|          | 1/82 [00:05<07:01,  5.20s/it][A
Training:   2%|▏         | 2/82 [00:05<02:57,  2.22s/it][A
Training:   5%|▍         | 4/82 [00:05<01:08,  1.14it/s][A
Training:   6%|▌         | 5/82 [00:09<02:31,  1.96s/it][A
Training:   9%|▊         | 7/82 [00:10<01:22,  1.10s/it][A
Training:  10%|▉         | 8/82 [00:10<01:05,  1.13it/s][A
Training:  11%|█         | 9/82 [00:14<02:02,  1.68s/it][A
Training:  12%|█▏        | 10/82 [00:14<01:30,  1.25s/it][A
Training:  15%|█▍        | 12/82 [00:14<00:57,  1.22it/s][A
Training:  16%|█▌        | 13/82 [00:18<01:42,  1.49s/it][A
Training:  17%|█▋        | 14/82 [00:18<01:21,  1.19s/it][A
Training:  20%|█▉        | 16/82 [00:19<00:55,  1.20it/s][A
Training:  21%|██        | 17/82 [00:23<01:34,  1.45s/it][A
Training:  22%|██▏       | 18/82 [00:23<01:15,  1.17s/it][A
Training:  24%|██▍       | 20/82 [00:24<00:51,  1.21it

Epoch: 1/42 - Loss: 13.7492 - Accuracy: 0.9175



  0%|          | 0/11 [00:00<?, ?it/s][A
  9%|▉         | 1/11 [00:04<00:43,  4.39s/it][A
 18%|█▊        | 2/11 [00:04<00:17,  1.95s/it][A
 36%|███▋      | 4/11 [00:04<00:05,  1.30it/s][A
 45%|████▌     | 5/11 [00:08<00:09,  1.58s/it][A
 55%|█████▍    | 6/11 [00:08<00:05,  1.15s/it][A
 64%|██████▎   | 7/11 [00:08<00:03,  1.17it/s][A
 73%|███████▎  | 8/11 [00:08<00:01,  1.54it/s][A
 82%|████████▏ | 9/11 [00:11<00:02,  1.37s/it][A
100%|██████████| 11/11 [00:12<00:00,  1.10s/it][A
Epochs:   2%|▏         | 1/42 [01:43<1:10:26, 103.09s/it]

Val Loss: 7.7663 - Val Accuracy: 0.9573



Training:   0%|          | 0/82 [00:00<?, ?it/s][A
Training:   1%|          | 1/82 [00:05<06:53,  5.11s/it][A
Training:   2%|▏         | 2/82 [00:05<02:59,  2.25s/it][A
Training:   4%|▎         | 3/82 [00:05<01:40,  1.28s/it][A
Training:   5%|▍         | 4/82 [00:05<01:03,  1.23it/s][A
Training:   6%|▌         | 5/82 [00:09<02:32,  1.99s/it][A
Training:   7%|▋         | 6/82 [00:09<01:43,  1.36s/it][A
Training:  10%|▉         | 8/82 [00:09<00:53,  1.39it/s][A
Training:  11%|█         | 9/82 [00:14<02:01,  1.66s/it][A
Training:  12%|█▏        | 10/82 [00:14<01:34,  1.31s/it][A
Training:  13%|█▎        | 11/82 [00:14<01:09,  1.03it/s][A
Training:  15%|█▍        | 12/82 [00:14<00:51,  1.36it/s][A
Training:  16%|█▌        | 13/82 [00:18<01:48,  1.58s/it][A
Training:  17%|█▋        | 14/82 [00:19<01:25,  1.26s/it][A
Training:  18%|█▊        | 15/82 [00:19<01:01,  1.09it/s][A
Training:  21%|██        | 17/82 [00:22<01:28,  1.37s/it][A
Training:  22%|██▏       | 18/82 [00:23<

Epoch: 2/42 - Loss: 7.7174 - Accuracy: 0.9597



  0%|          | 0/11 [00:00<?, ?it/s][A
  9%|▉         | 1/11 [00:04<00:43,  4.39s/it][A
 27%|██▋       | 3/11 [00:04<00:09,  1.19s/it][A
 45%|████▌     | 5/11 [00:08<00:09,  1.60s/it][A
 55%|█████▍    | 6/11 [00:08<00:06,  1.22s/it][A
 73%|███████▎  | 8/11 [00:08<00:02,  1.37it/s][A
100%|██████████| 11/11 [00:12<00:00,  1.12s/it][A
Epochs:   5%|▍         | 2/42 [03:26<1:08:44, 103.11s/it]

Val Loss: 7.5483 - Val Accuracy: 0.9604



Training:   0%|          | 0/82 [00:00<?, ?it/s][A
Training:   1%|          | 1/82 [00:05<06:59,  5.18s/it][A
Training:   2%|▏         | 2/82 [00:05<02:55,  2.20s/it][A
Training:   5%|▍         | 4/82 [00:05<01:08,  1.14it/s][A
Training:   6%|▌         | 5/82 [00:09<02:31,  1.96s/it][A
Training:   7%|▋         | 6/82 [00:10<01:48,  1.42s/it][A
Training:  10%|▉         | 8/82 [00:10<00:59,  1.25it/s][A
Training:  11%|█         | 9/82 [00:14<01:58,  1.62s/it][A
Training:  12%|█▏        | 10/82 [00:14<01:35,  1.33s/it][A
Training:  13%|█▎        | 11/82 [00:14<01:10,  1.00it/s][A
Training:  16%|█▌        | 13/82 [00:18<01:36,  1.40s/it][A
Training:  17%|█▋        | 14/82 [00:19<01:19,  1.16s/it][A
Training:  20%|█▉        | 16/82 [00:19<00:47,  1.39it/s][A
Training:  21%|██        | 17/82 [00:23<01:29,  1.38s/it][A
Training:  22%|██▏       | 18/82 [00:23<01:16,  1.19s/it][A
Training:  23%|██▎       | 19/82 [00:23<00:58,  1.08it/s][A
Training:  24%|██▍       | 20/82 [00:23

Epoch: 3/42 - Loss: 6.7298 - Accuracy: 0.9598



  0%|          | 0/11 [00:00<?, ?it/s][A
  9%|▉         | 1/11 [00:04<00:47,  4.73s/it][A
 27%|██▋       | 3/11 [00:04<00:10,  1.28s/it][A
 45%|████▌     | 5/11 [00:08<00:10,  1.67s/it][A
 64%|██████▎   | 7/11 [00:09<00:03,  1.01it/s][A
100%|██████████| 11/11 [00:12<00:00,  1.17s/it][A
Epochs:   7%|▋         | 3/42 [05:09<1:07:06, 103.25s/it]

Val Loss: 8.4543 - Val Accuracy: 0.9494



Training:   0%|          | 0/82 [00:00<?, ?it/s][A
Training:   1%|          | 1/82 [00:05<07:14,  5.37s/it][A
Training:   4%|▎         | 3/82 [00:05<01:52,  1.43s/it][A
Training:   6%|▌         | 5/82 [00:09<02:19,  1.82s/it][A
Training:   9%|▊         | 7/82 [00:09<01:20,  1.08s/it][A
Training:  11%|█         | 9/82 [00:14<01:49,  1.50s/it][A
Training:  13%|█▎        | 11/82 [00:14<01:13,  1.03s/it][A
Training:  15%|█▍        | 12/82 [00:14<01:00,  1.16it/s][A
Training:  16%|█▌        | 13/82 [00:18<01:46,  1.54s/it][A
Training:  17%|█▋        | 14/82 [00:18<01:21,  1.20s/it][A
Training:  20%|█▉        | 16/82 [00:19<00:48,  1.36it/s][A
Training:  21%|██        | 17/82 [00:23<01:37,  1.50s/it][A
Training:  22%|██▏       | 18/82 [00:23<01:15,  1.18s/it][A
Training:  23%|██▎       | 19/82 [00:23<00:56,  1.11it/s][A
Training:  24%|██▍       | 20/82 [00:23<00:44,  1.40it/s][A
Training:  26%|██▌       | 21/82 [00:28<01:47,  1.76s/it][A
Training:  27%|██▋       | 22/82 [00:

Epoch: 4/42 - Loss: 6.5345 - Accuracy: 0.9630



  0%|          | 0/11 [00:00<?, ?it/s][A
  9%|▉         | 1/11 [00:04<00:46,  4.66s/it][A
 18%|█▊        | 2/11 [00:04<00:17,  1.98s/it][A
 36%|███▋      | 4/11 [00:04<00:05,  1.29it/s][A
 55%|█████▍    | 6/11 [00:08<00:06,  1.35s/it][A
 73%|███████▎  | 8/11 [00:08<00:02,  1.21it/s][A
100%|██████████| 11/11 [00:12<00:00,  1.15s/it][A
Epochs:  10%|▉         | 4/42 [06:53<1:05:26, 103.34s/it]

Val Loss: 7.6399 - Val Accuracy: 0.9615



Training:   0%|          | 0/82 [00:00<?, ?it/s][A
Training:   1%|          | 1/82 [00:05<07:04,  5.24s/it][A
Training:   2%|▏         | 2/82 [00:05<02:58,  2.23s/it][A
Training:   4%|▎         | 3/82 [00:05<01:40,  1.27s/it][A
Training:   6%|▌         | 5/82 [00:09<02:18,  1.80s/it][A
Training:   9%|▊         | 7/82 [00:10<01:17,  1.04s/it][A
Training:  11%|█         | 9/82 [00:14<01:46,  1.46s/it][A
Training:  12%|█▏        | 10/82 [00:14<01:23,  1.16s/it][A
Training:  13%|█▎        | 11/82 [00:14<01:04,  1.09it/s][A
Training:  15%|█▍        | 12/82 [00:14<00:50,  1.39it/s][A
Training:  16%|█▌        | 13/82 [00:18<01:49,  1.58s/it][A
Training:  18%|█▊        | 15/82 [00:18<01:03,  1.06it/s][A
Training:  20%|█▉        | 16/82 [00:19<00:49,  1.33it/s][A
Training:  21%|██        | 17/82 [00:22<01:40,  1.54s/it][A
Training:  22%|██▏       | 18/82 [00:23<01:16,  1.20s/it][A
Training:  23%|██▎       | 19/82 [00:23<00:58,  1.07it/s][A
Training:  26%|██▌       | 21/82 [00:2

Epoch: 5/42 - Loss: 6.7024 - Accuracy: 0.9646



  0%|          | 0/11 [00:00<?, ?it/s][A
  9%|▉         | 1/11 [00:04<00:47,  4.75s/it][A
 27%|██▋       | 3/11 [00:04<00:10,  1.29s/it][A
 36%|███▋      | 4/11 [00:05<00:06,  1.11it/s][A
 45%|████▌     | 5/11 [00:08<00:11,  1.89s/it][A
 64%|██████▎   | 7/11 [00:09<00:04,  1.00s/it][A
100%|██████████| 11/11 [00:12<00:00,  1.15s/it][A
Epochs:  12%|█▏        | 5/42 [08:36<1:03:40, 103.25s/it]

Val Loss: 7.4393 - Val Accuracy: 0.9615



Training:   0%|          | 0/82 [00:00<?, ?it/s][A
Training:   1%|          | 1/82 [00:05<07:13,  5.35s/it][A
Training:   2%|▏         | 2/82 [00:05<03:01,  2.27s/it][A
Training:   4%|▎         | 3/82 [00:05<01:44,  1.33s/it][A
Training:   5%|▍         | 4/82 [00:05<01:06,  1.17it/s][A
Training:   6%|▌         | 5/82 [00:09<02:35,  2.02s/it][A
Training:   7%|▋         | 6/82 [00:10<01:45,  1.39s/it][A
Training:   9%|▊         | 7/82 [00:10<01:13,  1.02it/s][A
Training:  10%|▉         | 8/82 [00:10<00:52,  1.42it/s][A
Training:  11%|█         | 9/82 [00:14<02:14,  1.85s/it][A
Training:  12%|█▏        | 10/82 [00:14<01:34,  1.31s/it][A
Training:  15%|█▍        | 12/82 [00:14<00:50,  1.38it/s][A
Training:  16%|█▌        | 13/82 [00:18<01:48,  1.57s/it][A
Training:  18%|█▊        | 15/82 [00:19<01:02,  1.07it/s][A
Training:  21%|██        | 17/82 [00:23<01:26,  1.33s/it][A
Training:  23%|██▎       | 19/82 [00:23<00:55,  1.13it/s][A
Training:  26%|██▌       | 21/82 [00:27<0

Epoch: 6/42 - Loss: 6.7477 - Accuracy: 0.9646



  0%|          | 0/11 [00:00<?, ?it/s][A
  9%|▉         | 1/11 [00:04<00:48,  4.81s/it][A
 18%|█▊        | 2/11 [00:04<00:18,  2.05s/it][A
 36%|███▋      | 4/11 [00:05<00:05,  1.25it/s][A
 55%|█████▍    | 6/11 [00:08<00:06,  1.33s/it][A
 73%|███████▎  | 8/11 [00:09<00:02,  1.20it/s][A
100%|██████████| 11/11 [00:12<00:00,  1.15s/it][A
Epochs:  14%|█▍        | 6/42 [10:19<1:02:01, 103.36s/it]

Val Loss: 8.8394 - Val Accuracy: 0.9600



Training:   0%|          | 0/82 [00:00<?, ?it/s][A
Training:   1%|          | 1/82 [00:05<06:47,  5.03s/it][A
Training:   2%|▏         | 2/82 [00:05<03:02,  2.28s/it][A
Training:   5%|▍         | 4/82 [00:05<01:09,  1.13it/s][A
Training:   6%|▌         | 5/82 [00:09<02:25,  1.89s/it][A
Training:   7%|▋         | 6/82 [00:09<01:47,  1.41s/it][A
Training:   9%|▊         | 7/82 [00:10<01:16,  1.03s/it][A
Training:  11%|█         | 9/82 [00:14<01:48,  1.49s/it][A
Training:  12%|█▏        | 10/82 [00:14<01:25,  1.19s/it][A
Training:  13%|█▎        | 11/82 [00:14<01:06,  1.07it/s][A
Training:  15%|█▍        | 12/82 [00:14<00:50,  1.40it/s][A
Training:  16%|█▌        | 13/82 [00:18<01:47,  1.56s/it][A
Training:  17%|█▋        | 14/82 [00:18<01:17,  1.14s/it][A
Training:  18%|█▊        | 15/82 [00:18<01:01,  1.09it/s][A
Training:  21%|██        | 17/82 [00:22<01:27,  1.35s/it][A
Training:  22%|██▏       | 18/82 [00:22<01:06,  1.05s/it][A
Training:  23%|██▎       | 19/82 [00:23

Epoch: 7/42 - Loss: 6.5684 - Accuracy: 0.9649



  0%|          | 0/11 [00:00<?, ?it/s][A
  9%|▉         | 1/11 [00:04<00:44,  4.45s/it][A
 18%|█▊        | 2/11 [00:04<00:17,  1.90s/it][A
 36%|███▋      | 4/11 [00:04<00:05,  1.33it/s][A
 45%|████▌     | 5/11 [00:08<00:10,  1.71s/it][A
 64%|██████▎   | 7/11 [00:08<00:03,  1.06it/s][A
 82%|████████▏ | 9/11 [00:12<00:02,  1.24s/it][A
100%|██████████| 11/11 [00:12<00:00,  1.13s/it][A
Epochs:  17%|█▋        | 7/42 [12:02<1:00:06, 103.04s/it]

Val Loss: 7.9295 - Val Accuracy: 0.9594



Training:   0%|          | 0/82 [00:00<?, ?it/s][A
Training:   1%|          | 1/82 [00:05<06:49,  5.05s/it][A
Training:   4%|▎         | 3/82 [00:05<01:49,  1.39s/it][A
Training:   5%|▍         | 4/82 [00:05<01:15,  1.04it/s][A
Training:   6%|▌         | 5/82 [00:09<02:34,  2.00s/it][A
Training:   7%|▋         | 6/82 [00:09<01:46,  1.40s/it][A
Training:   9%|▊         | 7/82 [00:09<01:18,  1.05s/it][A
Training:  11%|█         | 9/82 [00:13<01:48,  1.49s/it][A
Training:  13%|█▎        | 11/82 [00:14<01:06,  1.07it/s][A
Training:  15%|█▍        | 12/82 [00:14<00:52,  1.33it/s][A
Training:  16%|█▌        | 13/82 [00:18<01:45,  1.53s/it][A
Training:  20%|█▉        | 16/82 [00:18<00:51,  1.29it/s][A
Training:  21%|██        | 17/82 [00:22<01:32,  1.42s/it][A
Training:  22%|██▏       | 18/82 [00:22<01:12,  1.13s/it][A
Training:  24%|██▍       | 20/82 [00:22<00:45,  1.37it/s][A
Training:  26%|██▌       | 21/82 [00:26<01:24,  1.38s/it][A
Training:  28%|██▊       | 23/82 [00:26

Epoch: 8/42 - Loss: 6.7795 - Accuracy: 0.9662



  0%|          | 0/11 [00:00<?, ?it/s][A
  9%|▉         | 1/11 [00:04<00:46,  4.68s/it][A
 18%|█▊        | 2/11 [00:04<00:18,  2.04s/it][A
 27%|██▋       | 3/11 [00:05<00:09,  1.17s/it][A
 36%|███▋      | 4/11 [00:05<00:05,  1.28it/s][A
 45%|████▌     | 5/11 [00:08<00:10,  1.77s/it][A
 55%|█████▍    | 6/11 [00:08<00:06,  1.21s/it][A
 64%|██████▎   | 7/11 [00:09<00:03,  1.15it/s][A
100%|██████████| 11/11 [00:12<00:00,  1.13s/it][A
Epochs:  19%|█▉        | 8/42 [13:44<58:18, 102.91s/it]  

Val Loss: 7.2831 - Val Accuracy: 0.9568



Training:   0%|          | 0/82 [00:00<?, ?it/s][A
Training:   1%|          | 1/82 [00:05<07:04,  5.25s/it][A
Training:   4%|▎         | 3/82 [00:05<01:52,  1.42s/it][A
Training:   5%|▍         | 4/82 [00:05<01:15,  1.03it/s][A
Training:   6%|▌         | 5/82 [00:09<02:31,  1.97s/it][A
Training:   9%|▊         | 7/82 [00:09<01:19,  1.06s/it][A
Training:  10%|▉         | 8/82 [00:09<01:00,  1.22it/s][A
Training:  11%|█         | 9/82 [00:13<02:00,  1.66s/it][A
Training:  12%|█▏        | 10/82 [00:13<01:28,  1.23s/it][A
Training:  13%|█▎        | 11/82 [00:14<01:09,  1.01it/s][A
Training:  15%|█▍        | 12/82 [00:14<00:52,  1.33it/s][A
Training:  16%|█▌        | 13/82 [00:18<01:50,  1.60s/it][A
Training:  17%|█▋        | 14/82 [00:18<01:18,  1.16s/it][A
Training:  18%|█▊        | 15/82 [00:18<01:08,  1.02s/it][A
Training:  20%|█▉        | 16/82 [00:19<00:49,  1.33it/s][A
Training:  21%|██        | 17/82 [00:22<01:35,  1.46s/it][A
Training:  22%|██▏       | 18/82 [00:22

Epoch: 9/42 - Loss: 6.6152 - Accuracy: 0.9656



  0%|          | 0/11 [00:00<?, ?it/s][A
  9%|▉         | 1/11 [00:04<00:46,  4.62s/it][A
 27%|██▋       | 3/11 [00:04<00:09,  1.24s/it][A
 45%|████▌     | 5/11 [00:08<00:09,  1.66s/it][A
 55%|█████▍    | 6/11 [00:08<00:06,  1.24s/it][A
 73%|███████▎  | 8/11 [00:09<00:02,  1.36it/s][A
100%|██████████| 11/11 [00:12<00:00,  1.14s/it][A
Epochs:  21%|██▏       | 9/42 [15:27<56:28, 102.70s/it]

Val Loss: 8.0458 - Val Accuracy: 0.9673



Training:   0%|          | 0/82 [00:00<?, ?it/s][A
Training:   1%|          | 1/82 [00:05<07:01,  5.21s/it][A
Training:   4%|▎         | 3/82 [00:05<01:50,  1.40s/it][A
Training:   6%|▌         | 5/82 [00:09<02:17,  1.78s/it][A
Training:   9%|▊         | 7/82 [00:09<01:18,  1.05s/it][A
Training:  11%|█         | 9/82 [00:13<01:46,  1.45s/it][A
Training:  15%|█▍        | 12/82 [00:14<00:57,  1.21it/s][A
Training:  17%|█▋        | 14/82 [00:18<01:20,  1.18s/it][A
Training:  20%|█▉        | 16/82 [00:18<00:56,  1.17it/s][A
Training:  22%|██▏       | 18/82 [00:22<01:16,  1.19s/it][A
Training:  24%|██▍       | 20/82 [00:22<00:52,  1.17it/s][A
Training:  27%|██▋       | 22/82 [00:26<01:14,  1.25s/it][A
Training:  30%|███       | 25/82 [00:31<01:15,  1.32s/it][A
Training:  32%|███▏      | 26/82 [00:31<01:03,  1.13s/it][A
Training:  34%|███▍      | 28/82 [00:31<00:43,  1.24it/s][A
Training:  35%|███▌      | 29/82 [00:35<01:15,  1.42s/it][A
Training:  38%|███▊      | 31/82 [00:

Epoch: 10/42 - Loss: 6.4796 - Accuracy: 0.9676



  0%|          | 0/11 [00:00<?, ?it/s][A
  9%|▉         | 1/11 [00:04<00:47,  4.79s/it][A
 27%|██▋       | 3/11 [00:04<00:10,  1.28s/it][A
 45%|████▌     | 5/11 [00:09<00:10,  1.69s/it][A
 64%|██████▎   | 7/11 [00:09<00:03,  1.00it/s][A
100%|██████████| 11/11 [00:12<00:00,  1.18s/it][A
Epochs:  24%|██▍       | 10/42 [17:10<54:54, 102.95s/it]

Val Loss: 7.2223 - Val Accuracy: 0.9668



Training:   0%|          | 0/82 [00:00<?, ?it/s][A
Training:   1%|          | 1/82 [00:05<06:51,  5.08s/it][A
Training:   2%|▏         | 2/82 [00:05<02:55,  2.20s/it][A
Training:   4%|▎         | 3/82 [00:05<01:41,  1.28s/it][A
Training:   6%|▌         | 5/82 [00:09<02:11,  1.71s/it][A
Training:   9%|▊         | 7/82 [00:10<01:19,  1.06s/it][A
Training:  10%|▉         | 8/82 [00:10<01:01,  1.20it/s][A
Training:  11%|█         | 9/82 [00:13<01:55,  1.58s/it][A
Training:  12%|█▏        | 10/82 [00:13<01:25,  1.18s/it][A
Training:  13%|█▎        | 11/82 [00:14<01:04,  1.10it/s][A
Training:  16%|█▌        | 13/82 [00:18<01:34,  1.36s/it][A
Training:  18%|█▊        | 15/82 [00:18<00:59,  1.12it/s][A
Training:  20%|█▉        | 16/82 [00:18<00:48,  1.37it/s][A
Training:  21%|██        | 17/82 [00:22<01:34,  1.45s/it][A
Training:  22%|██▏       | 18/82 [00:22<01:11,  1.12s/it][A
Training:  23%|██▎       | 19/82 [00:22<00:57,  1.10it/s][A
Training:  24%|██▍       | 20/82 [00:22

Epoch: 11/42 - Loss: 6.3590 - Accuracy: 0.9703



  0%|          | 0/11 [00:00<?, ?it/s][A
  9%|▉         | 1/11 [00:04<00:44,  4.44s/it][A
 18%|█▊        | 2/11 [00:04<00:18,  2.07s/it][A
 36%|███▋      | 4/11 [00:04<00:05,  1.24it/s][A
 45%|████▌     | 5/11 [00:08<00:10,  1.67s/it][A
 55%|█████▍    | 6/11 [00:08<00:06,  1.25s/it][A
 82%|████████▏ | 9/11 [00:11<00:02,  1.12s/it][A
100%|██████████| 11/11 [00:12<00:00,  1.14s/it][A
Epochs:  26%|██▌       | 11/42 [18:52<53:00, 102.58s/it]

Val Loss: 8.0237 - Val Accuracy: 0.9578



Training:   0%|          | 0/82 [00:00<?, ?it/s][A
Training:   1%|          | 1/82 [00:04<06:42,  4.97s/it][A
Training:   2%|▏         | 2/82 [00:05<03:00,  2.26s/it][A
Training:   4%|▎         | 3/82 [00:05<01:41,  1.29s/it][A
Training:   5%|▍         | 4/82 [00:05<01:05,  1.19it/s][A
Training:   6%|▌         | 5/82 [00:09<02:19,  1.81s/it][A
Training:   7%|▋         | 6/82 [00:09<01:41,  1.34s/it][A
Training:   9%|▊         | 7/82 [00:09<01:11,  1.05it/s][A
Training:  10%|▉         | 8/82 [00:09<00:51,  1.44it/s][A
Training:  11%|█         | 9/82 [00:13<01:47,  1.47s/it][A
Training:  12%|█▏        | 10/82 [00:13<01:27,  1.21s/it][A
Training:  13%|█▎        | 11/82 [00:13<01:02,  1.14it/s][A
Training:  15%|█▍        | 12/82 [00:13<00:45,  1.55it/s][A
Training:  16%|█▌        | 13/82 [00:17<01:42,  1.48s/it][A
Training:  17%|█▋        | 14/82 [00:18<01:24,  1.25s/it][A
Training:  18%|█▊        | 15/82 [00:18<01:00,  1.11it/s][A
Training:  20%|█▉        | 16/82 [00:18<0

Epoch: 12/42 - Loss: 6.0045 - Accuracy: 0.9704



  0%|          | 0/11 [00:00<?, ?it/s][A
  9%|▉         | 1/11 [00:04<00:45,  4.59s/it][A
 18%|█▊        | 2/11 [00:05<00:19,  2.16s/it][A
 27%|██▋       | 3/11 [00:05<00:09,  1.24s/it][A
 36%|███▋      | 4/11 [00:05<00:05,  1.24it/s][A
 45%|████▌     | 5/11 [00:08<00:10,  1.72s/it][A
 64%|██████▎   | 7/11 [00:08<00:03,  1.12it/s][A
 73%|███████▎  | 8/11 [00:08<00:02,  1.46it/s][A
 82%|████████▏ | 9/11 [00:11<00:02,  1.30s/it][A
100%|██████████| 11/11 [00:12<00:00,  1.14s/it][A
Epochs:  29%|██▊       | 12/42 [20:34<51:13, 102.44s/it]

Val Loss: 8.8403 - Val Accuracy: 0.9578



Training:   0%|          | 0/82 [00:00<?, ?it/s][A
Training:   1%|          | 1/82 [00:05<06:48,  5.04s/it][A
Training:   2%|▏         | 2/82 [00:05<02:50,  2.13s/it][A
Training:   4%|▎         | 3/82 [00:05<01:37,  1.24s/it][A
Training:   5%|▍         | 4/82 [00:05<01:02,  1.25it/s][A
Training:   6%|▌         | 5/82 [00:08<02:16,  1.78s/it][A
Training:   7%|▋         | 6/82 [00:09<01:36,  1.27s/it][A
Training:   9%|▊         | 7/82 [00:09<01:09,  1.08it/s][A
Training:  10%|▉         | 8/82 [00:09<00:49,  1.48it/s][A
Training:  11%|█         | 9/82 [00:13<02:00,  1.65s/it][A
Training:  12%|█▏        | 10/82 [00:13<01:29,  1.24s/it][A
Training:  13%|█▎        | 11/82 [00:13<01:07,  1.06it/s][A
Training:  15%|█▍        | 12/82 [00:14<00:50,  1.38it/s][A
Training:  16%|█▌        | 13/82 [00:17<01:50,  1.60s/it][A
Training:  17%|█▋        | 14/82 [00:18<01:23,  1.23s/it][A
Training:  18%|█▊        | 15/82 [00:18<01:04,  1.04it/s][A
Training:  21%|██        | 17/82 [00:22<0

Epoch: 13/42 - Loss: 6.2498 - Accuracy: 0.9702



  0%|          | 0/11 [00:00<?, ?it/s][A
  9%|▉         | 1/11 [00:04<00:43,  4.33s/it][A
 18%|█▊        | 2/11 [00:04<00:17,  1.90s/it][A
 36%|███▋      | 4/11 [00:04<00:05,  1.30it/s][A
 45%|████▌     | 5/11 [00:08<00:09,  1.57s/it][A
 55%|█████▍    | 6/11 [00:08<00:05,  1.20s/it][A
 64%|██████▎   | 7/11 [00:08<00:03,  1.15it/s][A
 82%|████████▏ | 9/11 [00:11<00:02,  1.18s/it][A
100%|██████████| 11/11 [00:12<00:00,  1.10s/it][A
Epochs:  31%|███       | 13/42 [22:16<49:30, 102.44s/it]

Val Loss: 7.4486 - Val Accuracy: 0.9668



Training:   0%|          | 0/82 [00:00<?, ?it/s][A
Training:   1%|          | 1/82 [00:04<06:32,  4.85s/it][A
Training:   2%|▏         | 2/82 [00:05<02:48,  2.11s/it][A
Training:   4%|▎         | 3/82 [00:05<01:36,  1.22s/it][A
Training:   5%|▍         | 4/82 [00:05<01:01,  1.26it/s][A
Training:   6%|▌         | 5/82 [00:09<02:30,  1.95s/it][A
Training:   7%|▋         | 6/82 [00:09<01:40,  1.33s/it][A
Training:  10%|▉         | 8/82 [00:09<00:54,  1.37it/s][A
Training:  11%|█         | 9/82 [00:13<01:57,  1.61s/it][A
Training:  13%|█▎        | 11/82 [00:13<01:08,  1.04it/s][A
Training:  16%|█▌        | 13/82 [00:18<01:34,  1.38s/it][A
Training:  18%|█▊        | 15/82 [00:18<01:01,  1.09it/s][A
Training:  20%|█▉        | 16/82 [00:18<00:50,  1.32it/s][A
Training:  21%|██        | 17/82 [00:22<01:40,  1.55s/it][A
Training:  23%|██▎       | 19/82 [00:22<01:01,  1.03it/s][A
Training:  26%|██▌       | 21/82 [00:27<01:23,  1.37s/it][A
Training:  28%|██▊       | 23/82 [00:27<

Epoch: 14/42 - Loss: 6.8038 - Accuracy: 0.9699



  0%|          | 0/11 [00:00<?, ?it/s][A
  9%|▉         | 1/11 [00:04<00:43,  4.36s/it][A
 18%|█▊        | 2/11 [00:04<00:17,  1.90s/it][A
 27%|██▋       | 3/11 [00:04<00:08,  1.09s/it][A
 45%|████▌     | 5/11 [00:08<00:09,  1.54s/it][A
 55%|█████▍    | 6/11 [00:08<00:05,  1.18s/it][A
 73%|███████▎  | 8/11 [00:08<00:02,  1.48it/s][A
 82%|████████▏ | 9/11 [00:11<00:02,  1.23s/it][A
100%|██████████| 11/11 [00:12<00:00,  1.11s/it][A
Epochs:  33%|███▎      | 14/42 [23:59<47:53, 102.61s/it]

Val Loss: 8.6167 - Val Accuracy: 0.9637



Training:   0%|          | 0/82 [00:00<?, ?it/s][A
Training:   1%|          | 1/82 [00:05<06:48,  5.05s/it][A
Training:   4%|▎         | 3/82 [00:05<01:47,  1.37s/it][A
Training:   6%|▌         | 5/82 [00:09<02:16,  1.77s/it][A
Training:   9%|▊         | 7/82 [00:09<01:21,  1.08s/it][A
Training:  10%|▉         | 8/82 [00:09<01:03,  1.17it/s][A
Training:  11%|█         | 9/82 [00:13<02:00,  1.64s/it][A
Training:  12%|█▏        | 10/82 [00:14<01:29,  1.25s/it][A
Training:  13%|█▎        | 11/82 [00:14<01:12,  1.02s/it][A
Training:  15%|█▍        | 12/82 [00:14<00:53,  1.30it/s][A
Training:  16%|█▌        | 13/82 [00:18<01:52,  1.62s/it][A
Training:  17%|█▋        | 14/82 [00:18<01:20,  1.18s/it][A
Training:  18%|█▊        | 15/82 [00:18<01:04,  1.04it/s][A
Training:  20%|█▉        | 16/82 [00:19<00:46,  1.40it/s][A
Training:  21%|██        | 17/82 [00:22<01:43,  1.59s/it][A
Training:  23%|██▎       | 19/82 [00:23<01:03,  1.00s/it][A
Training:  24%|██▍       | 20/82 [00:2

Epoch: 15/42 - Loss: 6.8909 - Accuracy: 0.9676



  0%|          | 0/11 [00:00<?, ?it/s][A
  9%|▉         | 1/11 [00:04<00:46,  4.65s/it][A
 18%|█▊        | 2/11 [00:04<00:18,  2.00s/it][A
 36%|███▋      | 4/11 [00:04<00:05,  1.24it/s][A
 45%|████▌     | 5/11 [00:08<00:09,  1.64s/it][A
 73%|███████▎  | 8/11 [00:08<00:02,  1.37it/s][A
100%|██████████| 11/11 [00:12<00:00,  1.12s/it][A
Epochs:  36%|███▌      | 15/42 [25:42<46:09, 102.58s/it]

Val Loss: 8.3566 - Val Accuracy: 0.9647



Training:   0%|          | 0/82 [00:00<?, ?it/s][A
Training:   1%|          | 1/82 [00:05<07:00,  5.19s/it][A
Training:   4%|▎         | 3/82 [00:05<01:51,  1.42s/it][A
Training:   5%|▍         | 4/82 [00:05<01:15,  1.04it/s][A
Training:   6%|▌         | 5/82 [00:09<02:38,  2.05s/it][A
Training:  10%|▉         | 8/82 [00:09<01:04,  1.14it/s][A
Training:  12%|█▏        | 10/82 [00:14<01:39,  1.39s/it][A
Training:  13%|█▎        | 11/82 [00:14<01:19,  1.12s/it][A
Training:  15%|█▍        | 12/82 [00:14<01:02,  1.12it/s][A
Training:  16%|█▌        | 13/82 [00:18<01:58,  1.71s/it][A
Training:  18%|█▊        | 15/82 [00:19<01:09,  1.03s/it][A
Training:  21%|██        | 17/82 [00:23<01:34,  1.46s/it][A
Training:  22%|██▏       | 18/82 [00:23<01:15,  1.18s/it][A
Training:  24%|██▍       | 20/82 [00:23<00:46,  1.32it/s][A
Training:  27%|██▋       | 22/82 [00:27<01:13,  1.22s/it][A
Training:  29%|██▉       | 24/82 [00:27<00:48,  1.19it/s][A
Training:  30%|███       | 25/82 [00:

Epoch: 16/42 - Loss: 6.8467 - Accuracy: 0.9695



  0%|          | 0/11 [00:00<?, ?it/s][A
  9%|▉         | 1/11 [00:04<00:41,  4.17s/it][A
 18%|█▊        | 2/11 [00:04<00:16,  1.86s/it][A
 36%|███▋      | 4/11 [00:04<00:05,  1.34it/s][A
 45%|████▌     | 5/11 [00:08<00:09,  1.65s/it][A
 55%|█████▍    | 6/11 [00:08<00:06,  1.24s/it][A
 73%|███████▎  | 8/11 [00:08<00:02,  1.45it/s][A
 82%|████████▏ | 9/11 [00:12<00:02,  1.38s/it][A
100%|██████████| 11/11 [00:12<00:00,  1.13s/it][A
Epochs:  38%|███▊      | 16/42 [27:26<44:38, 103.01s/it]

Val Loss: 8.5468 - Val Accuracy: 0.9615



Training:   0%|          | 0/82 [00:00<?, ?it/s][A
Training:   1%|          | 1/82 [00:05<07:01,  5.21s/it][A
Training:   5%|▍         | 4/82 [00:05<01:21,  1.04s/it][A
Training:   6%|▌         | 5/82 [00:09<02:29,  1.94s/it][A
Training:   7%|▋         | 6/82 [00:09<01:47,  1.42s/it][A
Training:  10%|▉         | 8/82 [00:09<01:00,  1.23it/s][A
Training:  11%|█         | 9/82 [00:14<01:58,  1.62s/it][A
Training:  12%|█▏        | 10/82 [00:14<01:28,  1.23s/it][A
Training:  15%|█▍        | 12/82 [00:14<00:52,  1.33it/s][A
Training:  16%|█▌        | 13/82 [00:18<01:41,  1.47s/it][A
Training:  17%|█▋        | 14/82 [00:18<01:17,  1.13s/it][A
Training:  20%|█▉        | 16/82 [00:18<00:46,  1.42it/s][A
Training:  21%|██        | 17/82 [00:22<01:37,  1.49s/it][A
Training:  23%|██▎       | 19/82 [00:22<00:58,  1.08it/s][A
Training:  26%|██▌       | 21/82 [00:26<01:18,  1.28s/it][A
Training:  28%|██▊       | 23/82 [00:26<00:51,  1.15it/s][A
Training:  30%|███       | 25/82 [00:3

Epoch: 17/42 - Loss: 6.8797 - Accuracy: 0.9694



  0%|          | 0/11 [00:00<?, ?it/s][A
  9%|▉         | 1/11 [00:04<00:43,  4.31s/it][A
 18%|█▊        | 2/11 [00:04<00:17,  1.93s/it][A
 27%|██▋       | 3/11 [00:04<00:08,  1.12s/it][A
 36%|███▋      | 4/11 [00:04<00:05,  1.39it/s][A
 45%|████▌     | 5/11 [00:08<00:10,  1.72s/it][A
 55%|█████▍    | 6/11 [00:08<00:06,  1.21s/it][A
 64%|██████▎   | 7/11 [00:08<00:03,  1.14it/s][A
 73%|███████▎  | 8/11 [00:08<00:01,  1.55it/s][A
 82%|████████▏ | 9/11 [00:12<00:02,  1.47s/it][A
100%|██████████| 11/11 [00:12<00:00,  1.14s/it][A
Epochs:  40%|████      | 17/42 [29:08<42:47, 102.69s/it]

Val Loss: 7.6398 - Val Accuracy: 0.9668



Training:   0%|          | 0/82 [00:00<?, ?it/s][A
Training:   1%|          | 1/82 [00:05<07:10,  5.31s/it][A
Training:   2%|▏         | 2/82 [00:05<03:10,  2.38s/it][A
Training:   4%|▎         | 3/82 [00:05<01:47,  1.37s/it][A
Training:   5%|▍         | 4/82 [00:05<01:07,  1.15it/s][A
Training:   6%|▌         | 5/82 [00:10<02:37,  2.04s/it][A
Training:   7%|▋         | 6/82 [00:10<01:54,  1.51s/it][A
Training:  10%|▉         | 8/82 [00:10<00:59,  1.24it/s][A
Training:  11%|█         | 9/82 [00:14<01:56,  1.59s/it][A
Training:  12%|█▏        | 10/82 [00:14<01:29,  1.25s/it][A
Training:  13%|█▎        | 11/82 [00:14<01:05,  1.08it/s][A
Training:  15%|█▍        | 12/82 [00:15<00:49,  1.42it/s][A
Training:  16%|█▌        | 13/82 [00:18<01:49,  1.59s/it][A
Training:  17%|█▋        | 14/82 [00:19<01:21,  1.20s/it][A
Training:  18%|█▊        | 15/82 [00:19<00:59,  1.13it/s][A
Training:  21%|██        | 17/82 [00:22<01:24,  1.30s/it][A
Training:  23%|██▎       | 19/82 [00:22<

Epoch: 18/42 - Loss: 6.5853 - Accuracy: 0.9702



  0%|          | 0/11 [00:00<?, ?it/s][A
  9%|▉         | 1/11 [00:04<00:48,  4.84s/it][A
 36%|███▋      | 4/11 [00:04<00:06,  1.05it/s][A
 55%|█████▍    | 6/11 [00:08<00:06,  1.40s/it][A
 82%|████████▏ | 9/11 [00:12<00:02,  1.30s/it][A
100%|██████████| 11/11 [00:12<00:00,  1.17s/it][A
Epochs:  43%|████▎     | 18/42 [30:51<41:06, 102.77s/it]

Val Loss: 8.3243 - Val Accuracy: 0.9668



Training:   0%|          | 0/82 [00:00<?, ?it/s][A
Training:   1%|          | 1/82 [00:05<07:21,  5.45s/it][A
Training:   2%|▏         | 2/82 [00:05<03:04,  2.30s/it][A
Training:   5%|▍         | 4/82 [00:05<01:10,  1.10it/s][A
Training:   6%|▌         | 5/82 [00:10<02:31,  1.96s/it][A
Training:   9%|▊         | 7/82 [00:10<01:20,  1.08s/it][A
Training:  10%|▉         | 8/82 [00:10<01:01,  1.19it/s][A
Training:  11%|█         | 9/82 [00:14<02:07,  1.75s/it][A
Training:  13%|█▎        | 11/82 [00:14<01:12,  1.02s/it][A
Training:  16%|█▌        | 13/82 [00:18<01:36,  1.40s/it][A
Training:  18%|█▊        | 15/82 [00:18<01:03,  1.06it/s][A
Training:  21%|██        | 17/82 [00:23<01:25,  1.32s/it][A
Training:  22%|██▏       | 18/82 [00:23<01:09,  1.09s/it][A
Training:  26%|██▌       | 21/82 [00:27<01:17,  1.28s/it][A
Training:  28%|██▊       | 23/82 [00:27<00:53,  1.10it/s][A
Training:  30%|███       | 25/82 [00:31<01:09,  1.22s/it][A
Training:  33%|███▎      | 27/82 [00:31

Epoch: 19/42 - Loss: 7.0543 - Accuracy: 0.9708



  0%|          | 0/11 [00:00<?, ?it/s][A
  9%|▉         | 1/11 [00:04<00:44,  4.48s/it][A
 27%|██▋       | 3/11 [00:04<00:09,  1.22s/it][A
 45%|████▌     | 5/11 [00:08<00:09,  1.54s/it][A
 55%|█████▍    | 6/11 [00:08<00:05,  1.17s/it][A
 73%|███████▎  | 8/11 [00:08<00:02,  1.45it/s][A
 82%|████████▏ | 9/11 [00:11<00:02,  1.30s/it][A
100%|██████████| 11/11 [00:12<00:00,  1.12s/it][A
Epochs:  45%|████▌     | 19/42 [32:34<39:27, 102.92s/it]

Val Loss: 7.8169 - Val Accuracy: 0.9637



Training:   0%|          | 0/82 [00:00<?, ?it/s][A
Training:   1%|          | 1/82 [00:04<06:30,  4.82s/it][A
Training:   2%|▏         | 2/82 [00:05<02:56,  2.21s/it][A
Training:   4%|▎         | 3/82 [00:05<01:40,  1.27s/it][A
Training:   6%|▌         | 5/82 [00:09<02:09,  1.69s/it][A
Training:   7%|▋         | 6/82 [00:09<01:39,  1.31s/it][A
Training:  10%|▉         | 8/82 [00:09<00:55,  1.32it/s][A
Training:  11%|█         | 9/82 [00:13<01:49,  1.50s/it][A
Training:  12%|█▏        | 10/82 [00:13<01:22,  1.14s/it][A
Training:  15%|█▍        | 12/82 [00:14<00:49,  1.40it/s][A
Training:  16%|█▌        | 13/82 [00:17<01:34,  1.36s/it][A
Training:  18%|█▊        | 15/82 [00:17<00:58,  1.14it/s][A
Training:  20%|█▉        | 16/82 [00:18<00:47,  1.40it/s][A
Training:  21%|██        | 17/82 [00:22<01:38,  1.52s/it][A
Training:  23%|██▎       | 19/82 [00:22<01:00,  1.05it/s][A
Training:  24%|██▍       | 20/82 [00:22<00:47,  1.30it/s][A
Training:  26%|██▌       | 21/82 [00:26

Epoch: 20/42 - Loss: 7.0172 - Accuracy: 0.9690



  0%|          | 0/11 [00:00<?, ?it/s][A
  9%|▉         | 1/11 [00:04<00:46,  4.65s/it][A
 27%|██▋       | 3/11 [00:04<00:10,  1.26s/it][A
 36%|███▋      | 4/11 [00:04<00:06,  1.17it/s][A
 45%|████▌     | 5/11 [00:08<00:11,  1.86s/it][A
 64%|██████▎   | 7/11 [00:08<00:03,  1.02it/s][A
 82%|████████▏ | 9/11 [00:12<00:02,  1.29s/it][A
100%|██████████| 11/11 [00:12<00:00,  1.15s/it][A
Epochs:  48%|████▊     | 20/42 [34:17<37:41, 102.79s/it]

Val Loss: 7.9443 - Val Accuracy: 0.9626



Training:   0%|          | 0/82 [00:00<?, ?it/s][A
Training:   1%|          | 1/82 [00:05<07:07,  5.28s/it][A
Training:   4%|▎         | 3/82 [00:05<01:58,  1.50s/it][A
Training:   5%|▍         | 4/82 [00:05<01:20,  1.03s/it][A
Training:   6%|▌         | 5/82 [00:09<02:34,  2.00s/it][A
Training:   7%|▋         | 6/82 [00:09<01:47,  1.41s/it][A
Training:   9%|▊         | 7/82 [00:10<01:17,  1.03s/it][A
Training:  10%|▉         | 8/82 [00:10<00:55,  1.34it/s][A
Training:  11%|█         | 9/82 [00:13<01:56,  1.59s/it][A
Training:  13%|█▎        | 11/82 [00:13<01:03,  1.11it/s][A
Training:  15%|█▍        | 12/82 [00:14<00:49,  1.42it/s][A
Training:  16%|█▌        | 13/82 [00:18<01:48,  1.57s/it][A
Training:  17%|█▋        | 14/82 [00:18<01:19,  1.17s/it][A
Training:  20%|█▉        | 16/82 [00:18<00:46,  1.42it/s][A
Training:  21%|██        | 17/82 [00:22<01:36,  1.48s/it][A
Training:  23%|██▎       | 19/82 [00:22<00:58,  1.08it/s][A
Training:  24%|██▍       | 20/82 [00:22<

Epoch: 21/42 - Loss: 7.0566 - Accuracy: 0.9725



  0%|          | 0/11 [00:00<?, ?it/s][A
  9%|▉         | 1/11 [00:04<00:45,  4.55s/it][A
 27%|██▋       | 3/11 [00:04<00:09,  1.23s/it][A
 45%|████▌     | 5/11 [00:08<00:09,  1.61s/it][A
 64%|██████▎   | 7/11 [00:08<00:03,  1.04it/s][A
 82%|████████▏ | 9/11 [00:12<00:02,  1.27s/it][A
100%|██████████| 11/11 [00:12<00:00,  1.15s/it][A
Epochs:  50%|█████     | 21/42 [36:00<36:03, 103.02s/it]

Val Loss: 10.0704 - Val Accuracy: 0.9621



Training:   0%|          | 0/82 [00:00<?, ?it/s][A
Training:   1%|          | 1/82 [00:05<07:07,  5.28s/it][A
Training:   4%|▎         | 3/82 [00:05<01:51,  1.42s/it][A
Training:   6%|▌         | 5/82 [00:08<02:03,  1.61s/it][A
Training:   7%|▋         | 6/82 [00:09<01:31,  1.21s/it][A
Training:   9%|▊         | 7/82 [00:09<01:07,  1.11it/s][A
Training:  11%|█         | 9/82 [00:13<01:46,  1.46s/it][A
Training:  13%|█▎        | 11/82 [00:13<01:06,  1.06it/s][A
Training:  16%|█▌        | 13/82 [00:17<01:32,  1.34s/it][A
Training:  18%|█▊        | 15/82 [00:18<01:02,  1.08it/s][A
Training:  20%|█▉        | 16/82 [00:18<00:50,  1.30it/s][A
Training:  21%|██        | 17/82 [00:21<01:31,  1.41s/it][A
Training:  23%|██▎       | 19/82 [00:22<00:58,  1.08it/s][A
Training:  24%|██▍       | 20/82 [00:22<00:46,  1.34it/s][A
Training:  26%|██▌       | 21/82 [00:26<01:28,  1.45s/it][A
Training:  27%|██▋       | 22/82 [00:26<01:07,  1.13s/it][A
Training:  28%|██▊       | 23/82 [00:2

Epoch: 22/42 - Loss: 7.0641 - Accuracy: 0.9694



  0%|          | 0/11 [00:00<?, ?it/s][A
  9%|▉         | 1/11 [00:04<00:49,  4.96s/it][A
 18%|█▊        | 2/11 [00:05<00:18,  2.11s/it][A
 36%|███▋      | 4/11 [00:05<00:05,  1.19it/s][A
 45%|████▌     | 5/11 [00:09<00:10,  1.75s/it][A
 73%|███████▎  | 8/11 [00:09<00:02,  1.28it/s][A
100%|██████████| 11/11 [00:12<00:00,  1.18s/it][A
Epochs:  52%|█████▏    | 22/42 [37:43<34:18, 102.91s/it]

Val Loss: 10.3817 - Val Accuracy: 0.9621



Training:   0%|          | 0/82 [00:00<?, ?it/s][A
Training:   1%|          | 1/82 [00:05<06:52,  5.09s/it][A
Training:   4%|▎         | 3/82 [00:05<01:47,  1.36s/it][A
Training:   6%|▌         | 5/82 [00:09<02:08,  1.67s/it][A
Training:   7%|▋         | 6/82 [00:09<01:34,  1.25s/it][A
Training:   9%|▊         | 7/82 [00:09<01:10,  1.06it/s][A
Training:  11%|█         | 9/82 [00:13<01:46,  1.46s/it][A
Training:  12%|█▏        | 10/82 [00:13<01:22,  1.15s/it][A
Training:  15%|█▍        | 12/82 [00:13<00:49,  1.41it/s][A
Training:  16%|█▌        | 13/82 [00:17<01:40,  1.45s/it][A
Training:  18%|█▊        | 15/82 [00:18<01:01,  1.10it/s][A
Training:  20%|█▉        | 16/82 [00:18<00:48,  1.36it/s][A
Training:  21%|██        | 17/82 [00:21<01:33,  1.43s/it][A
Training:  22%|██▏       | 18/82 [00:21<01:10,  1.09s/it][A
Training:  23%|██▎       | 19/82 [00:22<00:53,  1.19it/s][A
Training:  26%|██▌       | 21/82 [00:25<01:20,  1.32s/it][A
Training:  28%|██▊       | 23/82 [00:2

Epoch: 23/42 - Loss: 7.1557 - Accuracy: 0.9699



  0%|          | 0/11 [00:00<?, ?it/s][A
  9%|▉         | 1/11 [00:04<00:48,  4.84s/it][A
 18%|█▊        | 2/11 [00:04<00:18,  2.08s/it][A
 36%|███▋      | 4/11 [00:05<00:05,  1.21it/s][A
 45%|████▌     | 5/11 [00:09<00:10,  1.80s/it][A
 64%|██████▎   | 7/11 [00:09<00:03,  1.02it/s][A
100%|██████████| 11/11 [00:13<00:00,  1.18s/it][A
Epochs:  55%|█████▍    | 23/42 [39:26<32:35, 102.90s/it]

Val Loss: 8.4149 - Val Accuracy: 0.9621



Training:   0%|          | 0/82 [00:00<?, ?it/s][A
Training:   1%|          | 1/82 [00:04<06:20,  4.69s/it][A
Training:   4%|▎         | 3/82 [00:04<01:40,  1.27s/it][A
Training:   6%|▌         | 5/82 [00:09<02:10,  1.70s/it][A
Training:   7%|▋         | 6/82 [00:09<01:37,  1.28s/it][A
Training:  10%|▉         | 8/82 [00:09<00:55,  1.33it/s][A
Training:  11%|█         | 9/82 [00:13<01:51,  1.53s/it][A
Training:  12%|█▏        | 10/82 [00:13<01:24,  1.17s/it][A
Training:  15%|█▍        | 12/82 [00:13<00:49,  1.40it/s][A
Training:  16%|█▌        | 13/82 [00:17<01:41,  1.47s/it][A
Training:  20%|█▉        | 16/82 [00:17<00:50,  1.31it/s][A
Training:  22%|██▏       | 18/82 [00:21<01:16,  1.19s/it][A
Training:  24%|██▍       | 20/82 [00:22<00:51,  1.19it/s][A
Training:  27%|██▋       | 22/82 [00:26<01:14,  1.24s/it][A
Training:  29%|██▉       | 24/82 [00:26<00:51,  1.13it/s][A
Training:  30%|███       | 25/82 [00:30<01:22,  1.45s/it][A
Training:  32%|███▏      | 26/82 [00:3

Epoch: 24/42 - Loss: 7.0129 - Accuracy: 0.9719



  0%|          | 0/11 [00:00<?, ?it/s][A
  9%|▉         | 1/11 [00:04<00:45,  4.53s/it][A
 18%|█▊        | 2/11 [00:04<00:17,  1.95s/it][A
 36%|███▋      | 4/11 [00:04<00:05,  1.29it/s][A
 45%|████▌     | 5/11 [00:08<00:10,  1.73s/it][A
 64%|██████▎   | 7/11 [00:08<00:03,  1.05it/s][A
100%|██████████| 11/11 [00:12<00:00,  1.11s/it][A
Epochs:  57%|█████▋    | 24/42 [41:08<30:51, 102.86s/it]

Val Loss: 8.5197 - Val Accuracy: 0.9631



Training:   0%|          | 0/82 [00:00<?, ?it/s][A
Training:   1%|          | 1/82 [00:05<07:08,  5.29s/it][A
Training:   4%|▎         | 3/82 [00:05<01:52,  1.43s/it][A
Training:   5%|▍         | 4/82 [00:05<01:18,  1.00s/it][A
Training:   6%|▌         | 5/82 [00:09<02:41,  2.10s/it][A
Training:   9%|▊         | 7/82 [00:10<01:23,  1.11s/it][A
Training:  11%|█         | 9/82 [00:13<01:46,  1.45s/it][A
Training:  12%|█▏        | 10/82 [00:14<01:22,  1.15s/it][A
Training:  13%|█▎        | 11/82 [00:14<01:04,  1.10it/s][A
Training:  15%|█▍        | 12/82 [00:14<00:49,  1.42it/s][A
Training:  16%|█▌        | 13/82 [00:17<01:38,  1.42s/it][A
Training:  17%|█▋        | 14/82 [00:17<01:11,  1.06s/it][A
Training:  18%|█▊        | 15/82 [00:18<00:53,  1.25it/s][A
Training:  20%|█▉        | 16/82 [00:18<00:40,  1.65it/s][A
Training:  21%|██        | 17/82 [00:22<01:46,  1.64s/it][A
Training:  23%|██▎       | 19/82 [00:22<00:58,  1.08it/s][A
Training:  26%|██▌       | 21/82 [00:2

Epoch: 25/42 - Loss: 6.9079 - Accuracy: 0.9721



  0%|          | 0/11 [00:00<?, ?it/s][A
  9%|▉         | 1/11 [00:04<00:46,  4.67s/it][A
 18%|█▊        | 2/11 [00:04<00:17,  1.99s/it][A
 27%|██▋       | 3/11 [00:04<00:09,  1.14s/it][A
 36%|███▋      | 4/11 [00:05<00:05,  1.34it/s][A
 45%|████▌     | 5/11 [00:08<00:10,  1.73s/it][A
 73%|███████▎  | 8/11 [00:08<00:02,  1.41it/s][A
100%|██████████| 11/11 [00:11<00:00,  1.07s/it][A
Epochs:  60%|█████▉    | 25/42 [42:51<29:04, 102.65s/it]

Val Loss: 8.6460 - Val Accuracy: 0.9641



Training:   0%|          | 0/82 [00:00<?, ?it/s][A
Training:   1%|          | 1/82 [00:05<07:27,  5.52s/it][A
Training:   2%|▏         | 2/82 [00:05<03:07,  2.34s/it][A
Training:   4%|▎         | 3/82 [00:05<01:45,  1.34s/it][A
Training:   6%|▌         | 5/82 [00:09<02:15,  1.76s/it][A
Training:   9%|▊         | 7/82 [00:10<01:14,  1.00it/s][A
Training:  11%|█         | 9/82 [00:13<01:39,  1.37s/it][A
Training:  13%|█▎        | 11/82 [00:14<01:03,  1.11it/s][A
Training:  16%|█▌        | 13/82 [00:18<01:33,  1.35s/it][A
Training:  17%|█▋        | 14/82 [00:18<01:15,  1.11s/it][A
Training:  18%|█▊        | 15/82 [00:18<01:00,  1.10it/s][A
Training:  20%|█▉        | 16/82 [00:18<00:47,  1.40it/s][A
Training:  21%|██        | 17/82 [00:22<01:41,  1.56s/it][A
Training:  22%|██▏       | 18/82 [00:23<01:15,  1.18s/it][A
Training:  23%|██▎       | 19/82 [00:23<00:56,  1.11it/s][A
Training:  26%|██▌       | 21/82 [00:26<01:18,  1.29s/it][A
Training:  27%|██▋       | 22/82 [00:2

Epoch: 26/42 - Loss: 6.8766 - Accuracy: 0.9714



  0%|          | 0/11 [00:00<?, ?it/s][A
  9%|▉         | 1/11 [00:04<00:46,  4.69s/it][A
 18%|█▊        | 2/11 [00:04<00:18,  2.04s/it][A
 36%|███▋      | 4/11 [00:04<00:05,  1.26it/s][A
 45%|████▌     | 5/11 [00:08<00:09,  1.52s/it][A
 55%|█████▍    | 6/11 [00:08<00:05,  1.18s/it][A
 82%|████████▏ | 9/11 [00:11<00:02,  1.10s/it][A
100%|██████████| 11/11 [00:12<00:00,  1.11s/it][A
Epochs:  62%|██████▏   | 26/42 [44:34<27:25, 102.85s/it]

Val Loss: 9.9824 - Val Accuracy: 0.9605



Training:   0%|          | 0/82 [00:00<?, ?it/s][A
Training:   1%|          | 1/82 [00:04<06:25,  4.76s/it][A
Training:   2%|▏         | 2/82 [00:05<02:47,  2.10s/it][A
Training:   5%|▍         | 4/82 [00:05<01:04,  1.21it/s][A
Training:   6%|▌         | 5/82 [00:08<02:12,  1.73s/it][A
Training:   7%|▋         | 6/82 [00:09<01:37,  1.28s/it][A
Training:   9%|▊         | 7/82 [00:09<01:09,  1.08it/s][A
Training:  11%|█         | 9/82 [00:13<01:43,  1.42s/it][A
Training:  12%|█▏        | 10/82 [00:13<01:22,  1.15s/it][A
Training:  15%|█▍        | 12/82 [00:13<00:49,  1.41it/s][A
Training:  16%|█▌        | 13/82 [00:17<01:39,  1.44s/it][A
Training:  17%|█▋        | 14/82 [00:17<01:19,  1.17s/it][A
Training:  20%|█▉        | 16/82 [00:18<00:46,  1.42it/s][A
Training:  21%|██        | 17/82 [00:21<01:29,  1.38s/it][A
Training:  22%|██▏       | 18/82 [00:22<01:11,  1.11s/it][A
Training:  23%|██▎       | 19/82 [00:22<00:54,  1.15it/s][A
Training:  26%|██▌       | 21/82 [00:25

Epoch: 27/42 - Loss: 7.3694 - Accuracy: 0.9707



  0%|          | 0/11 [00:00<?, ?it/s][A
  9%|▉         | 1/11 [00:04<00:43,  4.33s/it][A
 27%|██▋       | 3/11 [00:04<00:09,  1.17s/it][A
 45%|████▌     | 5/11 [00:08<00:09,  1.56s/it][A
 64%|██████▎   | 7/11 [00:08<00:03,  1.09it/s][A
 82%|████████▏ | 9/11 [00:11<00:02,  1.24s/it][A
100%|██████████| 11/11 [00:12<00:00,  1.12s/it][A
Epochs:  64%|██████▍   | 27/42 [46:17<25:43, 102.91s/it]

Val Loss: 12.0639 - Val Accuracy: 0.9636



Training:   0%|          | 0/82 [00:00<?, ?it/s][A
Training:   1%|          | 1/82 [00:04<06:25,  4.76s/it][A
Training:   4%|▎         | 3/82 [00:04<01:41,  1.28s/it][A
Training:   6%|▌         | 5/82 [00:09<02:19,  1.81s/it][A
Training:   7%|▋         | 6/82 [00:09<01:44,  1.37s/it][A
Training:   9%|▊         | 7/82 [00:09<01:17,  1.03s/it][A
Training:  10%|▉         | 8/82 [00:09<00:57,  1.30it/s][A
Training:  11%|█         | 9/82 [00:14<02:06,  1.73s/it][A
Training:  13%|█▎        | 11/82 [00:14<01:10,  1.01it/s][A
Training:  15%|█▍        | 12/82 [00:14<00:54,  1.28it/s][A
Training:  16%|█▌        | 13/82 [00:18<01:46,  1.54s/it][A
Training:  18%|█▊        | 15/82 [00:18<01:01,  1.10it/s][A
Training:  21%|██        | 17/82 [00:22<01:27,  1.35s/it][A
Training:  22%|██▏       | 18/82 [00:22<01:10,  1.10s/it][A
Training:  23%|██▎       | 19/82 [00:22<00:54,  1.16it/s][A
Training:  26%|██▌       | 21/82 [00:26<01:23,  1.36s/it][A
Training:  28%|██▊       | 23/82 [00:27

Epoch: 28/42 - Loss: 6.8195 - Accuracy: 0.9712



  0%|          | 0/11 [00:00<?, ?it/s][A
  9%|▉         | 1/11 [00:04<00:40,  4.04s/it][A
 18%|█▊        | 2/11 [00:04<00:15,  1.75s/it][A
 36%|███▋      | 4/11 [00:04<00:04,  1.42it/s][A
 45%|████▌     | 5/11 [00:07<00:09,  1.61s/it][A
 55%|█████▍    | 6/11 [00:08<00:05,  1.16s/it][A
 64%|██████▎   | 7/11 [00:08<00:03,  1.18it/s][A
 73%|███████▎  | 8/11 [00:08<00:01,  1.61it/s][A
100%|██████████| 11/11 [00:11<00:00,  1.07s/it][A
Epochs:  67%|██████▋   | 28/42 [48:00<24:01, 102.93s/it]

Val Loss: 10.3629 - Val Accuracy: 0.9684



Training:   0%|          | 0/82 [00:00<?, ?it/s][A
Training:   1%|          | 1/82 [00:04<06:31,  4.83s/it][A
Training:   2%|▏         | 2/82 [00:04<02:46,  2.08s/it][A
Training:   4%|▎         | 3/82 [00:05<01:35,  1.21s/it][A
Training:   5%|▍         | 4/82 [00:05<01:02,  1.25it/s][A
Training:   6%|▌         | 5/82 [00:09<02:33,  2.00s/it][A
Training:   7%|▋         | 6/82 [00:09<01:44,  1.38s/it][A
Training:  10%|▉         | 8/82 [00:09<00:54,  1.36it/s][A
Training:  11%|█         | 9/82 [00:13<01:52,  1.55s/it][A
Training:  13%|█▎        | 11/82 [00:13<01:05,  1.08it/s][A
Training:  15%|█▍        | 12/82 [00:13<00:51,  1.37it/s][A
Training:  16%|█▌        | 13/82 [00:17<01:44,  1.52s/it][A
Training:  17%|█▋        | 14/82 [00:17<01:18,  1.15s/it][A
Training:  20%|█▉        | 16/82 [00:18<00:45,  1.46it/s][A
Training:  21%|██        | 17/82 [00:22<01:39,  1.53s/it][A
Training:  22%|██▏       | 18/82 [00:22<01:15,  1.18s/it][A
Training:  24%|██▍       | 20/82 [00:22<

Epoch: 29/42 - Loss: 7.6809 - Accuracy: 0.9717



  0%|          | 0/11 [00:00<?, ?it/s][A
  9%|▉         | 1/11 [00:04<00:45,  4.56s/it][A
 18%|█▊        | 2/11 [00:04<00:18,  2.01s/it][A
 36%|███▋      | 4/11 [00:04<00:05,  1.28it/s][A
 55%|█████▍    | 6/11 [00:08<00:06,  1.35s/it][A
 82%|████████▏ | 9/11 [00:11<00:02,  1.18s/it][A
100%|██████████| 11/11 [00:12<00:00,  1.12s/it][A
Epochs:  69%|██████▉   | 29/42 [49:43<22:18, 102.97s/it]

Val Loss: 9.8123 - Val Accuracy: 0.9610



Training:   0%|          | 0/82 [00:00<?, ?it/s][A
Training:   1%|          | 1/82 [00:04<06:34,  4.87s/it][A
Training:   2%|▏         | 2/82 [00:05<02:50,  2.13s/it][A
Training:   5%|▍         | 4/82 [00:05<01:05,  1.20it/s][A
Training:   6%|▌         | 5/82 [00:09<02:17,  1.79s/it][A
Training:   7%|▋         | 6/82 [00:09<01:41,  1.33s/it][A
Training:   9%|▊         | 7/82 [00:09<01:12,  1.04it/s][A
Training:  11%|█         | 9/82 [00:12<01:35,  1.30s/it][A
Training:  12%|█▏        | 10/82 [00:13<01:16,  1.07s/it][A
Training:  13%|█▎        | 11/82 [00:13<01:02,  1.14it/s][A
Training:  16%|█▌        | 13/82 [00:17<01:26,  1.26s/it][A
Training:  17%|█▋        | 14/82 [00:17<01:10,  1.04s/it][A
Training:  18%|█▊        | 15/82 [00:17<01:00,  1.11it/s][A
Training:  21%|██        | 17/82 [00:21<01:18,  1.21s/it][A
Training:  22%|██▏       | 18/82 [00:21<01:06,  1.04s/it][A
Training:  23%|██▎       | 19/82 [00:22<00:57,  1.10it/s][A
Training:  26%|██▌       | 21/82 [00:25

Epoch: 30/42 - Loss: 7.4289 - Accuracy: 0.9713



  0%|          | 0/11 [00:00<?, ?it/s][A
  9%|▉         | 1/11 [00:04<00:46,  4.67s/it][A
 27%|██▋       | 3/11 [00:04<00:10,  1.27s/it][A
 36%|███▋      | 4/11 [00:04<00:06,  1.15it/s][A
 45%|████▌     | 5/11 [00:08<00:10,  1.73s/it][A
 64%|██████▎   | 7/11 [00:08<00:03,  1.06it/s][A
100%|██████████| 11/11 [00:11<00:00,  1.09s/it][A
Epochs:  71%|███████▏  | 30/42 [51:25<20:33, 102.75s/it]

Val Loss: 8.6239 - Val Accuracy: 0.9615



Training:   0%|          | 0/82 [00:00<?, ?it/s][A
Training:   1%|          | 1/82 [00:05<07:03,  5.23s/it][A
Training:   2%|▏         | 2/82 [00:05<02:59,  2.24s/it][A
Training:   4%|▎         | 3/82 [00:05<01:41,  1.29s/it][A
Training:   5%|▍         | 4/82 [00:05<01:04,  1.21it/s][A
Training:   6%|▌         | 5/82 [00:09<02:25,  1.89s/it][A
Training:   7%|▋         | 6/82 [00:09<01:37,  1.28s/it][A
Training:  10%|▉         | 8/82 [00:09<00:50,  1.47it/s][A
Training:  11%|█         | 9/82 [00:13<01:53,  1.55s/it][A
Training:  12%|█▏        | 10/82 [00:13<01:23,  1.16s/it][A
Training:  15%|█▍        | 12/82 [00:14<00:49,  1.42it/s][A
Training:  16%|█▌        | 13/82 [00:18<01:45,  1.53s/it][A
Training:  18%|█▊        | 15/82 [00:18<01:03,  1.05it/s][A
Training:  21%|██        | 17/82 [00:22<01:29,  1.37s/it][A
Training:  22%|██▏       | 18/82 [00:22<01:11,  1.12s/it][A
Training:  24%|██▍       | 20/82 [00:22<00:44,  1.38it/s][A
Training:  26%|██▌       | 21/82 [00:26<

Epoch: 31/42 - Loss: 7.1006 - Accuracy: 0.9715



  0%|          | 0/11 [00:00<?, ?it/s][A
  9%|▉         | 1/11 [00:04<00:43,  4.33s/it][A
 18%|█▊        | 2/11 [00:04<00:16,  1.88s/it][A
 45%|████▌     | 5/11 [00:07<00:08,  1.36s/it][A
 55%|█████▍    | 6/11 [00:08<00:05,  1.04s/it][A
 64%|██████▎   | 7/11 [00:08<00:03,  1.26it/s][A
 82%|████████▏ | 9/11 [00:11<00:02,  1.16s/it][A
100%|██████████| 11/11 [00:11<00:00,  1.07s/it][A
Epochs:  74%|███████▍  | 31/42 [53:08<18:50, 102.79s/it]

Val Loss: 11.5451 - Val Accuracy: 0.9541



Training:   0%|          | 0/82 [00:00<?, ?it/s][A
Training:   1%|          | 1/82 [00:05<07:13,  5.35s/it][A
Training:   2%|▏         | 2/82 [00:05<03:01,  2.26s/it][A
Training:   5%|▍         | 4/82 [00:05<01:08,  1.14it/s][A
Training:   7%|▋         | 6/82 [00:09<01:50,  1.45s/it][A
Training:   9%|▊         | 7/82 [00:09<01:23,  1.12s/it][A
Training:  10%|▉         | 8/82 [00:09<01:02,  1.18it/s][A
Training:  11%|█         | 9/82 [00:14<02:06,  1.73s/it][A
Training:  12%|█▏        | 10/82 [00:14<01:32,  1.28s/it][A
Training:  13%|█▎        | 11/82 [00:14<01:07,  1.05it/s][A
Training:  15%|█▍        | 12/82 [00:14<00:49,  1.42it/s][A
Training:  16%|█▌        | 13/82 [00:18<01:50,  1.60s/it][A
Training:  18%|█▊        | 15/82 [00:18<01:00,  1.10it/s][A
Training:  20%|█▉        | 16/82 [00:18<00:46,  1.40it/s][A
Training:  21%|██        | 17/82 [00:22<01:42,  1.58s/it][A
Training:  22%|██▏       | 18/82 [00:22<01:15,  1.18s/it][A
Training:  23%|██▎       | 19/82 [00:22

Epoch: 32/42 - Loss: 7.5297 - Accuracy: 0.9706



  0%|          | 0/11 [00:00<?, ?it/s][A
  9%|▉         | 1/11 [00:04<00:40,  4.07s/it][A
 18%|█▊        | 2/11 [00:04<00:15,  1.76s/it][A
 27%|██▋       | 3/11 [00:04<00:08,  1.05s/it][A
 36%|███▋      | 4/11 [00:04<00:04,  1.47it/s][A
 45%|████▌     | 5/11 [00:08<00:10,  1.74s/it][A
 64%|██████▎   | 7/11 [00:08<00:03,  1.12it/s][A
 73%|███████▎  | 8/11 [00:08<00:02,  1.45it/s][A
 82%|████████▏ | 9/11 [00:11<00:02,  1.43s/it][A
100%|██████████| 11/11 [00:12<00:00,  1.10s/it][A
Epochs:  76%|███████▌  | 32/42 [54:51<17:08, 102.80s/it]

Val Loss: 9.6137 - Val Accuracy: 0.9631



Training:   0%|          | 0/82 [00:00<?, ?it/s][A
Training:   1%|          | 1/82 [00:05<06:46,  5.02s/it][A
Training:   2%|▏         | 2/82 [00:05<02:50,  2.13s/it][A
Training:   5%|▍         | 4/82 [00:05<01:04,  1.21it/s][A
Training:   7%|▋         | 6/82 [00:09<01:52,  1.49s/it][A
Training:  10%|▉         | 8/82 [00:09<01:09,  1.07it/s][A
Training:  11%|█         | 9/82 [00:13<01:54,  1.56s/it][A
Training:  12%|█▏        | 10/82 [00:13<01:27,  1.22s/it][A
Training:  13%|█▎        | 11/82 [00:13<01:06,  1.06it/s][A
Training:  15%|█▍        | 12/82 [00:14<00:50,  1.37it/s][A
Training:  16%|█▌        | 13/82 [00:18<01:57,  1.70s/it][A
Training:  18%|█▊        | 15/82 [00:18<01:05,  1.02it/s][A
Training:  21%|██        | 17/82 [00:22<01:30,  1.39s/it][A
Training:  23%|██▎       | 19/82 [00:22<00:58,  1.08it/s][A
Training:  26%|██▌       | 21/82 [00:27<01:21,  1.34s/it][A
Training:  27%|██▋       | 22/82 [00:27<01:06,  1.10s/it][A
Training:  28%|██▊       | 23/82 [00:2

Epoch: 33/42 - Loss: 7.1912 - Accuracy: 0.9715



  0%|          | 0/11 [00:00<?, ?it/s][A
  9%|▉         | 1/11 [00:03<00:39,  3.92s/it][A
 18%|█▊        | 2/11 [00:04<00:16,  1.81s/it][A
 27%|██▋       | 3/11 [00:04<00:08,  1.05s/it][A
 36%|███▋      | 4/11 [00:04<00:04,  1.42it/s][A
 45%|████▌     | 5/11 [00:08<00:10,  1.71s/it][A
 55%|█████▍    | 6/11 [00:08<00:06,  1.27s/it][A
 73%|███████▎  | 8/11 [00:08<00:02,  1.43it/s][A
 82%|████████▏ | 9/11 [00:11<00:02,  1.23s/it][A
100%|██████████| 11/11 [00:12<00:00,  1.10s/it][A
Epochs:  79%|███████▊  | 33/42 [56:34<15:25, 102.87s/it]

Val Loss: 8.2533 - Val Accuracy: 0.9652



Training:   0%|          | 0/82 [00:00<?, ?it/s][A
Training:   1%|          | 1/82 [00:04<06:27,  4.78s/it][A
Training:   2%|▏         | 2/82 [00:04<02:44,  2.05s/it][A
Training:   4%|▎         | 3/82 [00:05<01:33,  1.18s/it][A
Training:   5%|▍         | 4/82 [00:05<01:00,  1.30it/s][A
Training:   6%|▌         | 5/82 [00:09<02:28,  1.93s/it][A
Training:   9%|▊         | 7/82 [00:09<01:13,  1.02it/s][A
Training:  11%|█         | 9/82 [00:13<01:50,  1.52s/it][A
Training:  12%|█▏        | 10/82 [00:13<01:26,  1.20s/it][A
Training:  13%|█▎        | 11/82 [00:14<01:05,  1.08it/s][A
Training:  16%|█▌        | 13/82 [00:18<01:34,  1.37s/it][A
Training:  17%|█▋        | 14/82 [00:18<01:14,  1.10s/it][A
Training:  18%|█▊        | 15/82 [00:18<00:57,  1.16it/s][A
Training:  21%|██        | 17/82 [00:22<01:27,  1.34s/it][A
Training:  23%|██▎       | 19/82 [00:22<00:54,  1.15it/s][A
Training:  26%|██▌       | 21/82 [00:26<01:21,  1.33s/it][A
Training:  27%|██▋       | 22/82 [00:27

Epoch: 34/42 - Loss: 7.7756 - Accuracy: 0.9700



  0%|          | 0/11 [00:00<?, ?it/s][A
  9%|▉         | 1/11 [00:04<00:45,  4.51s/it][A
 18%|█▊        | 2/11 [00:04<00:17,  1.94s/it][A
 27%|██▋       | 3/11 [00:04<00:08,  1.11s/it][A
 45%|████▌     | 5/11 [00:08<00:09,  1.55s/it][A
 64%|██████▎   | 7/11 [00:08<00:03,  1.12it/s][A
100%|██████████| 11/11 [00:11<00:00,  1.09s/it][A
Epochs:  81%|████████  | 34/42 [58:17<13:43, 102.96s/it]

Val Loss: 13.3089 - Val Accuracy: 0.9563



Training:   0%|          | 0/82 [00:00<?, ?it/s][A
Training:   1%|          | 1/82 [00:05<06:58,  5.17s/it][A
Training:   4%|▎         | 3/82 [00:05<01:49,  1.39s/it][A
Training:   6%|▌         | 5/82 [00:09<02:16,  1.77s/it][A
Training:   7%|▋         | 6/82 [00:09<01:44,  1.38s/it][A
Training:  10%|▉         | 8/82 [00:09<00:59,  1.24it/s][A
Training:  11%|█         | 9/82 [00:13<01:45,  1.45s/it][A
Training:  12%|█▏        | 10/82 [00:14<01:28,  1.24s/it][A
Training:  15%|█▍        | 12/82 [00:14<00:51,  1.35it/s][A
Training:  16%|█▌        | 13/82 [00:17<01:33,  1.35s/it][A
Training:  17%|█▋        | 14/82 [00:18<01:21,  1.20s/it][A
Training:  20%|█▉        | 16/82 [00:18<00:47,  1.38it/s][A
Training:  21%|██        | 17/82 [00:21<01:27,  1.35s/it][A
Training:  22%|██▏       | 18/82 [00:22<01:18,  1.23s/it][A
Training:  23%|██▎       | 19/82 [00:22<00:59,  1.06it/s][A
Training:  26%|██▌       | 21/82 [00:26<01:16,  1.25s/it][A
Training:  27%|██▋       | 22/82 [00:2

Epoch: 35/42 - Loss: 7.3959 - Accuracy: 0.9718



  0%|          | 0/11 [00:00<?, ?it/s][A
  9%|▉         | 1/11 [00:04<00:45,  4.51s/it][A
 18%|█▊        | 2/11 [00:04<00:17,  1.92s/it][A
 36%|███▋      | 4/11 [00:04<00:05,  1.32it/s][A
 45%|████▌     | 5/11 [00:08<00:09,  1.58s/it][A
 64%|██████▎   | 7/11 [00:08<00:03,  1.13it/s][A
 82%|████████▏ | 9/11 [00:11<00:02,  1.14s/it][A
100%|██████████| 11/11 [00:11<00:00,  1.07s/it][A
Epochs:  83%|████████▎ | 35/42 [59:59<11:59, 102.72s/it]

Val Loss: 9.4421 - Val Accuracy: 0.9668



Training:   0%|          | 0/82 [00:00<?, ?it/s][A
Training:   1%|          | 1/82 [00:05<07:30,  5.56s/it][A
Training:   4%|▎         | 3/82 [00:05<01:57,  1.49s/it][A
Training:   5%|▍         | 4/82 [00:05<01:20,  1.03s/it][A
Training:   6%|▌         | 5/82 [00:09<02:34,  2.01s/it][A
Training:   9%|▊         | 7/82 [00:10<01:20,  1.07s/it][A
Training:  11%|█         | 9/82 [00:14<01:52,  1.54s/it][A
Training:  13%|█▎        | 11/82 [00:14<01:11,  1.00s/it][A
Training:  16%|█▌        | 13/82 [00:18<01:37,  1.41s/it][A
Training:  17%|█▋        | 14/82 [00:19<01:18,  1.16s/it][A
Training:  18%|█▊        | 15/82 [00:19<01:02,  1.08it/s][A
Training:  21%|██        | 17/82 [00:23<01:28,  1.37s/it][A
Training:  23%|██▎       | 19/82 [00:23<00:57,  1.10it/s][A
Training:  26%|██▌       | 21/82 [00:27<01:20,  1.32s/it][A
Training:  27%|██▋       | 22/82 [00:27<01:05,  1.09s/it][A
Training:  28%|██▊       | 23/82 [00:28<00:51,  1.14it/s][A
Training:  29%|██▉       | 24/82 [00:2

Epoch: 36/42 - Loss: 7.0697 - Accuracy: 0.9731



  0%|          | 0/11 [00:00<?, ?it/s][A
  9%|▉         | 1/11 [00:04<00:41,  4.11s/it][A
 18%|█▊        | 2/11 [00:04<00:16,  1.87s/it][A
 36%|███▋      | 4/11 [00:04<00:05,  1.31it/s][A
 45%|████▌     | 5/11 [00:07<00:09,  1.51s/it][A
 55%|█████▍    | 6/11 [00:08<00:05,  1.11s/it][A
 73%|███████▎  | 8/11 [00:08<00:01,  1.59it/s][A
 82%|████████▏ | 9/11 [00:11<00:02,  1.24s/it][A
100%|██████████| 11/11 [00:11<00:00,  1.06s/it][A
Epochs:  86%|████████▌ | 36/42 [1:01:43<10:17, 102.93s/it]

Val Loss: 9.9402 - Val Accuracy: 0.9631



Training:   0%|          | 0/82 [00:00<?, ?it/s][A
Training:   1%|          | 1/82 [00:05<07:08,  5.29s/it][A
Training:   4%|▎         | 3/82 [00:05<01:52,  1.42s/it][A
Training:   6%|▌         | 5/82 [00:09<02:16,  1.77s/it][A
Training:   9%|▊         | 7/82 [00:09<01:19,  1.06s/it][A
Training:  11%|█         | 9/82 [00:13<01:45,  1.45s/it][A
Training:  12%|█▏        | 10/82 [00:14<01:24,  1.17s/it][A
Training:  13%|█▎        | 11/82 [00:14<01:05,  1.09it/s][A
Training:  16%|█▌        | 13/82 [00:18<01:36,  1.39s/it][A
Training:  17%|█▋        | 14/82 [00:18<01:15,  1.11s/it][A
Training:  18%|█▊        | 15/82 [00:18<00:58,  1.14it/s][A
Training:  20%|█▉        | 16/82 [00:18<00:45,  1.45it/s][A
Training:  21%|██        | 17/82 [00:22<01:41,  1.56s/it][A
Training:  23%|██▎       | 19/82 [00:22<00:57,  1.09it/s][A
Training:  26%|██▌       | 21/82 [00:27<01:22,  1.36s/it][A
Training:  28%|██▊       | 23/82 [00:27<00:54,  1.08it/s][A
Training:  29%|██▉       | 24/82 [00:

Epoch: 37/42 - Loss: 7.1458 - Accuracy: 0.9733



  0%|          | 0/11 [00:00<?, ?it/s][A
  9%|▉         | 1/11 [00:04<00:40,  4.06s/it][A
 18%|█▊        | 2/11 [00:04<00:15,  1.73s/it][A
 36%|███▋      | 4/11 [00:04<00:04,  1.46it/s][A
 55%|█████▍    | 6/11 [00:08<00:06,  1.27s/it][A
 64%|██████▎   | 7/11 [00:08<00:03,  1.02it/s][A
 82%|████████▏ | 9/11 [00:11<00:02,  1.27s/it][A
100%|██████████| 11/11 [00:11<00:00,  1.08s/it][A
Epochs:  88%|████████▊ | 37/42 [1:03:25<08:33, 102.70s/it]

Val Loss: 8.9635 - Val Accuracy: 0.9668



Training:   0%|          | 0/82 [00:00<?, ?it/s][A
Training:   1%|          | 1/82 [00:04<06:35,  4.88s/it][A
Training:   4%|▎         | 3/82 [00:05<01:43,  1.31s/it][A
Training:   6%|▌         | 5/82 [00:09<02:12,  1.72s/it][A
Training:   7%|▋         | 6/82 [00:09<01:40,  1.33s/it][A
Training:  10%|▉         | 8/82 [00:09<00:57,  1.28it/s][A
Training:  11%|█         | 9/82 [00:13<01:52,  1.53s/it][A
Training:  12%|█▏        | 10/82 [00:14<01:31,  1.27s/it][A
Training:  13%|█▎        | 11/82 [00:14<01:08,  1.04it/s][A
Training:  15%|█▍        | 12/82 [00:14<00:51,  1.36it/s][A
Training:  16%|█▌        | 13/82 [00:17<01:46,  1.54s/it][A
Training:  17%|█▋        | 14/82 [00:18<01:21,  1.20s/it][A
Training:  18%|█▊        | 15/82 [00:18<00:58,  1.14it/s][A
Training:  21%|██        | 17/82 [00:22<01:32,  1.42s/it][A
Training:  22%|██▏       | 18/82 [00:22<01:13,  1.15s/it][A
Training:  24%|██▍       | 20/82 [00:22<00:43,  1.42it/s][A
Training:  26%|██▌       | 21/82 [00:2

Epoch: 38/42 - Loss: 7.1653 - Accuracy: 0.9720



  0%|          | 0/11 [00:00<?, ?it/s][A
  9%|▉         | 1/11 [00:04<00:45,  4.53s/it][A
 18%|█▊        | 2/11 [00:04<00:17,  1.96s/it][A
 27%|██▋       | 3/11 [00:04<00:09,  1.14s/it][A
 36%|███▋      | 4/11 [00:04<00:05,  1.37it/s][A
 45%|████▌     | 5/11 [00:08<00:10,  1.71s/it][A
 55%|█████▍    | 6/11 [00:08<00:06,  1.22s/it][A
 64%|██████▎   | 7/11 [00:08<00:03,  1.16it/s][A
 82%|████████▏ | 9/11 [00:11<00:02,  1.20s/it][A
100%|██████████| 11/11 [00:12<00:00,  1.12s/it][A
Epochs:  90%|█████████ | 38/42 [1:05:08<06:50, 102.75s/it]

Val Loss: 10.9433 - Val Accuracy: 0.9621



Training:   0%|          | 0/82 [00:00<?, ?it/s][A
Training:   1%|          | 1/82 [00:05<07:06,  5.26s/it][A
Training:   2%|▏         | 2/82 [00:05<03:08,  2.36s/it][A
Training:   5%|▍         | 4/82 [00:05<01:13,  1.06it/s][A
Training:   6%|▌         | 5/82 [00:09<02:20,  1.83s/it][A
Training:   7%|▋         | 6/82 [00:09<01:41,  1.33s/it][A
Training:   9%|▊         | 7/82 [00:09<01:12,  1.04it/s][A
Training:  11%|█         | 9/82 [00:13<01:42,  1.40s/it][A
Training:  12%|█▏        | 10/82 [00:14<01:27,  1.21s/it][A
Training:  13%|█▎        | 11/82 [00:14<01:07,  1.06it/s][A
Training:  15%|█▍        | 12/82 [00:14<00:50,  1.38it/s][A
Training:  16%|█▌        | 13/82 [00:18<01:41,  1.47s/it][A
Training:  17%|█▋        | 14/82 [00:18<01:24,  1.24s/it][A
Training:  18%|█▊        | 15/82 [00:18<01:02,  1.07it/s][A
Training:  20%|█▉        | 16/82 [00:19<00:45,  1.44it/s][A
Training:  21%|██        | 17/82 [00:22<01:37,  1.51s/it][A
Training:  22%|██▏       | 18/82 [00:23

Epoch: 39/42 - Loss: 7.2549 - Accuracy: 0.9715



  0%|          | 0/11 [00:00<?, ?it/s][A
  9%|▉         | 1/11 [00:04<00:47,  4.76s/it][A
 27%|██▋       | 3/11 [00:04<00:10,  1.29s/it][A
 36%|███▋      | 4/11 [00:05<00:06,  1.14it/s][A
 45%|████▌     | 5/11 [00:08<00:10,  1.82s/it][A
 64%|██████▎   | 7/11 [00:08<00:03,  1.03it/s][A
100%|██████████| 11/11 [00:12<00:00,  1.16s/it][A
Epochs:  93%|█████████▎| 39/42 [1:06:50<05:08, 102.69s/it]

Val Loss: 11.0511 - Val Accuracy: 0.9647



Training:   0%|          | 0/82 [00:00<?, ?it/s][A
Training:   1%|          | 1/82 [00:05<06:52,  5.09s/it][A
Training:   2%|▏         | 2/82 [00:05<03:09,  2.37s/it][A
Training:   4%|▎         | 3/82 [00:05<01:46,  1.34s/it][A
Training:   6%|▌         | 5/82 [00:09<02:12,  1.72s/it][A
Training:   7%|▋         | 6/82 [00:10<01:41,  1.34s/it][A
Training:   9%|▊         | 7/82 [00:10<01:14,  1.01it/s][A
Training:  10%|▉         | 8/82 [00:10<00:54,  1.36it/s][A
Training:  11%|█         | 9/82 [00:14<01:57,  1.61s/it][A
Training:  12%|█▏        | 10/82 [00:14<01:32,  1.28s/it][A
Training:  15%|█▍        | 12/82 [00:14<00:51,  1.36it/s][A
Training:  16%|█▌        | 13/82 [00:18<01:41,  1.47s/it][A
Training:  17%|█▋        | 14/82 [00:18<01:23,  1.22s/it][A
Training:  18%|█▊        | 15/82 [00:19<01:02,  1.07it/s][A
Training:  20%|█▉        | 16/82 [00:19<00:47,  1.38it/s][A
Training:  21%|██        | 17/82 [00:22<01:38,  1.52s/it][A
Training:  22%|██▏       | 18/82 [00:23<

Epoch: 40/42 - Loss: 7.3768 - Accuracy: 0.9725



  0%|          | 0/11 [00:00<?, ?it/s][A
  9%|▉         | 1/11 [00:04<00:43,  4.38s/it][A
 18%|█▊        | 2/11 [00:04<00:17,  1.93s/it][A
 27%|██▋       | 3/11 [00:04<00:08,  1.10s/it][A
 45%|████▌     | 5/11 [00:08<00:09,  1.53s/it][A
 64%|██████▎   | 7/11 [00:08<00:03,  1.13it/s][A
 73%|███████▎  | 8/11 [00:08<00:02,  1.42it/s][A
 82%|████████▏ | 9/11 [00:11<00:02,  1.36s/it][A
100%|██████████| 11/11 [00:12<00:00,  1.13s/it][A
Epochs:  95%|█████████▌| 40/42 [1:08:33<03:25, 102.84s/it]

Val Loss: 10.2745 - Val Accuracy: 0.9615



Training:   0%|          | 0/82 [00:00<?, ?it/s][A
Training:   1%|          | 1/82 [00:04<06:43,  4.98s/it][A
Training:   2%|▏         | 2/82 [00:05<02:54,  2.18s/it][A
Training:   5%|▍         | 4/82 [00:05<01:06,  1.17it/s][A
Training:   6%|▌         | 5/82 [00:09<02:22,  1.85s/it][A
Training:   7%|▋         | 6/82 [00:09<01:44,  1.38s/it][A
Training:  10%|▉         | 8/82 [00:09<00:56,  1.30it/s][A
Training:  11%|█         | 9/82 [00:13<01:50,  1.52s/it][A
Training:  12%|█▏        | 10/82 [00:13<01:26,  1.20s/it][A
Training:  13%|█▎        | 11/82 [00:14<01:07,  1.05it/s][A
Training:  15%|█▍        | 12/82 [00:14<00:49,  1.41it/s][A
Training:  16%|█▌        | 13/82 [00:18<01:51,  1.62s/it][A
Training:  17%|█▋        | 14/82 [00:18<01:22,  1.22s/it][A
Training:  18%|█▊        | 15/82 [00:18<01:08,  1.02s/it][A
Training:  21%|██        | 17/82 [00:22<01:34,  1.46s/it][A
Training:  22%|██▏       | 18/82 [00:23<01:12,  1.14s/it][A
Training:  23%|██▎       | 19/82 [00:23

Epoch: 41/42 - Loss: 7.4954 - Accuracy: 0.9720



  0%|          | 0/11 [00:00<?, ?it/s][A
  9%|▉         | 1/11 [00:04<00:42,  4.25s/it][A
 18%|█▊        | 2/11 [00:04<00:17,  1.96s/it][A
 27%|██▋       | 3/11 [00:04<00:08,  1.12s/it][A
 45%|████▌     | 5/11 [00:08<00:09,  1.52s/it][A
 55%|█████▍    | 6/11 [00:08<00:05,  1.16s/it][A
 73%|███████▎  | 8/11 [00:08<00:01,  1.50it/s][A
 82%|████████▏ | 9/11 [00:11<00:02,  1.26s/it][A
100%|██████████| 11/11 [00:12<00:00,  1.14s/it][A
Epochs:  98%|█████████▊| 41/42 [1:10:15<01:42, 102.45s/it]

Val Loss: 11.1347 - Val Accuracy: 0.9615



Training:   0%|          | 0/82 [00:00<?, ?it/s][A
Training:   1%|          | 1/82 [00:05<07:34,  5.61s/it][A
Training:   2%|▏         | 2/82 [00:05<03:13,  2.41s/it][A
Training:   4%|▎         | 3/82 [00:05<01:49,  1.38s/it][A
Training:   5%|▍         | 4/82 [00:06<01:09,  1.13it/s][A
Training:   6%|▌         | 5/82 [00:10<02:40,  2.08s/it][A
Training:   7%|▋         | 6/82 [00:10<01:48,  1.42s/it][A
Training:   9%|▊         | 7/82 [00:10<01:14,  1.01it/s][A
Training:  10%|▉         | 8/82 [00:10<00:52,  1.41it/s][A
Training:  11%|█         | 9/82 [00:14<02:08,  1.76s/it][A
Training:  12%|█▏        | 10/82 [00:14<01:30,  1.26s/it][A
Training:  13%|█▎        | 11/82 [00:14<01:04,  1.10it/s][A
Training:  15%|█▍        | 12/82 [00:15<00:49,  1.41it/s][A
Training:  16%|█▌        | 13/82 [00:18<01:51,  1.61s/it][A
Training:  17%|█▋        | 14/82 [00:19<01:18,  1.16s/it][A
Training:  20%|█▉        | 16/82 [00:19<00:53,  1.23it/s][A
Training:  21%|██        | 17/82 [00:23<0

Epoch: 42/42 - Loss: 7.2207 - Accuracy: 0.9723



  0%|          | 0/11 [00:00<?, ?it/s][A
  9%|▉         | 1/11 [00:04<00:47,  4.79s/it][A
 27%|██▋       | 3/11 [00:04<00:10,  1.29s/it][A
 36%|███▋      | 4/11 [00:05<00:06,  1.08it/s][A
 45%|████▌     | 5/11 [00:08<00:10,  1.83s/it][A
 64%|██████▎   | 7/11 [00:08<00:03,  1.02it/s][A
 73%|███████▎  | 8/11 [00:09<00:02,  1.29it/s][A
100%|██████████| 11/11 [00:12<00:00,  1.15s/it][A
Epochs: 100%|██████████| 42/42 [1:11:58<00:00, 102.82s/it]


Val Loss: 10.3907 - Val Accuracy: 0.9610


[32m[I 2023-12-09 00:03:40,834][0m Trial 19 finished with value: 0.9610147476196289 and parameters: {'loss_learning_rate': 0.0026095667746146318, 'learning_rate': 0.0007654254891103729, 'weight_decay': 0.0018147852099258965, 'epsilon': 8.897455126188771e-08, 'beta': 0.8, 'gamma': 0.9, 'batch_size': 172, 'epochs': 42}. Best is trial 17 with value: 0.9676252007484436.[0m



Study statistics: 
  Number of finished trials:  20
  Number of pruned trials:  9
  Number of complete trials:  11


In [28]:
print("Best trial:")
trial = study.best_trial

print("  Value: ", trial.value)

print("  Params: ")
for key, value in trial.params.items():
    print("    {}: {}".format(key, value))

Best trial:
  Value:  0.9676252007484436
  Params: 
    batch_size: 266
    beta: 0.8
    epochs: 37
    epsilon: 9.402328890865692e-08
    gamma: 0.9
    learning_rate: 0.000633457353251843
    loss_learning_rate: 0.008447568694221697
    weight_decay: 0.001876909923779263


In [None]:
# ViT P12-S8 Triplet ArcFace Mean

Best trial:
Value:  0.9676252007484436
Params: 
batch_size: 266
beta: 0.8
epochs: 37
epsilon: 9.402328890865692e-08
gamma: 0.9
learning_rate: 0.000633457353251843
loss_learning_rate: 0.008447568694221697
weight_decay: 0.001876909923779263