In [1]:
import os
import random
import pandas as pd
import numpy as np
import mxnet as mx
import torch
import torch.nn as nn
import torch.nn.functional as F
import torch.optim as opt
from torch.utils.data import Dataset, DataLoader
from einops import rearrange, repeat
import optuna
from optuna.trial import TrialState
from tqdm import tqdm

In [2]:
def file_to_embed(embeds, file):
    """Gather cached embeddings for a batch of file names.

    Args:
        embeds: mapping from file name to an indexable embedding container;
            only element ``[0]`` of each entry is used.
        file: iterable of file names (keys of ``embeds``).

    Returns:
        The tensor obtained by stacking ``embeds[name][0]`` for every name,
        in the order the names were given.
    """
    return torch.stack([embeds[name][0] for name in file])

In [3]:
# Lower bound used by ViTs_face.__init__, which asserts that the number of
# patches is strictly greater than this value.
MIN_NUM_PATCHES = 16

In [4]:
# Use the first CUDA GPU when one is available, otherwise fall back to the CPU.
device = torch.device("cuda:0" if torch.cuda.is_available() else "cpu")
# Bare expression so the notebook displays the selected device.
device

device(type='cuda', index=0)

In [5]:
class AdienceDataset(Dataset):
    """Image dataset driven by a header-less CSV of ``(file name, label)`` rows.

    In plain mode (``train=False``) an item is ``(image, label, img_file)``.
    In triplet mode (``train=True``) an item additionally carries a randomly
    drawn positive (same label, different row) and negative (different label):
    ``(image, pos_image, neg_image, label, img_file, positive_img, negative_img)``.

    Args:
        annot_file: path of the CSV file; column 0 is the image file name and
            column 1 is the label.
        img_dir: directory the file names are relative to.
        train: enable triplet mode.
    """

    def __init__(self, annot_file, img_dir, train=False):
        self.img_lbls = pd.read_csv(annot_file, header=None)
        self.img_dir = img_dir
        self.is_train = train

    def __len__(self):
        return len(self.img_lbls)

    def _load_image(self, file_name):
        """Read ``file_name`` from ``img_dir`` and return it as a float CHW tensor."""
        image = mx.image.imread(os.path.join(self.img_dir, file_name))
        # Only images whose second dimension is not 112 are resized
        # (shorter edge -> 112).
        if image.shape[1] != 112:
            image = mx.image.resize_short(image, 112)
        image = mx.nd.transpose(image, axes=(2, 0, 1))
        return torch.tensor(image.asnumpy()).type(torch.FloatTensor)

    @staticmethod
    def _choose(candidates, role, idx):
        """Pick one row index at random, failing loudly when there is none.

        ``random.choice`` on an empty pool raises ``IndexError``; inside
        ``__getitem__`` that would be mistaken for "end of sequence" when the
        dataset is iterated directly, silently truncating the loop.
        """
        if len(candidates) == 0:
            raise ValueError(
                "no {} sample available for row {}".format(role, idx)
            )
        return random.choice(candidates)

    def __getitem__(self, idx):
        # An out-of-range idx raises IndexError here, which is what terminates
        # a plain ``for item in dataset`` loop.
        img_file = self.img_lbls.iloc[idx, 0]
        image = self._load_image(img_file)
        label = self.img_lbls.iloc[idx, 1]

        if not self.is_train:
            return image, label, img_file

        same_label = self.img_lbls.iloc[:, 1] == label

        # Positive: another row with the same label (the anchor row is excluded).
        positive_list = self.img_lbls[same_label].index.values
        positive_list = np.setdiff1d(positive_list, np.array([idx]))
        positive_item = self._choose(positive_list, "positive", idx)
        positive_img = self.img_lbls.iloc[positive_item, 0]
        pos_image = self._load_image(positive_img)

        # Negative: any row with a different label.
        negative_list = self.img_lbls[~same_label].index.values
        negative_item = self._choose(negative_list, "negative", idx)
        negative_img = self.img_lbls.iloc[negative_item, 0]
        neg_image = self._load_image(negative_img)

        return image, pos_image, neg_image, label, img_file, positive_img, negative_img

In [6]:
# Plain (non-triplet) mode: indexing these datasets yields
# (image, label, img_file).
train_data = AdienceDataset("../train.csv", "../cropped_Adience/", train=False)
val_data = AdienceDataset("../val.csv", "../cropped_Adience/", train=False)

In [20]:
# Triplet mode: indexing yields the 7-tuple
# (image, pos_image, neg_image, label, img_file, positive_img, negative_img)
# that the Optuna objective's loaders unpack.
# NOTE(review): this rebinds train_data/val_data. The execution count (In [20])
# shows the cell was originally run after the embedding cell (In [19]), which
# unpacks 3-tuples from the plain-mode datasets.
train_data = AdienceDataset("../train.csv", "../cropped_Adience/", train=True)
val_data = AdienceDataset("../val.csv", "../cropped_Adience/", train=True)

In [7]:
class TripletLoss(nn.Module):
    """Triplet margin loss computed on squared Euclidean distances.

    For each row: ``relu(d(anchor, positive) - d(anchor, negative) + margin)``,
    averaged over the batch.

    Args:
        margin: additive margin applied before the ReLU.
    """

    def __init__(self, margin=1.0):
        super().__init__()
        self.margin = margin

    def calc_euclidean(self, x1, x2):
        """Return the squared L2 distance along dim 1 (no square root is taken)."""
        delta = x1 - x2
        return delta.pow(2).sum(dim=1)

    def forward(self, anchor, positive, negative):
        """Return the batch-mean triplet loss."""
        gap = self.calc_euclidean(anchor, positive) - self.calc_euclidean(anchor, negative)
        return torch.relu(gap + self.margin).mean()

In [8]:
class CombinedLoss(nn.Module):
    """Sum of a weighted triplet loss and a cross-entropy classification loss.

    ``total = beta * TripletLoss(margin=1.0)(anchor, positive, negative)
    + CrossEntropyLoss()(classification_out, labels)``

    Args:
        beta: weight applied to the triplet term.
    """

    def __init__(self, beta=1.0):
        super().__init__()
        self.beta = beta
        self.triplet = TripletLoss(margin=1.0)
        self.classification = nn.CrossEntropyLoss()

    def forward(self, anchor, positive, negative, classification_out, labels):
        """Return the combined scalar loss for one batch."""
        metric_term = self.beta * self.triplet(anchor, positive, negative)
        ce_term = self.classification(classification_out, labels)
        return metric_term + ce_term

In [9]:
class CosFace(nn.Module):
    r"""Implementation of CosFace (https://arxiv.org/pdf/1801.09414.pdf).

    The logit of the ground-truth class is ``s * (cos(theta) - m)``; every
    other logit is ``s * cos(theta)``.

    Args:
        in_features: size of each input sample
        out_features: size of each output sample (number of classes)
        device_id: ``None`` to compute on whatever device the input and the
            weight already live on, or a list of devices (``torch.device``
            objects or CUDA ordinals). With a list, the class weights are
            chunked across the devices and the partial logits are gathered
            on ``device_id[0]``.
        s: scale applied to the logits
        m: cosine margin
    """

    def __init__(self, in_features, out_features, device_id, s=64.0, m=0.35):
        super(CosFace, self).__init__()
        self.in_features = in_features
        self.out_features = out_features
        self.device_id = device_id
        self.s = s
        self.m = m
        print("self.device_id", self.device_id)
        self.weight = nn.Parameter(torch.FloatTensor(out_features, in_features))
        nn.init.xavier_uniform_(self.weight)

    def forward(self, input, label):
        """Return the scaled margin logits, shape ``(batch, out_features)``."""
        # --------------------------- cos(theta) ---------------------------
        if self.device_id is None:
            cosine = F.linear(F.normalize(input), F.normalize(self.weight))
        else:
            primary = self.device_id[0]
            sub_weights = torch.chunk(self.weight, len(self.device_id), dim=0)
            partial = []
            for dev, sub_weight in zip(self.device_id, sub_weights):
                # ``.to`` (unlike ``.cuda``) also accepts a CPU device, so the
                # layer keeps working when no GPU is available.
                logits = F.linear(F.normalize(input.to(dev)), F.normalize(sub_weight.to(dev)))
                partial.append(logits.to(primary))
            cosine = torch.cat(partial, dim=1)
        phi = cosine - self.m

        # --------------------------- one-hot targets ---------------------------
        # Allocate next to ``cosine`` so device and dtype always match.
        one_hot = torch.zeros_like(cosine)
        one_hot.scatter_(1, label.view(-1, 1).long().to(cosine.device), 1)

        # Margin-penalised cosine for the target class, plain cosine elsewhere.
        output = (one_hot * phi) + ((1.0 - one_hot) * cosine)
        output *= self.s

        return output

    def __repr__(self):
        return self.__class__.__name__ + '(' \
               + 'in_features = ' + str(self.in_features) \
               + ', out_features = ' + str(self.out_features) \
               + ', s = ' + str(self.s) \
               + ', m = ' + str(self.m) + ')'

In [10]:
class Residual(nn.Module):
    """Skip-connection wrapper: returns ``fn(x, **kwargs) + x``."""

    def __init__(self, fn):
        super().__init__()
        self.fn = fn

    def forward(self, x, **kwargs):
        branch = self.fn(x, **kwargs)
        return branch + x

In [11]:
class PreNorm(nn.Module):
    """Apply ``LayerNorm(dim)`` to the input, then call ``fn`` on the result.

    Extra keyword arguments given to ``forward`` are passed on to ``fn``.
    """

    def __init__(self, dim, fn):
        super().__init__()
        self.norm = nn.LayerNorm(dim)
        self.fn = fn

    def forward(self, x, **kwargs):
        normed = self.norm(x)
        return self.fn(normed, **kwargs)

In [12]:
class FeedForward(nn.Module):
    """Two-layer MLP: Linear -> GELU -> Dropout -> Linear -> Dropout.

    Args:
        dim: input and output width.
        hidden_dim: width of the hidden layer.
        dropout: dropout probability used after the activation and after the
            output projection.
    """

    def __init__(self, dim, hidden_dim, dropout = 0.):
        super().__init__()
        # The position of each stage fixes its ``net.<index>`` parameter name.
        stages = [
            nn.Linear(dim, hidden_dim),
            nn.GELU(),
            nn.Dropout(dropout),
            nn.Linear(hidden_dim, dim),
            nn.Dropout(dropout),
        ]
        self.net = nn.Sequential(*stages)

    def forward(self, x):
        return self.net(x)

In [13]:
class Attention(nn.Module):
    """Multi-head self-attention over a ``(batch, tokens, dim)`` input.

    Args:
        dim: width of the input and output tokens.
        heads: number of attention heads.
        dim_head: width of each head.
        dropout: dropout probability applied after the output projection.
    """

    def __init__(self, dim, heads = 8, dim_head = 64, dropout = 0.):
        super().__init__()
        inner_dim = dim_head * heads
        self.heads = heads
        # NOTE(review): the scores are scaled by the model width ``dim`` rather
        # than by ``dim_head``. Left unchanged: the pretrained checkpoint this
        # notebook loads was presumably trained with this scale — confirm
        # before altering it.
        self.scale = dim ** -0.5

        self.to_qkv = nn.Linear(dim, inner_dim * 3, bias = False)
        self.to_out = nn.Sequential(
            nn.Linear(inner_dim, dim),
            nn.Dropout(dropout)
        )

    def forward(self, x, mask = None):
        """Attend over the token axis.

        Args:
            x: tensor of shape ``(b, n, dim)``.
            mask: optional boolean tensor that flattens to ``(b, n - 1)``; a
                ``True`` column is prepended for the first token. A score
                ``(i, j)`` is kept only when both tokens ``i`` and ``j`` are
                unmasked.

        Returns:
            Tensor of shape ``(b, n, dim)``.
        """
        b, n, _ = x.shape
        h = self.heads

        # (b, n, h*d) -> (b, h, n, d) for each of q, k, v.
        q, k, v = (
            t.reshape(b, n, h, -1).transpose(1, 2)
            for t in self.to_qkv(x).chunk(3, dim = -1)
        )
        dots = torch.einsum('bhid,bhjd->bhij', q, k) * self.scale

        if mask is not None:
            mask_value = -torch.finfo(dots.dtype).max
            mask = F.pad(mask.flatten(1), (1, 0), value = True)
            assert mask.shape[-1] == dots.shape[-1], 'mask has incorrect dimensions'
            # Shape (b, 1, n, n) so the mask broadcasts over the head axis. A
            # (b, n, n) mask would be right-aligned against (h, n, n) and only
            # line up when b == 1 (or, wrongly, when b == h).
            pair_mask = mask[:, None, None, :] * mask[:, None, :, None]
            dots = dots.masked_fill(~pair_mask, mask_value)

        attn = dots.softmax(dim=-1)

        out = torch.einsum('bhij,bhjd->bhid', attn, v)
        # (b, h, n, d) -> (b, n, h*d)
        out = out.transpose(1, 2).reshape(b, n, -1)
        return self.to_out(out)

In [14]:
class Transformer(nn.Module):
    """Stack of ``depth`` pre-norm encoder layers.

    Each layer is a residual attention block followed by a residual
    feed-forward block; both normalise their input with LayerNorm first.
    """

    def __init__(self, dim, depth, heads, dim_head, mlp_dim, dropout):
        super().__init__()
        blocks = []
        for _ in range(depth):
            attn_block = Residual(PreNorm(dim, Attention(dim, heads = heads, dim_head = dim_head, dropout = dropout)))
            ff_block = Residual(PreNorm(dim, FeedForward(dim, mlp_dim, dropout = dropout)))
            blocks.append(nn.ModuleList([attn_block, ff_block]))
        self.layers = nn.ModuleList(blocks)

    def forward(self, x, mask = None):
        """Run ``x`` through every layer; ``mask`` is forwarded to attention only."""
        for attend, feed_forward in self.layers:
            x = feed_forward(attend(x, mask = mask))
        return x

In [15]:
class ViTs_face(nn.Module):
    """Vision Transformer backbone with overlapping ("soft split") patches.

    Patches are extracted with ``nn.Unfold`` using a kernel of side
    ``ac_patch_size``, a stride of ``patch_size`` and ``pad`` pixels of
    padding. They are linearly embedded, prefixed with a class token, given a
    positional embedding and passed through the transformer. The returned
    embedding is the LayerNorm of the mean over the patch tokens (the class
    token is excluded from the mean).

    ``pool`` is validated and stored, but ``forward`` does not read it.
    When ``loss_type`` is ``'CosFace'`` a ``CosFace`` head is attached as
    ``self.loss``; for ``'None'`` a message is printed and no head is created.
    """

    def __init__(self, *, loss_type, GPU_ID, num_class, image_size, patch_size, ac_patch_size,
                         pad, dim, depth, heads, mlp_dim, pool = 'mean', channels = 3, dim_head = 64, dropout = 0., emb_dropout = 0.):
        super().__init__()
        assert image_size % patch_size == 0, 'Image dimensions must be divisible by the patch size.'
        grid_side = image_size // patch_size
        num_patches = grid_side ** 2
        assert num_patches > MIN_NUM_PATCHES, f'your number of patches ({num_patches}) is way too small for attention to be effective (at least 16). Try decreasing your patch size'
        assert pool in {'cls', 'mean'}, 'pool type must be either cls (cls token) or mean (mean pooling)'

        self.patch_size = patch_size
        window = (ac_patch_size, ac_patch_size)
        self.soft_split = nn.Unfold(kernel_size=window, stride=(patch_size, patch_size), padding=(pad, pad))

        # One positional slot per patch plus one for the class token.
        self.pos_embedding = nn.Parameter(torch.randn(1, num_patches + 1, dim))
        flat_patch_size = channels * ac_patch_size ** 2
        self.patch_to_embedding = nn.Linear(flat_patch_size, dim)
        self.cls_token = nn.Parameter(torch.randn(1, 1, dim))
        self.dropout = nn.Dropout(emb_dropout)

        self.transformer = Transformer(dim, depth, heads, dim_head, mlp_dim, dropout)

        self.pool = pool
        self.to_latent = nn.Identity()
        self.mlp_head = nn.Sequential(nn.LayerNorm(dim))

        self.loss_type = loss_type
        self.GPU_ID = GPU_ID
        if loss_type == 'None':
            print("no loss for vit_face")
        elif loss_type == 'CosFace':
            self.loss = CosFace(in_features=dim, out_features=num_class, device_id=GPU_ID)

    def forward(self, img, label= None , mask = None):
        """Embed ``img``; with ``label`` also return the loss-head output.

        Returns:
            ``emb`` when ``label`` is None, otherwise ``(self.loss(emb, label), emb)``.
        """
        patches = self.soft_split(img).transpose(1, 2)
        tokens = self.patch_to_embedding(patches)
        batch, n_patches, _ = tokens.shape

        cls_tokens = repeat(self.cls_token, '() n d -> b n d', b = batch)
        tokens = torch.cat((cls_tokens, tokens), dim=1)
        tokens += self.pos_embedding[:, :(n_patches + 1)]
        tokens = self.dropout(tokens)
        tokens = self.transformer(tokens, mask)

        # Mean over the patch tokens only; index 0 is the class token.
        pooled = tokens[:, 1:].mean(dim = 1)
        emb = self.mlp_head(self.to_latent(pooled))

        if label is None:
            return emb
        return self.loss(emb, label), emb

In [16]:
class ViT_plus(nn.Module):
    """Small head applied to 512-d embeddings.

    ``fc1`` maps 512 -> 512; its output is returned as the first element.
    ``fc2`` maps that output to 2 logits, returned as the second element.
    """

    def __init__(self):
        super().__init__()
        self.fc1 = nn.Linear(512, 512)
        self.fc2 = nn.Linear(512, 2)

    def forward(self, x):
        """Return ``(fc1(x), fc2(fc1(x)))``."""
        projected = self.fc1(x)
        logits = self.fc2(projected)
        return projected, logits

In [17]:
# Build the ViT backbone and restore its weights from the checkpoint file.
# 12x12 patches taken with stride 8 and padding 4 on 112x112 inputs;
# num_class sets the number of rows of the CosFace head's weight matrix.
# NOTE(review): these hyper-parameters presumably have to match the ones the
# checkpoint was trained with — confirm before changing any of them.
model = ViTs_face(
            loss_type='CosFace',
            GPU_ID=[device],
            num_class=93431,
            image_size=112,
            patch_size=8,
            ac_patch_size=12,
            pad=4,
            dim=512,
            depth=20,
            heads=8,
            mlp_dim=2048,
            dropout=0.1,
            emb_dropout=0.1
        ).to(device)
# map_location places the checkpoint tensors on the selected device while loading.
model.load_state_dict(
    torch.load("../Backbone_VITs_Epoch_2_Batch_12000_Time_2021-03-17-04-05_checkpoint.pth", map_location=device)
)

self.device_id [device(type='cuda', index=0)]


<All keys matched successfully>

In [18]:
# Freeze the backbone: none of its parameters will receive gradients.
for param in model.parameters():
    param.requires_grad = False

In [19]:
# Pre-compute the backbone embedding of every train/val image once, keyed by
# file name. Each entry keeps its leading batch dimension of 1.
embeds = {}
model.eval()

with torch.no_grad():
    for annot_file in ("../train.csv", "../val.csv"):
        # Use dedicated plain-mode datasets: this loop unpacks 3-tuples, while
        # train_data/val_data may already have been rebound to triplet mode
        # (7-tuples) by the time this cell runs top to bottom.
        plain_data = AdienceDataset(annot_file, "../cropped_Adience/", train=False)
        for img, _label, file in plain_data:
            embeds[file] = model(torch.unsqueeze(img.to(device), 0))

In [21]:
# Best final validation accuracy seen so far across trials in this kernel.
best_accu = 0.0


def _run_epoch(model_xtr, loader, criterion, optimizer=None, desc=None):
    """Run one pass over ``loader`` and return ``(mean_loss, accuracy)``.

    Trains when ``optimizer`` is given, otherwise evaluates without gradients.
    Both metrics are weighted by the number of samples, so a smaller final
    batch does not count as much as a full one.
    """
    training = optimizer is not None
    model_xtr.train(training)

    loss_sum, n_correct, n_seen = 0.0, 0, 0
    with torch.set_grad_enabled(training):
        # The image tensors produced by the dataset are not needed here: the
        # head is trained on the cached backbone embeddings looked up by file
        # name, so the images are never copied to the device.
        for _img, _pos_img, _neg_img, label, img_file, pos_file, neg_file in tqdm(loader, desc=desc, leave=False):
            label = label.to(device)

            x1 = file_to_embed(embeds, img_file)
            x2 = file_to_embed(embeds, pos_file)
            x3 = file_to_embed(embeds, neg_file)

            if training:
                optimizer.zero_grad()
            anchor, output = model_xtr(x1)
            pos, _ = model_xtr(x2)
            neg, _ = model_xtr(x3)

            loss = criterion(anchor, pos, neg, output, label)
            if training:
                loss.backward()
                optimizer.step()

            batch_n = label.size(0)
            loss_sum += loss.item() * batch_n
            n_correct += torch.eq(torch.argmax(output, 1), label).sum().item()
            n_seen += batch_n

    if n_seen == 0:
        return float("nan"), float("nan")
    return loss_sum / n_seen, n_correct / n_seen


def objective(trial):
    """Optuna objective: train a ``ViT_plus`` head and return its validation accuracy.

    Samples the learning rate, weight decay, AdamW epsilon, batch size and
    number of epochs. Validation accuracy is reported after every epoch so the
    trial can be pruned. When a trial runs to completion and its final
    validation accuracy beats ``best_accu``, the head's weights are saved.

    Args:
        trial: the ``optuna`` trial supplying the hyper-parameters.

    Returns:
        Validation accuracy after the last epoch.

    Raises:
        optuna.exceptions.TrialPruned: when the pruner stops the trial.
    """
    global best_accu

    model_xtr = ViT_plus().to(device)

    lr = trial.suggest_float("learning_rate", 1e-5, 1e-1, log=True)
    wd = trial.suggest_float('weight_decay', 1e-4, 1e-2, log=True)
    eps = trial.suggest_float("epsilon", 1e-9, 1e-7, log=True)
    optimizer = opt.AdamW(model_xtr.parameters(), lr=lr, eps=eps, weight_decay=wd)

    criterion = CombinedLoss().to(device)

    batch_size = trial.suggest_int('batch_size', 50, 300)
    num_epochs = trial.suggest_int('epochs', 10, 100)

    print("Learning rate: "+ str(lr))
    print("Weight decay: "+ str(wd))
    print("Epsilon: "+ str(eps))
    print("Batch size: "+ str(batch_size))
    print("Number of epochs: "+ str(num_epochs))

    # The loaders do not change between epochs; a shuffling loader draws a new
    # order every time it is iterated.
    train_loader = DataLoader(train_data, batch_size=batch_size, shuffle=True, num_workers=4)
    val_loader = DataLoader(val_data, batch_size=batch_size, shuffle=False, num_workers=4)

    val_accu = float("nan")
    for epoch in tqdm(range(num_epochs), desc="Epochs"):
        train_loss, train_accu = _run_epoch(model_xtr, train_loader, criterion, optimizer, desc="Training")
        print("Epoch: {}/{} - Loss: {:.4f} - Accuracy: {:.4f}".format(epoch+1, num_epochs, train_loss, train_accu))

        val_loss, val_accu = _run_epoch(model_xtr, val_loader, criterion, desc="Validation")
        print("Val Loss: {:.4f} - Val Accuracy: {:.4f}".format(val_loss, val_accu))

        trial.report(val_accu, epoch)
        if trial.should_prune():
            raise optuna.exceptions.TrialPruned()

    if val_accu > best_accu:
        best_accu = val_accu
        print("Saving best model...")
        torch.save(model_xtr.state_dict(), "../vit_12-8_triplet_mean_only.pt")

    return val_accu

In [22]:
# Create the study in a local SQLite database, or load it when a study with
# this name already exists there, and maximise the value returned by
# `objective` over 20 trials.
study = optuna.create_study(direction='maximize',
                            study_name='triplet-12-8-mean-only-vit-study',
                            storage='sqlite:///study.db',
                            load_if_exists=True)
study.optimize(objective, n_trials=20)

pruned_trials = study.get_trials(deepcopy=False, states=[TrialState.PRUNED])
complete_trials = study.get_trials(deepcopy=False, states=[TrialState.COMPLETE])

# Display the study statistics
print("\nStudy statistics: ")
# len(study.trials) counts every trial stored in the study, whatever its state.
print("  Number of finished trials: ", len(study.trials))
print("  Number of pruned trials: ", len(pruned_trials))
print("  Number of complete trials: ", len(complete_trials))

[32m[I 2023-12-14 21:51:40,224][0m A new study created in RDB with name: triplet-12-8-mean-only-vit-study[0m


Learning rate: 0.00035883062711026257
Weight decay: 0.0010839916629925644
Epsilon: 4.615406108202454e-09
Batch size: 94
Number of epochs: 56


Epochs:   0%|          | 0/56 [00:00<?, ?it/s]
Training:   0%|          | 0/149 [00:00<?, ?it/s][A
Training:   1%|          | 1/149 [00:02<07:00,  2.84s/it][A
Training:   2%|▏         | 3/149 [00:02<01:53,  1.29it/s][A
Training:   3%|▎         | 5/149 [00:04<02:06,  1.13it/s][A
Training:   5%|▌         | 8/149 [00:05<01:01,  2.29it/s][A
Training:   7%|▋         | 10/149 [00:07<01:30,  1.54it/s][A
Training:   8%|▊         | 12/149 [00:07<01:02,  2.18it/s][A
Training:   9%|▉         | 14/149 [00:09<01:28,  1.53it/s][A
Training:  11%|█▏        | 17/149 [00:11<01:21,  1.62it/s][A
Training:  12%|█▏        | 18/149 [00:11<01:18,  1.67it/s][A
Training:  14%|█▍        | 21/149 [00:13<01:14,  1.72it/s][A
Training:  15%|█▍        | 22/149 [00:13<01:11,  1.78it/s][A
Training:  16%|█▌        | 24/149 [00:13<00:49,  2.51it/s][A
Training:  17%|█▋        | 25/149 [00:15<01:16,  1.63it/s][A
Training:  17%|█▋        | 26/149 [00:16<01:15,  1.63it/s][A
Training:  19%|█▉        | 28/149 [0

Epoch: 1/56 - Loss: 3.4106 - Accuracy: 0.8272



  0%|          | 0/19 [00:00<?, ?it/s][A
  5%|▌         | 1/19 [00:02<00:48,  2.68s/it][A
 26%|██▋       | 5/19 [00:04<00:11,  1.17it/s][A
 42%|████▏     | 8/19 [00:04<00:05,  2.15it/s][A
 53%|█████▎    | 10/19 [00:07<00:05,  1.54it/s][A
 68%|██████▊   | 13/19 [00:09<00:04,  1.50it/s][A
100%|██████████| 19/19 [00:11<00:00,  1.68it/s][A
Epochs:   2%|▏         | 1/56 [01:31<1:24:13, 91.88s/it]

Val Loss: 2.1302 - Val Accuracy: 0.9099



Training:   0%|          | 0/149 [00:00<?, ?it/s][A
Training:   1%|          | 1/149 [00:02<06:22,  2.59s/it][A
Training:   3%|▎         | 4/149 [00:02<01:16,  1.90it/s][A
Training:   4%|▍         | 6/149 [00:04<01:47,  1.34it/s][A
Training:   6%|▌         | 9/149 [00:06<01:41,  1.38it/s][A
Training:   9%|▊         | 13/149 [00:09<01:25,  1.58it/s][A
Training:  11%|█         | 16/149 [00:09<00:58,  2.29it/s][A
Training:  11%|█▏        | 17/149 [00:11<01:24,  1.57it/s][A
Training:  13%|█▎        | 19/149 [00:11<01:02,  2.06it/s][A
Training:  14%|█▍        | 21/149 [00:13<01:21,  1.58it/s][A
Training:  15%|█▌        | 23/149 [00:13<01:00,  2.07it/s][A
Training:  17%|█▋        | 25/149 [00:15<01:20,  1.54it/s][A
Training:  18%|█▊        | 27/149 [00:15<00:59,  2.05it/s][A
Training:  19%|█▉        | 29/149 [00:17<01:15,  1.58it/s][A
Training:  21%|██        | 31/149 [00:17<00:54,  2.16it/s][A
Training:  22%|██▏       | 33/149 [00:19<01:11,  1.62it/s][A
Training:  23%|██▎  

Epoch: 2/56 - Loss: 1.7012 - Accuracy: 0.9165



  0%|          | 0/19 [00:00<?, ?it/s][A
  5%|▌         | 1/19 [00:02<00:41,  2.33s/it][A
 16%|█▌        | 3/19 [00:02<00:10,  1.55it/s][A
 26%|██▋       | 5/19 [00:04<00:10,  1.30it/s][A
 37%|███▋      | 7/19 [00:04<00:06,  1.98it/s][A
 47%|████▋     | 9/19 [00:06<00:06,  1.61it/s][A
 58%|█████▊    | 11/19 [00:06<00:03,  2.08it/s][A
 68%|██████▊   | 13/19 [00:08<00:03,  1.68it/s][A
 79%|███████▉  | 15/19 [00:08<00:01,  2.19it/s][A
100%|██████████| 19/19 [00:10<00:00,  1.84it/s][A
Epochs:   4%|▎         | 2/56 [03:03<1:22:45, 91.96s/it]

Val Loss: 1.6311 - Val Accuracy: 0.9216



Training:   0%|          | 0/149 [00:00<?, ?it/s][A
Training:   1%|          | 1/149 [00:02<06:31,  2.65s/it][A
Training:   3%|▎         | 5/149 [00:04<02:02,  1.18it/s][A
Training:   5%|▌         | 8/149 [00:04<01:05,  2.16it/s][A
Training:   7%|▋         | 10/149 [00:06<01:29,  1.56it/s][A
Training:   9%|▊         | 13/149 [00:09<01:31,  1.49it/s][A
Training:  11%|█▏        | 17/149 [00:11<01:20,  1.65it/s][A
Training:  14%|█▍        | 21/149 [00:13<01:12,  1.78it/s][A
Training:  15%|█▌        | 23/149 [00:13<00:57,  2.20it/s][A
Training:  17%|█▋        | 25/149 [00:15<01:12,  1.71it/s][A
Training:  17%|█▋        | 26/149 [00:15<01:08,  1.79it/s][A
Training:  19%|█▉        | 29/149 [00:17<01:06,  1.82it/s][A
Training:  20%|██        | 30/149 [00:17<01:03,  1.89it/s][A
Training:  22%|██▏       | 33/149 [00:19<01:03,  1.82it/s][A
Training:  23%|██▎       | 34/149 [00:20<01:06,  1.74it/s][A
Training:  25%|██▍       | 37/149 [00:21<00:57,  1.95it/s][A
Training:  26%|██▌ 

Epoch: 3/56 - Loss: 1.3471 - Accuracy: 0.9273



  0%|          | 0/19 [00:00<?, ?it/s][A
  5%|▌         | 1/19 [00:02<00:36,  2.05s/it][A
 26%|██▋       | 5/19 [00:03<00:08,  1.57it/s][A
 37%|███▋      | 7/19 [00:03<00:05,  2.39it/s][A
 47%|████▋     | 9/19 [00:05<00:05,  1.84it/s][A
 53%|█████▎    | 10/19 [00:05<00:04,  2.18it/s][A
 68%|██████▊   | 13/19 [00:06<00:02,  2.06it/s][A
 79%|███████▉  | 15/19 [00:07<00:01,  2.79it/s][A
 89%|████████▉ | 17/19 [00:08<00:00,  2.17it/s][A
100%|██████████| 19/19 [00:08<00:00,  2.18it/s][A
Epochs:   5%|▌         | 3/56 [04:24<1:16:36, 86.73s/it]

Val Loss: 1.1306 - Val Accuracy: 0.9328



Training:   0%|          | 0/149 [00:00<?, ?it/s][A
Training:   1%|          | 1/149 [00:02<05:37,  2.28s/it][A
Training:   2%|▏         | 3/149 [00:02<01:31,  1.59it/s][A
Training:   3%|▎         | 5/149 [00:03<01:40,  1.44it/s][A
Training:   4%|▍         | 6/149 [00:04<01:19,  1.80it/s][A
Training:   6%|▌         | 9/149 [00:05<01:16,  1.84it/s][A
Training:   7%|▋         | 10/149 [00:05<01:07,  2.04it/s][A
Training:   9%|▊         | 13/149 [00:07<01:07,  2.01it/s][A
Training:   9%|▉         | 14/149 [00:07<01:01,  2.20it/s][A
Training:  11%|█▏        | 17/149 [00:09<01:03,  2.07it/s][A
Training:  12%|█▏        | 18/149 [00:09<00:59,  2.19it/s][A
Training:  14%|█▍        | 21/149 [00:11<01:00,  2.11it/s][A
Training:  15%|█▍        | 22/149 [00:11<00:57,  2.20it/s][A
Training:  17%|█▋        | 25/149 [00:13<01:00,  2.05it/s][A
Training:  17%|█▋        | 26/149 [00:13<00:54,  2.26it/s][A
Training:  19%|█▉        | 29/149 [00:14<00:56,  2.12it/s][A
Training:  20%|██    

Epoch: 4/56 - Loss: 1.1308 - Accuracy: 0.9349



  0%|          | 0/19 [00:00<?, ?it/s][A
  5%|▌         | 1/19 [00:01<00:33,  1.84s/it][A
 21%|██        | 4/19 [00:01<00:05,  2.63it/s][A
 32%|███▏      | 6/19 [00:03<00:06,  1.89it/s][A
 47%|████▋     | 9/19 [00:04<00:05,  1.96it/s][A
 53%|█████▎    | 10/19 [00:04<00:03,  2.29it/s][A
 68%|██████▊   | 13/19 [00:06<00:02,  2.08it/s][A
 84%|████████▍ | 16/19 [00:06<00:00,  3.23it/s][A
100%|██████████| 19/19 [00:08<00:00,  2.28it/s][A
Epochs:   7%|▋         | 4/56 [05:40<1:11:39, 82.68s/it]

Val Loss: 1.0809 - Val Accuracy: 0.9328



Training:   0%|          | 0/149 [00:00<?, ?it/s][A
Training:   1%|          | 1/149 [00:02<05:09,  2.09s/it][A
Training:   2%|▏         | 3/149 [00:02<01:28,  1.65it/s][A
Training:   3%|▎         | 5/149 [00:03<01:38,  1.47it/s][A
Training:   5%|▍         | 7/149 [00:03<01:00,  2.34it/s][A
Training:   6%|▌         | 9/149 [00:05<01:17,  1.80it/s][A
Training:   7%|▋         | 10/149 [00:05<01:05,  2.14it/s][A
Training:   9%|▊         | 13/149 [00:06<00:59,  2.27it/s][A
Training:   9%|▉         | 14/149 [00:07<00:53,  2.53it/s][A
Training:  11%|█▏        | 17/149 [00:08<00:52,  2.51it/s][A
Training:  12%|█▏        | 18/149 [00:08<00:48,  2.69it/s][A
Training:  14%|█▍        | 21/149 [00:09<00:48,  2.64it/s][A
Training:  15%|█▍        | 22/149 [00:09<00:46,  2.73it/s][A
Training:  17%|█▋        | 25/149 [00:10<00:42,  2.91it/s][A
Training:  17%|█▋        | 26/149 [00:11<00:43,  2.83it/s][A
Training:  19%|█▉        | 29/149 [00:12<00:42,  2.84it/s][A
Training:  20%|██    

Epoch: 5/56 - Loss: 1.0286 - Accuracy: 0.9356



  0%|          | 0/19 [00:00<?, ?it/s][A
  5%|▌         | 1/19 [00:01<00:29,  1.64s/it][A
 26%|██▋       | 5/19 [00:02<00:06,  2.05it/s][A
 42%|████▏     | 8/19 [00:02<00:02,  3.68it/s][A
 53%|█████▎    | 10/19 [00:04<00:03,  2.74it/s][A
 68%|██████▊   | 13/19 [00:05<00:02,  2.53it/s][A
 79%|███████▉  | 15/19 [00:05<00:01,  3.31it/s][A
100%|██████████| 19/19 [00:06<00:00,  2.89it/s][A
Epochs:   9%|▉         | 5/56 [06:41<1:03:30, 74.72s/it]

Val Loss: 0.9759 - Val Accuracy: 0.9354



Training:   0%|          | 0/149 [00:00<?, ?it/s][A
Training:   1%|          | 1/149 [00:01<04:06,  1.66s/it][A
Training:   3%|▎         | 4/149 [00:01<00:50,  2.87it/s][A
Training:   4%|▍         | 6/149 [00:03<01:07,  2.11it/s][A
Training:   6%|▌         | 9/149 [00:04<01:06,  2.09it/s][A
Training:   7%|▋         | 11/149 [00:04<00:47,  2.90it/s][A
Training:   9%|▊         | 13/149 [00:06<01:02,  2.19it/s][A
Training:  11%|█▏        | 17/149 [00:07<00:52,  2.53it/s][A
Training:  14%|█▍        | 21/149 [00:08<00:48,  2.63it/s][A
Training:  17%|█▋        | 25/149 [00:10<00:46,  2.69it/s][A
Training:  19%|█▉        | 29/149 [00:11<00:44,  2.68it/s][A
Training:  22%|██▏       | 33/149 [00:13<00:41,  2.77it/s][A
Training:  25%|██▍       | 37/149 [00:14<00:40,  2.77it/s][A
Training:  28%|██▊       | 41/149 [00:16<00:39,  2.72it/s][A
Training:  30%|███       | 45/149 [00:17<00:38,  2.74it/s][A
Training:  33%|███▎      | 49/149 [00:18<00:35,  2.80it/s][A
Training:  36%|███▌ 

Epoch: 6/56 - Loss: 0.9461 - Accuracy: 0.9353



  0%|          | 0/19 [00:00<?, ?it/s][A
  5%|▌         | 1/19 [00:01<00:22,  1.26s/it][A
 26%|██▋       | 5/19 [00:02<00:05,  2.47it/s][A
 47%|████▋     | 9/19 [00:03<00:03,  3.32it/s][A
 68%|██████▊   | 13/19 [00:04<00:01,  3.58it/s][A
100%|██████████| 19/19 [00:05<00:00,  3.73it/s][A
Epochs:  11%|█         | 6/56 [07:33<55:43, 66.87s/it]  

Val Loss: 0.8814 - Val Accuracy: 0.9342



Training:   0%|          | 0/149 [00:00<?, ?it/s][A
Training:   1%|          | 1/149 [00:01<03:12,  1.30s/it][A
Training:   3%|▎         | 5/149 [00:02<01:02,  2.32it/s][A
Training:   6%|▌         | 9/149 [00:03<00:48,  2.87it/s][A
Training:   9%|▊         | 13/149 [00:04<00:41,  3.25it/s][A
Training:  11%|█▏        | 17/149 [00:05<00:39,  3.38it/s][A
Training:  14%|█▍        | 21/149 [00:06<00:36,  3.52it/s][A
Training:  17%|█▋        | 25/149 [00:07<00:33,  3.67it/s][A
Training:  19%|█▉        | 29/149 [00:08<00:33,  3.63it/s][A
Training:  22%|██▏       | 33/149 [00:09<00:31,  3.69it/s][A
Training:  25%|██▍       | 37/149 [00:10<00:29,  3.75it/s][A
Training:  28%|██▊       | 41/149 [00:12<00:29,  3.70it/s][A
Training:  30%|███       | 45/149 [00:13<00:27,  3.73it/s][A
Training:  33%|███▎      | 49/149 [00:14<00:26,  3.76it/s][A
Training:  36%|███▌      | 53/149 [00:15<00:26,  3.68it/s][A
Training:  38%|███▊      | 57/149 [00:16<00:23,  3.84it/s][A
Training:  41%|████

Epoch: 7/56 - Loss: 0.9016 - Accuracy: 0.9358



  0%|          | 0/19 [00:00<?, ?it/s][A
  5%|▌         | 1/19 [00:01<00:23,  1.30s/it][A
 26%|██▋       | 5/19 [00:02<00:05,  2.66it/s][A
 42%|████▏     | 8/19 [00:02<00:02,  4.66it/s][A
 53%|█████▎    | 10/19 [00:03<00:02,  3.36it/s][A
 68%|██████▊   | 13/19 [00:04<00:01,  3.28it/s][A
100%|██████████| 19/19 [00:05<00:00,  3.67it/s][A
Epochs:  12%|█▎        | 7/56 [08:18<48:56, 59.92s/it]

Val Loss: 0.9163 - Val Accuracy: 0.9328



Training:   0%|          | 0/149 [00:00<?, ?it/s][A
Training:   1%|          | 1/149 [00:01<03:27,  1.40s/it][A
Training:   3%|▎         | 5/149 [00:02<01:03,  2.26it/s][A
Training:   6%|▌         | 9/149 [00:03<00:46,  3.01it/s][A
Training:   9%|▊         | 13/149 [00:04<00:41,  3.26it/s][A
Training:  11%|█▏        | 17/149 [00:05<00:37,  3.55it/s][A
Training:  13%|█▎        | 20/149 [00:05<00:27,  4.74it/s][A
Training:  15%|█▍        | 22/149 [00:06<00:35,  3.62it/s][A
Training:  17%|█▋        | 25/149 [00:07<00:36,  3.37it/s][A
Training:  19%|█▉        | 28/149 [00:07<00:26,  4.65it/s][A
Training:  20%|██        | 30/149 [00:08<00:32,  3.66it/s][A
Training:  22%|██▏       | 33/149 [00:09<00:35,  3.28it/s][A
Training:  25%|██▍       | 37/149 [00:10<00:32,  3.46it/s][A
Training:  28%|██▊       | 41/149 [00:11<00:29,  3.61it/s][A
Training:  30%|███       | 45/149 [00:13<00:28,  3.62it/s][A
Training:  33%|███▎      | 49/149 [00:14<00:27,  3.69it/s][A
Training:  36%|███▌

Epoch: 8/56 - Loss: 0.8376 - Accuracy: 0.9423



  0%|          | 0/19 [00:00<?, ?it/s][A
  5%|▌         | 1/19 [00:01<00:25,  1.40s/it][A
 26%|██▋       | 5/19 [00:02<00:06,  2.28it/s][A
 47%|████▋     | 9/19 [00:03<00:03,  2.88it/s][A
 68%|██████▊   | 13/19 [00:04<00:01,  3.02it/s][A
100%|██████████| 19/19 [00:05<00:00,  3.28it/s][A
Epochs:  14%|█▍        | 8/56 [09:08<45:13, 56.54s/it]

Val Loss: 0.8527 - Val Accuracy: 0.9364



Training:   0%|          | 0/149 [00:00<?, ?it/s][A
Training:   1%|          | 1/149 [00:01<03:10,  1.28s/it][A
Training:   3%|▎         | 4/149 [00:01<00:39,  3.70it/s][A
Training:   4%|▍         | 6/149 [00:02<00:54,  2.63it/s][A
Training:   6%|▌         | 9/149 [00:03<00:53,  2.64it/s][A
Training:   9%|▊         | 13/149 [00:04<00:44,  3.06it/s][A
Training:  11%|█▏        | 17/149 [00:05<00:41,  3.17it/s][A
Training:  14%|█▍        | 21/149 [00:06<00:37,  3.41it/s][A
Training:  15%|█▌        | 23/149 [00:06<00:30,  4.12it/s][A
Training:  17%|█▋        | 25/149 [00:08<00:38,  3.20it/s][A
Training:  19%|█▉        | 28/149 [00:08<00:26,  4.51it/s][A
Training:  20%|██        | 30/149 [00:09<00:35,  3.39it/s][A
Training:  22%|██▏       | 33/149 [00:10<00:35,  3.31it/s][A
Training:  24%|██▍       | 36/149 [00:10<00:24,  4.66it/s][A
Training:  26%|██▌       | 38/149 [00:11<00:32,  3.41it/s][A
Training:  28%|██▊       | 41/149 [00:12<00:33,  3.26it/s][A
Training:  30%|███  

Epoch: 9/56 - Loss: 0.7984 - Accuracy: 0.9416



  0%|          | 0/19 [00:00<?, ?it/s][A
  5%|▌         | 1/19 [00:01<00:22,  1.26s/it][A
 26%|██▋       | 5/19 [00:02<00:05,  2.44it/s][A
 47%|████▋     | 9/19 [00:03<00:03,  3.26it/s][A
 68%|██████▊   | 13/19 [00:04<00:01,  3.52it/s][A
100%|██████████| 19/19 [00:05<00:00,  3.64it/s][A
Epochs:  16%|█▌        | 9/56 [09:54<41:52, 53.46s/it]

Val Loss: 0.9072 - Val Accuracy: 0.9316



Training:   0%|          | 0/149 [00:00<?, ?it/s][A
Training:   1%|          | 1/149 [00:01<03:30,  1.42s/it][A
Training:   3%|▎         | 5/149 [00:02<01:04,  2.24it/s][A
Training:   6%|▌         | 9/149 [00:03<00:51,  2.71it/s][A
Training:   9%|▊         | 13/149 [00:04<00:43,  3.14it/s][A
Training:  11%|█▏        | 17/149 [00:05<00:40,  3.26it/s][A
Training:  14%|█▍        | 21/149 [00:07<00:38,  3.35it/s][A
Training:  17%|█▋        | 25/149 [00:08<00:35,  3.54it/s][A
Training:  19%|█▉        | 29/149 [00:09<00:33,  3.54it/s][A
Training:  22%|██▏       | 33/149 [00:10<00:33,  3.41it/s][A
Training:  25%|██▍       | 37/149 [00:11<00:31,  3.60it/s][A
Training:  28%|██▊       | 41/149 [00:12<00:30,  3.55it/s][A
Training:  30%|███       | 45/149 [00:13<00:28,  3.61it/s][A
Training:  33%|███▎      | 49/149 [00:14<00:27,  3.69it/s][A
Training:  36%|███▌      | 53/149 [00:15<00:26,  3.64it/s][A
Training:  38%|███▊      | 57/149 [00:16<00:24,  3.71it/s][A
Training:  41%|████

Epoch: 10/56 - Loss: 0.7986 - Accuracy: 0.9408



  0%|          | 0/19 [00:00<?, ?it/s][A
  5%|▌         | 1/19 [00:01<00:32,  1.78s/it][A
 26%|██▋       | 5/19 [00:03<00:07,  1.76it/s][A
 47%|████▋     | 9/19 [00:04<00:04,  2.25it/s][A
 68%|██████▊   | 13/19 [00:05<00:02,  2.61it/s][A
100%|██████████| 19/19 [00:06<00:00,  2.76it/s][A
Epochs:  18%|█▊        | 10/56 [10:45<40:20, 52.63s/it]

Val Loss: 0.7772 - Val Accuracy: 0.9343



Training:   0%|          | 0/149 [00:00<?, ?it/s][A
Training:   1%|          | 1/149 [00:01<04:03,  1.64s/it][A
Training:   3%|▎         | 4/149 [00:01<00:49,  2.94it/s][A
Training:   4%|▍         | 6/149 [00:03<01:10,  2.03it/s][A
Training:   5%|▍         | 7/149 [00:03<00:58,  2.41it/s][A
Training:   6%|▌         | 9/149 [00:04<01:15,  1.85it/s][A
Training:   7%|▋         | 11/149 [00:04<00:52,  2.63it/s][A
Training:   9%|▊         | 13/149 [00:06<01:07,  2.03it/s][A
Training:  10%|█         | 15/149 [00:06<00:47,  2.82it/s][A
Training:  11%|█▏        | 17/149 [00:07<01:02,  2.13it/s][A
Training:  13%|█▎        | 19/149 [00:08<00:45,  2.86it/s][A
Training:  14%|█▍        | 21/149 [00:09<00:54,  2.35it/s][A
Training:  15%|█▌        | 23/149 [00:09<00:39,  3.17it/s][A
Training:  17%|█▋        | 25/149 [00:10<00:51,  2.39it/s][A
Training:  18%|█▊        | 27/149 [00:10<00:38,  3.20it/s][A
Training:  19%|█▉        | 29/149 [00:11<00:44,  2.70it/s][A
Training:  21%|██    

Epoch: 11/56 - Loss: 0.7631 - Accuracy: 0.9413



  0%|          | 0/19 [00:00<?, ?it/s][A
  5%|▌         | 1/19 [00:01<00:23,  1.30s/it][A
 26%|██▋       | 5/19 [00:02<00:05,  2.60it/s][A
 47%|████▋     | 9/19 [00:03<00:03,  3.21it/s][A
 68%|██████▊   | 13/19 [00:04<00:01,  3.57it/s][A
100%|██████████| 19/19 [00:05<00:00,  3.66it/s][A
Epochs:  20%|█▉        | 11/56 [11:35<38:47, 51.71s/it]

Val Loss: 0.8595 - Val Accuracy: 0.9344



Training:   0%|          | 0/149 [00:00<?, ?it/s][A
Training:   1%|          | 1/149 [00:01<03:24,  1.38s/it][A
Training:   3%|▎         | 5/149 [00:02<01:04,  2.22it/s][A
Training:   6%|▌         | 9/149 [00:03<00:48,  2.89it/s][A
Training:   9%|▊         | 13/149 [00:04<00:42,  3.22it/s][A
Training:  11%|█▏        | 17/149 [00:05<00:39,  3.36it/s][A
Training:  14%|█▍        | 21/149 [00:06<00:35,  3.60it/s][A
Training:  17%|█▋        | 25/149 [00:07<00:34,  3.58it/s][A
Training:  19%|█▉        | 29/149 [00:08<00:33,  3.61it/s][A
Training:  22%|██▏       | 33/149 [00:09<00:31,  3.71it/s][A
Training:  25%|██▍       | 37/149 [00:11<00:31,  3.61it/s][A
Training:  28%|██▊       | 41/149 [00:12<00:28,  3.76it/s][A
Training:  30%|███       | 45/149 [00:13<00:28,  3.70it/s][A
Training:  33%|███▎      | 49/149 [00:14<00:28,  3.56it/s][A
Training:  36%|███▌      | 53/149 [00:15<00:26,  3.65it/s][A
Training:  38%|███▊      | 57/149 [00:16<00:25,  3.61it/s][A
Training:  41%|████

Epoch: 12/56 - Loss: 0.7665 - Accuracy: 0.9387



  0%|          | 0/19 [00:00<?, ?it/s][A
  5%|▌         | 1/19 [00:01<00:23,  1.33s/it][A
 26%|██▋       | 5/19 [00:02<00:05,  2.57it/s][A
 47%|████▋     | 9/19 [00:03<00:03,  3.15it/s][A
 68%|██████▊   | 13/19 [00:04<00:01,  3.53it/s][A
100%|██████████| 19/19 [00:05<00:00,  3.59it/s][A
Epochs:  21%|██▏       | 12/56 [12:22<36:52, 50.28s/it]

Val Loss: 0.8774 - Val Accuracy: 0.9194



Training:   0%|          | 0/149 [00:00<?, ?it/s][A
Training:   1%|          | 1/149 [00:01<03:27,  1.40s/it][A
Training:   3%|▎         | 5/149 [00:02<01:05,  2.21it/s][A
Training:   6%|▌         | 9/149 [00:03<00:47,  2.92it/s][A
Training:   9%|▊         | 13/149 [00:04<00:43,  3.14it/s][A
Training:  11%|█▏        | 17/149 [00:05<00:40,  3.28it/s][A
Training:  14%|█▍        | 21/149 [00:06<00:36,  3.55it/s][A
Training:  17%|█▋        | 25/149 [00:07<00:34,  3.55it/s][A
Training:  19%|█▉        | 29/149 [00:08<00:33,  3.61it/s][A
Training:  22%|██▏       | 33/149 [00:10<00:31,  3.64it/s][A
Training:  25%|██▍       | 37/149 [00:11<00:31,  3.59it/s][A
Training:  28%|██▊       | 41/149 [00:12<00:29,  3.65it/s][A
Training:  30%|███       | 45/149 [00:13<00:27,  3.72it/s][A
Training:  33%|███▎      | 49/149 [00:14<00:27,  3.63it/s][A
Training:  36%|███▌      | 53/149 [00:15<00:25,  3.73it/s][A
Training:  38%|███▊      | 57/149 [00:16<00:25,  3.64it/s][A
Training:  41%|████

Epoch: 13/56 - Loss: 0.7337 - Accuracy: 0.9404



  0%|          | 0/19 [00:00<?, ?it/s][A
  5%|▌         | 1/19 [00:01<00:23,  1.32s/it][A
 26%|██▋       | 5/19 [00:02<00:05,  2.45it/s][A
 47%|████▋     | 9/19 [00:03<00:03,  2.82it/s][A
 68%|██████▊   | 13/19 [00:04<00:01,  3.04it/s][A
100%|██████████| 19/19 [00:05<00:00,  3.29it/s][A
Epochs:  23%|██▎       | 13/56 [13:09<35:21, 49.33s/it]

Val Loss: 0.8886 - Val Accuracy: 0.9262



Training:   0%|          | 0/149 [00:00<?, ?it/s][A
Training:   1%|          | 1/149 [00:01<03:25,  1.39s/it][A
Training:   3%|▎         | 5/149 [00:02<01:03,  2.27it/s][A
Training:   6%|▌         | 9/149 [00:03<00:49,  2.83it/s][A
Training:   9%|▊         | 13/149 [00:04<00:42,  3.19it/s][A
Training:  11%|█▏        | 17/149 [00:05<00:40,  3.29it/s][A
Training:  14%|█▍        | 21/149 [00:06<00:37,  3.41it/s][A
Training:  17%|█▋        | 25/149 [00:07<00:35,  3.51it/s][A
Training:  19%|█▉        | 29/149 [00:09<00:34,  3.49it/s][A
Training:  22%|██▏       | 33/149 [00:10<00:31,  3.65it/s][A
Training:  25%|██▍       | 37/149 [00:11<00:30,  3.64it/s][A
Training:  28%|██▊       | 41/149 [00:12<00:30,  3.60it/s][A
Training:  30%|███       | 45/149 [00:13<00:28,  3.70it/s][A
Training:  33%|███▎      | 49/149 [00:14<00:27,  3.64it/s][A
Training:  36%|███▌      | 53/149 [00:15<00:26,  3.60it/s][A
Training:  38%|███▊      | 57/149 [00:16<00:24,  3.69it/s][A
Training:  41%|████

Epoch: 14/56 - Loss: 0.7130 - Accuracy: 0.9406



  0%|          | 0/19 [00:00<?, ?it/s][A
  5%|▌         | 1/19 [00:01<00:22,  1.25s/it][A
 26%|██▋       | 5/19 [00:02<00:05,  2.48it/s][A
 47%|████▋     | 9/19 [00:03<00:03,  3.28it/s][A
 63%|██████▎   | 12/19 [00:03<00:01,  4.87it/s][A
 74%|███████▎  | 14/19 [00:04<00:01,  3.58it/s][A
100%|██████████| 19/19 [00:05<00:00,  3.57it/s][A
Epochs:  25%|██▌       | 14/56 [13:56<34:06, 48.74s/it]

Val Loss: 0.7947 - Val Accuracy: 0.9399



Training:   0%|          | 0/149 [00:00<?, ?it/s][A
Training:   1%|          | 1/149 [00:01<03:23,  1.38s/it][A
Training:   3%|▎         | 4/149 [00:01<00:42,  3.40it/s][A
Training:   4%|▍         | 6/149 [00:02<00:52,  2.71it/s][A
Training:   6%|▌         | 9/149 [00:03<00:51,  2.74it/s][A
Training:   7%|▋         | 10/149 [00:03<00:43,  3.17it/s][A
Training:   9%|▊         | 13/149 [00:04<00:43,  3.09it/s][A
Training:   9%|▉         | 14/149 [00:04<00:38,  3.49it/s][A
Training:  11%|█▏        | 17/149 [00:05<00:39,  3.35it/s][A
Training:  13%|█▎        | 19/149 [00:05<00:29,  4.41it/s][A
Training:  14%|█▍        | 21/149 [00:06<00:40,  3.16it/s][A
Training:  16%|█▌        | 24/149 [00:06<00:26,  4.79it/s][A
Training:  17%|█▋        | 26/149 [00:07<00:35,  3.45it/s][A
Training:  19%|█▉        | 29/149 [00:08<00:36,  3.25it/s][A
Training:  21%|██▏       | 32/149 [00:09<00:25,  4.65it/s][A
Training:  23%|██▎       | 34/149 [00:10<00:34,  3.36it/s][A
Training:  25%|██▍  

Epoch: 15/56 - Loss: 0.7065 - Accuracy: 0.9398



  0%|          | 0/19 [00:00<?, ?it/s][A
  5%|▌         | 1/19 [00:01<00:22,  1.23s/it][A
 26%|██▋       | 5/19 [00:02<00:05,  2.49it/s][A
 47%|████▋     | 9/19 [00:03<00:03,  3.17it/s][A
 68%|██████▊   | 13/19 [00:04<00:01,  3.58it/s][A
100%|██████████| 19/19 [00:05<00:00,  3.62it/s][A
Epochs:  27%|██▋       | 15/56 [14:43<32:50, 48.06s/it]

Val Loss: 0.7088 - Val Accuracy: 0.9325



Training:   0%|          | 0/149 [00:00<?, ?it/s][A
Training:   1%|          | 1/149 [00:01<03:32,  1.44s/it][A
Training:   3%|▎         | 5/149 [00:02<01:02,  2.31it/s][A
Training:   6%|▌         | 9/149 [00:03<00:48,  2.90it/s][A
Training:   9%|▊         | 13/149 [00:04<00:42,  3.17it/s][A
Training:  11%|█▏        | 17/149 [00:05<00:38,  3.45it/s][A
Training:  14%|█▍        | 21/149 [00:06<00:35,  3.57it/s][A
Training:  17%|█▋        | 25/149 [00:07<00:34,  3.60it/s][A
Training:  19%|█▉        | 29/149 [00:08<00:32,  3.69it/s][A
Training:  22%|██▏       | 33/149 [00:09<00:31,  3.63it/s][A
Training:  25%|██▍       | 37/149 [00:11<00:30,  3.62it/s][A
Training:  28%|██▊       | 41/149 [00:12<00:28,  3.76it/s][A
Training:  30%|███       | 45/149 [00:13<00:28,  3.69it/s][A
Training:  33%|███▎      | 49/149 [00:14<00:26,  3.78it/s][A
Training:  36%|███▌      | 53/149 [00:15<00:25,  3.76it/s][A
Training:  38%|███▊      | 57/149 [00:16<00:24,  3.69it/s][A
Training:  41%|████

Epoch: 16/56 - Loss: 0.7103 - Accuracy: 0.9421



  0%|          | 0/19 [00:00<?, ?it/s][A
  5%|▌         | 1/19 [00:01<00:22,  1.25s/it][A
 26%|██▋       | 5/19 [00:02<00:05,  2.46it/s][A
 47%|████▋     | 9/19 [00:03<00:03,  3.10it/s][A
 68%|██████▊   | 13/19 [00:04<00:01,  3.56it/s][A
100%|██████████| 19/19 [00:05<00:00,  3.58it/s][A
Epochs:  29%|██▊       | 16/56 [15:29<31:40, 47.51s/it]

Val Loss: 0.7957 - Val Accuracy: 0.9392



Training:   0%|          | 0/149 [00:00<?, ?it/s][A
Training:   1%|          | 1/149 [00:01<03:29,  1.42s/it][A
Training:   3%|▎         | 5/149 [00:02<01:02,  2.31it/s][A
Training:   5%|▌         | 8/149 [00:02<00:34,  4.06it/s][A
Training:   7%|▋         | 10/149 [00:03<00:44,  3.11it/s][A
Training:   9%|▊         | 13/149 [00:04<00:46,  2.92it/s][A
Training:  11%|█▏        | 17/149 [00:05<00:41,  3.21it/s][A
Training:  14%|█▍        | 21/149 [00:06<00:37,  3.41it/s][A
Training:  17%|█▋        | 25/149 [00:08<00:36,  3.39it/s][A
Training:  19%|█▉        | 29/149 [00:08<00:33,  3.59it/s][A
Training:  22%|██▏       | 33/149 [00:10<00:32,  3.57it/s][A
Training:  25%|██▍       | 37/149 [00:11<00:31,  3.59it/s][A
Training:  28%|██▊       | 41/149 [00:12<00:28,  3.74it/s][A
Training:  30%|███       | 45/149 [00:13<00:28,  3.66it/s][A
Training:  33%|███▎      | 49/149 [00:14<00:26,  3.78it/s][A
Training:  36%|███▌      | 53/149 [00:15<00:25,  3.72it/s][A
Training:  38%|███▊

Epoch: 17/56 - Loss: 0.6964 - Accuracy: 0.9376



  0%|          | 0/19 [00:00<?, ?it/s][A
  5%|▌         | 1/19 [00:01<00:24,  1.35s/it][A
 26%|██▋       | 5/19 [00:02<00:05,  2.50it/s][A
 47%|████▋     | 9/19 [00:03<00:03,  3.15it/s][A
 68%|██████▊   | 13/19 [00:04<00:01,  3.49it/s][A
100%|██████████| 19/19 [00:05<00:00,  3.59it/s][A
Epochs:  30%|███       | 17/56 [16:16<30:48, 47.40s/it]

Val Loss: 0.8040 - Val Accuracy: 0.9342



Training:   0%|          | 0/149 [00:00<?, ?it/s][A
Training:   1%|          | 1/149 [00:01<03:30,  1.42s/it][A
Training:   3%|▎         | 5/149 [00:02<01:06,  2.17it/s][A
Training:   6%|▌         | 9/149 [00:03<00:48,  2.91it/s][A
Training:   9%|▊         | 13/149 [00:04<00:44,  3.03it/s][A
Training:  11%|█▏        | 17/149 [00:05<00:41,  3.21it/s][A
Training:  14%|█▍        | 21/149 [00:06<00:36,  3.46it/s][A
Training:  17%|█▋        | 25/149 [00:08<00:35,  3.54it/s][A
Training:  19%|█▉        | 29/149 [00:09<00:33,  3.58it/s][A
Training:  22%|██▏       | 33/149 [00:10<00:31,  3.70it/s][A
Training:  25%|██▍       | 37/149 [00:11<00:30,  3.65it/s][A
Training:  28%|██▊       | 41/149 [00:12<00:29,  3.69it/s][A
Training:  30%|██▉       | 44/149 [00:12<00:22,  4.68it/s][A
Training:  31%|███       | 46/149 [00:13<00:26,  3.83it/s][A
Training:  33%|███▎      | 49/149 [00:14<00:29,  3.41it/s][A
Training:  36%|███▌      | 53/149 [00:15<00:27,  3.55it/s][A
Training:  38%|███▊

Epoch: 18/56 - Loss: 0.6786 - Accuracy: 0.9389



  0%|          | 0/19 [00:00<?, ?it/s][A
  5%|▌         | 1/19 [00:01<00:22,  1.28s/it][A
 21%|██        | 4/19 [00:01<00:04,  3.71it/s][A
 32%|███▏      | 6/19 [00:02<00:04,  2.99it/s][A
 47%|████▋     | 9/19 [00:03<00:03,  2.98it/s][A
 68%|██████▊   | 13/19 [00:04<00:01,  3.56it/s][A
100%|██████████| 19/19 [00:05<00:00,  3.55it/s][A
Epochs:  32%|███▏      | 18/56 [17:03<29:58, 47.33s/it]

Val Loss: 0.7962 - Val Accuracy: 0.9298



Training:   0%|          | 0/149 [00:00<?, ?it/s][A
Training:   1%|          | 1/149 [00:01<03:38,  1.48s/it][A
Training:   3%|▎         | 5/149 [00:02<01:03,  2.25it/s][A
Training:   5%|▌         | 8/149 [00:02<00:35,  3.99it/s][A
Training:   7%|▋         | 10/149 [00:03<00:49,  2.82it/s][A
Training:   9%|▊         | 13/149 [00:04<00:48,  2.81it/s][A
Training:  11%|█         | 16/149 [00:04<00:31,  4.17it/s][A
Training:  12%|█▏        | 18/149 [00:05<00:39,  3.31it/s][A
Training:  14%|█▍        | 21/149 [00:07<00:41,  3.06it/s][A
Training:  17%|█▋        | 25/149 [00:08<00:38,  3.25it/s][A
Training:  19%|█▉        | 29/149 [00:09<00:34,  3.46it/s][A
Training:  22%|██▏       | 33/149 [00:10<00:32,  3.55it/s][A
Training:  25%|██▍       | 37/149 [00:11<00:30,  3.61it/s][A
Training:  27%|██▋       | 40/149 [00:11<00:23,  4.63it/s][A
Training:  28%|██▊       | 42/149 [00:12<00:28,  3.75it/s][A
Training:  30%|███       | 45/149 [00:13<00:30,  3.36it/s][A
Training:  32%|███▏

Epoch: 19/56 - Loss: 0.6889 - Accuracy: 0.9409



  0%|          | 0/19 [00:00<?, ?it/s][A
  5%|▌         | 1/19 [00:01<00:22,  1.22s/it][A
 26%|██▋       | 5/19 [00:02<00:05,  2.45it/s][A
 47%|████▋     | 9/19 [00:03<00:03,  3.15it/s][A
 68%|██████▊   | 13/19 [00:04<00:01,  3.52it/s][A
100%|██████████| 19/19 [00:05<00:00,  3.59it/s][A
Epochs:  34%|███▍      | 19/56 [17:50<29:02, 47.10s/it]

Val Loss: 0.7860 - Val Accuracy: 0.9421



Training:   0%|          | 0/149 [00:00<?, ?it/s][A
Training:   1%|          | 1/149 [00:01<03:35,  1.46s/it][A
Training:   3%|▎         | 5/149 [00:02<01:02,  2.31it/s][A
Training:   6%|▌         | 9/149 [00:03<00:48,  2.88it/s][A
Training:   9%|▊         | 13/149 [00:04<00:44,  3.03it/s][A
Training:  11%|█▏        | 17/149 [00:05<00:39,  3.30it/s][A
Training:  14%|█▍        | 21/149 [00:07<00:39,  3.24it/s][A
Training:  17%|█▋        | 25/149 [00:08<00:37,  3.31it/s][A
Training:  19%|█▉        | 29/149 [00:09<00:34,  3.51it/s][A
Training:  22%|██▏       | 33/149 [00:10<00:32,  3.53it/s][A
Training:  25%|██▍       | 37/149 [00:11<00:31,  3.55it/s][A
Training:  28%|██▊       | 41/149 [00:12<00:29,  3.69it/s][A
Training:  30%|███       | 45/149 [00:13<00:28,  3.66it/s][A
Training:  33%|███▎      | 49/149 [00:14<00:27,  3.64it/s][A
Training:  36%|███▌      | 53/149 [00:15<00:25,  3.72it/s][A
Training:  38%|███▊      | 57/149 [00:16<00:25,  3.64it/s][A
Training:  41%|████

Epoch: 20/56 - Loss: 0.6730 - Accuracy: 0.9406



  0%|          | 0/19 [00:00<?, ?it/s][A
  5%|▌         | 1/19 [00:01<00:23,  1.33s/it][A
 26%|██▋       | 5/19 [00:02<00:05,  2.52it/s][A
 47%|████▋     | 9/19 [00:03<00:03,  3.07it/s][A
 68%|██████▊   | 13/19 [00:04<00:01,  3.37it/s][A
100%|██████████| 19/19 [00:05<00:00,  3.50it/s][A
Epochs:  36%|███▌      | 20/56 [18:37<28:20, 47.24s/it]

Val Loss: 0.8219 - Val Accuracy: 0.9214



Training:   0%|          | 0/149 [00:00<?, ?it/s][A
Training:   1%|          | 1/149 [00:01<03:38,  1.47s/it][A
Training:   3%|▎         | 5/149 [00:02<01:05,  2.19it/s][A
Training:   6%|▌         | 9/149 [00:03<00:47,  2.93it/s][A
Training:   9%|▊         | 13/149 [00:04<00:42,  3.16it/s][A
Training:  11%|█▏        | 17/149 [00:05<00:38,  3.39it/s][A
Training:  13%|█▎        | 19/149 [00:05<00:31,  4.12it/s][A
Training:  14%|█▍        | 21/149 [00:06<00:38,  3.36it/s][A
Training:  15%|█▌        | 23/149 [00:06<00:29,  4.22it/s][A
Training:  17%|█▋        | 25/149 [00:07<00:38,  3.20it/s][A
Training:  19%|█▉        | 28/149 [00:08<00:25,  4.68it/s][A
Training:  20%|██        | 30/149 [00:09<00:35,  3.38it/s][A
Training:  22%|██▏       | 33/149 [00:10<00:35,  3.31it/s][A
Training:  24%|██▍       | 36/149 [00:10<00:23,  4.72it/s][A
Training:  26%|██▌       | 38/149 [00:11<00:32,  3.40it/s][A
Training:  28%|██▊       | 41/149 [00:12<00:32,  3.28it/s][A
Training:  30%|██▉ 

Epoch: 21/56 - Loss: 0.6771 - Accuracy: 0.9393



  0%|          | 0/19 [00:00<?, ?it/s][A
  5%|▌         | 1/19 [00:01<00:23,  1.32s/it][A
 26%|██▋       | 5/19 [00:02<00:05,  2.43it/s][A
 47%|████▋     | 9/19 [00:03<00:03,  3.20it/s][A
 68%|██████▊   | 13/19 [00:04<00:01,  3.44it/s][A
100%|██████████| 19/19 [00:05<00:00,  3.53it/s][A
Epochs:  38%|███▊      | 21/56 [19:24<27:31, 47.18s/it]

Val Loss: 0.8176 - Val Accuracy: 0.9304



Training:   0%|          | 0/149 [00:00<?, ?it/s][A
Training:   1%|          | 1/149 [00:01<03:24,  1.38s/it][A
Training:   3%|▎         | 4/149 [00:01<00:42,  3.45it/s][A
Training:   4%|▍         | 6/149 [00:02<00:54,  2.63it/s][A
Training:   6%|▌         | 9/149 [00:03<00:55,  2.51it/s][A
Training:   8%|▊         | 12/149 [00:03<00:34,  4.01it/s][A
Training:   9%|▉         | 14/149 [00:04<00:43,  3.10it/s][A
Training:  11%|█▏        | 17/149 [00:05<00:44,  2.96it/s][A
Training:  13%|█▎        | 20/149 [00:06<00:30,  4.29it/s][A
Training:  15%|█▍        | 22/149 [00:07<00:37,  3.36it/s][A
Training:  17%|█▋        | 25/149 [00:08<00:38,  3.19it/s][A
Training:  19%|█▉        | 29/149 [00:09<00:36,  3.25it/s][A
Training:  22%|██▏       | 33/149 [00:10<00:33,  3.45it/s][A
Training:  23%|██▎       | 35/149 [00:10<00:27,  4.16it/s][A
Training:  25%|██▍       | 37/149 [00:11<00:33,  3.38it/s][A
Training:  28%|██▊       | 41/149 [00:12<00:31,  3.45it/s][A
Training:  29%|██▉  

Epoch: 22/56 - Loss: 0.6540 - Accuracy: 0.9396



  0%|          | 0/19 [00:00<?, ?it/s][A
  5%|▌         | 1/19 [00:01<00:21,  1.20s/it][A
 21%|██        | 4/19 [00:01<00:03,  3.92it/s][A
 32%|███▏      | 6/19 [00:02<00:04,  2.88it/s][A
 47%|████▋     | 9/19 [00:03<00:03,  2.91it/s][A
 68%|██████▊   | 13/19 [00:04<00:01,  3.47it/s][A
100%|██████████| 19/19 [00:05<00:00,  3.60it/s][A
Epochs:  39%|███▉      | 22/56 [20:11<26:41, 47.09s/it]

Val Loss: 0.6752 - Val Accuracy: 0.9406



Training:   0%|          | 0/149 [00:00<?, ?it/s][A
Training:   1%|          | 1/149 [00:01<03:31,  1.43s/it][A
Training:   3%|▎         | 5/149 [00:02<01:04,  2.25it/s][A
Training:   6%|▌         | 9/149 [00:03<00:47,  2.92it/s][A
Training:   9%|▊         | 13/149 [00:04<00:43,  3.12it/s][A
Training:  11%|█▏        | 17/149 [00:05<00:39,  3.31it/s][A
Training:  14%|█▍        | 21/149 [00:06<00:36,  3.55it/s][A
Training:  17%|█▋        | 25/149 [00:07<00:35,  3.51it/s][A
Training:  19%|█▉        | 29/149 [00:08<00:33,  3.62it/s][A
Training:  21%|██▏       | 32/149 [00:09<00:25,  4.58it/s][A
Training:  22%|██▏       | 33/149 [00:10<00:34,  3.40it/s][A
Training:  24%|██▍       | 36/149 [00:10<00:24,  4.65it/s][A
Training:  26%|██▌       | 38/149 [00:11<00:30,  3.64it/s][A
Training:  27%|██▋       | 40/149 [00:11<00:24,  4.49it/s][A
Training:  28%|██▊       | 42/149 [00:12<00:30,  3.51it/s][A
Training:  30%|██▉       | 44/149 [00:12<00:23,  4.53it/s][A
Training:  31%|███ 

Epoch: 23/56 - Loss: 0.6605 - Accuracy: 0.9421



  0%|          | 0/19 [00:00<?, ?it/s][A
  5%|▌         | 1/19 [00:01<00:24,  1.35s/it][A
 26%|██▋       | 5/19 [00:02<00:05,  2.53it/s][A
 47%|████▋     | 9/19 [00:03<00:03,  3.15it/s][A
 68%|██████▊   | 13/19 [00:04<00:01,  3.51it/s][A
 84%|████████▍ | 16/19 [00:04<00:00,  4.84it/s][A
100%|██████████| 19/19 [00:05<00:00,  3.53it/s][A
Epochs:  41%|████      | 23/56 [20:58<25:51, 47.02s/it]

Val Loss: 0.7306 - Val Accuracy: 0.9323



Training:   0%|          | 0/149 [00:00<?, ?it/s][A
Training:   1%|          | 1/149 [00:01<03:35,  1.45s/it][A
Training:   3%|▎         | 5/149 [00:02<01:06,  2.18it/s][A
Training:   6%|▌         | 9/149 [00:03<00:47,  2.93it/s][A
Training:   9%|▊         | 13/149 [00:04<00:42,  3.17it/s][A
Training:  11%|█▏        | 17/149 [00:05<00:40,  3.29it/s][A
Training:  14%|█▍        | 21/149 [00:06<00:36,  3.47it/s][A
Training:  17%|█▋        | 25/149 [00:08<00:35,  3.49it/s][A
Training:  19%|█▉        | 29/149 [00:09<00:34,  3.48it/s][A
Training:  22%|██▏       | 33/149 [00:10<00:31,  3.65it/s][A
Training:  25%|██▍       | 37/149 [00:11<00:30,  3.62it/s][A
Training:  28%|██▊       | 41/149 [00:12<00:29,  3.64it/s][A
Training:  30%|███       | 45/149 [00:13<00:27,  3.74it/s][A
Training:  33%|███▎      | 49/149 [00:14<00:27,  3.70it/s][A
Training:  36%|███▌      | 53/149 [00:15<00:25,  3.72it/s][A
Training:  38%|███▊      | 57/149 [00:16<00:25,  3.65it/s][A
Training:  41%|████

Epoch: 24/56 - Loss: 0.6566 - Accuracy: 0.9408



  0%|          | 0/19 [00:00<?, ?it/s][A
  5%|▌         | 1/19 [00:01<00:21,  1.17s/it][A
 26%|██▋       | 5/19 [00:02<00:05,  2.59it/s][A
 47%|████▋     | 9/19 [00:03<00:03,  3.26it/s][A
 68%|██████▊   | 13/19 [00:04<00:01,  3.67it/s][A
100%|██████████| 19/19 [00:05<00:00,  3.70it/s][A
Epochs:  43%|████▎     | 24/56 [21:45<25:04, 47.02s/it]

Val Loss: 0.7668 - Val Accuracy: 0.9403



Training:   0%|          | 0/149 [00:00<?, ?it/s][A
Training:   1%|          | 1/149 [00:01<04:01,  1.63s/it][A
Training:   3%|▎         | 5/149 [00:02<01:06,  2.18it/s][A
Training:   6%|▌         | 9/149 [00:03<00:50,  2.75it/s][A
Training:   9%|▊         | 13/149 [00:04<00:45,  3.01it/s][A
Training:  11%|█▏        | 17/149 [00:05<00:39,  3.31it/s][A
Training:  14%|█▍        | 21/149 [00:07<00:37,  3.40it/s][A
Training:  17%|█▋        | 25/149 [00:08<00:37,  3.34it/s][A
Training:  19%|█▉        | 29/149 [00:09<00:34,  3.51it/s][A
Training:  22%|██▏       | 33/149 [00:10<00:33,  3.49it/s][A
Training:  25%|██▍       | 37/149 [00:11<00:32,  3.49it/s][A
Training:  28%|██▊       | 41/149 [00:12<00:29,  3.62it/s][A
Training:  30%|███       | 45/149 [00:13<00:29,  3.58it/s][A
Training:  33%|███▎      | 49/149 [00:14<00:28,  3.57it/s][A
Training:  36%|███▌      | 53/149 [00:15<00:26,  3.67it/s][A
Training:  38%|███▊      | 57/149 [00:17<00:25,  3.59it/s][A
Training:  41%|████

Epoch: 25/56 - Loss: 0.6655 - Accuracy: 0.9413



  0%|          | 0/19 [00:00<?, ?it/s][A
  5%|▌         | 1/19 [00:01<00:22,  1.25s/it][A
 21%|██        | 4/19 [00:01<00:04,  3.66it/s][A
 32%|███▏      | 6/19 [00:02<00:04,  2.84it/s][A
 47%|████▋     | 9/19 [00:03<00:03,  2.91it/s][A
 68%|██████▊   | 13/19 [00:04<00:01,  3.49it/s][A
100%|██████████| 19/19 [00:05<00:00,  3.60it/s][A
Epochs:  45%|████▍     | 25/56 [22:32<24:20, 47.10s/it]

Val Loss: 0.7616 - Val Accuracy: 0.9410



Training:   0%|          | 0/149 [00:00<?, ?it/s][A
Training:   1%|          | 1/149 [00:01<03:28,  1.41s/it][A
Training:   3%|▎         | 4/149 [00:01<00:42,  3.41it/s][A
Training:   4%|▍         | 6/149 [00:02<00:55,  2.59it/s][A
Training:   6%|▌         | 9/149 [00:03<00:50,  2.76it/s][A
Training:   8%|▊         | 12/149 [00:03<00:31,  4.34it/s][A
Training:   9%|▉         | 14/149 [00:04<00:43,  3.09it/s][A
Training:  11%|█▏        | 17/149 [00:05<00:42,  3.10it/s][A
Training:  12%|█▏        | 18/149 [00:05<00:38,  3.43it/s][A
Training:  14%|█▍        | 21/149 [00:06<00:40,  3.20it/s][A
Training:  16%|█▌        | 24/149 [00:07<00:26,  4.66it/s][A
Training:  17%|█▋        | 26/149 [00:08<00:36,  3.40it/s][A
Training:  19%|█▉        | 29/149 [00:08<00:35,  3.35it/s][A
Training:  21%|██▏       | 32/149 [00:09<00:25,  4.68it/s][A
Training:  23%|██▎       | 34/149 [00:10<00:33,  3.47it/s][A
Training:  25%|██▍       | 37/149 [00:11<00:34,  3.29it/s][A
Training:  26%|██▌  

Epoch: 26/56 - Loss: 0.6307 - Accuracy: 0.9426



  0%|          | 0/19 [00:00<?, ?it/s][A
  5%|▌         | 1/19 [00:01<00:23,  1.31s/it][A
 26%|██▋       | 5/19 [00:02<00:05,  2.62it/s][A
 47%|████▋     | 9/19 [00:03<00:03,  3.17it/s][A
 68%|██████▊   | 13/19 [00:04<00:01,  3.56it/s][A
100%|██████████| 19/19 [00:05<00:00,  3.64it/s][A
Epochs:  46%|████▋     | 26/56 [23:19<23:28, 46.95s/it]

Val Loss: 0.6822 - Val Accuracy: 0.9378



Training:   0%|          | 0/149 [00:00<?, ?it/s][A
Training:   1%|          | 1/149 [00:01<03:29,  1.41s/it][A
Training:   3%|▎         | 5/149 [00:02<01:05,  2.20it/s][A
Training:   6%|▌         | 9/149 [00:03<00:47,  2.94it/s][A
Training:   9%|▊         | 13/149 [00:04<00:43,  3.16it/s][A
Training:  11%|█▏        | 17/149 [00:05<00:38,  3.43it/s][A
Training:  14%|█▍        | 21/149 [00:06<00:37,  3.44it/s][A
Training:  17%|█▋        | 25/149 [00:07<00:35,  3.51it/s][A
Training:  17%|█▋        | 26/149 [00:08<00:33,  3.71it/s][A
Training:  19%|█▉        | 29/149 [00:08<00:33,  3.57it/s][A
Training:  21%|██        | 31/149 [00:09<00:27,  4.35it/s][A
Training:  22%|██▏       | 33/149 [00:10<00:34,  3.36it/s][A
Training:  23%|██▎       | 35/149 [00:10<00:26,  4.29it/s][A
Training:  25%|██▍       | 37/149 [00:11<00:34,  3.28it/s][A
Training:  26%|██▌       | 39/149 [00:11<00:26,  4.17it/s][A
Training:  28%|██▊       | 41/149 [00:12<00:32,  3.35it/s][A
Training:  30%|██▉ 

Epoch: 27/56 - Loss: 0.6710 - Accuracy: 0.9395



  0%|          | 0/19 [00:00<?, ?it/s][A
  5%|▌         | 1/19 [00:01<00:21,  1.18s/it][A
 26%|██▋       | 5/19 [00:02<00:06,  2.29it/s][A
 47%|████▋     | 9/19 [00:03<00:03,  2.96it/s][A
 63%|██████▎   | 12/19 [00:03<00:01,  4.41it/s][A
 74%|███████▎  | 14/19 [00:04<00:01,  3.15it/s][A
100%|██████████| 19/19 [00:05<00:00,  3.25it/s][A
Epochs:  48%|████▊     | 27/56 [24:07<22:51, 47.29s/it]

Val Loss: 0.7808 - Val Accuracy: 0.9338



Training:   0%|          | 0/149 [00:00<?, ?it/s][A
Training:   1%|          | 1/149 [00:01<04:06,  1.67s/it][A
Training:   3%|▎         | 5/149 [00:02<01:09,  2.06it/s][A
Training:   5%|▌         | 8/149 [00:02<00:38,  3.66it/s][A
Training:   7%|▋         | 10/149 [00:04<00:51,  2.68it/s][A
Training:   9%|▊         | 13/149 [00:05<00:52,  2.59it/s][A
Training:   9%|▉         | 14/149 [00:05<00:47,  2.87it/s][A
Training:  11%|█▏        | 17/149 [00:06<00:45,  2.93it/s][A
Training:  12%|█▏        | 18/149 [00:06<00:40,  3.25it/s][A
Training:  14%|█▍        | 21/149 [00:07<00:43,  2.95it/s][A
Training:  15%|█▍        | 22/149 [00:07<00:39,  3.23it/s][A
Training:  17%|█▋        | 25/149 [00:09<00:42,  2.91it/s][A
Training:  17%|█▋        | 26/149 [00:09<00:37,  3.25it/s][A
Training:  19%|█▉        | 29/149 [00:10<00:40,  2.98it/s][A
Training:  20%|██        | 30/149 [00:10<00:37,  3.21it/s][A
Training:  22%|██▏       | 33/149 [00:11<00:35,  3.23it/s][A
Training:  23%|██▎ 

Epoch: 28/56 - Loss: 0.6449 - Accuracy: 0.9441



  0%|          | 0/19 [00:00<?, ?it/s][A
  5%|▌         | 1/19 [00:03<00:57,  3.21s/it][A
 11%|█         | 2/19 [00:03<00:23,  1.39s/it][A
 26%|██▋       | 5/19 [00:05<00:12,  1.11it/s][A
 32%|███▏      | 6/19 [00:05<00:09,  1.41it/s][A
 37%|███▋      | 7/19 [00:05<00:06,  1.83it/s][A
 47%|████▋     | 9/19 [00:08<00:08,  1.21it/s][A
 53%|█████▎    | 10/19 [00:08<00:05,  1.50it/s][A
 58%|█████▊    | 11/19 [00:08<00:04,  1.86it/s][A
 68%|██████▊   | 13/19 [00:10<00:04,  1.46it/s][A
 79%|███████▉  | 15/19 [00:10<00:01,  2.18it/s][A
 84%|████████▍ | 16/19 [00:10<00:01,  2.61it/s][A
 89%|████████▉ | 17/19 [00:12<00:01,  1.25it/s][A
100%|██████████| 19/19 [00:12<00:00,  1.47it/s][A
Epochs:  50%|█████     | 28/56 [25:41<28:36, 61.32s/it]

Val Loss: 0.6660 - Val Accuracy: 0.9381



Training:   0%|          | 0/149 [00:00<?, ?it/s][A
Training:   1%|          | 1/149 [00:03<08:29,  3.44s/it][A
Training:   1%|▏         | 2/149 [00:03<03:55,  1.60s/it][A
Training:   2%|▏         | 3/149 [00:03<02:16,  1.07it/s][A
Training:   3%|▎         | 4/149 [00:04<01:30,  1.60it/s][A
Training:   3%|▎         | 5/149 [00:06<02:39,  1.11s/it][A
Training:   4%|▍         | 6/149 [00:06<02:23,  1.00s/it][A
Training:   5%|▍         | 7/149 [00:06<01:41,  1.40it/s][A
Training:   5%|▌         | 8/149 [00:07<01:15,  1.87it/s][A
Training:   6%|▌         | 9/149 [00:08<02:09,  1.08it/s][A
Training:   7%|▋         | 10/149 [00:09<02:01,  1.15it/s][A
Training:   9%|▊         | 13/149 [00:11<01:44,  1.30it/s][A
Training:   9%|▉         | 14/149 [00:12<01:54,  1.18it/s][A
Training:  11%|█         | 16/149 [00:12<01:12,  1.83it/s][A
Training:  11%|█▏        | 17/149 [00:14<01:43,  1.27it/s][A
Training:  12%|█▏        | 18/149 [00:15<01:49,  1.20it/s][A
Training:  13%|█▎        

Epoch: 29/56 - Loss: 0.6580 - Accuracy: 0.9367



  0%|          | 0/19 [00:00<?, ?it/s][A
  5%|▌         | 1/19 [00:03<00:54,  3.00s/it][A
 11%|█         | 2/19 [00:03<00:22,  1.30s/it][A
 16%|█▌        | 3/19 [00:03<00:12,  1.31it/s][A
 21%|██        | 4/19 [00:03<00:07,  1.92it/s][A
 26%|██▋       | 5/19 [00:05<00:15,  1.09s/it][A
 42%|████▏     | 8/19 [00:05<00:05,  2.03it/s][A
 47%|████▋     | 9/19 [00:07<00:07,  1.28it/s][A
 58%|█████▊    | 11/19 [00:07<00:04,  1.98it/s][A
 63%|██████▎   | 12/19 [00:08<00:03,  2.11it/s][A
 68%|██████▊   | 13/19 [00:10<00:04,  1.20it/s][A
 74%|███████▎  | 14/19 [00:10<00:03,  1.54it/s][A
 89%|████████▉ | 17/19 [00:12<00:01,  1.52it/s][A
100%|██████████| 19/19 [00:12<00:00,  1.52it/s][A
Epochs:  52%|█████▏    | 29/56 [27:42<35:41, 79.31s/it]

Val Loss: 0.7176 - Val Accuracy: 0.9399



Training:   0%|          | 0/149 [00:00<?, ?it/s][A
Training:   1%|          | 1/149 [00:03<08:54,  3.61s/it][A
Training:   2%|▏         | 3/149 [00:03<02:22,  1.02it/s][A
Training:   3%|▎         | 5/149 [00:06<02:44,  1.14s/it][A
Training:   5%|▍         | 7/149 [00:06<01:36,  1.47it/s][A
Training:   6%|▌         | 9/149 [00:09<02:07,  1.10it/s][A
Training:   8%|▊         | 12/149 [00:09<01:11,  1.92it/s][A
Training:   9%|▉         | 14/149 [00:11<01:38,  1.37it/s][A
Training:  10%|█         | 15/149 [00:11<01:23,  1.61it/s][A
Training:  11%|█▏        | 17/149 [00:14<01:49,  1.20it/s][A
Training:  12%|█▏        | 18/149 [00:14<01:30,  1.45it/s][A
Training:  13%|█▎        | 20/149 [00:14<01:01,  2.09it/s][A
Training:  14%|█▍        | 21/149 [00:16<01:47,  1.20it/s][A
Training:  15%|█▍        | 22/149 [00:16<01:25,  1.49it/s][A
Training:  15%|█▌        | 23/149 [00:16<01:08,  1.85it/s][A
Training:  16%|█▌        | 24/149 [00:17<00:54,  2.29it/s][A
Training:  17%|█▋    

Epoch: 30/56 - Loss: 0.6346 - Accuracy: 0.9406



  0%|          | 0/19 [00:00<?, ?it/s][A
  5%|▌         | 1/19 [00:03<01:03,  3.53s/it][A
 11%|█         | 2/19 [00:03<00:26,  1.55s/it][A
 21%|██        | 4/19 [00:03<00:09,  1.63it/s][A
 32%|███▏      | 6/19 [00:05<00:09,  1.32it/s][A
 47%|████▋     | 9/19 [00:07<00:07,  1.41it/s][A
 63%|██████▎   | 12/19 [00:07<00:03,  2.27it/s][A
 68%|██████▊   | 13/19 [00:10<00:04,  1.34it/s][A
 89%|████████▉ | 17/19 [00:12<00:01,  1.62it/s][A
100%|██████████| 19/19 [00:12<00:00,  1.53it/s][A
Epochs:  54%|█████▎    | 30/56 [29:38<39:01, 90.07s/it]

Val Loss: 0.7736 - Val Accuracy: 0.9273



Training:   0%|          | 0/149 [00:00<?, ?it/s][A
Training:   1%|          | 1/149 [00:03<08:02,  3.26s/it][A
Training:   1%|▏         | 2/149 [00:03<03:37,  1.48s/it][A
Training:   2%|▏         | 3/149 [00:03<02:05,  1.17it/s][A
Training:   3%|▎         | 4/149 [00:03<01:21,  1.77it/s][A
Training:   3%|▎         | 5/149 [00:05<02:49,  1.18s/it][A
Training:   4%|▍         | 6/149 [00:06<02:20,  1.02it/s][A
Training:   5%|▌         | 8/149 [00:06<01:15,  1.86it/s][A
Training:   6%|▌         | 9/149 [00:09<02:18,  1.01it/s][A
Training:   7%|▋         | 10/149 [00:09<02:03,  1.12it/s][A
Training:   7%|▋         | 11/149 [00:09<01:34,  1.47it/s][A
Training:   9%|▊         | 13/149 [00:12<02:06,  1.07it/s][A
Training:   9%|▉         | 14/149 [00:12<01:45,  1.28it/s][A
Training:  11%|█         | 16/149 [00:12<01:04,  2.06it/s][A
Training:  11%|█▏        | 17/149 [00:15<02:03,  1.07it/s][A
Training:  12%|█▏        | 18/149 [00:15<01:47,  1.21it/s][A
Training:  14%|█▍       

Epoch: 31/56 - Loss: 0.6394 - Accuracy: 0.9422



  0%|          | 0/19 [00:00<?, ?it/s][A
  5%|▌         | 1/19 [00:03<01:02,  3.47s/it][A
 16%|█▌        | 3/19 [00:03<00:16,  1.01s/it][A
 26%|██▋       | 5/19 [00:05<00:14,  1.02s/it][A
 32%|███▏      | 6/19 [00:05<00:10,  1.28it/s][A
 37%|███▋      | 7/19 [00:06<00:07,  1.65it/s][A
 42%|████▏     | 8/19 [00:06<00:05,  2.11it/s][A
 47%|████▋     | 9/19 [00:08<00:08,  1.13it/s][A
 53%|█████▎    | 10/19 [00:08<00:05,  1.50it/s][A
 63%|██████▎   | 12/19 [00:08<00:02,  2.56it/s][A
 68%|██████▊   | 13/19 [00:10<00:05,  1.18it/s][A
 84%|████████▍ | 16/19 [00:10<00:01,  2.30it/s][A
100%|██████████| 19/19 [00:12<00:00,  1.48it/s][A
Epochs:  55%|█████▌    | 31/56 [31:37<41:12, 98.90s/it]

Val Loss: 0.7663 - Val Accuracy: 0.9276



Training:   0%|          | 0/149 [00:00<?, ?it/s][A
Training:   1%|          | 1/149 [00:03<08:00,  3.25s/it][A
Training:   1%|▏         | 2/149 [00:03<04:12,  1.72s/it][A
Training:   2%|▏         | 3/149 [00:04<02:26,  1.00s/it][A
Training:   3%|▎         | 4/149 [00:04<01:35,  1.52it/s][A
Training:   3%|▎         | 5/149 [00:06<02:51,  1.19s/it][A
Training:   4%|▍         | 6/149 [00:06<02:15,  1.06it/s][A
Training:   5%|▍         | 7/149 [00:06<01:37,  1.45it/s][A
Training:   5%|▌         | 8/149 [00:07<01:13,  1.92it/s][A
Training:   6%|▌         | 9/149 [00:08<02:11,  1.07it/s][A
Training:   7%|▋         | 10/149 [00:09<02:03,  1.12it/s][A
Training:   7%|▋         | 11/149 [00:09<01:30,  1.53it/s][A
Training:   9%|▊         | 13/149 [00:11<01:52,  1.21it/s][A
Training:   9%|▉         | 14/149 [00:12<01:45,  1.28it/s][A
Training:  11%|█         | 16/149 [00:12<01:05,  2.02it/s][A
Training:  11%|█▏        | 17/149 [00:14<01:49,  1.20it/s][A
Training:  12%|█▏        

Epoch: 32/56 - Loss: 0.6381 - Accuracy: 0.9411



  0%|          | 0/19 [00:00<?, ?it/s][A
  5%|▌         | 1/19 [00:03<00:55,  3.09s/it][A
 11%|█         | 2/19 [00:03<00:22,  1.34s/it][A
 21%|██        | 4/19 [00:03<00:08,  1.79it/s][A
 26%|██▋       | 5/19 [00:05<00:13,  1.02it/s][A
 37%|███▋      | 7/19 [00:05<00:06,  1.83it/s][A
 47%|████▋     | 9/19 [00:08<00:08,  1.13it/s][A
 68%|██████▊   | 13/19 [00:10<00:04,  1.40it/s][A
 79%|███████▉  | 15/19 [00:10<00:02,  1.86it/s][A
 84%|████████▍ | 16/19 [00:10<00:01,  2.14it/s][A
 89%|████████▉ | 17/19 [00:12<00:01,  1.29it/s][A
100%|██████████| 19/19 [00:13<00:00,  1.44it/s][A
Epochs:  57%|█████▋    | 32/56 [33:31<41:24, 103.53s/it]

Val Loss: 0.7204 - Val Accuracy: 0.9312



Training:   0%|          | 0/149 [00:00<?, ?it/s][A
Training:   1%|          | 1/149 [00:03<08:10,  3.31s/it][A
Training:   1%|▏         | 2/149 [00:03<03:55,  1.60s/it][A
Training:   3%|▎         | 4/149 [00:03<01:31,  1.59it/s][A
Training:   3%|▎         | 5/149 [00:05<02:34,  1.07s/it][A
Training:   4%|▍         | 6/149 [00:06<02:01,  1.18it/s][A
Training:   6%|▌         | 9/149 [00:08<01:59,  1.17it/s][A
Training:   7%|▋         | 10/149 [00:09<01:41,  1.37it/s][A
Training:   8%|▊         | 12/149 [00:09<01:06,  2.07it/s][A
Training:   9%|▊         | 13/149 [00:11<02:02,  1.11it/s][A
Training:   9%|▉         | 14/149 [00:11<01:38,  1.37it/s][A
Training:  11%|█         | 16/149 [00:11<01:02,  2.14it/s][A
Training:  11%|█▏        | 17/149 [00:14<02:02,  1.08it/s][A
Training:  12%|█▏        | 18/149 [00:14<01:36,  1.35it/s][A
Training:  13%|█▎        | 20/149 [00:14<01:01,  2.09it/s][A
Training:  14%|█▍        | 21/149 [00:17<01:53,  1.13it/s][A
Training:  15%|█▍     

Epoch: 33/56 - Loss: 0.6332 - Accuracy: 0.9414



  0%|          | 0/19 [00:00<?, ?it/s][A
  5%|▌         | 1/19 [00:02<00:52,  2.90s/it][A
 21%|██        | 4/19 [00:03<00:08,  1.72it/s][A
 32%|███▏      | 6/19 [00:05<00:11,  1.14it/s][A
 37%|███▋      | 7/19 [00:05<00:08,  1.42it/s][A
 47%|████▋     | 9/19 [00:07<00:08,  1.14it/s][A
 53%|█████▎    | 10/19 [00:08<00:06,  1.38it/s][A
 58%|█████▊    | 11/19 [00:08<00:04,  1.71it/s][A
 63%|██████▎   | 12/19 [00:08<00:03,  2.10it/s][A
 68%|██████▊   | 13/19 [00:10<00:05,  1.05it/s][A
 74%|███████▎  | 14/19 [00:10<00:03,  1.34it/s][A
 84%|████████▍ | 16/19 [00:11<00:01,  2.21it/s][A
100%|██████████| 19/19 [00:14<00:00,  1.35it/s][A
Epochs:  59%|█████▉    | 33/56 [35:25<40:52, 106.63s/it]

Val Loss: 0.7417 - Val Accuracy: 0.9231



Training:   0%|          | 0/149 [00:00<?, ?it/s][A
Training:   1%|          | 1/149 [00:03<09:39,  3.91s/it][A
Training:   1%|▏         | 2/149 [00:04<04:15,  1.74s/it][A
Training:   3%|▎         | 4/149 [00:04<01:40,  1.44it/s][A
Training:   3%|▎         | 5/149 [00:06<02:59,  1.25s/it][A
Training:   4%|▍         | 6/149 [00:07<02:18,  1.03it/s][A
Training:   6%|▌         | 9/149 [00:09<02:08,  1.09it/s][A
Training:   7%|▋         | 10/149 [00:10<01:49,  1.27it/s][A
Training:   7%|▋         | 11/149 [00:10<01:27,  1.58it/s][A
Training:   9%|▊         | 13/149 [00:12<02:02,  1.11it/s][A
Training:   9%|▉         | 14/149 [00:13<01:48,  1.24it/s][A
Training:  10%|█         | 15/149 [00:13<01:26,  1.54it/s][A
Training:  11%|█         | 16/149 [00:13<01:08,  1.93it/s][A
Training:  11%|█▏        | 17/149 [00:15<02:09,  1.02it/s][A
Training:  12%|█▏        | 18/149 [00:16<01:47,  1.22it/s][A
Training:  13%|█▎        | 19/149 [00:16<01:21,  1.60it/s][A
Training:  13%|█▎     

Epoch: 34/56 - Loss: 0.6401 - Accuracy: 0.9449



  0%|          | 0/19 [00:00<?, ?it/s][A
  5%|▌         | 1/19 [00:03<00:57,  3.18s/it][A
 16%|█▌        | 3/19 [00:03<00:13,  1.16it/s][A
 26%|██▋       | 5/19 [00:05<00:12,  1.09it/s][A
 32%|███▏      | 6/19 [00:05<00:09,  1.43it/s][A
 37%|███▋      | 7/19 [00:05<00:06,  1.83it/s][A
 47%|████▋     | 9/19 [00:07<00:08,  1.23it/s][A
 58%|█████▊    | 11/19 [00:07<00:04,  1.89it/s][A
 68%|██████▊   | 13/19 [00:10<00:04,  1.37it/s][A
 79%|███████▉  | 15/19 [00:10<00:02,  1.84it/s][A
 89%|████████▉ | 17/19 [00:12<00:01,  1.41it/s][A
100%|██████████| 19/19 [00:12<00:00,  1.47it/s][A
Epochs:  61%|██████    | 34/56 [37:25<40:32, 110.55s/it]

Val Loss: 0.6285 - Val Accuracy: 0.9392



Training:   0%|          | 0/149 [00:00<?, ?it/s][A
Training:   1%|          | 1/149 [00:03<08:24,  3.41s/it][A
Training:   1%|▏         | 2/149 [00:03<03:36,  1.47s/it][A
Training:   2%|▏         | 3/149 [00:03<02:08,  1.14it/s][A
Training:   3%|▎         | 5/149 [00:06<02:30,  1.05s/it][A
Training:   5%|▍         | 7/149 [00:06<01:26,  1.65it/s][A
Training:   6%|▌         | 9/149 [00:08<02:03,  1.14it/s][A
Training:   7%|▋         | 11/149 [00:08<01:22,  1.68it/s][A
Training:   9%|▊         | 13/149 [00:11<01:52,  1.21it/s][A
Training:   9%|▉         | 14/149 [00:11<01:33,  1.45it/s][A
Training:  10%|█         | 15/149 [00:11<01:16,  1.75it/s][A
Training:  11%|█         | 16/149 [00:11<01:02,  2.13it/s][A
Training:  11%|█▏        | 17/149 [00:14<02:07,  1.04it/s][A
Training:  13%|█▎        | 19/149 [00:14<01:16,  1.70it/s][A
Training:  14%|█▍        | 21/149 [00:16<01:36,  1.33it/s][A
Training:  15%|█▌        | 23/149 [00:17<01:12,  1.75it/s][A
Training:  16%|█▌     

Epoch: 35/56 - Loss: 0.6579 - Accuracy: 0.9389



  0%|          | 0/19 [00:00<?, ?it/s][A
  5%|▌         | 1/19 [00:02<00:53,  2.96s/it][A
 11%|█         | 2/19 [00:03<00:21,  1.28s/it][A
 16%|█▌        | 3/19 [00:03<00:12,  1.33it/s][A
 26%|██▋       | 5/19 [00:05<00:13,  1.05it/s][A
 37%|███▋      | 7/19 [00:05<00:06,  1.82it/s][A
 42%|████▏     | 8/19 [00:05<00:05,  2.18it/s][A
 47%|████▋     | 9/19 [00:07<00:08,  1.18it/s][A
 58%|█████▊    | 11/19 [00:07<00:04,  1.94it/s][A
 63%|██████▎   | 12/19 [00:08<00:03,  2.18it/s][A
 68%|██████▊   | 13/19 [00:10<00:05,  1.19it/s][A
 84%|████████▍ | 16/19 [00:10<00:01,  2.21it/s][A
 89%|████████▉ | 17/19 [00:12<00:01,  1.36it/s][A
100%|██████████| 19/19 [00:12<00:00,  1.53it/s][A
Epochs:  62%|██████▎   | 35/56 [39:19<39:03, 111.61s/it]

Val Loss: 0.8645 - Val Accuracy: 0.9077



Training:   0%|          | 0/149 [00:00<?, ?it/s][A
Training:   1%|          | 1/149 [00:03<08:20,  3.38s/it][A
Training:   1%|▏         | 2/149 [00:03<03:36,  1.47s/it][A
Training:   2%|▏         | 3/149 [00:03<02:05,  1.16it/s][A
Training:   3%|▎         | 5/149 [00:06<02:39,  1.11s/it][A
Training:   4%|▍         | 6/149 [00:06<01:57,  1.22it/s][A
Training:   5%|▌         | 8/149 [00:06<01:08,  2.05it/s][A
Training:   6%|▌         | 9/149 [00:08<02:04,  1.12it/s][A
Training:   7%|▋         | 11/149 [00:08<01:17,  1.78it/s][A
Training:   9%|▊         | 13/149 [00:11<01:48,  1.26it/s][A
Training:  10%|█         | 15/149 [00:11<01:12,  1.85it/s][A
Training:  11%|█▏        | 17/149 [00:13<01:35,  1.39it/s][A
Training:  13%|█▎        | 20/149 [00:13<00:56,  2.28it/s][A
Training:  15%|█▍        | 22/149 [00:16<01:25,  1.49it/s][A
Training:  16%|█▌        | 24/149 [00:16<01:02,  2.01it/s][A
Training:  17%|█▋        | 26/149 [00:18<01:23,  1.48it/s][A
Training:  19%|█▉      

Epoch: 36/56 - Loss: 0.6320 - Accuracy: 0.9429



  0%|          | 0/19 [00:00<?, ?it/s][A
  5%|▌         | 1/19 [00:02<00:47,  2.63s/it][A
 11%|█         | 2/19 [00:02<00:21,  1.28s/it][A
 16%|█▌        | 3/19 [00:03<00:12,  1.33it/s][A
 26%|██▋       | 5/19 [00:04<00:11,  1.18it/s][A
 32%|███▏      | 6/19 [00:05<00:08,  1.54it/s][A
 37%|███▋      | 7/19 [00:05<00:06,  1.99it/s][A
 42%|████▏     | 8/19 [00:05<00:04,  2.59it/s][A
 47%|████▋     | 9/19 [00:07<00:08,  1.19it/s][A
 53%|█████▎    | 10/19 [00:07<00:06,  1.45it/s][A
 58%|█████▊    | 11/19 [00:07<00:04,  1.93it/s][A
 68%|██████▊   | 13/19 [00:09<00:04,  1.35it/s][A
 74%|███████▎  | 14/19 [00:09<00:03,  1.63it/s][A
 79%|███████▉  | 15/19 [00:10<00:01,  2.09it/s][A
 89%|████████▉ | 17/19 [00:12<00:01,  1.35it/s][A
100%|██████████| 19/19 [00:12<00:00,  1.50it/s][A
Epochs:  64%|██████▍   | 36/56 [41:10<37:06, 111.31s/it]

Val Loss: 0.8574 - Val Accuracy: 0.9204



Training:   0%|          | 0/149 [00:00<?, ?it/s][A
Training:   1%|          | 1/149 [00:03<08:11,  3.32s/it][A
Training:   2%|▏         | 3/149 [00:03<02:16,  1.07it/s][A
Training:   3%|▎         | 4/149 [00:03<01:36,  1.51it/s][A
Training:   3%|▎         | 5/149 [00:06<02:56,  1.22s/it][A
Training:   5%|▍         | 7/149 [00:06<01:33,  1.51it/s][A
Training:   5%|▌         | 8/149 [00:06<01:14,  1.88it/s][A
Training:   6%|▌         | 9/149 [00:08<02:25,  1.04s/it][A
Training:   7%|▋         | 10/149 [00:08<01:49,  1.27it/s][A
Training:   8%|▊         | 12/149 [00:09<01:07,  2.04it/s][A
Training:   9%|▊         | 13/149 [00:11<02:02,  1.11it/s][A
Training:  10%|█         | 15/149 [00:11<01:16,  1.75it/s][A
Training:  11%|█         | 16/149 [00:11<01:02,  2.13it/s][A
Training:  11%|█▏        | 17/149 [00:13<01:47,  1.22it/s][A
Training:  12%|█▏        | 18/149 [00:13<01:23,  1.57it/s][A
Training:  14%|█▍        | 21/149 [00:15<01:24,  1.51it/s][A
Training:  15%|█▍      

Epoch: 37/56 - Loss: 0.6366 - Accuracy: 0.9413



  0%|          | 0/19 [00:00<?, ?it/s][A
  5%|▌         | 1/19 [00:02<00:50,  2.79s/it][A
 11%|█         | 2/19 [00:03<00:24,  1.42s/it][A
 16%|█▌        | 3/19 [00:03<00:13,  1.20it/s][A
 26%|██▋       | 5/19 [00:04<00:11,  1.23it/s][A
 32%|███▏      | 6/19 [00:05<00:08,  1.60it/s][A
 42%|████▏     | 8/19 [00:05<00:04,  2.54it/s][A
 47%|████▋     | 9/19 [00:07<00:07,  1.28it/s][A
 58%|█████▊    | 11/19 [00:07<00:03,  2.02it/s][A
 68%|██████▊   | 13/19 [00:09<00:04,  1.44it/s][A
 84%|████████▍ | 16/19 [00:09<00:01,  2.43it/s][A
 89%|████████▉ | 17/19 [00:11<00:01,  1.45it/s][A
100%|██████████| 19/19 [00:12<00:00,  1.58it/s][A
Epochs:  66%|██████▌   | 37/56 [43:00<35:06, 110.89s/it]

Val Loss: 0.7513 - Val Accuracy: 0.9372



Training:   0%|          | 0/149 [00:00<?, ?it/s][A
Training:   1%|          | 1/149 [00:03<07:59,  3.24s/it][A
Training:   1%|▏         | 2/149 [00:03<04:02,  1.65s/it][A
Training:   2%|▏         | 3/149 [00:03<02:21,  1.03it/s][A
Training:   3%|▎         | 4/149 [00:04<01:31,  1.58it/s][A
Training:   3%|▎         | 5/149 [00:05<02:26,  1.02s/it][A
Training:   4%|▍         | 6/149 [00:06<02:08,  1.11it/s][A
Training:   5%|▌         | 8/149 [00:06<01:08,  2.05it/s][A
Training:   6%|▌         | 9/149 [00:08<01:47,  1.31it/s][A
Training:   7%|▋         | 10/149 [00:08<01:50,  1.26it/s][A
Training:   8%|▊         | 12/149 [00:09<01:04,  2.12it/s][A
Training:   9%|▊         | 13/149 [00:10<01:41,  1.33it/s][A
Training:   9%|▉         | 14/149 [00:11<01:38,  1.37it/s][A
Training:  11%|█▏        | 17/149 [00:13<01:26,  1.52it/s][A
Training:  12%|█▏        | 18/149 [00:14<01:30,  1.45it/s][A
Training:  13%|█▎        | 20/149 [00:14<00:59,  2.17it/s][A
Training:  14%|█▍       

Epoch: 38/56 - Loss: 0.6333 - Accuracy: 0.9431



  0%|          | 0/19 [00:00<?, ?it/s][A
  5%|▌         | 1/19 [00:03<00:54,  3.00s/it][A
 11%|█         | 2/19 [00:03<00:22,  1.32s/it][A
 16%|█▌        | 3/19 [00:03<00:12,  1.30it/s][A
 21%|██        | 4/19 [00:03<00:07,  1.92it/s][A
 26%|██▋       | 5/19 [00:05<00:12,  1.08it/s][A
 37%|███▋      | 7/19 [00:05<00:05,  2.08it/s][A
 47%|████▋     | 9/19 [00:07<00:07,  1.37it/s][A
 53%|█████▎    | 10/19 [00:07<00:05,  1.71it/s][A
 58%|█████▊    | 11/19 [00:07<00:03,  2.14it/s][A
 63%|██████▎   | 12/19 [00:07<00:02,  2.67it/s][A
 68%|██████▊   | 13/19 [00:09<00:04,  1.34it/s][A
 79%|███████▉  | 15/19 [00:09<00:01,  2.22it/s][A
 84%|████████▍ | 16/19 [00:09<00:01,  2.35it/s][A
 89%|████████▉ | 17/19 [00:11<00:01,  1.38it/s][A
100%|██████████| 19/19 [00:11<00:00,  1.62it/s][A
Epochs:  68%|██████▊   | 38/56 [44:49<33:07, 110.42s/it]

Val Loss: 0.8245 - Val Accuracy: 0.9273



Training:   0%|          | 0/149 [00:00<?, ?it/s][A
Training:   1%|          | 1/149 [00:03<08:46,  3.56s/it][A
Training:   3%|▎         | 4/149 [00:03<01:42,  1.41it/s][A
Training:   4%|▍         | 6/149 [00:06<02:12,  1.08it/s][A
Training:   5%|▍         | 7/149 [00:06<01:44,  1.35it/s][A
Training:   6%|▌         | 9/149 [00:08<01:59,  1.17it/s][A
Training:   7%|▋         | 10/149 [00:08<01:39,  1.39it/s][A
Training:   8%|▊         | 12/149 [00:08<01:03,  2.17it/s][A
Training:   9%|▊         | 13/149 [00:10<01:58,  1.15it/s][A
Training:  10%|█         | 15/149 [00:11<01:15,  1.78it/s][A
Training:  11%|█▏        | 17/149 [00:13<01:42,  1.29it/s][A
Training:  13%|█▎        | 19/149 [00:13<01:09,  1.87it/s][A
Training:  14%|█▍        | 21/149 [00:15<01:36,  1.33it/s][A
Training:  15%|█▌        | 23/149 [00:16<01:07,  1.86it/s][A
Training:  17%|█▋        | 25/149 [00:18<01:37,  1.27it/s][A
Training:  18%|█▊        | 27/149 [00:19<01:10,  1.73it/s][A
Training:  19%|█▉    

Epoch: 39/56 - Loss: 0.6257 - Accuracy: 0.9433



  0%|          | 0/19 [00:00<?, ?it/s][A
  5%|▌         | 1/19 [00:03<01:03,  3.53s/it][A
 11%|█         | 2/19 [00:03<00:26,  1.54s/it][A
 21%|██        | 4/19 [00:03<00:09,  1.58it/s][A
 26%|██▋       | 5/19 [00:05<00:14,  1.06s/it][A
 32%|███▏      | 6/19 [00:05<00:10,  1.30it/s][A
 37%|███▋      | 7/19 [00:06<00:06,  1.76it/s][A
 47%|████▋     | 9/19 [00:08<00:08,  1.24it/s][A
 63%|██████▎   | 12/19 [00:08<00:02,  2.37it/s][A
 74%|███████▎  | 14/19 [00:10<00:03,  1.65it/s][A
100%|██████████| 19/19 [00:12<00:00,  1.50it/s][A
Epochs:  70%|██████▉   | 39/56 [46:40<31:18, 110.51s/it]

Val Loss: 0.6996 - Val Accuracy: 0.9387



Training:   0%|          | 0/149 [00:00<?, ?it/s][A
Training:   1%|          | 1/149 [00:03<07:29,  3.03s/it][A
Training:   1%|▏         | 2/149 [00:03<03:23,  1.38s/it][A
Training:   3%|▎         | 5/149 [00:05<02:15,  1.06it/s][A
Training:   4%|▍         | 6/149 [00:05<01:46,  1.35it/s][A
Training:   5%|▌         | 8/149 [00:05<01:06,  2.13it/s][A
Training:   6%|▌         | 9/149 [00:07<01:52,  1.24it/s][A
Training:   7%|▋         | 10/149 [00:08<01:34,  1.47it/s][A
Training:   7%|▋         | 11/149 [00:08<01:13,  1.89it/s][A
Training:   9%|▊         | 13/149 [00:10<01:42,  1.32it/s][A
Training:   9%|▉         | 14/149 [00:10<01:31,  1.48it/s][A
Training:  11%|█▏        | 17/149 [00:13<01:36,  1.37it/s][A
Training:  12%|█▏        | 18/149 [00:13<01:31,  1.43it/s][A
Training:  13%|█▎        | 20/149 [00:13<01:02,  2.07it/s][A
Training:  14%|█▍        | 21/149 [00:15<01:37,  1.31it/s][A
Training:  15%|█▍        | 22/149 [00:16<01:42,  1.24it/s][A
Training:  16%|█▌     

Epoch: 40/56 - Loss: 0.6349 - Accuracy: 0.9439



  0%|          | 0/19 [00:00<?, ?it/s][A
  5%|▌         | 1/19 [00:03<00:58,  3.26s/it][A
 16%|█▌        | 3/19 [00:03<00:14,  1.11it/s][A
 26%|██▋       | 5/19 [00:05<00:14,  1.01s/it][A
 37%|███▋      | 7/19 [00:05<00:07,  1.60it/s][A
 42%|████▏     | 8/19 [00:05<00:05,  1.95it/s][A
 47%|████▋     | 9/19 [00:08<00:08,  1.13it/s][A
 58%|█████▊    | 11/19 [00:08<00:04,  1.83it/s][A
 63%|██████▎   | 12/19 [00:08<00:03,  2.01it/s][A
 68%|██████▊   | 13/19 [00:10<00:05,  1.17it/s][A
 84%|████████▍ | 16/19 [00:10<00:01,  2.22it/s][A
100%|██████████| 19/19 [00:12<00:00,  1.52it/s][A
Epochs:  71%|███████▏  | 40/56 [48:30<29:25, 110.35s/it]

Val Loss: 0.6935 - Val Accuracy: 0.9371



Training:   0%|          | 0/149 [00:00<?, ?it/s][A
Training:   1%|          | 1/149 [00:02<06:45,  2.74s/it][A
Training:   1%|▏         | 2/149 [00:02<03:00,  1.23s/it][A
Training:   3%|▎         | 4/149 [00:03<01:11,  2.03it/s][A
Training:   4%|▍         | 6/149 [00:05<01:54,  1.25it/s][A
Training:   5%|▌         | 8/149 [00:05<01:10,  2.00it/s][A
Training:   7%|▋         | 10/149 [00:07<01:46,  1.31it/s][A
Training:   9%|▊         | 13/149 [00:10<01:43,  1.32it/s][A
Training:   9%|▉         | 14/149 [00:10<01:35,  1.41it/s][A
Training:  10%|█         | 15/149 [00:10<01:19,  1.69it/s][A
Training:  11%|█▏        | 17/149 [00:12<01:42,  1.29it/s][A
Training:  12%|█▏        | 18/149 [00:13<01:26,  1.51it/s][A
Training:  13%|█▎        | 20/149 [00:13<00:58,  2.22it/s][A
Training:  14%|█▍        | 21/149 [00:15<01:43,  1.23it/s][A
Training:  16%|█▌        | 24/149 [00:15<00:55,  2.24it/s][A
Training:  17%|█▋        | 26/149 [00:18<01:27,  1.41it/s][A
Training:  19%|█▉    

Epoch: 41/56 - Loss: 0.6187 - Accuracy: 0.9446



  0%|          | 0/19 [00:00<?, ?it/s][A
  5%|▌         | 1/19 [00:03<00:55,  3.10s/it][A
 16%|█▌        | 3/19 [00:03<00:15,  1.01it/s][A
 26%|██▋       | 5/19 [00:05<00:13,  1.07it/s][A
 37%|███▋      | 7/19 [00:05<00:07,  1.59it/s][A
 47%|████▋     | 9/19 [00:07<00:07,  1.31it/s][A
 58%|█████▊    | 11/19 [00:08<00:04,  1.78it/s][A
 68%|██████▊   | 13/19 [00:09<00:04,  1.48it/s][A
 79%|███████▉  | 15/19 [00:10<00:02,  1.84it/s][A
100%|██████████| 19/19 [00:12<00:00,  1.56it/s][A
Epochs:  73%|███████▎  | 41/56 [50:19<27:29, 109.98s/it]

Val Loss: 0.6152 - Val Accuracy: 0.9400



Training:   0%|          | 0/149 [00:00<?, ?it/s][A
Training:   1%|          | 1/149 [00:03<07:58,  3.23s/it][A
Training:   1%|▏         | 2/149 [00:03<03:26,  1.40s/it][A
Training:   2%|▏         | 3/149 [00:03<01:59,  1.23it/s][A
Training:   3%|▎         | 5/149 [00:05<02:27,  1.03s/it][A
Training:   4%|▍         | 6/149 [00:05<01:50,  1.29it/s][A
Training:   5%|▌         | 8/149 [00:06<01:04,  2.17it/s][A
Training:   6%|▌         | 9/149 [00:08<02:00,  1.17it/s][A
Training:   7%|▋         | 11/149 [00:08<01:13,  1.89it/s][A
Training:   8%|▊         | 12/149 [00:08<01:01,  2.24it/s][A
Training:   9%|▊         | 13/149 [00:10<01:58,  1.15it/s][A
Training:  10%|█         | 15/149 [00:10<01:12,  1.86it/s][A
Training:  11%|█         | 16/149 [00:10<00:59,  2.25it/s][A
Training:  11%|█▏        | 17/149 [00:13<01:54,  1.15it/s][A
Training:  12%|█▏        | 18/149 [00:13<01:27,  1.49it/s][A
Training:  13%|█▎        | 19/149 [00:13<01:07,  1.93it/s][A
Training:  13%|█▎      

Epoch: 42/56 - Loss: 0.6242 - Accuracy: 0.9395



  0%|          | 0/19 [00:00<?, ?it/s][A
  5%|▌         | 1/19 [00:03<01:00,  3.35s/it][A
 11%|█         | 2/19 [00:03<00:25,  1.51s/it][A
 21%|██        | 4/19 [00:03<00:08,  1.68it/s][A
 26%|██▋       | 5/19 [00:05<00:13,  1.03it/s][A
 37%|███▋      | 7/19 [00:05<00:06,  1.85it/s][A
 47%|████▋     | 9/19 [00:07<00:07,  1.30it/s][A
 58%|█████▊    | 11/19 [00:07<00:04,  1.97it/s][A
 68%|██████▊   | 13/19 [00:10<00:04,  1.40it/s][A
 74%|███████▎  | 14/19 [00:10<00:02,  1.68it/s][A
100%|██████████| 19/19 [00:12<00:00,  1.51it/s][A
Epochs:  75%|███████▌  | 42/56 [52:11<25:50, 110.78s/it]

Val Loss: 0.7372 - Val Accuracy: 0.9283



Training:   0%|          | 0/149 [00:00<?, ?it/s][A
Training:   1%|          | 1/149 [00:03<08:49,  3.58s/it][A
Training:   3%|▎         | 4/149 [00:03<01:53,  1.28it/s][A
Training:   3%|▎         | 5/149 [00:06<02:57,  1.23s/it][A
Training:   5%|▍         | 7/149 [00:06<01:42,  1.38it/s][A
Training:   6%|▌         | 9/149 [00:09<02:12,  1.05it/s][A
Training:   8%|▊         | 12/149 [00:09<01:17,  1.76it/s][A
Training:   9%|▊         | 13/149 [00:12<02:05,  1.09it/s][A
Training:  10%|█         | 15/149 [00:12<01:26,  1.55it/s][A
Training:  11%|█         | 16/149 [00:12<01:12,  1.84it/s][A
Training:  11%|█▏        | 17/149 [00:14<02:05,  1.05it/s][A
Training:  12%|█▏        | 18/149 [00:14<01:38,  1.33it/s][A
Training:  13%|█▎        | 19/149 [00:14<01:16,  1.70it/s][A
Training:  14%|█▍        | 21/149 [00:17<01:48,  1.18it/s][A
Training:  15%|█▍        | 22/149 [00:17<01:26,  1.48it/s][A
Training:  16%|█▌        | 24/149 [00:17<00:54,  2.29it/s][A
Training:  17%|█▋    

Epoch: 43/56 - Loss: 0.6283 - Accuracy: 0.9428



  0%|          | 0/19 [00:00<?, ?it/s][A
  5%|▌         | 1/19 [00:02<00:51,  2.86s/it][A
 11%|█         | 2/19 [00:03<00:23,  1.38s/it][A
 26%|██▋       | 5/19 [00:04<00:11,  1.23it/s][A
 32%|███▏      | 6/19 [00:05<00:08,  1.48it/s][A
 47%|████▋     | 9/19 [00:07<00:06,  1.56it/s][A
 53%|█████▎    | 10/19 [00:07<00:05,  1.73it/s][A
 63%|██████▎   | 12/19 [00:07<00:02,  2.56it/s][A
 68%|██████▊   | 13/19 [00:09<00:03,  1.56it/s][A
 74%|███████▎  | 14/19 [00:09<00:02,  1.84it/s][A
 89%|████████▉ | 17/19 [00:10<00:01,  1.88it/s][A
100%|██████████| 19/19 [00:11<00:00,  1.67it/s][A
Epochs:  77%|███████▋  | 43/56 [54:05<24:10, 111.56s/it]

Val Loss: 0.6254 - Val Accuracy: 0.9410



Training:   0%|          | 0/149 [00:00<?, ?it/s][A
Training:   1%|          | 1/149 [00:03<08:25,  3.42s/it][A
Training:   2%|▏         | 3/149 [00:03<02:17,  1.06it/s][A
Training:   3%|▎         | 5/149 [00:05<02:32,  1.06s/it][A
Training:   4%|▍         | 6/149 [00:06<01:55,  1.24it/s][A
Training:   5%|▌         | 8/149 [00:06<01:08,  2.06it/s][A
Training:   6%|▌         | 9/149 [00:08<02:12,  1.06it/s][A
Training:   7%|▋         | 11/149 [00:08<01:21,  1.69it/s][A
Training:   8%|▊         | 12/149 [00:08<01:06,  2.06it/s][A
Training:   9%|▊         | 13/149 [00:11<02:11,  1.03it/s][A
Training:  10%|█         | 15/149 [00:11<01:23,  1.60it/s][A
Training:  11%|█▏        | 17/149 [00:14<01:59,  1.10it/s][A
Training:  12%|█▏        | 18/149 [00:14<01:38,  1.33it/s][A
Training:  13%|█▎        | 19/149 [00:14<01:18,  1.66it/s][A
Training:  14%|█▍        | 21/149 [00:17<02:10,  1.02s/it][A
Training:  15%|█▌        | 23/149 [00:18<01:24,  1.48it/s][A
Training:  17%|█▋     

Epoch: 44/56 - Loss: 0.6209 - Accuracy: 0.9424



  0%|          | 0/19 [00:00<?, ?it/s][A
  5%|▌         | 1/19 [00:03<01:00,  3.34s/it][A
 16%|█▌        | 3/19 [00:03<00:15,  1.06it/s][A
 26%|██▋       | 5/19 [00:05<00:14,  1.04s/it][A
 42%|████▏     | 8/19 [00:05<00:05,  1.90it/s][A
 47%|████▋     | 9/19 [00:08<00:08,  1.22it/s][A
 53%|█████▎    | 10/19 [00:08<00:06,  1.50it/s][A
 58%|█████▊    | 11/19 [00:08<00:04,  1.85it/s][A
 63%|██████▎   | 12/19 [00:08<00:02,  2.34it/s][A
 68%|██████▊   | 13/19 [00:10<00:05,  1.14it/s][A
 84%|████████▍ | 16/19 [00:10<00:01,  2.23it/s][A
100%|██████████| 19/19 [00:12<00:00,  1.51it/s][A
Epochs:  79%|███████▊  | 44/56 [55:56<22:16, 111.40s/it]

Val Loss: 0.7362 - Val Accuracy: 0.9344



Training:   0%|          | 0/149 [00:00<?, ?it/s][A
Training:   1%|          | 1/149 [00:03<07:35,  3.07s/it][A
Training:   2%|▏         | 3/149 [00:03<02:04,  1.17it/s][A
Training:   3%|▎         | 5/149 [00:05<02:17,  1.05it/s][A
Training:   4%|▍         | 6/149 [00:05<01:44,  1.37it/s][A
Training:   5%|▌         | 8/149 [00:05<01:01,  2.28it/s][A
Training:   7%|▋         | 10/149 [00:07<01:37,  1.43it/s][A
Training:   9%|▊         | 13/149 [00:10<01:51,  1.22it/s][A
Training:  10%|█         | 15/149 [00:10<01:19,  1.68it/s][A
Training:  11%|█         | 16/149 [00:10<01:07,  1.96it/s][A
Training:  11%|█▏        | 17/149 [00:13<02:04,  1.06it/s][A
Training:  13%|█▎        | 19/149 [00:13<01:22,  1.58it/s][A
Training:  14%|█▍        | 21/149 [00:16<02:01,  1.05it/s][A
Training:  15%|█▍        | 22/149 [00:17<01:39,  1.27it/s][A
Training:  15%|█▌        | 23/149 [00:17<01:20,  1.56it/s][A
Training:  17%|█▋        | 25/149 [00:19<01:44,  1.18it/s][A
Training:  17%|█▋    

Epoch: 45/56 - Loss: 0.6155 - Accuracy: 0.9433



  0%|          | 0/19 [00:00<?, ?it/s][A
  5%|▌         | 1/19 [00:02<00:49,  2.74s/it][A
 11%|█         | 2/19 [00:02<00:20,  1.21s/it][A
 16%|█▌        | 3/19 [00:03<00:11,  1.35it/s][A
 26%|██▋       | 5/19 [00:05<00:12,  1.14it/s][A
 37%|███▋      | 7/19 [00:05<00:06,  1.93it/s][A
 47%|████▋     | 9/19 [00:07<00:07,  1.41it/s][A
 53%|█████▎    | 10/19 [00:07<00:05,  1.73it/s][A
 58%|█████▊    | 11/19 [00:07<00:03,  2.12it/s][A
 68%|██████▊   | 13/19 [00:09<00:03,  1.52it/s][A
 84%|████████▍ | 16/19 [00:09<00:01,  2.69it/s][A
100%|██████████| 19/19 [00:11<00:00,  1.62it/s][A
Epochs:  80%|████████  | 45/56 [57:46<20:20, 110.93s/it]

Val Loss: 0.6717 - Val Accuracy: 0.9331



Training:   0%|          | 0/149 [00:00<?, ?it/s][A
Training:   1%|          | 1/149 [00:03<07:25,  3.01s/it][A
Training:   1%|▏         | 2/149 [00:03<03:29,  1.43s/it][A
Training:   2%|▏         | 3/149 [00:03<02:01,  1.20it/s][A
Training:   3%|▎         | 4/149 [00:03<01:21,  1.79it/s][A
Training:   3%|▎         | 5/149 [00:05<02:42,  1.13s/it][A
Training:   5%|▍         | 7/149 [00:05<01:23,  1.70it/s][A
Training:   5%|▌         | 8/149 [00:06<01:07,  2.08it/s][A
Training:   6%|▌         | 9/149 [00:08<02:18,  1.01it/s][A
Training:   7%|▋         | 10/149 [00:08<01:42,  1.35it/s][A
Training:   8%|▊         | 12/149 [00:08<01:02,  2.20it/s][A
Training:   9%|▊         | 13/149 [00:11<02:06,  1.08it/s][A
Training:  11%|█         | 16/149 [00:11<01:05,  2.04it/s][A
Training:  11%|█▏        | 17/149 [00:13<01:54,  1.15it/s][A
Training:  12%|█▏        | 18/149 [00:14<01:37,  1.34it/s][A
Training:  13%|█▎        | 20/149 [00:14<01:04,  2.01it/s][A
Training:  14%|█▍       

Epoch: 46/56 - Loss: 0.6226 - Accuracy: 0.9412



  0%|          | 0/19 [00:00<?, ?it/s][A
  5%|▌         | 1/19 [00:02<00:51,  2.85s/it][A
 11%|█         | 2/19 [00:03<00:23,  1.35s/it][A
 21%|██        | 4/19 [00:03<00:08,  1.83it/s][A
 26%|██▋       | 5/19 [00:05<00:12,  1.09it/s][A
 32%|███▏      | 6/19 [00:05<00:08,  1.49it/s][A
 42%|████▏     | 8/19 [00:05<00:04,  2.53it/s][A
 47%|████▋     | 9/19 [00:07<00:07,  1.29it/s][A
 53%|█████▎    | 10/19 [00:07<00:05,  1.51it/s][A
 63%|██████▎   | 12/19 [00:07<00:02,  2.45it/s][A
 68%|██████▊   | 13/19 [00:09<00:04,  1.30it/s][A
 74%|███████▎  | 14/19 [00:10<00:03,  1.33it/s][A
 84%|████████▍ | 16/19 [00:10<00:01,  2.08it/s][A
 89%|████████▉ | 17/19 [00:12<00:01,  1.42it/s][A
100%|██████████| 19/19 [00:12<00:00,  1.51it/s][A
Epochs:  82%|████████▏ | 46/56 [59:35<18:23, 110.35s/it]

Val Loss: 0.7313 - Val Accuracy: 0.9349



Training:   0%|          | 0/149 [00:00<?, ?it/s][A
Training:   1%|          | 1/149 [00:03<07:54,  3.21s/it][A
Training:   1%|▏         | 2/149 [00:03<03:25,  1.40s/it][A
Training:   3%|▎         | 4/149 [00:03<01:20,  1.80it/s][A
Training:   4%|▍         | 6/149 [00:05<02:00,  1.19it/s][A
Training:   5%|▍         | 7/149 [00:05<01:33,  1.53it/s][A
Training:   5%|▌         | 8/149 [00:06<01:13,  1.92it/s][A
Training:   6%|▌         | 9/149 [00:08<02:25,  1.04s/it][A
Training:   7%|▋         | 11/149 [00:08<01:25,  1.62it/s][A
Training:   9%|▊         | 13/149 [00:11<02:09,  1.05it/s][A
Training:   9%|▉         | 14/149 [00:11<01:44,  1.29it/s][A
Training:  11%|█         | 16/149 [00:11<01:07,  1.98it/s][A
Training:  11%|█▏        | 17/149 [00:14<01:58,  1.11it/s][A
Training:  13%|█▎        | 19/149 [00:14<01:16,  1.70it/s][A
Training:  14%|█▍        | 21/149 [00:16<01:43,  1.24it/s][A
Training:  15%|█▌        | 23/149 [00:16<01:10,  1.79it/s][A
Training:  16%|█▌      

Epoch: 47/56 - Loss: 0.6280 - Accuracy: 0.9424



  0%|          | 0/19 [00:00<?, ?it/s][A
  5%|▌         | 1/19 [00:03<01:02,  3.44s/it][A
 11%|█         | 2/19 [00:03<00:25,  1.51s/it][A
 21%|██        | 4/19 [00:03<00:09,  1.63it/s][A
 26%|██▋       | 5/19 [00:05<00:13,  1.01it/s][A
 32%|███▏      | 6/19 [00:05<00:09,  1.35it/s][A
 42%|████▏     | 8/19 [00:05<00:04,  2.29it/s][A
 47%|████▋     | 9/19 [00:08<00:08,  1.16it/s][A
 53%|█████▎    | 10/19 [00:08<00:06,  1.45it/s][A
 68%|██████▊   | 13/19 [00:10<00:04,  1.27it/s][A
 74%|███████▎  | 14/19 [00:11<00:03,  1.50it/s][A
 84%|████████▍ | 16/19 [00:11<00:01,  2.20it/s][A
 89%|████████▉ | 17/19 [00:13<00:01,  1.32it/s][A
100%|██████████| 19/19 [00:13<00:00,  1.40it/s][A
Epochs:  84%|████████▍ | 47/56 [1:01:28<16:40, 111.15s/it]

Val Loss: 0.7053 - Val Accuracy: 0.9364



Training:   0%|          | 0/149 [00:00<?, ?it/s][A
Training:   1%|          | 1/149 [00:03<08:54,  3.61s/it][A
Training:   1%|▏         | 2/149 [00:03<03:48,  1.55s/it][A
Training:   2%|▏         | 3/149 [00:03<02:10,  1.12it/s][A
Training:   3%|▎         | 5/149 [00:06<02:25,  1.01s/it][A
Training:   5%|▍         | 7/149 [00:06<01:24,  1.69it/s][A
Training:   5%|▌         | 8/149 [00:06<01:07,  2.08it/s][A
Training:   6%|▌         | 9/149 [00:08<02:08,  1.09it/s][A
Training:   7%|▋         | 10/149 [00:08<01:37,  1.43it/s][A
Training:   8%|▊         | 12/149 [00:08<00:58,  2.33it/s][A
Training:   9%|▊         | 13/149 [00:11<02:13,  1.02it/s][A
Training:  11%|█         | 16/149 [00:11<01:08,  1.93it/s][A
Training:  11%|█▏        | 17/149 [00:14<01:59,  1.11it/s][A
Training:  13%|█▎        | 19/149 [00:14<01:18,  1.66it/s][A
Training:  14%|█▍        | 21/149 [00:16<01:44,  1.23it/s][A
Training:  15%|█▍        | 22/149 [00:16<01:26,  1.47it/s][A
Training:  15%|█▌      

Epoch: 48/56 - Loss: 0.6254 - Accuracy: 0.9422



  0%|          | 0/19 [00:00<?, ?it/s][A
  5%|▌         | 1/19 [00:02<00:50,  2.79s/it][A
 11%|█         | 2/19 [00:03<00:22,  1.33s/it][A
 16%|█▌        | 3/19 [00:03<00:12,  1.28it/s][A
 26%|██▋       | 5/19 [00:05<00:12,  1.12it/s][A
 32%|███▏      | 6/19 [00:05<00:08,  1.49it/s][A
 42%|████▏     | 8/19 [00:05<00:04,  2.51it/s][A
 47%|████▋     | 9/19 [00:07<00:08,  1.23it/s][A
 68%|██████▊   | 13/19 [00:10<00:04,  1.30it/s][A
 79%|███████▉  | 15/19 [00:10<00:02,  1.77it/s][A
 89%|████████▉ | 17/19 [00:12<00:01,  1.41it/s][A
100%|██████████| 19/19 [00:13<00:00,  1.46it/s][A
Epochs:  86%|████████▌ | 48/56 [1:03:21<14:55, 111.95s/it]

Val Loss: 0.7616 - Val Accuracy: 0.9312



Training:   0%|          | 0/149 [00:00<?, ?it/s][A
Training:   1%|          | 1/149 [00:02<07:15,  2.94s/it][A
Training:   1%|▏         | 2/149 [00:03<03:22,  1.37s/it][A
Training:   2%|▏         | 3/149 [00:03<02:05,  1.17it/s][A
Training:   3%|▎         | 4/149 [00:03<01:22,  1.75it/s][A
Training:   3%|▎         | 5/149 [00:05<02:23,  1.00it/s][A
Training:   4%|▍         | 6/149 [00:05<02:01,  1.18it/s][A
Training:   5%|▍         | 7/149 [00:06<01:32,  1.54it/s][A
Training:   5%|▌         | 8/149 [00:06<01:07,  2.10it/s][A
Training:   6%|▌         | 9/149 [00:08<02:23,  1.03s/it][A
Training:   7%|▋         | 10/149 [00:09<02:19,  1.01s/it][A
Training:   7%|▋         | 11/149 [00:09<01:40,  1.37it/s][A
Training:   9%|▊         | 13/149 [00:11<01:46,  1.28it/s][A
Training:   9%|▉         | 14/149 [00:12<01:52,  1.20it/s][A
Training:  10%|█         | 15/149 [00:12<01:26,  1.55it/s][A
Training:  11%|█▏        | 17/149 [00:13<01:28,  1.50it/s][A
Training:  12%|█▏        

Epoch: 49/56 - Loss: 0.6265 - Accuracy: 0.9395



  0%|          | 0/19 [00:00<?, ?it/s][A
  5%|▌         | 1/19 [00:02<00:43,  2.40s/it][A
 11%|█         | 2/19 [00:02<00:19,  1.15s/it][A
 21%|██        | 4/19 [00:02<00:07,  2.14it/s][A
 26%|██▋       | 5/19 [00:04<00:12,  1.16it/s][A
 32%|███▏      | 6/19 [00:04<00:09,  1.44it/s][A
 37%|███▋      | 7/19 [00:05<00:08,  1.42it/s][A
 47%|████▋     | 9/19 [00:07<00:07,  1.26it/s][A
 53%|█████▎    | 10/19 [00:07<00:06,  1.47it/s][A
 58%|█████▊    | 11/19 [00:07<00:04,  1.78it/s][A
 68%|██████▊   | 13/19 [00:09<00:04,  1.40it/s][A
 74%|███████▎  | 14/19 [00:10<00:03,  1.65it/s][A
 84%|████████▍ | 16/19 [00:10<00:01,  2.24it/s][A
 89%|████████▉ | 17/19 [00:11<00:01,  1.46it/s][A
100%|██████████| 19/19 [00:12<00:00,  1.54it/s][A
Epochs:  88%|████████▊ | 49/56 [1:05:14<13:04, 112.12s/it]

Val Loss: 0.6781 - Val Accuracy: 0.9382



Training:   0%|          | 0/149 [00:00<?, ?it/s][A
Training:   1%|          | 1/149 [00:03<08:05,  3.28s/it][A
Training:   2%|▏         | 3/149 [00:03<02:14,  1.08it/s][A
Training:   3%|▎         | 5/149 [00:06<02:41,  1.12s/it][A
Training:   5%|▌         | 8/149 [00:06<01:27,  1.61it/s][A
Training:   6%|▌         | 9/149 [00:09<02:16,  1.02it/s][A
Training:   7%|▋         | 11/149 [00:09<01:34,  1.46it/s][A
Training:   9%|▊         | 13/149 [00:11<01:55,  1.17it/s][A
Training:   9%|▉         | 14/149 [00:11<01:35,  1.41it/s][A
Training:  10%|█         | 15/149 [00:12<01:25,  1.57it/s][A
Training:  11%|█▏        | 17/149 [00:14<01:37,  1.35it/s][A
Training:  12%|█▏        | 18/149 [00:14<01:19,  1.65it/s][A
Training:  13%|█▎        | 19/149 [00:14<01:14,  1.74it/s][A
Training:  14%|█▍        | 21/149 [00:16<01:33,  1.37it/s][A
Training:  15%|█▍        | 22/149 [00:16<01:17,  1.63it/s][A
Training:  15%|█▌        | 23/149 [00:16<01:05,  1.93it/s][A
Training:  16%|█▌    

Epoch: 50/56 - Loss: 0.6141 - Accuracy: 0.9436



  0%|          | 0/19 [00:00<?, ?it/s][A
  5%|▌         | 1/19 [00:03<00:54,  3.02s/it][A
 11%|█         | 2/19 [00:03<00:23,  1.39s/it][A
 16%|█▌        | 3/19 [00:03<00:13,  1.23it/s][A
 26%|██▋       | 5/19 [00:06<00:15,  1.10s/it][A
 32%|███▏      | 6/19 [00:06<00:11,  1.16it/s][A
 37%|███▋      | 7/19 [00:06<00:08,  1.47it/s][A
 47%|████▋     | 9/19 [00:08<00:07,  1.30it/s][A
 53%|█████▎    | 10/19 [00:08<00:05,  1.63it/s][A
 58%|█████▊    | 11/19 [00:08<00:04,  1.76it/s][A
 63%|██████▎   | 12/19 [00:09<00:03,  2.23it/s][A
 68%|██████▊   | 13/19 [00:10<00:04,  1.26it/s][A
 79%|███████▉  | 15/19 [00:11<00:02,  1.73it/s][A
100%|██████████| 19/19 [00:13<00:00,  1.45it/s][A
Epochs:  89%|████████▉ | 50/56 [1:07:09<11:18, 113.12s/it]

Val Loss: 0.8102 - Val Accuracy: 0.9249



Training:   0%|          | 0/149 [00:00<?, ?it/s][A
Training:   1%|          | 1/149 [00:04<10:06,  4.10s/it][A
Training:   2%|▏         | 3/149 [00:04<02:42,  1.11s/it][A
Training:   3%|▎         | 5/149 [00:06<02:48,  1.17s/it][A
Training:   4%|▍         | 6/149 [00:06<02:06,  1.13it/s][A
Training:   5%|▍         | 7/149 [00:06<01:35,  1.49it/s][A
Training:   5%|▌         | 8/149 [00:07<01:14,  1.89it/s][A
Training:   6%|▌         | 9/149 [00:10<02:52,  1.23s/it][A
Training:   7%|▋         | 10/149 [00:10<02:05,  1.11it/s][A
Training:   7%|▋         | 11/149 [00:10<01:34,  1.46it/s][A
Training:   9%|▊         | 13/149 [00:13<02:14,  1.01it/s][A
Training:  11%|█         | 16/149 [00:13<01:09,  1.92it/s][A
Training:  12%|█▏        | 18/149 [00:15<01:44,  1.26it/s][A
Training:  13%|█▎        | 20/149 [00:16<01:12,  1.77it/s][A
Training:  15%|█▍        | 22/149 [00:18<01:32,  1.37it/s][A
Training:  17%|█▋        | 25/149 [00:20<01:35,  1.30it/s][A
Training:  17%|█▋      

Epoch: 51/56 - Loss: 0.6097 - Accuracy: 0.9448



  0%|          | 0/19 [00:00<?, ?it/s][A
  5%|▌         | 1/19 [00:02<00:47,  2.66s/it][A
 21%|██        | 4/19 [00:02<00:08,  1.85it/s][A
 32%|███▏      | 6/19 [00:05<00:11,  1.17it/s][A
 42%|████▏     | 8/19 [00:05<00:06,  1.79it/s][A
 47%|████▋     | 9/19 [00:07<00:07,  1.29it/s][A
 53%|█████▎    | 10/19 [00:07<00:06,  1.43it/s][A
 58%|█████▊    | 11/19 [00:07<00:04,  1.77it/s][A
 68%|██████▊   | 13/19 [00:09<00:04,  1.45it/s][A
 74%|███████▎  | 14/19 [00:09<00:03,  1.65it/s][A
 79%|███████▉  | 15/19 [00:09<00:02,  1.93it/s][A
 89%|████████▉ | 17/19 [00:11<00:01,  1.59it/s][A
100%|██████████| 19/19 [00:12<00:00,  1.57it/s][A
Epochs:  91%|█████████ | 51/56 [1:09:00<09:22, 112.44s/it]

Val Loss: 0.6636 - Val Accuracy: 0.9453



Training:   0%|          | 0/149 [00:00<?, ?it/s][A
Training:   1%|          | 1/149 [00:03<08:50,  3.58s/it][A
Training:   1%|▏         | 2/149 [00:03<03:53,  1.59s/it][A
Training:   3%|▎         | 4/149 [00:03<01:30,  1.60it/s][A
Training:   4%|▍         | 6/149 [00:06<02:30,  1.05s/it][A
Training:   5%|▍         | 7/149 [00:07<01:57,  1.21it/s][A
Training:   5%|▌         | 8/149 [00:07<01:31,  1.54it/s][A
Training:   6%|▌         | 9/149 [00:09<02:21,  1.01s/it][A
Training:   7%|▋         | 10/149 [00:09<01:58,  1.17it/s][A
Training:   8%|▊         | 12/149 [00:09<01:11,  1.92it/s][A
Training:   9%|▊         | 13/149 [00:11<01:56,  1.17it/s][A
Training:   9%|▉         | 14/149 [00:12<01:40,  1.34it/s][A
Training:  11%|█         | 16/149 [00:12<01:00,  2.19it/s][A
Training:  11%|█▏        | 17/149 [00:14<01:44,  1.26it/s][A
Training:  12%|█▏        | 18/149 [00:14<01:34,  1.39it/s][A
Training:  13%|█▎        | 20/149 [00:14<00:57,  2.24it/s][A
Training:  14%|█▍      

Epoch: 52/56 - Loss: 0.6028 - Accuracy: 0.9443



  0%|          | 0/19 [00:00<?, ?it/s][A
  5%|▌         | 1/19 [00:02<00:51,  2.83s/it][A
 16%|█▌        | 3/19 [00:03<00:13,  1.19it/s][A
 21%|██        | 4/19 [00:03<00:09,  1.55it/s][A
 26%|██▋       | 5/19 [00:05<00:14,  1.06s/it][A
 37%|███▋      | 7/19 [00:05<00:07,  1.67it/s][A
 47%|████▋     | 9/19 [00:07<00:07,  1.31it/s][A
 58%|█████▊    | 11/19 [00:07<00:04,  1.82it/s][A
 63%|██████▎   | 12/19 [00:08<00:03,  2.14it/s][A
 68%|██████▊   | 13/19 [00:09<00:04,  1.33it/s][A
 79%|███████▉  | 15/19 [00:10<00:02,  1.98it/s][A
 89%|████████▉ | 17/19 [00:12<00:01,  1.46it/s][A
100%|██████████| 19/19 [00:12<00:00,  1.54it/s][A
Epochs:  93%|█████████▎| 52/56 [1:10:51<07:28, 112.01s/it]

Val Loss: 0.6931 - Val Accuracy: 0.9389



Training:   0%|          | 0/149 [00:00<?, ?it/s][A
Training:   1%|          | 1/149 [00:03<09:09,  3.71s/it][A
Training:   2%|▏         | 3/149 [00:03<02:28,  1.01s/it][A
Training:   3%|▎         | 4/149 [00:04<01:56,  1.25it/s][A
Training:   3%|▎         | 5/149 [00:06<03:21,  1.40s/it][A
Training:   4%|▍         | 6/149 [00:06<02:20,  1.02it/s][A
Training:   5%|▍         | 7/149 [00:07<01:42,  1.39it/s][A
Training:   5%|▌         | 8/149 [00:07<01:15,  1.88it/s][A
Training:   6%|▌         | 9/149 [00:09<02:19,  1.00it/s][A
Training:   7%|▋         | 11/149 [00:09<01:18,  1.77it/s][A
Training:   8%|▊         | 12/149 [00:09<01:01,  2.22it/s][A
Training:   9%|▊         | 13/149 [00:11<02:09,  1.05it/s][A
Training:  10%|█         | 15/149 [00:12<01:18,  1.70it/s][A
Training:  11%|█▏        | 17/149 [00:14<01:36,  1.36it/s][A
Training:  12%|█▏        | 18/149 [00:14<01:19,  1.66it/s][A
Training:  13%|█▎        | 19/149 [00:14<01:05,  1.99it/s][A
Training:  13%|█▎       

Epoch: 53/56 - Loss: 0.6093 - Accuracy: 0.9426



  0%|          | 0/19 [00:00<?, ?it/s][A
  5%|▌         | 1/19 [00:02<00:53,  2.99s/it][A
 11%|█         | 2/19 [00:03<00:22,  1.30s/it][A
 21%|██        | 4/19 [00:03<00:09,  1.61it/s][A
 26%|██▋       | 5/19 [00:05<00:13,  1.03it/s][A
 32%|███▏      | 6/19 [00:05<00:09,  1.39it/s][A
 42%|████▏     | 8/19 [00:05<00:05,  2.12it/s][A
 47%|████▋     | 9/19 [00:07<00:07,  1.34it/s][A
 53%|█████▎    | 10/19 [00:07<00:05,  1.65it/s][A
 63%|██████▎   | 12/19 [00:08<00:03,  2.14it/s][A
 68%|██████▊   | 13/19 [00:09<00:04,  1.38it/s][A
 74%|███████▎  | 14/19 [00:09<00:02,  1.69it/s][A
 84%|████████▍ | 16/19 [00:10<00:01,  2.19it/s][A
 89%|████████▉ | 17/19 [00:11<00:01,  1.49it/s][A
100%|██████████| 19/19 [00:12<00:00,  1.56it/s][A
Epochs:  95%|█████████▍| 53/56 [1:12:42<05:34, 111.58s/it]

Val Loss: 0.7116 - Val Accuracy: 0.9427



Training:   0%|          | 0/149 [00:00<?, ?it/s][A
Training:   1%|          | 1/149 [00:03<08:33,  3.47s/it][A
Training:   1%|▏         | 2/149 [00:03<03:41,  1.50s/it][A
Training:   2%|▏         | 3/149 [00:03<02:06,  1.15it/s][A
Training:   3%|▎         | 5/149 [00:06<02:41,  1.12s/it][A
Training:   4%|▍         | 6/149 [00:06<01:59,  1.19it/s][A
Training:   5%|▍         | 7/149 [00:06<01:34,  1.51it/s][A
Training:   5%|▌         | 8/149 [00:06<01:10,  1.99it/s][A
Training:   6%|▌         | 9/149 [00:08<02:13,  1.05it/s][A
Training:   7%|▋         | 10/149 [00:09<01:40,  1.38it/s][A
Training:   7%|▋         | 11/149 [00:09<01:23,  1.66it/s][A
Training:   8%|▊         | 12/149 [00:09<01:03,  2.17it/s][A
Training:   9%|▊         | 13/149 [00:11<02:01,  1.12it/s][A
Training:   9%|▉         | 14/149 [00:11<01:38,  1.37it/s][A
Training:  10%|█         | 15/149 [00:12<01:19,  1.69it/s][A
Training:  11%|█▏        | 17/149 [00:13<01:33,  1.41it/s][A
Training:  12%|█▏       

Training:  97%|█████████▋| 145/149 [01:36<00:02,  1.38it/s][A
Training:  99%|█████████▊| 147/149 [01:37<00:01,  1.57it/s][A
Training:  99%|█████████▉| 148/149 [01:37<00:00,  1.81it/s][A
                                                           [A

Epoch: 54/56 - Loss: 0.6156 - Accuracy: 0.9455



  0%|          | 0/19 [00:00<?, ?it/s][A
  5%|▌         | 1/19 [00:03<00:54,  3.03s/it][A
 11%|█         | 2/19 [00:03<00:24,  1.42s/it][A
 21%|██        | 4/19 [00:03<00:08,  1.77it/s][A
 26%|██▋       | 5/19 [00:05<00:12,  1.09it/s][A
 32%|███▏      | 6/19 [00:05<00:09,  1.42it/s][A
 42%|████▏     | 8/19 [00:05<00:04,  2.44it/s][A
 47%|████▋     | 9/19 [00:07<00:07,  1.27it/s][A
 53%|█████▎    | 10/19 [00:07<00:06,  1.48it/s][A
 58%|█████▊    | 11/19 [00:07<00:04,  1.92it/s][A
 68%|██████▊   | 13/19 [00:09<00:04,  1.39it/s][A
 74%|███████▎  | 14/19 [00:10<00:03,  1.60it/s][A
 84%|████████▍ | 16/19 [00:10<00:01,  2.55it/s][A
 89%|████████▉ | 17/19 [00:11<00:01,  1.45it/s][A
100%|██████████| 19/19 [00:12<00:00,  1.54it/s][A
Epochs:  96%|█████████▋| 54/56 [1:14:32<03:42, 111.17s/it]

Val Loss: 0.6431 - Val Accuracy: 0.9334



Training:   0%|          | 0/149 [00:00<?, ?it/s][A
Training:   1%|          | 1/149 [00:04<10:24,  4.22s/it][A
Training:   2%|▏         | 3/149 [00:04<02:46,  1.14s/it][A
Training:   3%|▎         | 4/149 [00:04<01:55,  1.25it/s][A
Training:   3%|▎         | 5/149 [00:06<03:08,  1.31s/it][A
Training:   5%|▍         | 7/149 [00:06<01:40,  1.42it/s][A
Training:   6%|▌         | 9/149 [00:09<02:08,  1.09it/s][A
Training:   7%|▋         | 11/149 [00:09<01:22,  1.67it/s][A
Training:   9%|▊         | 13/149 [00:12<01:53,  1.20it/s][A
Training:   9%|▉         | 14/149 [00:12<01:33,  1.44it/s][A
Training:  10%|█         | 15/149 [00:12<01:15,  1.78it/s][A
Training:  11%|█▏        | 17/149 [00:14<01:36,  1.37it/s][A
Training:  13%|█▎        | 20/149 [00:14<00:55,  2.34it/s][A
Training:  14%|█▍        | 21/149 [00:16<01:40,  1.28it/s][A
Training:  16%|█▌        | 24/149 [00:17<00:58,  2.15it/s][A
Training:  17%|█▋        | 26/149 [00:19<01:23,  1.47it/s][A
Training:  18%|█▊     

Epoch: 55/56 - Loss: 0.6049 - Accuracy: 0.9447



  0%|          | 0/19 [00:00<?, ?it/s][A
  5%|▌         | 1/19 [00:03<00:58,  3.27s/it][A
 11%|█         | 2/19 [00:03<00:23,  1.40s/it][A
 16%|█▌        | 3/19 [00:03<00:13,  1.21it/s][A
 26%|██▋       | 5/19 [00:05<00:12,  1.15it/s][A
 37%|███▋      | 7/19 [00:05<00:06,  1.91it/s][A
 47%|████▋     | 9/19 [00:07<00:07,  1.31it/s][A
 58%|█████▊    | 11/19 [00:07<00:04,  1.97it/s][A
 68%|██████▊   | 13/19 [00:10<00:04,  1.37it/s][A
 84%|████████▍ | 16/19 [00:10<00:01,  2.28it/s][A
100%|██████████| 19/19 [00:12<00:00,  1.52it/s][A
Epochs:  98%|█████████▊| 55/56 [1:16:22<01:50, 110.75s/it]

Val Loss: 0.7337 - Val Accuracy: 0.9255



Training:   0%|          | 0/149 [00:00<?, ?it/s][A
Training:   1%|          | 1/149 [00:03<09:40,  3.92s/it][A
Training:   1%|▏         | 2/149 [00:04<04:09,  1.70s/it][A
Training:   2%|▏         | 3/149 [00:04<02:21,  1.03it/s][A
Training:   3%|▎         | 5/149 [00:06<02:35,  1.08s/it][A
Training:   5%|▍         | 7/149 [00:06<01:30,  1.57it/s][A
Training:   6%|▌         | 9/149 [00:08<01:55,  1.21it/s][A
Training:   7%|▋         | 10/149 [00:09<01:33,  1.49it/s][A
Training:   8%|▊         | 12/149 [00:09<01:01,  2.24it/s][A
Training:   9%|▊         | 13/149 [00:11<01:55,  1.18it/s][A
Training:  10%|█         | 15/149 [00:11<01:14,  1.79it/s][A
Training:  11%|█▏        | 17/149 [00:14<01:43,  1.28it/s][A
Training:  13%|█▎        | 20/149 [00:14<00:59,  2.16it/s][A
Training:  15%|█▍        | 22/149 [00:16<01:26,  1.47it/s][A
Training:  17%|█▋        | 25/149 [00:18<01:25,  1.44it/s][A
Training:  17%|█▋        | 26/149 [00:18<01:15,  1.64it/s][A
Training:  19%|█▉     

Epoch: 56/56 - Loss: 0.6141 - Accuracy: 0.9431



  0%|          | 0/19 [00:00<?, ?it/s][A
  5%|▌         | 1/19 [00:02<00:52,  2.91s/it][A
 11%|█         | 2/19 [00:03<00:25,  1.50s/it][A
 21%|██        | 4/19 [00:03<00:09,  1.65it/s][A
 26%|██▋       | 5/19 [00:04<00:11,  1.19it/s][A
 32%|███▏      | 6/19 [00:05<00:09,  1.39it/s][A
 42%|████▏     | 8/19 [00:05<00:04,  2.39it/s][A
 47%|████▋     | 9/19 [00:07<00:07,  1.31it/s][A
 53%|█████▎    | 10/19 [00:07<00:06,  1.41it/s][A
 58%|█████▊    | 11/19 [00:08<00:04,  1.83it/s][A
 63%|██████▎   | 12/19 [00:08<00:03,  2.33it/s][A
 68%|██████▊   | 13/19 [00:09<00:04,  1.41it/s][A
 74%|███████▎  | 14/19 [00:10<00:03,  1.47it/s][A
 84%|████████▍ | 16/19 [00:10<00:01,  2.53it/s][A
 89%|████████▉ | 17/19 [00:11<00:01,  1.42it/s][A
100%|██████████| 19/19 [00:12<00:00,  1.53it/s][A
Epochs: 100%|██████████| 56/56 [1:18:11<00:00, 83.77s/it] 


Val Loss: 0.6861 - Val Accuracy: 0.9371
Saving best model...


[32m[I 2023-12-14 23:09:52,401][0m Trial 0 finished with value: 0.937110424041748 and parameters: {'learning_rate': 0.00035883062711026257, 'weight_decay': 0.0010839916629925644, 'epsilon': 4.615406108202454e-09, 'batch_size': 94, 'epochs': 56}. Best is trial 0 with value: 0.937110424041748.[0m


Learning rate: 0.09367970229059014
Weight decay: 0.00011786297022567189
Epsilon: 1.3474912558273086e-08
Batch size: 52
Number of epochs: 96


Epochs:   0%|          | 0/96 [00:00<?, ?it/s]
Training:   0%|          | 0/269 [00:00<?, ?it/s][A
Training:   0%|          | 1/269 [00:02<09:05,  2.04s/it][A
Training:   1%|          | 3/269 [00:02<02:34,  1.73it/s][A
Training:   2%|▏         | 5/269 [00:03<02:49,  1.55it/s][A
Training:   3%|▎         | 8/269 [00:03<01:27,  2.98it/s][A
Training:   4%|▎         | 10/269 [00:05<01:56,  2.22it/s][A
Training:   4%|▍         | 11/269 [00:05<01:40,  2.58it/s][A
Training:   4%|▍         | 12/269 [00:05<01:29,  2.88it/s][A
Training:   5%|▍         | 13/269 [00:06<02:11,  1.95it/s][A
Training:   5%|▌         | 14/269 [00:06<01:45,  2.43it/s][A
Training:   6%|▌         | 16/269 [00:06<01:13,  3.45it/s][A
Training:   6%|▋         | 17/269 [00:08<02:05,  2.00it/s][A
Training:   7%|▋         | 19/269 [00:08<01:22,  3.04it/s][A
Training:   8%|▊         | 21/269 [00:09<01:43,  2.40it/s][A
Training:   9%|▉         | 24/269 [00:09<01:02,  3.91it/s][A
Training:  10%|▉         | 26/269 [0

Training:  94%|█████████▍| 253/269 [01:30<00:06,  2.38it/s][A
Training:  94%|█████████▍| 254/269 [01:30<00:05,  2.61it/s][A
Training:  96%|█████████▌| 257/269 [01:31<00:04,  2.69it/s][A
Training:  96%|█████████▌| 258/269 [01:32<00:04,  2.59it/s][A
Training:  97%|█████████▋| 261/269 [01:32<00:02,  2.91it/s][A
Training:  97%|█████████▋| 262/269 [01:33<00:02,  2.48it/s][A
Training:  98%|█████████▊| 264/269 [01:33<00:01,  3.39it/s][A
Training:  99%|█████████▊| 265/269 [01:34<00:01,  2.96it/s][A
Training:  99%|█████████▉| 266/269 [01:34<00:01,  2.67it/s][A
Training: 100%|██████████| 269/269 [01:35<00:00,  4.05it/s][A
                                                           [A

Epoch: 1/96 - Loss: 8187.7490 - Accuracy: 0.8380



  0%|          | 0/34 [00:00<?, ?it/s][A
  3%|▎         | 1/34 [00:01<00:49,  1.51s/it][A
  9%|▉         | 3/34 [00:01<00:14,  2.21it/s][A
 15%|█▍        | 5/34 [00:02<00:12,  2.23it/s][A
 18%|█▊        | 6/34 [00:02<00:10,  2.57it/s][A
 26%|██▋       | 9/34 [00:04<00:09,  2.54it/s][A
 29%|██▉       | 10/34 [00:04<00:08,  2.94it/s][A
 35%|███▌      | 12/34 [00:04<00:05,  4.23it/s][A
 38%|███▊      | 13/34 [00:05<00:08,  2.58it/s][A
 44%|████▍     | 15/34 [00:05<00:04,  3.80it/s][A
 50%|█████     | 17/34 [00:06<00:05,  2.92it/s][A
 53%|█████▎    | 18/34 [00:06<00:05,  3.15it/s][A
 56%|█████▌    | 19/34 [00:06<00:04,  3.42it/s][A
 62%|██████▏   | 21/34 [00:07<00:04,  2.80it/s][A
 65%|██████▍   | 22/34 [00:07<00:03,  3.02it/s][A
 68%|██████▊   | 23/34 [00:08<00:03,  3.50it/s][A
 74%|███████▎  | 25/34 [00:08<00:03,  2.93it/s][A
 76%|███████▋  | 26/34 [00:09<00:02,  3.05it/s][A
 82%|████████▏ | 28/34 [00:09<00:01,  4.53it/s][A
 85%|████████▌ | 29/34 [00:10<00:01,  2.93it

Val Loss: 9808.7031 - Val Accuracy: 0.8997



Training:   0%|          | 0/269 [00:00<?, ?it/s][A
Training:   0%|          | 1/269 [00:01<08:29,  1.90s/it][A
Training:   1%|          | 3/269 [00:02<02:29,  1.78it/s][A
Training:   1%|▏         | 4/269 [00:02<01:50,  2.39it/s][A
Training:   2%|▏         | 5/269 [00:03<02:40,  1.64it/s][A
Training:   3%|▎         | 7/269 [00:03<01:28,  2.95it/s][A
Training:   3%|▎         | 9/269 [00:04<02:03,  2.10it/s][A
Training:   4%|▍         | 12/269 [00:04<01:09,  3.67it/s][A
Training:   5%|▌         | 14/269 [00:06<01:40,  2.53it/s][A
Training:   6%|▌         | 16/269 [00:06<01:14,  3.41it/s][A
Training:   7%|▋         | 18/269 [00:07<01:50,  2.27it/s][A
Training:   7%|▋         | 20/269 [00:07<01:20,  3.08it/s][A
Training:   8%|▊         | 22/269 [00:09<01:46,  2.32it/s][A
Training:   9%|▉         | 24/269 [00:09<01:17,  3.15it/s][A
Training:  10%|▉         | 26/269 [00:10<01:46,  2.28it/s][A
Training:  10%|█         | 28/269 [00:10<01:17,  3.09it/s][A
Training:  11%|█      

Epoch: 2/96 - Loss: 11060.6445 - Accuracy: 0.8829



  0%|          | 0/34 [00:00<?, ?it/s][A
  3%|▎         | 1/34 [00:01<01:00,  1.84s/it][A
  6%|▌         | 2/34 [00:01<00:26,  1.21it/s][A
 12%|█▏        | 4/34 [00:02<00:10,  2.93it/s][A
 18%|█▊        | 6/34 [00:03<00:11,  2.44it/s][A
 26%|██▋       | 9/34 [00:04<00:09,  2.73it/s][A
 29%|██▉       | 10/34 [00:04<00:07,  3.02it/s][A
 38%|███▊      | 13/34 [00:05<00:06,  3.08it/s][A
 41%|████      | 14/34 [00:05<00:06,  3.06it/s][A
 50%|█████     | 17/34 [00:06<00:05,  3.33it/s][A
 53%|█████▎    | 18/34 [00:06<00:05,  3.02it/s][A
 59%|█████▉    | 20/34 [00:06<00:03,  4.00it/s][A
 62%|██████▏   | 21/34 [00:07<00:04,  3.07it/s][A
 65%|██████▍   | 22/34 [00:08<00:04,  2.80it/s][A
 71%|███████   | 24/34 [00:08<00:02,  4.01it/s][A
 74%|███████▎  | 25/34 [00:08<00:02,  3.02it/s][A
 76%|███████▋  | 26/34 [00:09<00:02,  2.95it/s][A
 85%|████████▌ | 29/34 [00:10<00:01,  3.26it/s][A
 88%|████████▊ | 30/34 [00:10<00:01,  3.08it/s][A
100%|██████████| 34/34 [00:11<00:00,  2.99it

Val Loss: 11531.9033 - Val Accuracy: 0.8591



Training:   0%|          | 0/269 [00:00<?, ?it/s][A
Training:   0%|          | 1/269 [00:01<08:40,  1.94s/it][A
Training:   1%|          | 3/269 [00:02<02:26,  1.81it/s][A
Training:   2%|▏         | 5/269 [00:03<02:25,  1.82it/s][A
Training:   2%|▏         | 6/269 [00:03<01:59,  2.21it/s][A
Training:   3%|▎         | 9/269 [00:04<01:52,  2.30it/s][A
Training:   4%|▎         | 10/269 [00:04<01:38,  2.63it/s][A
Training:   5%|▍         | 13/269 [00:05<01:36,  2.66it/s][A
Training:   5%|▌         | 14/269 [00:06<01:30,  2.82it/s][A
Training:   6%|▋         | 17/269 [00:07<01:32,  2.74it/s][A
Training:   7%|▋         | 18/269 [00:07<01:20,  3.13it/s][A
Training:   7%|▋         | 20/269 [00:07<01:02,  3.98it/s][A
Training:   8%|▊         | 21/269 [00:08<01:43,  2.39it/s][A
Training:   9%|▊         | 23/269 [00:08<01:15,  3.26it/s][A
Training:   9%|▉         | 25/269 [00:10<01:35,  2.57it/s][A
Training:  10%|▉         | 26/269 [00:10<01:24,  2.87it/s][A
Training:  10%|█     

Training:  60%|█████▉    | 161/269 [00:56<00:37,  2.89it/s][A
Training:  60%|██████    | 162/269 [00:57<00:42,  2.54it/s][A
Training:  61%|██████    | 164/269 [00:57<00:35,  2.97it/s][A
Training:  61%|██████▏   | 165/269 [00:58<00:33,  3.06it/s][A
Training:  62%|██████▏   | 166/269 [00:58<00:39,  2.58it/s][A
Training:  62%|██████▏   | 168/269 [00:59<00:32,  3.10it/s][A
Training:  63%|██████▎   | 169/269 [00:59<00:31,  3.17it/s][A
Training:  63%|██████▎   | 170/269 [00:59<00:37,  2.61it/s][A
Training:  64%|██████▍   | 172/269 [01:00<00:36,  2.67it/s][A
Training:  64%|██████▍   | 173/269 [01:01<00:35,  2.74it/s][A
Training:  65%|██████▍   | 174/269 [01:01<00:38,  2.48it/s][A
Training:  65%|██████▌   | 176/269 [01:02<00:35,  2.60it/s][A
Training:  66%|██████▌   | 177/269 [01:02<00:33,  2.78it/s][A
Training:  66%|██████▌   | 178/269 [01:03<00:37,  2.46it/s][A
Training:  67%|██████▋   | 180/269 [01:03<00:35,  2.52it/s][A
Training:  68%|██████▊   | 182/269 [01:04<00:32,  2.64i

Epoch: 3/96 - Loss: 11559.5684 - Accuracy: 0.8915



  0%|          | 0/34 [00:00<?, ?it/s][A
  3%|▎         | 1/34 [00:01<00:50,  1.54s/it][A
  6%|▌         | 2/34 [00:01<00:24,  1.29it/s][A
 12%|█▏        | 4/34 [00:01<00:10,  2.97it/s][A
 15%|█▍        | 5/34 [00:02<00:13,  2.17it/s][A
 18%|█▊        | 6/34 [00:02<00:11,  2.52it/s][A
 26%|██▋       | 9/34 [00:03<00:09,  2.73it/s][A
 29%|██▉       | 10/34 [00:04<00:07,  3.09it/s][A
 38%|███▊      | 13/34 [00:05<00:06,  3.09it/s][A
 41%|████      | 14/34 [00:05<00:06,  3.08it/s][A
 50%|█████     | 17/34 [00:06<00:05,  3.17it/s][A
 53%|█████▎    | 18/34 [00:06<00:04,  3.51it/s][A
 62%|██████▏   | 21/34 [00:07<00:04,  3.20it/s][A
 65%|██████▍   | 22/34 [00:07<00:03,  3.45it/s][A
 74%|███████▎  | 25/34 [00:08<00:02,  3.15it/s][A
 76%|███████▋  | 26/34 [00:08<00:02,  3.41it/s][A
 82%|████████▏ | 28/34 [00:09<00:01,  4.39it/s][A
 85%|████████▌ | 29/34 [00:09<00:01,  3.10it/s][A
 88%|████████▊ | 30/34 [00:10<00:01,  3.20it/s][A
100%|██████████| 34/34 [00:11<00:00,  3.08it/

Val Loss: 10657.3789 - Val Accuracy: 0.9070



Training:   0%|          | 0/269 [00:00<?, ?it/s][A
Training:   0%|          | 1/269 [00:01<08:24,  1.88s/it][A
Training:   1%|          | 2/269 [00:02<03:51,  1.15it/s][A
Training:   1%|▏         | 4/269 [00:02<01:40,  2.63it/s][A
Training:   2%|▏         | 5/269 [00:03<02:37,  1.68it/s][A
Training:   3%|▎         | 7/269 [00:03<01:30,  2.89it/s][A
Training:   3%|▎         | 8/269 [00:03<01:16,  3.43it/s][A
Training:   3%|▎         | 9/269 [00:04<02:11,  1.97it/s][A
Training:   4%|▍         | 11/269 [00:04<01:23,  3.10it/s][A
Training:   5%|▍         | 13/269 [00:06<01:50,  2.31it/s][A
Training:   5%|▌         | 14/269 [00:06<01:34,  2.69it/s][A
Training:   6%|▌         | 15/269 [00:06<01:18,  3.23it/s][A
Training:   6%|▋         | 17/269 [00:07<01:36,  2.61it/s][A
Training:   7%|▋         | 18/269 [00:07<01:30,  2.77it/s][A
Training:   7%|▋         | 20/269 [00:07<01:01,  4.05it/s][A
Training:   8%|▊         | 21/269 [00:08<01:38,  2.52it/s][A
Training:   8%|▊       

Training: 100%|██████████| 269/269 [01:34<00:00,  3.03it/s][A
                                                           [A

Epoch: 4/96 - Loss: 11497.3789 - Accuracy: 0.9062



  0%|          | 0/34 [00:00<?, ?it/s][A
  3%|▎         | 1/34 [00:02<01:05,  1.99s/it][A
  9%|▉         | 3/34 [00:02<00:17,  1.80it/s][A
 15%|█▍        | 5/34 [00:03<00:16,  1.72it/s][A
 21%|██        | 7/34 [00:03<00:09,  2.75it/s][A
 26%|██▋       | 9/34 [00:04<00:10,  2.30it/s][A
 35%|███▌      | 12/34 [00:04<00:05,  3.89it/s][A
 41%|████      | 14/34 [00:05<00:07,  2.76it/s][A
 47%|████▋     | 16/34 [00:06<00:04,  3.68it/s][A
 53%|█████▎    | 18/34 [00:07<00:05,  2.91it/s][A
 62%|██████▏   | 21/34 [00:08<00:04,  2.85it/s][A
 74%|███████▎  | 25/34 [00:09<00:02,  3.06it/s][A
 85%|████████▌ | 29/34 [00:10<00:01,  3.22it/s][A
100%|██████████| 34/34 [00:11<00:00,  2.92it/s][A
Epochs:   4%|▍         | 4/96 [07:05<2:43:09, 106.41s/it]

Val Loss: 9936.2910 - Val Accuracy: 0.9083



Training:   0%|          | 0/269 [00:00<?, ?it/s][A
Training:   0%|          | 1/269 [00:01<07:47,  1.75s/it][A
Training:   1%|          | 3/269 [00:01<02:15,  1.96it/s][A
Training:   1%|▏         | 4/269 [00:02<01:38,  2.68it/s][A
Training:   2%|▏         | 5/269 [00:03<02:32,  1.73it/s][A
Training:   2%|▏         | 6/269 [00:03<01:53,  2.31it/s][A
Training:   3%|▎         | 8/269 [00:03<01:16,  3.42it/s][A
Training:   3%|▎         | 9/269 [00:04<02:18,  1.88it/s][A
Training:   4%|▍         | 12/269 [00:04<01:17,  3.33it/s][A
Training:   5%|▍         | 13/269 [00:06<02:07,  2.00it/s][A
Training:   6%|▌         | 16/269 [00:06<01:22,  3.05it/s][A
Training:   6%|▋         | 17/269 [00:07<01:54,  2.20it/s][A
Training:   7%|▋         | 19/269 [00:07<01:19,  3.14it/s][A
Training:   7%|▋         | 20/269 [00:08<01:21,  3.05it/s][A
Training:   8%|▊         | 21/269 [00:08<01:46,  2.32it/s][A
Training:   9%|▊         | 23/269 [00:08<01:10,  3.51it/s][A
Training:   9%|▉       

Training:  77%|███████▋  | 207/269 [01:15<00:25,  2.45it/s][A
Training:  78%|███████▊  | 209/269 [01:15<00:19,  3.14it/s][A
Training:  78%|███████▊  | 211/269 [01:16<00:22,  2.60it/s][A
Training:  79%|███████▉  | 213/269 [01:16<00:17,  3.17it/s][A
Training:  80%|███████▉  | 215/269 [01:18<00:21,  2.47it/s][A
Training:  81%|████████  | 217/269 [01:18<00:17,  3.02it/s][A
Training:  81%|████████▏ | 219/269 [01:19<00:18,  2.71it/s][A
Training:  82%|████████▏ | 221/269 [01:19<00:15,  3.16it/s][A
Training:  83%|████████▎ | 223/269 [01:20<00:17,  2.66it/s][A
Training:  84%|████████▎ | 225/269 [01:21<00:14,  3.09it/s][A
Training:  84%|████████▍ | 227/269 [01:22<00:15,  2.67it/s][A
Training:  85%|████████▌ | 229/269 [01:22<00:12,  3.08it/s][A
Training:  86%|████████▌ | 231/269 [01:23<00:13,  2.88it/s][A
Training:  87%|████████▋ | 233/269 [01:23<00:11,  3.12it/s][A
Training:  87%|████████▋ | 235/269 [01:24<00:11,  2.84it/s][A
Training:  88%|████████▊ | 237/269 [01:25<00:09,  3.30i

Epoch: 5/96 - Loss: 10663.1133 - Accuracy: 0.9040



  0%|          | 0/34 [00:00<?, ?it/s][A
  3%|▎         | 1/34 [00:01<01:02,  1.88s/it][A
  6%|▌         | 2/34 [00:02<00:27,  1.15it/s][A
  9%|▉         | 3/34 [00:02<00:16,  1.94it/s][A
 15%|█▍        | 5/34 [00:03<00:15,  1.89it/s][A
 18%|█▊        | 6/34 [00:03<00:12,  2.20it/s][A
 24%|██▎       | 8/34 [00:03<00:07,  3.66it/s][A
 26%|██▋       | 9/34 [00:04<00:10,  2.44it/s][A
 29%|██▉       | 10/34 [00:04<00:09,  2.61it/s][A
 35%|███▌      | 12/34 [00:04<00:05,  3.94it/s][A
 38%|███▊      | 13/34 [00:05<00:08,  2.36it/s][A
 41%|████      | 14/34 [00:06<00:07,  2.64it/s][A
 47%|████▋     | 16/34 [00:06<00:04,  4.12it/s][A
 50%|█████     | 17/34 [00:07<00:06,  2.56it/s][A
 53%|█████▎    | 18/34 [00:07<00:05,  2.85it/s][A
 62%|██████▏   | 21/34 [00:08<00:04,  2.91it/s][A
 65%|██████▍   | 22/34 [00:08<00:03,  3.04it/s][A
 71%|███████   | 24/34 [00:08<00:02,  4.26it/s][A
 74%|███████▎  | 25/34 [00:09<00:03,  2.54it/s][A
 76%|███████▋  | 26/34 [00:09<00:02,  2.97it/s

Val Loss: 10492.3398 - Val Accuracy: 0.8980



Training:   0%|          | 0/269 [00:00<?, ?it/s][A
Training:   0%|          | 1/269 [00:01<08:40,  1.94s/it][A
Training:   2%|▏         | 5/269 [00:03<02:26,  1.80it/s][A
Training:   3%|▎         | 7/269 [00:03<01:36,  2.72it/s][A
Training:   3%|▎         | 9/269 [00:04<02:00,  2.16it/s][A
Training:   4%|▍         | 11/269 [00:04<01:26,  2.99it/s][A
Training:   5%|▍         | 13/269 [00:05<01:48,  2.35it/s][A
Training:   5%|▌         | 14/269 [00:06<01:33,  2.74it/s][A
Training:   6%|▌         | 16/269 [00:06<01:05,  3.86it/s][A
Training:   7%|▋         | 18/269 [00:07<01:40,  2.50it/s][A
Training:   7%|▋         | 20/269 [00:07<01:13,  3.41it/s][A
Training:   8%|▊         | 21/269 [00:08<01:52,  2.20it/s][A
Training:   9%|▉         | 24/269 [00:09<01:07,  3.64it/s][A
Training:  10%|▉         | 26/269 [00:10<01:35,  2.55it/s][A
Training:  10%|█         | 28/269 [00:10<01:11,  3.35it/s][A
Training:  11%|█         | 29/269 [00:11<01:46,  2.26it/s][A
Training:  12%|█▏   

Epoch: 6/96 - Loss: 11284.5234 - Accuracy: 0.9041



  0%|          | 0/34 [00:00<?, ?it/s][A
  3%|▎         | 1/34 [00:01<01:03,  1.93s/it][A
  9%|▉         | 3/34 [00:02<00:16,  1.85it/s][A
 15%|█▍        | 5/34 [00:03<00:16,  1.71it/s][A
 21%|██        | 7/34 [00:03<00:09,  2.77it/s][A
 26%|██▋       | 9/34 [00:04<00:10,  2.31it/s][A
 35%|███▌      | 12/34 [00:04<00:05,  3.91it/s][A
 41%|████      | 14/34 [00:05<00:07,  2.64it/s][A
 50%|█████     | 17/34 [00:07<00:06,  2.54it/s][A
 56%|█████▌    | 19/34 [00:07<00:04,  3.28it/s][A
 62%|██████▏   | 21/34 [00:08<00:04,  2.62it/s][A
 71%|███████   | 24/34 [00:08<00:02,  3.96it/s][A
 76%|███████▋  | 26/34 [00:09<00:02,  2.90it/s][A
 82%|████████▏ | 28/34 [00:09<00:01,  3.68it/s][A
 88%|████████▊ | 30/34 [00:11<00:01,  2.90it/s][A
100%|██████████| 34/34 [00:12<00:00,  2.78it/s][A
Epochs:   6%|▋         | 6/96 [10:42<2:41:18, 107.54s/it]

Val Loss: 10406.8262 - Val Accuracy: 0.9195



Training:   0%|          | 0/269 [00:00<?, ?it/s][A
Training:   0%|          | 1/269 [00:01<07:54,  1.77s/it][A
Training:   1%|▏         | 4/269 [00:02<01:46,  2.50it/s][A
Training:   2%|▏         | 5/269 [00:03<02:47,  1.57it/s][A
Training:   3%|▎         | 7/269 [00:03<01:39,  2.64it/s][A
Training:   3%|▎         | 8/269 [00:03<01:22,  3.15it/s][A
Training:   3%|▎         | 9/269 [00:04<02:12,  1.96it/s][A
Training:   4%|▍         | 11/269 [00:04<01:22,  3.12it/s][A
Training:   4%|▍         | 12/269 [00:04<01:10,  3.63it/s][A
Training:   5%|▍         | 13/269 [00:05<01:43,  2.48it/s][A
Training:   6%|▌         | 15/269 [00:05<01:06,  3.84it/s][A
Training:   6%|▌         | 16/269 [00:05<00:59,  4.23it/s][A
Training:   6%|▋         | 17/269 [00:06<01:46,  2.36it/s][A
Training:   7%|▋         | 18/269 [00:07<01:43,  2.43it/s][A
Training:   8%|▊         | 21/269 [00:08<01:39,  2.49it/s][A
Training:   8%|▊         | 22/269 [00:08<01:31,  2.70it/s][A
Training:   9%|▉      

Training:  79%|███████▉  | 213/269 [01:16<00:20,  2.78it/s][A
Training:  80%|███████▉  | 214/269 [01:16<00:21,  2.62it/s][A
Training:  80%|███████▉  | 215/269 [01:16<00:17,  3.06it/s][A
Training:  81%|████████  | 217/269 [01:17<00:19,  2.70it/s][A
Training:  81%|████████  | 218/269 [01:18<00:19,  2.57it/s][A
Training:  82%|████████▏ | 221/269 [01:18<00:16,  2.99it/s][A
Training:  83%|████████▎ | 222/269 [01:19<00:16,  2.78it/s][A
Training:  83%|████████▎ | 224/269 [01:19<00:11,  3.91it/s][A
Training:  84%|████████▎ | 225/269 [01:20<00:15,  2.87it/s][A
Training:  84%|████████▍ | 226/269 [01:20<00:16,  2.56it/s][A
Training:  85%|████████▍ | 228/269 [01:20<00:11,  3.66it/s][A
Training:  85%|████████▌ | 229/269 [01:21<00:15,  2.63it/s][A
Training:  86%|████████▌ | 230/269 [01:22<00:15,  2.57it/s][A
Training:  87%|████████▋ | 233/269 [01:22<00:12,  2.92it/s][A
Training:  87%|████████▋ | 234/269 [01:23<00:12,  2.85it/s][A
Training:  87%|████████▋ | 235/269 [01:23<00:10,  3.33i

Epoch: 7/96 - Loss: 12301.7920 - Accuracy: 0.9053



  0%|          | 0/34 [00:00<?, ?it/s][A
  3%|▎         | 1/34 [00:01<00:57,  1.74s/it][A
 12%|█▏        | 4/34 [00:01<00:11,  2.72it/s][A
 18%|█▊        | 6/34 [00:03<00:13,  2.10it/s][A
 26%|██▋       | 9/34 [00:04<00:11,  2.26it/s][A
 35%|███▌      | 12/34 [00:04<00:06,  3.58it/s][A
 41%|████      | 14/34 [00:05<00:06,  2.86it/s][A
 47%|████▋     | 16/34 [00:05<00:05,  3.56it/s][A
 50%|█████     | 17/34 [00:06<00:07,  2.40it/s][A
 59%|█████▉    | 20/34 [00:07<00:03,  3.56it/s][A
 62%|██████▏   | 21/34 [00:08<00:05,  2.55it/s][A
 71%|███████   | 24/34 [00:08<00:02,  3.63it/s][A
 74%|███████▎  | 25/34 [00:09<00:03,  2.78it/s][A
 79%|███████▉  | 27/34 [00:09<00:01,  3.72it/s][A
 82%|████████▏ | 28/34 [00:09<00:01,  3.79it/s][A
 85%|████████▌ | 29/34 [00:10<00:01,  2.72it/s][A
 94%|█████████▍| 32/34 [00:10<00:00,  3.94it/s][A
100%|██████████| 34/34 [00:11<00:00,  2.95it/s][A
Epochs:   7%|▋         | 7/96 [12:28<2:39:00, 107.19s/it]

Val Loss: 13859.2910 - Val Accuracy: 0.9080



Training:   0%|          | 0/269 [00:00<?, ?it/s][A
Training:   0%|          | 1/269 [00:01<08:23,  1.88s/it][A
Training:   1%|          | 3/269 [00:02<02:36,  1.70it/s][A
Training:   2%|▏         | 5/269 [00:03<02:21,  1.86it/s][A
Training:   2%|▏         | 6/269 [00:03<01:58,  2.22it/s][A
Training:   3%|▎         | 8/269 [00:03<01:14,  3.50it/s][A
Training:   3%|▎         | 9/269 [00:04<01:57,  2.22it/s][A
Training:   4%|▎         | 10/269 [00:04<01:36,  2.69it/s][A
Training:   4%|▍         | 12/269 [00:04<01:07,  3.83it/s][A
Training:   5%|▍         | 13/269 [00:05<01:34,  2.70it/s][A
Training:   5%|▌         | 14/269 [00:05<01:31,  2.79it/s][A
Training:   6%|▌         | 16/269 [00:06<01:06,  3.83it/s][A
Training:   6%|▋         | 17/269 [00:06<01:39,  2.53it/s][A
Training:   7%|▋         | 18/269 [00:07<01:35,  2.63it/s][A
Training:   7%|▋         | 20/269 [00:07<01:04,  3.85it/s][A
Training:   8%|▊         | 21/269 [00:08<01:34,  2.64it/s][A
Training:   8%|▊      

Training:  72%|███████▏  | 193/269 [01:07<00:21,  3.58it/s][A
Training:  72%|███████▏  | 195/269 [01:08<00:29,  2.52it/s][A
Training:  73%|███████▎  | 197/269 [01:08<00:21,  3.42it/s][A
Training:  74%|███████▍  | 199/269 [01:10<00:28,  2.45it/s][A
Training:  75%|███████▌  | 202/269 [01:10<00:17,  3.80it/s][A
Training:  76%|███████▌  | 204/269 [01:11<00:24,  2.68it/s][A
Training:  77%|███████▋  | 207/269 [01:12<00:24,  2.49it/s][A
Training:  78%|███████▊  | 210/269 [01:13<00:16,  3.63it/s][A
Training:  79%|███████▉  | 212/269 [01:14<00:22,  2.58it/s][A
Training:  80%|███████▉  | 215/269 [01:15<00:21,  2.46it/s][A
Training:  81%|████████  | 217/269 [01:15<00:16,  3.14it/s][A
Training:  81%|████████▏ | 219/269 [01:17<00:20,  2.46it/s][A
Training:  82%|████████▏ | 221/269 [01:17<00:14,  3.21it/s][A
Training:  83%|████████▎ | 223/269 [01:18<00:18,  2.48it/s][A
Training:  84%|████████▎ | 225/269 [01:18<00:13,  3.25it/s][A
Training:  84%|████████▍ | 227/269 [01:19<00:16,  2.61i

Epoch: 8/96 - Loss: 11976.6318 - Accuracy: 0.9080



  0%|          | 0/34 [00:00<?, ?it/s][A
  3%|▎         | 1/34 [00:01<01:05,  1.98s/it][A
  9%|▉         | 3/34 [00:02<00:17,  1.80it/s][A
 15%|█▍        | 5/34 [00:03<00:16,  1.77it/s][A
 21%|██        | 7/34 [00:03<00:09,  2.86it/s][A
 26%|██▋       | 9/34 [00:04<00:10,  2.32it/s][A
 32%|███▏      | 11/34 [00:04<00:07,  3.18it/s][A
 38%|███▊      | 13/34 [00:05<00:08,  2.49it/s][A
 47%|████▋     | 16/34 [00:06<00:04,  3.91it/s][A
 53%|█████▎    | 18/34 [00:07<00:05,  3.01it/s][A
 59%|█████▉    | 20/34 [00:07<00:03,  3.84it/s][A
 62%|██████▏   | 21/34 [00:08<00:05,  2.60it/s][A
 68%|██████▊   | 23/34 [00:08<00:03,  3.47it/s][A
 74%|███████▎  | 25/34 [00:09<00:03,  2.69it/s][A
 79%|███████▉  | 27/34 [00:09<00:02,  3.47it/s][A
 85%|████████▌ | 29/34 [00:10<00:01,  2.81it/s][A
 91%|█████████ | 31/34 [00:10<00:00,  3.55it/s][A
100%|██████████| 34/34 [00:11<00:00,  2.87it/s][A
Epochs:   8%|▊         | 8/96 [14:14<2:36:23, 106.63s/it]

Val Loss: 14442.1895 - Val Accuracy: 0.9300



Training:   0%|          | 0/269 [00:00<?, ?it/s][A
Training:   0%|          | 1/269 [00:02<09:34,  2.14s/it][A
Training:   1%|          | 3/269 [00:02<02:46,  1.60it/s][A
Training:   2%|▏         | 5/269 [00:03<02:29,  1.76it/s][A
Training:   3%|▎         | 7/269 [00:03<01:42,  2.57it/s][A
Training:   3%|▎         | 9/269 [00:04<02:02,  2.12it/s][A
Training:   4%|▍         | 11/269 [00:05<01:28,  2.90it/s][A
Training:   5%|▍         | 13/269 [00:06<01:54,  2.25it/s][A
Training:   6%|▌         | 15/269 [00:06<01:26,  2.92it/s][A
Training:   6%|▋         | 17/269 [00:07<01:44,  2.42it/s][A
Training:   7%|▋         | 19/269 [00:07<01:18,  3.19it/s][A
Training:   8%|▊         | 21/269 [00:09<01:34,  2.63it/s][A
Training:   9%|▊         | 23/269 [00:09<01:12,  3.40it/s][A
Training:   9%|▉         | 25/269 [00:10<01:33,  2.61it/s][A
Training:  10%|█         | 27/269 [00:10<01:09,  3.50it/s][A
Training:  11%|█         | 29/269 [00:11<01:35,  2.52it/s][A
Training:  12%|█▏    

Training:  95%|█████████▍| 255/269 [01:30<00:05,  2.48it/s][A
Training:  96%|█████████▌| 257/269 [01:30<00:03,  3.15it/s][A
Training:  96%|█████████▋| 259/269 [01:31<00:03,  2.62it/s][A
Training:  97%|█████████▋| 261/269 [01:32<00:02,  3.51it/s][A
Training:  98%|█████████▊| 263/269 [01:33<00:02,  2.57it/s][A
Training:  99%|█████████▉| 266/269 [01:33<00:00,  3.88it/s][A
Training:  99%|█████████▉| 267/269 [01:34<00:00,  2.67it/s][A
                                                           [A

Epoch: 9/96 - Loss: 12770.1318 - Accuracy: 0.9099



  0%|          | 0/34 [00:00<?, ?it/s][A
  3%|▎         | 1/34 [00:01<00:53,  1.62s/it][A
  9%|▉         | 3/34 [00:01<00:15,  2.04it/s][A
 15%|█▍        | 5/34 [00:02<00:14,  1.97it/s][A
 18%|█▊        | 6/34 [00:02<00:11,  2.50it/s][A
 21%|██        | 7/34 [00:03<00:08,  3.10it/s][A
 26%|██▋       | 9/34 [00:04<00:09,  2.60it/s][A
 32%|███▏      | 11/34 [00:04<00:07,  3.09it/s][A
 38%|███▊      | 13/34 [00:05<00:07,  2.82it/s][A
 44%|████▍     | 15/34 [00:05<00:05,  3.30it/s][A
 50%|█████     | 17/34 [00:06<00:05,  3.06it/s][A
 53%|█████▎    | 18/34 [00:06<00:04,  3.52it/s][A
 56%|█████▌    | 19/34 [00:07<00:04,  3.11it/s][A
 62%|██████▏   | 21/34 [00:07<00:04,  3.07it/s][A
 68%|██████▊   | 23/34 [00:08<00:03,  3.43it/s][A
 74%|███████▎  | 25/34 [00:08<00:02,  3.01it/s][A
 79%|███████▉  | 27/34 [00:09<00:02,  3.14it/s][A
 85%|████████▌ | 29/34 [00:10<00:01,  3.01it/s][A
 91%|█████████ | 31/34 [00:10<00:00,  3.32it/s][A
100%|██████████| 34/34 [00:11<00:00,  2.96it/

Val Loss: 12055.6992 - Val Accuracy: 0.8450



Training:   0%|          | 0/269 [00:00<?, ?it/s][A
Training:   0%|          | 1/269 [00:01<08:34,  1.92s/it][A
Training:   1%|          | 2/269 [00:02<04:11,  1.06it/s][A
Training:   1%|▏         | 4/269 [00:02<01:41,  2.60it/s][A
Training:   2%|▏         | 5/269 [00:03<02:40,  1.65it/s][A
Training:   3%|▎         | 7/269 [00:03<01:35,  2.75it/s][A
Training:   3%|▎         | 9/269 [00:04<02:04,  2.09it/s][A
Training:   4%|▍         | 11/269 [00:04<01:23,  3.07it/s][A
Training:   5%|▍         | 13/269 [00:06<01:51,  2.30it/s][A
Training:   5%|▌         | 14/269 [00:06<01:38,  2.58it/s][A
Training:   6%|▋         | 17/269 [00:07<01:38,  2.57it/s][A
Training:   7%|▋         | 18/269 [00:07<01:31,  2.75it/s][A
Training:   7%|▋         | 19/269 [00:07<01:17,  3.21it/s][A
Training:   8%|▊         | 21/269 [00:09<01:39,  2.50it/s][A
Training:   8%|▊         | 22/269 [00:09<01:31,  2.71it/s][A
Training:   9%|▊         | 23/269 [00:09<01:20,  3.05it/s][A
Training:   9%|▉      

Training:  70%|███████   | 189/269 [01:06<00:24,  3.25it/s][A
Training:  71%|███████   | 190/269 [01:07<00:28,  2.73it/s][A
Training:  71%|███████   | 191/269 [01:07<00:24,  3.23it/s][A
Training:  72%|███████▏  | 193/269 [01:08<00:23,  3.23it/s][A
Training:  72%|███████▏  | 194/269 [01:08<00:26,  2.79it/s][A
Training:  72%|███████▏  | 195/269 [01:08<00:23,  3.17it/s][A
Training:  73%|███████▎  | 197/269 [01:09<00:21,  3.36it/s][A
Training:  74%|███████▎  | 198/269 [01:09<00:24,  2.87it/s][A
Training:  74%|███████▍  | 199/269 [01:10<00:20,  3.45it/s][A
Training:  75%|███████▍  | 201/269 [01:10<00:19,  3.44it/s][A
Training:  75%|███████▌  | 202/269 [01:11<00:23,  2.88it/s][A
Training:  76%|███████▌  | 204/269 [01:11<00:15,  4.17it/s][A
Training:  76%|███████▌  | 205/269 [01:11<00:21,  2.99it/s][A
Training:  77%|███████▋  | 206/269 [01:12<00:27,  2.30it/s][A
Training:  77%|███████▋  | 208/269 [01:12<00:17,  3.53it/s][A
Training:  78%|███████▊  | 209/269 [01:13<00:20,  2.94i

Epoch: 10/96 - Loss: 12294.2969 - Accuracy: 0.9096



  0%|          | 0/34 [00:00<?, ?it/s][A
  3%|▎         | 1/34 [00:01<00:58,  1.78s/it][A
  9%|▉         | 3/34 [00:01<00:16,  1.88it/s][A
 15%|█▍        | 5/34 [00:02<00:14,  2.05it/s][A
 21%|██        | 7/34 [00:03<00:08,  3.23it/s][A
 24%|██▎       | 8/34 [00:03<00:07,  3.71it/s][A
 26%|██▋       | 9/34 [00:04<00:10,  2.28it/s][A
 32%|███▏      | 11/34 [00:04<00:06,  3.60it/s][A
 38%|███▊      | 13/34 [00:05<00:07,  2.70it/s][A
 41%|████      | 14/34 [00:05<00:06,  3.17it/s][A
 47%|████▋     | 16/34 [00:05<00:03,  4.50it/s][A
 53%|█████▎    | 18/34 [00:06<00:05,  3.13it/s][A
 59%|█████▉    | 20/34 [00:06<00:03,  4.24it/s][A
 62%|██████▏   | 21/34 [00:07<00:04,  2.72it/s][A
 68%|██████▊   | 23/34 [00:07<00:02,  3.90it/s][A
 74%|███████▎  | 25/34 [00:08<00:03,  2.80it/s][A
 82%|████████▏ | 28/34 [00:08<00:01,  4.25it/s][A
 88%|████████▊ | 30/34 [00:10<00:01,  3.00it/s][A
 94%|█████████▍| 32/34 [00:10<00:00,  3.88it/s][A
100%|██████████| 34/34 [00:11<00:00,  3.06it/

Val Loss: 12735.8809 - Val Accuracy: 0.9044



Training:   0%|          | 0/269 [00:00<?, ?it/s][A
Training:   0%|          | 1/269 [00:02<09:00,  2.02s/it][A
Training:   1%|▏         | 4/269 [00:02<02:03,  2.15it/s][A
Training:   2%|▏         | 5/269 [00:03<02:47,  1.58it/s][A
Training:   3%|▎         | 8/269 [00:03<01:27,  2.98it/s][A
Training:   3%|▎         | 9/269 [00:04<02:06,  2.05it/s][A
Training:   4%|▎         | 10/269 [00:04<01:44,  2.49it/s][A
Training:   4%|▍         | 12/269 [00:05<01:10,  3.64it/s][A
Training:   5%|▍         | 13/269 [00:06<02:07,  2.01it/s][A
Training:   6%|▌         | 15/269 [00:06<01:23,  3.04it/s][A
Training:   6%|▌         | 16/269 [00:06<01:15,  3.37it/s][A
Training:   6%|▋         | 17/269 [00:07<01:55,  2.17it/s][A
Training:   7%|▋         | 20/269 [00:07<01:12,  3.44it/s][A
Training:   8%|▊         | 21/269 [00:09<01:56,  2.13it/s][A
Training:   9%|▊         | 23/269 [00:09<01:19,  3.10it/s][A
Training:   9%|▉         | 24/269 [00:09<01:15,  3.26it/s][A
Training:   9%|▉     

                                                           [A

Epoch: 11/96 - Loss: 12599.0166 - Accuracy: 0.9114



  0%|          | 0/34 [00:00<?, ?it/s][A
  3%|▎         | 1/34 [00:01<01:05,  1.98s/it][A
 12%|█▏        | 4/34 [00:02<00:13,  2.19it/s][A
 15%|█▍        | 5/34 [00:03<00:15,  1.82it/s][A
 18%|█▊        | 6/34 [00:03<00:12,  2.28it/s][A
 24%|██▎       | 8/34 [00:03<00:07,  3.56it/s][A
 26%|██▋       | 9/34 [00:04<00:10,  2.40it/s][A
 29%|██▉       | 10/34 [00:04<00:08,  2.68it/s][A
 35%|███▌      | 12/34 [00:04<00:05,  4.20it/s][A
 38%|███▊      | 13/34 [00:05<00:07,  2.80it/s][A
 41%|████      | 14/34 [00:05<00:06,  2.99it/s][A
 50%|█████     | 17/34 [00:06<00:04,  3.41it/s][A
 53%|█████▎    | 18/34 [00:06<00:04,  3.27it/s][A
 62%|██████▏   | 21/34 [00:07<00:03,  3.30it/s][A
 65%|██████▍   | 22/34 [00:07<00:03,  3.48it/s][A
 71%|███████   | 24/34 [00:07<00:02,  4.74it/s][A
 74%|███████▎  | 25/34 [00:09<00:03,  2.67it/s][A
 82%|████████▏ | 28/34 [00:09<00:01,  4.24it/s][A
 85%|████████▌ | 29/34 [00:10<00:01,  2.96it/s][A
 88%|████████▊ | 30/34 [00:10<00:01,  3.44it/

Val Loss: 12677.6953 - Val Accuracy: 0.9318



Training:   0%|          | 0/269 [00:00<?, ?it/s][A
Training:   0%|          | 1/269 [00:02<09:30,  2.13s/it][A
Training:   2%|▏         | 5/269 [00:03<02:45,  1.59it/s][A
Training:   3%|▎         | 7/269 [00:03<01:50,  2.36it/s][A
Training:   3%|▎         | 9/269 [00:04<02:06,  2.05it/s][A
Training:   4%|▍         | 11/269 [00:05<01:29,  2.87it/s][A
Training:   5%|▍         | 13/269 [00:06<01:50,  2.32it/s][A
Training:   5%|▌         | 14/269 [00:06<01:39,  2.55it/s][A
Training:   6%|▋         | 17/269 [00:07<01:43,  2.44it/s][A
Training:   7%|▋         | 18/269 [00:08<01:42,  2.45it/s][A
Training:   7%|▋         | 20/269 [00:08<01:12,  3.43it/s][A
Training:   8%|▊         | 21/269 [00:09<01:40,  2.46it/s][A
Training:   8%|▊         | 22/269 [00:09<01:39,  2.47it/s][A
Training:   9%|▉         | 25/269 [00:10<01:32,  2.64it/s][A
Training:  10%|▉         | 26/269 [00:11<01:43,  2.34it/s][A
Training:  10%|█         | 28/269 [00:11<01:12,  3.31it/s][A
Training:  11%|█    

Training:  77%|███████▋  | 206/269 [01:14<00:27,  2.27it/s][A
Training:  78%|███████▊  | 209/269 [01:14<00:18,  3.24it/s][A
Training:  78%|███████▊  | 210/269 [01:15<00:23,  2.56it/s][A
Training:  79%|███████▉  | 213/269 [01:16<00:16,  3.40it/s][A
Training:  80%|███████▉  | 214/269 [01:16<00:21,  2.60it/s][A
Training:  81%|████████  | 217/269 [01:17<00:14,  3.56it/s][A
Training:  81%|████████  | 218/269 [01:18<00:19,  2.66it/s][A
Training:  82%|████████▏ | 221/269 [01:18<00:13,  3.49it/s][A
Training:  83%|████████▎ | 222/269 [01:19<00:17,  2.75it/s][A
Training:  83%|████████▎ | 224/269 [01:19<00:12,  3.75it/s][A
Training:  84%|████████▎ | 225/269 [01:20<00:14,  3.14it/s][A
Training:  84%|████████▍ | 226/269 [01:20<00:17,  2.46it/s][A
Training:  85%|████████▍ | 228/269 [01:20<00:11,  3.60it/s][A
Training:  85%|████████▌ | 229/269 [01:21<00:12,  3.11it/s][A
Training:  86%|████████▌ | 230/269 [01:22<00:15,  2.51it/s][A
Training:  87%|████████▋ | 233/269 [01:22<00:10,  3.41i

Epoch: 12/96 - Loss: 12779.9326 - Accuracy: 0.9112



  0%|          | 0/34 [00:00<?, ?it/s][A
  3%|▎         | 1/34 [00:02<01:06,  2.00s/it][A
 12%|█▏        | 4/34 [00:02<00:12,  2.42it/s][A
 18%|█▊        | 6/34 [00:03<00:13,  2.15it/s][A
 26%|██▋       | 9/34 [00:04<00:10,  2.40it/s][A
 35%|███▌      | 12/34 [00:04<00:05,  3.73it/s][A
 41%|████      | 14/34 [00:05<00:07,  2.82it/s][A
 50%|█████     | 17/34 [00:06<00:06,  2.73it/s][A
 56%|█████▌    | 19/34 [00:06<00:04,  3.50it/s][A
 62%|██████▏   | 21/34 [00:08<00:04,  2.72it/s][A
 68%|██████▊   | 23/34 [00:08<00:03,  3.57it/s][A
 74%|███████▎  | 25/34 [00:08<00:02,  3.19it/s][A
 85%|████████▌ | 29/34 [00:09<00:01,  3.47it/s][A
 91%|█████████ | 31/34 [00:10<00:00,  4.32it/s][A
100%|██████████| 34/34 [00:11<00:00,  3.06it/s][A
Epochs:  12%|█▎        | 12/96 [21:19<2:29:09, 106.54s/it]

Val Loss: 13374.9600 - Val Accuracy: 0.9054



Training:   0%|          | 0/269 [00:00<?, ?it/s][A
Training:   0%|          | 1/269 [00:01<08:52,  1.99s/it][A
Training:   1%|          | 3/269 [00:02<02:30,  1.76it/s][A
Training:   1%|▏         | 4/269 [00:02<01:48,  2.45it/s][A
Training:   2%|▏         | 5/269 [00:03<02:41,  1.63it/s][A
Training:   2%|▏         | 6/269 [00:03<02:17,  1.92it/s][A
Training:   3%|▎         | 8/269 [00:03<01:17,  3.36it/s][A
Training:   3%|▎         | 9/269 [00:04<02:03,  2.11it/s][A
Training:   4%|▎         | 10/269 [00:05<02:03,  2.10it/s][A
Training:   5%|▍         | 13/269 [00:06<01:37,  2.63it/s][A
Training:   5%|▌         | 14/269 [00:06<01:45,  2.42it/s][A
Training:   6%|▌         | 16/269 [00:06<01:13,  3.46it/s][A
Training:   6%|▋         | 17/269 [00:07<01:42,  2.45it/s][A
Training:   7%|▋         | 18/269 [00:08<01:41,  2.48it/s][A
Training:   7%|▋         | 20/269 [00:08<01:06,  3.73it/s][A
Training:   8%|▊         | 21/269 [00:08<01:29,  2.78it/s][A
Training:   8%|▊       

Training:  83%|████████▎ | 224/269 [01:20<00:13,  3.23it/s][A
Training:  84%|████████▎ | 225/269 [01:20<00:12,  3.57it/s][A
Training:  84%|████████▍ | 226/269 [01:21<00:18,  2.37it/s][A
Training:  85%|████████▍ | 228/269 [01:21<00:12,  3.38it/s][A
Training:  86%|████████▌ | 230/269 [01:22<00:15,  2.52it/s][A
Training:  86%|████████▌ | 232/269 [01:22<00:10,  3.38it/s][A
Training:  87%|████████▋ | 234/269 [01:24<00:14,  2.46it/s][A
Training:  88%|████████▊ | 237/269 [01:24<00:08,  3.90it/s][A
Training:  89%|████████▉ | 239/269 [01:25<00:10,  2.78it/s][A
Training:  90%|████████▉ | 242/269 [01:27<00:11,  2.42it/s][A
Training:  91%|█████████▏| 246/269 [01:28<00:08,  2.63it/s][A
Training:  92%|█████████▏| 248/269 [01:28<00:06,  3.25it/s][A
Training:  93%|█████████▎| 250/269 [01:29<00:07,  2.54it/s][A
Training:  94%|█████████▎| 252/269 [01:29<00:05,  3.24it/s][A
Training:  94%|█████████▍| 253/269 [01:30<00:04,  3.61it/s][A
Training:  94%|█████████▍| 254/269 [01:31<00:06,  2.30i

Epoch: 13/96 - Loss: 11791.8232 - Accuracy: 0.9146



  0%|          | 0/34 [00:00<?, ?it/s][A
  3%|▎         | 1/34 [00:01<01:05,  1.97s/it][A
  6%|▌         | 2/34 [00:02<00:27,  1.14it/s][A
  9%|▉         | 3/34 [00:02<00:17,  1.81it/s][A
 15%|█▍        | 5/34 [00:03<00:14,  1.98it/s][A
 18%|█▊        | 6/34 [00:03<00:11,  2.54it/s][A
 21%|██        | 7/34 [00:03<00:09,  2.99it/s][A
 26%|██▋       | 9/34 [00:04<00:09,  2.57it/s][A
 29%|██▉       | 10/34 [00:04<00:07,  3.12it/s][A
 32%|███▏      | 11/34 [00:04<00:07,  3.17it/s][A
 35%|███▌      | 12/34 [00:04<00:05,  3.88it/s][A
 38%|███▊      | 13/34 [00:05<00:08,  2.49it/s][A
 44%|████▍     | 15/34 [00:06<00:05,  3.44it/s][A
 50%|█████     | 17/34 [00:07<00:06,  2.66it/s][A
 56%|█████▌    | 19/34 [00:07<00:04,  3.74it/s][A
 62%|██████▏   | 21/34 [00:08<00:04,  2.72it/s][A
 68%|██████▊   | 23/34 [00:08<00:03,  3.66it/s][A
 74%|███████▎  | 25/34 [00:09<00:03,  2.83it/s][A
 79%|███████▉  | 27/34 [00:09<00:01,  3.84it/s][A
 85%|████████▌ | 29/34 [00:10<00:01,  2.71it/s

Val Loss: 11739.2412 - Val Accuracy: 0.9256



Training:   0%|          | 0/269 [00:00<?, ?it/s][A
Training:   0%|          | 1/269 [00:01<07:05,  1.59s/it][A
Training:   1%|          | 2/269 [00:01<03:56,  1.13it/s][A
Training:   1%|▏         | 4/269 [00:02<01:36,  2.73it/s][A
Training:   2%|▏         | 5/269 [00:03<02:33,  1.72it/s][A
Training:   2%|▏         | 6/269 [00:03<02:20,  1.87it/s][A
Training:   3%|▎         | 8/269 [00:03<01:22,  3.15it/s][A
Training:   3%|▎         | 9/269 [00:04<01:50,  2.35it/s][A
Training:   4%|▎         | 10/269 [00:04<01:48,  2.40it/s][A
Training:   4%|▍         | 12/269 [00:04<01:07,  3.79it/s][A
Training:   5%|▍         | 13/269 [00:05<01:45,  2.42it/s][A
Training:   5%|▌         | 14/269 [00:06<01:41,  2.51it/s][A
Training:   6%|▋         | 17/269 [00:07<01:37,  2.59it/s][A
Training:   7%|▋         | 18/269 [00:07<01:31,  2.74it/s][A
Training:   7%|▋         | 20/269 [00:07<01:03,  3.93it/s][A
Training:   8%|▊         | 21/269 [00:08<01:42,  2.43it/s][A
Training:   8%|▊       

Training:  72%|███████▏  | 195/269 [01:10<00:24,  2.98it/s][A
Training:  73%|███████▎  | 197/269 [01:11<00:29,  2.46it/s][A
Training:  74%|███████▎  | 198/269 [01:11<00:25,  2.80it/s][A
Training:  74%|███████▍  | 200/269 [01:11<00:17,  4.05it/s][A
Training:  75%|███████▍  | 201/269 [01:12<00:27,  2.46it/s][A
Training:  75%|███████▌  | 202/269 [01:12<00:24,  2.76it/s][A
Training:  76%|███████▌  | 205/269 [01:14<00:26,  2.39it/s][A
Training:  77%|███████▋  | 206/269 [01:14<00:22,  2.77it/s][A
Training:  77%|███████▋  | 208/269 [01:14<00:15,  3.83it/s][A
Training:  78%|███████▊  | 209/269 [01:15<00:25,  2.37it/s][A
Training:  78%|███████▊  | 211/269 [01:15<00:17,  3.40it/s][A
Training:  79%|███████▉  | 213/269 [01:16<00:21,  2.62it/s][A
Training:  81%|████████  | 217/269 [01:18<00:18,  2.83it/s][A
Training:  81%|████████  | 218/269 [01:18<00:16,  3.17it/s][A
Training:  82%|████████▏ | 220/269 [01:18<00:11,  4.19it/s][A
Training:  82%|████████▏ | 221/269 [01:19<00:20,  2.38i

Epoch: 14/96 - Loss: 13059.4219 - Accuracy: 0.9108



  0%|          | 0/34 [00:00<?, ?it/s][A
  3%|▎         | 1/34 [00:01<01:03,  1.93s/it][A
  9%|▉         | 3/34 [00:02<00:17,  1.80it/s][A
 15%|█▍        | 5/34 [00:03<00:16,  1.78it/s][A
 18%|█▊        | 6/34 [00:03<00:13,  2.11it/s][A
 26%|██▋       | 9/34 [00:04<00:10,  2.39it/s][A
 29%|██▉       | 10/34 [00:04<00:08,  2.69it/s][A
 38%|███▊      | 13/34 [00:05<00:07,  2.91it/s][A
 41%|████      | 14/34 [00:06<00:06,  2.89it/s][A
 47%|████▋     | 16/34 [00:06<00:04,  4.04it/s][A
 50%|█████     | 17/34 [00:06<00:06,  2.76it/s][A
 53%|█████▎    | 18/34 [00:07<00:05,  2.88it/s][A
 62%|██████▏   | 21/34 [00:08<00:04,  3.14it/s][A
 65%|██████▍   | 22/34 [00:08<00:03,  3.15it/s][A
 74%|███████▎  | 25/34 [00:09<00:02,  3.65it/s][A
 76%|███████▋  | 26/34 [00:09<00:02,  3.12it/s][A
 82%|████████▏ | 28/34 [00:09<00:01,  4.20it/s][A
 85%|████████▌ | 29/34 [00:10<00:01,  3.42it/s][A
 88%|████████▊ | 30/34 [00:10<00:01,  3.17it/s][A
100%|██████████| 34/34 [00:11<00:00,  2.96it

Val Loss: 13228.8516 - Val Accuracy: 0.9295



Training:   0%|          | 0/269 [00:00<?, ?it/s][A
Training:   0%|          | 1/269 [00:02<09:03,  2.03s/it][A
Training:   1%|          | 3/269 [00:02<02:32,  1.74it/s][A
Training:   2%|▏         | 5/269 [00:03<02:24,  1.82it/s][A
Training:   3%|▎         | 7/269 [00:03<01:33,  2.81it/s][A
Training:   3%|▎         | 9/269 [00:04<01:45,  2.47it/s][A
Training:   4%|▎         | 10/269 [00:04<01:32,  2.79it/s][A
Training:   5%|▍         | 13/269 [00:05<01:31,  2.80it/s][A
Training:   5%|▌         | 14/269 [00:05<01:31,  2.78it/s][A
Training:   6%|▌         | 16/269 [00:06<01:03,  3.96it/s][A
Training:   6%|▋         | 17/269 [00:06<01:35,  2.65it/s][A
Training:   7%|▋         | 18/269 [00:07<01:38,  2.54it/s][A
Training:   8%|▊         | 21/269 [00:08<01:23,  2.98it/s][A
Training:   8%|▊         | 22/269 [00:08<01:31,  2.69it/s][A
Training:   9%|▉         | 24/269 [00:08<01:05,  3.75it/s][A
Training:   9%|▉         | 25/269 [00:09<01:22,  2.96it/s][A
Training:  10%|▉     

Training:  73%|███████▎  | 197/269 [01:09<00:24,  2.91it/s][A
Training:  74%|███████▎  | 198/269 [01:10<00:29,  2.42it/s][A
Training:  74%|███████▍  | 200/269 [01:10<00:23,  2.93it/s][A
Training:  75%|███████▍  | 201/269 [01:11<00:22,  3.04it/s][A
Training:  75%|███████▌  | 202/269 [01:11<00:28,  2.37it/s][A
Training:  76%|███████▌  | 204/269 [01:12<00:24,  2.67it/s][A
Training:  77%|███████▋  | 206/269 [01:13<00:23,  2.65it/s][A
Training:  77%|███████▋  | 208/269 [01:14<00:24,  2.52it/s][A
Training:  78%|███████▊  | 210/269 [01:14<00:21,  2.77it/s][A
Training:  79%|███████▉  | 212/269 [01:15<00:23,  2.46it/s][A
Training:  80%|███████▉  | 214/269 [01:16<00:18,  2.97it/s][A
Training:  80%|████████  | 216/269 [01:17<00:19,  2.66it/s][A
Training:  81%|████████  | 218/269 [01:17<00:16,  3.06it/s][A
Training:  82%|████████▏ | 220/269 [01:18<00:18,  2.58it/s][A
Training:  83%|████████▎ | 222/269 [01:18<00:15,  2.94it/s][A
Training:  83%|████████▎ | 224/269 [01:19<00:15,  2.87i

Epoch: 15/96 - Loss: 13247.5967 - Accuracy: 0.9121



  0%|          | 0/34 [00:00<?, ?it/s][A
  3%|▎         | 1/34 [00:01<01:04,  1.96s/it][A
  6%|▌         | 2/34 [00:02<00:28,  1.13it/s][A
 12%|█▏        | 4/34 [00:02<00:11,  2.66it/s][A
 15%|█▍        | 5/34 [00:03<00:16,  1.77it/s][A
 21%|██        | 7/34 [00:03<00:08,  3.01it/s][A
 26%|██▋       | 9/34 [00:04<00:10,  2.45it/s][A
 29%|██▉       | 10/34 [00:04<00:08,  2.85it/s][A
 32%|███▏      | 11/34 [00:04<00:06,  3.43it/s][A
 38%|███▊      | 13/34 [00:05<00:08,  2.59it/s][A
 41%|████      | 14/34 [00:05<00:07,  2.85it/s][A
 47%|████▋     | 16/34 [00:06<00:04,  4.16it/s][A
 50%|█████     | 17/34 [00:06<00:06,  2.73it/s][A
 53%|█████▎    | 18/34 [00:07<00:05,  3.02it/s][A
 59%|█████▉    | 20/34 [00:07<00:03,  4.16it/s][A
 62%|██████▏   | 21/34 [00:08<00:04,  2.63it/s][A
 71%|███████   | 24/34 [00:08<00:02,  4.75it/s][A
 76%|███████▋  | 26/34 [00:09<00:02,  2.93it/s][A
 82%|████████▏ | 28/34 [00:09<00:01,  3.99it/s][A
 88%|████████▊ | 30/34 [00:10<00:01,  2.94it/

Val Loss: 13262.6885 - Val Accuracy: 0.8992



Training:   0%|          | 0/269 [00:00<?, ?it/s][A
Training:   0%|          | 1/269 [00:02<09:15,  2.07s/it][A
Training:   2%|▏         | 5/269 [00:03<02:40,  1.65it/s][A
Training:   3%|▎         | 7/269 [00:03<01:48,  2.42it/s][A
Training:   3%|▎         | 9/269 [00:04<02:05,  2.08it/s][A
Training:   4%|▍         | 12/269 [00:05<01:16,  3.37it/s][A
Training:   5%|▍         | 13/269 [00:06<01:55,  2.22it/s][A
Training:   6%|▌         | 16/269 [00:06<01:09,  3.63it/s][A
Training:   7%|▋         | 18/269 [00:07<01:33,  2.67it/s][A
Training:   7%|▋         | 19/269 [00:07<01:23,  3.00it/s][A
Training:   8%|▊         | 21/269 [00:08<01:43,  2.40it/s][A
Training:   9%|▊         | 23/269 [00:09<01:17,  3.16it/s][A
Training:   9%|▉         | 25/269 [00:10<01:38,  2.49it/s][A
Training:  10%|▉         | 26/269 [00:10<01:25,  2.84it/s][A
Training:  10%|█         | 28/269 [00:10<01:02,  3.84it/s][A
Training:  11%|█         | 29/269 [00:11<01:37,  2.46it/s][A
Training:  11%|█    

Training:  83%|████████▎ | 222/269 [01:20<00:17,  2.71it/s][A
Training:  83%|████████▎ | 224/269 [01:21<00:13,  3.42it/s][A
Training:  84%|████████▍ | 226/269 [01:22<00:17,  2.48it/s][A
Training:  86%|████████▌ | 230/269 [01:23<00:13,  2.80it/s][A
Training:  86%|████████▌ | 232/269 [01:23<00:10,  3.45it/s][A
Training:  87%|████████▋ | 234/269 [01:25<00:12,  2.73it/s][A
Training:  88%|████████▊ | 236/269 [01:25<00:09,  3.53it/s][A
Training:  88%|████████▊ | 238/269 [01:26<00:11,  2.60it/s][A
Training:  90%|████████▉ | 242/269 [01:27<00:09,  2.79it/s][A
Training:  90%|█████████ | 243/269 [01:28<00:08,  2.90it/s][A
Training:  91%|█████████ | 245/269 [01:28<00:06,  3.71it/s][A
Training:  91%|█████████▏| 246/269 [01:29<00:09,  2.53it/s][A
Training:  92%|█████████▏| 247/269 [01:29<00:08,  2.62it/s][A
Training:  93%|█████████▎| 249/269 [01:29<00:05,  3.64it/s][A
Training:  93%|█████████▎| 250/269 [01:30<00:08,  2.34it/s][A
Training:  93%|█████████▎| 251/269 [01:31<00:07,  2.28i

Epoch: 16/96 - Loss: 12344.8701 - Accuracy: 0.9099



  0%|          | 0/34 [00:00<?, ?it/s][A
  3%|▎         | 1/34 [00:02<01:07,  2.06s/it][A
 12%|█▏        | 4/34 [00:02<00:12,  2.37it/s][A
 18%|█▊        | 6/34 [00:03<00:12,  2.16it/s][A
 24%|██▎       | 8/34 [00:03<00:08,  3.19it/s][A
 29%|██▉       | 10/34 [00:04<00:09,  2.41it/s][A
 35%|███▌      | 12/34 [00:04<00:06,  3.33it/s][A
 38%|███▊      | 13/34 [00:05<00:09,  2.17it/s][A
 50%|█████     | 17/34 [00:06<00:06,  2.78it/s][A
 56%|█████▌    | 19/34 [00:07<00:04,  3.60it/s][A
 62%|██████▏   | 21/34 [00:08<00:04,  2.78it/s][A
 68%|██████▊   | 23/34 [00:08<00:03,  3.60it/s][A
 74%|███████▎  | 25/34 [00:09<00:03,  2.83it/s][A
 82%|████████▏ | 28/34 [00:09<00:01,  4.21it/s][A
 88%|████████▊ | 30/34 [00:10<00:01,  3.24it/s][A
100%|██████████| 34/34 [00:11<00:00,  2.89it/s][A
Epochs:  17%|█▋        | 16/96 [28:30<2:23:20, 107.51s/it]

Val Loss: 11270.3838 - Val Accuracy: 0.9246



Training:   0%|          | 0/269 [00:00<?, ?it/s][A
Training:   0%|          | 1/269 [00:02<10:27,  2.34s/it][A
Training:   1%|          | 3/269 [00:02<02:52,  1.54it/s][A
Training:   2%|▏         | 5/269 [00:03<02:46,  1.59it/s][A
Training:   3%|▎         | 7/269 [00:03<01:41,  2.57it/s][A
Training:   3%|▎         | 9/269 [00:05<02:13,  1.95it/s][A
Training:   4%|▍         | 11/269 [00:05<01:30,  2.84it/s][A
Training:   5%|▍         | 13/269 [00:06<01:58,  2.16it/s][A
Training:   6%|▌         | 15/269 [00:06<01:26,  2.93it/s][A
Training:   6%|▋         | 17/269 [00:08<01:49,  2.30it/s][A
Training:   7%|▋         | 19/269 [00:08<01:19,  3.15it/s][A
Training:   8%|▊         | 21/269 [00:09<01:41,  2.43it/s][A
Training:   9%|▊         | 23/269 [00:09<01:14,  3.30it/s][A
Training:   9%|▉         | 25/269 [00:10<01:34,  2.57it/s][A
Training:  10%|█         | 27/269 [00:10<01:10,  3.45it/s][A
Training:  11%|█         | 29/269 [00:12<01:34,  2.54it/s][A
Training:  12%|█▏    

Training:  86%|████████▌ | 231/269 [01:24<00:11,  3.32it/s][A
Training:  87%|████████▋ | 233/269 [01:26<00:15,  2.32it/s][A
Training:  88%|████████▊ | 236/269 [01:26<00:09,  3.53it/s][A
Training:  88%|████████▊ | 237/269 [01:27<00:13,  2.32it/s][A
Training:  89%|████████▉ | 239/269 [01:27<00:09,  3.10it/s][A
Training:  90%|████████▉ | 241/269 [01:29<00:12,  2.31it/s][A
Training:  90%|█████████ | 243/269 [01:29<00:08,  3.13it/s][A
Training:  91%|█████████ | 245/269 [01:30<00:10,  2.36it/s][A
Training:  92%|█████████▏| 248/269 [01:30<00:05,  3.66it/s][A
Training:  93%|█████████▎| 250/269 [01:32<00:06,  2.82it/s][A
Training:  94%|█████████▍| 253/269 [01:33<00:06,  2.45it/s][A
Training:  95%|█████████▍| 255/269 [01:33<00:04,  3.15it/s][A
Training:  96%|█████████▌| 257/269 [01:34<00:04,  2.53it/s][A
Training:  97%|█████████▋| 260/269 [01:34<00:02,  3.75it/s][A
Training:  97%|█████████▋| 262/269 [01:36<00:02,  2.76it/s][A
Training:  98%|█████████▊| 263/269 [01:36<00:01,  3.10i

Epoch: 17/96 - Loss: 12318.2041 - Accuracy: 0.9142



  0%|          | 0/34 [00:00<?, ?it/s][A
  3%|▎         | 1/34 [00:01<00:59,  1.80s/it][A
  6%|▌         | 2/34 [00:02<00:29,  1.09it/s][A
 15%|█▍        | 5/34 [00:03<00:15,  1.92it/s][A
 18%|█▊        | 6/34 [00:03<00:12,  2.25it/s][A
 26%|██▋       | 9/34 [00:04<00:09,  2.53it/s][A
 35%|███▌      | 12/34 [00:04<00:05,  4.10it/s][A
 41%|████      | 14/34 [00:05<00:06,  2.97it/s][A
 44%|████▍     | 15/34 [00:05<00:05,  3.30it/s][A
 50%|█████     | 17/34 [00:06<00:06,  2.78it/s][A
 53%|█████▎    | 18/34 [00:07<00:05,  2.96it/s][A
 59%|█████▉    | 20/34 [00:07<00:03,  4.03it/s][A
 62%|██████▏   | 21/34 [00:08<00:04,  2.70it/s][A
 65%|██████▍   | 22/34 [00:08<00:03,  3.10it/s][A
 71%|███████   | 24/34 [00:08<00:02,  4.26it/s][A
 74%|███████▎  | 25/34 [00:09<00:03,  2.76it/s][A
 79%|███████▉  | 27/34 [00:09<00:01,  3.51it/s][A
 85%|████████▌ | 29/34 [00:10<00:01,  2.80it/s][A
 91%|█████████ | 31/34 [00:10<00:00,  3.62it/s][A
100%|██████████| 34/34 [00:11<00:00,  2.88it

Val Loss: 13321.4912 - Val Accuracy: 0.9233



Training:   0%|          | 0/269 [00:00<?, ?it/s][A
Training:   0%|          | 1/269 [00:01<08:50,  1.98s/it][A
Training:   1%|          | 3/269 [00:02<02:29,  1.78it/s][A
Training:   2%|▏         | 5/269 [00:03<02:34,  1.71it/s][A
Training:   3%|▎         | 7/269 [00:03<01:42,  2.54it/s][A
Training:   3%|▎         | 9/269 [00:04<01:55,  2.24it/s][A
Training:   4%|▎         | 10/269 [00:04<01:43,  2.50it/s][A
Training:   4%|▍         | 12/269 [00:05<01:11,  3.60it/s][A
Training:   5%|▍         | 13/269 [00:06<01:52,  2.28it/s][A
Training:   5%|▌         | 14/269 [00:06<01:53,  2.25it/s][A
Training:   6%|▌         | 15/269 [00:06<01:31,  2.78it/s][A
Training:   6%|▋         | 17/269 [00:07<01:41,  2.48it/s][A
Training:   7%|▋         | 18/269 [00:08<01:43,  2.43it/s][A
Training:   8%|▊         | 21/269 [00:09<01:35,  2.60it/s][A
Training:   8%|▊         | 22/269 [00:09<01:44,  2.36it/s][A
Training:   9%|▉         | 24/269 [00:09<01:13,  3.34it/s][A
Training:   9%|▉     

Training:  70%|██████▉   | 188/269 [01:09<00:31,  2.59it/s][A
Training:  71%|███████   | 190/269 [01:10<00:29,  2.69it/s][A
Training:  71%|███████▏  | 192/269 [01:11<00:28,  2.70it/s][A
Training:  72%|███████▏  | 194/269 [01:11<00:26,  2.83it/s][A
Training:  73%|███████▎  | 196/269 [01:12<00:25,  2.88it/s][A
Training:  74%|███████▎  | 198/269 [01:13<00:25,  2.82it/s][A
Training:  74%|███████▍  | 200/269 [01:13<00:24,  2.79it/s][A
Training:  75%|███████▌  | 202/269 [01:14<00:22,  2.95it/s][A
Training:  76%|███████▌  | 204/269 [01:15<00:21,  2.97it/s][A
Training:  77%|███████▋  | 206/269 [01:15<00:20,  3.01it/s][A
Training:  77%|███████▋  | 208/269 [01:16<00:22,  2.70it/s][A
Training:  78%|███████▊  | 210/269 [01:17<00:21,  2.80it/s][A
Training:  79%|███████▉  | 212/269 [01:18<00:21,  2.66it/s][A
Training:  80%|███████▉  | 214/269 [01:18<00:19,  2.83it/s][A
Training:  80%|████████  | 216/269 [01:19<00:18,  2.83it/s][A
Training:  81%|████████  | 218/269 [01:20<00:18,  2.80i

Epoch: 18/96 - Loss: 13243.5908 - Accuracy: 0.9117



  0%|          | 0/34 [00:00<?, ?it/s][A
  3%|▎         | 1/34 [00:01<00:57,  1.76s/it][A
 15%|█▍        | 5/34 [00:02<00:14,  1.95it/s][A
 21%|██        | 7/34 [00:03<00:09,  2.89it/s][A
 26%|██▋       | 9/34 [00:04<00:10,  2.39it/s][A
 35%|███▌      | 12/34 [00:04<00:05,  3.89it/s][A
 41%|████      | 14/34 [00:05<00:07,  2.70it/s][A
 50%|█████     | 17/34 [00:06<00:06,  2.73it/s][A
 62%|██████▏   | 21/34 [00:07<00:04,  3.16it/s][A
 68%|██████▊   | 23/34 [00:07<00:02,  3.79it/s][A
 71%|███████   | 24/34 [00:07<00:02,  4.14it/s][A
 74%|███████▎  | 25/34 [00:09<00:03,  2.62it/s][A
 79%|███████▉  | 27/34 [00:09<00:01,  3.54it/s][A
 85%|████████▌ | 29/34 [00:10<00:01,  2.68it/s][A
 91%|█████████ | 31/34 [00:10<00:00,  3.64it/s][A
100%|██████████| 34/34 [00:11<00:00,  2.97it/s][A
Epochs:  19%|█▉        | 18/96 [32:10<2:21:23, 108.77s/it]

Val Loss: 13641.0391 - Val Accuracy: 0.9290



Training:   0%|          | 0/269 [00:00<?, ?it/s][A
Training:   0%|          | 1/269 [00:02<10:32,  2.36s/it][A
Training:   1%|          | 3/269 [00:02<02:54,  1.52it/s][A
Training:   2%|▏         | 5/269 [00:03<02:47,  1.57it/s][A
Training:   3%|▎         | 7/269 [00:03<01:43,  2.53it/s][A
Training:   3%|▎         | 9/269 [00:05<02:10,  1.99it/s][A
Training:   4%|▍         | 11/269 [00:05<01:32,  2.79it/s][A
Training:   5%|▍         | 13/269 [00:06<02:02,  2.08it/s][A
Training:   6%|▌         | 15/269 [00:06<01:27,  2.90it/s][A
Training:   6%|▋         | 17/269 [00:08<01:57,  2.15it/s][A
Training:   7%|▋         | 19/269 [00:08<01:26,  2.89it/s][A
Training:   8%|▊         | 21/269 [00:10<01:59,  2.08it/s][A
Training:   9%|▊         | 23/269 [00:10<01:27,  2.82it/s][A
Training:   9%|▉         | 24/269 [00:10<01:16,  3.20it/s][A
Training:   9%|▉         | 25/269 [00:11<01:49,  2.22it/s][A
Training:  10%|█         | 27/269 [00:11<01:16,  3.15it/s][A
Training:  11%|█     

Epoch: 19/96 - Loss: 13041.1572 - Accuracy: 0.9159



  0%|          | 0/34 [00:00<?, ?it/s][A
  3%|▎         | 1/34 [00:01<00:46,  1.40s/it][A
  6%|▌         | 2/34 [00:01<00:22,  1.41it/s][A
 12%|█▏        | 4/34 [00:01<00:09,  3.28it/s][A
 15%|█▍        | 5/34 [00:02<00:13,  2.12it/s][A
 18%|█▊        | 6/34 [00:02<00:11,  2.36it/s][A
 24%|██▎       | 8/34 [00:03<00:06,  3.83it/s][A
 26%|██▋       | 9/34 [00:03<00:10,  2.41it/s][A
 29%|██▉       | 10/34 [00:04<00:09,  2.40it/s][A
 38%|███▊      | 13/34 [00:05<00:06,  3.06it/s][A
 41%|████      | 14/34 [00:05<00:06,  3.07it/s][A
 50%|█████     | 17/34 [00:06<00:05,  3.30it/s][A
 53%|█████▎    | 18/34 [00:06<00:05,  2.83it/s][A
 62%|██████▏   | 21/34 [00:07<00:03,  3.40it/s][A
 65%|██████▍   | 22/34 [00:08<00:04,  2.67it/s][A
 71%|███████   | 24/34 [00:08<00:02,  3.66it/s][A
 74%|███████▎  | 25/34 [00:08<00:02,  3.21it/s][A
 76%|███████▋  | 26/34 [00:09<00:02,  2.81it/s][A
 82%|████████▏ | 28/34 [00:09<00:01,  4.13it/s][A
 85%|████████▌ | 29/34 [00:10<00:01,  3.21it/s

Val Loss: 12837.3350 - Val Accuracy: 0.9341



Training:   0%|          | 0/269 [00:00<?, ?it/s][A
Training:   0%|          | 1/269 [00:01<08:50,  1.98s/it][A
Training:   1%|▏         | 4/269 [00:02<01:53,  2.34it/s][A
Training:   2%|▏         | 5/269 [00:03<03:07,  1.41it/s][A
Training:   3%|▎         | 7/269 [00:03<01:51,  2.35it/s][A
Training:   3%|▎         | 9/269 [00:05<02:19,  1.86it/s][A
Training:   4%|▍         | 12/269 [00:05<01:20,  3.18it/s][A
Training:   5%|▌         | 14/269 [00:06<01:48,  2.36it/s][A
Training:   6%|▌         | 16/269 [00:06<01:19,  3.20it/s][A
Training:   7%|▋         | 18/269 [00:08<01:53,  2.21it/s][A
Training:   7%|▋         | 20/269 [00:08<01:23,  2.99it/s][A
Training:   8%|▊         | 22/269 [00:09<01:43,  2.38it/s][A
Training:   9%|▉         | 24/269 [00:09<01:17,  3.17it/s][A
Training:   9%|▉         | 25/269 [00:11<02:02,  1.99it/s][A
Training:  10%|█         | 27/269 [00:11<01:26,  2.79it/s][A
Training:  11%|█         | 29/269 [00:12<01:50,  2.17it/s][A
Training:  11%|█     

Training:  83%|████████▎ | 222/269 [01:22<00:19,  2.43it/s][A
Training:  84%|████████▍ | 226/269 [01:24<00:17,  2.45it/s][A
Training:  85%|████████▍ | 228/269 [01:24<00:13,  3.03it/s][A
Training:  86%|████████▌ | 230/269 [01:26<00:16,  2.37it/s][A
Training:  86%|████████▌ | 231/269 [01:26<00:14,  2.67it/s][A
Training:  86%|████████▌ | 232/269 [01:26<00:12,  3.07it/s][A
Training:  87%|████████▋ | 234/269 [01:27<00:15,  2.25it/s][A
Training:  88%|████████▊ | 236/269 [01:27<00:10,  3.13it/s][A
Training:  88%|████████▊ | 238/269 [01:29<00:13,  2.27it/s][A
Training:  89%|████████▉ | 240/269 [01:29<00:09,  3.06it/s][A
Training:  90%|████████▉ | 242/269 [01:30<00:12,  2.25it/s][A
Training:  91%|█████████ | 244/269 [01:30<00:08,  3.07it/s][A
Training:  91%|█████████▏| 246/269 [01:32<00:10,  2.25it/s][A
Training:  92%|█████████▏| 248/269 [01:32<00:06,  3.03it/s][A
Training:  93%|█████████▎| 250/269 [01:33<00:08,  2.29it/s][A
Training:  94%|█████████▎| 252/269 [01:33<00:05,  3.08i

Epoch: 20/96 - Loss: 13223.6650 - Accuracy: 0.9144



  0%|          | 0/34 [00:00<?, ?it/s][A
  3%|▎         | 1/34 [00:01<01:01,  1.86s/it][A
 12%|█▏        | 4/34 [00:02<00:11,  2.53it/s][A
 18%|█▊        | 6/34 [00:03<00:13,  2.11it/s][A
 24%|██▎       | 8/34 [00:03<00:08,  3.15it/s][A
 26%|██▋       | 9/34 [00:04<00:12,  1.98it/s][A
 35%|███▌      | 12/34 [00:04<00:06,  3.49it/s][A
 41%|████      | 14/34 [00:05<00:07,  2.67it/s][A
 50%|█████     | 17/34 [00:06<00:06,  2.79it/s][A
 56%|█████▌    | 19/34 [00:06<00:04,  3.46it/s][A
 62%|██████▏   | 21/34 [00:07<00:04,  2.89it/s][A
 68%|██████▊   | 23/34 [00:08<00:03,  3.23it/s][A
 71%|███████   | 24/34 [00:08<00:02,  3.62it/s][A
 74%|███████▎  | 25/34 [00:09<00:03,  2.98it/s][A
 76%|███████▋  | 26/34 [00:09<00:02,  3.09it/s][A
 79%|███████▉  | 27/34 [00:09<00:02,  2.93it/s][A
 85%|████████▌ | 29/34 [00:10<00:01,  2.96it/s][A
 91%|█████████ | 31/34 [00:10<00:00,  3.42it/s][A
100%|██████████| 34/34 [00:11<00:00,  2.92it/s][A
Epochs:  21%|██        | 20/96 [35:52<2:19:0

Val Loss: 13352.7705 - Val Accuracy: 0.9235



Training:   0%|          | 0/269 [00:00<?, ?it/s][A
Training:   0%|          | 1/269 [00:02<10:42,  2.40s/it][A
Training:   1%|          | 3/269 [00:02<02:58,  1.49it/s][A
Training:   2%|▏         | 5/269 [00:03<02:52,  1.53it/s][A
Training:   3%|▎         | 7/269 [00:03<01:44,  2.51it/s][A
Training:   3%|▎         | 9/269 [00:05<02:12,  1.96it/s][A
Training:   5%|▍         | 13/269 [00:06<01:52,  2.28it/s][A
Training:   6%|▌         | 15/269 [00:06<01:25,  2.96it/s][A
Training:   6%|▋         | 17/269 [00:08<01:51,  2.27it/s][A
Training:   7%|▋         | 19/269 [00:08<01:23,  2.99it/s][A
Training:   8%|▊         | 21/269 [00:09<01:41,  2.44it/s][A
Training:   9%|▉         | 24/269 [00:09<01:06,  3.69it/s][A
Training:  10%|▉         | 26/269 [00:11<01:27,  2.78it/s][A
Training:  11%|█         | 29/269 [00:12<01:40,  2.40it/s][A
Training:  12%|█▏        | 31/269 [00:12<01:18,  3.03it/s][A
Training:  12%|█▏        | 33/269 [00:13<01:35,  2.46it/s][A
Training:  13%|█▎    

Training:  91%|█████████▏| 246/269 [01:31<00:09,  2.54it/s][A
Training:  92%|█████████▏| 248/269 [01:31<00:06,  3.26it/s][A
Training:  93%|█████████▎| 249/269 [01:32<00:08,  2.27it/s][A
Training:  93%|█████████▎| 251/269 [01:32<00:05,  3.16it/s][A
Training:  94%|█████████▎| 252/269 [01:32<00:04,  3.46it/s][A
Training:  94%|█████████▍| 253/269 [01:34<00:07,  2.03it/s][A
Training:  95%|█████████▍| 255/269 [01:34<00:04,  3.06it/s][A
Training:  96%|█████████▌| 257/269 [01:35<00:05,  2.29it/s][A
Training:  97%|█████████▋| 260/269 [01:35<00:02,  3.33it/s][A
Training:  97%|█████████▋| 261/269 [01:36<00:03,  2.44it/s][A
Training:  98%|█████████▊| 264/269 [01:37<00:01,  3.35it/s][A
Training:  99%|█████████▊| 265/269 [01:38<00:01,  2.50it/s][A
Training:  99%|█████████▉| 267/269 [01:38<00:00,  3.41it/s][A
Training: 100%|█████████▉| 268/269 [01:38<00:00,  3.37it/s][A
Training: 100%|██████████| 269/269 [01:38<00:00,  3.24it/s][A
                                                       

Epoch: 21/96 - Loss: 13335.5107 - Accuracy: 0.9137



  0%|          | 0/34 [00:00<?, ?it/s][A
  3%|▎         | 1/34 [00:01<00:56,  1.70s/it][A
 12%|█▏        | 4/34 [00:01<00:10,  2.82it/s][A
 18%|█▊        | 6/34 [00:03<00:13,  2.15it/s][A
 26%|██▋       | 9/34 [00:04<00:10,  2.37it/s][A
 35%|███▌      | 12/34 [00:04<00:05,  3.78it/s][A
 41%|████      | 14/34 [00:05<00:07,  2.82it/s][A
 50%|█████     | 17/34 [00:06<00:06,  2.79it/s][A
 59%|█████▉    | 20/34 [00:06<00:03,  4.04it/s][A
 65%|██████▍   | 22/34 [00:07<00:03,  3.01it/s][A
 74%|███████▎  | 25/34 [00:09<00:03,  2.80it/s][A
 79%|███████▉  | 27/34 [00:09<00:01,  3.53it/s][A
 85%|████████▌ | 29/34 [00:10<00:01,  2.66it/s][A
 94%|█████████▍| 32/34 [00:10<00:00,  3.90it/s][A
100%|██████████| 34/34 [00:11<00:00,  2.90it/s][A
Epochs:  22%|██▏       | 21/96 [37:43<2:17:42, 110.17s/it]

Val Loss: 14227.9287 - Val Accuracy: 0.9194



Training:   0%|          | 0/269 [00:00<?, ?it/s][A
Training:   0%|          | 1/269 [00:02<10:36,  2.37s/it][A
Training:   1%|          | 3/269 [00:02<02:56,  1.51it/s][A
Training:   2%|▏         | 5/269 [00:03<02:51,  1.54it/s][A
Training:   3%|▎         | 7/269 [00:03<01:43,  2.52it/s][A
Training:   3%|▎         | 9/269 [00:05<02:12,  1.96it/s][A
Training:   4%|▍         | 12/269 [00:05<01:17,  3.34it/s][A
Training:   5%|▌         | 14/269 [00:06<01:52,  2.26it/s][A
Training:   6%|▋         | 17/269 [00:08<01:47,  2.35it/s][A
Training:   7%|▋         | 20/269 [00:08<01:13,  3.40it/s][A
Training:   8%|▊         | 22/269 [00:09<01:36,  2.57it/s][A
Training:   9%|▉         | 24/269 [00:09<01:13,  3.31it/s][A
Training:  10%|▉         | 26/269 [00:11<01:36,  2.53it/s][A
Training:  11%|█         | 29/269 [00:12<01:36,  2.48it/s][A
Training:  12%|█▏        | 32/269 [00:12<01:05,  3.60it/s][A
Training:  13%|█▎        | 34/269 [00:13<01:21,  2.87it/s][A
Training:  13%|█▎    

Training:  83%|████████▎ | 223/269 [01:20<00:17,  2.59it/s][A
Training:  84%|████████▎ | 225/269 [01:21<00:14,  3.13it/s][A
Training:  84%|████████▍ | 226/269 [01:21<00:12,  3.39it/s][A
Training:  84%|████████▍ | 227/269 [01:22<00:18,  2.29it/s][A
Training:  85%|████████▌ | 229/269 [01:22<00:12,  3.27it/s][A
Training:  86%|████████▌ | 230/269 [01:22<00:11,  3.29it/s][A
Training:  86%|████████▌ | 231/269 [01:23<00:18,  2.06it/s][A
Training:  87%|████████▋ | 233/269 [01:24<00:11,  3.17it/s][A
Training:  87%|████████▋ | 234/269 [01:24<00:10,  3.23it/s][A
Training:  87%|████████▋ | 235/269 [01:25<00:16,  2.00it/s][A
Training:  88%|████████▊ | 237/269 [01:25<00:10,  3.05it/s][A
Training:  88%|████████▊ | 238/269 [01:26<00:10,  2.95it/s][A
Training:  89%|████████▉ | 239/269 [01:27<00:15,  1.96it/s][A
Training:  90%|████████▉ | 241/269 [01:27<00:09,  2.99it/s][A
Training:  90%|████████▉ | 242/269 [01:27<00:09,  2.80it/s][A
Training:  90%|█████████ | 243/269 [01:28<00:12,  2.10i

Epoch: 22/96 - Loss: 13130.0967 - Accuracy: 0.9180



  0%|          | 0/34 [00:00<?, ?it/s][A
  3%|▎         | 1/34 [00:01<01:02,  1.88s/it][A
  6%|▌         | 2/34 [00:01<00:26,  1.19it/s][A
 12%|█▏        | 4/34 [00:02<00:10,  2.83it/s][A
 18%|█▊        | 6/34 [00:03<00:12,  2.26it/s][A
 24%|██▎       | 8/34 [00:03<00:07,  3.43it/s][A
 26%|██▋       | 9/34 [00:04<00:11,  2.21it/s][A
 29%|██▉       | 10/34 [00:04<00:10,  2.30it/s][A
 38%|███▊      | 13/34 [00:05<00:07,  2.63it/s][A
 41%|████      | 14/34 [00:06<00:07,  2.71it/s][A
 47%|████▋     | 16/34 [00:06<00:04,  3.93it/s][A
 50%|█████     | 17/34 [00:06<00:06,  2.76it/s][A
 53%|█████▎    | 18/34 [00:07<00:05,  2.97it/s][A
 59%|█████▉    | 20/34 [00:07<00:03,  4.43it/s][A
 62%|██████▏   | 21/34 [00:08<00:05,  2.42it/s][A
 65%|██████▍   | 22/34 [00:08<00:04,  2.86it/s][A
 71%|███████   | 24/34 [00:08<00:02,  4.22it/s][A
 74%|███████▎  | 25/34 [00:09<00:03,  2.54it/s][A
 76%|███████▋  | 26/34 [00:09<00:02,  2.72it/s][A
 85%|████████▌ | 29/34 [00:10<00:01,  3.08it/

Val Loss: 11896.6680 - Val Accuracy: 0.9154



Training:   0%|          | 0/269 [00:00<?, ?it/s][A
Training:   0%|          | 1/269 [00:02<10:25,  2.33s/it][A
Training:   1%|          | 3/269 [00:02<02:53,  1.53it/s][A
Training:   2%|▏         | 5/269 [00:03<02:54,  1.52it/s][A
Training:   3%|▎         | 7/269 [00:03<01:45,  2.47it/s][A
Training:   3%|▎         | 9/269 [00:05<02:17,  1.90it/s][A
Training:   4%|▍         | 11/269 [00:05<01:34,  2.72it/s][A
Training:   5%|▍         | 13/269 [00:06<02:04,  2.05it/s][A
Training:   6%|▌         | 15/269 [00:07<01:29,  2.84it/s][A
Training:   6%|▋         | 17/269 [00:08<01:56,  2.17it/s][A
Training:   7%|▋         | 19/269 [00:08<01:24,  2.95it/s][A
Training:   8%|▊         | 21/269 [00:09<01:43,  2.40it/s][A
Training:   8%|▊         | 22/269 [00:09<01:30,  2.73it/s][A
Training:   9%|▉         | 24/269 [00:10<01:05,  3.73it/s][A
Training:   9%|▉         | 25/269 [00:11<01:54,  2.14it/s][A
Training:  10%|▉         | 26/269 [00:11<01:34,  2.58it/s][A
Training:  10%|█     

                                                           [A

Epoch: 23/96 - Loss: 12609.9219 - Accuracy: 0.9113



  0%|          | 0/34 [00:00<?, ?it/s][A
  3%|▎         | 1/34 [00:01<00:56,  1.71s/it][A
  6%|▌         | 2/34 [00:01<00:24,  1.28it/s][A
 15%|█▍        | 5/34 [00:02<00:14,  2.02it/s][A
 21%|██        | 7/34 [00:03<00:09,  2.76it/s][A
 26%|██▋       | 9/34 [00:04<00:09,  2.55it/s][A
 32%|███▏      | 11/34 [00:04<00:06,  3.39it/s][A
 38%|███▊      | 13/34 [00:05<00:07,  2.90it/s][A
 44%|████▍     | 15/34 [00:05<00:05,  3.45it/s][A
 47%|████▋     | 16/34 [00:05<00:04,  3.85it/s][A
 50%|█████     | 17/34 [00:06<00:06,  2.81it/s][A
 53%|█████▎    | 18/34 [00:06<00:05,  3.09it/s][A
 56%|█████▌    | 19/34 [00:07<00:04,  3.12it/s][A
 62%|██████▏   | 21/34 [00:07<00:04,  3.10it/s][A
 65%|██████▍   | 22/34 [00:07<00:03,  3.14it/s][A
 68%|██████▊   | 23/34 [00:08<00:03,  3.15it/s][A
 74%|███████▎  | 25/34 [00:08<00:02,  3.13it/s][A
 76%|███████▋  | 26/34 [00:09<00:02,  3.36it/s][A
 79%|███████▉  | 27/34 [00:09<00:02,  3.48it/s][A
 85%|████████▌ | 29/34 [00:10<00:01,  3.20it

Val Loss: 12512.2422 - Val Accuracy: 0.9419



Training:   0%|          | 0/269 [00:00<?, ?it/s][A
Training:   0%|          | 1/269 [00:02<09:50,  2.20s/it][A
Training:   1%|▏         | 4/269 [00:02<02:00,  2.19it/s][A
Training:   2%|▏         | 6/269 [00:03<02:36,  1.68it/s][A
Training:   3%|▎         | 8/269 [00:04<01:41,  2.58it/s][A
Training:   4%|▎         | 10/269 [00:05<02:01,  2.13it/s][A
Training:   4%|▍         | 12/269 [00:05<01:24,  3.04it/s][A
Training:   5%|▌         | 14/269 [00:06<01:49,  2.33it/s][A
Training:   6%|▋         | 17/269 [00:07<01:46,  2.36it/s][A
Training:   7%|▋         | 19/269 [00:07<01:19,  3.13it/s][A
Training:   8%|▊         | 21/269 [00:09<01:45,  2.34it/s][A
Training:   9%|▊         | 23/269 [00:09<01:18,  3.13it/s][A
Training:   9%|▉         | 25/269 [00:10<01:48,  2.25it/s][A
Training:  10%|█         | 27/269 [00:11<01:19,  3.04it/s][A
Training:  11%|█         | 29/269 [00:12<01:47,  2.24it/s][A
Training:  12%|█▏        | 31/269 [00:12<01:19,  2.99it/s][A
Training:  12%|█▏   

Epoch: 24/96 - Loss: 13158.0928 - Accuracy: 0.9181



  0%|          | 0/34 [00:00<?, ?it/s][A
  3%|▎         | 1/34 [00:01<01:02,  1.90s/it][A
 12%|█▏        | 4/34 [00:02<00:12,  2.47it/s][A
 18%|█▊        | 6/34 [00:03<00:12,  2.22it/s][A
 26%|██▋       | 9/34 [00:04<00:10,  2.39it/s][A
 32%|███▏      | 11/34 [00:04<00:07,  3.23it/s][A
 38%|███▊      | 13/34 [00:05<00:08,  2.59it/s][A
 44%|████▍     | 15/34 [00:05<00:05,  3.40it/s][A
 50%|█████     | 17/34 [00:06<00:06,  2.77it/s][A
 62%|██████▏   | 21/34 [00:07<00:04,  2.91it/s][A
 74%|███████▎  | 25/34 [00:09<00:02,  3.04it/s][A
 79%|███████▉  | 27/34 [00:09<00:01,  3.68it/s][A
 85%|████████▌ | 29/34 [00:10<00:01,  2.95it/s][A
 91%|█████████ | 31/34 [00:10<00:00,  3.74it/s][A
100%|██████████| 34/34 [00:11<00:00,  2.87it/s][A
Epochs:  25%|██▌       | 24/96 [43:12<2:12:01, 110.02s/it]

Val Loss: 14887.6250 - Val Accuracy: 0.8818



Training:   0%|          | 0/269 [00:00<?, ?it/s][A
Training:   0%|          | 1/269 [00:02<09:30,  2.13s/it][A
Training:   1%|          | 3/269 [00:02<02:38,  1.68it/s][A
Training:   2%|▏         | 5/269 [00:03<02:43,  1.61it/s][A
Training:   2%|▏         | 6/269 [00:03<02:09,  2.04it/s][A
Training:   3%|▎         | 7/269 [00:03<01:40,  2.60it/s][A
Training:   3%|▎         | 9/269 [00:04<02:00,  2.16it/s][A
Training:   4%|▎         | 10/269 [00:05<01:56,  2.22it/s][A
Training:   4%|▍         | 12/269 [00:05<01:14,  3.47it/s][A
Training:   5%|▍         | 13/269 [00:06<01:50,  2.32it/s][A
Training:   5%|▌         | 14/269 [00:06<01:58,  2.15it/s][A
Training:   6%|▋         | 17/269 [00:07<01:40,  2.52it/s][A
Training:   7%|▋         | 18/269 [00:08<01:47,  2.33it/s][A
Training:   7%|▋         | 20/269 [00:08<01:15,  3.30it/s][A
Training:   8%|▊         | 21/269 [00:09<01:37,  2.53it/s][A
Training:   8%|▊         | 22/269 [00:09<01:33,  2.63it/s][A
Training:   9%|▉      

Training:  93%|█████████▎| 249/269 [01:30<00:07,  2.60it/s][A
Training:  93%|█████████▎| 251/269 [01:30<00:06,  2.70it/s][A
Training:  94%|█████████▍| 253/269 [01:31<00:05,  2.75it/s][A
Training:  95%|█████████▍| 255/269 [01:32<00:04,  2.95it/s][A
Training:  96%|█████████▌| 257/269 [01:33<00:04,  2.79it/s][A
Training:  96%|█████████▋| 259/269 [01:33<00:03,  3.08it/s][A
Training:  97%|█████████▋| 261/269 [01:34<00:02,  2.88it/s][A
Training:  98%|█████████▊| 263/269 [01:34<00:01,  3.18it/s][A
Training:  99%|█████████▊| 265/269 [01:35<00:01,  2.66it/s][A
Training:  99%|█████████▉| 267/269 [01:36<00:00,  3.23it/s][A
Training: 100%|██████████| 269/269 [01:36<00:00,  3.33it/s][A
                                                           [A

Epoch: 25/96 - Loss: 12577.9072 - Accuracy: 0.9165



  0%|          | 0/34 [00:00<?, ?it/s][A
  3%|▎         | 1/34 [00:02<01:10,  2.14s/it][A
 15%|█▍        | 5/34 [00:03<00:15,  1.82it/s][A
 26%|██▋       | 9/34 [00:04<00:10,  2.36it/s][A
 32%|███▏      | 11/34 [00:04<00:07,  3.12it/s][A
 38%|███▊      | 13/34 [00:05<00:08,  2.40it/s][A
 44%|████▍     | 15/34 [00:06<00:05,  3.19it/s][A
 50%|█████     | 17/34 [00:07<00:06,  2.64it/s][A
 62%|██████▏   | 21/34 [00:08<00:04,  3.15it/s][A
 68%|██████▊   | 23/34 [00:08<00:02,  3.91it/s][A
 74%|███████▎  | 25/34 [00:09<00:03,  2.96it/s][A
 85%|████████▌ | 29/34 [00:10<00:01,  3.11it/s][A
 94%|█████████▍| 32/34 [00:10<00:00,  4.26it/s][A
100%|██████████| 34/34 [00:11<00:00,  2.85it/s][A
Epochs:  26%|██▌       | 25/96 [45:01<2:09:47, 109.68s/it]

Val Loss: 14330.2861 - Val Accuracy: 0.9202



Training:   0%|          | 0/269 [00:00<?, ?it/s][A
Training:   0%|          | 1/269 [00:01<08:47,  1.97s/it][A
Training:   1%|          | 2/269 [00:02<04:24,  1.01it/s][A
Training:   1%|▏         | 4/269 [00:02<01:47,  2.47it/s][A
Training:   2%|▏         | 5/269 [00:03<02:34,  1.71it/s][A
Training:   2%|▏         | 6/269 [00:03<02:21,  1.86it/s][A
Training:   3%|▎         | 9/269 [00:04<01:52,  2.31it/s][A
Training:   4%|▎         | 10/269 [00:05<01:49,  2.36it/s][A
Training:   4%|▍         | 12/269 [00:05<01:13,  3.50it/s][A
Training:   5%|▍         | 13/269 [00:06<01:45,  2.42it/s][A
Training:   5%|▌         | 14/269 [00:06<01:46,  2.39it/s][A
Training:   6%|▌         | 16/269 [00:06<01:11,  3.55it/s][A
Training:   6%|▋         | 17/269 [00:07<01:38,  2.57it/s][A
Training:   7%|▋         | 18/269 [00:08<01:45,  2.38it/s][A
Training:   7%|▋         | 20/269 [00:08<01:07,  3.67it/s][A
Training:   8%|▊         | 21/269 [00:08<01:32,  2.68it/s][A
Training:   8%|▊      

Training:  92%|█████████▏| 247/269 [01:28<00:06,  3.21it/s][A
Training:  93%|█████████▎| 249/269 [01:29<00:07,  2.58it/s][A
Training:  93%|█████████▎| 251/269 [01:29<00:05,  3.36it/s][A
Training:  94%|█████████▍| 253/269 [01:30<00:06,  2.53it/s][A
Training:  96%|█████████▌| 257/269 [01:32<00:04,  2.56it/s][A
Training:  96%|█████████▋| 259/269 [01:32<00:03,  3.24it/s][A
Training:  97%|█████████▋| 261/269 [01:33<00:02,  2.72it/s][A
Training:  98%|█████████▊| 263/269 [01:33<00:01,  3.45it/s][A
Training:  99%|█████████▊| 265/269 [01:34<00:01,  2.72it/s][A
Training: 100%|█████████▉| 268/269 [01:35<00:00,  4.11it/s][A
                                                           [A

Epoch: 26/96 - Loss: 12279.2188 - Accuracy: 0.9146



  0%|          | 0/34 [00:00<?, ?it/s][A
  3%|▎         | 1/34 [00:01<00:59,  1.81s/it][A
  9%|▉         | 3/34 [00:01<00:16,  1.88it/s][A
 15%|█▍        | 5/34 [00:03<00:15,  1.88it/s][A
 24%|██▎       | 8/34 [00:03<00:07,  3.63it/s][A
 29%|██▉       | 10/34 [00:04<00:08,  2.92it/s][A
 38%|███▊      | 13/34 [00:05<00:07,  2.91it/s][A
 47%|████▋     | 16/34 [00:05<00:04,  4.36it/s][A
 53%|█████▎    | 18/34 [00:06<00:05,  3.11it/s][A
 56%|█████▌    | 19/34 [00:06<00:04,  3.48it/s][A
 62%|██████▏   | 21/34 [00:07<00:04,  2.77it/s][A
 68%|██████▊   | 23/34 [00:07<00:03,  3.66it/s][A
 74%|███████▎  | 25/34 [00:08<00:03,  2.83it/s][A
 79%|███████▉  | 27/34 [00:08<00:01,  3.72it/s][A
 85%|████████▌ | 29/34 [00:10<00:01,  2.73it/s][A
100%|██████████| 34/34 [00:11<00:00,  2.96it/s][A
Epochs:  27%|██▋       | 26/96 [46:49<2:07:12, 109.04s/it]

Val Loss: 11998.5801 - Val Accuracy: 0.9039



Training:   0%|          | 0/269 [00:00<?, ?it/s][A
Training:   0%|          | 1/269 [00:02<10:25,  2.33s/it][A
Training:   1%|          | 2/269 [00:02<04:32,  1.02s/it][A
Training:   1%|▏         | 4/269 [00:02<01:52,  2.35it/s][A
Training:   2%|▏         | 5/269 [00:03<02:56,  1.50it/s][A
Training:   3%|▎         | 7/269 [00:03<01:40,  2.60it/s][A
Training:   3%|▎         | 9/269 [00:05<02:02,  2.13it/s][A
Training:   4%|▎         | 10/269 [00:05<01:48,  2.39it/s][A
Training:   5%|▍         | 13/269 [00:06<01:52,  2.27it/s][A
Training:   5%|▌         | 14/269 [00:06<01:36,  2.64it/s][A
Training:   6%|▌         | 15/269 [00:06<01:21,  3.13it/s][A
Training:   6%|▋         | 17/269 [00:08<01:48,  2.32it/s][A
Training:   7%|▋         | 18/269 [00:08<01:31,  2.74it/s][A
Training:   7%|▋         | 20/269 [00:08<01:02,  4.01it/s][A
Training:   8%|▊         | 21/269 [00:09<01:44,  2.37it/s][A
Training:   8%|▊         | 22/269 [00:09<01:33,  2.64it/s][A
Training:   9%|▉      

Training:  75%|███████▌  | 202/269 [01:13<00:18,  3.65it/s][A
Training:  75%|███████▌  | 203/269 [01:14<00:26,  2.52it/s][A
Training:  76%|███████▌  | 204/269 [01:14<00:20,  3.12it/s][A
Training:  76%|███████▌  | 205/269 [01:14<00:18,  3.42it/s][A
Training:  77%|███████▋  | 206/269 [01:15<00:20,  3.10it/s][A
Training:  77%|███████▋  | 207/269 [01:15<00:25,  2.47it/s][A
Training:  78%|███████▊  | 209/269 [01:16<00:17,  3.36it/s][A
Training:  78%|███████▊  | 210/269 [01:16<00:19,  3.06it/s][A
Training:  78%|███████▊  | 211/269 [01:16<00:19,  2.94it/s][A
Training:  79%|███████▉  | 213/269 [01:17<00:15,  3.66it/s][A
Training:  80%|███████▉  | 214/269 [01:17<00:17,  3.12it/s][A
Training:  80%|███████▉  | 215/269 [01:18<00:20,  2.67it/s][A
Training:  81%|████████  | 217/269 [01:18<00:15,  3.35it/s][A
Training:  81%|████████  | 218/269 [01:19<00:16,  3.14it/s][A
Training:  81%|████████▏ | 219/269 [01:19<00:19,  2.56it/s][A
Training:  82%|████████▏ | 221/269 [01:20<00:16,  2.85i

Epoch: 27/96 - Loss: 13227.2246 - Accuracy: 0.9168



  0%|          | 0/34 [00:00<?, ?it/s][A
  3%|▎         | 1/34 [00:02<01:07,  2.06s/it][A
  9%|▉         | 3/34 [00:02<00:17,  1.74it/s][A
 15%|█▍        | 5/34 [00:03<00:14,  1.99it/s][A
 26%|██▋       | 9/34 [00:04<00:09,  2.72it/s][A
 32%|███▏      | 11/34 [00:04<00:06,  3.56it/s][A
 35%|███▌      | 12/34 [00:04<00:05,  3.99it/s][A
 38%|███▊      | 13/34 [00:05<00:08,  2.56it/s][A
 47%|████▋     | 16/34 [00:05<00:04,  4.41it/s][A
 53%|█████▎    | 18/34 [00:06<00:05,  3.17it/s][A
 62%|██████▏   | 21/34 [00:07<00:04,  2.85it/s][A
 71%|███████   | 24/34 [00:07<00:02,  4.23it/s][A
 76%|███████▋  | 26/34 [00:09<00:02,  2.93it/s][A
 85%|████████▌ | 29/34 [00:10<00:01,  2.75it/s][A
 91%|█████████ | 31/34 [00:10<00:00,  3.49it/s][A
100%|██████████| 34/34 [00:11<00:00,  2.94it/s][A
Epochs:  28%|██▊       | 27/96 [48:38<2:05:21, 109.01s/it]

Val Loss: 13768.7900 - Val Accuracy: 0.9092



Training:   0%|          | 0/269 [00:00<?, ?it/s][A
Training:   0%|          | 1/269 [00:02<09:23,  2.10s/it][A
Training:   1%|          | 3/269 [00:02<02:47,  1.59it/s][A
Training:   2%|▏         | 5/269 [00:03<02:36,  1.69it/s][A
Training:   3%|▎         | 7/269 [00:03<01:37,  2.69it/s][A
Training:   3%|▎         | 9/269 [00:05<02:12,  1.96it/s][A
Training:   4%|▍         | 11/269 [00:05<01:35,  2.71it/s][A
Training:   5%|▍         | 13/269 [00:06<01:53,  2.25it/s][A
Training:   6%|▌         | 15/269 [00:06<01:28,  2.86it/s][A
Training:   6%|▋         | 17/269 [00:07<01:38,  2.56it/s][A
Training:   7%|▋         | 19/269 [00:07<01:16,  3.26it/s][A
Training:   8%|▊         | 21/269 [00:09<01:41,  2.45it/s][A
Training:   9%|▊         | 23/269 [00:09<01:20,  3.07it/s][A
Training:   9%|▉         | 24/269 [00:09<01:10,  3.50it/s][A
Training:   9%|▉         | 25/269 [00:10<01:47,  2.27it/s][A
Training:  10%|█         | 27/269 [00:10<01:16,  3.18it/s][A
Training:  11%|█     

Training:  87%|████████▋ | 233/269 [01:26<00:14,  2.41it/s][A
Training:  88%|████████▊ | 236/269 [01:26<00:09,  3.54it/s][A
Training:  88%|████████▊ | 238/269 [01:27<00:11,  2.65it/s][A
Training:  90%|████████▉ | 241/269 [01:29<00:12,  2.26it/s][A
Training:  90%|█████████ | 243/269 [01:29<00:09,  2.88it/s][A
Training:  91%|█████████ | 245/269 [01:30<00:09,  2.40it/s][A
Training:  91%|█████████▏| 246/269 [01:30<00:08,  2.72it/s][A
Training:  92%|█████████▏| 247/269 [01:31<00:07,  3.14it/s][A
Training:  93%|█████████▎| 249/269 [01:32<00:08,  2.47it/s][A
Training:  93%|█████████▎| 251/269 [01:32<00:05,  3.37it/s][A
Training:  94%|█████████▍| 253/269 [01:33<00:06,  2.39it/s][A
Training:  95%|█████████▍| 255/269 [01:33<00:04,  3.27it/s][A
Training:  96%|█████████▌| 257/269 [01:35<00:04,  2.43it/s][A
Training:  96%|█████████▋| 259/269 [01:35<00:03,  3.29it/s][A
Training:  97%|█████████▋| 261/269 [01:36<00:03,  2.34it/s][A
Training:  97%|█████████▋| 262/269 [01:36<00:02,  2.71i

Epoch: 28/96 - Loss: 13652.7334 - Accuracy: 0.9165



  0%|          | 0/34 [00:00<?, ?it/s][A
  3%|▎         | 1/34 [00:01<01:01,  1.86s/it][A
  6%|▌         | 2/34 [00:01<00:26,  1.20it/s][A
 15%|█▍        | 5/34 [00:02<00:13,  2.20it/s][A
 18%|█▊        | 6/34 [00:03<00:10,  2.70it/s][A
 26%|██▋       | 9/34 [00:04<00:09,  2.60it/s][A
 32%|███▏      | 11/34 [00:04<00:06,  3.60it/s][A
 38%|███▊      | 13/34 [00:05<00:08,  2.56it/s][A
 50%|█████     | 17/34 [00:06<00:05,  3.01it/s][A
 56%|█████▌    | 19/34 [00:06<00:03,  3.78it/s][A
 59%|█████▉    | 20/34 [00:06<00:03,  4.15it/s][A
 62%|██████▏   | 21/34 [00:07<00:04,  2.64it/s][A
 71%|███████   | 24/34 [00:08<00:02,  4.38it/s][A
 76%|███████▋  | 26/34 [00:09<00:02,  3.08it/s][A
 82%|████████▏ | 28/34 [00:09<00:01,  3.90it/s][A
 88%|████████▊ | 30/34 [00:10<00:01,  2.86it/s][A
100%|██████████| 34/34 [00:11<00:00,  2.90it/s][A
Epochs:  29%|██▉       | 28/96 [50:29<2:04:10, 109.57s/it]

Val Loss: 14829.9922 - Val Accuracy: 0.9088



Training:   0%|          | 0/269 [00:00<?, ?it/s][A
Training:   0%|          | 1/269 [00:02<08:56,  2.00s/it][A
Training:   1%|          | 2/269 [00:02<04:33,  1.02s/it][A
Training:   2%|▏         | 5/269 [00:03<02:27,  1.78it/s][A
Training:   2%|▏         | 6/269 [00:03<02:15,  1.94it/s][A
Training:   3%|▎         | 7/269 [00:03<01:46,  2.47it/s][A
Training:   3%|▎         | 9/269 [00:05<02:08,  2.03it/s][A
Training:   4%|▎         | 10/269 [00:05<01:57,  2.21it/s][A
Training:   4%|▍         | 12/269 [00:05<01:16,  3.38it/s][A
Training:   5%|▍         | 13/269 [00:06<01:53,  2.26it/s][A
Training:   5%|▌         | 14/269 [00:06<01:41,  2.52it/s][A
Training:   6%|▌         | 16/269 [00:06<01:04,  3.90it/s][A
Training:   6%|▋         | 17/269 [00:08<01:51,  2.26it/s][A
Training:   7%|▋         | 18/269 [00:08<01:58,  2.12it/s][A
Training:   7%|▋         | 20/269 [00:08<01:17,  3.20it/s][A
Training:   8%|▊         | 21/269 [00:09<01:50,  2.24it/s][A
Training:   8%|▊      

Training:  77%|███████▋  | 207/269 [01:17<00:22,  2.73it/s][A
Training:  78%|███████▊  | 209/269 [01:17<00:21,  2.74it/s][A
Training:  78%|███████▊  | 211/269 [01:18<00:20,  2.85it/s][A
Training:  79%|███████▉  | 213/269 [01:19<00:20,  2.74it/s][A
Training:  80%|███████▉  | 215/269 [01:19<00:19,  2.84it/s][A
Training:  81%|████████  | 217/269 [01:20<00:19,  2.68it/s][A
Training:  81%|████████▏ | 219/269 [01:21<00:15,  3.23it/s][A
Training:  82%|████████▏ | 221/269 [01:22<00:18,  2.59it/s][A
Training:  83%|████████▎ | 222/269 [01:22<00:15,  2.97it/s][A
Training:  83%|████████▎ | 223/269 [01:22<00:15,  3.01it/s][A
Training:  84%|████████▎ | 225/269 [01:23<00:18,  2.40it/s][A
Training:  84%|████████▍ | 227/269 [01:24<00:14,  2.82it/s][A
Training:  85%|████████▌ | 229/269 [01:25<00:15,  2.52it/s][A
Training:  86%|████████▌ | 231/269 [01:25<00:13,  2.90it/s][A
Training:  87%|████████▋ | 233/269 [01:26<00:14,  2.48it/s][A
Training:  87%|████████▋ | 235/269 [01:27<00:12,  2.78i

Epoch: 29/96 - Loss: 14213.4219 - Accuracy: 0.9144



  0%|          | 0/34 [00:00<?, ?it/s][A
  3%|▎         | 1/34 [00:01<00:50,  1.52s/it][A
  6%|▌         | 2/34 [00:01<00:26,  1.21it/s][A
 15%|█▍        | 5/34 [00:02<00:13,  2.22it/s][A
 18%|█▊        | 6/34 [00:03<00:12,  2.30it/s][A
 24%|██▎       | 8/34 [00:03<00:07,  3.65it/s][A
 26%|██▋       | 9/34 [00:03<00:09,  2.71it/s][A
 29%|██▉       | 10/34 [00:04<00:09,  2.63it/s][A
 38%|███▊      | 13/34 [00:04<00:06,  3.43it/s][A
 41%|████      | 14/34 [00:05<00:07,  2.76it/s][A
 47%|████▋     | 16/34 [00:05<00:04,  3.94it/s][A
 50%|█████     | 17/34 [00:06<00:04,  3.67it/s][A
 53%|█████▎    | 18/34 [00:06<00:05,  2.69it/s][A
 62%|██████▏   | 21/34 [00:07<00:03,  3.67it/s][A
 65%|██████▍   | 22/34 [00:08<00:04,  2.87it/s][A
 68%|██████▊   | 23/34 [00:08<00:03,  3.36it/s][A
 74%|███████▎  | 25/34 [00:08<00:02,  3.43it/s][A
 76%|███████▋  | 26/34 [00:09<00:02,  2.84it/s][A
 85%|████████▌ | 29/34 [00:09<00:01,  3.51it/s][A
 88%|████████▊ | 30/34 [00:10<00:01,  2.70it/

Val Loss: 13183.8506 - Val Accuracy: 0.9103



Training:   0%|          | 0/269 [00:00<?, ?it/s][A
Training:   0%|          | 1/269 [00:02<09:37,  2.15s/it][A
Training:   1%|          | 2/269 [00:02<04:25,  1.01it/s][A
Training:   2%|▏         | 5/269 [00:03<02:30,  1.76it/s][A
Training:   2%|▏         | 6/269 [00:03<02:11,  2.00it/s][A
Training:   3%|▎         | 9/269 [00:05<01:58,  2.20it/s][A
Training:   4%|▎         | 10/269 [00:05<01:49,  2.36it/s][A
Training:   5%|▍         | 13/269 [00:06<01:40,  2.54it/s][A
Training:   5%|▌         | 14/269 [00:06<01:32,  2.74it/s][A
Training:   6%|▋         | 17/269 [00:07<01:33,  2.68it/s][A
Training:   7%|▋         | 18/269 [00:08<01:27,  2.88it/s][A
Training:   8%|▊         | 21/269 [00:09<01:29,  2.77it/s][A
Training:   9%|▊         | 23/269 [00:09<01:08,  3.59it/s][A
Training:   9%|▉         | 24/269 [00:09<01:02,  3.90it/s][A
Training:   9%|▉         | 25/269 [00:10<01:37,  2.51it/s][A
Training:  10%|▉         | 26/269 [00:10<01:30,  2.69it/s][A
Training:  10%|█     

Training:  72%|███████▏  | 195/269 [01:10<00:22,  3.24it/s][A
Training:  73%|███████▎  | 196/269 [01:11<00:19,  3.74it/s][A
Training:  73%|███████▎  | 197/269 [01:12<00:30,  2.35it/s][A
Training:  74%|███████▍  | 199/269 [01:12<00:20,  3.45it/s][A
Training:  75%|███████▍  | 201/269 [01:13<00:28,  2.39it/s][A
Training:  75%|███████▌  | 203/269 [01:13<00:19,  3.43it/s][A
Training:  76%|███████▌  | 205/269 [01:14<00:25,  2.55it/s][A
Training:  77%|███████▋  | 207/269 [01:14<00:18,  3.43it/s][A
Training:  78%|███████▊  | 209/269 [01:16<00:23,  2.59it/s][A
Training:  78%|███████▊  | 211/269 [01:16<00:17,  3.30it/s][A
Training:  79%|███████▉  | 213/269 [01:17<00:22,  2.53it/s][A
Training:  80%|███████▉  | 215/269 [01:17<00:17,  3.17it/s][A
Training:  81%|████████  | 217/269 [01:19<00:20,  2.48it/s][A
Training:  81%|████████▏ | 219/269 [01:19<00:16,  3.08it/s][A
Training:  82%|████████▏ | 221/269 [01:20<00:19,  2.51it/s][A
Training:  83%|████████▎ | 223/269 [01:21<00:16,  2.78i

Epoch: 30/96 - Loss: 13561.4268 - Accuracy: 0.9160



  0%|          | 0/34 [00:00<?, ?it/s][A
  3%|▎         | 1/34 [00:01<01:01,  1.88s/it][A
  6%|▌         | 2/34 [00:01<00:26,  1.20it/s][A
 12%|█▏        | 4/34 [00:02<00:10,  2.80it/s][A
 15%|█▍        | 5/34 [00:03<00:14,  1.94it/s][A
 21%|██        | 7/34 [00:03<00:08,  3.31it/s][A
 26%|██▋       | 9/34 [00:04<00:09,  2.59it/s][A
 32%|███▏      | 11/34 [00:04<00:06,  3.63it/s][A
 38%|███▊      | 13/34 [00:05<00:07,  2.72it/s][A
 47%|████▋     | 16/34 [00:05<00:04,  4.40it/s][A
 53%|█████▎    | 18/34 [00:06<00:05,  2.92it/s][A
 62%|██████▏   | 21/34 [00:07<00:04,  2.98it/s][A
 68%|██████▊   | 23/34 [00:07<00:03,  3.57it/s][A
 74%|███████▎  | 25/34 [00:09<00:03,  2.73it/s][A
 82%|████████▏ | 28/34 [00:09<00:01,  3.97it/s][A
 85%|████████▌ | 29/34 [00:10<00:01,  2.68it/s][A
 91%|█████████ | 31/34 [00:10<00:00,  3.57it/s][A
100%|██████████| 34/34 [00:11<00:00,  2.90it/s][A
Epochs:  31%|███▏      | 30/96 [54:09<2:00:48, 109.82s/it]

Val Loss: 14379.6221 - Val Accuracy: 0.9128



Training:   0%|          | 0/269 [00:00<?, ?it/s][A
Training:   0%|          | 1/269 [00:02<10:06,  2.26s/it][A
Training:   1%|          | 3/269 [00:02<02:47,  1.59it/s][A
Training:   2%|▏         | 5/269 [00:03<02:53,  1.52it/s][A
Training:   3%|▎         | 7/269 [00:03<01:46,  2.47it/s][A
Training:   3%|▎         | 9/269 [00:05<02:15,  1.93it/s][A
Training:   4%|▎         | 10/269 [00:05<01:52,  2.30it/s][A
Training:   5%|▍         | 13/269 [00:06<01:41,  2.53it/s][A
Training:   5%|▌         | 14/269 [00:06<01:26,  2.93it/s][A
Training:   6%|▌         | 16/269 [00:06<01:01,  4.14it/s][A
Training:   7%|▋         | 18/269 [00:08<01:36,  2.60it/s][A
Training:   7%|▋         | 19/269 [00:08<01:25,  2.94it/s][A
Training:   8%|▊         | 21/269 [00:09<01:33,  2.65it/s][A
Training:   8%|▊         | 22/269 [00:09<01:29,  2.75it/s][A
Training:   9%|▊         | 23/269 [00:09<01:15,  3.26it/s][A
Training:   9%|▉         | 25/269 [00:10<01:34,  2.57it/s][A
Training:  10%|█     

Training:  70%|███████   | 189/269 [01:09<00:29,  2.75it/s][A
Training:  71%|███████   | 190/269 [01:10<00:37,  2.13it/s][A
Training:  71%|███████▏  | 192/269 [01:10<00:30,  2.55it/s][A
Training:  72%|███████▏  | 194/269 [01:11<00:30,  2.43it/s][A
Training:  73%|███████▎  | 196/269 [01:12<00:25,  2.91it/s][A
Training:  74%|███████▎  | 198/269 [01:12<00:24,  2.85it/s][A
Training:  74%|███████▍  | 200/269 [01:13<00:23,  2.93it/s][A
Training:  75%|███████▍  | 201/269 [01:13<00:22,  3.08it/s][A
Training:  75%|███████▌  | 202/269 [01:14<00:24,  2.78it/s][A
Training:  76%|███████▌  | 204/269 [01:14<00:20,  3.23it/s][A
Training:  76%|███████▌  | 205/269 [01:15<00:20,  3.07it/s][A
Training:  77%|███████▋  | 206/269 [01:15<00:22,  2.84it/s][A
Training:  77%|███████▋  | 208/269 [01:16<00:17,  3.46it/s][A
Training:  78%|███████▊  | 209/269 [01:16<00:20,  2.87it/s][A
Training:  78%|███████▊  | 210/269 [01:17<00:21,  2.72it/s][A
Training:  79%|███████▉  | 212/269 [01:17<00:19,  2.93i

Epoch: 31/96 - Loss: 13495.1230 - Accuracy: 0.9213



  0%|          | 0/34 [00:00<?, ?it/s][A
  3%|▎         | 1/34 [00:01<01:00,  1.83s/it][A
  6%|▌         | 2/34 [00:01<00:26,  1.19it/s][A
 15%|█▍        | 5/34 [00:03<00:15,  1.88it/s][A
 26%|██▋       | 9/34 [00:04<00:09,  2.70it/s][A
 29%|██▉       | 10/34 [00:04<00:07,  3.07it/s][A
 38%|███▊      | 13/34 [00:05<00:07,  2.84it/s][A
 41%|████      | 14/34 [00:05<00:06,  3.20it/s][A
 50%|█████     | 17/34 [00:06<00:06,  2.79it/s][A
 56%|█████▌    | 19/34 [00:06<00:04,  3.69it/s][A
 62%|██████▏   | 21/34 [00:07<00:04,  2.98it/s][A
 65%|██████▍   | 22/34 [00:08<00:03,  3.23it/s][A
 71%|███████   | 24/34 [00:08<00:02,  4.34it/s][A
 74%|███████▎  | 25/34 [00:09<00:03,  2.95it/s][A
 76%|███████▋  | 26/34 [00:09<00:02,  2.84it/s][A
 82%|████████▏ | 28/34 [00:09<00:01,  4.09it/s][A
 85%|████████▌ | 29/34 [00:10<00:01,  2.84it/s][A
 88%|████████▊ | 30/34 [00:10<00:01,  2.95it/s][A
100%|██████████| 34/34 [00:11<00:00,  2.93it/s][A
Epochs:  32%|███▏      | 31/96 [55:59<1:59:

Val Loss: 13730.7266 - Val Accuracy: 0.9247



Training:   0%|          | 0/269 [00:00<?, ?it/s][A
Training:   0%|          | 1/269 [00:02<09:13,  2.07s/it][A
Training:   1%|          | 2/269 [00:02<04:09,  1.07it/s][A
Training:   2%|▏         | 5/269 [00:03<02:34,  1.71it/s][A
Training:   2%|▏         | 6/269 [00:03<02:04,  2.11it/s][A
Training:   3%|▎         | 8/269 [00:03<01:17,  3.35it/s][A
Training:   3%|▎         | 9/269 [00:04<02:09,  2.01it/s][A
Training:   4%|▎         | 10/269 [00:05<01:50,  2.34it/s][A
Training:   5%|▍         | 13/269 [00:06<01:50,  2.32it/s][A
Training:   5%|▌         | 14/269 [00:06<01:44,  2.43it/s][A
Training:   6%|▌         | 16/269 [00:06<01:11,  3.55it/s][A
Training:   6%|▋         | 17/269 [00:07<01:37,  2.58it/s][A
Training:   7%|▋         | 18/269 [00:08<01:40,  2.50it/s][A
Training:   8%|▊         | 21/269 [00:09<01:33,  2.67it/s][A
Training:   8%|▊         | 22/269 [00:09<01:35,  2.59it/s][A
Training:   9%|▉         | 24/269 [00:09<01:06,  3.67it/s][A
Training:   9%|▉      

Training:  78%|███████▊  | 210/269 [01:17<00:23,  2.51it/s][A
Training:  79%|███████▉  | 213/269 [01:17<00:14,  3.78it/s][A
Training:  80%|███████▉  | 215/269 [01:18<00:19,  2.80it/s][A
Training:  81%|████████  | 218/269 [01:20<00:19,  2.60it/s][A
Training:  82%|████████▏ | 220/269 [01:20<00:14,  3.30it/s][A
Training:  82%|████████▏ | 221/269 [01:20<00:13,  3.67it/s][A
Training:  83%|████████▎ | 222/269 [01:21<00:21,  2.24it/s][A
Training:  84%|████████▎ | 225/269 [01:21<00:13,  3.37it/s][A
Training:  84%|████████▍ | 226/269 [01:23<00:19,  2.23it/s][A
Training:  85%|████████▍ | 228/269 [01:23<00:13,  3.13it/s][A
Training:  86%|████████▌ | 230/269 [01:24<00:16,  2.41it/s][A
Training:  87%|████████▋ | 233/269 [01:24<00:10,  3.45it/s][A
Training:  87%|████████▋ | 234/269 [01:26<00:15,  2.25it/s][A
Training:  88%|████████▊ | 236/269 [01:26<00:10,  3.09it/s][A
Training:  88%|████████▊ | 237/269 [01:26<00:10,  3.11it/s][A
Training:  88%|████████▊ | 238/269 [01:27<00:14,  2.11i

Epoch: 32/96 - Loss: 13505.3555 - Accuracy: 0.9147



  0%|          | 0/34 [00:00<?, ?it/s][A
  3%|▎         | 1/34 [00:01<00:55,  1.68s/it][A
  6%|▌         | 2/34 [00:01<00:24,  1.33it/s][A
 15%|█▍        | 5/34 [00:02<00:13,  2.19it/s][A
 18%|█▊        | 6/34 [00:03<00:11,  2.54it/s][A
 24%|██▎       | 8/34 [00:03<00:07,  3.63it/s][A
 26%|██▋       | 9/34 [00:03<00:09,  2.64it/s][A
 29%|██▉       | 10/34 [00:04<00:07,  3.22it/s][A
 32%|███▏      | 11/34 [00:04<00:05,  3.90it/s][A
 35%|███▌      | 12/34 [00:04<00:04,  4.62it/s][A
 38%|███▊      | 13/34 [00:04<00:07,  2.82it/s][A
 41%|████      | 14/34 [00:05<00:05,  3.47it/s][A
 44%|████▍     | 15/34 [00:05<00:05,  3.73it/s][A
 47%|████▋     | 16/34 [00:05<00:04,  4.48it/s][A
 50%|█████     | 17/34 [00:06<00:06,  2.75it/s][A
 56%|█████▌    | 19/34 [00:06<00:04,  3.53it/s][A
 62%|██████▏   | 21/34 [00:07<00:04,  2.83it/s][A
 68%|██████▊   | 23/34 [00:07<00:03,  3.59it/s][A
 74%|███████▎  | 25/34 [00:08<00:02,  3.14it/s][A
 76%|███████▋  | 26/34 [00:08<00:02,  3.53it/

Val Loss: 16083.5371 - Val Accuracy: 0.9275



Training:   0%|          | 0/269 [00:00<?, ?it/s][A
Training:   0%|          | 1/269 [00:02<11:31,  2.58s/it][A
Training:   1%|          | 3/269 [00:02<03:13,  1.38it/s][A
Training:   2%|▏         | 5/269 [00:03<02:52,  1.53it/s][A
Training:   3%|▎         | 7/269 [00:04<01:44,  2.50it/s][A
Training:   3%|▎         | 9/269 [00:05<02:17,  1.89it/s][A
Training:   4%|▍         | 12/269 [00:05<01:21,  3.16it/s][A
Training:   5%|▌         | 14/269 [00:07<01:51,  2.28it/s][A
Training:   6%|▌         | 16/269 [00:07<01:23,  3.04it/s][A
Training:   6%|▋         | 17/269 [00:08<02:03,  2.04it/s][A
Training:   7%|▋         | 19/269 [00:08<01:28,  2.82it/s][A
Training:   8%|▊         | 21/269 [00:09<01:50,  2.25it/s][A
Training:   9%|▉         | 24/269 [00:10<01:07,  3.62it/s][A
Training:  10%|▉         | 26/269 [00:11<01:30,  2.68it/s][A
Training:  10%|█         | 28/269 [00:11<01:09,  3.48it/s][A
Training:  11%|█         | 30/269 [00:12<01:39,  2.41it/s][A
Training:  12%|█▏    

Epoch: 33/96 - Loss: 13276.7197 - Accuracy: 0.9162



  0%|          | 0/34 [00:00<?, ?it/s][A
  3%|▎         | 1/34 [00:02<01:07,  2.03s/it][A
  9%|▉         | 3/34 [00:02<00:17,  1.74it/s][A
 15%|█▍        | 5/34 [00:03<00:16,  1.73it/s][A
 26%|██▋       | 9/34 [00:04<00:09,  2.52it/s][A
 35%|███▌      | 12/34 [00:04<00:05,  3.89it/s][A
 41%|████      | 14/34 [00:05<00:07,  2.84it/s][A
 47%|████▋     | 16/34 [00:05<00:04,  3.72it/s][A
 53%|█████▎    | 18/34 [00:07<00:05,  2.79it/s][A
 62%|██████▏   | 21/34 [00:08<00:04,  2.76it/s][A
 71%|███████   | 24/34 [00:08<00:02,  4.01it/s][A
 76%|███████▋  | 26/34 [00:09<00:02,  3.10it/s][A
 85%|████████▌ | 29/34 [00:10<00:01,  3.02it/s][A
 91%|█████████ | 31/34 [00:10<00:00,  3.74it/s][A
100%|██████████| 34/34 [00:11<00:00,  2.94it/s][A
Epochs:  34%|███▍      | 33/96 [59:36<1:54:42, 109.25s/it]

Val Loss: 15245.0488 - Val Accuracy: 0.9260



Training:   0%|          | 0/269 [00:00<?, ?it/s][A
Training:   0%|          | 1/269 [00:02<09:43,  2.18s/it][A
Training:   1%|          | 3/269 [00:02<02:41,  1.65it/s][A
Training:   2%|▏         | 5/269 [00:03<02:36,  1.69it/s][A
Training:   3%|▎         | 7/269 [00:03<01:40,  2.62it/s][A
Training:   3%|▎         | 9/269 [00:04<02:02,  2.13it/s][A
Training:   4%|▍         | 11/269 [00:05<01:27,  2.96it/s][A
Training:   4%|▍         | 12/269 [00:05<01:14,  3.45it/s][A
Training:   5%|▍         | 13/269 [00:06<01:54,  2.24it/s][A
Training:   5%|▌         | 14/269 [00:06<01:33,  2.71it/s][A
Training:   6%|▌         | 15/269 [00:06<01:19,  3.19it/s][A
Training:   6%|▋         | 17/269 [00:07<01:41,  2.48it/s][A
Training:   7%|▋         | 19/269 [00:07<01:19,  3.16it/s][A
Training:   8%|▊         | 21/269 [00:08<01:31,  2.71it/s][A
Training:   8%|▊         | 22/269 [00:08<01:20,  3.08it/s][A
Training:   9%|▊         | 23/269 [00:09<01:25,  2.88it/s][A
Training:   9%|▉     

Training:  70%|██████▉   | 188/269 [01:07<00:27,  2.92it/s][A
Training:  70%|███████   | 189/269 [01:08<00:25,  3.12it/s][A
Training:  71%|███████   | 190/269 [01:09<00:38,  2.07it/s][A
Training:  71%|███████▏  | 192/269 [01:09<00:26,  2.92it/s][A
Training:  72%|███████▏  | 193/269 [01:09<00:22,  3.36it/s][A
Training:  72%|███████▏  | 194/269 [01:10<00:36,  2.08it/s][A
Training:  73%|███████▎  | 196/269 [01:10<00:24,  2.98it/s][A
Training:  74%|███████▎  | 198/269 [01:11<00:29,  2.44it/s][A
Training:  74%|███████▍  | 200/269 [01:12<00:21,  3.23it/s][A
Training:  75%|███████▌  | 202/269 [01:13<00:24,  2.69it/s][A
Training:  76%|███████▌  | 204/269 [01:13<00:18,  3.48it/s][A
Training:  76%|███████▌  | 205/269 [01:13<00:17,  3.72it/s][A
Training:  77%|███████▋  | 206/269 [01:14<00:27,  2.27it/s][A
Training:  77%|███████▋  | 208/269 [01:14<00:18,  3.28it/s][A
Training:  78%|███████▊  | 209/269 [01:14<00:16,  3.58it/s][A
Training:  78%|███████▊  | 210/269 [01:15<00:26,  2.24i

Epoch: 34/96 - Loss: 13630.1484 - Accuracy: 0.9226



  0%|          | 0/34 [00:00<?, ?it/s][A
  3%|▎         | 1/34 [00:02<01:09,  2.10s/it][A
  9%|▉         | 3/34 [00:02<00:18,  1.70it/s][A
 15%|█▍        | 5/34 [00:03<00:15,  1.84it/s][A
 24%|██▎       | 8/34 [00:03<00:07,  3.42it/s][A
 29%|██▉       | 10/34 [00:04<00:08,  2.69it/s][A
 35%|███▌      | 12/34 [00:04<00:06,  3.61it/s][A
 38%|███▊      | 13/34 [00:05<00:08,  2.47it/s][A
 41%|████      | 14/34 [00:05<00:07,  2.71it/s][A
 47%|████▋     | 16/34 [00:05<00:04,  3.98it/s][A
 50%|█████     | 17/34 [00:06<00:06,  2.50it/s][A
 53%|█████▎    | 18/34 [00:07<00:05,  2.69it/s][A
 59%|█████▉    | 20/34 [00:07<00:03,  4.03it/s][A
 62%|██████▏   | 21/34 [00:08<00:04,  2.84it/s][A
 65%|██████▍   | 22/34 [00:08<00:04,  2.94it/s][A
 71%|███████   | 24/34 [00:08<00:02,  4.39it/s][A
 74%|███████▎  | 25/34 [00:09<00:03,  2.96it/s][A
 76%|███████▋  | 26/34 [00:09<00:02,  2.72it/s][A
 82%|████████▏ | 28/34 [00:09<00:01,  4.11it/s][A
 85%|████████▌ | 29/34 [00:10<00:01,  2.94i

Val Loss: 17976.5332 - Val Accuracy: 0.8803



Training:   0%|          | 0/269 [00:00<?, ?it/s][A
Training:   0%|          | 1/269 [00:01<07:50,  1.76s/it][A
Training:   1%|          | 3/269 [00:01<02:15,  1.96it/s][A
Training:   2%|▏         | 5/269 [00:03<02:38,  1.67it/s][A
Training:   2%|▏         | 6/269 [00:03<02:03,  2.13it/s][A
Training:   3%|▎         | 9/269 [00:04<01:53,  2.29it/s][A
Training:   5%|▍         | 13/269 [00:06<01:41,  2.52it/s][A
Training:   6%|▋         | 17/269 [00:07<01:30,  2.80it/s][A
Training:   8%|▊         | 21/269 [00:08<01:26,  2.87it/s][A
Training:   8%|▊         | 22/269 [00:08<01:19,  3.10it/s][A
Training:   9%|▉         | 24/269 [00:08<01:03,  3.86it/s][A
Training:   9%|▉         | 25/269 [00:10<01:37,  2.50it/s][A
Training:  10%|█         | 27/269 [00:10<01:13,  3.28it/s][A
Training:  10%|█         | 28/269 [00:10<01:08,  3.50it/s][A
Training:  11%|█         | 29/269 [00:11<01:44,  2.29it/s][A
Training:  12%|█▏        | 31/269 [00:11<01:11,  3.31it/s][A
Training:  12%|█▏    

Training:  71%|███████   | 190/269 [01:08<00:30,  2.58it/s][A
Training:  71%|███████▏  | 192/269 [01:08<00:27,  2.76it/s][A
Training:  72%|███████▏  | 193/269 [01:09<00:25,  2.98it/s][A
Training:  72%|███████▏  | 194/269 [01:09<00:30,  2.44it/s][A
Training:  73%|███████▎  | 196/269 [01:10<00:25,  2.85it/s][A
Training:  73%|███████▎  | 197/269 [01:10<00:23,  3.06it/s][A
Training:  74%|███████▎  | 198/269 [01:11<00:28,  2.50it/s][A
Training:  74%|███████▍  | 200/269 [01:11<00:24,  2.85it/s][A
Training:  75%|███████▍  | 201/269 [01:11<00:21,  3.11it/s][A
Training:  75%|███████▌  | 202/269 [01:12<00:23,  2.81it/s][A
Training:  76%|███████▌  | 204/269 [01:12<00:22,  2.89it/s][A
Training:  76%|███████▌  | 205/269 [01:13<00:21,  2.96it/s][A
Training:  77%|███████▋  | 206/269 [01:13<00:23,  2.64it/s][A
Training:  77%|███████▋  | 208/269 [01:14<00:22,  2.77it/s][A
Training:  78%|███████▊  | 209/269 [01:14<00:21,  2.75it/s][A
Training:  78%|███████▊  | 210/269 [01:15<00:22,  2.66i

Epoch: 35/96 - Loss: 14029.7510 - Accuracy: 0.9156



  0%|          | 0/34 [00:00<?, ?it/s][A
  3%|▎         | 1/34 [00:01<01:04,  1.94s/it][A
 12%|█▏        | 4/34 [00:02<00:12,  2.40it/s][A
 18%|█▊        | 6/34 [00:03<00:13,  2.06it/s][A
 24%|██▎       | 8/34 [00:03<00:08,  3.03it/s][A
 26%|██▋       | 9/34 [00:04<00:12,  1.99it/s][A
 38%|███▊      | 13/34 [00:05<00:07,  2.69it/s][A
 47%|████▋     | 16/34 [00:05<00:04,  4.06it/s][A
 53%|█████▎    | 18/34 [00:06<00:05,  2.93it/s][A
 59%|█████▉    | 20/34 [00:07<00:03,  3.69it/s][A
 65%|██████▍   | 22/34 [00:08<00:04,  2.76it/s][A
 71%|███████   | 24/34 [00:08<00:02,  3.58it/s][A
 74%|███████▎  | 25/34 [00:09<00:03,  2.59it/s][A
 76%|███████▋  | 26/34 [00:09<00:02,  2.97it/s][A
 82%|████████▏ | 28/34 [00:09<00:01,  3.98it/s][A
 85%|████████▌ | 29/34 [00:10<00:01,  2.57it/s][A
 91%|█████████ | 31/34 [00:10<00:00,  3.66it/s][A
 94%|█████████▍| 32/34 [00:10<00:00,  4.05it/s][A
100%|██████████| 34/34 [00:11<00:00,  2.84it/s][A
Epochs:  36%|███▋      | 35/96 [1:03:12<1:50

Val Loss: 13056.9395 - Val Accuracy: 0.9257



Training:   0%|          | 0/269 [00:00<?, ?it/s][A
Training:   0%|          | 1/269 [00:01<08:20,  1.87s/it][A
Training:   1%|          | 2/269 [00:01<03:41,  1.20it/s][A
Training:   2%|▏         | 5/269 [00:03<02:12,  1.99it/s][A
Training:   2%|▏         | 6/269 [00:03<01:50,  2.37it/s][A
Training:   3%|▎         | 8/269 [00:03<01:11,  3.65it/s][A
Training:   3%|▎         | 9/269 [00:04<01:56,  2.23it/s][A
Training:   4%|▎         | 10/269 [00:04<01:41,  2.55it/s][A
Training:   5%|▍         | 13/269 [00:05<01:41,  2.51it/s][A
Training:   6%|▌         | 16/269 [00:06<01:03,  3.98it/s][A
Training:   6%|▋         | 17/269 [00:07<01:40,  2.52it/s][A
Training:   7%|▋         | 18/269 [00:07<01:30,  2.78it/s][A
Training:   7%|▋         | 20/269 [00:07<01:03,  3.94it/s][A
Training:   8%|▊         | 21/269 [00:08<01:42,  2.41it/s][A
Training:   8%|▊         | 22/269 [00:08<01:37,  2.53it/s][A
Training:   9%|▉         | 25/269 [00:10<01:40,  2.43it/s][A
Training:  10%|▉      

Training:  94%|█████████▍| 253/269 [01:30<00:05,  2.83it/s][A
Training:  96%|█████████▌| 257/269 [01:32<00:04,  2.84it/s][A
Training:  96%|█████████▋| 259/269 [01:32<00:02,  3.47it/s][A
Training:  97%|█████████▋| 261/269 [01:33<00:03,  2.50it/s][A
Training:  99%|█████████▊| 265/269 [01:35<00:01,  2.74it/s][A
Training:  99%|█████████▉| 267/269 [01:35<00:00,  3.39it/s][A
Training: 100%|██████████| 269/269 [01:35<00:00,  3.26it/s][A
                                                           [A

Epoch: 36/96 - Loss: 13108.9922 - Accuracy: 0.9202



  0%|          | 0/34 [00:00<?, ?it/s][A
  3%|▎         | 1/34 [00:01<00:53,  1.63s/it][A
  9%|▉         | 3/34 [00:01<00:14,  2.14it/s][A
 15%|█▍        | 5/34 [00:02<00:14,  1.94it/s][A
 24%|██▎       | 8/34 [00:03<00:07,  3.62it/s][A
 29%|██▉       | 10/34 [00:04<00:08,  2.72it/s][A
 32%|███▏      | 11/34 [00:04<00:07,  3.15it/s][A
 38%|███▊      | 13/34 [00:05<00:08,  2.35it/s][A
 41%|████      | 14/34 [00:05<00:07,  2.76it/s][A
 47%|████▋     | 16/34 [00:05<00:04,  3.98it/s][A
 53%|█████▎    | 18/34 [00:07<00:06,  2.62it/s][A
 62%|██████▏   | 21/34 [00:08<00:04,  2.64it/s][A
 68%|██████▊   | 23/34 [00:08<00:03,  3.51it/s][A
 74%|███████▎  | 25/34 [00:09<00:03,  2.71it/s][A
 82%|████████▏ | 28/34 [00:09<00:01,  4.05it/s][A
 88%|████████▊ | 30/34 [00:10<00:01,  3.04it/s][A
100%|██████████| 34/34 [00:11<00:00,  2.85it/s][A
Epochs:  38%|███▊      | 36/96 [1:05:00<1:48:21, 108.36s/it]

Val Loss: 13776.3975 - Val Accuracy: 0.9173



Training:   0%|          | 0/269 [00:00<?, ?it/s][A
Training:   0%|          | 1/269 [00:02<10:06,  2.26s/it][A
Training:   1%|          | 3/269 [00:02<02:48,  1.58it/s][A
Training:   2%|▏         | 5/269 [00:03<02:46,  1.59it/s][A
Training:   3%|▎         | 8/269 [00:03<01:26,  3.02it/s][A
Training:   4%|▎         | 10/269 [00:05<01:50,  2.35it/s][A
Training:   4%|▍         | 12/269 [00:05<01:18,  3.26it/s][A
Training:   5%|▌         | 14/269 [00:06<01:36,  2.65it/s][A
Training:   6%|▌         | 15/269 [00:06<01:24,  3.00it/s][A
Training:   6%|▋         | 17/269 [00:07<01:54,  2.19it/s][A
Training:   7%|▋         | 19/269 [00:07<01:21,  3.08it/s][A
Training:   8%|▊         | 21/269 [00:09<01:52,  2.21it/s][A
Training:   9%|▊         | 23/269 [00:09<01:20,  3.05it/s][A
Training:   9%|▉         | 25/269 [00:10<01:35,  2.55it/s][A
Training:  10%|█         | 27/269 [00:10<01:11,  3.39it/s][A
Training:  11%|█         | 29/269 [00:11<01:34,  2.54it/s][A
Training:  12%|█▏   

Epoch: 37/96 - Loss: 14068.9219 - Accuracy: 0.9162



  0%|          | 0/34 [00:00<?, ?it/s][A
  3%|▎         | 1/34 [00:01<01:02,  1.89s/it][A
 12%|█▏        | 4/34 [00:02<00:12,  2.47it/s][A
 18%|█▊        | 6/34 [00:03<00:12,  2.28it/s][A
 21%|██        | 7/34 [00:03<00:10,  2.58it/s][A
 26%|██▋       | 9/34 [00:04<00:10,  2.47it/s][A
 32%|███▏      | 11/34 [00:04<00:07,  3.20it/s][A
 38%|███▊      | 13/34 [00:05<00:07,  2.71it/s][A
 44%|████▍     | 15/34 [00:05<00:05,  3.32it/s][A
 50%|█████     | 17/34 [00:06<00:06,  2.75it/s][A
 56%|█████▌    | 19/34 [00:06<00:04,  3.40it/s][A
 62%|██████▏   | 21/34 [00:07<00:04,  2.94it/s][A
 68%|██████▊   | 23/34 [00:08<00:03,  3.15it/s][A
 74%|███████▎  | 25/34 [00:09<00:02,  3.02it/s][A
 79%|███████▉  | 27/34 [00:09<00:02,  3.20it/s][A
 85%|████████▌ | 29/34 [00:10<00:01,  3.09it/s][A
 91%|█████████ | 31/34 [00:10<00:00,  3.21it/s][A
100%|██████████| 34/34 [00:11<00:00,  2.90it/s][A
Epochs:  39%|███▊      | 37/96 [1:06:47<1:46:16, 108.08s/it]

Val Loss: 15159.1836 - Val Accuracy: 0.9080



Training:   0%|          | 0/269 [00:00<?, ?it/s][A
Training:   0%|          | 1/269 [00:01<08:06,  1.82s/it][A
Training:   1%|          | 2/269 [00:01<03:43,  1.19it/s][A
Training:   2%|▏         | 5/269 [00:03<02:16,  1.94it/s][A
Training:   2%|▏         | 6/269 [00:03<02:00,  2.19it/s][A
Training:   3%|▎         | 8/269 [00:03<01:16,  3.39it/s][A
Training:   3%|▎         | 9/269 [00:04<02:02,  2.12it/s][A
Training:   4%|▎         | 10/269 [00:04<01:47,  2.41it/s][A
Training:   5%|▍         | 13/269 [00:05<01:38,  2.59it/s][A
Training:   5%|▌         | 14/269 [00:06<01:40,  2.54it/s][A
Training:   6%|▌         | 16/269 [00:06<01:09,  3.62it/s][A
Training:   6%|▋         | 17/269 [00:07<01:49,  2.31it/s][A
Training:   7%|▋         | 18/269 [00:07<01:45,  2.37it/s][A
Training:   8%|▊         | 21/269 [00:08<01:34,  2.64it/s][A
Training:   8%|▊         | 22/269 [00:09<01:33,  2.65it/s][A
Training:   9%|▉         | 24/269 [00:09<01:05,  3.76it/s][A
Training:   9%|▉      

Training:  79%|███████▉  | 212/269 [01:15<00:20,  2.84it/s][A
Training:  79%|███████▉  | 213/269 [01:16<00:22,  2.47it/s][A
Training:  80%|███████▉  | 215/269 [01:16<00:15,  3.50it/s][A
Training:  80%|████████  | 216/269 [01:16<00:19,  2.71it/s][A
Training:  81%|████████  | 217/269 [01:17<00:20,  2.52it/s][A
Training:  81%|████████▏ | 219/269 [01:17<00:14,  3.55it/s][A
Training:  82%|████████▏ | 220/269 [01:18<00:18,  2.67it/s][A
Training:  82%|████████▏ | 221/269 [01:19<00:21,  2.24it/s][A
Training:  83%|████████▎ | 223/269 [01:19<00:13,  3.37it/s][A
Training:  83%|████████▎ | 224/269 [01:19<00:17,  2.65it/s][A
Training:  84%|████████▎ | 225/269 [01:20<00:19,  2.21it/s][A
Training:  85%|████████▍ | 228/269 [01:21<00:14,  2.89it/s][A
Training:  85%|████████▌ | 229/269 [01:22<00:16,  2.37it/s][A
Training:  86%|████████▌ | 232/269 [01:22<00:11,  3.30it/s][A
Training:  87%|████████▋ | 233/269 [01:23<00:15,  2.34it/s][A
Training:  88%|████████▊ | 236/269 [01:23<00:09,  3.32i

Epoch: 38/96 - Loss: 14211.2588 - Accuracy: 0.9153



  0%|          | 0/34 [00:00<?, ?it/s][A
  3%|▎         | 1/34 [00:01<01:02,  1.91s/it][A
 15%|█▍        | 5/34 [00:02<00:14,  2.00it/s][A
 26%|██▋       | 9/34 [00:04<00:09,  2.69it/s][A
 32%|███▏      | 11/34 [00:04<00:06,  3.37it/s][A
 38%|███▊      | 13/34 [00:05<00:07,  2.78it/s][A
 44%|████▍     | 15/34 [00:05<00:05,  3.55it/s][A
 50%|█████     | 17/34 [00:06<00:06,  2.72it/s][A
 62%|██████▏   | 21/34 [00:07<00:04,  3.02it/s][A
 68%|██████▊   | 23/34 [00:07<00:02,  3.74it/s][A
 74%|███████▎  | 25/34 [00:08<00:03,  2.91it/s][A
 79%|███████▉  | 27/34 [00:09<00:01,  3.50it/s][A
 85%|████████▌ | 29/34 [00:10<00:01,  2.93it/s][A
 88%|████████▊ | 30/34 [00:10<00:01,  3.21it/s][A
100%|██████████| 34/34 [00:11<00:00,  2.98it/s][A
Epochs:  40%|███▉      | 38/96 [1:08:35<1:44:18, 107.91s/it]

Val Loss: 13793.0078 - Val Accuracy: 0.9324



Training:   0%|          | 0/269 [00:00<?, ?it/s][A
Training:   0%|          | 1/269 [00:02<09:35,  2.15s/it][A
Training:   1%|▏         | 4/269 [00:02<01:56,  2.27it/s][A
Training:   2%|▏         | 6/269 [00:03<02:23,  1.84it/s][A
Training:   3%|▎         | 9/269 [00:04<02:09,  2.01it/s][A
Training:   4%|▍         | 12/269 [00:05<01:20,  3.21it/s][A
Training:   5%|▌         | 14/269 [00:06<01:43,  2.47it/s][A
Training:   6%|▌         | 16/269 [00:06<01:17,  3.27it/s][A
Training:   7%|▋         | 18/269 [00:07<01:42,  2.46it/s][A
Training:   7%|▋         | 20/269 [00:07<01:16,  3.25it/s][A
Training:   8%|▊         | 22/269 [00:09<01:51,  2.22it/s][A
Training:   9%|▉         | 24/269 [00:09<01:21,  3.01it/s][A
Training:  10%|▉         | 26/269 [00:11<01:49,  2.22it/s][A
Training:  11%|█         | 29/269 [00:12<01:52,  2.13it/s][A
Training:  12%|█▏        | 31/269 [00:12<01:25,  2.79it/s][A
Training:  12%|█▏        | 33/269 [00:14<01:43,  2.28it/s][A
Training:  14%|█▍   

Epoch: 39/96 - Loss: 13826.0645 - Accuracy: 0.9197



  0%|          | 0/34 [00:00<?, ?it/s][A
  3%|▎         | 1/34 [00:01<00:47,  1.43s/it][A
  6%|▌         | 2/34 [00:01<00:22,  1.40it/s][A
 15%|█▍        | 5/34 [00:02<00:12,  2.32it/s][A
 18%|█▊        | 6/34 [00:02<00:10,  2.68it/s][A
 24%|██▎       | 8/34 [00:02<00:06,  4.04it/s][A
 26%|██▋       | 9/34 [00:03<00:09,  2.68it/s][A
 29%|██▉       | 10/34 [00:03<00:07,  3.07it/s][A
 32%|███▏      | 11/34 [00:04<00:06,  3.53it/s][A
 38%|███▊      | 13/34 [00:04<00:07,  2.93it/s][A
 41%|████      | 14/34 [00:05<00:06,  3.14it/s][A
 44%|████▍     | 15/34 [00:05<00:05,  3.67it/s][A
 47%|████▋     | 16/34 [00:05<00:04,  4.38it/s][A
 50%|█████     | 17/34 [00:06<00:05,  2.90it/s][A
 53%|█████▎    | 18/34 [00:06<00:05,  2.74it/s][A
 62%|██████▏   | 21/34 [00:07<00:03,  3.44it/s][A
 65%|██████▍   | 22/34 [00:07<00:03,  3.07it/s][A
 71%|███████   | 24/34 [00:07<00:02,  4.34it/s][A
 74%|███████▎  | 25/34 [00:08<00:02,  3.49it/s][A
 76%|███████▋  | 26/34 [00:08<00:02,  2.90it/

Val Loss: 14375.9668 - Val Accuracy: 0.9346



Training:   0%|          | 0/269 [00:00<?, ?it/s][A
Training:   0%|          | 1/269 [00:02<09:35,  2.15s/it][A
Training:   1%|▏         | 4/269 [00:02<01:55,  2.29it/s][A
Training:   2%|▏         | 6/269 [00:03<02:29,  1.76it/s][A
Training:   3%|▎         | 8/269 [00:03<01:39,  2.62it/s][A
Training:   4%|▎         | 10/269 [00:05<01:56,  2.22it/s][A
Training:   5%|▍         | 13/269 [00:06<01:52,  2.28it/s][A
Training:   5%|▌         | 14/269 [00:06<01:46,  2.39it/s][A
Training:   6%|▌         | 16/269 [00:06<01:17,  3.25it/s][A
Training:   6%|▋         | 17/269 [00:07<01:49,  2.30it/s][A
Training:   7%|▋         | 18/269 [00:08<01:44,  2.41it/s][A
Training:   7%|▋         | 20/269 [00:08<01:09,  3.56it/s][A
Training:   8%|▊         | 21/269 [00:09<01:42,  2.41it/s][A
Training:   8%|▊         | 22/269 [00:09<01:39,  2.48it/s][A
Training:   9%|▉         | 25/269 [00:10<01:41,  2.40it/s][A
Training:  10%|▉         | 26/269 [00:11<01:35,  2.55it/s][A
Training:  10%|█    

Training:  90%|████████▉ | 241/269 [01:25<00:11,  2.54it/s][A
Training:  90%|████████▉ | 242/269 [01:26<00:08,  3.01it/s][A
Training:  91%|█████████ | 244/269 [01:26<00:06,  3.92it/s][A
Training:  91%|█████████ | 245/269 [01:27<00:10,  2.30it/s][A
Training:  92%|█████████▏| 248/269 [01:27<00:05,  3.91it/s][A
Training:  93%|█████████▎| 249/269 [01:28<00:08,  2.33it/s][A
Training:  93%|█████████▎| 251/269 [01:28<00:05,  3.28it/s][A
Training:  94%|█████████▍| 253/269 [01:30<00:06,  2.39it/s][A
Training:  95%|█████████▍| 255/269 [01:30<00:04,  3.26it/s][A
Training:  96%|█████████▌| 257/269 [01:31<00:05,  2.35it/s][A
Training:  96%|█████████▋| 259/269 [01:31<00:03,  3.21it/s][A
Training:  97%|█████████▋| 261/269 [01:33<00:03,  2.46it/s][A
Training:  98%|█████████▊| 263/269 [01:33<00:01,  3.27it/s][A
Training:  98%|█████████▊| 264/269 [01:33<00:01,  3.70it/s][A
Training:  99%|█████████▊| 265/269 [01:34<00:01,  2.22it/s][A
Training: 100%|█████████▉| 268/269 [01:34<00:00,  3.56i

Epoch: 40/96 - Loss: 13576.6631 - Accuracy: 0.9189



  0%|          | 0/34 [00:00<?, ?it/s][A
  3%|▎         | 1/34 [00:01<01:00,  1.84s/it][A
 12%|█▏        | 4/34 [00:01<00:11,  2.66it/s][A
 18%|█▊        | 6/34 [00:03<00:13,  2.12it/s][A
 24%|██▎       | 8/34 [00:03<00:08,  3.21it/s][A
 29%|██▉       | 10/34 [00:04<00:09,  2.53it/s][A
 35%|███▌      | 12/34 [00:04<00:06,  3.52it/s][A
 41%|████      | 14/34 [00:05<00:07,  2.59it/s][A
 47%|████▋     | 16/34 [00:05<00:05,  3.53it/s][A
 53%|█████▎    | 18/34 [00:06<00:05,  2.72it/s][A
 56%|█████▌    | 19/34 [00:07<00:04,  3.12it/s][A
 62%|██████▏   | 21/34 [00:08<00:05,  2.53it/s][A
 71%|███████   | 24/34 [00:08<00:02,  4.00it/s][A
 76%|███████▋  | 26/34 [00:09<00:02,  3.07it/s][A
 85%|████████▌ | 29/34 [00:10<00:01,  2.84it/s][A
 91%|█████████ | 31/34 [00:10<00:00,  3.66it/s][A
100%|██████████| 34/34 [00:11<00:00,  2.89it/s][A
Epochs:  42%|████▏     | 40/96 [1:12:09<1:40:21, 107.53s/it]

Val Loss: 14537.9746 - Val Accuracy: 0.9309



Training:   0%|          | 0/269 [00:00<?, ?it/s][A
Training:   0%|          | 1/269 [00:01<07:42,  1.72s/it][A
Training:   1%|          | 2/269 [00:01<03:29,  1.27it/s][A
Training:   2%|▏         | 5/269 [00:02<02:08,  2.06it/s][A
Training:   3%|▎         | 7/269 [00:03<01:23,  3.14it/s][A
Training:   3%|▎         | 9/269 [00:04<01:51,  2.33it/s][A
Training:   4%|▎         | 10/269 [00:04<01:41,  2.56it/s][A
Training:   4%|▍         | 12/269 [00:04<01:08,  3.75it/s][A
Training:   5%|▍         | 13/269 [00:05<01:41,  2.53it/s][A
Training:   5%|▌         | 14/269 [00:05<01:35,  2.68it/s][A
Training:   6%|▌         | 16/269 [00:06<01:03,  4.01it/s][A
Training:   6%|▋         | 17/269 [00:06<01:34,  2.67it/s][A
Training:   7%|▋         | 18/269 [00:07<01:34,  2.64it/s][A
Training:   7%|▋         | 19/269 [00:07<01:17,  3.25it/s][A
Training:   8%|▊         | 21/269 [00:08<01:20,  3.07it/s][A
Training:   8%|▊         | 22/269 [00:08<01:31,  2.71it/s][A
Training:   9%|▊     

Training:  97%|█████████▋| 262/269 [01:34<00:02,  2.51it/s][A
Training:  99%|█████████▊| 265/269 [01:34<00:01,  3.79it/s][A
Training:  99%|█████████▉| 267/269 [01:35<00:00,  2.96it/s][A
                                                           [A

Epoch: 41/96 - Loss: 13072.5684 - Accuracy: 0.9192



  0%|          | 0/34 [00:00<?, ?it/s][A
  3%|▎         | 1/34 [00:01<00:58,  1.77s/it][A
 15%|█▍        | 5/34 [00:02<00:14,  2.00it/s][A
 24%|██▎       | 8/34 [00:03<00:07,  3.55it/s][A
 29%|██▉       | 10/34 [00:04<00:09,  2.60it/s][A
 35%|███▌      | 12/34 [00:04<00:06,  3.56it/s][A
 41%|████      | 14/34 [00:05<00:07,  2.78it/s][A
 50%|█████     | 17/34 [00:06<00:06,  2.65it/s][A
 56%|█████▌    | 19/34 [00:06<00:04,  3.45it/s][A
 62%|██████▏   | 21/34 [00:07<00:04,  2.75it/s][A
 68%|██████▊   | 23/34 [00:07<00:03,  3.63it/s][A
 74%|███████▎  | 25/34 [00:09<00:03,  2.69it/s][A
 85%|████████▌ | 29/34 [00:10<00:01,  3.12it/s][A
 94%|█████████▍| 32/34 [00:10<00:00,  4.32it/s][A
100%|██████████| 34/34 [00:11<00:00,  2.96it/s][A
Epochs:  43%|████▎     | 41/96 [1:13:56<1:38:25, 107.37s/it]

Val Loss: 15970.6270 - Val Accuracy: 0.9177



Training:   0%|          | 0/269 [00:00<?, ?it/s][A
Training:   0%|          | 1/269 [00:01<08:38,  1.93s/it][A
Training:   1%|▏         | 4/269 [00:02<01:44,  2.53it/s][A
Training:   2%|▏         | 6/269 [00:03<02:06,  2.08it/s][A
Training:   3%|▎         | 8/269 [00:03<01:24,  3.09it/s][A
Training:   4%|▎         | 10/269 [00:04<01:52,  2.31it/s][A
Training:   4%|▍         | 11/269 [00:04<01:34,  2.72it/s][A
Training:   5%|▍         | 13/269 [00:05<01:55,  2.22it/s][A
Training:   6%|▌         | 15/269 [00:06<01:20,  3.17it/s][A
Training:   6%|▋         | 17/269 [00:07<01:35,  2.64it/s][A
Training:   7%|▋         | 19/269 [00:07<01:11,  3.51it/s][A
Training:   7%|▋         | 20/269 [00:07<01:03,  3.94it/s][A
Training:   8%|▊         | 21/269 [00:08<01:55,  2.15it/s][A
Training:   9%|▉         | 24/269 [00:08<01:03,  3.84it/s][A
Training:  10%|▉         | 26/269 [00:10<01:36,  2.52it/s][A
Training:  11%|█         | 29/269 [00:11<01:40,  2.40it/s][A
Training:  11%|█    

Training:  88%|████████▊ | 237/269 [01:25<00:13,  2.39it/s][A
Training:  89%|████████▉ | 239/269 [01:25<00:09,  3.14it/s][A
Training:  90%|████████▉ | 241/269 [01:26<00:11,  2.54it/s][A
Training:  91%|█████████ | 245/269 [01:27<00:08,  2.71it/s][A
Training:  92%|█████████▏| 247/269 [01:27<00:06,  3.36it/s][A
Training:  93%|█████████▎| 249/269 [01:29<00:07,  2.63it/s][A
Training:  94%|█████████▍| 253/269 [01:30<00:05,  2.68it/s][A
Training:  96%|█████████▌| 257/269 [01:32<00:04,  2.69it/s][A
Training:  96%|█████████▋| 259/269 [01:32<00:03,  3.29it/s][A
Training:  97%|█████████▋| 261/269 [01:33<00:03,  2.65it/s][A
Training:  98%|█████████▊| 263/269 [01:33<00:01,  3.30it/s][A
Training:  98%|█████████▊| 264/269 [01:33<00:01,  3.67it/s][A
Training:  99%|█████████▊| 265/269 [01:34<00:01,  2.43it/s][A
Training: 100%|█████████▉| 268/269 [01:34<00:00,  4.02it/s][A
                                                           [A

Epoch: 42/96 - Loss: 13166.0967 - Accuracy: 0.9168



  0%|          | 0/34 [00:00<?, ?it/s][A
  3%|▎         | 1/34 [00:01<01:02,  1.89s/it][A
  9%|▉         | 3/34 [00:02<00:16,  1.87it/s][A
 15%|█▍        | 5/34 [00:02<00:14,  1.97it/s][A
 21%|██        | 7/34 [00:03<00:08,  3.06it/s][A
 26%|██▋       | 9/34 [00:04<00:09,  2.53it/s][A
 32%|███▏      | 11/34 [00:04<00:06,  3.58it/s][A
 38%|███▊      | 13/34 [00:05<00:07,  2.80it/s][A
 41%|████      | 14/34 [00:05<00:06,  3.13it/s][A
 47%|████▋     | 16/34 [00:05<00:04,  4.26it/s][A
 50%|█████     | 17/34 [00:06<00:06,  2.59it/s][A
 53%|█████▎    | 18/34 [00:06<00:05,  3.08it/s][A
 59%|█████▉    | 20/34 [00:06<00:03,  4.48it/s][A
 62%|██████▏   | 21/34 [00:07<00:04,  2.62it/s][A
 65%|██████▍   | 22/34 [00:07<00:03,  3.04it/s][A
 74%|███████▎  | 25/34 [00:09<00:03,  2.69it/s][A
 76%|███████▋  | 26/34 [00:09<00:02,  3.12it/s][A
 82%|████████▏ | 28/34 [00:09<00:01,  4.45it/s][A
 88%|████████▊ | 30/34 [00:10<00:01,  2.97it/s][A
100%|██████████| 34/34 [00:11<00:00,  2.89it

Val Loss: 15758.4316 - Val Accuracy: 0.8728



Training:   0%|          | 0/269 [00:00<?, ?it/s][A
Training:   0%|          | 1/269 [00:01<08:45,  1.96s/it][A
Training:   1%|          | 3/269 [00:02<02:25,  1.82it/s][A
Training:   2%|▏         | 5/269 [00:03<02:35,  1.70it/s][A
Training:   3%|▎         | 7/269 [00:03<01:36,  2.73it/s][A
Training:   3%|▎         | 9/269 [00:04<01:53,  2.28it/s][A
Training:   4%|▍         | 11/269 [00:04<01:21,  3.17it/s][A
Training:   5%|▍         | 13/269 [00:05<01:41,  2.52it/s][A
Training:   5%|▌         | 14/269 [00:05<01:27,  2.91it/s][A
Training:   6%|▋         | 17/269 [00:07<01:30,  2.79it/s][A
Training:   7%|▋         | 18/269 [00:07<01:20,  3.10it/s][A
Training:   7%|▋         | 19/269 [00:07<01:10,  3.55it/s][A
Training:   8%|▊         | 21/269 [00:08<01:36,  2.57it/s][A
Training:   8%|▊         | 22/269 [00:08<01:26,  2.85it/s][A
Training:   9%|▊         | 23/269 [00:08<01:13,  3.36it/s][A
Training:   9%|▉         | 25/269 [00:10<01:46,  2.30it/s][A
Training:  10%|▉     

Training:  96%|█████████▌| 257/269 [01:31<00:04,  2.59it/s][A
Training:  96%|█████████▋| 259/269 [01:31<00:03,  3.33it/s][A
Training:  97%|█████████▋| 261/269 [01:32<00:02,  2.77it/s][A
Training:  98%|█████████▊| 264/269 [01:32<00:01,  4.00it/s][A
Training:  99%|█████████▊| 265/269 [01:33<00:01,  2.65it/s][A
Training: 100%|█████████▉| 268/269 [01:34<00:00,  3.72it/s][A
Training: 100%|██████████| 269/269 [01:34<00:00,  3.09it/s][A
                                                           [A

Epoch: 43/96 - Loss: 13606.8115 - Accuracy: 0.9170



  0%|          | 0/34 [00:00<?, ?it/s][A
  3%|▎         | 1/34 [00:01<00:52,  1.59s/it][A
  6%|▌         | 2/34 [00:01<00:22,  1.40it/s][A
 12%|█▏        | 4/34 [00:01<00:10,  2.85it/s][A
 15%|█▍        | 5/34 [00:02<00:13,  2.16it/s][A
 18%|█▊        | 6/34 [00:02<00:11,  2.49it/s][A
 24%|██▎       | 8/34 [00:03<00:07,  3.68it/s][A
 26%|██▋       | 9/34 [00:03<00:09,  2.66it/s][A
 29%|██▉       | 10/34 [00:04<00:08,  2.80it/s][A
 35%|███▌      | 12/34 [00:04<00:06,  3.64it/s][A
 38%|███▊      | 13/34 [00:05<00:07,  2.74it/s][A
 41%|████      | 14/34 [00:05<00:06,  2.90it/s][A
 47%|████▋     | 16/34 [00:05<00:05,  3.57it/s][A
 50%|█████     | 17/34 [00:06<00:05,  3.11it/s][A
 53%|█████▎    | 18/34 [00:06<00:04,  3.50it/s][A
 56%|█████▌    | 19/34 [00:06<00:04,  3.66it/s][A
 59%|█████▉    | 20/34 [00:07<00:04,  3.46it/s][A
 62%|██████▏   | 21/34 [00:07<00:04,  2.75it/s][A
 68%|██████▊   | 23/34 [00:07<00:02,  4.35it/s][A
 71%|███████   | 24/34 [00:08<00:03,  3.26it/s

Val Loss: 14465.6748 - Val Accuracy: 0.8187



Training:   0%|          | 0/269 [00:00<?, ?it/s][A
Training:   0%|          | 1/269 [00:02<09:37,  2.16s/it][A
Training:   1%|▏         | 4/269 [00:02<02:00,  2.21it/s][A
Training:   2%|▏         | 6/269 [00:03<02:14,  1.95it/s][A
Training:   3%|▎         | 9/269 [00:05<02:14,  1.93it/s][A
Training:   4%|▍         | 12/269 [00:05<01:22,  3.10it/s][A
Training:   5%|▌         | 14/269 [00:06<01:47,  2.37it/s][A
Training:   6%|▌         | 16/269 [00:06<01:20,  3.15it/s][A
Training:   7%|▋         | 18/269 [00:08<01:45,  2.38it/s][A
Training:   8%|▊         | 21/269 [00:09<01:51,  2.22it/s][A
Training:   9%|▉         | 24/269 [00:09<01:14,  3.30it/s][A
Training:  10%|▉         | 26/269 [00:10<01:35,  2.55it/s][A
Training:  10%|█         | 28/269 [00:11<01:12,  3.31it/s][A
Training:  11%|█         | 30/269 [00:12<01:39,  2.40it/s][A
Training:  12%|█▏        | 32/269 [00:12<01:15,  3.15it/s][A
Training:  13%|█▎        | 34/269 [00:13<01:38,  2.38it/s][A
Training:  14%|█▍   

Training:  80%|████████  | 216/269 [01:16<00:17,  3.05it/s][A
Training:  81%|████████  | 217/269 [01:17<00:16,  3.14it/s][A
Training:  81%|████████▏ | 219/269 [01:17<00:17,  2.88it/s][A
Training:  82%|████████▏ | 220/269 [01:18<00:17,  2.86it/s][A
Training:  82%|████████▏ | 221/269 [01:18<00:14,  3.31it/s][A
Training:  83%|████████▎ | 223/269 [01:19<00:18,  2.52it/s][A
Training:  83%|████████▎ | 224/269 [01:19<00:16,  2.66it/s][A
Training:  84%|████████▎ | 225/269 [01:19<00:13,  3.22it/s][A
Training:  84%|████████▍ | 227/269 [01:20<00:17,  2.44it/s][A
Training:  85%|████████▍ | 228/269 [01:20<00:13,  2.94it/s][A
Training:  85%|████████▌ | 229/269 [01:21<00:11,  3.34it/s][A
Training:  86%|████████▌ | 231/269 [01:22<00:15,  2.49it/s][A
Training:  87%|████████▋ | 233/269 [01:22<00:10,  3.39it/s][A
Training:  87%|████████▋ | 234/269 [01:22<00:09,  3.74it/s][A
Training:  87%|████████▋ | 235/269 [01:23<00:16,  2.06it/s][A
Training:  88%|████████▊ | 237/269 [01:24<00:10,  3.12i

Epoch: 44/96 - Loss: 13377.7529 - Accuracy: 0.9210



  0%|          | 0/34 [00:00<?, ?it/s][A
  3%|▎         | 1/34 [00:02<01:07,  2.06s/it][A
 12%|█▏        | 4/34 [00:02<00:12,  2.36it/s][A
 18%|█▊        | 6/34 [00:03<00:13,  2.14it/s][A
 26%|██▋       | 9/34 [00:04<00:10,  2.31it/s][A
 29%|██▉       | 10/34 [00:04<00:09,  2.60it/s][A
 35%|███▌      | 12/34 [00:04<00:06,  3.60it/s][A
 38%|███▊      | 13/34 [00:05<00:08,  2.53it/s][A
 41%|████      | 14/34 [00:05<00:06,  2.90it/s][A
 50%|█████     | 17/34 [00:06<00:05,  2.87it/s][A
 59%|█████▉    | 20/34 [00:06<00:03,  4.51it/s][A
 65%|██████▍   | 22/34 [00:08<00:04,  2.91it/s][A
 74%|███████▎  | 25/34 [00:09<00:03,  2.75it/s][A
 79%|███████▉  | 27/34 [00:09<00:01,  3.56it/s][A
 85%|████████▌ | 29/34 [00:10<00:01,  2.87it/s][A
100%|██████████| 34/34 [00:11<00:00,  2.85it/s][A
Epochs:  46%|████▌     | 44/96 [1:19:18<1:32:55, 107.21s/it]

Val Loss: 16201.8516 - Val Accuracy: 0.8810



Training:   0%|          | 0/269 [00:00<?, ?it/s][A
Training:   0%|          | 1/269 [00:02<09:31,  2.13s/it][A
Training:   1%|          | 2/269 [00:02<04:17,  1.04it/s][A
Training:   2%|▏         | 5/269 [00:03<02:31,  1.74it/s][A
Training:   3%|▎         | 7/269 [00:03<01:34,  2.76it/s][A
Training:   3%|▎         | 9/269 [00:04<01:59,  2.18it/s][A
Training:   5%|▍         | 13/269 [00:06<01:41,  2.52it/s][A
Training:   5%|▌         | 14/269 [00:06<01:33,  2.74it/s][A
Training:   6%|▌         | 16/269 [00:06<01:09,  3.66it/s][A
Training:   6%|▋         | 17/269 [00:07<01:55,  2.18it/s][A
Training:   7%|▋         | 19/269 [00:08<01:21,  3.05it/s][A
Training:   8%|▊         | 21/269 [00:09<01:41,  2.44it/s][A
Training:   8%|▊         | 22/269 [00:09<01:28,  2.79it/s][A
Training:   9%|▉         | 25/269 [00:10<01:35,  2.56it/s][A
Training:  10%|█         | 27/269 [00:10<01:10,  3.42it/s][A
Training:  11%|█         | 29/269 [00:12<01:37,  2.47it/s][A
Training:  11%|█     

Training:  88%|████████▊ | 237/269 [01:23<00:12,  2.51it/s][A
Training:  89%|████████▉ | 239/269 [01:24<00:08,  3.36it/s][A
Training:  90%|████████▉ | 241/269 [01:25<00:11,  2.35it/s][A
Training:  90%|████████▉ | 242/269 [01:25<00:09,  2.71it/s][A
Training:  91%|█████████ | 244/269 [01:25<00:06,  3.68it/s][A
Training:  91%|█████████ | 245/269 [01:27<00:11,  2.17it/s][A
Training:  92%|█████████▏| 248/269 [01:27<00:05,  3.70it/s][A
Training:  93%|█████████▎| 250/269 [01:28<00:07,  2.39it/s][A
Training:  94%|█████████▎| 252/269 [01:28<00:05,  3.13it/s][A
Training:  94%|█████████▍| 253/269 [01:30<00:07,  2.06it/s][A
Training:  95%|█████████▌| 256/269 [01:30<00:03,  3.39it/s][A
Training:  96%|█████████▌| 258/269 [01:31<00:04,  2.50it/s][A
Training:  97%|█████████▋| 260/269 [01:31<00:02,  3.33it/s][A
Training:  97%|█████████▋| 262/269 [01:33<00:02,  2.39it/s][A
Training:  99%|█████████▊| 265/269 [01:34<00:01,  2.32it/s][A
Training: 100%|█████████▉| 268/269 [01:34<00:00,  3.46i

Epoch: 45/96 - Loss: 13953.0742 - Accuracy: 0.9169



  0%|          | 0/34 [00:00<?, ?it/s][A
  3%|▎         | 1/34 [00:02<01:08,  2.08s/it][A
 12%|█▏        | 4/34 [00:02<00:12,  2.37it/s][A
 18%|█▊        | 6/34 [00:03<00:12,  2.19it/s][A
 24%|██▎       | 8/34 [00:03<00:08,  3.13it/s][A
 29%|██▉       | 10/34 [00:04<00:10,  2.37it/s][A
 35%|███▌      | 12/34 [00:04<00:06,  3.25it/s][A
 38%|███▊      | 13/34 [00:05<00:08,  2.42it/s][A
 50%|█████     | 17/34 [00:06<00:05,  3.04it/s][A
 56%|█████▌    | 19/34 [00:06<00:03,  3.91it/s][A
 62%|██████▏   | 21/34 [00:07<00:04,  2.91it/s][A
 68%|██████▊   | 23/34 [00:08<00:02,  3.81it/s][A
 74%|███████▎  | 25/34 [00:09<00:03,  2.83it/s][A
 82%|████████▏ | 28/34 [00:09<00:01,  4.29it/s][A
 88%|████████▊ | 30/34 [00:10<00:01,  3.27it/s][A
 94%|█████████▍| 32/34 [00:10<00:00,  4.22it/s][A
100%|██████████| 34/34 [00:11<00:00,  2.95it/s][A
Epochs:  47%|████▋     | 45/96 [1:21:05<1:31:07, 107.20s/it]

Val Loss: 15400.0596 - Val Accuracy: 0.9296



Training:   0%|          | 0/269 [00:00<?, ?it/s][A
Training:   0%|          | 1/269 [00:02<09:32,  2.14s/it][A
Training:   2%|▏         | 5/269 [00:03<02:44,  1.60it/s][A
Training:   3%|▎         | 7/269 [00:03<01:49,  2.39it/s][A
Training:   3%|▎         | 9/269 [00:05<02:10,  2.00it/s][A
Training:   4%|▍         | 11/269 [00:05<01:32,  2.80it/s][A
Training:   5%|▍         | 13/269 [00:06<01:54,  2.24it/s][A
Training:   6%|▌         | 16/269 [00:06<01:11,  3.54it/s][A
Training:   7%|▋         | 18/269 [00:08<01:41,  2.48it/s][A
Training:   7%|▋         | 20/269 [00:08<01:16,  3.28it/s][A
Training:   8%|▊         | 22/269 [00:09<01:40,  2.46it/s][A
Training:   9%|▉         | 24/269 [00:09<01:15,  3.23it/s][A
Training:   9%|▉         | 25/269 [00:10<01:56,  2.10it/s][A
Training:  10%|█         | 27/269 [00:11<01:22,  2.92it/s][A
Training:  11%|█         | 29/269 [00:12<01:36,  2.48it/s][A
Training:  12%|█▏        | 31/269 [00:12<01:10,  3.37it/s][A
Training:  12%|█▏   

Training:  95%|█████████▌| 256/269 [01:30<00:03,  3.54it/s][A
Training:  96%|█████████▌| 258/269 [01:31<00:04,  2.51it/s][A
Training:  97%|█████████▋| 260/269 [01:31<00:02,  3.36it/s][A
Training:  97%|█████████▋| 262/269 [01:32<00:02,  2.40it/s][A
Training:  99%|█████████▊| 265/269 [01:34<00:01,  2.38it/s][A
Training: 100%|█████████▉| 268/269 [01:34<00:00,  3.52it/s][A
                                                           [A

Epoch: 46/96 - Loss: 14074.1729 - Accuracy: 0.9156



  0%|          | 0/34 [00:00<?, ?it/s][A
  3%|▎         | 1/34 [00:02<01:07,  2.05s/it][A
 15%|█▍        | 5/34 [00:03<00:16,  1.81it/s][A
 24%|██▎       | 8/34 [00:03<00:08,  3.20it/s][A
 29%|██▉       | 10/34 [00:04<00:09,  2.64it/s][A
 38%|███▊      | 13/34 [00:05<00:07,  2.79it/s][A
 41%|████      | 14/34 [00:05<00:06,  2.87it/s][A
 47%|████▋     | 16/34 [00:05<00:04,  3.80it/s][A
 50%|█████     | 17/34 [00:06<00:05,  3.01it/s][A
 53%|█████▎    | 18/34 [00:06<00:05,  2.97it/s][A
 56%|█████▌    | 19/34 [00:07<00:04,  3.30it/s][A
 62%|██████▏   | 21/34 [00:07<00:04,  3.24it/s][A
 65%|██████▍   | 22/34 [00:07<00:03,  3.44it/s][A
 68%|██████▊   | 23/34 [00:08<00:03,  3.64it/s][A
 74%|███████▎  | 25/34 [00:08<00:02,  3.14it/s][A
 76%|███████▋  | 26/34 [00:08<00:02,  3.67it/s][A
 79%|███████▉  | 27/34 [00:09<00:01,  3.79it/s][A
 85%|████████▌ | 29/34 [00:10<00:01,  3.18it/s][A
 88%|████████▊ | 30/34 [00:10<00:01,  3.75it/s][A
100%|██████████| 34/34 [00:11<00:00,  3.04

Val Loss: 14989.9033 - Val Accuracy: 0.9116



Training:   0%|          | 0/269 [00:00<?, ?it/s][A
Training:   0%|          | 1/269 [00:02<09:33,  2.14s/it][A
Training:   1%|          | 3/269 [00:02<02:37,  1.68it/s][A
Training:   2%|▏         | 5/269 [00:03<02:52,  1.53it/s][A
Training:   2%|▏         | 6/269 [00:03<02:16,  1.93it/s][A
Training:   3%|▎         | 9/269 [00:05<02:02,  2.11it/s][A
Training:   4%|▍         | 11/269 [00:05<01:26,  2.99it/s][A
Training:   5%|▍         | 13/269 [00:06<01:57,  2.17it/s][A
Training:   6%|▋         | 17/269 [00:08<01:43,  2.45it/s][A
Training:   7%|▋         | 19/269 [00:08<01:19,  3.13it/s][A
Training:   8%|▊         | 21/269 [00:09<01:41,  2.44it/s][A
Training:   9%|▊         | 23/269 [00:09<01:16,  3.21it/s][A
Training:   9%|▉         | 25/269 [00:11<01:46,  2.29it/s][A
Training:  10%|█         | 27/269 [00:11<01:19,  3.04it/s][A
Training:  11%|█         | 29/269 [00:12<01:43,  2.32it/s][A
Training:  12%|█▏        | 31/269 [00:12<01:16,  3.12it/s][A
Training:  12%|█▏    

Training:  89%|████████▉ | 239/269 [01:26<00:10,  2.88it/s][A
Training:  90%|████████▉ | 241/269 [01:26<00:07,  3.69it/s][A
Training:  90%|█████████ | 243/269 [01:27<00:08,  2.94it/s][A
Training:  91%|█████████ | 245/269 [01:27<00:06,  3.50it/s][A
Training:  91%|█████████▏| 246/269 [01:28<00:08,  2.62it/s][A
Training:  93%|█████████▎| 249/269 [01:28<00:05,  3.39it/s][A
Training:  93%|█████████▎| 250/269 [01:29<00:07,  2.52it/s][A
Training:  94%|█████████▎| 252/269 [01:29<00:04,  3.45it/s][A
Training:  94%|█████████▍| 253/269 [01:30<00:04,  3.64it/s][A
Training:  94%|█████████▍| 254/269 [01:31<00:06,  2.25it/s][A
Training:  95%|█████████▌| 256/269 [01:31<00:03,  3.35it/s][A
Training:  96%|█████████▌| 257/269 [01:31<00:03,  3.74it/s][A
Training:  96%|█████████▌| 258/269 [01:32<00:05,  1.96it/s][A
Training:  97%|█████████▋| 261/269 [01:32<00:02,  3.57it/s][A
Training:  98%|█████████▊| 263/269 [01:34<00:02,  2.52it/s][A
Training:  99%|█████████▊| 265/269 [01:34<00:01,  3.40i

Epoch: 47/96 - Loss: 13300.2002 - Accuracy: 0.9234



  0%|          | 0/34 [00:00<?, ?it/s][A
  3%|▎         | 1/34 [00:01<00:59,  1.79s/it][A
 12%|█▏        | 4/34 [00:01<00:11,  2.67it/s][A
 18%|█▊        | 6/34 [00:03<00:13,  2.15it/s][A
 24%|██▎       | 8/34 [00:03<00:08,  3.16it/s][A
 29%|██▉       | 10/34 [00:04<00:09,  2.59it/s][A
 38%|███▊      | 13/34 [00:05<00:07,  2.66it/s][A
 41%|████      | 14/34 [00:05<00:06,  2.97it/s][A
 47%|████▋     | 16/34 [00:05<00:04,  4.10it/s][A
 53%|█████▎    | 18/34 [00:06<00:05,  2.83it/s][A
 62%|██████▏   | 21/34 [00:07<00:04,  2.94it/s][A
 65%|██████▍   | 22/34 [00:07<00:03,  3.12it/s][A
 71%|███████   | 24/34 [00:08<00:02,  4.16it/s][A
 74%|███████▎  | 25/34 [00:08<00:03,  2.95it/s][A
 76%|███████▋  | 26/34 [00:09<00:02,  3.01it/s][A
 82%|████████▏ | 28/34 [00:09<00:01,  4.37it/s][A
 85%|████████▌ | 29/34 [00:09<00:01,  3.11it/s][A
 88%|████████▊ | 30/34 [00:10<00:01,  3.24it/s][A
100%|██████████| 34/34 [00:11<00:00,  3.02it/s][A
Epochs:  49%|████▉     | 47/96 [1:24:38<1:2

Val Loss: 14940.5342 - Val Accuracy: 0.9284



Training:   0%|          | 0/269 [00:00<?, ?it/s][A
Training:   0%|          | 1/269 [00:01<08:36,  1.93s/it][A
Training:   1%|          | 2/269 [00:02<04:00,  1.11it/s][A
Training:   2%|▏         | 5/269 [00:03<02:21,  1.87it/s][A
Training:   3%|▎         | 8/269 [00:03<01:14,  3.51it/s][A
Training:   4%|▎         | 10/269 [00:04<01:52,  2.31it/s][A
Training:   4%|▍         | 12/269 [00:04<01:20,  3.21it/s][A
Training:   5%|▌         | 14/269 [00:06<01:49,  2.32it/s][A
Training:   6%|▋         | 17/269 [00:07<01:47,  2.35it/s][A
Training:   8%|▊         | 21/269 [00:08<01:34,  2.63it/s][A
Training:   9%|▊         | 23/269 [00:09<01:16,  3.22it/s][A
Training:   9%|▉         | 25/269 [00:10<01:39,  2.46it/s][A
Training:  10%|█         | 28/269 [00:10<01:07,  3.55it/s][A
Training:  11%|█         | 30/269 [00:11<01:26,  2.77it/s][A
Training:  12%|█▏        | 32/269 [00:11<01:06,  3.55it/s][A
Training:  13%|█▎        | 34/269 [00:12<01:21,  2.87it/s][A
Training:  13%|█▎   

Epoch: 48/96 - Loss: 14803.0264 - Accuracy: 0.9184



  0%|          | 0/34 [00:00<?, ?it/s][A
  3%|▎         | 1/34 [00:01<01:00,  1.83s/it][A
  9%|▉         | 3/34 [00:01<00:16,  1.92it/s][A
 15%|█▍        | 5/34 [00:03<00:16,  1.79it/s][A
 24%|██▎       | 8/34 [00:03<00:07,  3.43it/s][A
 29%|██▉       | 10/34 [00:04<00:09,  2.49it/s][A
 38%|███▊      | 13/34 [00:05<00:08,  2.51it/s][A
 44%|████▍     | 15/34 [00:05<00:05,  3.24it/s][A
 50%|█████     | 17/34 [00:07<00:06,  2.54it/s][A
 59%|█████▉    | 20/34 [00:07<00:03,  3.87it/s][A
 65%|██████▍   | 22/34 [00:08<00:03,  3.07it/s][A
 74%|███████▎  | 25/34 [00:09<00:03,  2.99it/s][A
 76%|███████▋  | 26/34 [00:09<00:02,  3.29it/s][A
 85%|████████▌ | 29/34 [00:10<00:01,  3.11it/s][A
 88%|████████▊ | 30/34 [00:10<00:01,  3.25it/s][A
100%|██████████| 34/34 [00:11<00:00,  2.91it/s][A
Epochs:  50%|█████     | 48/96 [1:26:25<1:25:32, 106.92s/it]

Val Loss: 15820.2646 - Val Accuracy: 0.8526



Training:   0%|          | 0/269 [00:00<?, ?it/s][A
Training:   0%|          | 1/269 [00:02<09:12,  2.06s/it][A
Training:   2%|▏         | 5/269 [00:03<02:34,  1.71it/s][A
Training:   3%|▎         | 7/269 [00:03<01:40,  2.61it/s][A
Training:   3%|▎         | 9/269 [00:04<02:09,  2.01it/s][A
Training:   5%|▍         | 13/269 [00:06<01:53,  2.26it/s][A
Training:   6%|▋         | 17/269 [00:07<01:38,  2.56it/s][A
Training:   7%|▋         | 20/269 [00:07<01:09,  3.57it/s][A
Training:   8%|▊         | 22/269 [00:09<01:34,  2.60it/s][A
Training:   9%|▊         | 23/269 [00:09<01:25,  2.87it/s][A
Training:   9%|▉         | 25/269 [00:10<01:42,  2.37it/s][A
Training:  10%|▉         | 26/269 [00:10<01:29,  2.70it/s][A
Training:  10%|█         | 28/269 [00:10<01:05,  3.71it/s][A
Training:  11%|█         | 29/269 [00:11<01:41,  2.36it/s][A
Training:  11%|█         | 30/269 [00:12<01:30,  2.63it/s][A
Training:  12%|█▏        | 33/269 [00:13<01:27,  2.69it/s][A
Training:  13%|█▎   

Training:  80%|████████  | 216/269 [01:18<00:13,  3.91it/s][A
Training:  81%|████████  | 217/269 [01:19<00:21,  2.41it/s][A
Training:  81%|████████  | 218/269 [01:19<00:19,  2.62it/s][A
Training:  82%|████████▏ | 220/269 [01:19<00:12,  3.80it/s][A
Training:  82%|████████▏ | 221/269 [01:20<00:20,  2.37it/s][A
Training:  83%|████████▎ | 223/269 [01:20<00:13,  3.54it/s][A
Training:  84%|████████▎ | 225/269 [01:22<00:17,  2.51it/s][A
Training:  84%|████████▍ | 227/269 [01:22<00:12,  3.32it/s][A
Training:  85%|████████▌ | 229/269 [01:23<00:17,  2.35it/s][A
Training:  86%|████████▌ | 231/269 [01:23<00:11,  3.20it/s][A
Training:  87%|████████▋ | 233/269 [01:24<00:14,  2.54it/s][A
Training:  87%|████████▋ | 235/269 [01:25<00:10,  3.22it/s][A
Training:  88%|████████▊ | 237/269 [01:26<00:13,  2.44it/s][A
Training:  89%|████████▉ | 239/269 [01:26<00:10,  2.96it/s][A
Training:  90%|████████▉ | 241/269 [01:27<00:10,  2.56it/s][A
Training:  90%|█████████ | 243/269 [01:28<00:09,  2.87i

Epoch: 49/96 - Loss: 13921.9453 - Accuracy: 0.9218



  0%|          | 0/34 [00:00<?, ?it/s][A
  3%|▎         | 1/34 [00:01<00:57,  1.75s/it][A
  9%|▉         | 3/34 [00:01<00:15,  1.99it/s][A
 15%|█▍        | 5/34 [00:03<00:15,  1.82it/s][A
 21%|██        | 7/34 [00:03<00:09,  2.94it/s][A
 26%|██▋       | 9/34 [00:04<00:10,  2.28it/s][A
 35%|███▌      | 12/34 [00:04<00:05,  3.82it/s][A
 41%|████      | 14/34 [00:05<00:06,  2.99it/s][A
 47%|████▋     | 16/34 [00:05<00:04,  3.83it/s][A
 50%|█████     | 17/34 [00:06<00:07,  2.42it/s][A
 59%|█████▉    | 20/34 [00:06<00:03,  3.91it/s][A
 65%|██████▍   | 22/34 [00:07<00:03,  3.05it/s][A
 71%|███████   | 24/34 [00:08<00:02,  4.00it/s][A
 76%|███████▋  | 26/34 [00:09<00:02,  3.06it/s][A
 82%|████████▏ | 28/34 [00:09<00:01,  3.87it/s][A
 85%|████████▌ | 29/34 [00:10<00:01,  2.74it/s][A
 91%|█████████ | 31/34 [00:10<00:00,  3.78it/s][A
100%|██████████| 34/34 [00:11<00:00,  2.96it/s][A
Epochs:  51%|█████     | 49/96 [1:28:14<1:24:13, 107.52s/it]

Val Loss: 15159.7793 - Val Accuracy: 0.9286



Training:   0%|          | 0/269 [00:00<?, ?it/s][A
Training:   0%|          | 1/269 [00:02<09:27,  2.12s/it][A
Training:   1%|          | 3/269 [00:02<02:36,  1.70it/s][A
Training:   2%|▏         | 5/269 [00:03<02:47,  1.58it/s][A
Training:   3%|▎         | 7/269 [00:03<01:42,  2.57it/s][A
Training:   3%|▎         | 9/269 [00:04<02:05,  2.08it/s][A
Training:   4%|▍         | 11/269 [00:05<01:25,  3.01it/s][A
Training:   5%|▍         | 13/269 [00:06<01:57,  2.18it/s][A
Training:   6%|▌         | 15/269 [00:06<01:24,  3.02it/s][A
Training:   6%|▋         | 17/269 [00:07<01:48,  2.33it/s][A
Training:   7%|▋         | 20/269 [00:08<01:07,  3.68it/s][A
Training:   8%|▊         | 22/269 [00:09<01:35,  2.59it/s][A
Training:   9%|▉         | 24/269 [00:09<01:14,  3.30it/s][A
Training:   9%|▉         | 25/269 [00:10<01:56,  2.10it/s][A
Training:  10%|▉         | 26/269 [00:11<01:38,  2.47it/s][A
Training:  11%|█         | 29/269 [00:12<01:37,  2.47it/s][A
Training:  11%|█     

Epoch: 50/96 - Loss: 14206.8721 - Accuracy: 0.9172



  0%|          | 0/34 [00:00<?, ?it/s][A
  3%|▎         | 1/34 [00:01<00:59,  1.80s/it][A
 12%|█▏        | 4/34 [00:01<00:11,  2.68it/s][A
 18%|█▊        | 6/34 [00:03<00:12,  2.27it/s][A
 24%|██▎       | 8/34 [00:03<00:07,  3.43it/s][A
 29%|██▉       | 10/34 [00:04<00:09,  2.50it/s][A
 35%|███▌      | 12/34 [00:04<00:06,  3.52it/s][A
 41%|████      | 14/34 [00:05<00:07,  2.70it/s][A
 50%|█████     | 17/34 [00:06<00:06,  2.61it/s][A
 59%|█████▉    | 20/34 [00:06<00:03,  3.94it/s][A
 65%|██████▍   | 22/34 [00:07<00:03,  3.02it/s][A
 71%|███████   | 24/34 [00:08<00:02,  3.78it/s][A
 76%|███████▋  | 26/34 [00:09<00:02,  2.99it/s][A
 85%|████████▌ | 29/34 [00:10<00:01,  3.04it/s][A
 88%|████████▊ | 30/34 [00:10<00:01,  3.40it/s][A
100%|██████████| 34/34 [00:11<00:00,  3.00it/s][A
Epochs:  52%|█████▏    | 50/96 [1:30:03<1:22:39, 107.81s/it]

Val Loss: 14472.0381 - Val Accuracy: 0.9390



Training:   0%|          | 0/269 [00:00<?, ?it/s][A
Training:   0%|          | 1/269 [00:02<09:39,  2.16s/it][A
Training:   1%|          | 3/269 [00:02<02:44,  1.61it/s][A
Training:   2%|▏         | 5/269 [00:03<02:54,  1.52it/s][A
Training:   3%|▎         | 7/269 [00:03<01:47,  2.45it/s][A
Training:   3%|▎         | 9/269 [00:05<02:14,  1.93it/s][A
Training:   4%|▍         | 12/269 [00:05<01:18,  3.29it/s][A
Training:   5%|▌         | 14/269 [00:06<01:52,  2.26it/s][A
Training:   6%|▋         | 17/269 [00:08<01:51,  2.27it/s][A
Training:   7%|▋         | 20/269 [00:08<01:15,  3.31it/s][A
Training:   8%|▊         | 22/269 [00:09<01:36,  2.56it/s][A
Training:   9%|▊         | 23/269 [00:09<01:25,  2.87it/s][A
Training:   9%|▉         | 25/269 [00:11<01:55,  2.12it/s][A
Training:  10%|█         | 27/269 [00:11<01:23,  2.90it/s][A
Training:  11%|█         | 29/269 [00:12<01:45,  2.27it/s][A
Training:  12%|█▏        | 31/269 [00:12<01:17,  3.08it/s][A
Training:  12%|█▏    

                                                           [A

Epoch: 51/96 - Loss: 14345.5283 - Accuracy: 0.9188



  0%|          | 0/34 [00:00<?, ?it/s][A
  3%|▎         | 1/34 [00:01<01:03,  1.92s/it][A
  9%|▉         | 3/34 [00:02<00:16,  1.84it/s][A
 15%|█▍        | 5/34 [00:03<00:15,  1.88it/s][A
 18%|█▊        | 6/34 [00:03<00:11,  2.34it/s][A
 24%|██▎       | 8/34 [00:03<00:07,  3.68it/s][A
 26%|██▋       | 9/34 [00:04<00:11,  2.26it/s][A
 29%|██▉       | 10/34 [00:04<00:08,  2.81it/s][A
 32%|███▏      | 11/34 [00:04<00:07,  3.13it/s][A
 38%|███▊      | 13/34 [00:05<00:07,  2.82it/s][A
 44%|████▍     | 15/34 [00:05<00:05,  3.67it/s][A
 50%|█████     | 17/34 [00:06<00:05,  3.26it/s][A
 56%|█████▌    | 19/34 [00:06<00:03,  3.88it/s][A
 62%|██████▏   | 21/34 [00:07<00:03,  3.33it/s][A
 68%|██████▊   | 23/34 [00:08<00:03,  3.61it/s][A
 74%|███████▎  | 25/34 [00:08<00:02,  3.33it/s][A
 79%|███████▉  | 27/34 [00:09<00:01,  3.88it/s][A
 85%|████████▌ | 29/34 [00:09<00:01,  3.42it/s][A
 91%|█████████ | 31/34 [00:10<00:00,  3.96it/s][A
100%|██████████| 34/34 [00:10<00:00,  3.10it/

Val Loss: 16004.2314 - Val Accuracy: 0.9246



Training:   0%|          | 0/269 [00:00<?, ?it/s][A
Training:   0%|          | 1/269 [00:02<11:26,  2.56s/it][A
Training:   1%|          | 3/269 [00:02<03:07,  1.42it/s][A
Training:   2%|▏         | 5/269 [00:03<02:51,  1.54it/s][A
Training:   3%|▎         | 7/269 [00:04<01:45,  2.48it/s][A
Training:   3%|▎         | 9/269 [00:05<02:08,  2.02it/s][A
Training:   4%|▍         | 11/269 [00:05<01:30,  2.86it/s][A
Training:   5%|▍         | 13/269 [00:06<02:00,  2.12it/s][A
Training:   6%|▌         | 15/269 [00:07<01:26,  2.92it/s][A
Training:   6%|▋         | 17/269 [00:08<01:55,  2.19it/s][A
Training:   7%|▋         | 20/269 [00:08<01:13,  3.40it/s][A
Training:   8%|▊         | 22/269 [00:09<01:37,  2.52it/s][A
Training:   9%|▉         | 25/269 [00:11<01:43,  2.35it/s][A
Training:  10%|█         | 28/269 [00:11<01:09,  3.45it/s][A
Training:  11%|█         | 30/269 [00:12<01:36,  2.48it/s][A
Training:  12%|█▏        | 33/269 [00:14<01:40,  2.36it/s][A
Training:  14%|█▍    

Epoch: 52/96 - Loss: 14095.1357 - Accuracy: 0.9191



  0%|          | 0/34 [00:00<?, ?it/s][A
  3%|▎         | 1/34 [00:01<00:55,  1.67s/it][A
  9%|▉         | 3/34 [00:01<00:16,  1.86it/s][A
 15%|█▍        | 5/34 [00:03<00:15,  1.83it/s][A
 21%|██        | 7/34 [00:03<00:09,  2.94it/s][A
 26%|██▋       | 9/34 [00:04<00:10,  2.50it/s][A
 32%|███▏      | 11/34 [00:04<00:07,  3.20it/s][A
 38%|███▊      | 13/34 [00:05<00:07,  2.85it/s][A
 44%|████▍     | 15/34 [00:05<00:05,  3.52it/s][A
 50%|█████     | 17/34 [00:06<00:05,  3.26it/s][A
 53%|█████▎    | 18/34 [00:06<00:04,  3.60it/s][A
 56%|█████▌    | 19/34 [00:07<00:04,  3.07it/s][A
 62%|██████▏   | 21/34 [00:07<00:04,  3.01it/s][A
 65%|██████▍   | 22/34 [00:07<00:03,  3.50it/s][A
 68%|██████▊   | 23/34 [00:08<00:03,  3.20it/s][A
 74%|███████▎  | 25/34 [00:08<00:02,  3.13it/s][A
 76%|███████▋  | 26/34 [00:09<00:02,  3.57it/s][A
 79%|███████▉  | 27/34 [00:09<00:01,  3.80it/s][A
 85%|████████▌ | 29/34 [00:09<00:01,  3.41it/s][A
 91%|█████████ | 31/34 [00:10<00:00,  4.32it

Val Loss: 16006.2520 - Val Accuracy: 0.9322



Training:   0%|          | 0/269 [00:00<?, ?it/s][A
Training:   0%|          | 1/269 [00:02<09:05,  2.03s/it][A
Training:   1%|▏         | 4/269 [00:02<01:53,  2.34it/s][A
Training:   2%|▏         | 6/269 [00:03<02:28,  1.78it/s][A
Training:   3%|▎         | 8/269 [00:03<01:38,  2.66it/s][A
Training:   3%|▎         | 9/269 [00:04<02:22,  1.83it/s][A
Training:   4%|▎         | 10/269 [00:05<01:59,  2.17it/s][A
Training:   4%|▍         | 12/269 [00:05<01:19,  3.25it/s][A
Training:   5%|▍         | 13/269 [00:06<02:11,  1.95it/s][A
Training:   6%|▌         | 15/269 [00:06<01:24,  3.01it/s][A
Training:   6%|▋         | 17/269 [00:07<01:50,  2.29it/s][A
Training:   7%|▋         | 18/269 [00:08<01:36,  2.61it/s][A
Training:   7%|▋         | 20/269 [00:08<01:05,  3.80it/s][A
Training:   8%|▊         | 22/269 [00:09<01:33,  2.65it/s][A
Training:   9%|▉         | 24/269 [00:09<01:06,  3.69it/s][A
Training:  10%|▉         | 26/269 [00:10<01:40,  2.41it/s][A
Training:  10%|█     

Training:  72%|███████▏  | 194/269 [01:10<00:27,  2.71it/s][A
Training:  72%|███████▏  | 195/269 [01:10<00:25,  2.91it/s][A
Training:  73%|███████▎  | 197/269 [01:11<00:22,  3.15it/s][A
Training:  74%|███████▎  | 198/269 [01:11<00:24,  2.88it/s][A
Training:  74%|███████▍  | 199/269 [01:12<00:26,  2.60it/s][A
Training:  75%|███████▍  | 201/269 [01:12<00:20,  3.38it/s][A
Training:  75%|███████▌  | 202/269 [01:13<00:24,  2.74it/s][A
Training:  75%|███████▌  | 203/269 [01:13<00:27,  2.38it/s][A
Training:  76%|███████▌  | 205/269 [01:14<00:18,  3.52it/s][A
Training:  77%|███████▋  | 206/269 [01:14<00:24,  2.56it/s][A
Training:  77%|███████▋  | 207/269 [01:15<00:27,  2.25it/s][A
Training:  78%|███████▊  | 210/269 [01:16<00:20,  2.93it/s][A
Training:  78%|███████▊  | 211/269 [01:16<00:21,  2.64it/s][A
Training:  79%|███████▉  | 213/269 [01:16<00:15,  3.68it/s][A
Training:  80%|███████▉  | 214/269 [01:17<00:22,  2.42it/s][A
Training:  80%|███████▉  | 215/269 [01:18<00:21,  2.46i

Epoch: 53/96 - Loss: 14877.5117 - Accuracy: 0.9220



  0%|          | 0/34 [00:00<?, ?it/s][A
  3%|▎         | 1/34 [00:02<01:09,  2.11s/it][A
 12%|█▏        | 4/34 [00:02<00:12,  2.31it/s][A
 18%|█▊        | 6/34 [00:03<00:14,  1.95it/s][A
 26%|██▋       | 9/34 [00:04<00:10,  2.44it/s][A
 35%|███▌      | 12/34 [00:04<00:05,  3.85it/s][A
 41%|████      | 14/34 [00:05<00:06,  2.90it/s][A
 50%|█████     | 17/34 [00:06<00:06,  2.78it/s][A
 56%|█████▌    | 19/34 [00:06<00:04,  3.55it/s][A
 62%|██████▏   | 21/34 [00:07<00:04,  2.86it/s][A
 74%|███████▎  | 25/34 [00:09<00:02,  3.03it/s][A
 79%|███████▉  | 27/34 [00:09<00:01,  3.77it/s][A
 85%|████████▌ | 29/34 [00:10<00:01,  3.11it/s][A
 91%|█████████ | 31/34 [00:10<00:00,  3.57it/s][A
100%|██████████| 34/34 [00:11<00:00,  2.93it/s][A
Epochs:  55%|█████▌    | 53/96 [1:35:29<1:17:40, 108.38s/it]

Val Loss: 16755.2656 - Val Accuracy: 0.9251



Training:   0%|          | 0/269 [00:00<?, ?it/s][A
Training:   0%|          | 1/269 [00:02<10:24,  2.33s/it][A
Training:   2%|▏         | 5/269 [00:03<02:38,  1.66it/s][A
Training:   2%|▏         | 6/269 [00:03<02:09,  2.03it/s][A
Training:   3%|▎         | 9/269 [00:04<01:54,  2.26it/s][A
Training:   4%|▎         | 10/269 [00:05<01:43,  2.50it/s][A
Training:   4%|▍         | 12/269 [00:05<01:12,  3.55it/s][A
Training:   5%|▍         | 13/269 [00:06<01:58,  2.17it/s][A
Training:   5%|▌         | 14/269 [00:06<01:46,  2.40it/s][A
Training:   6%|▋         | 17/269 [00:07<01:35,  2.64it/s][A
Training:   7%|▋         | 18/269 [00:07<01:32,  2.72it/s][A
Training:   7%|▋         | 20/269 [00:08<01:04,  3.84it/s][A
Training:   8%|▊         | 21/269 [00:09<01:38,  2.53it/s][A
Training:   8%|▊         | 22/269 [00:09<01:34,  2.60it/s][A
Training:   9%|▉         | 25/269 [00:10<01:31,  2.65it/s][A
Training:  10%|▉         | 26/269 [00:10<01:28,  2.76it/s][A
Training:  10%|█    

Training:  81%|████████  | 218/269 [01:19<00:17,  2.90it/s][A
Training:  82%|████████▏ | 221/269 [01:20<00:17,  2.75it/s][A
Training:  83%|████████▎ | 222/269 [01:20<00:16,  2.94it/s][A
Training:  83%|████████▎ | 224/269 [01:20<00:11,  4.08it/s][A
Training:  84%|████████▎ | 225/269 [01:21<00:18,  2.33it/s][A
Training:  84%|████████▍ | 226/269 [01:22<00:16,  2.57it/s][A
Training:  85%|████████▍ | 228/269 [01:22<00:10,  3.86it/s][A
Training:  85%|████████▌ | 229/269 [01:23<00:19,  2.08it/s][A
Training:  86%|████████▌ | 231/269 [01:23<00:12,  3.05it/s][A
Training:  87%|████████▋ | 233/269 [01:24<00:16,  2.22it/s][A
Training:  87%|████████▋ | 235/269 [01:25<00:10,  3.15it/s][A
Training:  88%|████████▊ | 237/269 [01:26<00:14,  2.24it/s][A
Training:  89%|████████▉ | 239/269 [01:26<00:09,  3.07it/s][A
Training:  90%|████████▉ | 241/269 [01:28<00:12,  2.28it/s][A
Training:  90%|████████▉ | 242/269 [01:28<00:10,  2.49it/s][A
Training:  91%|█████████ | 244/269 [01:28<00:07,  3.50i

Epoch: 54/96 - Loss: 12878.7979 - Accuracy: 0.9227



  0%|          | 0/34 [00:00<?, ?it/s][A
  3%|▎         | 1/34 [00:01<01:04,  1.95s/it][A
  9%|▉         | 3/34 [00:02<00:17,  1.79it/s][A
 15%|█▍        | 5/34 [00:03<00:16,  1.77it/s][A
 21%|██        | 7/34 [00:03<00:09,  2.82it/s][A
 26%|██▋       | 9/34 [00:04<00:09,  2.53it/s][A
 29%|██▉       | 10/34 [00:04<00:09,  2.59it/s][A
 38%|███▊      | 13/34 [00:05<00:07,  2.80it/s][A
 41%|████      | 14/34 [00:05<00:06,  2.92it/s][A
 47%|████▋     | 16/34 [00:06<00:04,  4.00it/s][A
 50%|█████     | 17/34 [00:06<00:06,  2.79it/s][A
 53%|█████▎    | 18/34 [00:07<00:05,  3.03it/s][A
 62%|██████▏   | 21/34 [00:08<00:04,  3.13it/s][A
 65%|██████▍   | 22/34 [00:08<00:03,  3.27it/s][A
 74%|███████▎  | 25/34 [00:09<00:02,  3.07it/s][A
 76%|███████▋  | 26/34 [00:09<00:02,  3.02it/s][A
 82%|████████▏ | 28/34 [00:09<00:01,  4.20it/s][A
 85%|████████▌ | 29/34 [00:10<00:01,  2.88it/s][A
 88%|████████▊ | 30/34 [00:10<00:01,  3.05it/s][A
100%|██████████| 34/34 [00:11<00:00,  2.87it

Val Loss: 15191.8057 - Val Accuracy: 0.9368



Training:   0%|          | 0/269 [00:00<?, ?it/s][A
Training:   0%|          | 1/269 [00:02<09:52,  2.21s/it][A
Training:   1%|          | 3/269 [00:02<02:49,  1.57it/s][A
Training:   2%|▏         | 5/269 [00:03<02:57,  1.49it/s][A
Training:   2%|▏         | 6/269 [00:03<02:16,  1.93it/s][A
Training:   3%|▎         | 8/269 [00:04<01:22,  3.15it/s][A
Training:   4%|▎         | 10/269 [00:05<01:54,  2.25it/s][A
Training:   5%|▍         | 13/269 [00:06<01:59,  2.14it/s][A
Training:   6%|▌         | 16/269 [00:06<01:15,  3.37it/s][A
Training:   7%|▋         | 18/269 [00:08<01:40,  2.50it/s][A
Training:   8%|▊         | 21/269 [00:09<01:35,  2.59it/s][A
Training:   9%|▊         | 23/269 [00:09<01:15,  3.26it/s][A
Training:   9%|▉         | 25/269 [00:10<01:38,  2.48it/s][A
Training:  10%|█         | 27/269 [00:10<01:15,  3.21it/s][A
Training:  11%|█         | 29/269 [00:12<01:37,  2.46it/s][A
Training:  12%|█▏        | 32/269 [00:12<01:03,  3.73it/s][A
Training:  13%|█▎    

Epoch: 55/96 - Loss: 13768.9053 - Accuracy: 0.9196



  0%|          | 0/34 [00:00<?, ?it/s][A
  3%|▎         | 1/34 [00:01<00:57,  1.74s/it][A
 15%|█▍        | 5/34 [00:02<00:14,  1.95it/s][A
 26%|██▋       | 9/34 [00:04<00:10,  2.43it/s][A
 32%|███▏      | 11/34 [00:04<00:07,  3.23it/s][A
 38%|███▊      | 13/34 [00:05<00:07,  2.65it/s][A
 47%|████▋     | 16/34 [00:05<00:04,  4.02it/s][A
 53%|█████▎    | 18/34 [00:06<00:05,  3.10it/s][A
 62%|██████▏   | 21/34 [00:07<00:04,  2.87it/s][A
 68%|██████▊   | 23/34 [00:07<00:03,  3.66it/s][A
 74%|███████▎  | 25/34 [00:09<00:03,  2.70it/s][A
 79%|███████▉  | 27/34 [00:09<00:02,  3.50it/s][A
 85%|████████▌ | 29/34 [00:10<00:01,  2.67it/s][A
 94%|█████████▍| 32/34 [00:10<00:00,  4.00it/s][A
100%|██████████| 34/34 [00:11<00:00,  2.88it/s][A
Epochs:  57%|█████▋    | 55/96 [1:39:07<1:14:14, 108.65s/it]

Val Loss: 13730.8066 - Val Accuracy: 0.9162



Training:   0%|          | 0/269 [00:00<?, ?it/s][A
Training:   0%|          | 1/269 [00:02<09:36,  2.15s/it][A
Training:   1%|          | 3/269 [00:02<02:40,  1.66it/s][A
Training:   2%|▏         | 5/269 [00:03<03:00,  1.47it/s][A
Training:   3%|▎         | 7/269 [00:03<01:51,  2.35it/s][A
Training:   3%|▎         | 9/269 [00:05<02:14,  1.93it/s][A
Training:   4%|▍         | 12/269 [00:05<01:18,  3.28it/s][A
Training:   5%|▌         | 14/269 [00:06<01:45,  2.43it/s][A
Training:   6%|▋         | 17/269 [00:08<01:47,  2.35it/s][A
Training:   7%|▋         | 19/269 [00:08<01:22,  3.04it/s][A
Training:   8%|▊         | 21/269 [00:09<01:49,  2.27it/s][A
Training:   9%|▊         | 23/269 [00:09<01:22,  2.98it/s][A
Training:   9%|▉         | 25/269 [00:10<01:39,  2.46it/s][A
Training:  10%|█         | 28/269 [00:11<01:04,  3.76it/s][A
Training:  11%|█         | 30/269 [00:12<01:31,  2.60it/s][A
Training:  12%|█▏        | 32/269 [00:12<01:11,  3.33it/s][A
Training:  13%|█▎    

Training:  97%|█████████▋| 261/269 [01:34<00:03,  2.28it/s][A
Training:  98%|█████████▊| 263/269 [01:34<00:01,  3.11it/s][A
Training:  99%|█████████▊| 265/269 [01:35<00:01,  2.66it/s][A
Training:  99%|█████████▉| 267/269 [01:35<00:00,  3.09it/s][A
Training: 100%|██████████| 269/269 [01:36<00:00,  3.08it/s][A
                                                           [A

Epoch: 56/96 - Loss: 13582.3926 - Accuracy: 0.9180



  0%|          | 0/34 [00:00<?, ?it/s][A
  3%|▎         | 1/34 [00:01<00:57,  1.75s/it][A
 15%|█▍        | 5/34 [00:02<00:15,  1.93it/s][A
 21%|██        | 7/34 [00:03<00:09,  2.83it/s][A
 26%|██▋       | 9/34 [00:04<00:10,  2.29it/s][A
 35%|███▌      | 12/34 [00:04<00:05,  3.74it/s][A
 41%|████      | 14/34 [00:05<00:06,  3.01it/s][A
 47%|████▋     | 16/34 [00:05<00:04,  3.92it/s][A
 53%|█████▎    | 18/34 [00:06<00:05,  3.19it/s][A
 59%|█████▉    | 20/34 [00:06<00:03,  3.98it/s][A
 62%|██████▏   | 21/34 [00:07<00:04,  2.66it/s][A
 71%|███████   | 24/34 [00:07<00:02,  3.90it/s][A
 74%|███████▎  | 25/34 [00:08<00:03,  2.83it/s][A
 82%|████████▏ | 28/34 [00:09<00:01,  3.99it/s][A
 85%|████████▌ | 29/34 [00:10<00:01,  2.75it/s][A
 94%|█████████▍| 32/34 [00:10<00:00,  4.38it/s][A
100%|██████████| 34/34 [00:11<00:00,  3.01it/s][A
Epochs:  58%|█████▊    | 56/96 [1:40:55<1:12:17, 108.43s/it]

Val Loss: 14296.7598 - Val Accuracy: 0.8885



Training:   0%|          | 0/269 [00:00<?, ?it/s][A
Training:   0%|          | 1/269 [00:02<09:16,  2.07s/it][A
Training:   1%|▏         | 4/269 [00:02<01:52,  2.37it/s][A
Training:   2%|▏         | 6/269 [00:03<02:31,  1.74it/s][A
Training:   3%|▎         | 9/269 [00:05<02:11,  1.98it/s][A
Training:   4%|▎         | 10/269 [00:05<01:52,  2.31it/s][A
Training:   5%|▍         | 13/269 [00:06<01:51,  2.30it/s][A
Training:   5%|▌         | 14/269 [00:06<01:39,  2.57it/s][A
Training:   6%|▌         | 16/269 [00:06<01:10,  3.59it/s][A
Training:   6%|▋         | 17/269 [00:07<01:53,  2.22it/s][A
Training:   7%|▋         | 18/269 [00:08<01:39,  2.51it/s][A
Training:   7%|▋         | 20/269 [00:08<01:06,  3.74it/s][A
Training:   8%|▊         | 21/269 [00:09<01:50,  2.25it/s][A
Training:   8%|▊         | 22/269 [00:09<01:44,  2.36it/s][A
Training:   9%|▉         | 25/269 [00:10<01:40,  2.44it/s][A
Training:  10%|▉         | 26/269 [00:11<01:33,  2.59it/s][A
Training:  11%|█    

Training:  80%|███████▉  | 214/269 [01:18<00:21,  2.54it/s][A
Training:  81%|████████  | 217/269 [01:19<00:17,  2.96it/s][A
Training:  81%|████████  | 218/269 [01:19<00:18,  2.72it/s][A
Training:  81%|████████▏ | 219/269 [01:19<00:15,  3.21it/s][A
Training:  82%|████████▏ | 221/269 [01:20<00:17,  2.71it/s][A
Training:  83%|████████▎ | 222/269 [01:21<00:18,  2.58it/s][A
Training:  84%|████████▎ | 225/269 [01:21<00:15,  2.91it/s][A
Training:  84%|████████▍ | 226/269 [01:22<00:15,  2.76it/s][A
Training:  85%|████████▌ | 229/269 [01:23<00:12,  3.26it/s][A
Training:  86%|████████▌ | 230/269 [01:23<00:14,  2.67it/s][A
Training:  86%|████████▌ | 232/269 [01:23<00:10,  3.67it/s][A
Training:  87%|████████▋ | 233/269 [01:24<00:11,  3.01it/s][A
Training:  87%|████████▋ | 234/269 [01:25<00:15,  2.30it/s][A
Training:  88%|████████▊ | 236/269 [01:25<00:09,  3.41it/s][A
Training:  88%|████████▊ | 237/269 [01:26<00:11,  2.73it/s][A
Training:  88%|████████▊ | 238/269 [01:26<00:13,  2.29i

Epoch: 57/96 - Loss: 14051.8047 - Accuracy: 0.9155



  0%|          | 0/34 [00:00<?, ?it/s][A
  3%|▎         | 1/34 [00:02<01:06,  2.01s/it][A
  9%|▉         | 3/34 [00:02<00:18,  1.69it/s][A
 15%|█▍        | 5/34 [00:03<00:16,  1.71it/s][A
 21%|██        | 7/34 [00:03<00:09,  2.73it/s][A
 26%|██▋       | 9/34 [00:04<00:11,  2.23it/s][A
 32%|███▏      | 11/34 [00:04<00:07,  3.14it/s][A
 38%|███▊      | 13/34 [00:06<00:08,  2.36it/s][A
 47%|████▋     | 16/34 [00:06<00:04,  3.73it/s][A
 53%|█████▎    | 18/34 [00:07<00:05,  2.87it/s][A
 62%|██████▏   | 21/34 [00:08<00:04,  2.90it/s][A
 74%|███████▎  | 25/34 [00:09<00:02,  3.20it/s][A
 82%|████████▏ | 28/34 [00:09<00:01,  4.38it/s][A
 88%|████████▊ | 30/34 [00:10<00:01,  3.27it/s][A
 91%|█████████ | 31/34 [00:10<00:00,  3.55it/s][A
 94%|█████████▍| 32/34 [00:10<00:00,  3.97it/s][A
100%|██████████| 34/34 [00:11<00:00,  2.87it/s][A
Epochs:  59%|█████▉    | 57/96 [1:42:44<1:10:37, 108.67s/it]

Val Loss: 14994.6865 - Val Accuracy: 0.8709



Training:   0%|          | 0/269 [00:00<?, ?it/s][A
Training:   0%|          | 1/269 [00:01<08:16,  1.85s/it][A
Training:   1%|          | 2/269 [00:01<03:44,  1.19it/s][A
Training:   1%|          | 3/269 [00:02<02:13,  1.99it/s][A
Training:   2%|▏         | 5/269 [00:03<02:22,  1.86it/s][A
Training:   2%|▏         | 6/269 [00:03<02:07,  2.06it/s][A
Training:   3%|▎         | 9/269 [00:04<01:47,  2.41it/s][A
Training:   4%|▎         | 10/269 [00:04<01:36,  2.68it/s][A
Training:   4%|▍         | 11/269 [00:05<01:22,  3.12it/s][A
Training:   5%|▍         | 13/269 [00:06<01:46,  2.40it/s][A
Training:   5%|▌         | 14/269 [00:06<01:36,  2.64it/s][A
Training:   6%|▋         | 17/269 [00:07<01:43,  2.44it/s][A
Training:   7%|▋         | 18/269 [00:07<01:35,  2.62it/s][A
Training:   7%|▋         | 20/269 [00:08<01:08,  3.65it/s][A
Training:   8%|▊         | 21/269 [00:09<01:42,  2.42it/s][A
Training:   8%|▊         | 22/269 [00:09<01:45,  2.33it/s][A
Training:   9%|▉      

Training:  76%|███████▌  | 205/269 [01:15<00:20,  3.14it/s][A
Training:  77%|███████▋  | 206/269 [01:16<00:25,  2.49it/s][A
Training:  77%|███████▋  | 208/269 [01:16<00:15,  3.85it/s][A
Training:  78%|███████▊  | 209/269 [01:16<00:18,  3.31it/s][A
Training:  78%|███████▊  | 210/269 [01:17<00:28,  2.06it/s][A
Training:  79%|███████▉  | 212/269 [01:17<00:17,  3.26it/s][A
Training:  79%|███████▉  | 213/269 [01:18<00:17,  3.23it/s][A
Training:  80%|███████▉  | 214/269 [01:19<00:28,  1.94it/s][A
Training:  80%|████████  | 216/269 [01:19<00:17,  3.09it/s][A
Training:  81%|████████  | 217/269 [01:19<00:15,  3.47it/s][A
Training:  81%|████████  | 218/269 [01:20<00:24,  2.12it/s][A
Training:  82%|████████▏ | 220/269 [01:20<00:14,  3.31it/s][A
Training:  82%|████████▏ | 221/269 [01:20<00:12,  3.85it/s][A
Training:  83%|████████▎ | 222/269 [01:21<00:22,  2.08it/s][A
Training:  83%|████████▎ | 224/269 [01:22<00:13,  3.26it/s][A
Training:  84%|████████▎ | 225/269 [01:22<00:13,  3.18i

Epoch: 58/96 - Loss: 14559.1309 - Accuracy: 0.9223



  0%|          | 0/34 [00:00<?, ?it/s][A
  3%|▎         | 1/34 [00:01<01:00,  1.84s/it][A
  6%|▌         | 2/34 [00:02<00:28,  1.11it/s][A
 12%|█▏        | 4/34 [00:02<00:11,  2.64it/s][A
 15%|█▍        | 5/34 [00:03<00:16,  1.79it/s][A
 18%|█▊        | 6/34 [00:03<00:13,  2.09it/s][A
 26%|██▋       | 9/34 [00:04<00:09,  2.71it/s][A
 29%|██▉       | 10/34 [00:04<00:09,  2.49it/s][A
 38%|███▊      | 13/34 [00:05<00:06,  3.14it/s][A
 41%|████      | 14/34 [00:06<00:07,  2.78it/s][A
 47%|████▋     | 16/34 [00:06<00:04,  3.92it/s][A
 50%|█████     | 17/34 [00:06<00:05,  3.32it/s][A
 53%|█████▎    | 18/34 [00:07<00:06,  2.65it/s][A
 62%|██████▏   | 21/34 [00:07<00:03,  3.51it/s][A
 65%|██████▍   | 22/34 [00:08<00:04,  2.74it/s][A
 71%|███████   | 24/34 [00:08<00:02,  3.80it/s][A
 74%|███████▎  | 25/34 [00:09<00:02,  3.26it/s][A
 76%|███████▋  | 26/34 [00:09<00:03,  2.50it/s][A
 85%|████████▌ | 29/34 [00:10<00:01,  3.75it/s][A
 88%|████████▊ | 30/34 [00:10<00:01,  3.20it/

Val Loss: 14993.5156 - Val Accuracy: 0.8996



Training:   0%|          | 0/269 [00:00<?, ?it/s][A
Training:   0%|          | 1/269 [00:02<09:23,  2.10s/it][A
Training:   1%|          | 3/269 [00:02<02:35,  1.71it/s][A
Training:   2%|▏         | 5/269 [00:03<02:31,  1.74it/s][A
Training:   3%|▎         | 7/269 [00:03<01:32,  2.83it/s][A
Training:   3%|▎         | 9/269 [00:04<02:07,  2.05it/s][A
Training:   4%|▍         | 11/269 [00:05<01:27,  2.94it/s][A
Training:   5%|▍         | 13/269 [00:06<01:52,  2.27it/s][A
Training:   6%|▌         | 15/269 [00:06<01:20,  3.15it/s][A
Training:   6%|▋         | 17/269 [00:07<01:53,  2.21it/s][A
Training:   7%|▋         | 19/269 [00:08<01:23,  3.01it/s][A
Training:   8%|▊         | 21/269 [00:09<01:43,  2.40it/s][A
Training:   9%|▉         | 24/269 [00:09<01:05,  3.75it/s][A
Training:  10%|▉         | 26/269 [00:10<01:34,  2.56it/s][A
Training:  11%|█         | 29/269 [00:12<01:39,  2.41it/s][A
Training:  12%|█▏        | 33/269 [00:13<01:31,  2.57it/s][A
Training:  13%|█▎    

Training:  91%|█████████ | 245/269 [01:27<00:10,  2.36it/s][A
Training:  92%|█████████▏| 247/269 [01:27<00:06,  3.22it/s][A
Training:  93%|█████████▎| 249/269 [01:29<00:08,  2.40it/s][A
Training:  94%|█████████▎| 252/269 [01:29<00:04,  3.75it/s][A
Training:  94%|█████████▍| 254/269 [01:30<00:05,  2.85it/s][A
Training:  96%|█████████▌| 257/269 [01:31<00:04,  2.64it/s][A
Training:  97%|█████████▋| 261/269 [01:33<00:02,  2.71it/s][A
Training:  98%|█████████▊| 263/269 [01:33<00:01,  3.37it/s][A
Training:  99%|█████████▊| 265/269 [01:34<00:01,  2.81it/s][A
Training: 100%|██████████| 269/269 [01:35<00:00,  3.31it/s][A
                                                           [A

Epoch: 59/96 - Loss: 14458.9795 - Accuracy: 0.9194



  0%|          | 0/34 [00:00<?, ?it/s][A
  3%|▎         | 1/34 [00:01<00:50,  1.52s/it][A
  6%|▌         | 2/34 [00:01<00:24,  1.31it/s][A
  9%|▉         | 3/34 [00:01<00:14,  2.16it/s][A
 12%|█▏        | 4/34 [00:01<00:09,  3.07it/s][A
 15%|█▍        | 5/34 [00:02<00:14,  2.02it/s][A
 21%|██        | 7/34 [00:02<00:07,  3.62it/s][A
 24%|██▎       | 8/34 [00:03<00:06,  4.06it/s][A
 26%|██▋       | 9/34 [00:04<00:11,  2.17it/s][A
 29%|██▉       | 10/34 [00:04<00:08,  2.77it/s][A
 35%|███▌      | 12/34 [00:04<00:05,  3.97it/s][A
 38%|███▊      | 13/34 [00:05<00:08,  2.38it/s][A
 47%|████▋     | 16/34 [00:05<00:04,  4.39it/s][A
 53%|█████▎    | 18/34 [00:06<00:05,  2.99it/s][A
 59%|█████▉    | 20/34 [00:06<00:03,  3.97it/s][A
 62%|██████▏   | 21/34 [00:07<00:04,  2.72it/s][A
 65%|██████▍   | 22/34 [00:07<00:03,  3.20it/s][A
 68%|██████▊   | 23/34 [00:07<00:03,  3.59it/s][A
 71%|███████   | 24/34 [00:08<00:02,  4.15it/s][A
 74%|███████▎  | 25/34 [00:08<00:03,  2.42it/s]

Val Loss: 14766.9717 - Val Accuracy: 0.9172



Training:   0%|          | 0/269 [00:00<?, ?it/s][A
Training:   0%|          | 1/269 [00:01<07:04,  1.58s/it][A
Training:   1%|          | 2/269 [00:01<03:27,  1.29it/s][A
Training:   1%|▏         | 4/269 [00:01<01:26,  3.08it/s][A
Training:   2%|▏         | 5/269 [00:02<02:05,  2.10it/s][A
Training:   2%|▏         | 6/269 [00:03<02:10,  2.01it/s][A
Training:   3%|▎         | 8/269 [00:03<01:16,  3.43it/s][A
Training:   3%|▎         | 9/269 [00:04<01:45,  2.46it/s][A
Training:   4%|▎         | 10/269 [00:04<01:48,  2.38it/s][A
Training:   5%|▍         | 13/269 [00:05<01:31,  2.79it/s][A
Training:   5%|▌         | 14/269 [00:05<01:32,  2.76it/s][A
Training:   6%|▋         | 17/269 [00:06<01:30,  2.79it/s][A
Training:   7%|▋         | 18/269 [00:07<01:28,  2.84it/s][A
Training:   8%|▊         | 21/269 [00:08<01:24,  2.94it/s][A
Training:   8%|▊         | 22/269 [00:08<01:28,  2.80it/s][A
Training:   9%|▉         | 24/269 [00:08<01:03,  3.83it/s][A
Training:   9%|▉       

Training:  81%|████████  | 218/269 [01:17<00:23,  2.16it/s][A
Training:  82%|████████▏ | 220/269 [01:17<00:16,  3.04it/s][A
Training:  83%|████████▎ | 222/269 [01:18<00:20,  2.27it/s][A
Training:  83%|████████▎ | 224/269 [01:18<00:14,  3.07it/s][A
Training:  84%|████████▍ | 226/269 [01:20<00:18,  2.28it/s][A
Training:  85%|████████▌ | 229/269 [01:20<00:11,  3.59it/s][A
Training:  86%|████████▌ | 231/269 [01:21<00:15,  2.43it/s][A
Training:  87%|████████▋ | 233/269 [01:21<00:11,  3.23it/s][A
Training:  87%|████████▋ | 235/269 [01:23<00:13,  2.52it/s][A
Training:  88%|████████▊ | 238/269 [01:24<00:12,  2.40it/s][A
Training:  90%|████████▉ | 241/269 [01:24<00:07,  3.51it/s][A
Training:  90%|█████████ | 243/269 [01:25<00:09,  2.61it/s][A
Training:  91%|█████████ | 245/269 [01:26<00:07,  3.38it/s][A
Training:  92%|█████████▏| 247/269 [01:27<00:08,  2.51it/s][A
Training:  93%|█████████▎| 250/269 [01:28<00:07,  2.41it/s][A
Training:  94%|█████████▎| 252/269 [01:28<00:05,  2.98i

Epoch: 60/96 - Loss: 14630.4893 - Accuracy: 0.9184



  0%|          | 0/34 [00:00<?, ?it/s][A
  3%|▎         | 1/34 [00:01<00:53,  1.61s/it][A
  6%|▌         | 2/34 [00:01<00:23,  1.36it/s][A
 15%|█▍        | 5/34 [00:02<00:13,  2.17it/s][A
 21%|██        | 7/34 [00:02<00:08,  3.22it/s][A
 26%|██▋       | 9/34 [00:04<00:09,  2.54it/s][A
 32%|███▏      | 11/34 [00:04<00:06,  3.56it/s][A
 38%|███▊      | 13/34 [00:05<00:07,  2.76it/s][A
 41%|████      | 14/34 [00:05<00:06,  3.14it/s][A
 50%|█████     | 17/34 [00:06<00:05,  2.95it/s][A
 59%|█████▉    | 20/34 [00:06<00:03,  4.42it/s][A
 62%|██████▏   | 21/34 [00:07<00:04,  2.73it/s][A
 68%|██████▊   | 23/34 [00:07<00:03,  3.64it/s][A
 74%|███████▎  | 25/34 [00:09<00:03,  2.66it/s][A
 79%|███████▉  | 27/34 [00:09<00:01,  3.60it/s][A
 85%|████████▌ | 29/34 [00:10<00:01,  2.66it/s][A
 94%|█████████▍| 32/34 [00:10<00:00,  4.01it/s][A
100%|██████████| 34/34 [00:11<00:00,  2.88it/s][A
Epochs:  62%|██████▎   | 60/96 [1:48:06<1:04:37, 107.70s/it]

Val Loss: 14850.6436 - Val Accuracy: 0.9227



Training:   0%|          | 0/269 [00:00<?, ?it/s][A
Training:   0%|          | 1/269 [00:01<08:20,  1.87s/it][A
Training:   1%|          | 2/269 [00:01<03:42,  1.20it/s][A
Training:   1%|▏         | 4/269 [00:02<01:33,  2.83it/s][A
Training:   2%|▏         | 5/269 [00:03<02:37,  1.67it/s][A
Training:   2%|▏         | 6/269 [00:03<02:00,  2.18it/s][A
Training:   3%|▎         | 8/269 [00:03<01:13,  3.57it/s][A
Training:   3%|▎         | 9/269 [00:04<02:01,  2.14it/s][A
Training:   4%|▍         | 11/269 [00:04<01:19,  3.25it/s][A
Training:   5%|▍         | 13/269 [00:06<01:52,  2.28it/s][A
Training:   6%|▌         | 15/269 [00:06<01:18,  3.23it/s][A
Training:   6%|▋         | 17/269 [00:07<01:43,  2.44it/s][A
Training:   7%|▋         | 18/269 [00:07<01:30,  2.78it/s][A
Training:   7%|▋         | 19/269 [00:07<01:16,  3.29it/s][A
Training:   8%|▊         | 21/269 [00:08<01:35,  2.58it/s][A
Training:   8%|▊         | 22/269 [00:08<01:22,  2.99it/s][A
Training:   9%|▉       

Training:  88%|████████▊ | 238/269 [01:27<00:11,  2.70it/s][A
Training:  90%|████████▉ | 241/269 [01:29<00:11,  2.50it/s][A
Training:  90%|█████████ | 243/269 [01:29<00:08,  3.13it/s][A
Training:  91%|█████████ | 245/269 [01:30<00:09,  2.51it/s][A
Training:  92%|█████████▏| 247/269 [01:30<00:06,  3.27it/s][A
Training:  93%|█████████▎| 249/269 [01:31<00:07,  2.55it/s][A
Training:  93%|█████████▎| 251/269 [01:31<00:05,  3.34it/s][A
Training:  94%|█████████▍| 253/269 [01:33<00:06,  2.45it/s][A
Training:  95%|█████████▍| 255/269 [01:33<00:04,  3.21it/s][A
Training:  96%|█████████▌| 257/269 [01:34<00:04,  2.48it/s][A
Training:  96%|█████████▋| 259/269 [01:34<00:03,  3.28it/s][A
Training:  97%|█████████▋| 261/269 [01:36<00:03,  2.33it/s][A
Training:  98%|█████████▊| 263/269 [01:36<00:01,  3.08it/s][A
Training:  99%|█████████▊| 265/269 [01:37<00:01,  2.58it/s][A
Training:  99%|█████████▉| 267/269 [01:37<00:00,  3.46it/s][A
Training: 100%|██████████| 269/269 [01:38<00:00,  2.91i

Epoch: 61/96 - Loss: 13875.7441 - Accuracy: 0.9153



  0%|          | 0/34 [00:00<?, ?it/s][A
  3%|▎         | 1/34 [00:01<00:58,  1.78s/it][A
  9%|▉         | 3/34 [00:01<00:15,  2.01it/s][A
 15%|█▍        | 5/34 [00:03<00:15,  1.86it/s][A
 21%|██        | 7/34 [00:03<00:08,  3.01it/s][A
 26%|██▋       | 9/34 [00:04<00:11,  2.18it/s][A
 35%|███▌      | 12/34 [00:04<00:06,  3.67it/s][A
 41%|████      | 14/34 [00:05<00:06,  2.92it/s][A
 50%|█████     | 17/34 [00:06<00:06,  2.65it/s][A
 56%|█████▌    | 19/34 [00:07<00:04,  3.36it/s][A
 62%|██████▏   | 21/34 [00:08<00:04,  2.67it/s][A
 74%|███████▎  | 25/34 [00:09<00:02,  3.03it/s][A
 82%|████████▏ | 28/34 [00:09<00:01,  4.21it/s][A
 88%|████████▊ | 30/34 [00:10<00:01,  3.37it/s][A
100%|██████████| 34/34 [00:11<00:00,  2.89it/s][A
Epochs:  64%|██████▎   | 61/96 [1:49:57<1:03:19, 108.57s/it]

Val Loss: 13671.5605 - Val Accuracy: 0.9373



Training:   0%|          | 0/269 [00:00<?, ?it/s][A
Training:   0%|          | 1/269 [00:02<09:29,  2.12s/it][A
Training:   1%|          | 3/269 [00:02<02:44,  1.62it/s][A
Training:   2%|▏         | 5/269 [00:03<02:58,  1.48it/s][A
Training:   3%|▎         | 7/269 [00:03<01:48,  2.41it/s][A
Training:   3%|▎         | 9/269 [00:05<02:10,  1.99it/s][A
Training:   4%|▍         | 11/269 [00:05<01:28,  2.91it/s][A
Training:   5%|▍         | 13/269 [00:06<01:53,  2.27it/s][A
Training:   5%|▌         | 14/269 [00:06<01:36,  2.65it/s][A
Training:   6%|▌         | 16/269 [00:06<01:09,  3.65it/s][A
Training:   6%|▋         | 17/269 [00:08<01:58,  2.12it/s][A
Training:   7%|▋         | 20/269 [00:08<01:07,  3.71it/s][A
Training:   8%|▊         | 22/269 [00:09<01:37,  2.54it/s][A
Training:   9%|▉         | 24/269 [00:09<01:11,  3.41it/s][A
Training:  10%|▉         | 26/269 [00:11<01:46,  2.28it/s][A
Training:  10%|█         | 28/269 [00:11<01:17,  3.11it/s][A
Training:  11%|█     

Epoch: 62/96 - Loss: 13882.6201 - Accuracy: 0.9208



  0%|          | 0/34 [00:00<?, ?it/s][A
  3%|▎         | 1/34 [00:01<00:57,  1.75s/it][A
  9%|▉         | 3/34 [00:01<00:15,  2.00it/s][A
 12%|█▏        | 4/34 [00:01<00:10,  2.75it/s][A
 15%|█▍        | 5/34 [00:02<00:14,  2.02it/s][A
 24%|██▎       | 8/34 [00:02<00:06,  4.15it/s][A
 26%|██▋       | 9/34 [00:03<00:09,  2.68it/s][A
 32%|███▏      | 11/34 [00:03<00:05,  4.01it/s][A
 38%|███▊      | 13/34 [00:05<00:07,  2.76it/s][A
 47%|████▋     | 16/34 [00:05<00:03,  4.53it/s][A
 53%|█████▎    | 18/34 [00:05<00:04,  3.56it/s][A
 62%|██████▏   | 21/34 [00:07<00:04,  3.23it/s][A
 71%|███████   | 24/34 [00:07<00:02,  4.71it/s][A
 76%|███████▋  | 26/34 [00:08<00:02,  3.59it/s][A
 85%|████████▌ | 29/34 [00:09<00:01,  3.38it/s][A
 94%|█████████▍| 32/34 [00:09<00:00,  4.79it/s][A
100%|██████████| 34/34 [00:10<00:00,  3.39it/s][A
Epochs:  65%|██████▍   | 62/96 [1:51:45<1:01:29, 108.53s/it]

Val Loss: 14458.2412 - Val Accuracy: 0.9128



Training:   0%|          | 0/269 [00:00<?, ?it/s][A
Training:   0%|          | 1/269 [00:01<06:12,  1.39s/it][A
Training:   1%|          | 2/269 [00:01<02:49,  1.57it/s][A
Training:   2%|▏         | 5/269 [00:02<01:50,  2.40it/s][A
Training:   2%|▏         | 6/269 [00:02<01:30,  2.90it/s][A
Training:   3%|▎         | 9/269 [00:03<01:26,  3.02it/s][A
Training:   4%|▍         | 11/269 [00:03<01:02,  4.12it/s][A
Training:   5%|▍         | 13/269 [00:04<01:22,  3.10it/s][A
Training:   5%|▌         | 14/269 [00:04<01:12,  3.53it/s][A
Training:   6%|▋         | 17/269 [00:06<01:24,  2.99it/s][A
Training:   8%|▊         | 21/269 [00:06<01:13,  3.38it/s][A
Training:   9%|▉         | 25/269 [00:08<01:14,  3.28it/s][A
Training:  10%|█         | 27/269 [00:08<01:00,  4.02it/s][A
Training:  11%|█         | 29/269 [00:09<01:17,  3.08it/s][A
Training:  12%|█▏        | 32/269 [00:09<00:54,  4.38it/s][A
Training:  13%|█▎        | 34/269 [00:10<01:14,  3.17it/s][A
Training:  14%|█▍    

Epoch: 63/96 - Loss: 14329.5752 - Accuracy: 0.9202



  0%|          | 0/34 [00:00<?, ?it/s][A
  3%|▎         | 1/34 [00:01<00:47,  1.44s/it][A
 12%|█▏        | 4/34 [00:01<00:09,  3.32it/s][A
 18%|█▊        | 6/34 [00:02<00:10,  2.55it/s][A
 26%|██▋       | 9/34 [00:03<00:08,  2.92it/s][A
 29%|██▉       | 10/34 [00:03<00:07,  3.26it/s][A
 38%|███▊      | 13/34 [00:04<00:06,  3.50it/s][A
 41%|████      | 14/34 [00:04<00:05,  3.81it/s][A
 50%|█████     | 17/34 [00:05<00:04,  3.78it/s][A
 53%|█████▎    | 18/34 [00:05<00:04,  3.86it/s][A
 62%|██████▏   | 21/34 [00:06<00:03,  3.95it/s][A
 65%|██████▍   | 22/34 [00:06<00:02,  4.24it/s][A
 74%|███████▎  | 25/34 [00:06<00:01,  4.76it/s][A
 76%|███████▋  | 26/34 [00:07<00:01,  4.82it/s][A
 85%|████████▌ | 29/34 [00:07<00:00,  5.28it/s][A
 88%|████████▊ | 30/34 [00:07<00:00,  5.29it/s][A
100%|██████████| 34/34 [00:08<00:00,  4.06it/s][A
Epochs:  66%|██████▌   | 63/96 [1:53:11<55:51, 101.56s/it]  

Val Loss: 16326.3477 - Val Accuracy: 0.9105



Training:   0%|          | 0/269 [00:00<?, ?it/s][A
Training:   0%|          | 1/269 [00:01<04:43,  1.06s/it][A
Training:   1%|▏         | 4/269 [00:01<01:02,  4.23it/s][A
Training:   2%|▏         | 6/269 [00:01<01:13,  3.56it/s][A
Training:   3%|▎         | 9/269 [00:02<01:05,  3.99it/s][A
Training:   4%|▎         | 10/269 [00:02<01:00,  4.26it/s][A
Training:   5%|▍         | 13/269 [00:03<01:00,  4.20it/s][A
Training:   5%|▌         | 14/269 [00:03<00:56,  4.54it/s][A
Training:   6%|▌         | 16/269 [00:03<00:41,  6.08it/s][A
Training:   7%|▋         | 18/269 [00:04<00:59,  4.25it/s][A
Training:   8%|▊         | 21/269 [00:05<00:57,  4.29it/s][A
Training:   9%|▊         | 23/269 [00:05<00:45,  5.46it/s][A
Training:   9%|▉         | 25/269 [00:06<01:00,  4.05it/s][A
Training:  10%|█         | 28/269 [00:06<00:43,  5.55it/s][A
Training:  11%|█         | 29/269 [00:06<00:58,  4.09it/s][A
Training:  12%|█▏        | 32/269 [00:07<00:40,  5.83it/s][A
Training:  13%|█▎   

Epoch: 64/96 - Loss: 14039.3457 - Accuracy: 0.9199



  0%|          | 0/34 [00:00<?, ?it/s][A
  3%|▎         | 1/34 [00:00<00:32,  1.02it/s][A
 15%|█▍        | 5/34 [00:01<00:09,  3.06it/s][A
 24%|██▎       | 8/34 [00:01<00:04,  5.31it/s][A
 29%|██▉       | 10/34 [00:02<00:05,  4.29it/s][A
 38%|███▊      | 13/34 [00:03<00:04,  4.41it/s][A
 41%|████      | 14/34 [00:03<00:04,  4.77it/s][A
 50%|█████     | 17/34 [00:04<00:03,  4.61it/s][A
 53%|█████▎    | 18/34 [00:04<00:03,  4.79it/s][A
 62%|██████▏   | 21/34 [00:04<00:02,  4.95it/s][A
 65%|██████▍   | 22/34 [00:04<00:02,  5.01it/s][A
 74%|███████▎  | 25/34 [00:05<00:01,  5.29it/s][A
 76%|███████▋  | 26/34 [00:05<00:01,  5.19it/s][A
 85%|████████▌ | 29/34 [00:06<00:01,  4.97it/s][A
 88%|████████▊ | 30/34 [00:06<00:00,  5.23it/s][A
100%|██████████| 34/34 [00:07<00:00,  4.82it/s][A
Epochs:  67%|██████▋   | 64/96 [1:54:15<48:11, 90.37s/it] 

Val Loss: 15754.1504 - Val Accuracy: 0.9094



Training:   0%|          | 0/269 [00:00<?, ?it/s][A
Training:   0%|          | 1/269 [00:01<04:38,  1.04s/it][A
Training:   2%|▏         | 5/269 [00:01<01:26,  3.04it/s][A
Training:   3%|▎         | 9/269 [00:02<01:07,  3.86it/s][A
Training:   5%|▍         | 13/269 [00:03<01:02,  4.11it/s][A
Training:   6%|▋         | 17/269 [00:04<00:56,  4.43it/s][A
Training:   8%|▊         | 21/269 [00:05<00:55,  4.49it/s][A
Training:   9%|▉         | 25/269 [00:06<00:53,  4.58it/s][A
Training:  10%|█         | 28/269 [00:06<00:41,  5.87it/s][A
Training:  11%|█         | 30/269 [00:06<00:50,  4.72it/s][A
Training:  12%|█▏        | 32/269 [00:07<00:41,  5.69it/s][A
Training:  13%|█▎        | 34/269 [00:07<00:55,  4.25it/s][A
Training:  14%|█▍        | 37/269 [00:08<00:56,  4.14it/s][A
Training:  15%|█▌        | 41/269 [00:09<00:53,  4.29it/s][A
Training:  16%|█▌        | 43/269 [00:09<00:43,  5.17it/s][A
Training:  17%|█▋        | 45/269 [00:10<00:53,  4.16it/s][A
Training:  17%|█▋  

Epoch: 65/96 - Loss: 13619.8672 - Accuracy: 0.9166



  0%|          | 0/34 [00:00<?, ?it/s][A
  3%|▎         | 1/34 [00:01<00:34,  1.04s/it][A
 15%|█▍        | 5/34 [00:01<00:09,  3.01it/s][A
 24%|██▎       | 8/34 [00:01<00:04,  5.25it/s][A
 29%|██▉       | 10/34 [00:02<00:05,  4.01it/s][A
 38%|███▊      | 13/34 [00:03<00:05,  4.11it/s][A
 47%|████▋     | 16/34 [00:03<00:03,  5.99it/s][A
 53%|█████▎    | 18/34 [00:04<00:03,  4.58it/s][A
 62%|██████▏   | 21/34 [00:04<00:02,  4.66it/s][A
 74%|███████▎  | 25/34 [00:05<00:01,  5.21it/s][A
 85%|████████▌ | 29/34 [00:06<00:00,  5.25it/s][A
100%|██████████| 34/34 [00:06<00:00,  4.86it/s][A
Epochs:  68%|██████▊   | 65/96 [1:55:20<42:41, 82.63s/it]

Val Loss: 15489.7900 - Val Accuracy: 0.9359



Training:   0%|          | 0/269 [00:00<?, ?it/s][A
Training:   0%|          | 1/269 [00:01<05:19,  1.19s/it][A
Training:   2%|▏         | 5/269 [00:02<01:35,  2.78it/s][A
Training:   3%|▎         | 9/269 [00:02<01:12,  3.61it/s][A
Training:   5%|▍         | 13/269 [00:03<01:04,  3.94it/s][A
Training:   6%|▋         | 17/269 [00:04<01:01,  4.11it/s][A
Training:   8%|▊         | 21/269 [00:05<00:56,  4.36it/s][A
Training:   9%|▉         | 25/269 [00:06<00:56,  4.29it/s][A
Training:  11%|█         | 29/269 [00:07<00:53,  4.45it/s][A
Training:  12%|█▏        | 33/269 [00:08<00:52,  4.48it/s][A
Training:  14%|█▍        | 37/269 [00:09<00:51,  4.54it/s][A
Training:  15%|█▌        | 41/269 [00:09<00:49,  4.64it/s][A
Training:  17%|█▋        | 45/269 [00:10<00:49,  4.52it/s][A
Training:  18%|█▊        | 48/269 [00:10<00:38,  5.69it/s][A
Training:  19%|█▊        | 50/269 [00:11<00:46,  4.70it/s][A
Training:  20%|█▉        | 53/269 [00:12<00:50,  4.31it/s][A
Training:  21%|██  

Epoch: 66/96 - Loss: 15056.7100 - Accuracy: 0.9223



  0%|          | 0/34 [00:00<?, ?it/s][A
  3%|▎         | 1/34 [00:01<00:37,  1.14s/it][A
 15%|█▍        | 5/34 [00:01<00:09,  3.14it/s][A
 24%|██▎       | 8/34 [00:01<00:04,  5.44it/s][A
 29%|██▉       | 10/34 [00:02<00:05,  4.09it/s][A
 38%|███▊      | 13/34 [00:03<00:05,  4.08it/s][A
 50%|█████     | 17/34 [00:04<00:03,  4.87it/s][A
 62%|██████▏   | 21/34 [00:04<00:02,  4.92it/s][A
 74%|███████▎  | 25/34 [00:05<00:01,  5.19it/s][A
 85%|████████▌ | 29/34 [00:06<00:00,  5.51it/s][A
 91%|█████████ | 31/34 [00:06<00:00,  6.28it/s][A
100%|██████████| 34/34 [00:06<00:00,  4.90it/s][A
Epochs:  69%|██████▉   | 66/96 [1:56:24<38:34, 77.14s/it]

Val Loss: 14864.0430 - Val Accuracy: 0.9040



Training:   0%|          | 0/269 [00:00<?, ?it/s][A
Training:   0%|          | 1/269 [00:01<05:06,  1.14s/it][A
Training:   1%|▏         | 4/269 [00:01<01:05,  4.03it/s][A
Training:   2%|▏         | 6/269 [00:02<01:20,  3.25it/s][A
Training:   3%|▎         | 7/269 [00:02<01:08,  3.85it/s][A
Training:   3%|▎         | 9/269 [00:02<01:12,  3.58it/s][A
Training:   4%|▍         | 11/269 [00:02<00:51,  4.97it/s][A
Training:   5%|▍         | 13/269 [00:03<01:04,  3.97it/s][A
Training:   5%|▌         | 14/269 [00:03<00:59,  4.28it/s][A
Training:   6%|▋         | 17/269 [00:04<00:59,  4.25it/s][A
Training:   7%|▋         | 18/269 [00:04<00:54,  4.57it/s][A
Training:   8%|▊         | 21/269 [00:05<00:55,  4.46it/s][A
Training:   8%|▊         | 22/269 [00:05<00:52,  4.71it/s][A
Training:   9%|▉         | 25/269 [00:06<00:54,  4.50it/s][A
Training:  10%|▉         | 26/269 [00:06<00:50,  4.78it/s][A
Training:  11%|█         | 29/269 [00:06<00:51,  4.62it/s][A
Training:  11%|█     

Training:  96%|█████████▌| 257/269 [00:54<00:02,  4.40it/s][A
Training:  96%|█████████▋| 259/269 [00:55<00:02,  4.95it/s][A
Training:  97%|█████████▋| 261/269 [00:55<00:01,  4.23it/s][A
Training:  98%|█████████▊| 263/269 [00:55<00:01,  4.96it/s][A
Training:  99%|█████████▊| 265/269 [00:56<00:00,  4.58it/s][A
Training:  99%|█████████▉| 267/269 [00:56<00:00,  5.39it/s][A
Training: 100%|██████████| 269/269 [00:56<00:00,  5.89it/s][A
                                                           [A

Epoch: 67/96 - Loss: 14010.0742 - Accuracy: 0.9187



  0%|          | 0/34 [00:00<?, ?it/s][A
  3%|▎         | 1/34 [00:01<00:35,  1.07s/it][A
 12%|█▏        | 4/34 [00:01<00:06,  4.36it/s][A
 18%|█▊        | 6/34 [00:01<00:07,  3.69it/s][A
 26%|██▋       | 9/34 [00:02<00:06,  3.80it/s][A
 32%|███▏      | 11/34 [00:02<00:04,  4.95it/s][A
 38%|███▊      | 13/34 [00:03<00:05,  4.15it/s][A
 50%|█████     | 17/34 [00:03<00:03,  5.05it/s][A
 62%|██████▏   | 21/34 [00:04<00:02,  4.99it/s][A
 74%|███████▎  | 25/34 [00:05<00:01,  5.09it/s][A
 85%|████████▌ | 29/34 [00:06<00:00,  5.51it/s][A
100%|██████████| 34/34 [00:06<00:00,  4.95it/s][A
Epochs:  70%|██████▉   | 67/96 [1:57:28<35:22, 73.20s/it]

Val Loss: 16241.7109 - Val Accuracy: 0.9324



Training:   0%|          | 0/269 [00:00<?, ?it/s][A
Training:   0%|          | 1/269 [00:01<05:17,  1.18s/it][A
Training:   2%|▏         | 5/269 [00:02<01:36,  2.74it/s][A
Training:   3%|▎         | 9/269 [00:02<01:12,  3.58it/s][A
Training:   5%|▍         | 13/269 [00:03<01:03,  4.02it/s][A
Training:   6%|▋         | 17/269 [00:04<01:00,  4.20it/s][A
Training:   8%|▊         | 21/269 [00:05<00:56,  4.41it/s][A
Training:   9%|▉         | 25/269 [00:06<00:55,  4.42it/s][A
Training:  10%|█         | 27/269 [00:06<00:46,  5.19it/s][A
Training:  11%|█         | 29/269 [00:07<00:56,  4.25it/s][A
Training:  12%|█▏        | 33/269 [00:08<00:52,  4.49it/s][A
Training:  14%|█▍        | 37/269 [00:08<00:52,  4.40it/s][A
Training:  15%|█▌        | 41/269 [00:09<00:49,  4.58it/s][A
Training:  17%|█▋        | 45/269 [00:10<00:50,  4.42it/s][A
Training:  18%|█▊        | 48/269 [00:10<00:39,  5.57it/s][A
Training:  19%|█▊        | 50/269 [00:11<00:47,  4.63it/s][A
Training:  20%|█▉  

Epoch: 68/96 - Loss: 14377.2100 - Accuracy: 0.9232



  0%|          | 0/34 [00:00<?, ?it/s][A
  3%|▎         | 1/34 [00:01<00:33,  1.00s/it][A
 15%|█▍        | 5/34 [00:01<00:09,  3.20it/s][A
 26%|██▋       | 9/34 [00:02<00:05,  4.23it/s][A
 38%|███▊      | 13/34 [00:03<00:04,  4.78it/s][A
 50%|█████     | 17/34 [00:03<00:03,  4.88it/s][A
 62%|██████▏   | 21/34 [00:04<00:02,  5.22it/s][A
 74%|███████▎  | 25/34 [00:05<00:01,  5.31it/s][A
 85%|████████▌ | 29/34 [00:06<00:00,  5.14it/s][A
100%|██████████| 34/34 [00:06<00:00,  4.96it/s][A
Epochs:  71%|███████   | 68/96 [1:58:33<32:59, 70.69s/it]

Val Loss: 14312.6455 - Val Accuracy: 0.9086



Training:   0%|          | 0/269 [00:00<?, ?it/s][A
Training:   0%|          | 1/269 [00:01<05:10,  1.16s/it][A
Training:   1%|          | 2/269 [00:01<02:25,  1.84it/s][A
Training:   2%|▏         | 5/269 [00:02<01:26,  3.04it/s][A
Training:   2%|▏         | 6/269 [00:02<01:12,  3.61it/s][A
Training:   3%|▎         | 9/269 [00:02<01:07,  3.85it/s][A
Training:   4%|▎         | 10/269 [00:03<01:01,  4.21it/s][A
Training:   5%|▍         | 13/269 [00:03<01:04,  3.99it/s][A
Training:   5%|▌         | 14/269 [00:03<00:58,  4.36it/s][A
Training:   6%|▋         | 17/269 [00:04<00:56,  4.43it/s][A
Training:   7%|▋         | 18/269 [00:04<00:52,  4.74it/s][A
Training:   8%|▊         | 21/269 [00:05<00:54,  4.54it/s][A
Training:   8%|▊         | 22/269 [00:05<00:50,  4.87it/s][A
Training:   9%|▉         | 25/269 [00:06<00:55,  4.40it/s][A
Training:  10%|▉         | 26/269 [00:06<00:50,  4.85it/s][A
Training:  11%|█         | 29/269 [00:07<00:52,  4.56it/s][A
Training:  12%|█▏    

Epoch: 69/96 - Loss: 13656.5762 - Accuracy: 0.9187



  0%|          | 0/34 [00:00<?, ?it/s][A
  3%|▎         | 1/34 [00:01<00:34,  1.04s/it][A
 12%|█▏        | 4/34 [00:01<00:06,  4.46it/s][A
 18%|█▊        | 6/34 [00:01<00:08,  3.41it/s][A
 26%|██▋       | 9/34 [00:02<00:06,  3.90it/s][A
 38%|███▊      | 13/34 [00:03<00:04,  4.60it/s][A
 50%|█████     | 17/34 [00:04<00:03,  4.71it/s][A
 59%|█████▉    | 20/34 [00:04<00:02,  6.29it/s][A
 65%|██████▍   | 22/34 [00:04<00:02,  5.34it/s][A
 74%|███████▎  | 25/34 [00:05<00:01,  5.20it/s][A
 85%|████████▌ | 29/34 [00:06<00:00,  5.10it/s][A
100%|██████████| 34/34 [00:06<00:00,  4.99it/s][A
Epochs:  72%|███████▏  | 69/96 [1:59:37<30:55, 68.71s/it]

Val Loss: 16010.2148 - Val Accuracy: 0.9263



Training:   0%|          | 0/269 [00:00<?, ?it/s][A
Training:   0%|          | 1/269 [00:01<05:26,  1.22s/it][A
Training:   2%|▏         | 5/269 [00:02<01:31,  2.87it/s][A
Training:   3%|▎         | 9/269 [00:02<01:12,  3.60it/s][A
Training:   5%|▍         | 13/269 [00:03<01:03,  4.01it/s][A
Training:   6%|▋         | 17/269 [00:04<00:58,  4.33it/s][A
Training:   7%|▋         | 20/269 [00:04<00:43,  5.77it/s][A
Training:   8%|▊         | 22/269 [00:05<00:57,  4.31it/s][A
Training:   9%|▉         | 25/269 [00:06<00:57,  4.22it/s][A
Training:  11%|█         | 29/269 [00:07<00:56,  4.27it/s][A
Training:  12%|█▏        | 33/269 [00:08<00:54,  4.37it/s][A
Training:  14%|█▍        | 37/269 [00:08<00:52,  4.45it/s][A
Training:  15%|█▌        | 41/269 [00:09<00:51,  4.44it/s][A
Training:  16%|█▋        | 44/269 [00:09<00:40,  5.62it/s][A
Training:  17%|█▋        | 46/269 [00:10<00:48,  4.59it/s][A
Training:  18%|█▊        | 49/269 [00:11<00:50,  4.34it/s][A
Training:  20%|█▉  

Epoch: 70/96 - Loss: 14028.1621 - Accuracy: 0.9188



  0%|          | 0/34 [00:00<?, ?it/s][A
  3%|▎         | 1/34 [00:00<00:28,  1.17it/s][A
 15%|█▍        | 5/34 [00:01<00:06,  4.22it/s][A
 26%|██▋       | 9/34 [00:01<00:04,  5.74it/s][A
 38%|███▊      | 13/34 [00:02<00:03,  6.18it/s][A
 50%|█████     | 17/34 [00:02<00:02,  6.59it/s][A
 62%|██████▏   | 21/34 [00:03<00:01,  7.09it/s][A
 74%|███████▎  | 25/34 [00:04<00:01,  6.92it/s][A
 85%|████████▌ | 29/34 [00:04<00:00,  7.03it/s][A
100%|██████████| 34/34 [00:05<00:00,  6.58it/s][A
Epochs:  73%|███████▎  | 70/96 [2:00:32<27:57, 64.52s/it]

Val Loss: 14866.8193 - Val Accuracy: 0.9352



Training:   0%|          | 0/269 [00:00<?, ?it/s][A
Training:   0%|          | 1/269 [00:00<04:25,  1.01it/s][A
Training:   2%|▏         | 5/269 [00:01<01:11,  3.71it/s][A
Training:   3%|▎         | 9/269 [00:02<00:54,  4.80it/s][A
Training:   5%|▍         | 13/269 [00:02<00:47,  5.35it/s][A
Training:   6%|▋         | 17/269 [00:03<00:41,  6.04it/s][A
Training:   8%|▊         | 21/269 [00:03<00:40,  6.19it/s][A
Training:   9%|▉         | 25/269 [00:04<00:38,  6.34it/s][A
Training:  11%|█         | 29/269 [00:05<00:35,  6.71it/s][A
Training:  12%|█▏        | 33/269 [00:05<00:35,  6.64it/s][A
Training:  14%|█▍        | 37/269 [00:06<00:35,  6.58it/s][A
Training:  15%|█▌        | 41/269 [00:06<00:33,  6.84it/s][A
Training:  17%|█▋        | 45/269 [00:07<00:34,  6.53it/s][A
Training:  18%|█▊        | 49/269 [00:08<00:32,  6.73it/s][A
Training:  20%|█▉        | 53/269 [00:08<00:31,  6.92it/s][A
Training:  21%|██        | 57/269 [00:09<00:32,  6.55it/s][A
Training:  23%|██▎ 

Epoch: 71/96 - Loss: 14456.7852 - Accuracy: 0.9166



  0%|          | 0/34 [00:00<?, ?it/s][A
  3%|▎         | 1/34 [00:00<00:28,  1.17it/s][A
 15%|█▍        | 5/34 [00:01<00:06,  4.29it/s][A
 26%|██▋       | 9/34 [00:01<00:04,  5.51it/s][A
 38%|███▊      | 13/34 [00:02<00:03,  6.00it/s][A
 50%|█████     | 17/34 [00:03<00:02,  6.60it/s][A
 62%|██████▏   | 21/34 [00:03<00:01,  6.88it/s][A
 74%|███████▎  | 25/34 [00:04<00:01,  6.94it/s][A
 85%|████████▌ | 29/34 [00:04<00:00,  7.33it/s][A
100%|██████████| 34/34 [00:05<00:00,  6.60it/s][A
Epochs:  74%|███████▍  | 71/96 [2:01:17<24:31, 58.84s/it]

Val Loss: 14798.3965 - Val Accuracy: 0.9351



Training:   0%|          | 0/269 [00:00<?, ?it/s][A
Training:   0%|          | 1/269 [00:00<03:40,  1.22it/s][A
Training:   2%|▏         | 5/269 [00:01<01:04,  4.12it/s][A
Training:   3%|▎         | 9/269 [00:02<00:51,  5.01it/s][A
Training:   5%|▍         | 13/269 [00:02<00:43,  5.85it/s][A
Training:   6%|▋         | 17/269 [00:03<00:40,  6.24it/s][A
Training:   8%|▊         | 21/269 [00:03<00:39,  6.21it/s][A
Training:   9%|▉         | 25/269 [00:04<00:36,  6.62it/s][A
Training:  11%|█         | 29/269 [00:04<00:35,  6.80it/s][A
Training:  12%|█▏        | 33/269 [00:05<00:35,  6.58it/s][A
Training:  14%|█▍        | 37/269 [00:06<00:33,  6.86it/s][A
Training:  15%|█▌        | 41/269 [00:06<00:32,  6.99it/s][A
Training:  17%|█▋        | 45/269 [00:07<00:33,  6.59it/s][A
Training:  18%|█▊        | 49/269 [00:07<00:32,  6.78it/s][A
Training:  20%|█▉        | 53/269 [00:08<00:31,  6.82it/s][A
Training:  21%|██        | 57/269 [00:09<00:32,  6.56it/s][A
Training:  23%|██▎ 

Epoch: 72/96 - Loss: 14486.9648 - Accuracy: 0.9213



  0%|          | 0/34 [00:00<?, ?it/s][A
  3%|▎         | 1/34 [00:00<00:27,  1.22it/s][A
 15%|█▍        | 5/34 [00:01<00:06,  4.47it/s][A
 26%|██▋       | 9/34 [00:01<00:04,  5.49it/s][A
 38%|███▊      | 13/34 [00:02<00:03,  6.12it/s][A
 50%|█████     | 17/34 [00:02<00:02,  6.83it/s][A
 62%|██████▏   | 21/34 [00:03<00:01,  6.93it/s][A
 74%|███████▎  | 25/34 [00:04<00:01,  7.03it/s][A
 85%|████████▌ | 29/34 [00:04<00:00,  7.38it/s][A
100%|██████████| 34/34 [00:05<00:00,  6.61it/s][A
Epochs:  75%|███████▌  | 72/96 [2:02:03<21:55, 54.81s/it]

Val Loss: 16504.4824 - Val Accuracy: 0.8864



Training:   0%|          | 0/269 [00:00<?, ?it/s][A
Training:   0%|          | 1/269 [00:00<03:31,  1.27it/s][A
Training:   2%|▏         | 5/269 [00:01<01:09,  3.80it/s][A
Training:   3%|▎         | 9/269 [00:02<00:50,  5.11it/s][A
Training:   5%|▍         | 13/269 [00:02<00:44,  5.81it/s][A
Training:   6%|▋         | 17/269 [00:03<00:42,  5.89it/s][A
Training:   8%|▊         | 21/269 [00:03<00:38,  6.42it/s][A
Training:   9%|▉         | 25/269 [00:04<00:37,  6.48it/s][A
Training:  11%|█         | 29/269 [00:04<00:36,  6.54it/s][A
Training:  12%|█▏        | 33/269 [00:05<00:34,  6.82it/s][A
Training:  14%|█▍        | 37/269 [00:06<00:34,  6.70it/s][A
Training:  15%|█▌        | 41/269 [00:06<00:33,  6.74it/s][A
Training:  17%|█▋        | 45/269 [00:07<00:32,  6.88it/s][A
Training:  18%|█▊        | 49/269 [00:07<00:33,  6.56it/s][A
Training:  20%|█▉        | 53/269 [00:08<00:32,  6.73it/s][A
Training:  21%|██        | 57/269 [00:09<00:30,  6.90it/s][A
Training:  23%|██▎ 

Epoch: 73/96 - Loss: 14850.5225 - Accuracy: 0.9190



  0%|          | 0/34 [00:00<?, ?it/s][A
  3%|▎         | 1/34 [00:00<00:29,  1.12it/s][A
 15%|█▍        | 5/34 [00:01<00:07,  4.08it/s][A
 26%|██▋       | 9/34 [00:01<00:04,  5.52it/s][A
 38%|███▊      | 13/34 [00:02<00:03,  5.82it/s][A
 50%|█████     | 17/34 [00:03<00:02,  6.37it/s][A
 62%|██████▏   | 21/34 [00:03<00:01,  6.91it/s][A
 74%|███████▎  | 25/34 [00:04<00:01,  6.98it/s][A
 85%|████████▌ | 29/34 [00:04<00:00,  7.00it/s][A
100%|██████████| 34/34 [00:05<00:00,  6.46it/s][A
Epochs:  76%|███████▌  | 73/96 [2:02:48<19:58, 52.10s/it]

Val Loss: 14673.2773 - Val Accuracy: 0.8638



Training:   0%|          | 0/269 [00:00<?, ?it/s][A
Training:   0%|          | 1/269 [00:00<04:05,  1.09it/s][A
Training:   2%|▏         | 5/269 [00:01<01:07,  3.92it/s][A
Training:   3%|▎         | 9/269 [00:02<00:51,  5.03it/s][A
Training:   5%|▍         | 13/269 [00:02<00:45,  5.60it/s][A
Training:   6%|▋         | 17/269 [00:03<00:40,  6.24it/s][A
Training:   8%|▊         | 21/269 [00:03<00:39,  6.34it/s][A
Training:   9%|▉         | 25/269 [00:04<00:37,  6.51it/s][A
Training:  11%|█         | 29/269 [00:04<00:35,  6.72it/s][A
Training:  12%|█▏        | 33/269 [00:05<00:36,  6.50it/s][A
Training:  14%|█▍        | 37/269 [00:06<00:34,  6.69it/s][A
Training:  15%|█▌        | 41/269 [00:06<00:33,  6.82it/s][A
Training:  17%|█▋        | 45/269 [00:07<00:34,  6.46it/s][A
Training:  18%|█▊        | 49/269 [00:07<00:32,  6.76it/s][A
Training:  20%|█▉        | 53/269 [00:08<00:31,  6.90it/s][A
Training:  21%|██        | 57/269 [00:09<00:32,  6.59it/s][A
Training:  23%|██▎ 

Epoch: 74/96 - Loss: 14137.0635 - Accuracy: 0.9192



  0%|          | 0/34 [00:00<?, ?it/s][A
  3%|▎         | 1/34 [00:00<00:25,  1.31it/s][A
 15%|█▍        | 5/34 [00:01<00:06,  4.60it/s][A
 26%|██▋       | 9/34 [00:01<00:04,  5.45it/s][A
 38%|███▊      | 13/34 [00:02<00:03,  6.37it/s][A
 50%|█████     | 17/34 [00:02<00:02,  6.84it/s][A
 62%|██████▏   | 21/34 [00:03<00:01,  6.74it/s][A
 74%|███████▎  | 25/34 [00:03<00:01,  7.15it/s][A
 85%|████████▌ | 29/34 [00:04<00:00,  7.26it/s][A
100%|██████████| 34/34 [00:05<00:00,  6.59it/s][A
Epochs:  77%|███████▋  | 74/96 [2:03:34<18:23, 50.17s/it]

Val Loss: 16877.4512 - Val Accuracy: 0.9206



Training:   0%|          | 0/269 [00:00<?, ?it/s][A
Training:   0%|          | 1/269 [00:00<03:47,  1.18it/s][A
Training:   2%|▏         | 5/269 [00:01<01:09,  3.78it/s][A
Training:   3%|▎         | 9/269 [00:02<00:50,  5.15it/s][A
Training:   5%|▍         | 13/269 [00:02<00:45,  5.58it/s][A
Training:   6%|▋         | 17/269 [00:03<00:42,  5.88it/s][A
Training:   8%|▊         | 21/269 [00:03<00:38,  6.38it/s][A
Training:   9%|▉         | 25/269 [00:04<00:39,  6.22it/s][A
Training:  11%|█         | 29/269 [00:05<00:36,  6.49it/s][A
Training:  12%|█▏        | 33/269 [00:05<00:35,  6.71it/s][A
Training:  14%|█▍        | 37/269 [00:06<00:36,  6.30it/s][A
Training:  15%|█▌        | 41/269 [00:06<00:34,  6.59it/s][A
Training:  17%|█▋        | 45/269 [00:07<00:33,  6.63it/s][A
Training:  18%|█▊        | 49/269 [00:08<00:33,  6.58it/s][A
Training:  20%|█▉        | 53/269 [00:08<00:31,  6.84it/s][A
Training:  21%|██        | 57/269 [00:09<00:30,  6.92it/s][A
Training:  23%|██▎ 

Epoch: 75/96 - Loss: 14321.7656 - Accuracy: 0.9220



  0%|          | 0/34 [00:00<?, ?it/s][A
  3%|▎         | 1/34 [00:00<00:27,  1.21it/s][A
 15%|█▍        | 5/34 [00:01<00:06,  4.30it/s][A
 26%|██▋       | 9/34 [00:01<00:04,  5.35it/s][A
 38%|███▊      | 13/34 [00:02<00:03,  6.19it/s][A
 50%|█████     | 17/34 [00:02<00:02,  6.92it/s][A
 62%|██████▏   | 21/34 [00:03<00:01,  6.91it/s][A
 74%|███████▎  | 25/34 [00:04<00:01,  7.04it/s][A
 85%|████████▌ | 29/34 [00:04<00:00,  7.35it/s][A
100%|██████████| 34/34 [00:05<00:00,  6.61it/s][A
Epochs:  78%|███████▊  | 75/96 [2:04:20<17:04, 48.79s/it]

Val Loss: 14789.7734 - Val Accuracy: 0.9234



Training:   0%|          | 0/269 [00:00<?, ?it/s][A
Training:   0%|          | 1/269 [00:00<03:32,  1.26it/s][A
Training:   2%|▏         | 5/269 [00:01<01:04,  4.07it/s][A
Training:   3%|▎         | 9/269 [00:02<00:50,  5.16it/s][A
Training:   5%|▍         | 13/269 [00:02<00:42,  6.00it/s][A
Training:   6%|▋         | 17/269 [00:03<00:40,  6.24it/s][A
Training:   8%|▊         | 21/269 [00:03<00:38,  6.45it/s][A
Training:   9%|▉         | 25/269 [00:04<00:36,  6.74it/s][A
Training:  10%|█         | 28/269 [00:04<00:28,  8.47it/s][A
Training:  11%|█         | 30/269 [00:04<00:37,  6.37it/s][A
Training:  12%|█▏        | 33/269 [00:05<00:38,  6.16it/s][A
Training:  14%|█▍        | 37/269 [00:06<00:35,  6.56it/s][A
Training:  15%|█▌        | 41/269 [00:06<00:36,  6.30it/s][A
Training:  17%|█▋        | 45/269 [00:07<00:33,  6.62it/s][A
Training:  18%|█▊        | 49/269 [00:07<00:31,  6.91it/s][A
Training:  20%|█▉        | 53/269 [00:08<00:33,  6.48it/s][A
Training:  21%|██  

Epoch: 76/96 - Loss: 14652.5645 - Accuracy: 0.9207



  0%|          | 0/34 [00:00<?, ?it/s][A
  3%|▎         | 1/34 [00:00<00:27,  1.21it/s][A
 15%|█▍        | 5/34 [00:01<00:06,  4.23it/s][A
 26%|██▋       | 9/34 [00:01<00:04,  5.76it/s][A
 38%|███▊      | 13/34 [00:02<00:03,  6.29it/s][A
 50%|█████     | 17/34 [00:02<00:02,  6.58it/s][A
 62%|██████▏   | 21/34 [00:03<00:01,  7.00it/s][A
 74%|███████▎  | 25/34 [00:04<00:01,  6.67it/s][A
 85%|████████▌ | 29/34 [00:04<00:00,  6.98it/s][A
100%|██████████| 34/34 [00:05<00:00,  6.51it/s][A
Epochs:  79%|███████▉  | 76/96 [2:05:05<15:57, 47.86s/it]

Val Loss: 14389.4941 - Val Accuracy: 0.8970



Training:   0%|          | 0/269 [00:00<?, ?it/s][A
Training:   0%|          | 1/269 [00:00<04:11,  1.06it/s][A
Training:   2%|▏         | 5/269 [00:01<01:07,  3.92it/s][A
Training:   3%|▎         | 9/269 [00:02<00:49,  5.23it/s][A
Training:   4%|▍         | 11/269 [00:02<00:39,  6.58it/s][A
Training:   5%|▍         | 13/269 [00:02<00:47,  5.39it/s][A
Training:   6%|▋         | 17/269 [00:03<00:40,  6.16it/s][A
Training:   8%|▊         | 21/269 [00:03<00:40,  6.15it/s][A
Training:   9%|▉         | 25/269 [00:04<00:38,  6.42it/s][A
Training:  11%|█         | 29/269 [00:04<00:35,  6.68it/s][A
Training:  12%|█▏        | 33/269 [00:05<00:37,  6.35it/s][A
Training:  14%|█▍        | 37/269 [00:06<00:35,  6.62it/s][A
Training:  15%|█▌        | 41/269 [00:06<00:33,  6.81it/s][A
Training:  17%|█▋        | 45/269 [00:07<00:34,  6.45it/s][A
Training:  18%|█▊        | 49/269 [00:08<00:32,  6.76it/s][A
Training:  20%|█▉        | 53/269 [00:08<00:32,  6.67it/s][A
Training:  21%|██  

Epoch: 77/96 - Loss: 15156.0098 - Accuracy: 0.9224



  0%|          | 0/34 [00:00<?, ?it/s][A
  3%|▎         | 1/34 [00:00<00:26,  1.27it/s][A
 15%|█▍        | 5/34 [00:01<00:07,  4.08it/s][A
 26%|██▋       | 9/34 [00:01<00:04,  5.72it/s][A
 38%|███▊      | 13/34 [00:02<00:03,  6.41it/s][A
 50%|█████     | 17/34 [00:02<00:02,  6.48it/s][A
 62%|██████▏   | 21/34 [00:03<00:01,  7.05it/s][A
 74%|███████▎  | 25/34 [00:03<00:01,  7.26it/s][A
 85%|████████▌ | 29/34 [00:04<00:00,  6.99it/s][A
100%|██████████| 34/34 [00:05<00:00,  6.58it/s][A
Epochs:  80%|████████  | 77/96 [2:05:51<14:57, 47.25s/it]

Val Loss: 15307.2852 - Val Accuracy: 0.9283



Training:   0%|          | 0/269 [00:00<?, ?it/s][A
Training:   0%|          | 1/269 [00:00<03:56,  1.13it/s][A
Training:   2%|▏         | 5/269 [00:01<01:06,  3.99it/s][A
Training:   3%|▎         | 9/269 [00:01<00:48,  5.32it/s][A
Training:   5%|▍         | 13/269 [00:02<00:45,  5.66it/s][A
Training:   6%|▋         | 17/269 [00:03<00:40,  6.16it/s][A
Training:   8%|▊         | 21/269 [00:03<00:39,  6.24it/s][A
Training:   9%|▉         | 25/269 [00:04<00:39,  6.25it/s][A
Training:  11%|█         | 29/269 [00:04<00:36,  6.62it/s][A
Training:  12%|█▏        | 33/269 [00:05<00:36,  6.49it/s][A
Training:  14%|█▍        | 37/269 [00:06<00:35,  6.54it/s][A
Training:  15%|█▌        | 41/269 [00:06<00:33,  6.80it/s][A
Training:  17%|█▋        | 45/269 [00:07<00:34,  6.58it/s][A
Training:  18%|█▊        | 49/269 [00:08<00:33,  6.64it/s][A
Training:  20%|█▉        | 53/269 [00:08<00:31,  6.88it/s][A
Training:  21%|██        | 57/269 [00:09<00:31,  6.67it/s][A
Training:  23%|██▎ 

Epoch: 78/96 - Loss: 14716.1074 - Accuracy: 0.9190



  0%|          | 0/34 [00:00<?, ?it/s][A
  3%|▎         | 1/34 [00:00<00:27,  1.21it/s][A
 15%|█▍        | 5/34 [00:01<00:07,  3.99it/s][A
 26%|██▋       | 9/34 [00:01<00:04,  5.58it/s][A
 38%|███▊      | 13/34 [00:02<00:03,  6.46it/s][A
 50%|█████     | 17/34 [00:03<00:02,  6.41it/s][A
 62%|██████▏   | 21/34 [00:03<00:01,  6.92it/s][A
 74%|███████▎  | 25/34 [00:04<00:01,  7.36it/s][A
 85%|████████▌ | 29/34 [00:04<00:00,  7.23it/s][A
100%|██████████| 34/34 [00:05<00:00,  6.54it/s][A
Epochs:  81%|████████▏ | 78/96 [2:06:37<14:01, 46.77s/it]

Val Loss: 16176.6641 - Val Accuracy: 0.9131



Training:   0%|          | 0/269 [00:00<?, ?it/s][A
Training:   0%|          | 1/269 [00:00<03:32,  1.26it/s][A
Training:   2%|▏         | 5/269 [00:01<01:07,  3.89it/s][A
Training:   3%|▎         | 9/269 [00:02<00:50,  5.16it/s][A
Training:   5%|▍         | 13/269 [00:02<00:44,  5.78it/s][A
Training:   6%|▋         | 17/269 [00:03<00:41,  6.00it/s][A
Training:   8%|▊         | 21/269 [00:03<00:38,  6.49it/s][A
Training:   9%|▉         | 25/269 [00:04<00:37,  6.43it/s][A
Training:  11%|█         | 29/269 [00:04<00:37,  6.47it/s][A
Training:  12%|█▏        | 33/269 [00:05<00:34,  6.78it/s][A
Training:  14%|█▍        | 37/269 [00:06<00:34,  6.68it/s][A
Training:  15%|█▌        | 41/269 [00:06<00:34,  6.70it/s][A
Training:  17%|█▋        | 45/269 [00:07<00:32,  6.93it/s][A
Training:  18%|█▊        | 49/269 [00:07<00:32,  6.70it/s][A
Training:  20%|█▉        | 53/269 [00:08<00:31,  6.78it/s][A
Training:  21%|██        | 57/269 [00:09<00:30,  6.93it/s][A
Training:  23%|██▎ 

Epoch: 79/96 - Loss: 13822.0713 - Accuracy: 0.9207



  0%|          | 0/34 [00:00<?, ?it/s][A
  3%|▎         | 1/34 [00:00<00:26,  1.25it/s][A
 15%|█▍        | 5/34 [00:01<00:06,  4.17it/s][A
 26%|██▋       | 9/34 [00:01<00:04,  5.74it/s][A
 38%|███▊      | 13/34 [00:02<00:03,  6.41it/s][A
 50%|█████     | 17/34 [00:02<00:02,  6.57it/s][A
 62%|██████▏   | 21/34 [00:03<00:01,  7.06it/s][A
 74%|███████▎  | 25/34 [00:03<00:01,  7.36it/s][A
 85%|████████▌ | 29/34 [00:04<00:00,  7.11it/s][A
100%|██████████| 34/34 [00:05<00:00,  6.66it/s][A
Epochs:  82%|████████▏ | 79/96 [2:07:22<13:08, 46.41s/it]

Val Loss: 14349.7734 - Val Accuracy: 0.9325



Training:   0%|          | 0/269 [00:00<?, ?it/s][A
Training:   0%|          | 1/269 [00:00<04:06,  1.09it/s][A
Training:   2%|▏         | 5/269 [00:01<01:07,  3.90it/s][A
Training:   3%|▎         | 9/269 [00:02<00:49,  5.23it/s][A
Training:   5%|▍         | 13/269 [00:02<00:46,  5.45it/s][A
Training:   6%|▋         | 17/269 [00:03<00:41,  6.11it/s][A
Training:   8%|▊         | 21/269 [00:03<00:38,  6.41it/s][A
Training:   9%|▉         | 25/269 [00:04<00:39,  6.19it/s][A
Training:  11%|█         | 29/269 [00:05<00:36,  6.55it/s][A
Training:  12%|█▏        | 33/269 [00:05<00:36,  6.53it/s][A
Training:  14%|█▍        | 37/269 [00:06<00:36,  6.39it/s][A
Training:  15%|█▌        | 41/269 [00:06<00:34,  6.59it/s][A
Training:  17%|█▋        | 45/269 [00:07<00:32,  6.84it/s][A
Training:  18%|█▊        | 49/269 [00:08<00:33,  6.63it/s][A
Training:  19%|█▉        | 52/269 [00:08<00:26,  8.18it/s][A
Training:  20%|██        | 54/269 [00:08<00:31,  6.77it/s][A
Training:  21%|██  

Epoch: 80/96 - Loss: 14271.2344 - Accuracy: 0.9202



  0%|          | 0/34 [00:00<?, ?it/s][A
  3%|▎         | 1/34 [00:00<00:25,  1.28it/s][A
 15%|█▍        | 5/34 [00:01<00:06,  4.21it/s][A
 26%|██▋       | 9/34 [00:01<00:04,  5.74it/s][A
 38%|███▊      | 13/34 [00:02<00:03,  6.25it/s][A
 50%|█████     | 17/34 [00:02<00:02,  6.57it/s][A
 62%|██████▏   | 21/34 [00:03<00:01,  7.08it/s][A
 74%|███████▎  | 25/34 [00:04<00:01,  7.04it/s][A
 85%|████████▌ | 29/34 [00:04<00:00,  7.19it/s][A
100%|██████████| 34/34 [00:05<00:00,  6.68it/s][A
Epochs:  83%|████████▎ | 80/96 [2:08:08<12:18, 46.17s/it]

Val Loss: 14906.6318 - Val Accuracy: 0.9261



Training:   0%|          | 0/269 [00:00<?, ?it/s][A
Training:   0%|          | 1/269 [00:00<04:05,  1.09it/s][A
Training:   2%|▏         | 5/269 [00:01<01:05,  4.05it/s][A
Training:   3%|▎         | 9/269 [00:01<00:48,  5.37it/s][A
Training:   5%|▍         | 13/269 [00:02<00:45,  5.67it/s][A
Training:   6%|▋         | 17/269 [00:03<00:40,  6.20it/s][A
Training:   8%|▊         | 21/269 [00:03<00:38,  6.40it/s][A
Training:   9%|▉         | 24/269 [00:03<00:30,  8.14it/s][A
Training:  10%|▉         | 26/269 [00:04<00:38,  6.36it/s][A
Training:  11%|█         | 29/269 [00:04<00:37,  6.37it/s][A
Training:  12%|█▏        | 32/269 [00:05<00:28,  8.38it/s][A
Training:  13%|█▎        | 34/269 [00:05<00:37,  6.28it/s][A
Training:  14%|█▍        | 37/269 [00:06<00:39,  5.89it/s][A
Training:  15%|█▌        | 41/269 [00:06<00:35,  6.40it/s][A
Training:  17%|█▋        | 45/269 [00:07<00:35,  6.33it/s][A
Training:  18%|█▊        | 49/269 [00:07<00:33,  6.51it/s][A
Training:  20%|█▉  

Training:  98%|█████████▊| 263/269 [00:39<00:00,  7.57it/s][A
Training:  99%|█████████▊| 265/269 [00:40<00:00,  6.04it/s][A
Training:  99%|█████████▉| 267/269 [00:40<00:00,  7.85it/s][A
Training: 100%|██████████| 269/269 [00:40<00:00,  7.22it/s][A
                                                           [A

Epoch: 81/96 - Loss: 13968.0078 - Accuracy: 0.9209



  0%|          | 0/34 [00:00<?, ?it/s][A
  3%|▎         | 1/34 [00:00<00:24,  1.36it/s][A
 15%|█▍        | 5/34 [00:01<00:06,  4.51it/s][A
 26%|██▋       | 9/34 [00:01<00:04,  5.68it/s][A
 38%|███▊      | 13/34 [00:02<00:03,  6.36it/s][A
 50%|█████     | 17/34 [00:02<00:02,  6.91it/s][A
 62%|██████▏   | 21/34 [00:03<00:01,  6.72it/s][A
 74%|███████▎  | 25/34 [00:04<00:01,  6.78it/s][A
 85%|████████▌ | 29/34 [00:04<00:00,  7.15it/s][A
100%|██████████| 34/34 [00:05<00:00,  6.61it/s][A
Epochs:  84%|████████▍ | 81/96 [2:08:54<11:30, 46.04s/it]

Val Loss: 15340.9600 - Val Accuracy: 0.9318



Training:   0%|          | 0/269 [00:00<?, ?it/s][A
Training:   0%|          | 1/269 [00:00<03:31,  1.27it/s][A
Training:   2%|▏         | 5/269 [00:01<01:07,  3.93it/s][A
Training:   3%|▎         | 9/269 [00:02<00:52,  4.95it/s][A
Training:   5%|▍         | 13/269 [00:02<00:44,  5.81it/s][A
Training:   6%|▋         | 17/269 [00:03<00:42,  5.89it/s][A
Training:   8%|▊         | 21/269 [00:03<00:39,  6.22it/s][A
Training:   9%|▉         | 25/269 [00:04<00:36,  6.60it/s][A
Training:  11%|█         | 29/269 [00:05<00:36,  6.51it/s][A
Training:  12%|█▏        | 33/269 [00:05<00:35,  6.71it/s][A
Training:  14%|█▍        | 37/269 [00:06<00:33,  6.89it/s][A
Training:  15%|█▌        | 41/269 [00:06<00:34,  6.60it/s][A
Training:  17%|█▋        | 45/269 [00:07<00:32,  6.80it/s][A
Training:  18%|█▊        | 49/269 [00:07<00:32,  6.83it/s][A
Training:  19%|█▉        | 52/269 [00:08<00:26,  8.24it/s][A
Training:  20%|██        | 54/269 [00:08<00:32,  6.59it/s][A
Training:  21%|██  

Epoch: 82/96 - Loss: 14683.0430 - Accuracy: 0.9222



  0%|          | 0/34 [00:00<?, ?it/s][A
  3%|▎         | 1/34 [00:00<00:25,  1.28it/s][A
 15%|█▍        | 5/34 [00:01<00:06,  4.22it/s][A
 26%|██▋       | 9/34 [00:01<00:04,  5.67it/s][A
 38%|███▊      | 13/34 [00:02<00:03,  6.55it/s][A
 44%|████▍     | 15/34 [00:02<00:02,  7.78it/s][A
 50%|█████     | 17/34 [00:02<00:02,  6.12it/s][A
 56%|█████▌    | 19/34 [00:03<00:02,  7.46it/s][A
 62%|██████▏   | 21/34 [00:03<00:01,  6.67it/s][A
 71%|███████   | 24/34 [00:03<00:01,  9.31it/s][A
 76%|███████▋  | 26/34 [00:03<00:01,  7.57it/s][A
 85%|████████▌ | 29/34 [00:04<00:00,  6.55it/s][A
 91%|█████████ | 31/34 [00:04<00:00,  7.78it/s][A
100%|██████████| 34/34 [00:05<00:00,  6.62it/s][A
Epochs:  85%|████████▌ | 82/96 [2:09:39<10:43, 45.94s/it]

Val Loss: 14393.3506 - Val Accuracy: 0.8109



Training:   0%|          | 0/269 [00:00<?, ?it/s][A
Training:   0%|          | 1/269 [00:00<03:56,  1.13it/s][A
Training:   2%|▏         | 5/269 [00:01<01:08,  3.86it/s][A
Training:   3%|▎         | 9/269 [00:02<00:49,  5.27it/s][A
Training:   5%|▍         | 13/269 [00:02<00:44,  5.76it/s][A
Training:   6%|▋         | 17/269 [00:03<00:41,  6.06it/s][A
Training:   8%|▊         | 21/269 [00:03<00:38,  6.47it/s][A
Training:   9%|▉         | 25/269 [00:04<00:38,  6.41it/s][A
Training:  11%|█         | 29/269 [00:05<00:37,  6.46it/s][A
Training:  12%|█▏        | 33/269 [00:05<00:35,  6.71it/s][A
Training:  14%|█▍        | 37/269 [00:06<00:36,  6.40it/s][A
Training:  15%|█▌        | 41/269 [00:06<00:34,  6.64it/s][A
Training:  17%|█▋        | 45/269 [00:07<00:32,  6.80it/s][A
Training:  18%|█▊        | 49/269 [00:08<00:33,  6.62it/s][A
Training:  20%|█▉        | 53/269 [00:08<00:31,  6.80it/s][A
Training:  21%|██        | 57/269 [00:09<00:30,  6.94it/s][A
Training:  23%|██▎ 

Epoch: 83/96 - Loss: 14471.8232 - Accuracy: 0.9210



  0%|          | 0/34 [00:00<?, ?it/s][A
  3%|▎         | 1/34 [00:00<00:27,  1.22it/s][A
 15%|█▍        | 5/34 [00:01<00:06,  4.31it/s][A
 26%|██▋       | 9/34 [00:01<00:04,  5.66it/s][A
 38%|███▊      | 13/34 [00:02<00:03,  6.13it/s][A
 50%|█████     | 17/34 [00:02<00:02,  6.78it/s][A
 62%|██████▏   | 21/34 [00:03<00:01,  7.13it/s][A
 74%|███████▎  | 25/34 [00:04<00:01,  6.89it/s][A
 85%|████████▌ | 29/34 [00:04<00:00,  7.32it/s][A
100%|██████████| 34/34 [00:05<00:00,  6.65it/s][A
Epochs:  86%|████████▋ | 83/96 [2:10:25<09:55, 45.80s/it]

Val Loss: 15290.0908 - Val Accuracy: 0.9273



Training:   0%|          | 0/269 [00:00<?, ?it/s][A
Training:   0%|          | 1/269 [00:00<03:41,  1.21it/s][A
Training:   2%|▏         | 5/269 [00:01<01:05,  4.05it/s][A
Training:   3%|▎         | 9/269 [00:02<00:51,  5.05it/s][A
Training:   5%|▍         | 13/269 [00:02<00:43,  5.83it/s][A
Training:   6%|▋         | 17/269 [00:03<00:39,  6.36it/s][A
Training:   8%|▊         | 21/269 [00:03<00:39,  6.26it/s][A
Training:   9%|▉         | 25/269 [00:04<00:36,  6.63it/s][A
Training:  11%|█         | 29/269 [00:04<00:36,  6.66it/s][A
Training:  12%|█▏        | 33/269 [00:05<00:36,  6.54it/s][A
Training:  14%|█▍        | 37/269 [00:06<00:33,  6.83it/s][A
Training:  15%|█▌        | 41/269 [00:06<00:34,  6.60it/s][A
Training:  17%|█▋        | 45/269 [00:07<00:34,  6.50it/s][A
Training:  18%|█▊        | 49/269 [00:07<00:32,  6.74it/s][A
Training:  20%|█▉        | 53/269 [00:08<00:33,  6.40it/s][A
Training:  21%|██        | 57/269 [00:09<00:32,  6.57it/s][A
Training:  23%|██▎ 

Epoch: 84/96 - Loss: 14421.4551 - Accuracy: 0.9185



  0%|          | 0/34 [00:00<?, ?it/s][A
  3%|▎         | 1/34 [00:00<00:26,  1.25it/s][A
 15%|█▍        | 5/34 [00:01<00:07,  4.09it/s][A
 26%|██▋       | 9/34 [00:01<00:04,  5.60it/s][A
 38%|███▊      | 13/34 [00:02<00:03,  6.15it/s][A
 50%|█████     | 17/34 [00:03<00:02,  6.49it/s][A
 62%|██████▏   | 21/34 [00:03<00:01,  7.02it/s][A
 74%|███████▎  | 25/34 [00:04<00:01,  7.00it/s][A
 85%|████████▌ | 29/34 [00:04<00:00,  7.00it/s][A
100%|██████████| 34/34 [00:05<00:00,  6.57it/s][A
Epochs:  88%|████████▊ | 84/96 [2:11:11<09:09, 45.82s/it]

Val Loss: 16987.2441 - Val Accuracy: 0.9139



Training:   0%|          | 0/269 [00:00<?, ?it/s][A
Training:   0%|          | 1/269 [00:00<04:13,  1.06it/s][A
Training:   2%|▏         | 5/269 [00:01<01:08,  3.87it/s][A
Training:   3%|▎         | 9/269 [00:02<00:52,  4.91it/s][A
Training:   5%|▍         | 13/269 [00:02<00:45,  5.57it/s][A
Training:   6%|▋         | 17/269 [00:03<00:41,  6.09it/s][A
Training:   8%|▊         | 21/269 [00:03<00:39,  6.21it/s][A
Training:   9%|▉         | 25/269 [00:04<00:38,  6.28it/s][A
Training:  11%|█         | 29/269 [00:05<00:36,  6.64it/s][A
Training:  12%|█▏        | 33/269 [00:05<00:36,  6.50it/s][A
Training:  14%|█▍        | 37/269 [00:06<00:34,  6.66it/s][A
Training:  15%|█▌        | 41/269 [00:06<00:32,  6.93it/s][A
Training:  17%|█▋        | 45/269 [00:07<00:33,  6.61it/s][A
Training:  18%|█▊        | 49/269 [00:08<00:32,  6.85it/s][A
Training:  20%|█▉        | 53/269 [00:08<00:30,  7.01it/s][A
Training:  21%|██        | 57/269 [00:09<00:31,  6.72it/s][A
Training:  23%|██▎ 

Epoch: 85/96 - Loss: 14224.3418 - Accuracy: 0.9185



  0%|          | 0/34 [00:00<?, ?it/s][A
  3%|▎         | 1/34 [00:00<00:29,  1.13it/s][A
 15%|█▍        | 5/34 [00:01<00:06,  4.27it/s][A
 26%|██▋       | 9/34 [00:01<00:04,  5.58it/s][A
 38%|███▊      | 13/34 [00:02<00:03,  6.02it/s][A
 50%|█████     | 17/34 [00:02<00:02,  6.69it/s][A
 62%|██████▏   | 21/34 [00:03<00:01,  7.04it/s][A
 74%|███████▎  | 25/34 [00:04<00:01,  6.80it/s][A
 85%|████████▌ | 29/34 [00:04<00:00,  7.20it/s][A
100%|██████████| 34/34 [00:05<00:00,  6.56it/s][A
Epochs:  89%|████████▊ | 85/96 [2:11:56<08:23, 45.75s/it]

Val Loss: 15204.6895 - Val Accuracy: 0.9283



Training:   0%|          | 0/269 [00:00<?, ?it/s][A
Training:   0%|          | 1/269 [00:00<03:44,  1.19it/s][A
Training:   2%|▏         | 5/269 [00:01<01:04,  4.08it/s][A
Training:   3%|▎         | 9/269 [00:02<00:53,  4.89it/s][A
Training:   5%|▍         | 13/269 [00:02<00:44,  5.80it/s][A
Training:   6%|▋         | 17/269 [00:03<00:40,  6.20it/s][A
Training:   8%|▊         | 21/269 [00:03<00:40,  6.14it/s][A
Training:   9%|▉         | 25/269 [00:04<00:37,  6.57it/s][A
Training:  11%|█         | 29/269 [00:04<00:36,  6.53it/s][A
Training:  12%|█▏        | 33/269 [00:05<00:36,  6.51it/s][A
Training:  14%|█▍        | 37/269 [00:06<00:34,  6.78it/s][A
Training:  15%|█▌        | 41/269 [00:06<00:34,  6.56it/s][A
Training:  17%|█▋        | 45/269 [00:07<00:33,  6.62it/s][A
Training:  18%|█▊        | 49/269 [00:07<00:32,  6.75it/s][A
Training:  20%|█▉        | 53/269 [00:08<00:32,  6.61it/s][A
Training:  21%|██        | 56/269 [00:08<00:26,  8.09it/s][A
Training:  22%|██▏ 

Epoch: 86/96 - Loss: 15057.3291 - Accuracy: 0.9202



  0%|          | 0/34 [00:00<?, ?it/s][A
  3%|▎         | 1/34 [00:00<00:29,  1.13it/s][A
 15%|█▍        | 5/34 [00:01<00:06,  4.27it/s][A
 26%|██▋       | 9/34 [00:01<00:04,  5.66it/s][A
 38%|███▊      | 13/34 [00:02<00:03,  6.05it/s][A
 50%|█████     | 17/34 [00:02<00:02,  6.68it/s][A
 62%|██████▏   | 21/34 [00:03<00:01,  7.05it/s][A
 74%|███████▎  | 25/34 [00:04<00:01,  6.87it/s][A
 85%|████████▌ | 29/34 [00:04<00:00,  7.18it/s][A
100%|██████████| 34/34 [00:05<00:00,  6.56it/s][A
Epochs:  90%|████████▉ | 86/96 [2:12:42<07:38, 45.85s/it]

Val Loss: 15261.3086 - Val Accuracy: 0.8078



Training:   0%|          | 0/269 [00:00<?, ?it/s][A
Training:   0%|          | 1/269 [00:00<03:49,  1.17it/s][A
Training:   2%|▏         | 5/269 [00:01<01:07,  3.91it/s][A
Training:   3%|▎         | 9/269 [00:02<00:53,  4.85it/s][A
Training:   5%|▍         | 13/269 [00:02<00:44,  5.75it/s][A
Training:   6%|▋         | 17/269 [00:03<00:41,  6.07it/s][A
Training:   8%|▊         | 21/269 [00:03<00:40,  6.14it/s][A
Training:   9%|▉         | 25/269 [00:04<00:37,  6.50it/s][A
Training:  11%|█         | 29/269 [00:05<00:37,  6.46it/s][A
Training:  12%|█▏        | 33/269 [00:05<00:36,  6.53it/s][A
Training:  14%|█▍        | 37/269 [00:06<00:34,  6.76it/s][A
Training:  15%|█▌        | 41/269 [00:06<00:34,  6.65it/s][A
Training:  17%|█▋        | 45/269 [00:07<00:34,  6.58it/s][A
Training:  18%|█▊        | 49/269 [00:07<00:32,  6.84it/s][A
Training:  20%|█▉        | 53/269 [00:08<00:32,  6.56it/s][A
Training:  21%|██        | 57/269 [00:09<00:31,  6.69it/s][A
Training:  23%|██▎ 

Epoch: 87/96 - Loss: 14251.3799 - Accuracy: 0.9227



  0%|          | 0/34 [00:00<?, ?it/s][A
  3%|▎         | 1/34 [00:00<00:28,  1.16it/s][A
 15%|█▍        | 5/34 [00:01<00:07,  4.11it/s][A
 26%|██▋       | 9/34 [00:01<00:04,  5.59it/s][A
 38%|███▊      | 13/34 [00:02<00:03,  5.88it/s][A
 50%|█████     | 17/34 [00:03<00:02,  6.51it/s][A
 62%|██████▏   | 21/34 [00:03<00:01,  6.99it/s][A
 74%|███████▎  | 25/34 [00:04<00:01,  7.00it/s][A
 85%|████████▌ | 29/34 [00:04<00:00,  7.10it/s][A
100%|██████████| 34/34 [00:05<00:00,  6.51it/s][A
Epochs:  91%|█████████ | 87/96 [2:13:29<06:53, 45.92s/it]

Val Loss: 15311.2031 - Val Accuracy: 0.9212



Training:   0%|          | 0/269 [00:00<?, ?it/s][A
Training:   0%|          | 1/269 [00:00<03:44,  1.19it/s][A
Training:   2%|▏         | 5/269 [00:01<01:03,  4.14it/s][A
Training:   3%|▎         | 9/269 [00:02<00:51,  5.01it/s][A
Training:   5%|▍         | 13/269 [00:02<00:43,  5.84it/s][A
Training:   6%|▋         | 17/269 [00:03<00:39,  6.41it/s][A
Training:   8%|▊         | 21/269 [00:03<00:38,  6.36it/s][A
Training:   9%|▉         | 25/269 [00:04<00:37,  6.46it/s][A
Training:  11%|█         | 29/269 [00:04<00:35,  6.70it/s][A
Training:  12%|█▏        | 33/269 [00:05<00:36,  6.52it/s][A
Training:  14%|█▍        | 37/269 [00:06<00:34,  6.72it/s][A
Training:  15%|█▌        | 41/269 [00:06<00:33,  6.84it/s][A
Training:  17%|█▋        | 45/269 [00:07<00:34,  6.49it/s][A
Training:  18%|█▊        | 49/269 [00:07<00:32,  6.80it/s][A
Training:  20%|█▉        | 53/269 [00:08<00:32,  6.68it/s][A
Training:  21%|██        | 57/269 [00:09<00:32,  6.61it/s][A
Training:  23%|██▎ 

Epoch: 88/96 - Loss: 13934.8799 - Accuracy: 0.9191



  0%|          | 0/34 [00:00<?, ?it/s][A
  3%|▎         | 1/34 [00:00<00:25,  1.31it/s][A
 15%|█▍        | 5/34 [00:01<00:06,  4.41it/s][A
 26%|██▋       | 9/34 [00:01<00:04,  5.38it/s][A
 38%|███▊      | 13/34 [00:02<00:03,  6.37it/s][A
 50%|█████     | 17/34 [00:02<00:02,  6.83it/s][A
 62%|██████▏   | 21/34 [00:03<00:01,  6.72it/s][A
 74%|███████▎  | 25/34 [00:04<00:01,  7.08it/s][A
 85%|████████▌ | 29/34 [00:04<00:00,  7.34it/s][A
100%|██████████| 34/34 [00:05<00:00,  6.61it/s][A
Epochs:  92%|█████████▏| 88/96 [2:14:14<06:06, 45.77s/it]

Val Loss: 16351.2939 - Val Accuracy: 0.9312



Training:   0%|          | 0/269 [00:00<?, ?it/s][A
Training:   0%|          | 1/269 [00:00<03:38,  1.23it/s][A
Training:   2%|▏         | 5/269 [00:01<01:08,  3.87it/s][A
Training:   3%|▎         | 9/269 [00:01<00:49,  5.29it/s][A
Training:   5%|▍         | 13/269 [00:02<00:43,  5.88it/s][A
Training:   6%|▋         | 17/269 [00:03<00:41,  6.02it/s][A
Training:   8%|▊         | 21/269 [00:03<00:38,  6.49it/s][A
Training:   9%|▉         | 25/269 [00:04<00:37,  6.43it/s][A
Training:  11%|█         | 29/269 [00:04<00:37,  6.47it/s][A
Training:  12%|█▏        | 33/269 [00:05<00:34,  6.84it/s][A
Training:  14%|█▍        | 37/269 [00:06<00:34,  6.66it/s][A
Training:  15%|█▌        | 41/269 [00:06<00:33,  6.77it/s][A
Training:  17%|█▋        | 45/269 [00:07<00:31,  7.03it/s][A
Training:  18%|█▊        | 49/269 [00:07<00:32,  6.75it/s][A
Training:  19%|█▉        | 52/269 [00:07<00:26,  8.31it/s][A
Training:  20%|██        | 54/269 [00:08<00:31,  6.83it/s][A
Training:  21%|██  

Epoch: 89/96 - Loss: 14297.2373 - Accuracy: 0.9188



  0%|          | 0/34 [00:00<?, ?it/s][A
  3%|▎         | 1/34 [00:00<00:25,  1.30it/s][A
 15%|█▍        | 5/34 [00:01<00:06,  4.15it/s][A
 26%|██▋       | 9/34 [00:01<00:04,  5.70it/s][A
 38%|███▊      | 13/34 [00:02<00:03,  6.38it/s][A
 47%|████▋     | 16/34 [00:02<00:02,  8.51it/s][A
 53%|█████▎    | 18/34 [00:03<00:02,  6.62it/s][A
 62%|██████▏   | 21/34 [00:03<00:01,  6.75it/s][A
 71%|███████   | 24/34 [00:03<00:01,  8.98it/s][A
 76%|███████▋  | 26/34 [00:04<00:01,  6.82it/s][A
 85%|████████▌ | 29/34 [00:04<00:00,  6.36it/s][A
100%|██████████| 34/34 [00:05<00:00,  6.64it/s][A
Epochs:  93%|█████████▎| 89/96 [2:15:00<05:20, 45.74s/it]

Val Loss: 16223.6270 - Val Accuracy: 0.9328



Training:   0%|          | 0/269 [00:00<?, ?it/s][A
Training:   0%|          | 1/269 [00:00<04:05,  1.09it/s][A
Training:   2%|▏         | 5/269 [00:01<01:06,  3.96it/s][A
Training:   3%|▎         | 9/269 [00:02<00:51,  5.06it/s][A
Training:   5%|▍         | 13/269 [00:02<00:45,  5.60it/s][A
Training:   6%|▋         | 17/269 [00:03<00:41,  6.06it/s][A
Training:   8%|▊         | 21/269 [00:03<00:41,  6.04it/s][A
Training:   9%|▉         | 25/269 [00:04<00:38,  6.40it/s][A
Training:  11%|█         | 29/269 [00:05<00:36,  6.54it/s][A
Training:  12%|█▏        | 33/269 [00:05<00:36,  6.40it/s][A
Training:  14%|█▍        | 37/269 [00:06<00:34,  6.71it/s][A
Training:  15%|█▌        | 41/269 [00:06<00:34,  6.65it/s][A
Training:  17%|█▋        | 45/269 [00:07<00:33,  6.62it/s][A
Training:  18%|█▊        | 49/269 [00:08<00:32,  6.87it/s][A
Training:  20%|█▉        | 53/269 [00:08<00:31,  6.80it/s][A
Training:  21%|██        | 56/269 [00:08<00:25,  8.36it/s][A
Training:  22%|██▏ 

Epoch: 90/96 - Loss: 14174.2656 - Accuracy: 0.9228



  0%|          | 0/34 [00:00<?, ?it/s][A
  3%|▎         | 1/34 [00:00<00:26,  1.26it/s][A
 15%|█▍        | 5/34 [00:01<00:06,  4.19it/s][A
 26%|██▋       | 9/34 [00:01<00:04,  5.66it/s][A
 38%|███▊      | 13/34 [00:02<00:03,  6.23it/s][A
 50%|█████     | 17/34 [00:02<00:02,  6.58it/s][A
 62%|██████▏   | 21/34 [00:03<00:01,  7.12it/s][A
 74%|███████▎  | 25/34 [00:04<00:01,  7.13it/s][A
 85%|████████▌ | 29/34 [00:04<00:00,  7.16it/s][A
 94%|█████████▍| 32/34 [00:04<00:00,  8.83it/s][A
100%|██████████| 34/34 [00:05<00:00,  6.65it/s][A
Epochs:  94%|█████████▍| 90/96 [2:15:45<04:34, 45.73s/it]

Val Loss: 12849.1348 - Val Accuracy: 0.9329



Training:   0%|          | 0/269 [00:00<?, ?it/s][A
Training:   0%|          | 1/269 [00:00<04:19,  1.03it/s][A
Training:   2%|▏         | 5/269 [00:01<01:11,  3.68it/s][A
Training:   3%|▎         | 9/269 [00:02<00:50,  5.15it/s][A
Training:   5%|▍         | 13/269 [00:02<00:46,  5.47it/s][A
Training:   6%|▋         | 17/269 [00:03<00:42,  5.88it/s][A
Training:   8%|▊         | 21/269 [00:03<00:38,  6.37it/s][A
Training:   9%|▉         | 25/269 [00:04<00:38,  6.41it/s][A
Training:  11%|█         | 29/269 [00:05<00:36,  6.57it/s][A
Training:  12%|█▏        | 33/269 [00:05<00:35,  6.72it/s][A
Training:  14%|█▍        | 37/269 [00:06<00:35,  6.55it/s][A
Training:  15%|█▌        | 41/269 [00:06<00:33,  6.81it/s][A
Training:  17%|█▋        | 45/269 [00:07<00:32,  6.85it/s][A
Training:  18%|█▊        | 48/269 [00:07<00:26,  8.34it/s][A
Training:  19%|█▊        | 50/269 [00:08<00:33,  6.60it/s][A
Training:  20%|█▉        | 53/269 [00:08<00:33,  6.38it/s][A
Training:  21%|██  

Epoch: 91/96 - Loss: 14060.3643 - Accuracy: 0.9188



  0%|          | 0/34 [00:00<?, ?it/s][A
  3%|▎         | 1/34 [00:00<00:25,  1.29it/s][A
 15%|█▍        | 5/34 [00:01<00:06,  4.18it/s][A
 26%|██▋       | 9/34 [00:01<00:04,  5.72it/s][A
 38%|███▊      | 13/34 [00:02<00:03,  6.57it/s][A
 47%|████▋     | 16/34 [00:02<00:02,  8.75it/s][A
 53%|█████▎    | 18/34 [00:03<00:02,  6.53it/s][A
 62%|██████▏   | 21/34 [00:03<00:02,  6.47it/s][A
 74%|███████▎  | 25/34 [00:03<00:01,  7.02it/s][A
 85%|████████▌ | 29/34 [00:04<00:00,  6.94it/s][A
 91%|█████████ | 31/34 [00:04<00:00,  7.93it/s][A
100%|██████████| 34/34 [00:05<00:00,  6.61it/s][A
Epochs:  95%|█████████▍| 91/96 [2:16:31<03:48, 45.71s/it]

Val Loss: 14652.2100 - Val Accuracy: 0.9181



Training:   0%|          | 0/269 [00:00<?, ?it/s][A
Training:   0%|          | 1/269 [00:00<04:05,  1.09it/s][A
Training:   2%|▏         | 5/269 [00:01<01:08,  3.85it/s][A
Training:   3%|▎         | 9/269 [00:02<00:50,  5.17it/s][A
Training:   5%|▍         | 13/269 [00:02<00:46,  5.55it/s][A
Training:   6%|▋         | 17/269 [00:03<00:41,  6.10it/s][A
Training:   8%|▊         | 21/269 [00:03<00:39,  6.32it/s][A
Training:   9%|▉         | 25/269 [00:04<00:38,  6.30it/s][A
Training:  11%|█         | 29/269 [00:05<00:36,  6.66it/s][A
Training:  12%|█▏        | 33/269 [00:05<00:36,  6.54it/s][A
Training:  14%|█▍        | 37/269 [00:06<00:35,  6.56it/s][A
Training:  15%|█▌        | 41/269 [00:06<00:33,  6.81it/s][A
Training:  17%|█▋        | 45/269 [00:07<00:33,  6.65it/s][A
Training:  18%|█▊        | 49/269 [00:08<00:33,  6.63it/s][A
Training:  20%|█▉        | 53/269 [00:08<00:31,  6.82it/s][A
Training:  21%|██        | 57/269 [00:09<00:32,  6.47it/s][A
Training:  23%|██▎ 

Epoch: 92/96 - Loss: 14541.7021 - Accuracy: 0.9237



  0%|          | 0/34 [00:00<?, ?it/s][A
  3%|▎         | 1/34 [00:00<00:28,  1.15it/s][A
 15%|█▍        | 5/34 [00:01<00:06,  4.24it/s][A
 26%|██▋       | 9/34 [00:01<00:04,  5.34it/s][A
 38%|███▊      | 13/34 [00:02<00:03,  6.06it/s][A
 50%|█████     | 17/34 [00:03<00:02,  6.70it/s][A
 62%|██████▏   | 21/34 [00:03<00:01,  6.76it/s][A
 74%|███████▎  | 25/34 [00:04<00:01,  6.94it/s][A
 85%|████████▌ | 29/34 [00:04<00:00,  7.26it/s][A
100%|██████████| 34/34 [00:05<00:00,  6.45it/s][A
Epochs:  96%|█████████▌| 92/96 [2:17:17<03:02, 45.73s/it]

Val Loss: 16339.3564 - Val Accuracy: 0.8892



Training:   0%|          | 0/269 [00:00<?, ?it/s][A
Training:   0%|          | 1/269 [00:00<03:41,  1.21it/s][A
Training:   2%|▏         | 5/269 [00:01<01:07,  3.89it/s][A
Training:   3%|▎         | 9/269 [00:02<00:51,  5.09it/s][A
Training:   5%|▍         | 13/269 [00:02<00:43,  5.89it/s][A
Training:   6%|▋         | 17/269 [00:03<00:41,  6.10it/s][A
Training:   8%|▊         | 21/269 [00:03<00:37,  6.58it/s][A
Training:   9%|▉         | 25/269 [00:04<00:35,  6.83it/s][A
Training:  11%|█         | 29/269 [00:04<00:36,  6.58it/s][A
Training:  12%|█▏        | 33/269 [00:05<00:34,  6.75it/s][A
Training:  14%|█▍        | 37/269 [00:06<00:33,  6.83it/s][A
Training:  15%|█▌        | 41/269 [00:06<00:34,  6.55it/s][A
Training:  17%|█▋        | 45/269 [00:07<00:32,  6.85it/s][A
Training:  18%|█▊        | 49/269 [00:07<00:32,  6.85it/s][A
Training:  19%|█▊        | 50/269 [00:07<00:31,  6.99it/s][A
Training:  20%|█▉        | 53/269 [00:08<00:32,  6.59it/s][A
Training:  21%|██  

Epoch: 93/96 - Loss: 14127.7920 - Accuracy: 0.9187



  0%|          | 0/34 [00:00<?, ?it/s][A
  3%|▎         | 1/34 [00:00<00:25,  1.32it/s][A
 15%|█▍        | 5/34 [00:01<00:06,  4.22it/s][A
 26%|██▋       | 9/34 [00:01<00:04,  5.74it/s][A
 38%|███▊      | 13/34 [00:02<00:03,  6.27it/s][A
 50%|█████     | 17/34 [00:02<00:02,  6.61it/s][A
 62%|██████▏   | 21/34 [00:03<00:01,  7.17it/s][A
 74%|███████▎  | 25/34 [00:03<00:01,  7.09it/s][A
 85%|████████▌ | 29/34 [00:04<00:00,  7.14it/s][A
100%|██████████| 34/34 [00:05<00:00,  6.67it/s][A
Epochs:  97%|█████████▋| 93/96 [2:18:02<02:16, 45.62s/it]

Val Loss: 16751.3691 - Val Accuracy: 0.9268



Training:   0%|          | 0/269 [00:00<?, ?it/s][A
Training:   0%|          | 1/269 [00:00<04:11,  1.07it/s][A
Training:   2%|▏         | 5/269 [00:01<01:07,  3.91it/s][A
Training:   3%|▎         | 9/269 [00:02<00:50,  5.12it/s][A
Training:   5%|▍         | 13/269 [00:02<00:45,  5.68it/s][A
Training:   6%|▋         | 17/269 [00:03<00:40,  6.22it/s][A
Training:   8%|▊         | 21/269 [00:03<00:39,  6.34it/s][A
Training:   9%|▉         | 25/269 [00:04<00:37,  6.48it/s][A
Training:  11%|█         | 29/269 [00:04<00:35,  6.80it/s][A
Training:  12%|█▏        | 33/269 [00:05<00:35,  6.60it/s][A
Training:  14%|█▍        | 37/269 [00:06<00:34,  6.66it/s][A
Training:  15%|█▌        | 41/269 [00:06<00:33,  6.87it/s][A
Training:  17%|█▋        | 45/269 [00:07<00:32,  6.81it/s][A
Training:  18%|█▊        | 49/269 [00:07<00:33,  6.62it/s][A
Training:  20%|█▉        | 53/269 [00:08<00:31,  6.94it/s][A
Training:  21%|██        | 57/269 [00:09<00:31,  6.69it/s][A
Training:  23%|██▎ 

Epoch: 94/96 - Loss: 15594.0000 - Accuracy: 0.9192



  0%|          | 0/34 [00:00<?, ?it/s][A
  3%|▎         | 1/34 [00:00<00:27,  1.18it/s][A
 15%|█▍        | 5/34 [00:01<00:06,  4.17it/s][A
 26%|██▋       | 9/34 [00:01<00:04,  5.67it/s][A
 38%|███▊      | 13/34 [00:02<00:03,  6.19it/s][A
 50%|█████     | 17/34 [00:03<00:02,  6.51it/s][A
 62%|██████▏   | 21/34 [00:03<00:01,  6.99it/s][A
 74%|███████▎  | 25/34 [00:04<00:01,  7.05it/s][A
 85%|████████▌ | 29/34 [00:04<00:00,  7.10it/s][A
100%|██████████| 34/34 [00:05<00:00,  6.60it/s][A
Epochs:  98%|█████████▊| 94/96 [2:18:47<01:31, 45.54s/it]

Val Loss: 16884.5781 - Val Accuracy: 0.9239



Training:   0%|          | 0/269 [00:00<?, ?it/s][A
Training:   0%|          | 1/269 [00:00<04:02,  1.11it/s][A
Training:   2%|▏         | 5/269 [00:01<01:05,  4.03it/s][A
Training:   3%|▎         | 9/269 [00:02<00:51,  5.06it/s][A
Training:   5%|▍         | 13/269 [00:02<00:45,  5.64it/s][A
Training:   6%|▋         | 17/269 [00:03<00:40,  6.17it/s][A
Training:   8%|▊         | 21/269 [00:03<00:40,  6.18it/s][A
Training:   9%|▉         | 25/269 [00:04<00:37,  6.49it/s][A
Training:  11%|█         | 29/269 [00:04<00:35,  6.79it/s][A
Training:  12%|█▏        | 33/269 [00:05<00:36,  6.46it/s][A
Training:  14%|█▍        | 37/269 [00:06<00:34,  6.75it/s][A
Training:  15%|█▌        | 41/269 [00:06<00:33,  6.77it/s][A
Training:  17%|█▋        | 45/269 [00:07<00:34,  6.52it/s][A
Training:  18%|█▊        | 49/269 [00:07<00:32,  6.85it/s][A
Training:  20%|█▉        | 53/269 [00:08<00:32,  6.74it/s][A
Training:  21%|██        | 57/269 [00:09<00:31,  6.77it/s][A
Training:  23%|██▎ 

Epoch: 95/96 - Loss: 14744.0381 - Accuracy: 0.9229



  0%|          | 0/34 [00:00<?, ?it/s][A
  3%|▎         | 1/34 [00:00<00:27,  1.20it/s][A
 15%|█▍        | 5/34 [00:01<00:06,  4.33it/s][A
 26%|██▋       | 9/34 [00:01<00:04,  5.48it/s][A
 38%|███▊      | 13/34 [00:02<00:03,  6.33it/s][A
 50%|█████     | 17/34 [00:02<00:02,  6.97it/s][A
 62%|██████▏   | 21/34 [00:03<00:01,  6.72it/s][A
 71%|███████   | 24/34 [00:03<00:01,  8.54it/s][A
 76%|███████▋  | 26/34 [00:04<00:01,  7.19it/s][A
 85%|████████▌ | 29/34 [00:04<00:00,  7.01it/s][A
100%|██████████| 34/34 [00:05<00:00,  6.59it/s][A
Epochs:  99%|█████████▉| 95/96 [2:19:33<00:45, 45.50s/it]

Val Loss: 17925.6035 - Val Accuracy: 0.9025



Training:   0%|          | 0/269 [00:00<?, ?it/s][A
Training:   0%|          | 1/269 [00:00<03:32,  1.26it/s][A
Training:   2%|▏         | 5/269 [00:01<01:09,  3.79it/s][A
Training:   3%|▎         | 9/269 [00:02<00:49,  5.21it/s][A
Training:   5%|▍         | 13/269 [00:02<00:42,  6.00it/s][A
Training:   6%|▋         | 17/269 [00:03<00:41,  6.08it/s][A
Training:   8%|▊         | 21/269 [00:03<00:38,  6.50it/s][A
Training:   9%|▉         | 25/269 [00:04<00:35,  6.79it/s][A
Training:  11%|█         | 29/269 [00:04<00:36,  6.54it/s][A
Training:  12%|█▏        | 33/269 [00:05<00:35,  6.64it/s][A
Training:  14%|█▍        | 37/269 [00:06<00:33,  6.84it/s][A
Training:  15%|█▌        | 41/269 [00:06<00:34,  6.54it/s][A
Training:  17%|█▋        | 45/269 [00:07<00:33,  6.75it/s][A
Training:  18%|█▊        | 49/269 [00:07<00:32,  6.77it/s][A
Training:  20%|█▉        | 53/269 [00:08<00:32,  6.70it/s][A
Training:  21%|██        | 57/269 [00:09<00:30,  6.94it/s][A
Training:  23%|██▎ 

Epoch: 96/96 - Loss: 14990.3213 - Accuracy: 0.9194



  0%|          | 0/34 [00:00<?, ?it/s][A
  3%|▎         | 1/34 [00:00<00:24,  1.36it/s][A
 15%|█▍        | 5/34 [00:01<00:06,  4.42it/s][A
 26%|██▋       | 9/34 [00:01<00:04,  5.57it/s][A
 38%|███▊      | 13/34 [00:02<00:03,  6.50it/s][A
 50%|█████     | 17/34 [00:02<00:02,  6.77it/s][A
 62%|██████▏   | 21/34 [00:03<00:01,  6.88it/s][A
 74%|███████▎  | 25/34 [00:03<00:01,  7.34it/s][A
 85%|████████▌ | 29/34 [00:04<00:00,  7.18it/s][A
100%|██████████| 34/34 [00:05<00:00,  6.68it/s][A
Epochs: 100%|██████████| 96/96 [2:20:18<00:00, 87.69s/it]
[32m[I 2023-12-15 01:30:11,441][0m Trial 1 finished with value: 0.8679981827735901 and parameters: {'learning_rate': 0.09367970229059014, 'weight_decay': 0.00011786297022567189, 'epsilon': 1.3474912558273086e-08, 'batch_size': 52, 'epochs': 96}. Best is trial 0 with value: 0.937110424041748.[0m


Val Loss: 15448.6875 - Val Accuracy: 0.8680
Learning rate: 0.00014936159954798418
Weight decay: 0.000648991059773433
Epsilon: 6.582574844800083e-09
Batch size: 157
Number of epochs: 89


Epochs:   0%|          | 0/89 [00:00<?, ?it/s]
Training:   0%|          | 0/89 [00:00<?, ?it/s][A
Training:   1%|          | 1/89 [00:02<03:06,  2.12s/it][A
Training:   4%|▍         | 4/89 [00:02<00:36,  2.30it/s][A
Training:   7%|▋         | 6/89 [00:03<00:50,  1.63it/s][A
Training:  10%|█         | 9/89 [00:05<00:47,  1.67it/s][A
Training:  13%|█▎        | 12/89 [00:05<00:28,  2.69it/s][A
Training:  16%|█▌        | 14/89 [00:07<00:37,  2.01it/s][A
Training:  19%|█▉        | 17/89 [00:09<00:38,  1.89it/s][A
Training:  22%|██▏       | 20/89 [00:09<00:24,  2.80it/s][A
Training:  25%|██▍       | 22/89 [00:10<00:31,  2.11it/s][A
Training:  28%|██▊       | 25/89 [00:12<00:32,  1.97it/s][A
Training:  31%|███▏      | 28/89 [00:12<00:21,  2.84it/s][A
Training:  34%|███▎      | 30/89 [00:14<00:27,  2.11it/s][A
Training:  37%|███▋      | 33/89 [00:16<00:28,  1.96it/s][A
Training:  40%|████      | 36/89 [00:16<00:18,  2.81it/s][A
Training:  43%|████▎     | 38/89 [00:18<00:24,  2.1

Epoch: 1/89 - Loss: 4.8678 - Accuracy: 0.7381



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:21,  1.91s/it][A
 33%|███▎      | 4/12 [00:02<00:03,  2.53it/s][A
 50%|█████     | 6/12 [00:03<00:03,  1.80it/s][A
100%|██████████| 12/12 [00:05<00:00,  2.28it/s][A
Epochs:   1%|          | 1/89 [00:46<1:07:29, 46.02s/it]

Val Loss: 3.6019 - Val Accuracy: 0.8473



Training:   0%|          | 0/89 [00:00<?, ?it/s][A
Training:   1%|          | 1/89 [00:02<03:07,  2.13s/it][A
Training:   4%|▍         | 4/89 [00:02<00:37,  2.29it/s][A
Training:   7%|▋         | 6/89 [00:03<00:50,  1.63it/s][A
Training:  10%|█         | 9/89 [00:05<00:47,  1.68it/s][A
Training:  13%|█▎        | 12/89 [00:05<00:28,  2.70it/s][A
Training:  16%|█▌        | 14/89 [00:07<00:37,  2.01it/s][A
Training:  19%|█▉        | 17/89 [00:09<00:38,  1.89it/s][A
Training:  22%|██▏       | 20/89 [00:09<00:24,  2.79it/s][A
Training:  25%|██▍       | 22/89 [00:11<00:32,  2.09it/s][A
Training:  28%|██▊       | 25/89 [00:12<00:32,  1.95it/s][A
Training:  31%|███▏      | 28/89 [00:12<00:21,  2.81it/s][A
Training:  34%|███▎      | 30/89 [00:14<00:28,  2.07it/s][A
Training:  37%|███▋      | 33/89 [00:16<00:28,  1.96it/s][A
Training:  40%|████      | 36/89 [00:16<00:18,  2.82it/s][A
Training:  43%|████▎     | 38/89 [00:18<00:23,  2.15it/s][A
Training:  46%|████▌     | 41/89 [00

Epoch: 2/89 - Loss: 2.7377 - Accuracy: 0.8729



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:20,  1.91s/it][A
 33%|███▎      | 4/12 [00:02<00:03,  2.56it/s][A
 50%|█████     | 6/12 [00:03<00:03,  1.79it/s][A
100%|██████████| 12/12 [00:05<00:00,  2.30it/s][A
Epochs:   2%|▏         | 2/89 [01:32<1:06:43, 46.01s/it]

Val Loss: 2.3412 - Val Accuracy: 0.8916



Training:   0%|          | 0/89 [00:00<?, ?it/s][A
Training:   1%|          | 1/89 [00:02<03:04,  2.10s/it][A
Training:   4%|▍         | 4/89 [00:02<00:36,  2.34it/s][A
Training:   7%|▋         | 6/89 [00:03<00:50,  1.64it/s][A
Training:  10%|█         | 9/89 [00:05<00:46,  1.70it/s][A
Training:  13%|█▎        | 12/89 [00:05<00:28,  2.74it/s][A
Training:  16%|█▌        | 14/89 [00:07<00:37,  2.00it/s][A
Training:  19%|█▉        | 17/89 [00:09<00:37,  1.91it/s][A
Training:  22%|██▏       | 20/89 [00:09<00:24,  2.80it/s][A
Training:  25%|██▍       | 22/89 [00:10<00:31,  2.10it/s][A
Training:  28%|██▊       | 25/89 [00:12<00:32,  1.96it/s][A
Training:  31%|███▏      | 28/89 [00:12<00:21,  2.83it/s][A
Training:  34%|███▎      | 30/89 [00:14<00:27,  2.15it/s][A
Training:  37%|███▋      | 33/89 [00:16<00:28,  1.99it/s][A
Training:  40%|████      | 36/89 [00:16<00:18,  2.85it/s][A
Training:  43%|████▎     | 38/89 [00:17<00:23,  2.14it/s][A
Training:  46%|████▌     | 41/89 [00

Epoch: 3/89 - Loss: 2.1403 - Accuracy: 0.9032



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:21,  1.93s/it][A
 33%|███▎      | 4/12 [00:02<00:03,  2.51it/s][A
 50%|█████     | 6/12 [00:03<00:03,  1.78it/s][A
100%|██████████| 12/12 [00:05<00:00,  2.27it/s][A
Epochs:   3%|▎         | 3/89 [02:18<1:05:56, 46.01s/it]

Val Loss: 1.8530 - Val Accuracy: 0.8960



Training:   0%|          | 0/89 [00:00<?, ?it/s][A
Training:   1%|          | 1/89 [00:02<03:06,  2.12s/it][A
Training:   4%|▍         | 4/89 [00:02<00:37,  2.29it/s][A
Training:   7%|▋         | 6/89 [00:03<00:51,  1.61it/s][A
Training:  10%|█         | 9/89 [00:05<00:47,  1.68it/s][A
Training:  13%|█▎        | 12/89 [00:05<00:28,  2.70it/s][A
Training:  16%|█▌        | 14/89 [00:07<00:38,  1.96it/s][A
Training:  19%|█▉        | 17/89 [00:09<00:38,  1.89it/s][A
Training:  20%|██        | 18/89 [00:09<00:33,  2.14it/s][A
Training:  24%|██▎       | 21/89 [00:10<00:33,  2.01it/s][A
Training:  25%|██▍       | 22/89 [00:11<00:29,  2.28it/s][A
Training:  28%|██▊       | 25/89 [00:12<00:30,  2.09it/s][A
Training:  29%|██▉       | 26/89 [00:12<00:26,  2.34it/s][A
Training:  33%|███▎      | 29/89 [00:14<00:27,  2.15it/s][A
Training:  34%|███▎      | 30/89 [00:14<00:24,  2.41it/s][A
Training:  37%|███▋      | 33/89 [00:16<00:25,  2.19it/s][A
Training:  38%|███▊      | 34/89 [00

Epoch: 4/89 - Loss: 1.7433 - Accuracy: 0.9177



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:21,  1.98s/it][A
 33%|███▎      | 4/12 [00:02<00:03,  2.46it/s][A
 50%|█████     | 6/12 [00:03<00:03,  1.79it/s][A
100%|██████████| 12/12 [00:05<00:00,  2.29it/s][A
Epochs:   4%|▍         | 4/89 [03:03<1:05:07, 45.97s/it]

Val Loss: 1.6118 - Val Accuracy: 0.9143



Training:   0%|          | 0/89 [00:00<?, ?it/s][A
Training:   1%|          | 1/89 [00:02<03:07,  2.14s/it][A
Training:   4%|▍         | 4/89 [00:02<00:37,  2.28it/s][A
Training:   7%|▋         | 6/89 [00:03<00:49,  1.66it/s][A
Training:  10%|█         | 9/89 [00:05<00:46,  1.72it/s][A
Training:  12%|█▏        | 11/89 [00:05<00:32,  2.41it/s][A
Training:  15%|█▍        | 13/89 [00:07<00:41,  1.85it/s][A
Training:  17%|█▋        | 15/89 [00:07<00:29,  2.55it/s][A
Training:  19%|█▉        | 17/89 [00:09<00:37,  1.91it/s][A
Training:  21%|██▏       | 19/89 [00:09<00:26,  2.60it/s][A
Training:  24%|██▎       | 21/89 [00:10<00:34,  1.95it/s][A
Training:  27%|██▋       | 24/89 [00:10<00:21,  3.05it/s][A
Training:  29%|██▉       | 26/89 [00:12<00:29,  2.14it/s][A
Training:  33%|███▎      | 29/89 [00:14<00:29,  2.01it/s][A
Training:  34%|███▎      | 30/89 [00:14<00:25,  2.28it/s][A
Training:  37%|███▋      | 33/89 [00:16<00:27,  2.06it/s][A
Training:  40%|████      | 36/89 [00

Epoch: 5/89 - Loss: 1.4905 - Accuracy: 0.9241



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:02<00:22,  2.01s/it][A
 33%|███▎      | 4/12 [00:02<00:03,  2.45it/s][A
 50%|█████     | 6/12 [00:03<00:03,  1.76it/s][A
100%|██████████| 12/12 [00:05<00:00,  2.24it/s][A
Epochs:   6%|▌         | 5/89 [03:50<1:04:25, 46.02s/it]

Val Loss: 1.4625 - Val Accuracy: 0.9228



Training:   0%|          | 0/89 [00:00<?, ?it/s][A
Training:   1%|          | 1/89 [00:02<03:01,  2.07s/it][A
Training:   4%|▍         | 4/89 [00:02<00:36,  2.34it/s][A
Training:   7%|▋         | 6/89 [00:03<00:49,  1.67it/s][A
Training:  10%|█         | 9/89 [00:05<00:47,  1.68it/s][A
Training:  13%|█▎        | 12/89 [00:05<00:28,  2.72it/s][A
Training:  16%|█▌        | 14/89 [00:07<00:37,  2.00it/s][A
Training:  19%|█▉        | 17/89 [00:09<00:37,  1.90it/s][A
Training:  21%|██▏       | 19/89 [00:09<00:28,  2.49it/s][A
Training:  24%|██▎       | 21/89 [00:10<00:34,  1.95it/s][A
Training:  26%|██▌       | 23/89 [00:10<00:25,  2.58it/s][A
Training:  28%|██▊       | 25/89 [00:12<00:32,  1.97it/s][A
Training:  29%|██▉       | 26/89 [00:12<00:27,  2.27it/s][A
Training:  33%|███▎      | 29/89 [00:14<00:29,  2.04it/s][A
Training:  36%|███▌      | 32/89 [00:14<00:18,  3.13it/s][A
Training:  38%|███▊      | 34/89 [00:16<00:25,  2.16it/s][A
Training:  42%|████▏     | 37/89 [00

Epoch: 6/89 - Loss: 1.3403 - Accuracy: 0.9284



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:21,  1.92s/it][A
 33%|███▎      | 4/12 [00:02<00:03,  2.55it/s][A
 50%|█████     | 6/12 [00:03<00:03,  1.79it/s][A
100%|██████████| 12/12 [00:05<00:00,  2.27it/s][A
Epochs:   7%|▋         | 6/89 [04:36<1:03:41, 46.04s/it]

Val Loss: 1.2064 - Val Accuracy: 0.9322



Training:   0%|          | 0/89 [00:00<?, ?it/s][A
Training:   1%|          | 1/89 [00:02<03:00,  2.06s/it][A
Training:   4%|▍         | 4/89 [00:02<00:35,  2.36it/s][A
Training:   7%|▋         | 6/89 [00:03<00:49,  1.66it/s][A
Training:  10%|█         | 9/89 [00:05<00:46,  1.72it/s][A
Training:  12%|█▏        | 11/89 [00:05<00:32,  2.39it/s][A
Training:  15%|█▍        | 13/89 [00:07<00:40,  1.85it/s][A
Training:  16%|█▌        | 14/89 [00:07<00:34,  2.16it/s][A
Training:  19%|█▉        | 17/89 [00:09<00:35,  2.01it/s][A
Training:  20%|██        | 18/89 [00:09<00:30,  2.29it/s][A
Training:  24%|██▎       | 21/89 [00:10<00:32,  2.09it/s][A
Training:  25%|██▍       | 22/89 [00:10<00:28,  2.35it/s][A
Training:  28%|██▊       | 25/89 [00:12<00:30,  2.12it/s][A
Training:  29%|██▉       | 26/89 [00:12<00:26,  2.36it/s][A
Training:  33%|███▎      | 29/89 [00:14<00:28,  2.10it/s][A
Training:  34%|███▎      | 30/89 [00:14<00:24,  2.38it/s][A
Training:  37%|███▋      | 33/89 [00

Epoch: 7/89 - Loss: 1.2539 - Accuracy: 0.9317



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:21,  1.94s/it][A
 33%|███▎      | 4/12 [00:02<00:03,  2.52it/s][A
 50%|█████     | 6/12 [00:03<00:03,  1.80it/s][A
100%|██████████| 12/12 [00:05<00:00,  2.28it/s][A
Epochs:   8%|▊         | 7/89 [05:22<1:03:02, 46.13s/it]

Val Loss: 1.2905 - Val Accuracy: 0.9379



Training:   0%|          | 0/89 [00:00<?, ?it/s][A
Training:   1%|          | 1/89 [00:02<03:05,  2.11s/it][A
Training:   4%|▍         | 4/89 [00:02<00:36,  2.32it/s][A
Training:   7%|▋         | 6/89 [00:03<00:50,  1.65it/s][A
Training:  10%|█         | 9/89 [00:05<00:47,  1.68it/s][A
Training:  13%|█▎        | 12/89 [00:05<00:28,  2.72it/s][A
Training:  16%|█▌        | 14/89 [00:07<00:37,  2.02it/s][A
Training:  19%|█▉        | 17/89 [00:09<00:38,  1.89it/s][A
Training:  22%|██▏       | 20/89 [00:09<00:24,  2.78it/s][A
Training:  25%|██▍       | 22/89 [00:10<00:31,  2.11it/s][A
Training:  28%|██▊       | 25/89 [00:12<00:32,  1.96it/s][A
Training:  31%|███▏      | 28/89 [00:12<00:21,  2.83it/s][A
Training:  34%|███▎      | 30/89 [00:14<00:28,  2.09it/s][A
Training:  37%|███▋      | 33/89 [00:16<00:28,  1.96it/s][A
Training:  40%|████      | 36/89 [00:16<00:18,  2.81it/s][A
Training:  43%|████▎     | 38/89 [00:18<00:23,  2.13it/s][A
Training:  46%|████▌     | 41/89 [00

Epoch: 8/89 - Loss: 1.1123 - Accuracy: 0.9334



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:02<00:22,  2.01s/it][A
 33%|███▎      | 4/12 [00:02<00:03,  2.45it/s][A
 50%|█████     | 6/12 [00:03<00:03,  1.77it/s][A
100%|██████████| 12/12 [00:05<00:00,  2.25it/s][A
Epochs:   9%|▉         | 8/89 [06:08<1:02:20, 46.18s/it]

Val Loss: 1.1885 - Val Accuracy: 0.9166



Training:   0%|          | 0/89 [00:00<?, ?it/s][A
Training:   1%|          | 1/89 [00:02<03:06,  2.11s/it][A
Training:   4%|▍         | 4/89 [00:02<00:36,  2.31it/s][A
Training:   7%|▋         | 6/89 [00:03<00:50,  1.63it/s][A
Training:  10%|█         | 9/89 [00:05<00:48,  1.66it/s][A
Training:  13%|█▎        | 12/89 [00:05<00:28,  2.69it/s][A
Training:  16%|█▌        | 14/89 [00:07<00:38,  1.94it/s][A
Training:  19%|█▉        | 17/89 [00:09<00:38,  1.86it/s][A
Training:  22%|██▏       | 20/89 [00:09<00:25,  2.74it/s][A
Training:  25%|██▍       | 22/89 [00:11<00:32,  2.07it/s][A
Training:  28%|██▊       | 25/89 [00:12<00:32,  1.96it/s][A
Training:  30%|███       | 27/89 [00:12<00:24,  2.51it/s][A
Training:  33%|███▎      | 29/89 [00:14<00:30,  1.96it/s][A
Training:  36%|███▌      | 32/89 [00:14<00:19,  2.92it/s][A
Training:  38%|███▊      | 34/89 [00:16<00:25,  2.12it/s][A
Training:  42%|████▏     | 37/89 [00:18<00:26,  1.93it/s][A
Training:  45%|████▍     | 40/89 [00

Epoch: 9/89 - Loss: 1.0928 - Accuracy: 0.9367



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:21,  1.98s/it][A
 33%|███▎      | 4/12 [00:02<00:03,  2.49it/s][A
 50%|█████     | 6/12 [00:03<00:03,  1.75it/s][A
100%|██████████| 12/12 [00:05<00:00,  2.26it/s][A
Epochs:  10%|█         | 9/89 [06:55<1:01:38, 46.24s/it]

Val Loss: 0.9942 - Val Accuracy: 0.9274



Training:   0%|          | 0/89 [00:00<?, ?it/s][A
Training:   1%|          | 1/89 [00:02<03:05,  2.11s/it][A
Training:   4%|▍         | 4/89 [00:02<00:36,  2.30it/s][A
Training:   7%|▋         | 6/89 [00:03<00:50,  1.64it/s][A
Training:  10%|█         | 9/89 [00:05<00:47,  1.69it/s][A
Training:  13%|█▎        | 12/89 [00:05<00:28,  2.72it/s][A
Training:  16%|█▌        | 14/89 [00:07<00:37,  2.00it/s][A
Training:  19%|█▉        | 17/89 [00:09<00:37,  1.90it/s][A
Training:  22%|██▏       | 20/89 [00:09<00:24,  2.81it/s][A
Training:  25%|██▍       | 22/89 [00:10<00:32,  2.08it/s][A
Training:  28%|██▊       | 25/89 [00:12<00:32,  1.96it/s][A
Training:  31%|███▏      | 28/89 [00:12<00:21,  2.84it/s][A
Training:  34%|███▎      | 30/89 [00:14<00:27,  2.14it/s][A
Training:  37%|███▋      | 33/89 [00:16<00:28,  1.97it/s][A
Training:  40%|████      | 36/89 [00:16<00:18,  2.83it/s][A
Training:  43%|████▎     | 38/89 [00:18<00:24,  2.12it/s][A
Training:  46%|████▌     | 41/89 [00

Epoch: 10/89 - Loss: 0.9925 - Accuracy: 0.9392



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:21,  1.94s/it][A
 33%|███▎      | 4/12 [00:02<00:03,  2.52it/s][A
 50%|█████     | 6/12 [00:03<00:03,  1.79it/s][A
100%|██████████| 12/12 [00:05<00:00,  2.29it/s][A
Epochs:  11%|█         | 10/89 [07:41<1:00:52, 46.24s/it]

Val Loss: 1.0011 - Val Accuracy: 0.9349



Training:   0%|          | 0/89 [00:00<?, ?it/s][A
Training:   1%|          | 1/89 [00:02<02:59,  2.04s/it][A
Training:   4%|▍         | 4/89 [00:02<00:35,  2.37it/s][A
Training:   7%|▋         | 6/89 [00:03<00:50,  1.64it/s][A
Training:  10%|█         | 9/89 [00:05<00:48,  1.66it/s][A
Training:  13%|█▎        | 12/89 [00:05<00:28,  2.68it/s][A
Training:  16%|█▌        | 14/89 [00:07<00:38,  1.96it/s][A
Training:  19%|█▉        | 17/89 [00:09<00:38,  1.87it/s][A
Training:  21%|██▏       | 19/89 [00:09<00:28,  2.45it/s][A
Training:  24%|██▎       | 21/89 [00:10<00:35,  1.92it/s][A
Training:  27%|██▋       | 24/89 [00:11<00:22,  2.91it/s][A
Training:  29%|██▉       | 26/89 [00:12<00:29,  2.11it/s][A
Training:  33%|███▎      | 29/89 [00:14<00:30,  1.95it/s][A
Training:  36%|███▌      | 32/89 [00:14<00:20,  2.82it/s][A
Training:  38%|███▊      | 34/89 [00:16<00:26,  2.11it/s][A
Training:  42%|████▏     | 37/89 [00:18<00:26,  1.97it/s][A
Training:  45%|████▍     | 40/89 [00

Epoch: 11/89 - Loss: 0.9355 - Accuracy: 0.9398



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:21,  1.92s/it][A
 33%|███▎      | 4/12 [00:02<00:03,  2.54it/s][A
 50%|█████     | 6/12 [00:03<00:03,  1.78it/s][A
100%|██████████| 12/12 [00:05<00:00,  2.28it/s][A
Epochs:  12%|█▏        | 11/89 [08:27<1:00:07, 46.25s/it]

Val Loss: 0.9613 - Val Accuracy: 0.9249



Training:   0%|          | 0/89 [00:00<?, ?it/s][A
Training:   1%|          | 1/89 [00:02<03:08,  2.14s/it][A
Training:   3%|▎         | 3/89 [00:02<00:51,  1.68it/s][A
Training:   6%|▌         | 5/89 [00:03<01:00,  1.40it/s][A
Training:   9%|▉         | 8/89 [00:04<00:29,  2.75it/s][A
Training:  11%|█         | 10/89 [00:05<00:41,  1.93it/s][A
Training:  15%|█▍        | 13/89 [00:07<00:40,  1.86it/s][A
Training:  18%|█▊        | 16/89 [00:07<00:25,  2.85it/s][A
Training:  20%|██        | 18/89 [00:09<00:34,  2.06it/s][A
Training:  24%|██▎       | 21/89 [00:10<00:35,  1.93it/s][A
Training:  27%|██▋       | 24/89 [00:11<00:23,  2.82it/s][A
Training:  29%|██▉       | 26/89 [00:12<00:29,  2.10it/s][A
Training:  33%|███▎      | 29/89 [00:14<00:30,  1.98it/s][A
Training:  36%|███▌      | 32/89 [00:14<00:20,  2.84it/s][A
Training:  38%|███▊      | 34/89 [00:16<00:25,  2.15it/s][A
Training:  42%|████▏     | 37/89 [00:17<00:26,  1.99it/s][A
Training:  45%|████▍     | 40/89 [00

Epoch: 12/89 - Loss: 0.8919 - Accuracy: 0.9407



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:02<00:22,  2.01s/it][A
 33%|███▎      | 4/12 [00:02<00:03,  2.44it/s][A
 50%|█████     | 6/12 [00:03<00:03,  1.77it/s][A
100%|██████████| 12/12 [00:05<00:00,  2.24it/s][A
Epochs:  13%|█▎        | 12/89 [09:13<59:22, 46.26s/it]  

Val Loss: 0.9805 - Val Accuracy: 0.9453



Training:   0%|          | 0/89 [00:00<?, ?it/s][A
Training:   1%|          | 1/89 [00:02<03:04,  2.10s/it][A
Training:   4%|▍         | 4/89 [00:02<00:36,  2.32it/s][A
Training:   7%|▋         | 6/89 [00:03<00:50,  1.63it/s][A
Training:  10%|█         | 9/89 [00:05<00:46,  1.70it/s][A
Training:  13%|█▎        | 12/89 [00:05<00:28,  2.73it/s][A
Training:  16%|█▌        | 14/89 [00:07<00:37,  2.00it/s][A
Training:  19%|█▉        | 17/89 [00:09<00:38,  1.87it/s][A
Training:  22%|██▏       | 20/89 [00:09<00:25,  2.76it/s][A
Training:  25%|██▍       | 22/89 [00:10<00:32,  2.09it/s][A
Training:  28%|██▊       | 25/89 [00:12<00:32,  1.94it/s][A
Training:  30%|███       | 27/89 [00:12<00:24,  2.50it/s][A
Training:  33%|███▎      | 29/89 [00:14<00:30,  1.95it/s][A
Training:  35%|███▍      | 31/89 [00:14<00:22,  2.58it/s][A
Training:  37%|███▋      | 33/89 [00:16<00:28,  1.94it/s][A
Training:  40%|████      | 36/89 [00:16<00:17,  2.95it/s][A
Training:  43%|████▎     | 38/89 [00

Epoch: 13/89 - Loss: 0.8571 - Accuracy: 0.9430



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:21,  1.91s/it][A
 33%|███▎      | 4/12 [00:02<00:03,  2.54it/s][A
 50%|█████     | 6/12 [00:03<00:03,  1.77it/s][A
100%|██████████| 12/12 [00:05<00:00,  2.29it/s][A
Epochs:  15%|█▍        | 13/89 [10:00<58:35, 46.26s/it]

Val Loss: 0.8779 - Val Accuracy: 0.9359



Training:   0%|          | 0/89 [00:00<?, ?it/s][A
Training:   1%|          | 1/89 [00:02<03:10,  2.17s/it][A
Training:   4%|▍         | 4/89 [00:02<00:37,  2.26it/s][A
Training:   7%|▋         | 6/89 [00:03<00:51,  1.61it/s][A
Training:  10%|█         | 9/89 [00:05<00:48,  1.65it/s][A
Training:  13%|█▎        | 12/89 [00:05<00:28,  2.66it/s][A
Training:  16%|█▌        | 14/89 [00:07<00:37,  1.98it/s][A
Training:  19%|█▉        | 17/89 [00:09<00:38,  1.89it/s][A
Training:  22%|██▏       | 20/89 [00:09<00:24,  2.79it/s][A
Training:  25%|██▍       | 22/89 [00:11<00:32,  2.09it/s][A
Training:  28%|██▊       | 25/89 [00:12<00:32,  1.95it/s][A
Training:  31%|███▏      | 28/89 [00:12<00:21,  2.81it/s][A
Training:  34%|███▎      | 30/89 [00:14<00:28,  2.09it/s][A
Training:  37%|███▋      | 33/89 [00:16<00:28,  1.96it/s][A
Training:  39%|███▉      | 35/89 [00:16<00:21,  2.50it/s][A
Training:  42%|████▏     | 37/89 [00:18<00:26,  1.96it/s][A
Training:  44%|████▍     | 39/89 [00

Epoch: 14/89 - Loss: 0.8368 - Accuracy: 0.9415



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:20,  1.86s/it][A
 33%|███▎      | 4/12 [00:01<00:03,  2.60it/s][A
 50%|█████     | 6/12 [00:03<00:03,  1.82it/s][A
 75%|███████▌  | 9/12 [00:05<00:01,  1.89it/s][A
100%|██████████| 12/12 [00:05<00:00,  2.29it/s][A
Epochs:  16%|█▌        | 14/89 [10:46<57:49, 46.27s/it]

Val Loss: 0.8232 - Val Accuracy: 0.9349



Training:   0%|          | 0/89 [00:00<?, ?it/s][A
Training:   1%|          | 1/89 [00:02<03:00,  2.05s/it][A
Training:   4%|▍         | 4/89 [00:02<00:36,  2.36it/s][A
Training:   7%|▋         | 6/89 [00:03<00:50,  1.65it/s][A
Training:  10%|█         | 9/89 [00:05<00:47,  1.70it/s][A
Training:  13%|█▎        | 12/89 [00:05<00:28,  2.73it/s][A
Training:  16%|█▌        | 14/89 [00:07<00:37,  2.02it/s][A
Training:  19%|█▉        | 17/89 [00:09<00:38,  1.89it/s][A
Training:  22%|██▏       | 20/89 [00:09<00:24,  2.79it/s][A
Training:  25%|██▍       | 22/89 [00:10<00:32,  2.06it/s][A
Training:  28%|██▊       | 25/89 [00:12<00:32,  1.94it/s][A
Training:  30%|███       | 27/89 [00:12<00:24,  2.50it/s][A
Training:  33%|███▎      | 29/89 [00:14<00:30,  1.96it/s][A
Training:  36%|███▌      | 32/89 [00:14<00:19,  2.93it/s][A
Training:  38%|███▊      | 34/89 [00:16<00:26,  2.09it/s][A
Training:  42%|████▏     | 37/89 [00:17<00:26,  1.99it/s][A
Training:  43%|████▎     | 38/89 [00

Epoch: 15/89 - Loss: 0.8238 - Accuracy: 0.9429



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:21,  1.96s/it][A
 33%|███▎      | 4/12 [00:02<00:03,  2.49it/s][A
 50%|█████     | 6/12 [00:03<00:03,  1.76it/s][A
100%|██████████| 12/12 [00:05<00:00,  2.25it/s][A
Epochs:  17%|█▋        | 15/89 [11:32<57:03, 46.26s/it]

Val Loss: 0.9849 - Val Accuracy: 0.9365



Training:   0%|          | 0/89 [00:00<?, ?it/s][A
Training:   1%|          | 1/89 [00:02<02:59,  2.04s/it][A
Training:   4%|▍         | 4/89 [00:02<00:35,  2.37it/s][A
Training:   7%|▋         | 6/89 [00:03<00:50,  1.65it/s][A
Training:  10%|█         | 9/89 [00:05<00:47,  1.70it/s][A
Training:  11%|█         | 10/89 [00:05<00:39,  2.00it/s][A
Training:  15%|█▍        | 13/89 [00:07<00:39,  1.93it/s][A
Training:  16%|█▌        | 14/89 [00:07<00:33,  2.21it/s][A
Training:  19%|█▉        | 17/89 [00:09<00:35,  2.00it/s][A
Training:  21%|██▏       | 19/89 [00:09<00:25,  2.70it/s][A
Training:  24%|██▎       | 21/89 [00:10<00:34,  1.98it/s][A
Training:  27%|██▋       | 24/89 [00:11<00:21,  3.07it/s][A
Training:  29%|██▉       | 26/89 [00:12<00:29,  2.13it/s][A
Training:  33%|███▎      | 29/89 [00:14<00:30,  1.98it/s][A
Training:  36%|███▌      | 32/89 [00:14<00:19,  2.89it/s][A
Training:  38%|███▊      | 34/89 [00:16<00:25,  2.13it/s][A
Training:  42%|████▏     | 37/89 [00

Epoch: 16/89 - Loss: 0.7893 - Accuracy: 0.9430



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:21,  1.97s/it][A
 33%|███▎      | 4/12 [00:02<00:03,  2.46it/s][A
 50%|█████     | 6/12 [00:03<00:03,  1.77it/s][A
100%|██████████| 12/12 [00:05<00:00,  2.27it/s][A
Epochs:  18%|█▊        | 16/89 [12:18<56:17, 46.27s/it]

Val Loss: 0.7315 - Val Accuracy: 0.9327



Training:   0%|          | 0/89 [00:00<?, ?it/s][A
Training:   1%|          | 1/89 [00:02<03:05,  2.11s/it][A
Training:   4%|▍         | 4/89 [00:02<00:37,  2.29it/s][A
Training:   7%|▋         | 6/89 [00:03<00:50,  1.63it/s][A
Training:  10%|█         | 9/89 [00:05<00:47,  1.68it/s][A
Training:  13%|█▎        | 12/89 [00:05<00:28,  2.71it/s][A
Training:  16%|█▌        | 14/89 [00:07<00:37,  2.00it/s][A
Training:  19%|█▉        | 17/89 [00:09<00:38,  1.89it/s][A
Training:  22%|██▏       | 20/89 [00:09<00:24,  2.78it/s][A
Training:  25%|██▍       | 22/89 [00:11<00:32,  2.06it/s][A
Training:  28%|██▊       | 25/89 [00:12<00:33,  1.93it/s][A
Training:  31%|███▏      | 28/89 [00:12<00:21,  2.78it/s][A
Training:  34%|███▎      | 30/89 [00:14<00:28,  2.09it/s][A
Training:  37%|███▋      | 33/89 [00:16<00:28,  1.96it/s][A
Training:  40%|████      | 36/89 [00:16<00:18,  2.80it/s][A
Training:  43%|████▎     | 38/89 [00:18<00:24,  2.11it/s][A
Training:  46%|████▌     | 41/89 [00

Epoch: 17/89 - Loss: 0.7563 - Accuracy: 0.9413



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:21,  1.93s/it][A
 33%|███▎      | 4/12 [00:02<00:03,  2.54it/s][A
 50%|█████     | 6/12 [00:03<00:03,  1.77it/s][A
100%|██████████| 12/12 [00:05<00:00,  2.27it/s][A
Epochs:  19%|█▉        | 17/89 [13:05<55:29, 46.24s/it]

Val Loss: 0.8600 - Val Accuracy: 0.9453



Training:   0%|          | 0/89 [00:00<?, ?it/s][A
Training:   1%|          | 1/89 [00:02<03:06,  2.12s/it][A
Training:   4%|▍         | 4/89 [00:02<00:37,  2.30it/s][A
Training:   7%|▋         | 6/89 [00:04<00:52,  1.58it/s][A
Training:  10%|█         | 9/89 [00:05<00:48,  1.64it/s][A
Training:  12%|█▏        | 11/89 [00:05<00:33,  2.31it/s][A
Training:  15%|█▍        | 13/89 [00:07<00:42,  1.79it/s][A
Training:  18%|█▊        | 16/89 [00:07<00:25,  2.87it/s][A
Training:  20%|██        | 18/89 [00:09<00:34,  2.03it/s][A
Training:  24%|██▎       | 21/89 [00:11<00:35,  1.90it/s][A
Training:  27%|██▋       | 24/89 [00:11<00:23,  2.79it/s][A
Training:  29%|██▉       | 26/89 [00:12<00:29,  2.12it/s][A
Training:  33%|███▎      | 29/89 [00:14<00:30,  1.96it/s][A
Training:  36%|███▌      | 32/89 [00:14<00:20,  2.83it/s][A
Training:  38%|███▊      | 34/89 [00:16<00:25,  2.12it/s][A
Training:  42%|████▏     | 37/89 [00:18<00:26,  1.97it/s][A
Training:  45%|████▍     | 40/89 [00

Epoch: 18/89 - Loss: 0.7340 - Accuracy: 0.9440



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:02<00:22,  2.00s/it][A
 33%|███▎      | 4/12 [00:02<00:03,  2.44it/s][A
 50%|█████     | 6/12 [00:03<00:03,  1.76it/s][A
100%|██████████| 12/12 [00:05<00:00,  2.24it/s][A
Epochs:  20%|██        | 18/89 [13:51<54:53, 46.38s/it]

Val Loss: 0.8062 - Val Accuracy: 0.9469



Training:   0%|          | 0/89 [00:00<?, ?it/s][A
Training:   1%|          | 1/89 [00:02<03:05,  2.11s/it][A
Training:   4%|▍         | 4/89 [00:02<00:36,  2.32it/s][A
Training:   7%|▋         | 6/89 [00:03<00:50,  1.63it/s][A
Training:  10%|█         | 9/89 [00:05<00:47,  1.68it/s][A
Training:  13%|█▎        | 12/89 [00:05<00:28,  2.72it/s][A
Training:  16%|█▌        | 14/89 [00:07<00:37,  2.00it/s][A
Training:  19%|█▉        | 17/89 [00:09<00:38,  1.89it/s][A
Training:  22%|██▏       | 20/89 [00:09<00:24,  2.79it/s][A
Training:  25%|██▍       | 22/89 [00:11<00:32,  2.07it/s][A
Training:  28%|██▊       | 25/89 [00:12<00:32,  1.94it/s][A
Training:  31%|███▏      | 28/89 [00:12<00:21,  2.81it/s][A
Training:  34%|███▎      | 30/89 [00:14<00:28,  2.06it/s][A
Training:  37%|███▋      | 33/89 [00:16<00:29,  1.93it/s][A
Training:  40%|████      | 36/89 [00:16<00:19,  2.77it/s][A
Training:  43%|████▎     | 38/89 [00:18<00:24,  2.11it/s][A
Training:  46%|████▌     | 41/89 [00

Epoch: 19/89 - Loss: 0.7443 - Accuracy: 0.9444



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:20,  1.87s/it][A
 33%|███▎      | 4/12 [00:01<00:03,  2.60it/s][A
 50%|█████     | 6/12 [00:03<00:03,  1.78it/s][A
100%|██████████| 12/12 [00:05<00:00,  2.28it/s][A
Epochs:  21%|██▏       | 19/89 [14:38<54:07, 46.40s/it]

Val Loss: 0.8132 - Val Accuracy: 0.9365



Training:   0%|          | 0/89 [00:00<?, ?it/s][A
Training:   1%|          | 1/89 [00:02<03:01,  2.06s/it][A
Training:   4%|▍         | 4/89 [00:02<00:36,  2.35it/s][A
Training:   7%|▋         | 6/89 [00:03<00:51,  1.62it/s][A
Training:  10%|█         | 9/89 [00:05<00:47,  1.68it/s][A
Training:  13%|█▎        | 12/89 [00:05<00:28,  2.71it/s][A
Training:  16%|█▌        | 14/89 [00:07<00:37,  1.98it/s][A
Training:  19%|█▉        | 17/89 [00:09<00:38,  1.85it/s][A
Training:  22%|██▏       | 20/89 [00:09<00:25,  2.74it/s][A
Training:  25%|██▍       | 22/89 [00:11<00:32,  2.09it/s][A
Training:  28%|██▊       | 25/89 [00:12<00:32,  1.96it/s][A
Training:  31%|███▏      | 28/89 [00:12<00:21,  2.82it/s][A
Training:  34%|███▎      | 30/89 [00:14<00:28,  2.10it/s][A
Training:  37%|███▋      | 33/89 [00:16<00:28,  1.95it/s][A
Training:  40%|████      | 36/89 [00:16<00:18,  2.80it/s][A
Training:  43%|████▎     | 38/89 [00:18<00:24,  2.12it/s][A
Training:  46%|████▌     | 41/89 [00

Epoch: 20/89 - Loss: 0.7051 - Accuracy: 0.9450



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:21,  1.95s/it][A
 33%|███▎      | 4/12 [00:02<00:03,  2.50it/s][A
 50%|█████     | 6/12 [00:03<00:03,  1.79it/s][A
100%|██████████| 12/12 [00:05<00:00,  2.26it/s][A
Epochs:  22%|██▏       | 20/89 [15:24<53:21, 46.39s/it]

Val Loss: 0.7601 - Val Accuracy: 0.9421



Training:   0%|          | 0/89 [00:00<?, ?it/s][A
Training:   1%|          | 1/89 [00:02<03:08,  2.14s/it][A
Training:   4%|▍         | 4/89 [00:02<00:37,  2.28it/s][A
Training:   7%|▋         | 6/89 [00:03<00:51,  1.61it/s][A
Training:  10%|█         | 9/89 [00:05<00:47,  1.68it/s][A
Training:  13%|█▎        | 12/89 [00:05<00:28,  2.72it/s][A
Training:  16%|█▌        | 14/89 [00:07<00:37,  1.98it/s][A
Training:  19%|█▉        | 17/89 [00:09<00:38,  1.89it/s][A
Training:  22%|██▏       | 20/89 [00:09<00:24,  2.80it/s][A
Training:  25%|██▍       | 22/89 [00:11<00:31,  2.10it/s][A
Training:  28%|██▊       | 25/89 [00:12<00:32,  1.94it/s][A
Training:  31%|███▏      | 28/89 [00:12<00:21,  2.82it/s][A
Training:  34%|███▎      | 30/89 [00:14<00:28,  2.09it/s][A
Training:  37%|███▋      | 33/89 [00:16<00:28,  1.98it/s][A
Training:  40%|████      | 36/89 [00:16<00:18,  2.83it/s][A
Training:  43%|████▎     | 38/89 [00:18<00:24,  2.12it/s][A
Training:  46%|████▌     | 41/89 [00

Epoch: 21/89 - Loss: 0.6829 - Accuracy: 0.9449



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:02<00:22,  2.02s/it][A
 42%|████▏     | 5/12 [00:03<00:04,  1.54it/s][A
 67%|██████▋   | 8/12 [00:03<00:01,  2.79it/s][A
100%|██████████| 12/12 [00:05<00:00,  2.24it/s][A
Epochs:  24%|██▎       | 21/89 [16:11<52:37, 46.43s/it]

Val Loss: 0.6747 - Val Accuracy: 0.9459



Training:   0%|          | 0/89 [00:00<?, ?it/s][A
Training:   1%|          | 1/89 [00:02<03:13,  2.20s/it][A
Training:   3%|▎         | 3/89 [00:02<00:52,  1.64it/s][A
Training:   6%|▌         | 5/89 [00:03<00:59,  1.41it/s][A
Training:   9%|▉         | 8/89 [00:04<00:29,  2.76it/s][A
Training:  11%|█         | 10/89 [00:05<00:41,  1.89it/s][A
Training:  15%|█▍        | 13/89 [00:07<00:41,  1.81it/s][A
Training:  18%|█▊        | 16/89 [00:07<00:26,  2.78it/s][A
Training:  20%|██        | 18/89 [00:09<00:35,  2.02it/s][A
Training:  24%|██▎       | 21/89 [00:11<00:35,  1.90it/s][A
Training:  27%|██▋       | 24/89 [00:11<00:23,  2.78it/s][A
Training:  29%|██▉       | 26/89 [00:12<00:29,  2.11it/s][A
Training:  33%|███▎      | 29/89 [00:14<00:30,  1.95it/s][A
Training:  36%|███▌      | 32/89 [00:14<00:20,  2.81it/s][A
Training:  38%|███▊      | 34/89 [00:16<00:26,  2.11it/s][A
Training:  42%|████▏     | 37/89 [00:18<00:26,  1.96it/s][A
Training:  45%|████▍     | 40/89 [00

Epoch: 22/89 - Loss: 0.6737 - Accuracy: 0.9455



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:21,  1.93s/it][A
 33%|███▎      | 4/12 [00:02<00:03,  2.51it/s][A
 50%|█████     | 6/12 [00:03<00:03,  1.77it/s][A
100%|██████████| 12/12 [00:05<00:00,  2.28it/s][A
Epochs:  25%|██▍       | 22/89 [16:57<51:48, 46.40s/it]

Val Loss: 0.7039 - Val Accuracy: 0.9386



Training:   0%|          | 0/89 [00:00<?, ?it/s][A
Training:   1%|          | 1/89 [00:02<03:04,  2.10s/it][A
Training:   4%|▍         | 4/89 [00:02<00:36,  2.32it/s][A
Training:   7%|▋         | 6/89 [00:03<00:50,  1.65it/s][A
Training:  10%|█         | 9/89 [00:05<00:46,  1.71it/s][A
Training:  13%|█▎        | 12/89 [00:05<00:27,  2.76it/s][A
Training:  16%|█▌        | 14/89 [00:07<00:37,  2.02it/s][A
Training:  19%|█▉        | 17/89 [00:09<00:37,  1.90it/s][A
Training:  22%|██▏       | 20/89 [00:09<00:24,  2.80it/s][A
Training:  25%|██▍       | 22/89 [00:10<00:32,  2.09it/s][A
Training:  28%|██▊       | 25/89 [00:12<00:32,  1.97it/s][A
Training:  31%|███▏      | 28/89 [00:12<00:21,  2.83it/s][A
Training:  34%|███▎      | 30/89 [00:14<00:27,  2.11it/s][A
Training:  37%|███▋      | 33/89 [00:16<00:28,  1.96it/s][A
Training:  40%|████      | 36/89 [00:16<00:18,  2.81it/s][A
Training:  43%|████▎     | 38/89 [00:18<00:24,  2.10it/s][A
Training:  46%|████▌     | 41/89 [00

Epoch: 23/89 - Loss: 0.6527 - Accuracy: 0.9456



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:20,  1.89s/it][A
 33%|███▎      | 4/12 [00:02<00:03,  2.57it/s][A
 50%|█████     | 6/12 [00:03<00:03,  1.81it/s][A
100%|██████████| 12/12 [00:05<00:00,  2.32it/s][A
Epochs:  26%|██▌       | 23/89 [17:43<50:58, 46.35s/it]

Val Loss: 0.6667 - Val Accuracy: 0.9443



Training:   0%|          | 0/89 [00:00<?, ?it/s][A
Training:   1%|          | 1/89 [00:02<03:08,  2.14s/it][A
Training:   4%|▍         | 4/89 [00:02<00:37,  2.30it/s][A
Training:   7%|▋         | 6/89 [00:03<00:51,  1.61it/s][A
Training:  10%|█         | 9/89 [00:05<00:48,  1.65it/s][A
Training:  13%|█▎        | 12/89 [00:05<00:28,  2.67it/s][A
Training:  16%|█▌        | 14/89 [00:07<00:37,  1.99it/s][A
Training:  19%|█▉        | 17/89 [00:09<00:38,  1.86it/s][A
Training:  22%|██▏       | 20/89 [00:09<00:25,  2.76it/s][A
Training:  25%|██▍       | 22/89 [00:11<00:32,  2.06it/s][A
Training:  28%|██▊       | 25/89 [00:12<00:33,  1.93it/s][A
Training:  31%|███▏      | 28/89 [00:12<00:21,  2.80it/s][A
Training:  34%|███▎      | 30/89 [00:14<00:27,  2.12it/s][A
Training:  37%|███▋      | 33/89 [00:16<00:28,  1.98it/s][A
Training:  40%|████      | 36/89 [00:16<00:18,  2.85it/s][A
Training:  43%|████▎     | 38/89 [00:18<00:23,  2.13it/s][A
Training:  46%|████▌     | 41/89 [00

Epoch: 24/89 - Loss: 0.6403 - Accuracy: 0.9453



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:21,  1.98s/it][A
 33%|███▎      | 4/12 [00:02<00:03,  2.46it/s][A
 50%|█████     | 6/12 [00:03<00:03,  1.77it/s][A
100%|██████████| 12/12 [00:05<00:00,  2.28it/s][A
Epochs:  27%|██▋       | 24/89 [18:30<50:17, 46.43s/it]

Val Loss: 0.7517 - Val Accuracy: 0.9390



Training:   0%|          | 0/89 [00:00<?, ?it/s][A
Training:   1%|          | 1/89 [00:02<03:02,  2.07s/it][A
Training:   4%|▍         | 4/89 [00:02<00:36,  2.36it/s][A
Training:   7%|▋         | 6/89 [00:03<00:49,  1.66it/s][A
Training:  10%|█         | 9/89 [00:05<00:47,  1.68it/s][A
Training:  13%|█▎        | 12/89 [00:05<00:28,  2.71it/s][A
Training:  16%|█▌        | 14/89 [00:07<00:37,  2.00it/s][A
Training:  19%|█▉        | 17/89 [00:09<00:37,  1.90it/s][A
Training:  22%|██▏       | 20/89 [00:09<00:24,  2.81it/s][A
Training:  25%|██▍       | 22/89 [00:10<00:32,  2.08it/s][A
Training:  28%|██▊       | 25/89 [00:12<00:32,  1.95it/s][A
Training:  31%|███▏      | 28/89 [00:12<00:21,  2.82it/s][A
Training:  34%|███▎      | 30/89 [00:14<00:27,  2.13it/s][A
Training:  37%|███▋      | 33/89 [00:16<00:28,  1.96it/s][A
Training:  40%|████      | 36/89 [00:16<00:18,  2.79it/s][A
Training:  43%|████▎     | 38/89 [00:18<00:24,  2.09it/s][A
Training:  46%|████▌     | 41/89 [00

Epoch: 25/89 - Loss: 0.6429 - Accuracy: 0.9470



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:21,  1.92s/it][A
 33%|███▎      | 4/12 [00:02<00:03,  2.50it/s][A
 50%|█████     | 6/12 [00:03<00:03,  1.75it/s][A
100%|██████████| 12/12 [00:05<00:00,  2.25it/s][A
Epochs:  28%|██▊       | 25/89 [19:16<49:29, 46.41s/it]

Val Loss: 0.7474 - Val Accuracy: 0.9407



Training:   0%|          | 0/89 [00:00<?, ?it/s][A
Training:   1%|          | 1/89 [00:02<03:06,  2.12s/it][A
Training:   4%|▍         | 4/89 [00:02<00:36,  2.32it/s][A
Training:   7%|▋         | 6/89 [00:03<00:51,  1.62it/s][A
Training:  10%|█         | 9/89 [00:05<00:47,  1.69it/s][A
Training:  13%|█▎        | 12/89 [00:05<00:28,  2.73it/s][A
Training:  16%|█▌        | 14/89 [00:07<00:37,  1.99it/s][A
Training:  19%|█▉        | 17/89 [00:09<00:38,  1.87it/s][A
Training:  22%|██▏       | 20/89 [00:09<00:24,  2.76it/s][A
Training:  25%|██▍       | 22/89 [00:11<00:32,  2.05it/s][A
Training:  28%|██▊       | 25/89 [00:12<00:33,  1.93it/s][A
Training:  31%|███▏      | 28/89 [00:12<00:21,  2.78it/s][A
Training:  34%|███▎      | 30/89 [00:14<00:28,  2.11it/s][A
Training:  37%|███▋      | 33/89 [00:16<00:28,  1.95it/s][A
Training:  40%|████      | 36/89 [00:16<00:18,  2.79it/s][A
Training:  43%|████▎     | 38/89 [00:18<00:24,  2.07it/s][A
Training:  46%|████▌     | 41/89 [00

Epoch: 26/89 - Loss: 0.6227 - Accuracy: 0.9459



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:21,  1.95s/it][A
 33%|███▎      | 4/12 [00:02<00:03,  2.49it/s][A
 50%|█████     | 6/12 [00:03<00:03,  1.80it/s][A
100%|██████████| 12/12 [00:05<00:00,  2.29it/s][A
Epochs:  29%|██▉       | 26/89 [20:03<48:46, 46.45s/it]

Val Loss: 0.7571 - Val Accuracy: 0.9427



Training:   0%|          | 0/89 [00:00<?, ?it/s][A
Training:   1%|          | 1/89 [00:02<03:08,  2.14s/it][A
Training:   4%|▍         | 4/89 [00:02<00:37,  2.28it/s][A
Training:   7%|▋         | 6/89 [00:03<00:51,  1.61it/s][A
Training:  10%|█         | 9/89 [00:05<00:48,  1.64it/s][A
Training:  13%|█▎        | 12/89 [00:05<00:28,  2.67it/s][A
Training:  16%|█▌        | 14/89 [00:07<00:37,  1.99it/s][A
Training:  19%|█▉        | 17/89 [00:09<00:38,  1.88it/s][A
Training:  22%|██▏       | 20/89 [00:09<00:24,  2.78it/s][A
Training:  25%|██▍       | 22/89 [00:11<00:32,  2.06it/s][A
Training:  28%|██▊       | 25/89 [00:12<00:33,  1.94it/s][A
Training:  31%|███▏      | 28/89 [00:12<00:21,  2.79it/s][A
Training:  34%|███▎      | 30/89 [00:14<00:28,  2.10it/s][A
Training:  37%|███▋      | 33/89 [00:16<00:28,  1.94it/s][A
Training:  40%|████      | 36/89 [00:16<00:19,  2.78it/s][A
Training:  43%|████▎     | 38/89 [00:18<00:23,  2.13it/s][A
Training:  46%|████▌     | 41/89 [00

Epoch: 27/89 - Loss: 0.6057 - Accuracy: 0.9473



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:21,  1.98s/it][A
 33%|███▎      | 4/12 [00:02<00:03,  2.49it/s][A
 50%|█████     | 6/12 [00:03<00:03,  1.77it/s][A
100%|██████████| 12/12 [00:05<00:00,  2.25it/s][A
Epochs:  30%|███       | 27/89 [20:49<48:01, 46.47s/it]

Val Loss: 0.6399 - Val Accuracy: 0.9480



Training:   0%|          | 0/89 [00:00<?, ?it/s][A
Training:   1%|          | 1/89 [00:02<02:59,  2.04s/it][A
Training:   4%|▍         | 4/89 [00:02<00:35,  2.36it/s][A
Training:   7%|▋         | 6/89 [00:03<00:50,  1.64it/s][A
Training:  10%|█         | 9/89 [00:05<00:47,  1.70it/s][A
Training:  12%|█▏        | 11/89 [00:05<00:33,  2.36it/s][A
Training:  15%|█▍        | 13/89 [00:07<00:42,  1.80it/s][A
Training:  17%|█▋        | 15/89 [00:07<00:29,  2.48it/s][A
Training:  19%|█▉        | 17/89 [00:09<00:38,  1.88it/s][A
Training:  22%|██▏       | 20/89 [00:09<00:23,  2.95it/s][A
Training:  25%|██▍       | 22/89 [00:11<00:32,  2.09it/s][A
Training:  28%|██▊       | 25/89 [00:12<00:32,  1.99it/s][A
Training:  31%|███▏      | 28/89 [00:12<00:20,  2.91it/s][A
Training:  34%|███▎      | 30/89 [00:14<00:27,  2.14it/s][A
Training:  37%|███▋      | 33/89 [00:16<00:28,  1.98it/s][A
Training:  40%|████      | 36/89 [00:16<00:18,  2.84it/s][A
Training:  43%|████▎     | 38/89 [00

Epoch: 28/89 - Loss: 0.6045 - Accuracy: 0.9470



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:21,  1.94s/it][A
 33%|███▎      | 4/12 [00:02<00:03,  2.50it/s][A
 50%|█████     | 6/12 [00:03<00:03,  1.77it/s][A
100%|██████████| 12/12 [00:05<00:00,  2.24it/s][A
Epochs:  31%|███▏      | 28/89 [21:36<47:12, 46.43s/it]

Val Loss: 0.7165 - Val Accuracy: 0.9363



Training:   0%|          | 0/89 [00:00<?, ?it/s][A
Training:   1%|          | 1/89 [00:02<03:10,  2.16s/it][A
Training:   2%|▏         | 2/89 [00:02<01:23,  1.04it/s][A
Training:   6%|▌         | 5/89 [00:03<00:56,  1.50it/s][A
Training:   7%|▋         | 6/89 [00:04<00:44,  1.89it/s][A
Training:  10%|█         | 9/89 [00:05<00:43,  1.85it/s][A
Training:  11%|█         | 10/89 [00:05<00:36,  2.17it/s][A
Training:  15%|█▍        | 13/89 [00:07<00:37,  2.01it/s][A
Training:  16%|█▌        | 14/89 [00:07<00:32,  2.32it/s][A
Training:  19%|█▉        | 17/89 [00:09<00:34,  2.06it/s][A
Training:  21%|██▏       | 19/89 [00:09<00:25,  2.77it/s][A
Training:  24%|██▎       | 21/89 [00:11<00:33,  2.01it/s][A
Training:  26%|██▌       | 23/89 [00:11<00:24,  2.73it/s][A
Training:  28%|██▊       | 25/89 [00:12<00:32,  1.98it/s][A
Training:  31%|███▏      | 28/89 [00:12<00:19,  3.10it/s][A
Training:  34%|███▎      | 30/89 [00:14<00:27,  2.16it/s][A
Training:  37%|███▋      | 33/89 [00:

Epoch: 29/89 - Loss: 0.6076 - Accuracy: 0.9467



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:21,  1.93s/it][A
 33%|███▎      | 4/12 [00:02<00:03,  2.54it/s][A
 50%|█████     | 6/12 [00:03<00:03,  1.82it/s][A
100%|██████████| 12/12 [00:05<00:00,  2.32it/s][A
Epochs:  33%|███▎      | 29/89 [22:22<46:24, 46.41s/it]

Val Loss: 0.6291 - Val Accuracy: 0.9365



Training:   0%|          | 0/89 [00:00<?, ?it/s][A
Training:   1%|          | 1/89 [00:02<03:05,  2.11s/it][A
Training:   4%|▍         | 4/89 [00:02<00:36,  2.30it/s][A
Training:   7%|▋         | 6/89 [00:03<00:51,  1.63it/s][A
Training:  10%|█         | 9/89 [00:05<00:47,  1.68it/s][A
Training:  13%|█▎        | 12/89 [00:05<00:28,  2.72it/s][A
Training:  16%|█▌        | 14/89 [00:07<00:37,  2.00it/s][A
Training:  19%|█▉        | 17/89 [00:09<00:38,  1.88it/s][A
Training:  22%|██▏       | 20/89 [00:09<00:24,  2.78it/s][A
Training:  25%|██▍       | 22/89 [00:11<00:32,  2.08it/s][A
Training:  28%|██▊       | 25/89 [00:12<00:32,  1.95it/s][A
Training:  31%|███▏      | 28/89 [00:12<00:21,  2.80it/s][A
Training:  34%|███▎      | 30/89 [00:14<00:28,  2.08it/s][A
Training:  37%|███▋      | 33/89 [00:16<00:28,  1.94it/s][A
Training:  40%|████      | 36/89 [00:16<00:19,  2.77it/s][A
Training:  43%|████▎     | 38/89 [00:18<00:24,  2.09it/s][A
Training:  46%|████▌     | 41/89 [00

Epoch: 30/89 - Loss: 0.5919 - Accuracy: 0.9482



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:21,  1.95s/it][A
 33%|███▎      | 4/12 [00:02<00:03,  2.50it/s][A
 50%|█████     | 6/12 [00:03<00:03,  1.78it/s][A
100%|██████████| 12/12 [00:05<00:00,  2.27it/s][A
Epochs:  34%|███▎      | 30/89 [23:08<45:38, 46.42s/it]

Val Loss: 0.6682 - Val Accuracy: 0.9453



Training:   0%|          | 0/89 [00:00<?, ?it/s][A
Training:   1%|          | 1/89 [00:02<03:05,  2.11s/it][A
Training:   4%|▍         | 4/89 [00:02<00:37,  2.30it/s][A
Training:   7%|▋         | 6/89 [00:03<00:49,  1.66it/s][A
Training:  10%|█         | 9/89 [00:05<00:47,  1.69it/s][A
Training:  13%|█▎        | 12/89 [00:05<00:28,  2.72it/s][A
Training:  16%|█▌        | 14/89 [00:07<00:37,  2.02it/s][A
Training:  19%|█▉        | 17/89 [00:09<00:37,  1.90it/s][A
Training:  22%|██▏       | 20/89 [00:09<00:24,  2.80it/s][A
Training:  25%|██▍       | 22/89 [00:10<00:32,  2.09it/s][A
Training:  28%|██▊       | 25/89 [00:12<00:32,  1.97it/s][A
Training:  31%|███▏      | 28/89 [00:12<00:21,  2.83it/s][A
Training:  34%|███▎      | 30/89 [00:14<00:27,  2.11it/s][A
Training:  37%|███▋      | 33/89 [00:16<00:28,  1.97it/s][A
Training:  40%|████      | 36/89 [00:16<00:18,  2.81it/s][A
Training:  43%|████▎     | 38/89 [00:18<00:24,  2.11it/s][A
Training:  46%|████▌     | 41/89 [00

Epoch: 31/89 - Loss: 0.5756 - Accuracy: 0.9477



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:21,  1.98s/it][A
 33%|███▎      | 4/12 [00:02<00:03,  2.47it/s][A
 50%|█████     | 6/12 [00:03<00:03,  1.82it/s][A
100%|██████████| 12/12 [00:05<00:00,  2.28it/s][A
Epochs:  35%|███▍      | 31/89 [23:55<44:50, 46.39s/it]

Val Loss: 0.6481 - Val Accuracy: 0.9375



Training:   0%|          | 0/89 [00:00<?, ?it/s][A
Training:   1%|          | 1/89 [00:02<03:02,  2.08s/it][A
Training:   4%|▍         | 4/89 [00:02<00:36,  2.33it/s][A
Training:   7%|▋         | 6/89 [00:03<00:50,  1.65it/s][A
Training:  10%|█         | 9/89 [00:05<00:47,  1.69it/s][A
Training:  13%|█▎        | 12/89 [00:05<00:28,  2.73it/s][A
Training:  16%|█▌        | 14/89 [00:07<00:37,  2.00it/s][A
Training:  19%|█▉        | 17/89 [00:09<00:37,  1.90it/s][A
Training:  22%|██▏       | 20/89 [00:09<00:24,  2.79it/s][A
Training:  25%|██▍       | 22/89 [00:10<00:32,  2.07it/s][A
Training:  28%|██▊       | 25/89 [00:12<00:32,  1.94it/s][A
Training:  30%|███       | 27/89 [00:12<00:24,  2.50it/s][A
Training:  33%|███▎      | 29/89 [00:14<00:31,  1.93it/s][A
Training:  36%|███▌      | 32/89 [00:14<00:19,  2.89it/s][A
Training:  38%|███▊      | 34/89 [00:16<00:25,  2.13it/s][A
Training:  42%|████▏     | 37/89 [00:18<00:26,  1.95it/s][A
Training:  45%|████▍     | 40/89 [00

Epoch: 32/89 - Loss: 0.5975 - Accuracy: 0.9482



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:21,  1.97s/it][A
 33%|███▎      | 4/12 [00:02<00:03,  2.48it/s][A
 50%|█████     | 6/12 [00:03<00:03,  1.76it/s][A
100%|██████████| 12/12 [00:05<00:00,  2.26it/s][A
Epochs:  36%|███▌      | 32/89 [24:41<44:07, 46.44s/it]

Val Loss: 0.6377 - Val Accuracy: 0.9386



Training:   0%|          | 0/89 [00:00<?, ?it/s][A
Training:   1%|          | 1/89 [00:02<03:04,  2.10s/it][A
Training:   4%|▍         | 4/89 [00:02<00:36,  2.33it/s][A
Training:   7%|▋         | 6/89 [00:03<00:51,  1.62it/s][A
Training:  10%|█         | 9/89 [00:05<00:47,  1.67it/s][A
Training:  13%|█▎        | 12/89 [00:05<00:28,  2.71it/s][A
Training:  16%|█▌        | 14/89 [00:07<00:37,  2.00it/s][A
Training:  19%|█▉        | 17/89 [00:09<00:38,  1.86it/s][A
Training:  22%|██▏       | 20/89 [00:09<00:25,  2.75it/s][A
Training:  25%|██▍       | 22/89 [00:11<00:32,  2.07it/s][A
Training:  28%|██▊       | 25/89 [00:12<00:33,  1.93it/s][A
Training:  31%|███▏      | 28/89 [00:12<00:21,  2.78it/s][A
Training:  34%|███▎      | 30/89 [00:14<00:28,  2.08it/s][A
Training:  37%|███▋      | 33/89 [00:16<00:28,  1.94it/s][A
Training:  39%|███▉      | 35/89 [00:16<00:21,  2.48it/s][A
Training:  42%|████▏     | 37/89 [00:18<00:26,  1.93it/s][A
Training:  45%|████▍     | 40/89 [00

Epoch: 33/89 - Loss: 0.5768 - Accuracy: 0.9488



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:21,  1.95s/it][A
 25%|██▌       | 3/12 [00:02<00:04,  1.82it/s][A
 42%|████▏     | 5/12 [00:03<00:04,  1.51it/s][A
 67%|██████▋   | 8/12 [00:03<00:01,  2.98it/s][A
100%|██████████| 12/12 [00:05<00:00,  2.25it/s][A
Epochs:  37%|███▋      | 33/89 [25:28<43:23, 46.48s/it]

Val Loss: 0.6122 - Val Accuracy: 0.9453



Training:   0%|          | 0/89 [00:00<?, ?it/s][A
Training:   1%|          | 1/89 [00:02<03:07,  2.13s/it][A
Training:   4%|▍         | 4/89 [00:02<00:36,  2.31it/s][A
Training:   7%|▋         | 6/89 [00:03<00:50,  1.63it/s][A
Training:  10%|█         | 9/89 [00:05<00:47,  1.67it/s][A
Training:  13%|█▎        | 12/89 [00:05<00:28,  2.70it/s][A
Training:  16%|█▌        | 14/89 [00:07<00:37,  2.00it/s][A
Training:  19%|█▉        | 17/89 [00:09<00:38,  1.88it/s][A
Training:  22%|██▏       | 20/89 [00:09<00:24,  2.78it/s][A
Training:  25%|██▍       | 22/89 [00:11<00:32,  2.06it/s][A
Training:  28%|██▊       | 25/89 [00:12<00:33,  1.92it/s][A
Training:  31%|███▏      | 28/89 [00:12<00:22,  2.77it/s][A
Training:  34%|███▎      | 30/89 [00:14<00:28,  2.09it/s][A
Training:  37%|███▋      | 33/89 [00:16<00:28,  1.95it/s][A
Training:  40%|████      | 36/89 [00:16<00:18,  2.80it/s][A
Training:  43%|████▎     | 38/89 [00:18<00:24,  2.06it/s][A
Training:  46%|████▌     | 41/89 [00

Epoch: 34/89 - Loss: 0.5560 - Accuracy: 0.9480



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:21,  1.94s/it][A
 33%|███▎      | 4/12 [00:02<00:03,  2.51it/s][A
 50%|█████     | 6/12 [00:03<00:03,  1.73it/s][A
 75%|███████▌  | 9/12 [00:05<00:01,  1.82it/s][A
100%|██████████| 12/12 [00:05<00:00,  2.22it/s][A
Epochs:  38%|███▊      | 34/89 [26:15<42:42, 46.60s/it]

Val Loss: 0.6119 - Val Accuracy: 0.9453



Training:   0%|          | 0/89 [00:00<?, ?it/s][A
Training:   1%|          | 1/89 [00:02<03:06,  2.12s/it][A
Training:   4%|▍         | 4/89 [00:02<00:37,  2.29it/s][A
Training:   7%|▋         | 6/89 [00:03<00:51,  1.61it/s][A
Training:  10%|█         | 9/89 [00:05<00:48,  1.66it/s][A
Training:  13%|█▎        | 12/89 [00:05<00:28,  2.68it/s][A
Training:  16%|█▌        | 14/89 [00:07<00:37,  1.98it/s][A
Training:  19%|█▉        | 17/89 [00:09<00:38,  1.88it/s][A
Training:  22%|██▏       | 20/89 [00:09<00:24,  2.77it/s][A
Training:  25%|██▍       | 22/89 [00:11<00:32,  2.07it/s][A
Training:  28%|██▊       | 25/89 [00:12<00:32,  1.94it/s][A
Training:  31%|███▏      | 28/89 [00:12<00:21,  2.79it/s][A
Training:  34%|███▎      | 30/89 [00:14<00:27,  2.11it/s][A
Training:  37%|███▋      | 33/89 [00:16<00:28,  1.97it/s][A
Training:  40%|████      | 36/89 [00:16<00:18,  2.83it/s][A
Training:  43%|████▎     | 38/89 [00:18<00:23,  2.13it/s][A
Training:  46%|████▌     | 41/89 [00

Epoch: 35/89 - Loss: 0.5481 - Accuracy: 0.9493



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:21,  1.94s/it][A
 33%|███▎      | 4/12 [00:02<00:03,  2.50it/s][A
 50%|█████     | 6/12 [00:03<00:03,  1.76it/s][A
100%|██████████| 12/12 [00:05<00:00,  2.27it/s][A
Epochs:  39%|███▉      | 35/89 [27:01<41:55, 46.57s/it]

Val Loss: 0.6125 - Val Accuracy: 0.9448



Training:   0%|          | 0/89 [00:00<?, ?it/s][A
Training:   1%|          | 1/89 [00:02<03:01,  2.07s/it][A
Training:   3%|▎         | 3/89 [00:02<00:49,  1.74it/s][A
Training:   6%|▌         | 5/89 [00:03<01:00,  1.40it/s][A
Training:   8%|▊         | 7/89 [00:03<00:35,  2.29it/s][A
Training:  10%|█         | 9/89 [00:05<00:47,  1.70it/s][A
Training:  12%|█▏        | 11/89 [00:05<00:31,  2.47it/s][A
Training:  15%|█▍        | 13/89 [00:07<00:41,  1.84it/s][A
Training:  17%|█▋        | 15/89 [00:07<00:28,  2.60it/s][A
Training:  19%|█▉        | 17/89 [00:09<00:37,  1.91it/s][A
Training:  21%|██▏       | 19/89 [00:09<00:26,  2.63it/s][A
Training:  24%|██▎       | 21/89 [00:10<00:34,  1.97it/s][A
Training:  25%|██▍       | 22/89 [00:11<00:29,  2.27it/s][A
Training:  28%|██▊       | 25/89 [00:12<00:30,  2.07it/s][A
Training:  29%|██▉       | 26/89 [00:12<00:26,  2.37it/s][A
Training:  33%|███▎      | 29/89 [00:14<00:28,  2.08it/s][A
Training:  34%|███▎      | 30/89 [00:

Epoch: 36/89 - Loss: 0.5495 - Accuracy: 0.9480



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:21,  1.95s/it][A
 33%|███▎      | 4/12 [00:02<00:03,  2.48it/s][A
 50%|█████     | 6/12 [00:03<00:03,  1.78it/s][A
100%|██████████| 12/12 [00:05<00:00,  2.25it/s][A
Epochs:  40%|████      | 36/89 [27:48<41:04, 46.50s/it]

Val Loss: 0.5958 - Val Accuracy: 0.9396



Training:   0%|          | 0/89 [00:00<?, ?it/s][A
Training:   1%|          | 1/89 [00:02<03:04,  2.10s/it][A
Training:   4%|▍         | 4/89 [00:02<00:36,  2.33it/s][A
Training:   7%|▋         | 6/89 [00:03<00:50,  1.65it/s][A
Training:  10%|█         | 9/89 [00:05<00:47,  1.70it/s][A
Training:  13%|█▎        | 12/89 [00:05<00:28,  2.74it/s][A
Training:  16%|█▌        | 14/89 [00:07<00:37,  1.99it/s][A
Training:  19%|█▉        | 17/89 [00:09<00:38,  1.89it/s][A
Training:  22%|██▏       | 20/89 [00:09<00:24,  2.79it/s][A
Training:  25%|██▍       | 22/89 [00:10<00:32,  2.08it/s][A
Training:  28%|██▊       | 25/89 [00:12<00:32,  1.95it/s][A
Training:  31%|███▏      | 28/89 [00:12<00:21,  2.81it/s][A
Training:  34%|███▎      | 30/89 [00:14<00:28,  2.10it/s][A
Training:  37%|███▋      | 33/89 [00:16<00:28,  1.95it/s][A
Training:  40%|████      | 36/89 [00:16<00:18,  2.79it/s][A
Training:  43%|████▎     | 38/89 [00:18<00:24,  2.08it/s][A
Training:  46%|████▌     | 41/89 [00

Epoch: 37/89 - Loss: 0.5590 - Accuracy: 0.9495



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:21,  1.93s/it][A
 33%|███▎      | 4/12 [00:02<00:03,  2.51it/s][A
 50%|█████     | 6/12 [00:03<00:03,  1.79it/s][A
100%|██████████| 12/12 [00:05<00:00,  2.29it/s][A
Epochs:  42%|████▏     | 37/89 [28:34<40:15, 46.45s/it]

Val Loss: 0.6739 - Val Accuracy: 0.9400



Training:   0%|          | 0/89 [00:00<?, ?it/s][A
Training:   1%|          | 1/89 [00:02<03:08,  2.15s/it][A
Training:   4%|▍         | 4/89 [00:02<00:37,  2.28it/s][A
Training:   7%|▋         | 6/89 [00:03<00:50,  1.64it/s][A
Training:  10%|█         | 9/89 [00:05<00:48,  1.66it/s][A
Training:  13%|█▎        | 12/89 [00:05<00:28,  2.69it/s][A
Training:  16%|█▌        | 14/89 [00:07<00:38,  1.97it/s][A
Training:  19%|█▉        | 17/89 [00:09<00:38,  1.87it/s][A
Training:  22%|██▏       | 20/89 [00:09<00:24,  2.76it/s][A
Training:  25%|██▍       | 22/89 [00:11<00:32,  2.07it/s][A
Training:  28%|██▊       | 25/89 [00:12<00:32,  1.94it/s][A
Training:  31%|███▏      | 28/89 [00:12<00:21,  2.80it/s][A
Training:  34%|███▎      | 30/89 [00:14<00:27,  2.11it/s][A
Training:  37%|███▋      | 33/89 [00:16<00:28,  1.96it/s][A
Training:  40%|████      | 36/89 [00:16<00:18,  2.81it/s][A
Training:  43%|████▎     | 38/89 [00:18<00:24,  2.10it/s][A
Training:  46%|████▌     | 41/89 [00

Epoch: 38/89 - Loss: 0.5302 - Accuracy: 0.9478



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:21,  1.95s/it][A
 33%|███▎      | 4/12 [00:02<00:03,  2.51it/s][A
 50%|█████     | 6/12 [00:03<00:03,  1.78it/s][A
100%|██████████| 12/12 [00:05<00:00,  2.28it/s][A
Epochs:  43%|████▎     | 38/89 [29:20<39:29, 46.46s/it]

Val Loss: 0.5822 - Val Accuracy: 0.9443



Training:   0%|          | 0/89 [00:00<?, ?it/s][A
Training:   1%|          | 1/89 [00:02<03:05,  2.11s/it][A
Training:   4%|▍         | 4/89 [00:02<00:36,  2.32it/s][A
Training:   7%|▋         | 6/89 [00:03<00:50,  1.66it/s][A
Training:  10%|█         | 9/89 [00:05<00:47,  1.69it/s][A
Training:  13%|█▎        | 12/89 [00:05<00:28,  2.73it/s][A
Training:  16%|█▌        | 14/89 [00:07<00:37,  2.00it/s][A
Training:  19%|█▉        | 17/89 [00:09<00:37,  1.90it/s][A
Training:  22%|██▏       | 20/89 [00:09<00:24,  2.81it/s][A
Training:  25%|██▍       | 22/89 [00:10<00:31,  2.11it/s][A
Training:  28%|██▊       | 25/89 [00:12<00:32,  1.99it/s][A
Training:  31%|███▏      | 28/89 [00:12<00:21,  2.86it/s][A
Training:  34%|███▎      | 30/89 [00:14<00:27,  2.13it/s][A
Training:  37%|███▋      | 33/89 [00:16<00:28,  1.96it/s][A
Training:  40%|████      | 36/89 [00:16<00:18,  2.80it/s][A
Training:  43%|████▎     | 38/89 [00:18<00:24,  2.10it/s][A
Training:  46%|████▌     | 41/89 [00

Epoch: 39/89 - Loss: 0.5292 - Accuracy: 0.9470



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:21,  1.95s/it][A
 33%|███▎      | 4/12 [00:02<00:03,  2.50it/s][A
 50%|█████     | 6/12 [00:03<00:03,  1.80it/s][A
100%|██████████| 12/12 [00:05<00:00,  2.28it/s][A
Epochs:  44%|████▍     | 39/89 [30:07<38:38, 46.37s/it]

Val Loss: 0.5425 - Val Accuracy: 0.9443



Training:   0%|          | 0/89 [00:00<?, ?it/s][A
Training:   1%|          | 1/89 [00:02<02:59,  2.04s/it][A
Training:   4%|▍         | 4/89 [00:02<00:35,  2.39it/s][A
Training:   7%|▋         | 6/89 [00:03<00:49,  1.68it/s][A
Training:  10%|█         | 9/89 [00:05<00:46,  1.72it/s][A
Training:  13%|█▎        | 12/89 [00:05<00:27,  2.77it/s][A
Training:  16%|█▌        | 14/89 [00:07<00:37,  1.98it/s][A
Training:  19%|█▉        | 17/89 [00:09<00:38,  1.87it/s][A
Training:  22%|██▏       | 20/89 [00:09<00:25,  2.76it/s][A
Training:  25%|██▍       | 22/89 [00:11<00:33,  2.03it/s][A
Training:  28%|██▊       | 25/89 [00:12<00:33,  1.92it/s][A
Training:  31%|███▏      | 28/89 [00:12<00:22,  2.77it/s][A
Training:  34%|███▎      | 30/89 [00:14<00:27,  2.11it/s][A
Training:  37%|███▋      | 33/89 [00:16<00:28,  1.96it/s][A
Training:  40%|████      | 36/89 [00:16<00:18,  2.79it/s][A
Training:  43%|████▎     | 38/89 [00:18<00:24,  2.12it/s][A
Training:  46%|████▌     | 41/89 [00

Epoch: 40/89 - Loss: 0.5327 - Accuracy: 0.9487



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:21,  1.94s/it][A
 33%|███▎      | 4/12 [00:02<00:03,  2.52it/s][A
 50%|█████     | 6/12 [00:03<00:03,  1.76it/s][A
100%|██████████| 12/12 [00:05<00:00,  2.26it/s][A
Epochs:  45%|████▍     | 40/89 [30:53<37:52, 46.37s/it]

Val Loss: 0.6390 - Val Accuracy: 0.9432



Training:   0%|          | 0/89 [00:00<?, ?it/s][A
Training:   1%|          | 1/89 [00:02<03:04,  2.09s/it][A
Training:   4%|▍         | 4/89 [00:02<00:36,  2.30it/s][A
Training:   7%|▋         | 6/89 [00:03<00:50,  1.63it/s][A
Training:  10%|█         | 9/89 [00:05<00:47,  1.67it/s][A
Training:  13%|█▎        | 12/89 [00:05<00:28,  2.69it/s][A
Training:  16%|█▌        | 14/89 [00:07<00:37,  1.99it/s][A
Training:  19%|█▉        | 17/89 [00:09<00:37,  1.90it/s][A
Training:  21%|██▏       | 19/89 [00:09<00:28,  2.46it/s][A
Training:  24%|██▎       | 21/89 [00:10<00:34,  1.95it/s][A
Training:  26%|██▌       | 23/89 [00:11<00:25,  2.55it/s][A
Training:  28%|██▊       | 25/89 [00:12<00:32,  1.97it/s][A
Training:  30%|███       | 27/89 [00:12<00:24,  2.56it/s][A
Training:  33%|███▎      | 29/89 [00:14<00:30,  1.99it/s][A
Training:  35%|███▍      | 31/89 [00:14<00:21,  2.64it/s][A
Training:  37%|███▋      | 33/89 [00:16<00:28,  2.00it/s][A
Training:  39%|███▉      | 35/89 [00

Epoch: 41/89 - Loss: 0.5230 - Accuracy: 0.9490



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:21,  1.99s/it][A
 42%|████▏     | 5/12 [00:03<00:04,  1.58it/s][A
 67%|██████▋   | 8/12 [00:03<00:01,  2.86it/s][A
100%|██████████| 12/12 [00:05<00:00,  2.27it/s][A
Epochs:  46%|████▌     | 41/89 [31:39<37:02, 46.29s/it]

Val Loss: 0.5692 - Val Accuracy: 0.9448



Training:   0%|          | 0/89 [00:00<?, ?it/s][A
Training:   1%|          | 1/89 [00:02<03:03,  2.09s/it][A
Training:   4%|▍         | 4/89 [00:02<00:36,  2.33it/s][A
Training:   7%|▋         | 6/89 [00:03<00:50,  1.66it/s][A
Training:  10%|█         | 9/89 [00:05<00:47,  1.70it/s][A
Training:  13%|█▎        | 12/89 [00:05<00:28,  2.73it/s][A
Training:  16%|█▌        | 14/89 [00:07<00:37,  2.00it/s][A
Training:  19%|█▉        | 17/89 [00:09<00:38,  1.89it/s][A
Training:  22%|██▏       | 20/89 [00:09<00:24,  2.80it/s][A
Training:  25%|██▍       | 22/89 [00:10<00:32,  2.08it/s][A
Training:  28%|██▊       | 25/89 [00:12<00:32,  1.94it/s][A
Training:  31%|███▏      | 28/89 [00:12<00:21,  2.81it/s][A
Training:  34%|███▎      | 30/89 [00:14<00:27,  2.13it/s][A
Training:  37%|███▋      | 33/89 [00:16<00:28,  1.96it/s][A
Training:  40%|████      | 36/89 [00:16<00:18,  2.79it/s][A
Training:  43%|████▎     | 38/89 [00:18<00:24,  2.12it/s][A
Training:  46%|████▌     | 41/89 [00

Epoch: 42/89 - Loss: 0.5163 - Accuracy: 0.9488



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:21,  1.91s/it][A
 33%|███▎      | 4/12 [00:02<00:03,  2.54it/s][A
 50%|█████     | 6/12 [00:03<00:03,  1.82it/s][A
100%|██████████| 12/12 [00:05<00:00,  2.31it/s][A
Epochs:  47%|████▋     | 42/89 [32:25<36:13, 46.24s/it]

Val Loss: 0.5955 - Val Accuracy: 0.9459



Training:   0%|          | 0/89 [00:00<?, ?it/s][A
Training:   1%|          | 1/89 [00:02<03:03,  2.08s/it][A
Training:   4%|▍         | 4/89 [00:02<00:36,  2.35it/s][A
Training:   7%|▋         | 6/89 [00:03<00:50,  1.66it/s][A
Training:  10%|█         | 9/89 [00:05<00:47,  1.68it/s][A
Training:  13%|█▎        | 12/89 [00:05<00:28,  2.72it/s][A
Training:  16%|█▌        | 14/89 [00:07<00:37,  1.98it/s][A
Training:  19%|█▉        | 17/89 [00:09<00:38,  1.88it/s][A
Training:  22%|██▏       | 20/89 [00:09<00:24,  2.78it/s][A
Training:  25%|██▍       | 22/89 [00:10<00:32,  2.09it/s][A
Training:  28%|██▊       | 25/89 [00:12<00:32,  1.99it/s][A
Training:  31%|███▏      | 28/89 [00:12<00:21,  2.88it/s][A
Training:  34%|███▎      | 30/89 [00:14<00:27,  2.16it/s][A
Training:  37%|███▋      | 33/89 [00:16<00:27,  2.01it/s][A
Training:  40%|████      | 36/89 [00:16<00:18,  2.88it/s][A
Training:  43%|████▎     | 38/89 [00:17<00:23,  2.14it/s][A
Training:  46%|████▌     | 41/89 [00

Epoch: 43/89 - Loss: 0.5084 - Accuracy: 0.9495



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:20,  1.88s/it][A
 33%|███▎      | 4/12 [00:01<00:03,  2.59it/s][A
 50%|█████     | 6/12 [00:03<00:03,  1.78it/s][A
100%|██████████| 12/12 [00:05<00:00,  2.29it/s][A
Epochs:  48%|████▊     | 43/89 [33:11<35:23, 46.17s/it]

Val Loss: 0.5654 - Val Accuracy: 0.9437



Training:   0%|          | 0/89 [00:00<?, ?it/s][A
Training:   1%|          | 1/89 [00:02<02:59,  2.04s/it][A
Training:   4%|▍         | 4/89 [00:02<00:35,  2.38it/s][A
Training:   7%|▋         | 6/89 [00:03<00:49,  1.68it/s][A
Training:  10%|█         | 9/89 [00:05<00:47,  1.69it/s][A
Training:  13%|█▎        | 12/89 [00:05<00:28,  2.74it/s][A
Training:  16%|█▌        | 14/89 [00:07<00:37,  2.00it/s][A
Training:  19%|█▉        | 17/89 [00:09<00:38,  1.89it/s][A
Training:  22%|██▏       | 20/89 [00:09<00:24,  2.79it/s][A
Training:  25%|██▍       | 22/89 [00:10<00:31,  2.10it/s][A
Training:  28%|██▊       | 25/89 [00:12<00:32,  1.94it/s][A
Training:  31%|███▏      | 28/89 [00:12<00:21,  2.80it/s][A
Training:  34%|███▎      | 30/89 [00:14<00:27,  2.11it/s][A
Training:  37%|███▋      | 33/89 [00:16<00:28,  1.99it/s][A
Training:  40%|████      | 36/89 [00:16<00:18,  2.84it/s][A
Training:  43%|████▎     | 38/89 [00:17<00:24,  2.10it/s][A
Training:  46%|████▌     | 41/89 [00

Epoch: 44/89 - Loss: 0.5313 - Accuracy: 0.9488



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:20,  1.86s/it][A
 25%|██▌       | 3/12 [00:01<00:04,  1.90it/s][A
 42%|████▏     | 5/12 [00:03<00:04,  1.56it/s][A
 50%|█████     | 6/12 [00:03<00:03,  1.95it/s][A
 75%|███████▌  | 9/12 [00:05<00:01,  2.05it/s][A
100%|██████████| 12/12 [00:05<00:00,  2.25it/s][A
Epochs:  49%|████▉     | 44/89 [33:57<34:35, 46.13s/it]

Val Loss: 0.5586 - Val Accuracy: 0.9432



Training:   0%|          | 0/89 [00:00<?, ?it/s][A
Training:   1%|          | 1/89 [00:02<03:00,  2.05s/it][A
Training:   4%|▍         | 4/89 [00:02<00:36,  2.36it/s][A
Training:   7%|▋         | 6/89 [00:03<00:49,  1.66it/s][A
Training:  10%|█         | 9/89 [00:05<00:47,  1.70it/s][A
Training:  13%|█▎        | 12/89 [00:05<00:27,  2.75it/s][A
Training:  16%|█▌        | 14/89 [00:07<00:37,  1.99it/s][A
Training:  19%|█▉        | 17/89 [00:09<00:38,  1.88it/s][A
Training:  22%|██▏       | 20/89 [00:09<00:24,  2.78it/s][A
Training:  25%|██▍       | 22/89 [00:10<00:32,  2.08it/s][A
Training:  28%|██▊       | 25/89 [00:12<00:32,  1.94it/s][A
Training:  31%|███▏      | 28/89 [00:12<00:21,  2.80it/s][A
Training:  34%|███▎      | 30/89 [00:14<00:27,  2.11it/s][A
Training:  37%|███▋      | 33/89 [00:16<00:28,  1.96it/s][A
Training:  40%|████      | 36/89 [00:16<00:18,  2.82it/s][A
Training:  43%|████▎     | 38/89 [00:18<00:24,  2.11it/s][A
Training:  46%|████▌     | 41/89 [00

Epoch: 45/89 - Loss: 0.5102 - Accuracy: 0.9481



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:21,  1.95s/it][A
 33%|███▎      | 4/12 [00:02<00:03,  2.49it/s][A
 50%|█████     | 6/12 [00:03<00:03,  1.80it/s][A
100%|██████████| 12/12 [00:05<00:00,  2.30it/s][A
Epochs:  51%|█████     | 45/89 [34:43<33:49, 46.13s/it]

Val Loss: 0.5706 - Val Accuracy: 0.9432



Training:   0%|          | 0/89 [00:00<?, ?it/s][A
Training:   1%|          | 1/89 [00:02<03:10,  2.16s/it][A
Training:   4%|▍         | 4/89 [00:02<00:37,  2.27it/s][A
Training:   7%|▋         | 6/89 [00:03<00:50,  1.64it/s][A
Training:  10%|█         | 9/89 [00:05<00:47,  1.70it/s][A
Training:  13%|█▎        | 12/89 [00:05<00:28,  2.75it/s][A
Training:  16%|█▌        | 14/89 [00:07<00:37,  2.01it/s][A
Training:  19%|█▉        | 17/89 [00:09<00:37,  1.91it/s][A
Training:  22%|██▏       | 20/89 [00:09<00:24,  2.82it/s][A
Training:  25%|██▍       | 22/89 [00:10<00:31,  2.11it/s][A
Training:  28%|██▊       | 25/89 [00:12<00:32,  1.95it/s][A
Training:  31%|███▏      | 28/89 [00:12<00:21,  2.82it/s][A
Training:  34%|███▎      | 30/89 [00:14<00:27,  2.12it/s][A
Training:  37%|███▋      | 33/89 [00:16<00:28,  1.98it/s][A
Training:  40%|████      | 36/89 [00:16<00:18,  2.84it/s][A
Training:  43%|████▎     | 38/89 [00:17<00:23,  2.14it/s][A
Training:  46%|████▌     | 41/89 [00

Epoch: 46/89 - Loss: 0.5140 - Accuracy: 0.9459



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:21,  1.99s/it][A
 33%|███▎      | 4/12 [00:02<00:03,  2.47it/s][A
 50%|█████     | 6/12 [00:03<00:03,  1.81it/s][A
 75%|███████▌  | 9/12 [00:05<00:01,  1.92it/s][A
100%|██████████| 12/12 [00:05<00:00,  2.29it/s][A
Epochs:  52%|█████▏    | 46/89 [35:29<33:00, 46.05s/it]

Val Loss: 0.6443 - Val Accuracy: 0.9370



Training:   0%|          | 0/89 [00:00<?, ?it/s][A
Training:   1%|          | 1/89 [00:02<02:59,  2.03s/it][A
Training:   4%|▍         | 4/89 [00:02<00:35,  2.38it/s][A
Training:   7%|▋         | 6/89 [00:03<00:50,  1.66it/s][A
Training:  10%|█         | 9/89 [00:05<00:47,  1.68it/s][A
Training:  13%|█▎        | 12/89 [00:05<00:28,  2.71it/s][A
Training:  16%|█▌        | 14/89 [00:07<00:37,  1.99it/s][A
Training:  19%|█▉        | 17/89 [00:09<00:38,  1.89it/s][A
Training:  22%|██▏       | 20/89 [00:09<00:24,  2.80it/s][A
Training:  25%|██▍       | 22/89 [00:10<00:32,  2.06it/s][A
Training:  28%|██▊       | 25/89 [00:12<00:32,  1.95it/s][A
Training:  31%|███▏      | 28/89 [00:12<00:21,  2.82it/s][A
Training:  34%|███▎      | 30/89 [00:14<00:27,  2.12it/s][A
Training:  37%|███▋      | 33/89 [00:16<00:28,  1.96it/s][A
Training:  40%|████      | 36/89 [00:16<00:18,  2.81it/s][A
Training:  43%|████▎     | 38/89 [00:18<00:23,  2.13it/s][A
Training:  46%|████▌     | 41/89 [00

Epoch: 47/89 - Loss: 0.5239 - Accuracy: 0.9500



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:02<00:22,  2.03s/it][A
 33%|███▎      | 4/12 [00:02<00:03,  2.43it/s][A
 50%|█████     | 6/12 [00:03<00:03,  1.73it/s][A
100%|██████████| 12/12 [00:05<00:00,  2.22it/s][A
Epochs:  53%|█████▎    | 47/89 [36:15<32:15, 46.09s/it]

Val Loss: 0.5863 - Val Accuracy: 0.9459



Training:   0%|          | 0/89 [00:00<?, ?it/s][A
Training:   1%|          | 1/89 [00:02<03:04,  2.09s/it][A
Training:   4%|▍         | 4/89 [00:02<00:36,  2.32it/s][A
Training:   7%|▋         | 6/89 [00:03<00:50,  1.63it/s][A
Training:  10%|█         | 9/89 [00:05<00:48,  1.65it/s][A
Training:  13%|█▎        | 12/89 [00:05<00:28,  2.67it/s][A
Training:  16%|█▌        | 14/89 [00:07<00:37,  1.98it/s][A
Training:  19%|█▉        | 17/89 [00:09<00:38,  1.88it/s][A
Training:  22%|██▏       | 20/89 [00:09<00:24,  2.78it/s][A
Training:  25%|██▍       | 22/89 [00:11<00:32,  2.09it/s][A
Training:  28%|██▊       | 25/89 [00:12<00:32,  1.95it/s][A
Training:  31%|███▏      | 28/89 [00:12<00:21,  2.81it/s][A
Training:  34%|███▎      | 30/89 [00:14<00:27,  2.13it/s][A
Training:  37%|███▋      | 33/89 [00:16<00:28,  1.98it/s][A
Training:  40%|████      | 36/89 [00:16<00:18,  2.84it/s][A
Training:  43%|████▎     | 38/89 [00:17<00:23,  2.19it/s][A
Training:  46%|████▌     | 41/89 [00

Epoch: 48/89 - Loss: 0.5245 - Accuracy: 0.9470



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:20,  1.90s/it][A
 33%|███▎      | 4/12 [00:02<00:03,  2.55it/s][A
 50%|█████     | 6/12 [00:03<00:03,  1.81it/s][A
100%|██████████| 12/12 [00:05<00:00,  2.28it/s][A
Epochs:  54%|█████▍    | 48/89 [37:02<31:30, 46.10s/it]

Val Loss: 0.5969 - Val Accuracy: 0.9411



Training:   0%|          | 0/89 [00:00<?, ?it/s][A
Training:   1%|          | 1/89 [00:02<03:08,  2.14s/it][A
Training:   4%|▍         | 4/89 [00:02<00:37,  2.28it/s][A
Training:   7%|▋         | 6/89 [00:03<00:51,  1.62it/s][A
Training:  10%|█         | 9/89 [00:05<00:47,  1.67it/s][A
Training:  13%|█▎        | 12/89 [00:05<00:28,  2.70it/s][A
Training:  16%|█▌        | 14/89 [00:07<00:38,  1.96it/s][A
Training:  19%|█▉        | 17/89 [00:09<00:38,  1.87it/s][A
Training:  22%|██▏       | 20/89 [00:09<00:25,  2.76it/s][A
Training:  25%|██▍       | 22/89 [00:11<00:32,  2.09it/s][A
Training:  28%|██▊       | 25/89 [00:12<00:32,  1.97it/s][A
Training:  31%|███▏      | 28/89 [00:12<00:21,  2.82it/s][A
Training:  34%|███▎      | 30/89 [00:14<00:28,  2.10it/s][A
Training:  37%|███▋      | 33/89 [00:16<00:28,  1.98it/s][A
Training:  40%|████      | 36/89 [00:16<00:18,  2.83it/s][A
Training:  43%|████▎     | 38/89 [00:18<00:23,  2.14it/s][A
Training:  46%|████▌     | 41/89 [00

Epoch: 49/89 - Loss: 0.5073 - Accuracy: 0.9503



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:21,  1.95s/it][A
 33%|███▎      | 4/12 [00:02<00:03,  2.51it/s][A
 50%|█████     | 6/12 [00:03<00:03,  1.77it/s][A
100%|██████████| 12/12 [00:05<00:00,  2.26it/s][A
Epochs:  55%|█████▌    | 49/89 [37:48<30:46, 46.16s/it]

Val Loss: 0.5713 - Val Accuracy: 0.9432



Training:   0%|          | 0/89 [00:00<?, ?it/s][A
Training:   1%|          | 1/89 [00:02<03:00,  2.05s/it][A
Training:   4%|▍         | 4/89 [00:02<00:36,  2.35it/s][A
Training:   7%|▋         | 6/89 [00:03<00:50,  1.66it/s][A
Training:  10%|█         | 9/89 [00:05<00:47,  1.69it/s][A
Training:  12%|█▏        | 11/89 [00:05<00:32,  2.38it/s][A
Training:  15%|█▍        | 13/89 [00:07<00:42,  1.79it/s][A
Training:  18%|█▊        | 16/89 [00:07<00:25,  2.84it/s][A
Training:  20%|██        | 18/89 [00:09<00:34,  2.08it/s][A
Training:  24%|██▎       | 21/89 [00:10<00:35,  1.93it/s][A
Training:  27%|██▋       | 24/89 [00:11<00:22,  2.84it/s][A
Training:  29%|██▉       | 26/89 [00:12<00:29,  2.12it/s][A
Training:  33%|███▎      | 29/89 [00:14<00:30,  1.98it/s][A
Training:  36%|███▌      | 32/89 [00:14<00:20,  2.85it/s][A
Training:  38%|███▊      | 34/89 [00:16<00:25,  2.15it/s][A
Training:  42%|████▏     | 37/89 [00:17<00:26,  1.97it/s][A
Training:  45%|████▍     | 40/89 [00

Epoch: 50/89 - Loss: 0.4985 - Accuracy: 0.9464



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:20,  1.89s/it][A
 33%|███▎      | 4/12 [00:02<00:03,  2.56it/s][A
 50%|█████     | 6/12 [00:03<00:03,  1.80it/s][A
100%|██████████| 12/12 [00:05<00:00,  2.29it/s][A
Epochs:  56%|█████▌    | 50/89 [38:34<29:59, 46.13s/it]

Val Loss: 0.5445 - Val Accuracy: 0.9443



Training:   0%|          | 0/89 [00:00<?, ?it/s][A
Training:   1%|          | 1/89 [00:02<03:04,  2.10s/it][A
Training:   4%|▍         | 4/89 [00:02<00:36,  2.32it/s][A
Training:   7%|▋         | 6/89 [00:03<00:50,  1.64it/s][A
Training:  10%|█         | 9/89 [00:05<00:47,  1.69it/s][A
Training:  13%|█▎        | 12/89 [00:05<00:28,  2.72it/s][A
Training:  16%|█▌        | 14/89 [00:07<00:36,  2.03it/s][A
Training:  19%|█▉        | 17/89 [00:09<00:37,  1.94it/s][A
Training:  22%|██▏       | 20/89 [00:09<00:24,  2.85it/s][A
Training:  25%|██▍       | 22/89 [00:10<00:32,  2.08it/s][A
Training:  28%|██▊       | 25/89 [00:12<00:33,  1.93it/s][A
Training:  31%|███▏      | 28/89 [00:12<00:21,  2.78it/s][A
Training:  34%|███▎      | 30/89 [00:14<00:28,  2.08it/s][A
Training:  37%|███▋      | 33/89 [00:16<00:28,  1.96it/s][A
Training:  40%|████      | 36/89 [00:16<00:18,  2.80it/s][A
Training:  43%|████▎     | 38/89 [00:18<00:24,  2.11it/s][A
Training:  46%|████▌     | 41/89 [00

Epoch: 51/89 - Loss: 0.4965 - Accuracy: 0.9495



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:02<00:21,  2.00s/it][A
 33%|███▎      | 4/12 [00:02<00:03,  2.45it/s][A
 50%|█████     | 6/12 [00:03<00:03,  1.76it/s][A
100%|██████████| 12/12 [00:05<00:00,  2.24it/s][A
Epochs:  57%|█████▋    | 51/89 [39:20<29:16, 46.21s/it]

Val Loss: 0.6033 - Val Accuracy: 0.9443



Training:   0%|          | 0/89 [00:00<?, ?it/s][A
Training:   1%|          | 1/89 [00:02<03:05,  2.11s/it][A
Training:   3%|▎         | 3/89 [00:02<00:50,  1.71it/s][A
Training:   6%|▌         | 5/89 [00:03<01:00,  1.39it/s][A
Training:   9%|▉         | 8/89 [00:04<00:29,  2.75it/s][A
Training:  11%|█         | 10/89 [00:05<00:41,  1.92it/s][A
Training:  15%|█▍        | 13/89 [00:07<00:41,  1.84it/s][A
Training:  18%|█▊        | 16/89 [00:07<00:25,  2.82it/s][A
Training:  20%|██        | 18/89 [00:09<00:33,  2.09it/s][A
Training:  24%|██▎       | 21/89 [00:10<00:34,  1.96it/s][A
Training:  27%|██▋       | 24/89 [00:11<00:22,  2.85it/s][A
Training:  29%|██▉       | 26/89 [00:12<00:29,  2.14it/s][A
Training:  33%|███▎      | 29/89 [00:14<00:30,  1.99it/s][A
Training:  36%|███▌      | 32/89 [00:14<00:19,  2.86it/s][A
Training:  38%|███▊      | 34/89 [00:16<00:25,  2.12it/s][A
Training:  42%|████▏     | 37/89 [00:17<00:26,  1.97it/s][A
Training:  45%|████▍     | 40/89 [00

Epoch: 52/89 - Loss: 0.4954 - Accuracy: 0.9484



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:21,  1.94s/it][A
 33%|███▎      | 4/12 [00:02<00:03,  2.53it/s][A
 50%|█████     | 6/12 [00:03<00:03,  1.80it/s][A
100%|██████████| 12/12 [00:05<00:00,  2.27it/s][A
Epochs:  58%|█████▊    | 52/89 [40:06<28:29, 46.21s/it]

Val Loss: 0.6230 - Val Accuracy: 0.9359



Training:   0%|          | 0/89 [00:00<?, ?it/s][A
Training:   1%|          | 1/89 [00:02<03:08,  2.14s/it][A
Training:   4%|▍         | 4/89 [00:02<00:37,  2.28it/s][A
Training:   7%|▋         | 6/89 [00:03<00:50,  1.64it/s][A
Training:  10%|█         | 9/89 [00:05<00:47,  1.70it/s][A
Training:  13%|█▎        | 12/89 [00:05<00:28,  2.74it/s][A
Training:  16%|█▌        | 14/89 [00:07<00:37,  1.99it/s][A
Training:  19%|█▉        | 17/89 [00:09<00:38,  1.88it/s][A
Training:  22%|██▏       | 20/89 [00:09<00:24,  2.77it/s][A
Training:  25%|██▍       | 22/89 [00:11<00:32,  2.09it/s][A
Training:  28%|██▊       | 25/89 [00:12<00:32,  1.95it/s][A
Training:  30%|███       | 27/89 [00:12<00:24,  2.50it/s][A
Training:  33%|███▎      | 29/89 [00:14<00:31,  1.93it/s][A
Training:  36%|███▌      | 32/89 [00:14<00:19,  2.89it/s][A
Training:  38%|███▊      | 34/89 [00:16<00:26,  2.10it/s][A
Training:  42%|████▏     | 37/89 [00:18<00:26,  1.95it/s][A
Training:  45%|████▍     | 40/89 [00

Epoch: 53/89 - Loss: 0.4931 - Accuracy: 0.9476



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:21,  1.98s/it][A
 33%|███▎      | 4/12 [00:02<00:03,  2.44it/s][A
 50%|█████     | 6/12 [00:03<00:03,  1.74it/s][A
100%|██████████| 12/12 [00:05<00:00,  2.23it/s][A
Epochs:  60%|█████▉    | 53/89 [40:53<27:46, 46.28s/it]

Val Loss: 0.5957 - Val Accuracy: 0.9432



Training:   0%|          | 0/89 [00:00<?, ?it/s][A
Training:   1%|          | 1/89 [00:02<03:02,  2.08s/it][A
Training:   4%|▍         | 4/89 [00:02<00:36,  2.35it/s][A
Training:   7%|▋         | 6/89 [00:03<00:50,  1.64it/s][A
Training:  10%|█         | 9/89 [00:05<00:47,  1.69it/s][A
Training:  13%|█▎        | 12/89 [00:05<00:28,  2.71it/s][A
Training:  16%|█▌        | 14/89 [00:07<00:37,  1.98it/s][A
Training:  19%|█▉        | 17/89 [00:09<00:38,  1.88it/s][A
Training:  22%|██▏       | 20/89 [00:09<00:24,  2.77it/s][A
Training:  25%|██▍       | 22/89 [00:11<00:32,  2.08it/s][A
Training:  27%|██▋       | 24/89 [00:11<00:23,  2.72it/s][A
Training:  29%|██▉       | 26/89 [00:12<00:31,  2.00it/s][A
Training:  33%|███▎      | 29/89 [00:14<00:31,  1.89it/s][A
Training:  36%|███▌      | 32/89 [00:14<00:20,  2.78it/s][A
Training:  38%|███▊      | 34/89 [00:16<00:26,  2.07it/s][A
Training:  42%|████▏     | 37/89 [00:18<00:26,  1.93it/s][A
Training:  45%|████▍     | 40/89 [00

Epoch: 54/89 - Loss: 0.4945 - Accuracy: 0.9444



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:21,  1.98s/it][A
 33%|███▎      | 4/12 [00:02<00:03,  2.45it/s][A
 50%|█████     | 6/12 [00:03<00:03,  1.79it/s][A
100%|██████████| 12/12 [00:05<00:00,  2.28it/s][A
Epochs:  61%|██████    | 54/89 [41:39<27:01, 46.32s/it]

Val Loss: 0.5445 - Val Accuracy: 0.9432



Training:   0%|          | 0/89 [00:00<?, ?it/s][A
Training:   1%|          | 1/89 [00:02<03:10,  2.16s/it][A
Training:   4%|▍         | 4/89 [00:02<00:37,  2.27it/s][A
Training:   7%|▋         | 6/89 [00:03<00:50,  1.64it/s][A
Training:  10%|█         | 9/89 [00:05<00:47,  1.68it/s][A
Training:  13%|█▎        | 12/89 [00:05<00:28,  2.72it/s][A
Training:  16%|█▌        | 14/89 [00:07<00:37,  1.98it/s][A
Training:  19%|█▉        | 17/89 [00:09<00:38,  1.87it/s][A
Training:  22%|██▏       | 20/89 [00:09<00:24,  2.77it/s][A
Training:  25%|██▍       | 22/89 [00:11<00:32,  2.09it/s][A
Training:  28%|██▊       | 25/89 [00:12<00:32,  1.96it/s][A
Training:  31%|███▏      | 28/89 [00:12<00:21,  2.83it/s][A
Training:  34%|███▎      | 30/89 [00:14<00:27,  2.13it/s][A
Training:  37%|███▋      | 33/89 [00:16<00:28,  1.98it/s][A
Training:  40%|████      | 36/89 [00:16<00:18,  2.84it/s][A
Training:  43%|████▎     | 38/89 [00:18<00:23,  2.14it/s][A
Training:  46%|████▌     | 41/89 [00

Epoch: 55/89 - Loss: 0.4840 - Accuracy: 0.9521



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:20,  1.89s/it][A
 33%|███▎      | 4/12 [00:02<00:03,  2.56it/s][A
 50%|█████     | 6/12 [00:03<00:03,  1.80it/s][A
100%|██████████| 12/12 [00:05<00:00,  2.30it/s][A
Epochs:  62%|██████▏   | 55/89 [42:25<26:12, 46.25s/it]

Val Loss: 0.5729 - Val Accuracy: 0.9407



Training:   0%|          | 0/89 [00:00<?, ?it/s][A
Training:   1%|          | 1/89 [00:02<03:09,  2.15s/it][A
Training:   4%|▍         | 4/89 [00:02<00:37,  2.27it/s][A
Training:   7%|▋         | 6/89 [00:03<00:50,  1.66it/s][A
Training:  10%|█         | 9/89 [00:05<00:47,  1.69it/s][A
Training:  13%|█▎        | 12/89 [00:05<00:28,  2.74it/s][A
Training:  16%|█▌        | 14/89 [00:07<00:37,  2.00it/s][A
Training:  19%|█▉        | 17/89 [00:09<00:38,  1.88it/s][A
Training:  22%|██▏       | 20/89 [00:09<00:24,  2.77it/s][A
Training:  25%|██▍       | 22/89 [00:11<00:32,  2.05it/s][A
Training:  28%|██▊       | 25/89 [00:12<00:32,  1.95it/s][A
Training:  31%|███▏      | 28/89 [00:12<00:21,  2.83it/s][A
Training:  34%|███▎      | 30/89 [00:14<00:27,  2.13it/s][A
Training:  37%|███▋      | 33/89 [00:16<00:28,  1.99it/s][A
Training:  40%|████      | 36/89 [00:16<00:18,  2.84it/s][A
Training:  43%|████▎     | 38/89 [00:17<00:23,  2.15it/s][A
Training:  46%|████▌     | 41/89 [00

Epoch: 56/89 - Loss: 0.4860 - Accuracy: 0.9498



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:21,  1.96s/it][A
 33%|███▎      | 4/12 [00:02<00:03,  2.50it/s][A
 50%|█████     | 6/12 [00:03<00:03,  1.79it/s][A
100%|██████████| 12/12 [00:05<00:00,  2.28it/s][A
Epochs:  63%|██████▎   | 56/89 [43:12<25:25, 46.23s/it]

Val Loss: 0.5663 - Val Accuracy: 0.9349



Training:   0%|          | 0/89 [00:00<?, ?it/s][A
Training:   1%|          | 1/89 [00:02<03:05,  2.11s/it][A
Training:   4%|▍         | 4/89 [00:02<00:36,  2.32it/s][A
Training:   7%|▋         | 6/89 [00:03<00:51,  1.61it/s][A
Training:  10%|█         | 9/89 [00:05<00:47,  1.67it/s][A
Training:  13%|█▎        | 12/89 [00:05<00:28,  2.70it/s][A
Training:  16%|█▌        | 14/89 [00:07<00:37,  1.99it/s][A
Training:  19%|█▉        | 17/89 [00:09<00:38,  1.88it/s][A
Training:  22%|██▏       | 20/89 [00:09<00:24,  2.78it/s][A
Training:  25%|██▍       | 22/89 [00:11<00:32,  2.06it/s][A
Training:  28%|██▊       | 25/89 [00:12<00:33,  1.92it/s][A
Training:  31%|███▏      | 28/89 [00:12<00:21,  2.78it/s][A
Training:  34%|███▎      | 30/89 [00:14<00:28,  2.08it/s][A
Training:  37%|███▋      | 33/89 [00:16<00:28,  1.96it/s][A
Training:  40%|████      | 36/89 [00:16<00:18,  2.81it/s][A
Training:  43%|████▎     | 38/89 [00:18<00:24,  2.10it/s][A
Training:  46%|████▌     | 41/89 [00

Epoch: 57/89 - Loss: 0.4812 - Accuracy: 0.9505



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:21,  1.95s/it][A
 33%|███▎      | 4/12 [00:02<00:03,  2.49it/s][A
 50%|█████     | 6/12 [00:03<00:03,  1.76it/s][A
100%|██████████| 12/12 [00:05<00:00,  2.25it/s][A
Epochs:  64%|██████▍   | 57/89 [43:58<24:40, 46.28s/it]

Val Loss: 0.5639 - Val Accuracy: 0.9427



Training:   0%|          | 0/89 [00:00<?, ?it/s][A
Training:   1%|          | 1/89 [00:02<02:58,  2.03s/it][A
Training:   4%|▍         | 4/89 [00:02<00:35,  2.40it/s][A
Training:   7%|▋         | 6/89 [00:03<00:49,  1.69it/s][A
Training:  10%|█         | 9/89 [00:05<00:46,  1.71it/s][A
Training:  13%|█▎        | 12/89 [00:05<00:27,  2.77it/s][A
Training:  16%|█▌        | 14/89 [00:07<00:37,  2.01it/s][A
Training:  19%|█▉        | 17/89 [00:09<00:38,  1.89it/s][A
Training:  22%|██▏       | 20/89 [00:09<00:24,  2.79it/s][A
Training:  25%|██▍       | 22/89 [00:10<00:32,  2.09it/s][A
Training:  28%|██▊       | 25/89 [00:12<00:32,  1.94it/s][A
Training:  31%|███▏      | 28/89 [00:12<00:21,  2.80it/s][A
Training:  34%|███▎      | 30/89 [00:14<00:28,  2.06it/s][A
Training:  37%|███▋      | 33/89 [00:16<00:29,  1.90it/s][A
Training:  40%|████      | 36/89 [00:16<00:19,  2.73it/s][A
Training:  43%|████▎     | 38/89 [00:18<00:24,  2.06it/s][A
Training:  46%|████▌     | 41/89 [00

Epoch: 58/89 - Loss: 0.4831 - Accuracy: 0.9492



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:21,  1.93s/it][A
 33%|███▎      | 4/12 [00:02<00:03,  2.55it/s][A
 50%|█████     | 6/12 [00:03<00:03,  1.78it/s][A
100%|██████████| 12/12 [00:05<00:00,  2.27it/s][A
Epochs:  65%|██████▌   | 58/89 [44:44<23:56, 46.33s/it]

Val Loss: 0.5481 - Val Accuracy: 0.9368



Training:   0%|          | 0/89 [00:00<?, ?it/s][A
Training:   1%|          | 1/89 [00:02<03:10,  2.17s/it][A
Training:   4%|▍         | 4/89 [00:02<00:37,  2.27it/s][A
Training:   7%|▋         | 6/89 [00:03<00:51,  1.61it/s][A
Training:  10%|█         | 9/89 [00:05<00:47,  1.67it/s][A
Training:  13%|█▎        | 12/89 [00:05<00:28,  2.69it/s][A
Training:  16%|█▌        | 14/89 [00:07<00:37,  1.99it/s][A
Training:  19%|█▉        | 17/89 [00:09<00:38,  1.86it/s][A
Training:  22%|██▏       | 20/89 [00:09<00:25,  2.75it/s][A
Training:  25%|██▍       | 22/89 [00:11<00:32,  2.07it/s][A
Training:  28%|██▊       | 25/89 [00:12<00:32,  1.94it/s][A
Training:  31%|███▏      | 28/89 [00:12<00:21,  2.80it/s][A
Training:  34%|███▎      | 30/89 [00:14<00:27,  2.12it/s][A
Training:  37%|███▋      | 33/89 [00:16<00:28,  1.98it/s][A
Training:  40%|████      | 36/89 [00:16<00:18,  2.84it/s][A
Training:  43%|████▎     | 38/89 [00:18<00:24,  2.12it/s][A
Training:  46%|████▌     | 41/89 [00

Epoch: 59/89 - Loss: 0.4945 - Accuracy: 0.9485



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:21,  1.99s/it][A
 33%|███▎      | 4/12 [00:02<00:03,  2.45it/s][A
 50%|█████     | 6/12 [00:03<00:03,  1.78it/s][A
100%|██████████| 12/12 [00:05<00:00,  2.27it/s][A
Epochs:  66%|██████▋   | 59/89 [45:31<23:10, 46.34s/it]

Val Loss: 0.5537 - Val Accuracy: 0.9427



Training:   0%|          | 0/89 [00:00<?, ?it/s][A
Training:   1%|          | 1/89 [00:02<03:05,  2.11s/it][A
Training:   4%|▍         | 4/89 [00:02<00:36,  2.31it/s][A
Training:   7%|▋         | 6/89 [00:03<00:50,  1.65it/s][A
Training:  10%|█         | 9/89 [00:05<00:46,  1.71it/s][A
Training:  12%|█▏        | 11/89 [00:05<00:32,  2.39it/s][A
Training:  15%|█▍        | 13/89 [00:07<00:41,  1.82it/s][A
Training:  18%|█▊        | 16/89 [00:07<00:25,  2.89it/s][A
Training:  20%|██        | 18/89 [00:09<00:34,  2.08it/s][A
Training:  24%|██▎       | 21/89 [00:10<00:34,  1.96it/s][A
Training:  26%|██▌       | 23/89 [00:10<00:25,  2.54it/s][A
Training:  28%|██▊       | 25/89 [00:12<00:32,  1.97it/s][A
Training:  29%|██▉       | 26/89 [00:12<00:28,  2.23it/s][A
Training:  33%|███▎      | 29/89 [00:14<00:29,  2.03it/s][A
Training:  35%|███▍      | 31/89 [00:14<00:21,  2.70it/s][A
Training:  37%|███▋      | 33/89 [00:16<00:28,  1.97it/s][A
Training:  40%|████      | 36/89 [00

Epoch: 60/89 - Loss: 0.4809 - Accuracy: 0.9495



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:21,  1.95s/it][A
 33%|███▎      | 4/12 [00:02<00:03,  2.47it/s][A
 50%|█████     | 6/12 [00:03<00:03,  1.75it/s][A
100%|██████████| 12/12 [00:05<00:00,  2.24it/s][A
Epochs:  67%|██████▋   | 60/89 [46:17<22:24, 46.37s/it]

Val Loss: 0.5348 - Val Accuracy: 0.9391



Training:   0%|          | 0/89 [00:00<?, ?it/s][A
Training:   1%|          | 1/89 [00:02<03:07,  2.13s/it][A
Training:   4%|▍         | 4/89 [00:02<00:37,  2.30it/s][A
Training:   7%|▋         | 6/89 [00:03<00:50,  1.63it/s][A
Training:  10%|█         | 9/89 [00:05<00:46,  1.72it/s][A
Training:  13%|█▎        | 12/89 [00:05<00:28,  2.75it/s][A
Training:  16%|█▌        | 14/89 [00:07<00:37,  1.98it/s][A
Training:  19%|█▉        | 17/89 [00:09<00:38,  1.88it/s][A
Training:  22%|██▏       | 20/89 [00:09<00:24,  2.78it/s][A
Training:  25%|██▍       | 22/89 [00:10<00:32,  2.08it/s][A
Training:  28%|██▊       | 25/89 [00:12<00:32,  1.96it/s][A
Training:  31%|███▏      | 28/89 [00:12<00:21,  2.83it/s][A
Training:  34%|███▎      | 30/89 [00:14<00:27,  2.15it/s][A
Training:  36%|███▌      | 32/89 [00:14<00:20,  2.79it/s][A
Training:  38%|███▊      | 34/89 [00:16<00:26,  2.06it/s][A
Training:  40%|████      | 36/89 [00:16<00:19,  2.73it/s][A
Training:  43%|████▎     | 38/89 [00

Epoch: 61/89 - Loss: 0.4748 - Accuracy: 0.9481



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:21,  1.91s/it][A
 33%|███▎      | 4/12 [00:02<00:03,  2.56it/s][A
 50%|█████     | 6/12 [00:03<00:03,  1.78it/s][A
100%|██████████| 12/12 [00:05<00:00,  2.27it/s][A
Epochs:  69%|██████▊   | 61/89 [47:04<21:38, 46.37s/it]

Val Loss: 0.5555 - Val Accuracy: 0.9406



Training:   0%|          | 0/89 [00:00<?, ?it/s][A
Training:   1%|          | 1/89 [00:02<03:09,  2.15s/it][A
Training:   3%|▎         | 3/89 [00:02<00:51,  1.67it/s][A
Training:   6%|▌         | 5/89 [00:03<01:01,  1.36it/s][A
Training:   9%|▉         | 8/89 [00:04<00:29,  2.71it/s][A
Training:  11%|█         | 10/89 [00:05<00:41,  1.90it/s][A
Training:  15%|█▍        | 13/89 [00:07<00:41,  1.85it/s][A
Training:  17%|█▋        | 15/89 [00:07<00:29,  2.48it/s][A
Training:  19%|█▉        | 17/89 [00:09<00:37,  1.92it/s][A
Training:  21%|██▏       | 19/89 [00:09<00:27,  2.59it/s][A
Training:  24%|██▎       | 21/89 [00:10<00:35,  1.94it/s][A
Training:  26%|██▌       | 23/89 [00:11<00:25,  2.61it/s][A
Training:  28%|██▊       | 25/89 [00:12<00:33,  1.94it/s][A
Training:  30%|███       | 27/89 [00:12<00:23,  2.64it/s][A
Training:  33%|███▎      | 29/89 [00:14<00:30,  1.96it/s][A
Training:  35%|███▍      | 31/89 [00:14<00:21,  2.67it/s][A
Training:  37%|███▋      | 33/89 [00

Epoch: 62/89 - Loss: 0.4920 - Accuracy: 0.9464



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:21,  1.91s/it][A
 33%|███▎      | 4/12 [00:02<00:03,  2.55it/s][A
 50%|█████     | 6/12 [00:03<00:03,  1.84it/s][A
100%|██████████| 12/12 [00:05<00:00,  2.36it/s][A
Epochs:  70%|██████▉   | 62/89 [47:50<20:51, 46.36s/it]

Val Loss: 0.5026 - Val Accuracy: 0.9432



Training:   0%|          | 0/89 [00:00<?, ?it/s][A
Training:   1%|          | 1/89 [00:02<03:06,  2.12s/it][A
Training:   4%|▍         | 4/89 [00:02<00:36,  2.30it/s][A
Training:   7%|▋         | 6/89 [00:03<00:50,  1.65it/s][A
Training:  10%|█         | 9/89 [00:05<00:47,  1.69it/s][A
Training:  13%|█▎        | 12/89 [00:05<00:28,  2.73it/s][A
Training:  16%|█▌        | 14/89 [00:07<00:37,  2.00it/s][A
Training:  19%|█▉        | 17/89 [00:09<00:37,  1.91it/s][A
Training:  21%|██▏       | 19/89 [00:09<00:28,  2.48it/s][A
Training:  24%|██▎       | 21/89 [00:10<00:34,  1.95it/s][A
Training:  26%|██▌       | 23/89 [00:11<00:25,  2.58it/s][A
Training:  28%|██▊       | 25/89 [00:12<00:33,  1.91it/s][A
Training:  30%|███       | 27/89 [00:12<00:24,  2.58it/s][A
Training:  33%|███▎      | 29/89 [00:14<00:30,  1.95it/s][A
Training:  34%|███▎      | 30/89 [00:14<00:26,  2.26it/s][A
Training:  37%|███▋      | 33/89 [00:16<00:27,  2.05it/s][A
Training:  38%|███▊      | 34/89 [00

Epoch: 63/89 - Loss: 0.4782 - Accuracy: 0.9509



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:21,  1.96s/it][A
 33%|███▎      | 4/12 [00:02<00:03,  2.47it/s][A
 50%|█████     | 6/12 [00:03<00:03,  1.78it/s][A
100%|██████████| 12/12 [00:05<00:00,  2.26it/s][A
Epochs:  71%|███████   | 63/89 [48:36<20:04, 46.32s/it]

Val Loss: 0.4862 - Val Accuracy: 0.9418



Training:   0%|          | 0/89 [00:00<?, ?it/s][A
Training:   1%|          | 1/89 [00:02<03:03,  2.08s/it][A
Training:   4%|▍         | 4/89 [00:02<00:36,  2.35it/s][A
Training:   7%|▋         | 6/89 [00:03<00:49,  1.67it/s][A
Training:  10%|█         | 9/89 [00:05<00:46,  1.72it/s][A
Training:  13%|█▎        | 12/89 [00:05<00:27,  2.77it/s][A
Training:  16%|█▌        | 14/89 [00:07<00:36,  2.04it/s][A
Training:  19%|█▉        | 17/89 [00:09<00:37,  1.91it/s][A
Training:  22%|██▏       | 20/89 [00:09<00:24,  2.81it/s][A
Training:  25%|██▍       | 22/89 [00:10<00:31,  2.11it/s][A
Training:  28%|██▊       | 25/89 [00:12<00:32,  1.97it/s][A
Training:  30%|███       | 27/89 [00:12<00:24,  2.54it/s][A
Training:  33%|███▎      | 29/89 [00:14<00:30,  1.98it/s][A
Training:  35%|███▍      | 31/89 [00:14<00:22,  2.61it/s][A
Training:  37%|███▋      | 33/89 [00:16<00:28,  1.99it/s][A
Training:  39%|███▉      | 35/89 [00:16<00:20,  2.67it/s][A
Training:  42%|████▏     | 37/89 [00

Epoch: 64/89 - Loss: 0.4627 - Accuracy: 0.9503



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:21,  1.95s/it][A
 33%|███▎      | 4/12 [00:02<00:03,  2.49it/s][A
 50%|█████     | 6/12 [00:03<00:03,  1.83it/s][A
100%|██████████| 12/12 [00:05<00:00,  2.30it/s][A
Epochs:  72%|███████▏  | 64/89 [49:22<19:15, 46.21s/it]

Val Loss: 0.5114 - Val Accuracy: 0.9421



Training:   0%|          | 0/89 [00:00<?, ?it/s][A
Training:   1%|          | 1/89 [00:02<03:07,  2.14s/it][A
Training:   4%|▍         | 4/89 [00:02<00:37,  2.27it/s][A
Training:   7%|▋         | 6/89 [00:03<00:51,  1.61it/s][A
Training:  10%|█         | 9/89 [00:05<00:47,  1.70it/s][A
Training:  13%|█▎        | 12/89 [00:05<00:28,  2.73it/s][A
Training:  16%|█▌        | 14/89 [00:07<00:36,  2.03it/s][A
Training:  19%|█▉        | 17/89 [00:09<00:37,  1.91it/s][A
Training:  22%|██▏       | 20/89 [00:09<00:24,  2.82it/s][A
Training:  25%|██▍       | 22/89 [00:10<00:31,  2.11it/s][A
Training:  28%|██▊       | 25/89 [00:12<00:32,  1.97it/s][A
Training:  30%|███       | 27/89 [00:12<00:24,  2.54it/s][A
Training:  33%|███▎      | 29/89 [00:14<00:30,  1.95it/s][A
Training:  35%|███▍      | 31/89 [00:14<00:22,  2.58it/s][A
Training:  37%|███▋      | 33/89 [00:16<00:28,  1.96it/s][A
Training:  39%|███▉      | 35/89 [00:16<00:20,  2.63it/s][A
Training:  42%|████▏     | 37/89 [00

Epoch: 65/89 - Loss: 0.4531 - Accuracy: 0.9490



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:21,  1.93s/it][A
 33%|███▎      | 4/12 [00:02<00:03,  2.51it/s][A
 50%|█████     | 6/12 [00:03<00:03,  1.77it/s][A
100%|██████████| 12/12 [00:05<00:00,  2.27it/s][A
Epochs:  73%|███████▎  | 65/89 [50:08<18:29, 46.22s/it]

Val Loss: 0.5273 - Val Accuracy: 0.9427



Training:   0%|          | 0/89 [00:00<?, ?it/s][A
Training:   1%|          | 1/89 [00:02<03:03,  2.09s/it][A
Training:   4%|▍         | 4/89 [00:02<00:36,  2.34it/s][A
Training:   7%|▋         | 6/89 [00:03<00:50,  1.65it/s][A
Training:  10%|█         | 9/89 [00:05<00:47,  1.68it/s][A
Training:  12%|█▏        | 11/89 [00:05<00:33,  2.34it/s][A
Training:  15%|█▍        | 13/89 [00:07<00:42,  1.80it/s][A
Training:  18%|█▊        | 16/89 [00:07<00:25,  2.86it/s][A
Training:  20%|██        | 18/89 [00:09<00:34,  2.04it/s][A
Training:  24%|██▎       | 21/89 [00:10<00:35,  1.92it/s][A
Training:  27%|██▋       | 24/89 [00:11<00:22,  2.83it/s][A
Training:  29%|██▉       | 26/89 [00:12<00:29,  2.10it/s][A
Training:  33%|███▎      | 29/89 [00:14<00:31,  1.93it/s][A
Training:  36%|███▌      | 32/89 [00:14<00:20,  2.78it/s][A
Training:  38%|███▊      | 34/89 [00:16<00:25,  2.13it/s][A
Training:  42%|████▏     | 37/89 [00:18<00:26,  1.97it/s][A
Training:  45%|████▍     | 40/89 [00

Epoch: 66/89 - Loss: 0.4780 - Accuracy: 0.9458



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:21,  1.93s/it][A
 33%|███▎      | 4/12 [00:02<00:03,  2.51it/s][A
 50%|█████     | 6/12 [00:03<00:03,  1.77it/s][A
100%|██████████| 12/12 [00:05<00:00,  2.25it/s][A
Epochs:  74%|███████▍  | 66/89 [50:55<17:43, 46.25s/it]

Val Loss: 0.5658 - Val Accuracy: 0.9480



Training:   0%|          | 0/89 [00:00<?, ?it/s][A
Training:   1%|          | 1/89 [00:02<03:08,  2.14s/it][A
Training:   4%|▍         | 4/89 [00:02<00:37,  2.28it/s][A
Training:   7%|▋         | 6/89 [00:03<00:50,  1.64it/s][A
Training:  10%|█         | 9/89 [00:05<00:47,  1.69it/s][A
Training:  13%|█▎        | 12/89 [00:05<00:28,  2.73it/s][A
Training:  16%|█▌        | 14/89 [00:07<00:37,  2.01it/s][A
Training:  19%|█▉        | 17/89 [00:09<00:37,  1.90it/s][A
Training:  22%|██▏       | 20/89 [00:09<00:24,  2.81it/s][A
Training:  25%|██▍       | 22/89 [00:10<00:31,  2.09it/s][A
Training:  28%|██▊       | 25/89 [00:12<00:32,  1.96it/s][A
Training:  31%|███▏      | 28/89 [00:12<00:21,  2.82it/s][A
Training:  34%|███▎      | 30/89 [00:14<00:28,  2.10it/s][A
Training:  37%|███▋      | 33/89 [00:16<00:28,  1.96it/s][A
Training:  40%|████      | 36/89 [00:16<00:18,  2.82it/s][A
Training:  43%|████▎     | 38/89 [00:18<00:24,  2.12it/s][A
Training:  46%|████▌     | 41/89 [00

Epoch: 67/89 - Loss: 0.4787 - Accuracy: 0.9483



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:21,  1.95s/it][A
 33%|███▎      | 4/12 [00:02<00:03,  2.51it/s][A
 50%|█████     | 6/12 [00:03<00:03,  1.76it/s][A
100%|██████████| 12/12 [00:05<00:00,  2.28it/s][A
Epochs:  75%|███████▌  | 67/89 [51:41<16:57, 46.27s/it]

Val Loss: 0.5142 - Val Accuracy: 0.9475



Training:   0%|          | 0/89 [00:00<?, ?it/s][A
Training:   1%|          | 1/89 [00:02<03:04,  2.09s/it][A
Training:   4%|▍         | 4/89 [00:02<00:36,  2.35it/s][A
Training:   7%|▋         | 6/89 [00:03<00:51,  1.62it/s][A
Training:  10%|█         | 9/89 [00:05<00:47,  1.68it/s][A
Training:  13%|█▎        | 12/89 [00:05<00:28,  2.70it/s][A
Training:  16%|█▌        | 14/89 [00:07<00:37,  2.00it/s][A
Training:  19%|█▉        | 17/89 [00:09<00:38,  1.88it/s][A
Training:  22%|██▏       | 20/89 [00:09<00:24,  2.77it/s][A
Training:  25%|██▍       | 22/89 [00:11<00:32,  2.08it/s][A
Training:  28%|██▊       | 25/89 [00:12<00:32,  1.95it/s][A
Training:  31%|███▏      | 28/89 [00:12<00:21,  2.80it/s][A
Training:  34%|███▎      | 30/89 [00:14<00:28,  2.10it/s][A
Training:  37%|███▋      | 33/89 [00:16<00:28,  1.96it/s][A
Training:  40%|████      | 36/89 [00:16<00:19,  2.79it/s][A
Training:  43%|████▎     | 38/89 [00:18<00:24,  2.10it/s][A
Training:  45%|████▍     | 40/89 [00

Epoch: 68/89 - Loss: 0.4650 - Accuracy: 0.9483



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:21,  1.93s/it][A
 33%|███▎      | 4/12 [00:02<00:03,  2.51it/s][A
 50%|█████     | 6/12 [00:03<00:03,  1.81it/s][A
100%|██████████| 12/12 [00:05<00:00,  2.28it/s][A
Epochs:  76%|███████▋  | 68/89 [52:27<16:11, 46.28s/it]

Val Loss: 0.5300 - Val Accuracy: 0.9490



Training:   0%|          | 0/89 [00:00<?, ?it/s][A
Training:   1%|          | 1/89 [00:02<03:00,  2.05s/it][A
Training:   4%|▍         | 4/89 [00:02<00:36,  2.35it/s][A
Training:   7%|▋         | 6/89 [00:03<00:50,  1.65it/s][A
Training:  10%|█         | 9/89 [00:05<00:47,  1.70it/s][A
Training:  13%|█▎        | 12/89 [00:05<00:28,  2.73it/s][A
Training:  16%|█▌        | 14/89 [00:07<00:37,  1.99it/s][A
Training:  19%|█▉        | 17/89 [00:09<00:38,  1.89it/s][A
Training:  22%|██▏       | 20/89 [00:09<00:24,  2.79it/s][A
Training:  25%|██▍       | 22/89 [00:10<00:32,  2.08it/s][A
Training:  28%|██▊       | 25/89 [00:12<00:32,  1.96it/s][A
Training:  31%|███▏      | 28/89 [00:12<00:21,  2.83it/s][A
Training:  34%|███▎      | 30/89 [00:14<00:27,  2.13it/s][A
Training:  37%|███▋      | 33/89 [00:16<00:28,  1.99it/s][A
Training:  39%|███▉      | 35/89 [00:16<00:21,  2.53it/s][A
Training:  42%|████▏     | 37/89 [00:17<00:26,  1.94it/s][A
Training:  45%|████▍     | 40/89 [00

Epoch: 69/89 - Loss: 0.4782 - Accuracy: 0.9496



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:21,  1.96s/it][A
 33%|███▎      | 4/12 [00:02<00:03,  2.47it/s][A
 50%|█████     | 6/12 [00:03<00:03,  1.80it/s][A
100%|██████████| 12/12 [00:05<00:00,  2.29it/s][A
Epochs:  78%|███████▊  | 69/89 [53:14<15:25, 46.27s/it]

Val Loss: 0.4892 - Val Accuracy: 0.9432



Training:   0%|          | 0/89 [00:00<?, ?it/s][A
Training:   1%|          | 1/89 [00:02<03:02,  2.08s/it][A
Training:   4%|▍         | 4/89 [00:02<00:36,  2.35it/s][A
Training:   7%|▋         | 6/89 [00:03<00:49,  1.66it/s][A
Training:  10%|█         | 9/89 [00:05<00:46,  1.70it/s][A
Training:  13%|█▎        | 12/89 [00:05<00:28,  2.75it/s][A
Training:  16%|█▌        | 14/89 [00:07<00:36,  2.04it/s][A
Training:  19%|█▉        | 17/89 [00:09<00:37,  1.92it/s][A
Training:  22%|██▏       | 20/89 [00:09<00:24,  2.82it/s][A
Training:  25%|██▍       | 22/89 [00:10<00:32,  2.07it/s][A
Training:  28%|██▊       | 25/89 [00:12<00:33,  1.93it/s][A
Training:  31%|███▏      | 28/89 [00:12<00:22,  2.77it/s][A
Training:  34%|███▎      | 30/89 [00:14<00:27,  2.11it/s][A
Training:  37%|███▋      | 33/89 [00:16<00:28,  1.97it/s][A
Training:  40%|████      | 36/89 [00:16<00:18,  2.81it/s][A
Training:  43%|████▎     | 38/89 [00:18<00:24,  2.11it/s][A
Training:  46%|████▌     | 41/89 [00

Epoch: 70/89 - Loss: 0.4577 - Accuracy: 0.9492



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:21,  1.97s/it][A
 33%|███▎      | 4/12 [00:02<00:03,  2.47it/s][A
 50%|█████     | 6/12 [00:03<00:03,  1.78it/s][A
100%|██████████| 12/12 [00:05<00:00,  2.28it/s][A
Epochs:  79%|███████▊  | 70/89 [54:00<14:38, 46.26s/it]

Val Loss: 0.5266 - Val Accuracy: 0.9411



Training:   0%|          | 0/89 [00:00<?, ?it/s][A
Training:   1%|          | 1/89 [00:02<03:04,  2.10s/it][A
Training:   3%|▎         | 3/89 [00:02<00:50,  1.71it/s][A
Training:   6%|▌         | 5/89 [00:03<00:59,  1.41it/s][A
Training:   9%|▉         | 8/89 [00:03<00:29,  2.79it/s][A
Training:  11%|█         | 10/89 [00:05<00:40,  1.93it/s][A
Training:  15%|█▍        | 13/89 [00:07<00:41,  1.85it/s][A
Training:  18%|█▊        | 16/89 [00:07<00:25,  2.82it/s][A
Training:  20%|██        | 18/89 [00:09<00:33,  2.11it/s][A
Training:  24%|██▎       | 21/89 [00:10<00:34,  1.97it/s][A
Training:  27%|██▋       | 24/89 [00:10<00:22,  2.85it/s][A
Training:  29%|██▉       | 26/89 [00:12<00:29,  2.13it/s][A
Training:  30%|███       | 27/89 [00:12<00:25,  2.40it/s][A
Training:  33%|███▎      | 29/89 [00:14<00:32,  1.86it/s][A
Training:  36%|███▌      | 32/89 [00:14<00:19,  2.91it/s][A
Training:  38%|███▊      | 34/89 [00:16<00:26,  2.07it/s][A
Training:  42%|████▏     | 37/89 [00

Epoch: 71/89 - Loss: 0.4549 - Accuracy: 0.9500



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:21,  1.96s/it][A
 33%|███▎      | 4/12 [00:02<00:03,  2.51it/s][A
 50%|█████     | 6/12 [00:03<00:03,  1.77it/s][A
100%|██████████| 12/12 [00:05<00:00,  2.27it/s][A
Epochs:  80%|███████▉  | 71/89 [54:46<13:52, 46.27s/it]

Val Loss: 0.5377 - Val Accuracy: 0.9443



Training:   0%|          | 0/89 [00:00<?, ?it/s][A
Training:   1%|          | 1/89 [00:02<03:07,  2.13s/it][A
Training:   4%|▍         | 4/89 [00:02<00:37,  2.29it/s][A
Training:   7%|▋         | 6/89 [00:03<00:50,  1.63it/s][A
Training:  10%|█         | 9/89 [00:05<00:47,  1.67it/s][A
Training:  13%|█▎        | 12/89 [00:05<00:28,  2.70it/s][A
Training:  16%|█▌        | 14/89 [00:07<00:37,  1.99it/s][A
Training:  19%|█▉        | 17/89 [00:09<00:38,  1.89it/s][A
Training:  22%|██▏       | 20/89 [00:09<00:24,  2.78it/s][A
Training:  25%|██▍       | 22/89 [00:11<00:32,  2.07it/s][A
Training:  28%|██▊       | 25/89 [00:12<00:33,  1.94it/s][A
Training:  31%|███▏      | 28/89 [00:12<00:21,  2.79it/s][A
Training:  34%|███▎      | 30/89 [00:14<00:28,  2.09it/s][A
Training:  37%|███▋      | 33/89 [00:16<00:28,  1.96it/s][A
Training:  40%|████      | 36/89 [00:16<00:18,  2.79it/s][A
Training:  43%|████▎     | 38/89 [00:18<00:24,  2.11it/s][A
Training:  46%|████▌     | 41/89 [00

Epoch: 72/89 - Loss: 0.4678 - Accuracy: 0.9498



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:21,  1.96s/it][A
 33%|███▎      | 4/12 [00:02<00:03,  2.50it/s][A
 50%|█████     | 6/12 [00:03<00:03,  1.78it/s][A
100%|██████████| 12/12 [00:05<00:00,  2.28it/s][A
Epochs:  81%|████████  | 72/89 [55:33<13:07, 46.31s/it]

Val Loss: 0.5304 - Val Accuracy: 0.9427



Training:   0%|          | 0/89 [00:00<?, ?it/s][A
Training:   1%|          | 1/89 [00:02<03:05,  2.11s/it][A
Training:   4%|▍         | 4/89 [00:02<00:36,  2.32it/s][A
Training:   7%|▋         | 6/89 [00:03<00:50,  1.65it/s][A
Training:  10%|█         | 9/89 [00:05<00:47,  1.69it/s][A
Training:  13%|█▎        | 12/89 [00:05<00:28,  2.72it/s][A
Training:  16%|█▌        | 14/89 [00:07<00:37,  1.99it/s][A
Training:  19%|█▉        | 17/89 [00:09<00:38,  1.89it/s][A
Training:  22%|██▏       | 20/89 [00:09<00:24,  2.79it/s][A
Training:  25%|██▍       | 22/89 [00:11<00:32,  2.06it/s][A
Training:  28%|██▊       | 25/89 [00:12<00:33,  1.92it/s][A
Training:  30%|███       | 27/89 [00:12<00:25,  2.48it/s][A
Training:  33%|███▎      | 29/89 [00:14<00:31,  1.93it/s][A
Training:  35%|███▍      | 31/89 [00:14<00:22,  2.56it/s][A
Training:  37%|███▋      | 33/89 [00:16<00:28,  1.93it/s][A
Training:  39%|███▉      | 35/89 [00:16<00:21,  2.55it/s][A
Training:  42%|████▏     | 37/89 [00

Epoch: 73/89 - Loss: 0.4665 - Accuracy: 0.9500



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:21,  1.92s/it][A
 33%|███▎      | 4/12 [00:02<00:03,  2.52it/s][A
 50%|█████     | 6/12 [00:03<00:03,  1.82it/s][A
100%|██████████| 12/12 [00:05<00:00,  2.30it/s][A
Epochs:  82%|████████▏ | 73/89 [56:19<12:21, 46.34s/it]

Val Loss: 0.5460 - Val Accuracy: 0.9464



Training:   0%|          | 0/89 [00:00<?, ?it/s][A
Training:   1%|          | 1/89 [00:02<03:00,  2.05s/it][A
Training:   4%|▍         | 4/89 [00:02<00:35,  2.39it/s][A
Training:   7%|▋         | 6/89 [00:03<00:49,  1.67it/s][A
Training:  10%|█         | 9/89 [00:05<00:47,  1.69it/s][A
Training:  13%|█▎        | 12/89 [00:05<00:28,  2.72it/s][A
Training:  16%|█▌        | 14/89 [00:07<00:37,  1.99it/s][A
Training:  19%|█▉        | 17/89 [00:09<00:37,  1.90it/s][A
Training:  22%|██▏       | 20/89 [00:09<00:24,  2.81it/s][A
Training:  25%|██▍       | 22/89 [00:10<00:31,  2.10it/s][A
Training:  28%|██▊       | 25/89 [00:12<00:32,  1.94it/s][A
Training:  31%|███▏      | 28/89 [00:12<00:21,  2.81it/s][A
Training:  34%|███▎      | 30/89 [00:14<00:27,  2.12it/s][A
Training:  37%|███▋      | 33/89 [00:16<00:28,  1.94it/s][A
Training:  40%|████      | 36/89 [00:16<00:19,  2.77it/s][A
Training:  43%|████▎     | 38/89 [00:18<00:24,  2.07it/s][A
Training:  46%|████▌     | 41/89 [00

Epoch: 74/89 - Loss: 0.4535 - Accuracy: 0.9498



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:21,  1.93s/it][A
 33%|███▎      | 4/12 [00:02<00:03,  2.51it/s][A
 50%|█████     | 6/12 [00:03<00:03,  1.79it/s][A
100%|██████████| 12/12 [00:05<00:00,  2.28it/s][A
Epochs:  83%|████████▎ | 74/89 [57:05<11:35, 46.36s/it]

Val Loss: 0.5579 - Val Accuracy: 0.9432



Training:   0%|          | 0/89 [00:00<?, ?it/s][A
Training:   1%|          | 1/89 [00:02<03:02,  2.07s/it][A
Training:   3%|▎         | 3/89 [00:02<00:49,  1.74it/s][A
Training:   6%|▌         | 5/89 [00:03<00:59,  1.41it/s][A
Training:   9%|▉         | 8/89 [00:03<00:29,  2.77it/s][A
Training:  11%|█         | 10/89 [00:05<00:41,  1.92it/s][A
Training:  15%|█▍        | 13/89 [00:07<00:41,  1.84it/s][A
Training:  18%|█▊        | 16/89 [00:07<00:25,  2.81it/s][A
Training:  20%|██        | 18/89 [00:09<00:34,  2.03it/s][A
Training:  24%|██▎       | 21/89 [00:11<00:35,  1.90it/s][A
Training:  26%|██▌       | 23/89 [00:11<00:27,  2.44it/s][A
Training:  28%|██▊       | 25/89 [00:12<00:33,  1.91it/s][A
Training:  30%|███       | 27/89 [00:12<00:24,  2.55it/s][A
Training:  33%|███▎      | 29/89 [00:14<00:31,  1.93it/s][A
Training:  36%|███▌      | 32/89 [00:14<00:19,  2.97it/s][A
Training:  38%|███▊      | 34/89 [00:16<00:26,  2.10it/s][A
Training:  42%|████▏     | 37/89 [00

Epoch: 75/89 - Loss: 0.4567 - Accuracy: 0.9495



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:21,  1.94s/it][A
 33%|███▎      | 4/12 [00:02<00:03,  2.51it/s][A
 50%|█████     | 6/12 [00:03<00:03,  1.75it/s][A
100%|██████████| 12/12 [00:05<00:00,  2.27it/s][A
Epochs:  84%|████████▍ | 75/89 [57:52<10:50, 46.45s/it]

Val Loss: 0.5259 - Val Accuracy: 0.9375



Training:   0%|          | 0/89 [00:00<?, ?it/s][A
Training:   1%|          | 1/89 [00:02<03:09,  2.16s/it][A
Training:   4%|▍         | 4/89 [00:02<00:37,  2.25it/s][A
Training:   7%|▋         | 6/89 [00:04<00:52,  1.59it/s][A
Training:  10%|█         | 9/89 [00:05<00:48,  1.66it/s][A
Training:  13%|█▎        | 12/89 [00:05<00:28,  2.69it/s][A
Training:  16%|█▌        | 14/89 [00:07<00:37,  1.99it/s][A
Training:  19%|█▉        | 17/89 [00:09<00:38,  1.89it/s][A
Training:  22%|██▏       | 20/89 [00:09<00:24,  2.79it/s][A
Training:  25%|██▍       | 22/89 [00:11<00:32,  2.08it/s][A
Training:  28%|██▊       | 25/89 [00:12<00:32,  1.95it/s][A
Training:  31%|███▏      | 28/89 [00:12<00:21,  2.82it/s][A
Training:  34%|███▎      | 30/89 [00:14<00:28,  2.10it/s][A
Training:  37%|███▋      | 33/89 [00:16<00:28,  1.95it/s][A
Training:  40%|████      | 36/89 [00:16<00:18,  2.79it/s][A
Training:  43%|████▎     | 38/89 [00:18<00:23,  2.13it/s][A
Training:  46%|████▌     | 41/89 [00

Epoch: 76/89 - Loss: 0.4533 - Accuracy: 0.9483



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:02<00:22,  2.07s/it][A
 33%|███▎      | 4/12 [00:02<00:03,  2.38it/s][A
 50%|█████     | 6/12 [00:03<00:03,  1.72it/s][A
100%|██████████| 12/12 [00:05<00:00,  2.19it/s][A
Epochs:  85%|████████▌ | 76/89 [58:39<10:05, 46.59s/it]

Val Loss: 0.4980 - Val Accuracy: 0.9459



Training:   0%|          | 0/89 [00:00<?, ?it/s][A
Training:   1%|          | 1/89 [00:02<03:07,  2.13s/it][A
Training:   4%|▍         | 4/89 [00:02<00:36,  2.30it/s][A
Training:   7%|▋         | 6/89 [00:03<00:50,  1.63it/s][A
Training:  10%|█         | 9/89 [00:05<00:48,  1.66it/s][A
Training:  13%|█▎        | 12/89 [00:05<00:28,  2.69it/s][A
Training:  16%|█▌        | 14/89 [00:07<00:37,  1.98it/s][A
Training:  19%|█▉        | 17/89 [00:09<00:38,  1.89it/s][A
Training:  22%|██▏       | 20/89 [00:09<00:24,  2.78it/s][A
Training:  25%|██▍       | 22/89 [00:11<00:32,  2.06it/s][A
Training:  28%|██▊       | 25/89 [00:12<00:32,  1.94it/s][A
Training:  31%|███▏      | 28/89 [00:12<00:21,  2.79it/s][A
Training:  34%|███▎      | 30/89 [00:14<00:27,  2.11it/s][A
Training:  37%|███▋      | 33/89 [00:16<00:28,  1.95it/s][A
Training:  40%|████      | 36/89 [00:16<00:18,  2.79it/s][A
Training:  43%|████▎     | 38/89 [00:18<00:24,  2.09it/s][A
Training:  46%|████▌     | 41/89 [00

Epoch: 77/89 - Loss: 0.4622 - Accuracy: 0.9504



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:21,  1.97s/it][A
 33%|███▎      | 4/12 [00:02<00:03,  2.48it/s][A
 50%|█████     | 6/12 [00:03<00:03,  1.76it/s][A
100%|██████████| 12/12 [00:05<00:00,  2.24it/s][A
Epochs:  87%|████████▋ | 77/89 [59:25<09:18, 46.55s/it]

Val Loss: 0.5598 - Val Accuracy: 0.9459



Training:   0%|          | 0/89 [00:00<?, ?it/s][A
Training:   1%|          | 1/89 [00:02<03:04,  2.10s/it][A
Training:   4%|▍         | 4/89 [00:02<00:36,  2.31it/s][A
Training:   7%|▋         | 6/89 [00:03<00:51,  1.62it/s][A
Training:  10%|█         | 9/89 [00:05<00:47,  1.68it/s][A
Training:  13%|█▎        | 12/89 [00:05<00:28,  2.70it/s][A
Training:  16%|█▌        | 14/89 [00:07<00:38,  1.95it/s][A
Training:  19%|█▉        | 17/89 [00:09<00:38,  1.86it/s][A
Training:  22%|██▏       | 20/89 [00:09<00:25,  2.76it/s][A
Training:  25%|██▍       | 22/89 [00:11<00:32,  2.06it/s][A
Training:  28%|██▊       | 25/89 [00:12<00:33,  1.93it/s][A
Training:  31%|███▏      | 28/89 [00:12<00:21,  2.78it/s][A
Training:  34%|███▎      | 30/89 [00:14<00:28,  2.08it/s][A
Training:  37%|███▋      | 33/89 [00:16<00:28,  1.95it/s][A
Training:  40%|████      | 36/89 [00:16<00:19,  2.79it/s][A
Training:  43%|████▎     | 38/89 [00:18<00:24,  2.11it/s][A
Training:  46%|████▌     | 41/89 [00

Epoch: 78/89 - Loss: 0.4463 - Accuracy: 0.9518



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:21,  1.93s/it][A
 33%|███▎      | 4/12 [00:02<00:03,  2.52it/s][A
 50%|█████     | 6/12 [00:03<00:03,  1.78it/s][A
100%|██████████| 12/12 [00:05<00:00,  2.27it/s][A
Epochs:  88%|████████▊ | 78/89 [1:00:12<08:32, 46.59s/it]

Val Loss: 0.5407 - Val Accuracy: 0.9464



Training:   0%|          | 0/89 [00:00<?, ?it/s][A
Training:   1%|          | 1/89 [00:02<03:11,  2.18s/it][A
Training:   3%|▎         | 3/89 [00:02<00:52,  1.64it/s][A
Training:   6%|▌         | 5/89 [00:03<01:01,  1.38it/s][A
Training:   8%|▊         | 7/89 [00:04<00:37,  2.20it/s][A
Training:  10%|█         | 9/89 [00:05<00:46,  1.72it/s][A
Training:  12%|█▏        | 11/89 [00:05<00:31,  2.46it/s][A
Training:  15%|█▍        | 13/89 [00:07<00:41,  1.83it/s][A
Training:  17%|█▋        | 15/89 [00:07<00:28,  2.57it/s][A
Training:  19%|█▉        | 17/89 [00:09<00:38,  1.88it/s][A
Training:  22%|██▏       | 20/89 [00:09<00:22,  3.00it/s][A
Training:  25%|██▍       | 22/89 [00:11<00:31,  2.14it/s][A
Training:  27%|██▋       | 24/89 [00:11<00:22,  2.86it/s][A
Training:  29%|██▉       | 26/89 [00:12<00:31,  2.02it/s][A
Training:  33%|███▎      | 29/89 [00:14<00:31,  1.90it/s][A
Training:  36%|███▌      | 32/89 [00:14<00:20,  2.81it/s][A
Training:  38%|███▊      | 34/89 [00:

Epoch: 79/89 - Loss: 0.4420 - Accuracy: 0.9508



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:21,  1.97s/it][A
 33%|███▎      | 4/12 [00:02<00:03,  2.46it/s][A
 50%|█████     | 6/12 [00:03<00:03,  1.75it/s][A
100%|██████████| 12/12 [00:05<00:00,  2.25it/s][A
Epochs:  89%|████████▉ | 79/89 [1:00:59<07:46, 46.60s/it]

Val Loss: 0.5120 - Val Accuracy: 0.9459



Training:   0%|          | 0/89 [00:00<?, ?it/s][A
Training:   1%|          | 1/89 [00:02<03:03,  2.09s/it][A
Training:   4%|▍         | 4/89 [00:02<00:36,  2.33it/s][A
Training:   7%|▋         | 6/89 [00:03<00:49,  1.66it/s][A
Training:  10%|█         | 9/89 [00:05<00:46,  1.70it/s][A
Training:  13%|█▎        | 12/89 [00:05<00:28,  2.74it/s][A
Training:  16%|█▌        | 14/89 [00:07<00:37,  1.99it/s][A
Training:  19%|█▉        | 17/89 [00:09<00:37,  1.90it/s][A
Training:  22%|██▏       | 20/89 [00:09<00:24,  2.80it/s][A
Training:  25%|██▍       | 22/89 [00:10<00:31,  2.13it/s][A
Training:  28%|██▊       | 25/89 [00:12<00:32,  1.99it/s][A
Training:  31%|███▏      | 28/89 [00:12<00:21,  2.87it/s][A
Training:  34%|███▎      | 30/89 [00:14<00:27,  2.14it/s][A
Training:  37%|███▋      | 33/89 [00:16<00:28,  1.97it/s][A
Training:  40%|████      | 36/89 [00:16<00:18,  2.82it/s][A
Training:  43%|████▎     | 38/89 [00:17<00:24,  2.11it/s][A
Training:  46%|████▌     | 41/89 [00

Epoch: 80/89 - Loss: 0.4515 - Accuracy: 0.9510



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:21,  1.99s/it][A
 33%|███▎      | 4/12 [00:02<00:03,  2.47it/s][A
 50%|█████     | 6/12 [00:03<00:03,  1.79it/s][A
100%|██████████| 12/12 [00:05<00:00,  2.29it/s][A
Epochs:  90%|████████▉ | 80/89 [1:01:45<06:57, 46.42s/it]

Val Loss: 0.5024 - Val Accuracy: 0.9416



Training:   0%|          | 0/89 [00:00<?, ?it/s][A
Training:   1%|          | 1/89 [00:02<02:56,  2.01s/it][A
Training:   3%|▎         | 3/89 [00:02<00:48,  1.78it/s][A
Training:   6%|▌         | 5/89 [00:03<00:58,  1.43it/s][A
Training:   9%|▉         | 8/89 [00:03<00:28,  2.81it/s][A
Training:  11%|█         | 10/89 [00:05<00:40,  1.93it/s][A
Training:  15%|█▍        | 13/89 [00:07<00:40,  1.86it/s][A
Training:  18%|█▊        | 16/89 [00:07<00:25,  2.83it/s][A
Training:  20%|██        | 18/89 [00:09<00:34,  2.08it/s][A
Training:  24%|██▎       | 21/89 [00:10<00:35,  1.94it/s][A
Training:  27%|██▋       | 24/89 [00:10<00:23,  2.82it/s][A
Training:  29%|██▉       | 26/89 [00:12<00:29,  2.12it/s][A
Training:  33%|███▎      | 29/89 [00:14<00:30,  1.98it/s][A
Training:  36%|███▌      | 32/89 [00:14<00:20,  2.83it/s][A
Training:  38%|███▊      | 34/89 [00:16<00:25,  2.13it/s][A
Training:  42%|████▏     | 37/89 [00:17<00:26,  1.98it/s][A
Training:  45%|████▍     | 40/89 [00

Epoch: 81/89 - Loss: 0.4658 - Accuracy: 0.9493



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:20,  1.90s/it][A
 33%|███▎      | 4/12 [00:02<00:03,  2.58it/s][A
 50%|█████     | 6/12 [00:03<00:03,  1.81it/s][A
100%|██████████| 12/12 [00:05<00:00,  2.31it/s][A
Epochs:  91%|█████████ | 81/89 [1:02:31<06:10, 46.29s/it]

Val Loss: 0.5028 - Val Accuracy: 0.9480



Training:   0%|          | 0/89 [00:00<?, ?it/s][A
Training:   1%|          | 1/89 [00:02<03:04,  2.10s/it][A
Training:   4%|▍         | 4/89 [00:02<00:36,  2.34it/s][A
Training:   7%|▋         | 6/89 [00:03<00:50,  1.63it/s][A
Training:  10%|█         | 9/89 [00:05<00:47,  1.68it/s][A
Training:  13%|█▎        | 12/89 [00:05<00:28,  2.74it/s][A
Training:  16%|█▌        | 14/89 [00:07<00:37,  2.00it/s][A
Training:  19%|█▉        | 17/89 [00:09<00:38,  1.86it/s][A
Training:  22%|██▏       | 20/89 [00:09<00:24,  2.76it/s][A
Training:  25%|██▍       | 22/89 [00:10<00:31,  2.10it/s][A
Training:  28%|██▊       | 25/89 [00:12<00:32,  1.97it/s][A
Training:  31%|███▏      | 28/89 [00:12<00:21,  2.85it/s][A
Training:  34%|███▎      | 30/89 [00:14<00:27,  2.12it/s][A
Training:  37%|███▋      | 33/89 [00:16<00:28,  1.99it/s][A
Training:  40%|████      | 36/89 [00:16<00:18,  2.86it/s][A
Training:  43%|████▎     | 38/89 [00:17<00:23,  2.14it/s][A
Training:  46%|████▌     | 41/89 [00

Epoch: 82/89 - Loss: 0.4514 - Accuracy: 0.9481



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:21,  1.94s/it][A
 33%|███▎      | 4/12 [00:02<00:03,  2.51it/s][A
 50%|█████     | 6/12 [00:03<00:03,  1.83it/s][A
100%|██████████| 12/12 [00:05<00:00,  2.31it/s][A
Epochs:  92%|█████████▏| 82/89 [1:03:17<05:23, 46.21s/it]

Val Loss: 0.5622 - Val Accuracy: 0.9363



Training:   0%|          | 0/89 [00:00<?, ?it/s][A
Training:   1%|          | 1/89 [00:02<03:08,  2.14s/it][A
Training:   4%|▍         | 4/89 [00:02<00:37,  2.28it/s][A
Training:   7%|▋         | 6/89 [00:03<00:50,  1.64it/s][A
Training:  10%|█         | 9/89 [00:05<00:47,  1.69it/s][A
Training:  13%|█▎        | 12/89 [00:05<00:28,  2.74it/s][A
Training:  16%|█▌        | 14/89 [00:07<00:37,  2.01it/s][A
Training:  19%|█▉        | 17/89 [00:09<00:37,  1.90it/s][A
Training:  22%|██▏       | 20/89 [00:09<00:24,  2.80it/s][A
Training:  25%|██▍       | 22/89 [00:10<00:31,  2.11it/s][A
Training:  28%|██▊       | 25/89 [00:12<00:32,  1.98it/s][A
Training:  31%|███▏      | 28/89 [00:12<00:21,  2.85it/s][A
Training:  34%|███▎      | 30/89 [00:14<00:27,  2.15it/s][A
Training:  37%|███▋      | 33/89 [00:16<00:27,  2.00it/s][A
Training:  40%|████      | 36/89 [00:16<00:18,  2.86it/s][A
Training:  43%|████▎     | 38/89 [00:17<00:23,  2.13it/s][A
Training:  46%|████▌     | 41/89 [00

Epoch: 83/89 - Loss: 0.4558 - Accuracy: 0.9481



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:21,  1.91s/it][A
 33%|███▎      | 4/12 [00:02<00:03,  2.56it/s][A
 50%|█████     | 6/12 [00:03<00:03,  1.82it/s][A
100%|██████████| 12/12 [00:05<00:00,  2.28it/s][A
Epochs:  93%|█████████▎| 83/89 [1:04:03<04:36, 46.13s/it]

Val Loss: 0.5528 - Val Accuracy: 0.9380



Training:   0%|          | 0/89 [00:00<?, ?it/s][A
Training:   1%|          | 1/89 [00:02<03:06,  2.12s/it][A
Training:   3%|▎         | 3/89 [00:02<00:50,  1.69it/s][A
Training:   6%|▌         | 5/89 [00:03<00:59,  1.40it/s][A
Training:   8%|▊         | 7/89 [00:03<00:35,  2.31it/s][A
Training:  10%|█         | 9/89 [00:05<00:46,  1.71it/s][A
Training:  13%|█▎        | 12/89 [00:05<00:26,  2.91it/s][A
Training:  16%|█▌        | 14/89 [00:07<00:36,  2.05it/s][A
Training:  19%|█▉        | 17/89 [00:09<00:37,  1.94it/s][A
Training:  22%|██▏       | 20/89 [00:09<00:23,  2.90it/s][A
Training:  25%|██▍       | 22/89 [00:10<00:31,  2.11it/s][A
Training:  28%|██▊       | 25/89 [00:12<00:32,  1.95it/s][A
Training:  31%|███▏      | 28/89 [00:12<00:21,  2.82it/s][A
Training:  34%|███▎      | 30/89 [00:14<00:27,  2.14it/s][A
Training:  37%|███▋      | 33/89 [00:16<00:28,  2.00it/s][A
Training:  39%|███▉      | 35/89 [00:16<00:21,  2.56it/s][A
Training:  42%|████▏     | 37/89 [00:

Epoch: 84/89 - Loss: 0.4525 - Accuracy: 0.9499



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:21,  1.92s/it][A
 25%|██▌       | 3/12 [00:02<00:04,  1.87it/s][A
 42%|████▏     | 5/12 [00:03<00:04,  1.55it/s][A
 67%|██████▋   | 8/12 [00:03<00:01,  3.05it/s][A
100%|██████████| 12/12 [00:05<00:00,  2.29it/s][A
Epochs:  94%|█████████▍| 84/89 [1:04:49<03:50, 46.06s/it]

Val Loss: 0.5128 - Val Accuracy: 0.9432



Training:   0%|          | 0/89 [00:00<?, ?it/s][A
Training:   1%|          | 1/89 [00:02<03:07,  2.13s/it][A
Training:   4%|▍         | 4/89 [00:02<00:37,  2.28it/s][A
Training:   7%|▋         | 6/89 [00:03<00:50,  1.63it/s][A
Training:  10%|█         | 9/89 [00:05<00:47,  1.69it/s][A
Training:  13%|█▎        | 12/89 [00:05<00:28,  2.73it/s][A
Training:  16%|█▌        | 14/89 [00:07<00:37,  2.01it/s][A
Training:  19%|█▉        | 17/89 [00:09<00:37,  1.91it/s][A
Training:  22%|██▏       | 20/89 [00:09<00:24,  2.82it/s][A
Training:  25%|██▍       | 22/89 [00:10<00:32,  2.09it/s][A
Training:  28%|██▊       | 25/89 [00:12<00:32,  1.96it/s][A
Training:  31%|███▏      | 28/89 [00:12<00:21,  2.82it/s][A
Training:  34%|███▎      | 30/89 [00:14<00:27,  2.13it/s][A
Training:  37%|███▋      | 33/89 [00:16<00:28,  1.99it/s][A
Training:  40%|████      | 36/89 [00:16<00:18,  2.84it/s][A
Training:  43%|████▎     | 38/89 [00:17<00:23,  2.14it/s][A
Training:  46%|████▌     | 41/89 [00

Epoch: 85/89 - Loss: 0.4538 - Accuracy: 0.9487



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:20,  1.87s/it][A
 33%|███▎      | 4/12 [00:02<00:03,  2.56it/s][A
 50%|█████     | 6/12 [00:03<00:03,  1.82it/s][A
 75%|███████▌  | 9/12 [00:04<00:01,  1.92it/s][A
100%|██████████| 12/12 [00:05<00:00,  2.31it/s][A
Epochs:  96%|█████████▌| 85/89 [1:05:34<03:03, 46.00s/it]

Val Loss: 0.5362 - Val Accuracy: 0.9485



Training:   0%|          | 0/89 [00:00<?, ?it/s][A
Training:   1%|          | 1/89 [00:02<03:02,  2.08s/it][A
Training:   4%|▍         | 4/89 [00:02<00:35,  2.37it/s][A
Training:   7%|▋         | 6/89 [00:03<00:49,  1.69it/s][A
Training:  10%|█         | 9/89 [00:05<00:45,  1.74it/s][A
Training:  12%|█▏        | 11/89 [00:05<00:32,  2.41it/s][A
Training:  15%|█▍        | 13/89 [00:07<00:40,  1.87it/s][A
Training:  17%|█▋        | 15/89 [00:07<00:28,  2.56it/s][A
Training:  19%|█▉        | 17/89 [00:08<00:36,  1.95it/s][A
Training:  21%|██▏       | 19/89 [00:09<00:26,  2.65it/s][A
Training:  24%|██▎       | 21/89 [00:10<00:34,  1.97it/s][A
Training:  26%|██▌       | 23/89 [00:10<00:25,  2.61it/s][A
Training:  28%|██▊       | 25/89 [00:12<00:32,  1.98it/s][A
Training:  30%|███       | 27/89 [00:12<00:23,  2.63it/s][A
Training:  33%|███▎      | 29/89 [00:14<00:29,  2.01it/s][A
Training:  35%|███▍      | 31/89 [00:14<00:21,  2.69it/s][A
Training:  37%|███▋      | 33/89 [00

Epoch: 86/89 - Loss: 0.4495 - Accuracy: 0.9501



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:02<00:22,  2.02s/it][A
 33%|███▎      | 4/12 [00:02<00:03,  2.44it/s][A
 50%|█████     | 6/12 [00:03<00:03,  1.79it/s][A
100%|██████████| 12/12 [00:05<00:00,  2.28it/s][A
Epochs:  97%|█████████▋| 86/89 [1:06:20<02:17, 45.98s/it]

Val Loss: 0.5373 - Val Accuracy: 0.9365



Training:   0%|          | 0/89 [00:00<?, ?it/s][A
Training:   1%|          | 1/89 [00:02<03:01,  2.06s/it][A
Training:   4%|▍         | 4/89 [00:02<00:36,  2.36it/s][A
Training:   7%|▋         | 6/89 [00:03<00:49,  1.68it/s][A
Training:  10%|█         | 9/89 [00:05<00:47,  1.70it/s][A
Training:  13%|█▎        | 12/89 [00:05<00:28,  2.75it/s][A
Training:  16%|█▌        | 14/89 [00:07<00:36,  2.03it/s][A
Training:  19%|█▉        | 17/89 [00:09<00:37,  1.90it/s][A
Training:  22%|██▏       | 20/89 [00:09<00:24,  2.81it/s][A
Training:  25%|██▍       | 22/89 [00:10<00:32,  2.09it/s][A
Training:  28%|██▊       | 25/89 [00:12<00:32,  1.97it/s][A
Training:  31%|███▏      | 28/89 [00:12<00:21,  2.85it/s][A
Training:  34%|███▎      | 30/89 [00:14<00:28,  2.10it/s][A
Training:  37%|███▋      | 33/89 [00:16<00:28,  1.95it/s][A
Training:  40%|████      | 36/89 [00:16<00:18,  2.79it/s][A
Training:  43%|████▎     | 38/89 [00:17<00:24,  2.11it/s][A
Training:  46%|████▌     | 41/89 [00

Epoch: 87/89 - Loss: 0.4381 - Accuracy: 0.9505



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:21,  1.95s/it][A
 33%|███▎      | 4/12 [00:02<00:03,  2.49it/s][A
 50%|█████     | 6/12 [00:03<00:03,  1.78it/s][A
100%|██████████| 12/12 [00:05<00:00,  2.26it/s][A
Epochs:  98%|█████████▊| 87/89 [1:07:07<01:32, 46.04s/it]

Val Loss: 0.5642 - Val Accuracy: 0.9391



Training:   0%|          | 0/89 [00:00<?, ?it/s][A
Training:   1%|          | 1/89 [00:02<02:59,  2.04s/it][A
Training:   4%|▍         | 4/89 [00:02<00:35,  2.38it/s][A
Training:   7%|▋         | 6/89 [00:03<00:49,  1.67it/s][A
Training:  10%|█         | 9/89 [00:05<00:46,  1.72it/s][A
Training:  13%|█▎        | 12/89 [00:05<00:27,  2.77it/s][A
Training:  16%|█▌        | 14/89 [00:07<00:36,  2.04it/s][A
Training:  19%|█▉        | 17/89 [00:09<00:37,  1.91it/s][A
Training:  21%|██▏       | 19/89 [00:09<00:28,  2.50it/s][A
Training:  24%|██▎       | 21/89 [00:10<00:34,  1.95it/s][A
Training:  26%|██▌       | 23/89 [00:10<00:25,  2.60it/s][A
Training:  28%|██▊       | 25/89 [00:12<00:32,  1.95it/s][A
Training:  30%|███       | 27/89 [00:12<00:23,  2.64it/s][A
Training:  33%|███▎      | 29/89 [00:14<00:30,  1.97it/s][A
Training:  36%|███▌      | 32/89 [00:14<00:18,  3.05it/s][A
Training:  38%|███▊      | 34/89 [00:16<00:25,  2.16it/s][A
Training:  42%|████▏     | 37/89 [00

Epoch: 88/89 - Loss: 0.4435 - Accuracy: 0.9483



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:21,  1.94s/it][A
 33%|███▎      | 4/12 [00:02<00:03,  2.52it/s][A
 50%|█████     | 6/12 [00:03<00:03,  1.79it/s][A
100%|██████████| 12/12 [00:05<00:00,  2.27it/s][A
Epochs:  99%|█████████▉| 88/89 [1:07:53<00:46, 46.03s/it]

Val Loss: 0.5333 - Val Accuracy: 0.9400



Training:   0%|          | 0/89 [00:00<?, ?it/s][A
Training:   1%|          | 1/89 [00:02<03:05,  2.11s/it][A
Training:   3%|▎         | 3/89 [00:02<00:50,  1.71it/s][A
Training:   6%|▌         | 5/89 [00:03<01:00,  1.38it/s][A
Training:   9%|▉         | 8/89 [00:04<00:29,  2.75it/s][A
Training:  11%|█         | 10/89 [00:05<00:41,  1.92it/s][A
Training:  15%|█▍        | 13/89 [00:07<00:41,  1.84it/s][A
Training:  18%|█▊        | 16/89 [00:07<00:25,  2.81it/s][A
Training:  20%|██        | 18/89 [00:09<00:34,  2.05it/s][A
Training:  24%|██▎       | 21/89 [00:10<00:35,  1.93it/s][A
Training:  27%|██▋       | 24/89 [00:11<00:23,  2.82it/s][A
Training:  29%|██▉       | 26/89 [00:12<00:30,  2.10it/s][A
Training:  33%|███▎      | 29/89 [00:14<00:30,  1.97it/s][A
Training:  36%|███▌      | 32/89 [00:14<00:20,  2.83it/s][A
Training:  38%|███▊      | 34/89 [00:16<00:25,  2.17it/s][A
Training:  42%|████▏     | 37/89 [00:18<00:26,  1.97it/s][A
Training:  45%|████▍     | 40/89 [00

Epoch: 89/89 - Loss: 0.4462 - Accuracy: 0.9493



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:21,  1.96s/it][A
 33%|███▎      | 4/12 [00:02<00:03,  2.48it/s][A
 50%|█████     | 6/12 [00:03<00:03,  1.76it/s][A
100%|██████████| 12/12 [00:05<00:00,  2.26it/s][A
Epochs: 100%|██████████| 89/89 [1:08:39<00:00, 46.28s/it]
[32m[I 2023-12-15 02:38:50,913][0m Trial 2 finished with value: 0.9405519962310791 and parameters: {'learning_rate': 0.00014936159954798418, 'weight_decay': 0.000648991059773433, 'epsilon': 6.582574844800083e-09, 'batch_size': 157, 'epochs': 89}. Best is trial 2 with value: 0.9405519962310791.[0m


Val Loss: 0.5691 - Val Accuracy: 0.9406
Saving best model...
Learning rate: 0.0077757503835996266
Weight decay: 0.0007839042688318305
Epsilon: 4.069014959579636e-08
Batch size: 198
Number of epochs: 10


Epochs:   0%|          | 0/10 [00:00<?, ?it/s]
Training:   0%|          | 0/71 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/71 [00:02<03:00,  2.59s/it][A
Training:   4%|▍         | 3/71 [00:02<00:48,  1.41it/s][A
Training:   7%|▋         | 5/71 [00:04<00:58,  1.14it/s][A
Training:  10%|▉         | 7/71 [00:04<00:33,  1.89it/s][A
Training:  13%|█▎        | 9/71 [00:07<00:45,  1.37it/s][A
Training:  15%|█▌        | 11/71 [00:07<00:29,  2.02it/s][A
Training:  18%|█▊        | 13/71 [00:09<00:39,  1.46it/s][A
Training:  21%|██        | 15/71 [00:09<00:26,  2.08it/s][A
Training:  24%|██▍       | 17/71 [00:11<00:35,  1.51it/s][A
Training:  27%|██▋       | 19/71 [00:11<00:24,  2.12it/s][A
Training:  30%|██▉       | 21/71 [00:13<00:32,  1.55it/s][A
Training:  32%|███▏      | 23/71 [00:13<00:22,  2.15it/s][A
Training:  35%|███▌      | 25/71 [00:15<00:29,  1.55it/s][A
Training:  38%|███▊      | 27/71 [00:15<00:20,  2.14it/s][A
Training:  41%|████      | 29/71 [00:18<00:27,  1.54

Epoch: 1/10 - Loss: 15.4215 - Accuracy: 0.8333



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:02<00:19,  2.39s/it][A
 44%|████▍     | 4/9 [00:02<00:02,  2.04it/s][A
 67%|██████▋   | 6/9 [00:04<00:02,  1.45it/s][A
100%|██████████| 9/9 [00:05<00:00,  1.50it/s][A
Epochs:  10%|█         | 1/10 [00:46<06:56, 46.31s/it]

Val Loss: 13.9846 - Val Accuracy: 0.9029



Training:   0%|          | 0/71 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/71 [00:02<03:02,  2.60s/it][A
Training:   4%|▍         | 3/71 [00:02<00:48,  1.39it/s][A
Training:   7%|▋         | 5/71 [00:04<00:59,  1.11it/s][A
Training:  11%|█▏        | 8/71 [00:04<00:28,  2.22it/s][A
Training:  14%|█▍        | 10/71 [00:07<00:40,  1.52it/s][A
Training:  18%|█▊        | 13/71 [00:09<00:39,  1.46it/s][A
Training:  21%|██        | 15/71 [00:09<00:28,  1.97it/s][A
Training:  24%|██▍       | 17/71 [00:11<00:35,  1.50it/s][A
Training:  28%|██▊       | 20/71 [00:11<00:21,  2.33it/s][A
Training:  31%|███       | 22/71 [00:13<00:28,  1.69it/s][A
Training:  34%|███▍      | 24/71 [00:13<00:20,  2.26it/s][A
Training:  37%|███▋      | 26/71 [00:16<00:28,  1.59it/s][A
Training:  41%|████      | 29/71 [00:18<00:27,  1.53it/s][A
Training:  44%|████▎     | 31/71 [00:18<00:19,  2.01it/s][A
Training:  46%|████▋     | 33/71 [00:20<00:24,  1.53it/s][A
Training:  49%|████▉     | 35/71 [00

Epoch: 2/10 - Loss: 17.3070 - Accuracy: 0.8890



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:02<00:18,  2.31s/it][A
 44%|████▍     | 4/9 [00:02<00:02,  2.12it/s][A
 67%|██████▋   | 6/9 [00:04<00:02,  1.45it/s][A
100%|██████████| 9/9 [00:05<00:00,  1.51it/s][A
Epochs:  20%|██        | 2/10 [01:32<06:11, 46.42s/it]

Val Loss: 21.6467 - Val Accuracy: 0.7610



Training:   0%|          | 0/71 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/71 [00:02<03:05,  2.65s/it][A
Training:   4%|▍         | 3/71 [00:02<00:49,  1.38it/s][A
Training:   7%|▋         | 5/71 [00:04<01:00,  1.10it/s][A
Training:  11%|█▏        | 8/71 [00:05<00:28,  2.19it/s][A
Training:  14%|█▍        | 10/71 [00:07<00:39,  1.54it/s][A
Training:  18%|█▊        | 13/71 [00:09<00:39,  1.46it/s][A
Training:  23%|██▎       | 16/71 [00:09<00:24,  2.24it/s][A
Training:  25%|██▌       | 18/71 [00:11<00:32,  1.65it/s][A
Training:  30%|██▉       | 21/71 [00:13<00:32,  1.54it/s][A
Training:  32%|███▏      | 23/71 [00:13<00:23,  2.01it/s][A
Training:  35%|███▌      | 25/71 [00:15<00:29,  1.54it/s][A
Training:  39%|███▉      | 28/71 [00:16<00:18,  2.33it/s][A
Training:  42%|████▏     | 30/71 [00:18<00:24,  1.69it/s][A
Training:  46%|████▋     | 33/71 [00:20<00:23,  1.59it/s][A
Training:  49%|████▉     | 35/71 [00:20<00:17,  2.08it/s][A
Training:  52%|█████▏    | 37/71 [00

Epoch: 3/10 - Loss: 20.4174 - Accuracy: 0.8826



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:02<00:19,  2.41s/it][A
 44%|████▍     | 4/9 [00:02<00:02,  2.04it/s][A
 67%|██████▋   | 6/9 [00:04<00:02,  1.45it/s][A
100%|██████████| 9/9 [00:06<00:00,  1.49it/s][A
Epochs:  30%|███       | 3/10 [02:19<05:25, 46.51s/it]

Val Loss: 20.1715 - Val Accuracy: 0.8641



Training:   0%|          | 0/71 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/71 [00:02<02:52,  2.47s/it][A
Training:   4%|▍         | 3/71 [00:02<00:46,  1.46it/s][A
Training:   7%|▋         | 5/71 [00:04<00:58,  1.13it/s][A
Training:  11%|█▏        | 8/71 [00:04<00:28,  2.25it/s][A
Training:  14%|█▍        | 10/71 [00:06<00:39,  1.54it/s][A
Training:  18%|█▊        | 13/71 [00:09<00:39,  1.48it/s][A
Training:  23%|██▎       | 16/71 [00:09<00:24,  2.28it/s][A
Training:  25%|██▌       | 18/71 [00:11<00:32,  1.65it/s][A
Training:  30%|██▉       | 21/71 [00:13<00:32,  1.55it/s][A
Training:  34%|███▍      | 24/71 [00:13<00:20,  2.26it/s][A
Training:  37%|███▋      | 26/71 [00:15<00:26,  1.70it/s][A
Training:  41%|████      | 29/71 [00:18<00:27,  1.54it/s][A
Training:  45%|████▌     | 32/71 [00:18<00:17,  2.22it/s][A
Training:  48%|████▊     | 34/71 [00:20<00:21,  1.70it/s][A
Training:  51%|█████     | 36/71 [00:20<00:15,  2.21it/s][A
Training:  54%|█████▎    | 38/71 [00

Epoch: 4/10 - Loss: 23.6550 - Accuracy: 0.8899



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:02<00:19,  2.44s/it][A
 44%|████▍     | 4/9 [00:02<00:02,  2.01it/s][A
 67%|██████▋   | 6/9 [00:04<00:02,  1.44it/s][A
100%|██████████| 9/9 [00:06<00:00,  1.49it/s][A
Epochs:  40%|████      | 4/10 [03:05<04:38, 46.44s/it]

Val Loss: 23.1975 - Val Accuracy: 0.9174



Training:   0%|          | 0/71 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/71 [00:02<03:04,  2.64s/it][A
Training:   6%|▌         | 4/71 [00:02<00:36,  1.85it/s][A
Training:   8%|▊         | 6/71 [00:04<00:48,  1.33it/s][A
Training:  11%|█▏        | 8/71 [00:04<00:30,  2.07it/s][A
Training:  14%|█▍        | 10/71 [00:07<00:42,  1.43it/s][A
Training:  18%|█▊        | 13/71 [00:09<00:41,  1.41it/s][A
Training:  23%|██▎       | 16/71 [00:09<00:25,  2.19it/s][A
Training:  25%|██▌       | 18/71 [00:11<00:33,  1.59it/s][A
Training:  28%|██▊       | 20/71 [00:11<00:23,  2.14it/s][A
Training:  31%|███       | 22/71 [00:13<00:31,  1.56it/s][A
Training:  35%|███▌      | 25/71 [00:16<00:30,  1.50it/s][A
Training:  39%|███▉      | 28/71 [00:16<00:19,  2.23it/s][A
Training:  42%|████▏     | 30/71 [00:18<00:24,  1.66it/s][A
Training:  46%|████▋     | 33/71 [00:20<00:24,  1.53it/s][A
Training:  51%|█████     | 36/71 [00:20<00:15,  2.21it/s][A
Training:  54%|█████▎    | 38/71 [00

Epoch: 5/10 - Loss: 24.9051 - Accuracy: 0.9074



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:02<00:18,  2.31s/it][A
 33%|███▎      | 3/9 [00:02<00:03,  1.56it/s][A
 56%|█████▌    | 5/9 [00:04<00:03,  1.23it/s][A
100%|██████████| 9/9 [00:06<00:00,  1.49it/s][A
Epochs:  50%|█████     | 5/10 [03:52<03:52, 46.55s/it]

Val Loss: 25.5787 - Val Accuracy: 0.9110



Training:   0%|          | 0/71 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/71 [00:02<02:57,  2.53s/it][A
Training:   4%|▍         | 3/71 [00:02<00:47,  1.43it/s][A
Training:   7%|▋         | 5/71 [00:04<00:59,  1.10it/s][A
Training:  11%|█▏        | 8/71 [00:04<00:28,  2.19it/s][A
Training:  14%|█▍        | 10/71 [00:07<00:39,  1.54it/s][A
Training:  18%|█▊        | 13/71 [00:09<00:39,  1.46it/s][A
Training:  21%|██        | 15/71 [00:09<00:28,  1.98it/s][A
Training:  24%|██▍       | 17/71 [00:11<00:35,  1.52it/s][A
Training:  27%|██▋       | 19/71 [00:11<00:25,  2.08it/s][A
Training:  30%|██▉       | 21/71 [00:13<00:32,  1.54it/s][A
Training:  34%|███▍      | 24/71 [00:13<00:19,  2.40it/s][A
Training:  37%|███▋      | 26/71 [00:15<00:26,  1.68it/s][A
Training:  41%|████      | 29/71 [00:18<00:27,  1.55it/s][A
Training:  44%|████▎     | 31/71 [00:18<00:19,  2.04it/s][A
Training:  46%|████▋     | 33/71 [00:20<00:24,  1.56it/s][A
Training:  51%|█████     | 36/71 [00

Epoch: 6/10 - Loss: 23.5188 - Accuracy: 0.9306



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:02<00:18,  2.28s/it][A
 44%|████▍     | 4/9 [00:02<00:02,  2.12it/s][A
 67%|██████▋   | 6/9 [00:04<00:02,  1.44it/s][A
100%|██████████| 9/9 [00:05<00:00,  1.50it/s][A
Epochs:  60%|██████    | 6/10 [04:38<03:06, 46.51s/it]

Val Loss: 28.1695 - Val Accuracy: 0.9193



Training:   0%|          | 0/71 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/71 [00:02<02:57,  2.53s/it][A
Training:   6%|▌         | 4/71 [00:02<00:34,  1.94it/s][A
Training:   8%|▊         | 6/71 [00:04<00:49,  1.31it/s][A
Training:  13%|█▎        | 9/71 [00:06<00:45,  1.35it/s][A
Training:  17%|█▋        | 12/71 [00:07<00:26,  2.19it/s][A
Training:  20%|█▉        | 14/71 [00:09<00:35,  1.60it/s][A
Training:  24%|██▍       | 17/71 [00:11<00:36,  1.50it/s][A
Training:  28%|██▊       | 20/71 [00:11<00:22,  2.22it/s][A
Training:  31%|███       | 22/71 [00:13<00:29,  1.67it/s][A
Training:  34%|███▍      | 24/71 [00:13<00:21,  2.20it/s][A
Training:  37%|███▋      | 26/71 [00:16<00:28,  1.57it/s][A
Training:  41%|████      | 29/71 [00:18<00:28,  1.47it/s][A
Training:  45%|████▌     | 32/71 [00:18<00:17,  2.17it/s][A
Training:  48%|████▊     | 34/71 [00:20<00:22,  1.65it/s][A
Training:  52%|█████▏    | 37/71 [00:22<00:22,  1.54it/s][A
Training:  56%|█████▋    | 40/71 [00

Epoch: 7/10 - Loss: 22.8976 - Accuracy: 0.9251



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:02<00:18,  2.34s/it][A
 33%|███▎      | 3/9 [00:02<00:03,  1.55it/s][A
 56%|█████▌    | 5/9 [00:04<00:03,  1.22it/s][A
100%|██████████| 9/9 [00:06<00:00,  1.48it/s][A
Epochs:  70%|███████   | 7/10 [05:25<02:19, 46.65s/it]

Val Loss: 21.9656 - Val Accuracy: 0.9041



Training:   0%|          | 0/71 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/71 [00:02<03:04,  2.63s/it][A
Training:   4%|▍         | 3/71 [00:02<00:49,  1.37it/s][A
Training:   7%|▋         | 5/71 [00:04<00:59,  1.11it/s][A
Training:  11%|█▏        | 8/71 [00:05<00:28,  2.21it/s][A
Training:  14%|█▍        | 10/71 [00:07<00:39,  1.54it/s][A
Training:  18%|█▊        | 13/71 [00:09<00:39,  1.45it/s][A
Training:  21%|██        | 15/71 [00:09<00:28,  1.97it/s][A
Training:  24%|██▍       | 17/71 [00:11<00:36,  1.49it/s][A
Training:  28%|██▊       | 20/71 [00:11<00:21,  2.32it/s][A
Training:  31%|███       | 22/71 [00:13<00:29,  1.68it/s][A
Training:  35%|███▌      | 25/71 [00:16<00:29,  1.55it/s][A
Training:  39%|███▉      | 28/71 [00:16<00:19,  2.26it/s][A
Training:  42%|████▏     | 30/71 [00:18<00:24,  1.70it/s][A
Training:  46%|████▋     | 33/71 [00:20<00:23,  1.59it/s][A
Training:  49%|████▉     | 35/71 [00:20<00:17,  2.05it/s][A
Training:  52%|█████▏    | 37/71 [00

Epoch: 8/10 - Loss: 22.3497 - Accuracy: 0.9284



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:02<00:18,  2.34s/it][A
 44%|████▍     | 4/9 [00:02<00:02,  2.09it/s][A
 67%|██████▋   | 6/9 [00:04<00:02,  1.43it/s][A
100%|██████████| 9/9 [00:06<00:00,  1.49it/s][A
Epochs:  80%|████████  | 8/10 [06:12<01:33, 46.67s/it]

Val Loss: 22.7717 - Val Accuracy: 0.9177



Training:   0%|          | 0/71 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/71 [00:02<03:00,  2.58s/it][A
Training:   4%|▍         | 3/71 [00:02<00:48,  1.42it/s][A
Training:   7%|▋         | 5/71 [00:04<00:59,  1.11it/s][A
Training:  10%|▉         | 7/71 [00:04<00:34,  1.85it/s][A
Training:  13%|█▎        | 9/71 [00:07<00:45,  1.36it/s][A
Training:  15%|█▌        | 11/71 [00:07<00:29,  2.02it/s][A
Training:  18%|█▊        | 13/71 [00:09<00:38,  1.49it/s][A
Training:  21%|██        | 15/71 [00:09<00:26,  2.11it/s][A
Training:  24%|██▍       | 17/71 [00:11<00:35,  1.52it/s][A
Training:  27%|██▋       | 19/71 [00:11<00:24,  2.09it/s][A
Training:  30%|██▉       | 21/71 [00:13<00:32,  1.53it/s][A
Training:  32%|███▏      | 23/71 [00:13<00:22,  2.12it/s][A
Training:  35%|███▌      | 25/71 [00:15<00:29,  1.56it/s][A
Training:  38%|███▊      | 27/71 [00:16<00:20,  2.14it/s][A
Training:  41%|████      | 29/71 [00:18<00:26,  1.58it/s][A
Training:  44%|████▎     | 31/71 [00:

Epoch: 9/10 - Loss: 23.0768 - Accuracy: 0.9299



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:02<00:19,  2.40s/it][A
 33%|███▎      | 3/9 [00:02<00:03,  1.51it/s][A
 56%|█████▌    | 5/9 [00:04<00:03,  1.19it/s][A
100%|██████████| 9/9 [00:06<00:00,  1.46it/s][A
Epochs:  90%|█████████ | 9/10 [06:59<00:46, 46.66s/it]

Val Loss: 23.6893 - Val Accuracy: 0.9206



Training:   0%|          | 0/71 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/71 [00:02<03:04,  2.63s/it][A
Training:   4%|▍         | 3/71 [00:02<00:49,  1.38it/s][A
Training:   7%|▋         | 5/71 [00:04<00:58,  1.13it/s][A
Training:  11%|█▏        | 8/71 [00:04<00:28,  2.24it/s][A
Training:  14%|█▍        | 10/71 [00:07<00:39,  1.53it/s][A
Training:  17%|█▋        | 12/71 [00:07<00:27,  2.17it/s][A
Training:  20%|█▉        | 14/71 [00:09<00:37,  1.54it/s][A
Training:  24%|██▍       | 17/71 [00:11<00:36,  1.47it/s][A
Training:  27%|██▋       | 19/71 [00:11<00:26,  1.97it/s][A
Training:  30%|██▉       | 21/71 [00:13<00:32,  1.52it/s][A
Training:  32%|███▏      | 23/71 [00:13<00:23,  2.05it/s][A
Training:  35%|███▌      | 25/71 [00:15<00:29,  1.53it/s][A
Training:  37%|███▋      | 26/71 [00:16<00:25,  1.74it/s][A
Training:  41%|████      | 29/71 [00:18<00:26,  1.60it/s][A
Training:  42%|████▏     | 30/71 [00:18<00:22,  1.85it/s][A
Training:  46%|████▋     | 33/71 [00

Epoch: 10/10 - Loss: 24.3207 - Accuracy: 0.9294



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:02<00:18,  2.30s/it][A
 33%|███▎      | 3/9 [00:02<00:03,  1.58it/s][A
 56%|█████▌    | 5/9 [00:04<00:03,  1.25it/s][A
100%|██████████| 9/9 [00:05<00:00,  1.50it/s][A
Epochs: 100%|██████████| 10/10 [07:46<00:00, 46.61s/it]
[32m[I 2023-12-15 02:46:37,207][0m Trial 3 finished with value: 0.9292545318603516 and parameters: {'learning_rate': 0.0077757503835996266, 'weight_decay': 0.0007839042688318305, 'epsilon': 4.069014959579636e-08, 'batch_size': 198, 'epochs': 10}. Best is trial 2 with value: 0.9405519962310791.[0m


Val Loss: 22.4919 - Val Accuracy: 0.9293
Learning rate: 0.005636386581730127
Weight decay: 0.002103450540847856
Epsilon: 9.093448187942482e-09
Batch size: 216
Number of epochs: 77


Epochs:   0%|          | 0/77 [00:00<?, ?it/s]
Training:   0%|          | 0/65 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/65 [00:02<02:54,  2.73s/it][A
Training:   5%|▍         | 3/65 [00:02<00:46,  1.33it/s][A
Training:   8%|▊         | 5/65 [00:05<00:58,  1.02it/s][A
Training:  12%|█▏        | 8/65 [00:05<00:27,  2.04it/s][A
Training:  15%|█▌        | 10/65 [00:07<00:38,  1.42it/s][A
Training:  20%|██        | 13/65 [00:10<00:39,  1.32it/s][A
Training:  25%|██▍       | 16/65 [00:10<00:24,  2.03it/s][A
Training:  28%|██▊       | 18/65 [00:12<00:30,  1.52it/s][A
Training:  31%|███       | 20/65 [00:12<00:22,  2.02it/s][A
Training:  34%|███▍      | 22/65 [00:14<00:29,  1.46it/s][A
Training:  37%|███▋      | 24/65 [00:15<00:20,  1.98it/s][A
Training:  40%|████      | 26/65 [00:17<00:26,  1.45it/s][A
Training:  45%|████▍     | 29/65 [00:19<00:26,  1.35it/s][A
Training:  49%|████▉     | 32/65 [00:20<00:16,  2.02it/s][A
Training:  52%|█████▏    | 34/65 [00:22<00:20,  1.5

Epoch: 1/77 - Loss: 9.0907 - Accuracy: 0.8218



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:02<00:20,  2.57s/it][A
 44%|████▍     | 4/9 [00:02<00:02,  1.90it/s][A
 67%|██████▋   | 6/9 [00:04<00:02,  1.31it/s][A
100%|██████████| 9/9 [00:05<00:00,  1.78it/s][A
Epochs:   1%|▏         | 1/77 [00:46<58:17, 46.02s/it]

Val Loss: 10.5640 - Val Accuracy: 0.5848



Training:   0%|          | 0/65 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/65 [00:02<03:02,  2.85s/it][A
Training:   5%|▍         | 3/65 [00:02<00:48,  1.29it/s][A
Training:   8%|▊         | 5/65 [00:05<00:57,  1.04it/s][A
Training:  12%|█▏        | 8/65 [00:05<00:27,  2.08it/s][A
Training:  15%|█▌        | 10/65 [00:07<00:38,  1.42it/s][A
Training:  18%|█▊        | 12/65 [00:07<00:26,  2.02it/s][A
Training:  22%|██▏       | 14/65 [00:10<00:35,  1.42it/s][A
Training:  26%|██▌       | 17/65 [00:12<00:35,  1.36it/s][A
Training:  29%|██▉       | 19/65 [00:12<00:25,  1.81it/s][A
Training:  32%|███▏      | 21/65 [00:14<00:31,  1.38it/s][A
Training:  37%|███▋      | 24/65 [00:15<00:19,  2.13it/s][A
Training:  40%|████      | 26/65 [00:17<00:25,  1.54it/s][A
Training:  45%|████▍     | 29/65 [00:19<00:25,  1.43it/s][A
Training:  49%|████▉     | 32/65 [00:19<00:15,  2.09it/s][A
Training:  52%|█████▏    | 34/65 [00:22<00:19,  1.56it/s][A
Training:  57%|█████▋    | 37/65 [00

Epoch: 2/77 - Loss: 8.6326 - Accuracy: 0.8660



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:02<00:20,  2.51s/it][A
 33%|███▎      | 3/9 [00:02<00:04,  1.43it/s][A
 56%|█████▌    | 5/9 [00:04<00:03,  1.10it/s][A
100%|██████████| 9/9 [00:05<00:00,  1.77it/s][A
Epochs:   3%|▎         | 2/77 [01:31<57:26, 45.95s/it]

Val Loss: 8.3362 - Val Accuracy: 0.9190



Training:   0%|          | 0/65 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/65 [00:02<02:56,  2.75s/it][A
Training:   5%|▍         | 3/65 [00:02<00:46,  1.32it/s][A
Training:   8%|▊         | 5/65 [00:05<00:57,  1.05it/s][A
Training:  11%|█         | 7/65 [00:05<00:33,  1.75it/s][A
Training:  14%|█▍        | 9/65 [00:07<00:44,  1.26it/s][A
Training:  17%|█▋        | 11/65 [00:07<00:28,  1.86it/s][A
Training:  20%|██        | 13/65 [00:09<00:38,  1.35it/s][A
Training:  23%|██▎       | 15/65 [00:10<00:25,  1.93it/s][A
Training:  26%|██▌       | 17/65 [00:12<00:34,  1.38it/s][A
Training:  29%|██▉       | 19/65 [00:12<00:23,  1.93it/s][A
Training:  32%|███▏      | 21/65 [00:14<00:30,  1.42it/s][A
Training:  35%|███▌      | 23/65 [00:14<00:21,  1.97it/s][A
Training:  38%|███▊      | 25/65 [00:17<00:28,  1.39it/s][A
Training:  42%|████▏     | 27/65 [00:17<00:19,  1.91it/s][A
Training:  45%|████▍     | 29/65 [00:19<00:25,  1.41it/s][A
Training:  48%|████▊     | 31/65 [00:

Epoch: 3/77 - Loss: 9.3574 - Accuracy: 0.9049



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:02<00:20,  2.54s/it][A
 44%|████▍     | 4/9 [00:02<00:02,  1.93it/s][A
 67%|██████▋   | 6/9 [00:04<00:02,  1.35it/s][A
100%|██████████| 9/9 [00:04<00:00,  1.82it/s][A
Epochs:   4%|▍         | 3/77 [02:17<56:33, 45.86s/it]

Val Loss: 9.8286 - Val Accuracy: 0.9213



Training:   0%|          | 0/65 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/65 [00:02<03:00,  2.82s/it][A
Training:   6%|▌         | 4/65 [00:02<00:34,  1.75it/s][A
Training:   9%|▉         | 6/65 [00:05<00:48,  1.21it/s][A
Training:  14%|█▍        | 9/65 [00:07<00:45,  1.23it/s][A
Training:  18%|█▊        | 12/65 [00:07<00:26,  2.00it/s][A
Training:  22%|██▏       | 14/65 [00:10<00:34,  1.47it/s][A
Training:  26%|██▌       | 17/65 [00:12<00:35,  1.36it/s][A
Training:  31%|███       | 20/65 [00:12<00:22,  2.02it/s][A
Training:  34%|███▍      | 22/65 [00:14<00:28,  1.53it/s][A
Training:  37%|███▋      | 24/65 [00:15<00:20,  2.02it/s][A
Training:  40%|████      | 26/65 [00:17<00:26,  1.48it/s][A
Training:  43%|████▎     | 28/65 [00:17<00:18,  2.00it/s][A
Training:  46%|████▌     | 30/65 [00:19<00:24,  1.42it/s][A
Training:  49%|████▉     | 32/65 [00:20<00:16,  1.95it/s][A
Training:  52%|█████▏    | 34/65 [00:22<00:21,  1.44it/s][A
Training:  55%|█████▌    | 36/65 [00

Epoch: 4/77 - Loss: 10.0264 - Accuracy: 0.9099



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:02<00:20,  2.54s/it][A
 33%|███▎      | 3/9 [00:02<00:04,  1.42it/s][A
 56%|█████▌    | 5/9 [00:04<00:03,  1.13it/s][A
100%|██████████| 9/9 [00:05<00:00,  1.79it/s][A
Epochs:   5%|▌         | 4/77 [03:03<55:49, 45.89s/it]

Val Loss: 11.0771 - Val Accuracy: 0.9146



Training:   0%|          | 0/65 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/65 [00:02<02:57,  2.77s/it][A
Training:   5%|▍         | 3/65 [00:02<00:47,  1.32it/s][A
Training:   8%|▊         | 5/65 [00:05<00:56,  1.05it/s][A
Training:  11%|█         | 7/65 [00:05<00:33,  1.75it/s][A
Training:  14%|█▍        | 9/65 [00:07<00:44,  1.26it/s][A
Training:  17%|█▋        | 11/65 [00:07<00:28,  1.87it/s][A
Training:  20%|██        | 13/65 [00:09<00:38,  1.36it/s][A
Training:  23%|██▎       | 15/65 [00:10<00:25,  1.93it/s][A
Training:  26%|██▌       | 17/65 [00:12<00:34,  1.39it/s][A
Training:  28%|██▊       | 18/65 [00:12<00:28,  1.66it/s][A
Training:  32%|███▏      | 21/65 [00:14<00:29,  1.48it/s][A
Training:  35%|███▌      | 23/65 [00:14<00:20,  2.03it/s][A
Training:  38%|███▊      | 25/65 [00:17<00:27,  1.43it/s][A
Training:  42%|████▏     | 27/65 [00:17<00:19,  1.97it/s][A
Training:  45%|████▍     | 29/65 [00:19<00:25,  1.43it/s][A
Training:  49%|████▉     | 32/65 [00:

Epoch: 5/77 - Loss: 11.1997 - Accuracy: 0.9120



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:02<00:20,  2.60s/it][A
 33%|███▎      | 3/9 [00:02<00:04,  1.41it/s][A
 56%|█████▌    | 5/9 [00:04<00:03,  1.11it/s][A
100%|██████████| 9/9 [00:05<00:00,  1.77it/s][A
Epochs:   6%|▋         | 5/77 [03:49<55:01, 45.86s/it]

Val Loss: 13.3791 - Val Accuracy: 0.9218



Training:   0%|          | 0/65 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/65 [00:02<02:59,  2.80s/it][A
Training:   5%|▍         | 3/65 [00:02<00:48,  1.29it/s][A
Training:   8%|▊         | 5/65 [00:05<00:57,  1.04it/s][A
Training:  11%|█         | 7/65 [00:05<00:33,  1.74it/s][A
Training:  14%|█▍        | 9/65 [00:07<00:45,  1.24it/s][A
Training:  17%|█▋        | 11/65 [00:07<00:29,  1.84it/s][A
Training:  20%|██        | 13/65 [00:10<00:39,  1.33it/s][A
Training:  25%|██▍       | 16/65 [00:10<00:22,  2.18it/s][A
Training:  28%|██▊       | 18/65 [00:12<00:30,  1.55it/s][A
Training:  31%|███       | 20/65 [00:12<00:21,  2.11it/s][A
Training:  34%|███▍      | 22/65 [00:14<00:29,  1.47it/s][A
Training:  38%|███▊      | 25/65 [00:17<00:28,  1.41it/s][A
Training:  43%|████▎     | 28/65 [00:17<00:17,  2.11it/s][A
Training:  46%|████▌     | 30/65 [00:19<00:23,  1.52it/s][A
Training:  51%|█████     | 33/65 [00:22<00:22,  1.44it/s][A
Training:  54%|█████▍    | 35/65 [00:

Epoch: 6/77 - Loss: 11.7744 - Accuracy: 0.9086



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:02<00:20,  2.56s/it][A
 33%|███▎      | 3/9 [00:02<00:04,  1.42it/s][A
 56%|█████▌    | 5/9 [00:04<00:03,  1.14it/s][A
100%|██████████| 9/9 [00:04<00:00,  1.81it/s][A
Epochs:   8%|▊         | 6/77 [04:35<54:13, 45.83s/it]

Val Loss: 11.8294 - Val Accuracy: 0.8985



Training:   0%|          | 0/65 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/65 [00:02<03:01,  2.83s/it][A
Training:   5%|▍         | 3/65 [00:02<00:48,  1.29it/s][A
Training:   8%|▊         | 5/65 [00:05<00:58,  1.03it/s][A
Training:  12%|█▏        | 8/65 [00:05<00:27,  2.06it/s][A
Training:  15%|█▌        | 10/65 [00:07<00:39,  1.38it/s][A
Training:  18%|█▊        | 12/65 [00:07<00:26,  1.97it/s][A
Training:  22%|██▏       | 14/65 [00:10<00:35,  1.42it/s][A
Training:  26%|██▌       | 17/65 [00:12<00:35,  1.34it/s][A
Training:  29%|██▉       | 19/65 [00:12<00:25,  1.80it/s][A
Training:  32%|███▏      | 21/65 [00:14<00:31,  1.39it/s][A
Training:  37%|███▋      | 24/65 [00:15<00:19,  2.15it/s][A
Training:  40%|████      | 26/65 [00:17<00:25,  1.51it/s][A
Training:  45%|████▍     | 29/65 [00:19<00:25,  1.42it/s][A
Training:  49%|████▉     | 32/65 [00:20<00:15,  2.08it/s][A
Training:  52%|█████▏    | 34/65 [00:22<00:20,  1.54it/s][A
Training:  57%|█████▋    | 37/65 [00

Epoch: 7/77 - Loss: 11.8230 - Accuracy: 0.9037



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:02<00:21,  2.64s/it][A
 33%|███▎      | 3/9 [00:02<00:04,  1.38it/s][A
 56%|█████▌    | 5/9 [00:04<00:03,  1.10it/s][A
100%|██████████| 9/9 [00:05<00:00,  1.76it/s][A
Epochs:   9%|▉         | 7/77 [05:21<53:31, 45.88s/it]

Val Loss: 11.3209 - Val Accuracy: 0.9372



Training:   0%|          | 0/65 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/65 [00:02<03:02,  2.85s/it][A
Training:   5%|▍         | 3/65 [00:02<00:48,  1.29it/s][A
Training:   8%|▊         | 5/65 [00:05<00:57,  1.05it/s][A
Training:  11%|█         | 7/65 [00:05<00:33,  1.74it/s][A
Training:  14%|█▍        | 9/65 [00:07<00:44,  1.25it/s][A
Training:  17%|█▋        | 11/65 [00:07<00:29,  1.86it/s][A
Training:  20%|██        | 13/65 [00:10<00:38,  1.36it/s][A
Training:  23%|██▎       | 15/65 [00:10<00:25,  1.94it/s][A
Training:  26%|██▌       | 17/65 [00:12<00:34,  1.38it/s][A
Training:  29%|██▉       | 19/65 [00:12<00:23,  1.93it/s][A
Training:  32%|███▏      | 21/65 [00:14<00:31,  1.42it/s][A
Training:  35%|███▌      | 23/65 [00:14<00:21,  1.97it/s][A
Training:  38%|███▊      | 25/65 [00:17<00:28,  1.42it/s][A
Training:  42%|████▏     | 27/65 [00:17<00:19,  1.96it/s][A
Training:  45%|████▍     | 29/65 [00:19<00:25,  1.42it/s][A
Training:  48%|████▊     | 31/65 [00:

Epoch: 8/77 - Loss: 12.4005 - Accuracy: 0.9246



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:02<00:21,  2.68s/it][A
 44%|████▍     | 4/9 [00:02<00:02,  1.84it/s][A
 67%|██████▋   | 6/9 [00:04<00:02,  1.32it/s][A
100%|██████████| 9/9 [00:05<00:00,  1.78it/s][A
Epochs:  10%|█         | 8/77 [06:06<52:44, 45.86s/it]

Val Loss: 15.5396 - Val Accuracy: 0.9017



Training:   0%|          | 0/65 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/65 [00:02<03:01,  2.83s/it][A
Training:   5%|▍         | 3/65 [00:02<00:48,  1.29it/s][A
Training:   8%|▊         | 5/65 [00:05<00:57,  1.04it/s][A
Training:  11%|█         | 7/65 [00:05<00:33,  1.73it/s][A
Training:  14%|█▍        | 9/65 [00:07<00:45,  1.24it/s][A
Training:  18%|█▊        | 12/65 [00:07<00:24,  2.14it/s][A
Training:  22%|██▏       | 14/65 [00:10<00:33,  1.51it/s][A
Training:  26%|██▌       | 17/65 [00:12<00:34,  1.38it/s][A
Training:  29%|██▉       | 19/65 [00:12<00:24,  1.84it/s][A
Training:  32%|███▏      | 21/65 [00:14<00:30,  1.42it/s][A
Training:  37%|███▋      | 24/65 [00:15<00:18,  2.18it/s][A
Training:  40%|████      | 26/65 [00:17<00:25,  1.52it/s][A
Training:  45%|████▍     | 29/65 [00:19<00:25,  1.43it/s][A
Training:  48%|████▊     | 31/65 [00:19<00:18,  1.88it/s][A
Training:  51%|█████     | 33/65 [00:22<00:22,  1.40it/s][A
Training:  55%|█████▌    | 36/65 [00:

Epoch: 9/77 - Loss: 12.7664 - Accuracy: 0.9305



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:02<00:20,  2.51s/it][A
 33%|███▎      | 3/9 [00:02<00:04,  1.45it/s][A
 56%|█████▌    | 5/9 [00:04<00:03,  1.16it/s][A
100%|██████████| 9/9 [00:04<00:00,  1.82it/s][A
Epochs:  12%|█▏        | 9/77 [06:52<52:00, 45.89s/it]

Val Loss: 11.8361 - Val Accuracy: 0.9306



Training:   0%|          | 0/65 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/65 [00:02<02:49,  2.66s/it][A
Training:   5%|▍         | 3/65 [00:02<00:45,  1.36it/s][A
Training:   8%|▊         | 5/65 [00:05<00:57,  1.05it/s][A
Training:   9%|▉         | 6/65 [00:05<00:43,  1.36it/s][A
Training:  14%|█▍        | 9/65 [00:07<00:41,  1.34it/s][A
Training:  15%|█▌        | 10/65 [00:07<00:34,  1.61it/s][A
Training:  20%|██        | 13/65 [00:10<00:36,  1.43it/s][A
Training:  22%|██▏       | 14/65 [00:10<00:30,  1.69it/s][A
Training:  26%|██▌       | 17/65 [00:12<00:31,  1.52it/s][A
Training:  28%|██▊       | 18/65 [00:12<00:26,  1.77it/s][A
Training:  32%|███▏      | 21/65 [00:14<00:29,  1.51it/s][A
Training:  35%|███▌      | 23/65 [00:14<00:20,  2.06it/s][A
Training:  38%|███▊      | 25/65 [00:17<00:26,  1.49it/s][A
Training:  40%|████      | 26/65 [00:17<00:22,  1.75it/s][A
Training:  43%|████▎     | 28/65 [00:17<00:14,  2.49it/s][A
Training:  46%|████▌     | 30/65 [00:

Epoch: 10/77 - Loss: 12.4532 - Accuracy: 0.9312



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:02<00:20,  2.50s/it][A
 44%|████▍     | 4/9 [00:02<00:02,  1.96it/s][A
 67%|██████▋   | 6/9 [00:04<00:02,  1.30it/s][A
100%|██████████| 9/9 [00:05<00:00,  1.79it/s][A
Epochs:  13%|█▎        | 10/77 [07:38<51:12, 45.87s/it]

Val Loss: 12.8663 - Val Accuracy: 0.9326



Training:   0%|          | 0/65 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/65 [00:02<03:06,  2.92s/it][A
Training:   5%|▍         | 3/65 [00:03<00:49,  1.26it/s][A
Training:   8%|▊         | 5/65 [00:05<00:57,  1.04it/s][A
Training:  11%|█         | 7/65 [00:05<00:33,  1.73it/s][A
Training:  14%|█▍        | 9/65 [00:07<00:45,  1.23it/s][A
Training:  17%|█▋        | 11/65 [00:07<00:29,  1.83it/s][A
Training:  20%|██        | 13/65 [00:10<00:38,  1.34it/s][A
Training:  23%|██▎       | 15/65 [00:10<00:26,  1.91it/s][A
Training:  26%|██▌       | 17/65 [00:12<00:35,  1.37it/s][A
Training:  29%|██▉       | 19/65 [00:12<00:24,  1.91it/s][A
Training:  32%|███▏      | 21/65 [00:15<00:31,  1.40it/s][A
Training:  37%|███▋      | 24/65 [00:15<00:18,  2.23it/s][A
Training:  40%|████      | 26/65 [00:17<00:25,  1.53it/s][A
Training:  45%|████▍     | 29/65 [00:19<00:25,  1.43it/s][A
Training:  49%|████▉     | 32/65 [00:20<00:15,  2.11it/s][A
Training:  52%|█████▏    | 34/65 [00:

Epoch: 11/77 - Loss: 12.2597 - Accuracy: 0.9265



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:02<00:20,  2.58s/it][A
 44%|████▍     | 4/9 [00:02<00:02,  1.90it/s][A
 67%|██████▋   | 6/9 [00:04<00:02,  1.32it/s][A
100%|██████████| 9/9 [00:05<00:00,  1.79it/s][A
Epochs:  14%|█▍        | 11/77 [08:24<50:29, 45.91s/it]

Val Loss: 11.9062 - Val Accuracy: 0.9012



Training:   0%|          | 0/65 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/65 [00:02<03:00,  2.82s/it][A
Training:   5%|▍         | 3/65 [00:02<00:47,  1.29it/s][A
Training:   8%|▊         | 5/65 [00:05<00:57,  1.04it/s][A
Training:  11%|█         | 7/65 [00:05<00:33,  1.74it/s][A
Training:  14%|█▍        | 9/65 [00:07<00:45,  1.24it/s][A
Training:  18%|█▊        | 12/65 [00:07<00:24,  2.13it/s][A
Training:  22%|██▏       | 14/65 [00:10<00:34,  1.49it/s][A
Training:  26%|██▌       | 17/65 [00:12<00:34,  1.38it/s][A
Training:  31%|███       | 20/65 [00:12<00:21,  2.08it/s][A
Training:  34%|███▍      | 22/65 [00:14<00:27,  1.55it/s][A
Training:  38%|███▊      | 25/65 [00:17<00:27,  1.43it/s][A
Training:  43%|████▎     | 28/65 [00:17<00:17,  2.08it/s][A
Training:  46%|████▌     | 30/65 [00:19<00:22,  1.55it/s][A
Training:  51%|█████     | 33/65 [00:22<00:22,  1.44it/s][A
Training:  54%|█████▍    | 35/65 [00:22<00:16,  1.86it/s][A
Training:  57%|█████▋    | 37/65 [00:

Epoch: 12/77 - Loss: 12.4831 - Accuracy: 0.9265



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:02<00:20,  2.61s/it][A
 33%|███▎      | 3/9 [00:02<00:04,  1.39it/s][A
 56%|█████▌    | 5/9 [00:04<00:03,  1.14it/s][A
100%|██████████| 9/9 [00:05<00:00,  1.80it/s][A
Epochs:  16%|█▌        | 12/77 [09:10<49:42, 45.88s/it]

Val Loss: 11.0110 - Val Accuracy: 0.9306



Training:   0%|          | 0/65 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/65 [00:02<02:59,  2.81s/it][A
Training:   6%|▌         | 4/65 [00:02<00:34,  1.75it/s][A
Training:   9%|▉         | 6/65 [00:05<00:48,  1.21it/s][A
Training:  12%|█▏        | 8/65 [00:05<00:30,  1.87it/s][A
Training:  15%|█▌        | 10/65 [00:07<00:41,  1.33it/s][A
Training:  20%|██        | 13/65 [00:10<00:39,  1.30it/s][A
Training:  23%|██▎       | 15/65 [00:10<00:28,  1.78it/s][A
Training:  26%|██▌       | 17/65 [00:12<00:36,  1.33it/s][A
Training:  31%|███       | 20/65 [00:12<00:21,  2.08it/s][A
Training:  34%|███▍      | 22/65 [00:15<00:28,  1.52it/s][A
Training:  37%|███▋      | 24/65 [00:15<00:20,  2.04it/s][A
Training:  40%|████      | 26/65 [00:17<00:26,  1.46it/s][A
Training:  45%|████▍     | 29/65 [00:19<00:25,  1.40it/s][A
Training:  48%|████▊     | 31/65 [00:19<00:18,  1.84it/s][A
Training:  51%|█████     | 33/65 [00:22<00:23,  1.38it/s][A
Training:  54%|█████▍    | 35/65 [00

Epoch: 13/77 - Loss: 12.3015 - Accuracy: 0.9359



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:02<00:19,  2.49s/it][A
 33%|███▎      | 3/9 [00:02<00:04,  1.46it/s][A
 56%|█████▌    | 5/9 [00:04<00:03,  1.13it/s][A
100%|██████████| 9/9 [00:04<00:00,  1.80it/s][A
Epochs:  17%|█▋        | 13/77 [09:56<48:57, 45.91s/it]

Val Loss: 11.9977 - Val Accuracy: 0.9317



Training:   0%|          | 0/65 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/65 [00:02<02:58,  2.78s/it][A
Training:   5%|▍         | 3/65 [00:02<00:47,  1.32it/s][A
Training:   8%|▊         | 5/65 [00:05<00:57,  1.04it/s][A
Training:  12%|█▏        | 8/65 [00:05<00:27,  2.06it/s][A
Training:  15%|█▌        | 10/65 [00:07<00:38,  1.42it/s][A
Training:  18%|█▊        | 12/65 [00:07<00:26,  2.02it/s][A
Training:  22%|██▏       | 14/65 [00:10<00:36,  1.42it/s][A
Training:  25%|██▍       | 16/65 [00:10<00:24,  1.99it/s][A
Training:  28%|██▊       | 18/65 [00:12<00:33,  1.41it/s][A
Training:  32%|███▏      | 21/65 [00:14<00:32,  1.35it/s][A
Training:  35%|███▌      | 23/65 [00:15<00:23,  1.81it/s][A
Training:  38%|███▊      | 25/65 [00:17<00:29,  1.37it/s][A
Training:  42%|████▏     | 27/65 [00:17<00:20,  1.86it/s][A
Training:  45%|████▍     | 29/65 [00:19<00:25,  1.41it/s][A
Training:  48%|████▊     | 31/65 [00:19<00:17,  1.94it/s][A
Training:  51%|█████     | 33/65 [00

Epoch: 14/77 - Loss: 12.1888 - Accuracy: 0.9345



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:02<00:21,  2.68s/it][A
 44%|████▍     | 4/9 [00:02<00:02,  1.83it/s][A
 67%|██████▋   | 6/9 [00:04<00:02,  1.29it/s][A
100%|██████████| 9/9 [00:05<00:00,  1.75it/s][A
Epochs:  18%|█▊        | 14/77 [10:42<48:13, 45.93s/it]

Val Loss: 13.3998 - Val Accuracy: 0.9328



Training:   0%|          | 0/65 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/65 [00:02<03:00,  2.83s/it][A
Training:   5%|▍         | 3/65 [00:02<00:47,  1.30it/s][A
Training:   8%|▊         | 5/65 [00:05<00:57,  1.05it/s][A
Training:  11%|█         | 7/65 [00:05<00:33,  1.75it/s][A
Training:  14%|█▍        | 9/65 [00:07<00:45,  1.24it/s][A
Training:  18%|█▊        | 12/65 [00:07<00:24,  2.14it/s][A
Training:  22%|██▏       | 14/65 [00:10<00:34,  1.50it/s][A
Training:  25%|██▍       | 16/65 [00:10<00:23,  2.06it/s][A
Training:  28%|██▊       | 18/65 [00:12<00:32,  1.45it/s][A
Training:  31%|███       | 20/65 [00:12<00:22,  2.00it/s][A
Training:  34%|███▍      | 22/65 [00:14<00:29,  1.45it/s][A
Training:  37%|███▋      | 24/65 [00:15<00:20,  2.01it/s][A
Training:  40%|████      | 26/65 [00:17<00:27,  1.41it/s][A
Training:  45%|████▍     | 29/65 [00:19<00:26,  1.37it/s][A
Training:  48%|████▊     | 31/65 [00:19<00:18,  1.82it/s][A
Training:  51%|█████     | 33/65 [00:

Epoch: 15/77 - Loss: 12.2088 - Accuracy: 0.9363



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:02<00:19,  2.48s/it][A
 33%|███▎      | 3/9 [00:02<00:04,  1.47it/s][A
 56%|█████▌    | 5/9 [00:04<00:03,  1.13it/s][A
100%|██████████| 9/9 [00:04<00:00,  1.80it/s][A
Epochs:  19%|█▉        | 15/77 [11:28<47:25, 45.90s/it]

Val Loss: 15.4005 - Val Accuracy: 0.9250



Training:   0%|          | 0/65 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/65 [00:02<02:57,  2.78s/it][A
Training:   6%|▌         | 4/65 [00:02<00:34,  1.77it/s][A
Training:   9%|▉         | 6/65 [00:05<00:49,  1.19it/s][A
Training:  14%|█▍        | 9/65 [00:07<00:45,  1.23it/s][A
Training:  17%|█▋        | 11/65 [00:07<00:30,  1.75it/s][A
Training:  20%|██        | 13/65 [00:10<00:39,  1.32it/s][A
Training:  25%|██▍       | 16/65 [00:10<00:23,  2.11it/s][A
Training:  28%|██▊       | 18/65 [00:12<00:30,  1.52it/s][A
Training:  32%|███▏      | 21/65 [00:14<00:31,  1.39it/s][A
Training:  37%|███▋      | 24/65 [00:15<00:19,  2.06it/s][A
Training:  40%|████      | 26/65 [00:17<00:25,  1.54it/s][A
Training:  43%|████▎     | 28/65 [00:17<00:18,  2.04it/s][A
Training:  46%|████▌     | 30/65 [00:19<00:24,  1.44it/s][A
Training:  51%|█████     | 33/65 [00:22<00:23,  1.38it/s][A
Training:  55%|█████▌    | 36/65 [00:22<00:14,  2.04it/s][A
Training:  58%|█████▊    | 38/65 [00

Epoch: 16/77 - Loss: 11.6875 - Accuracy: 0.9390



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:02<00:20,  2.52s/it][A
 33%|███▎      | 3/9 [00:02<00:04,  1.43it/s][A
 56%|█████▌    | 5/9 [00:04<00:03,  1.11it/s][A
100%|██████████| 9/9 [00:05<00:00,  1.78it/s][A
Epochs:  21%|██        | 16/77 [12:14<46:44, 45.98s/it]

Val Loss: 11.2051 - Val Accuracy: 0.9383



Training:   0%|          | 0/65 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/65 [00:02<02:59,  2.81s/it][A
Training:   5%|▍         | 3/65 [00:02<00:47,  1.30it/s][A
Training:   8%|▊         | 5/65 [00:05<00:57,  1.04it/s][A
Training:  11%|█         | 7/65 [00:05<00:33,  1.74it/s][A
Training:  14%|█▍        | 9/65 [00:07<00:45,  1.23it/s][A
Training:  18%|█▊        | 12/65 [00:07<00:24,  2.13it/s][A
Training:  22%|██▏       | 14/65 [00:10<00:33,  1.50it/s][A
Training:  25%|██▍       | 16/65 [00:10<00:23,  2.07it/s][A
Training:  28%|██▊       | 18/65 [00:12<00:32,  1.44it/s][A
Training:  31%|███       | 20/65 [00:12<00:22,  1.99it/s][A
Training:  34%|███▍      | 22/65 [00:14<00:29,  1.44it/s][A
Training:  37%|███▋      | 24/65 [00:15<00:20,  1.99it/s][A
Training:  40%|████      | 26/65 [00:17<00:27,  1.40it/s][A
Training:  43%|████▎     | 28/65 [00:17<00:19,  1.94it/s][A
Training:  46%|████▌     | 30/65 [00:19<00:24,  1.43it/s][A
Training:  51%|█████     | 33/65 [00:

Epoch: 17/77 - Loss: 11.5459 - Accuracy: 0.9407



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:02<00:20,  2.60s/it][A
 44%|████▍     | 4/9 [00:02<00:02,  1.89it/s][A
 67%|██████▋   | 6/9 [00:04<00:02,  1.27it/s][A
100%|██████████| 9/9 [00:05<00:00,  1.73it/s][A
Epochs:  22%|██▏       | 17/77 [13:00<46:03, 46.06s/it]

Val Loss: 12.4252 - Val Accuracy: 0.9328



Training:   0%|          | 0/65 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/65 [00:02<02:55,  2.74s/it][A
Training:   5%|▍         | 3/65 [00:02<00:46,  1.34it/s][A
Training:   8%|▊         | 5/65 [00:05<00:57,  1.04it/s][A
Training:  11%|█         | 7/65 [00:05<00:33,  1.74it/s][A
Training:  14%|█▍        | 9/65 [00:07<00:44,  1.27it/s][A
Training:  17%|█▋        | 11/65 [00:07<00:28,  1.88it/s][A
Training:  20%|██        | 13/65 [00:10<00:38,  1.34it/s][A
Training:  23%|██▎       | 15/65 [00:10<00:26,  1.91it/s][A
Training:  26%|██▌       | 17/65 [00:12<00:34,  1.39it/s][A
Training:  31%|███       | 20/65 [00:12<00:20,  2.23it/s][A
Training:  34%|███▍      | 22/65 [00:14<00:28,  1.53it/s][A
Training:  37%|███▋      | 24/65 [00:15<00:19,  2.07it/s][A
Training:  40%|████      | 26/65 [00:17<00:26,  1.49it/s][A
Training:  43%|████▎     | 28/65 [00:17<00:18,  2.03it/s][A
Training:  46%|████▌     | 30/65 [00:19<00:24,  1.43it/s][A
Training:  49%|████▉     | 32/65 [00:

Epoch: 18/77 - Loss: 11.5653 - Accuracy: 0.9410



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:02<00:20,  2.56s/it][A
 44%|████▍     | 4/9 [00:02<00:02,  1.92it/s][A
 67%|██████▋   | 6/9 [00:04<00:02,  1.31it/s][A
100%|██████████| 9/9 [00:05<00:00,  1.79it/s][A
Epochs:  23%|██▎       | 18/77 [13:46<45:17, 46.06s/it]

Val Loss: 13.1425 - Val Accuracy: 0.9383



Training:   0%|          | 0/65 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/65 [00:02<03:07,  2.94s/it][A
Training:   6%|▌         | 4/65 [00:03<00:36,  1.68it/s][A
Training:   9%|▉         | 6/65 [00:05<00:48,  1.21it/s][A
Training:  12%|█▏        | 8/65 [00:05<00:30,  1.88it/s][A
Training:  15%|█▌        | 10/65 [00:07<00:41,  1.31it/s][A
Training:  18%|█▊        | 12/65 [00:07<00:27,  1.91it/s][A
Training:  22%|██▏       | 14/65 [00:10<00:36,  1.39it/s][A
Training:  26%|██▌       | 17/65 [00:12<00:36,  1.33it/s][A
Training:  29%|██▉       | 19/65 [00:12<00:25,  1.79it/s][A
Training:  32%|███▏      | 21/65 [00:14<00:31,  1.39it/s][A
Training:  35%|███▌      | 23/65 [00:15<00:22,  1.89it/s][A
Training:  38%|███▊      | 25/65 [00:17<00:28,  1.41it/s][A
Training:  42%|████▏     | 27/65 [00:17<00:19,  1.94it/s][A
Training:  45%|████▍     | 29/65 [00:19<00:25,  1.41it/s][A
Training:  48%|████▊     | 31/65 [00:19<00:17,  1.94it/s][A
Training:  51%|█████     | 33/65 [00

Epoch: 19/77 - Loss: 11.9177 - Accuracy: 0.9407



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:02<00:20,  2.56s/it][A
 33%|███▎      | 3/9 [00:02<00:04,  1.43it/s][A
 56%|█████▌    | 5/9 [00:04<00:03,  1.12it/s][A
100%|██████████| 9/9 [00:05<00:00,  1.79it/s][A
Epochs:  25%|██▍       | 19/77 [14:32<44:31, 46.06s/it]

Val Loss: 14.9120 - Val Accuracy: 0.9439



Training:   0%|          | 0/65 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/65 [00:02<03:03,  2.87s/it][A
Training:   5%|▍         | 3/65 [00:02<00:48,  1.27it/s][A
Training:   8%|▊         | 5/65 [00:05<00:57,  1.04it/s][A
Training:  11%|█         | 7/65 [00:05<00:33,  1.74it/s][A
Training:  14%|█▍        | 9/65 [00:07<00:45,  1.24it/s][A
Training:  17%|█▋        | 11/65 [00:07<00:29,  1.84it/s][A
Training:  20%|██        | 13/65 [00:10<00:38,  1.34it/s][A
Training:  23%|██▎       | 15/65 [00:10<00:26,  1.91it/s][A
Training:  26%|██▌       | 17/65 [00:12<00:34,  1.37it/s][A
Training:  29%|██▉       | 19/65 [00:12<00:23,  1.93it/s][A
Training:  32%|███▏      | 21/65 [00:15<00:31,  1.38it/s][A
Training:  35%|███▌      | 23/65 [00:15<00:21,  1.93it/s][A
Training:  38%|███▊      | 25/65 [00:17<00:28,  1.41it/s][A
Training:  42%|████▏     | 27/65 [00:17<00:19,  1.96it/s][A
Training:  45%|████▍     | 29/65 [00:19<00:26,  1.38it/s][A
Training:  49%|████▉     | 32/65 [00:

Epoch: 20/77 - Loss: 12.2169 - Accuracy: 0.9410



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:02<00:20,  2.61s/it][A
 33%|███▎      | 3/9 [00:02<00:04,  1.40it/s][A
 56%|█████▌    | 5/9 [00:04<00:03,  1.14it/s][A
100%|██████████| 9/9 [00:04<00:00,  1.80it/s][A
Epochs:  26%|██▌       | 20/77 [15:18<43:44, 46.04s/it]

Val Loss: 16.5839 - Val Accuracy: 0.9231



Training:   0%|          | 0/65 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/65 [00:02<03:03,  2.86s/it][A
Training:   6%|▌         | 4/65 [00:03<00:35,  1.72it/s][A
Training:   9%|▉         | 6/65 [00:05<00:48,  1.21it/s][A
Training:  12%|█▏        | 8/65 [00:05<00:30,  1.90it/s][A
Training:  15%|█▌        | 10/65 [00:07<00:41,  1.31it/s][A
Training:  18%|█▊        | 12/65 [00:07<00:27,  1.91it/s][A
Training:  22%|██▏       | 14/65 [00:10<00:37,  1.37it/s][A
Training:  25%|██▍       | 16/65 [00:10<00:25,  1.95it/s][A
Training:  28%|██▊       | 18/65 [00:12<00:33,  1.39it/s][A
Training:  31%|███       | 20/65 [00:12<00:23,  1.94it/s][A
Training:  34%|███▍      | 22/65 [00:15<00:30,  1.40it/s][A
Training:  38%|███▊      | 25/65 [00:17<00:29,  1.34it/s][A
Training:  43%|████▎     | 28/65 [00:17<00:18,  2.03it/s][A
Training:  46%|████▌     | 30/65 [00:19<00:23,  1.51it/s][A
Training:  51%|█████     | 33/65 [00:22<00:22,  1.43it/s][A
Training:  55%|█████▌    | 36/65 [00

Epoch: 21/77 - Loss: 13.1117 - Accuracy: 0.9380



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:02<00:20,  2.53s/it][A
 33%|███▎      | 3/9 [00:02<00:04,  1.42it/s][A
 56%|█████▌    | 5/9 [00:04<00:03,  1.13it/s][A
100%|██████████| 9/9 [00:05<00:00,  1.80it/s][A
Epochs:  27%|██▋       | 21/77 [16:04<42:58, 46.05s/it]

Val Loss: 11.6604 - Val Accuracy: 0.9400



Training:   0%|          | 0/65 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/65 [00:02<03:03,  2.87s/it][A
Training:   5%|▍         | 3/65 [00:02<00:48,  1.28it/s][A
Training:   8%|▊         | 5/65 [00:05<00:57,  1.04it/s][A
Training:  11%|█         | 7/65 [00:05<00:33,  1.73it/s][A
Training:  14%|█▍        | 9/65 [00:07<00:44,  1.27it/s][A
Training:  17%|█▋        | 11/65 [00:07<00:28,  1.88it/s][A
Training:  20%|██        | 13/65 [00:10<00:38,  1.35it/s][A
Training:  23%|██▎       | 15/65 [00:10<00:26,  1.92it/s][A
Training:  26%|██▌       | 17/65 [00:12<00:34,  1.40it/s][A
Training:  28%|██▊       | 18/65 [00:12<00:28,  1.64it/s][A
Training:  31%|███       | 20/65 [00:12<00:18,  2.40it/s][A
Training:  34%|███▍      | 22/65 [00:14<00:28,  1.52it/s][A
Training:  35%|███▌      | 23/65 [00:15<00:23,  1.80it/s][A
Training:  38%|███▊      | 25/65 [00:17<00:29,  1.36it/s][A
Training:  40%|████      | 26/65 [00:17<00:24,  1.61it/s][A
Training:  42%|████▏     | 27/65 [00:

Epoch: 22/77 - Loss: 11.9849 - Accuracy: 0.9405



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:02<00:20,  2.53s/it][A
 44%|████▍     | 4/9 [00:02<00:02,  1.95it/s][A
 67%|██████▋   | 6/9 [00:04<00:02,  1.33it/s][A
100%|██████████| 9/9 [00:04<00:00,  1.80it/s][A
Epochs:  29%|██▊       | 22/77 [16:50<42:08, 45.97s/it]

Val Loss: 11.8958 - Val Accuracy: 0.9352



Training:   0%|          | 0/65 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/65 [00:02<02:50,  2.67s/it][A
Training:   5%|▍         | 3/65 [00:02<00:45,  1.37it/s][A
Training:   8%|▊         | 5/65 [00:05<00:57,  1.05it/s][A
Training:  12%|█▏        | 8/65 [00:05<00:27,  2.10it/s][A
Training:  15%|█▌        | 10/65 [00:07<00:37,  1.47it/s][A
Training:  18%|█▊        | 12/65 [00:07<00:25,  2.09it/s][A
Training:  22%|██▏       | 14/65 [00:09<00:36,  1.41it/s][A
Training:  26%|██▌       | 17/65 [00:12<00:34,  1.39it/s][A
Training:  28%|██▊       | 18/65 [00:12<00:29,  1.60it/s][A
Training:  32%|███▏      | 21/65 [00:14<00:29,  1.47it/s][A
Training:  34%|███▍      | 22/65 [00:14<00:25,  1.67it/s][A
Training:  38%|███▊      | 25/65 [00:16<00:25,  1.55it/s][A
Training:  40%|████      | 26/65 [00:17<00:22,  1.76it/s][A
Training:  45%|████▍     | 29/65 [00:19<00:22,  1.58it/s][A
Training:  46%|████▌     | 30/65 [00:19<00:19,  1.76it/s][A
Training:  49%|████▉     | 32/65 [00

Epoch: 23/77 - Loss: 12.0111 - Accuracy: 0.9409



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:02<00:20,  2.61s/it][A
 33%|███▎      | 3/9 [00:02<00:04,  1.39it/s][A
 56%|█████▌    | 5/9 [00:04<00:03,  1.15it/s][A
100%|██████████| 9/9 [00:04<00:00,  1.81it/s][A
Epochs:  30%|██▉       | 23/77 [17:36<41:11, 45.77s/it]

Val Loss: 9.4827 - Val Accuracy: 0.9429



Training:   0%|          | 0/65 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/65 [00:02<02:56,  2.75s/it][A
Training:   5%|▍         | 3/65 [00:02<00:46,  1.32it/s][A
Training:   8%|▊         | 5/65 [00:05<00:57,  1.04it/s][A
Training:  11%|█         | 7/65 [00:05<00:33,  1.74it/s][A
Training:  14%|█▍        | 9/65 [00:07<00:44,  1.26it/s][A
Training:  17%|█▋        | 11/65 [00:07<00:28,  1.87it/s][A
Training:  20%|██        | 13/65 [00:09<00:37,  1.37it/s][A
Training:  23%|██▎       | 15/65 [00:10<00:25,  1.95it/s][A
Training:  26%|██▌       | 17/65 [00:12<00:35,  1.37it/s][A
Training:  29%|██▉       | 19/65 [00:12<00:23,  1.92it/s][A
Training:  32%|███▏      | 21/65 [00:14<00:31,  1.42it/s][A
Training:  35%|███▌      | 23/65 [00:14<00:21,  1.97it/s][A
Training:  38%|███▊      | 25/65 [00:17<00:28,  1.40it/s][A
Training:  43%|████▎     | 28/65 [00:17<00:16,  2.21it/s][A
Training:  46%|████▌     | 30/65 [00:19<00:22,  1.57it/s][A
Training:  49%|████▉     | 32/65 [00:

Epoch: 24/77 - Loss: 12.0715 - Accuracy: 0.9380



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:02<00:20,  2.54s/it][A
 33%|███▎      | 3/9 [00:02<00:04,  1.42it/s][A
 56%|█████▌    | 5/9 [00:04<00:03,  1.13it/s][A
100%|██████████| 9/9 [00:05<00:00,  1.80it/s][A
Epochs:  31%|███       | 24/77 [18:21<40:22, 45.70s/it]

Val Loss: 14.0532 - Val Accuracy: 0.9343



Training:   0%|          | 0/65 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/65 [00:02<02:58,  2.80s/it][A
Training:   5%|▍         | 3/65 [00:02<00:47,  1.31it/s][A
Training:   8%|▊         | 5/65 [00:05<00:56,  1.06it/s][A
Training:  11%|█         | 7/65 [00:05<00:32,  1.76it/s][A
Training:  14%|█▍        | 9/65 [00:07<00:43,  1.28it/s][A
Training:  17%|█▋        | 11/65 [00:07<00:28,  1.88it/s][A
Training:  20%|██        | 13/65 [00:09<00:38,  1.36it/s][A
Training:  23%|██▎       | 15/65 [00:10<00:25,  1.94it/s][A
Training:  26%|██▌       | 17/65 [00:12<00:34,  1.41it/s][A
Training:  29%|██▉       | 19/65 [00:12<00:23,  1.97it/s][A
Training:  32%|███▏      | 21/65 [00:14<00:31,  1.41it/s][A
Training:  35%|███▌      | 23/65 [00:14<00:21,  1.97it/s][A
Training:  38%|███▊      | 25/65 [00:17<00:27,  1.44it/s][A
Training:  42%|████▏     | 27/65 [00:17<00:19,  1.99it/s][A
Training:  45%|████▍     | 29/65 [00:19<00:25,  1.41it/s][A
Training:  49%|████▉     | 32/65 [00:

Epoch: 25/77 - Loss: 12.9804 - Accuracy: 0.9377



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:02<00:20,  2.52s/it][A
 33%|███▎      | 3/9 [00:02<00:04,  1.45it/s][A
 56%|█████▌    | 5/9 [00:04<00:03,  1.15it/s][A
100%|██████████| 9/9 [00:04<00:00,  1.82it/s][A
Epochs:  32%|███▏      | 25/77 [19:06<39:31, 45.61s/it]

Val Loss: 13.7872 - Val Accuracy: 0.9359



Training:   0%|          | 0/65 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/65 [00:02<02:57,  2.78s/it][A
Training:   6%|▌         | 4/65 [00:02<00:34,  1.77it/s][A
Training:   9%|▉         | 6/65 [00:05<00:48,  1.22it/s][A
Training:  14%|█▍        | 9/65 [00:07<00:45,  1.24it/s][A
Training:  17%|█▋        | 11/65 [00:07<00:30,  1.76it/s][A
Training:  20%|██        | 13/65 [00:09<00:38,  1.34it/s][A
Training:  23%|██▎       | 15/65 [00:10<00:26,  1.87it/s][A
Training:  26%|██▌       | 17/65 [00:12<00:34,  1.38it/s][A
Training:  29%|██▉       | 19/65 [00:12<00:23,  1.92it/s][A
Training:  32%|███▏      | 21/65 [00:14<00:30,  1.43it/s][A
Training:  35%|███▌      | 23/65 [00:14<00:21,  1.98it/s][A
Training:  38%|███▊      | 25/65 [00:17<00:27,  1.43it/s][A
Training:  42%|████▏     | 27/65 [00:17<00:19,  1.97it/s][A
Training:  45%|████▍     | 29/65 [00:19<00:24,  1.46it/s][A
Training:  48%|████▊     | 31/65 [00:19<00:16,  2.00it/s][A
Training:  51%|█████     | 33/65 [00

Epoch: 26/77 - Loss: 12.3432 - Accuracy: 0.9417



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:02<00:20,  2.60s/it][A
 33%|███▎      | 3/9 [00:02<00:04,  1.41it/s][A
 56%|█████▌    | 5/9 [00:04<00:03,  1.14it/s][A
 78%|███████▊  | 7/9 [00:04<00:01,  1.89it/s][A
100%|██████████| 9/9 [00:05<00:00,  1.78it/s][A
Epochs:  34%|███▍      | 26/77 [19:52<38:46, 45.61s/it]

Val Loss: 12.1731 - Val Accuracy: 0.9256



Training:   0%|          | 0/65 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/65 [00:02<02:49,  2.64s/it][A
Training:   5%|▍         | 3/65 [00:02<00:44,  1.38it/s][A
Training:   8%|▊         | 5/65 [00:05<00:56,  1.06it/s][A
Training:  12%|█▏        | 8/65 [00:05<00:27,  2.10it/s][A
Training:  15%|█▌        | 10/65 [00:07<00:38,  1.43it/s][A
Training:  18%|█▊        | 12/65 [00:07<00:25,  2.04it/s][A
Training:  22%|██▏       | 14/65 [00:09<00:35,  1.42it/s][A
Training:  25%|██▍       | 16/65 [00:10<00:24,  1.99it/s][A
Training:  28%|██▊       | 18/65 [00:12<00:33,  1.42it/s][A
Training:  31%|███       | 20/65 [00:12<00:22,  1.98it/s][A
Training:  34%|███▍      | 22/65 [00:14<00:30,  1.43it/s][A
Training:  38%|███▊      | 25/65 [00:17<00:29,  1.35it/s][A
Training:  42%|████▏     | 27/65 [00:17<00:20,  1.82it/s][A
Training:  45%|████▍     | 29/65 [00:19<00:26,  1.38it/s][A
Training:  49%|████▉     | 32/65 [00:19<00:15,  2.13it/s][A
Training:  52%|█████▏    | 34/65 [00

Epoch: 27/77 - Loss: 12.3935 - Accuracy: 0.9386



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:02<00:21,  2.63s/it][A
 44%|████▍     | 4/9 [00:02<00:02,  1.88it/s][A
 67%|██████▋   | 6/9 [00:04<00:02,  1.33it/s][A
100%|██████████| 9/9 [00:04<00:00,  1.80it/s][A
Epochs:  35%|███▌      | 27/77 [20:38<37:59, 45.59s/it]

Val Loss: 11.5813 - Val Accuracy: 0.9336



Training:   0%|          | 0/65 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/65 [00:02<02:59,  2.81s/it][A
Training:   5%|▍         | 3/65 [00:02<00:47,  1.30it/s][A
Training:   8%|▊         | 5/65 [00:05<00:57,  1.04it/s][A
Training:  12%|█▏        | 8/65 [00:05<00:27,  2.08it/s][A
Training:  15%|█▌        | 10/65 [00:07<00:39,  1.40it/s][A
Training:  20%|██        | 13/65 [00:09<00:38,  1.36it/s][A
Training:  23%|██▎       | 15/65 [00:10<00:27,  1.84it/s][A
Training:  26%|██▌       | 17/65 [00:12<00:35,  1.35it/s][A
Training:  31%|███       | 20/65 [00:12<00:21,  2.10it/s][A
Training:  34%|███▍      | 22/65 [00:14<00:27,  1.55it/s][A
Training:  38%|███▊      | 25/65 [00:17<00:28,  1.41it/s][A
Training:  43%|████▎     | 28/65 [00:17<00:17,  2.08it/s][A
Training:  46%|████▌     | 30/65 [00:19<00:22,  1.57it/s][A
Training:  51%|█████     | 33/65 [00:22<00:22,  1.44it/s][A
Training:  55%|█████▌    | 36/65 [00:22<00:13,  2.08it/s][A
Training:  58%|█████▊    | 38/65 [00

Epoch: 28/77 - Loss: 12.5777 - Accuracy: 0.9411



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:02<00:20,  2.62s/it][A
 33%|███▎      | 3/9 [00:02<00:04,  1.39it/s][A
 56%|█████▌    | 5/9 [00:04<00:03,  1.13it/s][A
100%|██████████| 9/9 [00:05<00:00,  1.78it/s][A
Epochs:  36%|███▋      | 28/77 [21:23<37:13, 45.59s/it]

Val Loss: 13.8640 - Val Accuracy: 0.9307



Training:   0%|          | 0/65 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/65 [00:02<02:59,  2.81s/it][A
Training:   6%|▌         | 4/65 [00:02<00:34,  1.76it/s][A
Training:   9%|▉         | 6/65 [00:05<00:48,  1.22it/s][A
Training:  12%|█▏        | 8/65 [00:05<00:29,  1.90it/s][A
Training:  15%|█▌        | 10/65 [00:07<00:42,  1.31it/s][A
Training:  20%|██        | 13/65 [00:10<00:39,  1.31it/s][A
Training:  23%|██▎       | 15/65 [00:10<00:27,  1.79it/s][A
Training:  26%|██▌       | 17/65 [00:12<00:35,  1.35it/s][A
Training:  29%|██▉       | 19/65 [00:12<00:24,  1.86it/s][A
Training:  32%|███▏      | 21/65 [00:14<00:31,  1.40it/s][A
Training:  35%|███▌      | 23/65 [00:15<00:21,  1.93it/s][A
Training:  38%|███▊      | 25/65 [00:17<00:28,  1.41it/s][A
Training:  42%|████▏     | 27/65 [00:17<00:19,  1.96it/s][A
Training:  45%|████▍     | 29/65 [00:19<00:25,  1.42it/s][A
Training:  49%|████▉     | 32/65 [00:19<00:14,  2.24it/s][A
Training:  52%|█████▏    | 34/65 [00

Epoch: 29/77 - Loss: 12.5565 - Accuracy: 0.9384



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:02<00:20,  2.52s/it][A
 44%|████▍     | 4/9 [00:02<00:02,  1.94it/s][A
 67%|██████▋   | 6/9 [00:04<00:02,  1.32it/s][A
100%|██████████| 9/9 [00:05<00:00,  1.79it/s][A
Epochs:  38%|███▊      | 29/77 [22:09<36:29, 45.62s/it]

Val Loss: 12.2607 - Val Accuracy: 0.9312



Training:   0%|          | 0/65 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/65 [00:02<02:54,  2.73s/it][A
Training:   5%|▍         | 3/65 [00:02<00:46,  1.33it/s][A
Training:   8%|▊         | 5/65 [00:05<00:57,  1.04it/s][A
Training:  12%|█▏        | 8/65 [00:05<00:27,  2.06it/s][A
Training:  15%|█▌        | 10/65 [00:07<00:38,  1.42it/s][A
Training:  20%|██        | 13/65 [00:10<00:38,  1.34it/s][A
Training:  25%|██▍       | 16/65 [00:10<00:23,  2.07it/s][A
Training:  28%|██▊       | 18/65 [00:12<00:31,  1.50it/s][A
Training:  31%|███       | 20/65 [00:12<00:22,  2.01it/s][A
Training:  34%|███▍      | 22/65 [00:14<00:29,  1.47it/s][A
Training:  38%|███▊      | 25/65 [00:17<00:28,  1.39it/s][A
Training:  43%|████▎     | 28/65 [00:17<00:17,  2.07it/s][A
Training:  46%|████▌     | 30/65 [00:19<00:22,  1.54it/s][A
Training:  51%|█████     | 33/65 [00:22<00:22,  1.44it/s][A
Training:  55%|█████▌    | 36/65 [00:22<00:13,  2.09it/s][A
Training:  58%|█████▊    | 38/65 [00

Epoch: 30/77 - Loss: 13.2056 - Accuracy: 0.9401



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:02<00:20,  2.52s/it][A
 33%|███▎      | 3/9 [00:02<00:04,  1.45it/s][A
 56%|█████▌    | 5/9 [00:04<00:03,  1.13it/s][A
100%|██████████| 9/9 [00:05<00:00,  1.79it/s][A
Epochs:  39%|███▉      | 30/77 [22:54<35:43, 45.62s/it]

Val Loss: 11.6521 - Val Accuracy: 0.9307



Training:   0%|          | 0/65 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/65 [00:02<02:55,  2.74s/it][A
Training:   5%|▍         | 3/65 [00:02<00:46,  1.33it/s][A
Training:   8%|▊         | 5/65 [00:05<00:59,  1.02it/s][A
Training:  12%|█▏        | 8/65 [00:05<00:28,  2.03it/s][A
Training:  15%|█▌        | 10/65 [00:07<00:38,  1.42it/s][A
Training:  18%|█▊        | 12/65 [00:07<00:26,  2.02it/s][A
Training:  22%|██▏       | 14/65 [00:10<00:35,  1.43it/s][A
Training:  25%|██▍       | 16/65 [00:10<00:24,  2.00it/s][A
Training:  28%|██▊       | 18/65 [00:12<00:32,  1.44it/s][A
Training:  31%|███       | 20/65 [00:12<00:22,  2.01it/s][A
Training:  34%|███▍      | 22/65 [00:14<00:29,  1.46it/s][A
Training:  37%|███▋      | 24/65 [00:14<00:20,  2.02it/s][A
Training:  40%|████      | 26/65 [00:17<00:27,  1.41it/s][A
Training:  43%|████▎     | 28/65 [00:17<00:18,  1.95it/s][A
Training:  46%|████▌     | 30/65 [00:19<00:24,  1.45it/s][A
Training:  49%|████▉     | 32/65 [00

Epoch: 31/77 - Loss: 12.3701 - Accuracy: 0.9419



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:02<00:20,  2.59s/it][A
 44%|████▍     | 4/9 [00:02<00:02,  1.89it/s][A
 67%|██████▋   | 6/9 [00:04<00:02,  1.30it/s][A
100%|██████████| 9/9 [00:05<00:00,  1.78it/s][A
Epochs:  40%|████      | 31/77 [23:40<34:59, 45.64s/it]

Val Loss: 13.6970 - Val Accuracy: 0.9410



Training:   0%|          | 0/65 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/65 [00:02<03:02,  2.85s/it][A
Training:   5%|▍         | 3/65 [00:02<00:48,  1.28it/s][A
Training:   8%|▊         | 5/65 [00:05<00:57,  1.05it/s][A
Training:  11%|█         | 7/65 [00:05<00:33,  1.75it/s][A
Training:  14%|█▍        | 9/65 [00:07<00:45,  1.23it/s][A
Training:  17%|█▋        | 11/65 [00:07<00:29,  1.82it/s][A
Training:  20%|██        | 13/65 [00:10<00:39,  1.33it/s][A
Training:  25%|██▍       | 16/65 [00:10<00:22,  2.18it/s][A
Training:  28%|██▊       | 18/65 [00:12<00:30,  1.52it/s][A
Training:  31%|███       | 20/65 [00:12<00:21,  2.06it/s][A
Training:  34%|███▍      | 22/65 [00:15<00:29,  1.47it/s][A
Training:  38%|███▊      | 25/65 [00:17<00:28,  1.39it/s][A
Training:  42%|████▏     | 27/65 [00:17<00:20,  1.84it/s][A
Training:  45%|████▍     | 29/65 [00:19<00:25,  1.40it/s][A
Training:  48%|████▊     | 31/65 [00:19<00:17,  1.89it/s][A
Training:  51%|█████     | 33/65 [00:

Epoch: 32/77 - Loss: 13.2367 - Accuracy: 0.9396



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:02<00:20,  2.58s/it][A
 44%|████▍     | 4/9 [00:02<00:02,  1.90it/s][A
 67%|██████▋   | 6/9 [00:04<00:02,  1.30it/s][A
100%|██████████| 9/9 [00:05<00:00,  1.77it/s][A
Epochs:  42%|████▏     | 32/77 [24:26<34:19, 45.76s/it]

Val Loss: 12.8337 - Val Accuracy: 0.9378



Training:   0%|          | 0/65 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/65 [00:02<03:02,  2.86s/it][A
Training:   5%|▍         | 3/65 [00:02<00:48,  1.27it/s][A
Training:   8%|▊         | 5/65 [00:05<00:57,  1.05it/s][A
Training:  11%|█         | 7/65 [00:05<00:33,  1.75it/s][A
Training:  14%|█▍        | 9/65 [00:07<00:44,  1.27it/s][A
Training:  15%|█▌        | 10/65 [00:07<00:35,  1.55it/s][A
Training:  20%|██        | 13/65 [00:10<00:36,  1.42it/s][A
Training:  23%|██▎       | 15/65 [00:10<00:25,  1.99it/s][A
Training:  26%|██▌       | 17/65 [00:12<00:33,  1.44it/s][A
Training:  29%|██▉       | 19/65 [00:12<00:22,  2.00it/s][A
Training:  32%|███▏      | 21/65 [00:14<00:31,  1.40it/s][A
Training:  35%|███▌      | 23/65 [00:15<00:21,  1.94it/s][A
Training:  38%|███▊      | 25/65 [00:17<00:27,  1.43it/s][A
Training:  42%|████▏     | 27/65 [00:17<00:19,  1.98it/s][A
Training:  45%|████▍     | 29/65 [00:19<00:25,  1.41it/s][A
Training:  48%|████▊     | 31/65 [00:

Epoch: 33/77 - Loss: 13.2976 - Accuracy: 0.9408



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:02<00:20,  2.60s/it][A
 33%|███▎      | 3/9 [00:02<00:04,  1.40it/s][A
 56%|█████▌    | 5/9 [00:04<00:03,  1.11it/s][A
100%|██████████| 9/9 [00:05<00:00,  1.77it/s][A
Epochs:  43%|████▎     | 33/77 [25:12<33:34, 45.78s/it]

Val Loss: 12.4968 - Val Accuracy: 0.9359



Training:   0%|          | 0/65 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/65 [00:02<02:55,  2.74s/it][A
Training:   5%|▍         | 3/65 [00:02<00:46,  1.33it/s][A
Training:   8%|▊         | 5/65 [00:05<00:57,  1.04it/s][A
Training:  12%|█▏        | 8/65 [00:05<00:27,  2.07it/s][A
Training:  15%|█▌        | 10/65 [00:07<00:38,  1.43it/s][A
Training:  20%|██        | 13/65 [00:10<00:39,  1.33it/s][A
Training:  25%|██▍       | 16/65 [00:10<00:23,  2.04it/s][A
Training:  28%|██▊       | 18/65 [00:12<00:30,  1.52it/s][A
Training:  31%|███       | 20/65 [00:12<00:22,  2.03it/s][A
Training:  34%|███▍      | 22/65 [00:14<00:29,  1.46it/s][A
Training:  38%|███▊      | 25/65 [00:17<00:28,  1.40it/s][A
Training:  42%|████▏     | 27/65 [00:17<00:20,  1.83it/s][A
Training:  45%|████▍     | 29/65 [00:19<00:25,  1.43it/s][A
Training:  46%|████▌     | 30/65 [00:19<00:21,  1.65it/s][A
Training:  49%|████▉     | 32/65 [00:19<00:14,  2.34it/s][A
Training:  52%|█████▏    | 34/65 [00

Epoch: 34/77 - Loss: 12.7086 - Accuracy: 0.9418



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:02<00:20,  2.57s/it][A
 33%|███▎      | 3/9 [00:02<00:04,  1.42it/s][A
 56%|█████▌    | 5/9 [00:04<00:03,  1.15it/s][A
100%|██████████| 9/9 [00:04<00:00,  1.81it/s][A
Epochs:  44%|████▍     | 34/77 [25:58<32:47, 45.75s/it]

Val Loss: 14.2890 - Val Accuracy: 0.9388



Training:   0%|          | 0/65 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/65 [00:02<02:57,  2.77s/it][A
Training:   5%|▍         | 3/65 [00:02<00:47,  1.32it/s][A
Training:   8%|▊         | 5/65 [00:05<00:57,  1.04it/s][A
Training:  11%|█         | 7/65 [00:05<00:33,  1.72it/s][A
Training:  14%|█▍        | 9/65 [00:07<00:44,  1.27it/s][A
Training:  17%|█▋        | 11/65 [00:07<00:29,  1.86it/s][A
Training:  20%|██        | 13/65 [00:09<00:37,  1.39it/s][A
Training:  22%|██▏       | 14/65 [00:10<00:30,  1.65it/s][A
Training:  25%|██▍       | 16/65 [00:10<00:20,  2.43it/s][A
Training:  28%|██▊       | 18/65 [00:12<00:31,  1.49it/s][A
Training:  31%|███       | 20/65 [00:12<00:21,  2.12it/s][A
Training:  34%|███▍      | 22/65 [00:14<00:28,  1.49it/s][A
Training:  37%|███▋      | 24/65 [00:14<00:19,  2.09it/s][A
Training:  40%|████      | 26/65 [00:17<00:26,  1.47it/s][A
Training:  43%|████▎     | 28/65 [00:17<00:18,  2.03it/s][A
Training:  46%|████▌     | 30/65 [00:

Epoch: 35/77 - Loss: 13.0645 - Accuracy: 0.9405



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:02<00:21,  2.65s/it][A
 44%|████▍     | 4/9 [00:02<00:02,  1.85it/s][A
 67%|██████▋   | 6/9 [00:04<00:02,  1.33it/s][A
100%|██████████| 9/9 [00:05<00:00,  1.79it/s][A
Epochs:  45%|████▌     | 35/77 [26:43<32:00, 45.73s/it]

Val Loss: 12.5436 - Val Accuracy: 0.9359



Training:   0%|          | 0/65 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/65 [00:02<02:59,  2.80s/it][A
Training:   5%|▍         | 3/65 [00:02<00:47,  1.30it/s][A
Training:   8%|▊         | 5/65 [00:05<00:57,  1.04it/s][A
Training:  11%|█         | 7/65 [00:05<00:33,  1.73it/s][A
Training:  14%|█▍        | 9/65 [00:07<00:45,  1.24it/s][A
Training:  18%|█▊        | 12/65 [00:07<00:24,  2.14it/s][A
Training:  22%|██▏       | 14/65 [00:10<00:34,  1.46it/s][A
Training:  25%|██▍       | 16/65 [00:10<00:24,  2.01it/s][A
Training:  28%|██▊       | 18/65 [00:12<00:32,  1.45it/s][A
Training:  32%|███▏      | 21/65 [00:14<00:31,  1.38it/s][A
Training:  35%|███▌      | 23/65 [00:15<00:22,  1.85it/s][A
Training:  38%|███▊      | 25/65 [00:17<00:28,  1.40it/s][A
Training:  43%|████▎     | 28/65 [00:17<00:17,  2.14it/s][A
Training:  46%|████▌     | 30/65 [00:19<00:22,  1.55it/s][A
Training:  49%|████▉     | 32/65 [00:19<00:15,  2.07it/s][A
Training:  52%|█████▏    | 34/65 [00:

Epoch: 36/77 - Loss: 12.5486 - Accuracy: 0.9421



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:02<00:20,  2.61s/it][A
 33%|███▎      | 3/9 [00:02<00:04,  1.40it/s][A
 56%|█████▌    | 5/9 [00:04<00:03,  1.11it/s][A
100%|██████████| 9/9 [00:05<00:00,  1.76it/s][A
Epochs:  47%|████▋     | 36/77 [27:29<31:18, 45.82s/it]

Val Loss: 15.9141 - Val Accuracy: 0.9389



Training:   0%|          | 0/65 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/65 [00:02<03:00,  2.82s/it][A
Training:   5%|▍         | 3/65 [00:02<00:47,  1.30it/s][A
Training:   8%|▊         | 5/65 [00:05<00:57,  1.05it/s][A
Training:  11%|█         | 7/65 [00:05<00:33,  1.74it/s][A
Training:  14%|█▍        | 9/65 [00:07<00:44,  1.25it/s][A
Training:  17%|█▋        | 11/65 [00:07<00:29,  1.85it/s][A
Training:  20%|██        | 13/65 [00:10<00:38,  1.36it/s][A
Training:  25%|██▍       | 16/65 [00:10<00:22,  2.22it/s][A
Training:  28%|██▊       | 18/65 [00:12<00:31,  1.50it/s][A
Training:  32%|███▏      | 21/65 [00:14<00:30,  1.42it/s][A
Training:  35%|███▌      | 23/65 [00:14<00:22,  1.88it/s][A
Training:  38%|███▊      | 25/65 [00:17<00:28,  1.40it/s][A
Training:  42%|████▏     | 27/65 [00:17<00:19,  1.90it/s][A
Training:  45%|████▍     | 29/65 [00:19<00:25,  1.41it/s][A
Training:  49%|████▉     | 32/65 [00:19<00:15,  2.19it/s][A
Training:  52%|█████▏    | 34/65 [00:

Epoch: 37/77 - Loss: 13.4583 - Accuracy: 0.9402



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:02<00:20,  2.59s/it][A
 44%|████▍     | 4/9 [00:02<00:02,  1.90it/s][A
 67%|██████▋   | 6/9 [00:04<00:02,  1.33it/s][A
100%|██████████| 9/9 [00:05<00:00,  1.80it/s][A
Epochs:  48%|████▊     | 37/77 [28:15<30:32, 45.80s/it]

Val Loss: 13.9756 - Val Accuracy: 0.9276



Training:   0%|          | 0/65 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/65 [00:02<03:00,  2.81s/it][A
Training:   5%|▍         | 3/65 [00:02<00:47,  1.30it/s][A
Training:   8%|▊         | 5/65 [00:05<00:57,  1.04it/s][A
Training:  12%|█▏        | 8/65 [00:05<00:27,  2.08it/s][A
Training:  15%|█▌        | 10/65 [00:07<00:39,  1.39it/s][A
Training:  20%|██        | 13/65 [00:10<00:38,  1.35it/s][A
Training:  23%|██▎       | 15/65 [00:10<00:27,  1.83it/s][A
Training:  26%|██▌       | 17/65 [00:12<00:35,  1.36it/s][A
Training:  29%|██▉       | 19/65 [00:12<00:24,  1.86it/s][A
Training:  32%|███▏      | 21/65 [00:14<00:31,  1.40it/s][A
Training:  35%|███▌      | 23/65 [00:15<00:21,  1.93it/s][A
Training:  38%|███▊      | 25/65 [00:17<00:29,  1.38it/s][A
Training:  43%|████▎     | 28/65 [00:17<00:17,  2.16it/s][A
Training:  46%|████▌     | 30/65 [00:19<00:22,  1.55it/s][A
Training:  49%|████▉     | 32/65 [00:20<00:15,  2.08it/s][A
Training:  52%|█████▏    | 34/65 [00

Epoch: 38/77 - Loss: 13.0122 - Accuracy: 0.9404



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:02<00:20,  2.59s/it][A
 33%|███▎      | 3/9 [00:02<00:04,  1.39it/s][A
 56%|█████▌    | 5/9 [00:04<00:03,  1.13it/s][A
100%|██████████| 9/9 [00:05<00:00,  1.78it/s][A
Epochs:  49%|████▉     | 38/77 [29:01<29:49, 45.89s/it]

Val Loss: 15.4074 - Val Accuracy: 0.9364



Training:   0%|          | 0/65 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/65 [00:02<03:02,  2.86s/it][A
Training:   6%|▌         | 4/65 [00:02<00:35,  1.73it/s][A
Training:   9%|▉         | 6/65 [00:05<00:48,  1.21it/s][A
Training:  14%|█▍        | 9/65 [00:07<00:46,  1.21it/s][A
Training:  17%|█▋        | 11/65 [00:07<00:31,  1.72it/s][A
Training:  20%|██        | 13/65 [00:10<00:39,  1.32it/s][A
Training:  23%|██▎       | 15/65 [00:10<00:27,  1.85it/s][A
Training:  26%|██▌       | 17/65 [00:12<00:35,  1.35it/s][A
Training:  29%|██▉       | 19/65 [00:12<00:24,  1.88it/s][A
Training:  32%|███▏      | 21/65 [00:15<00:31,  1.40it/s][A
Training:  37%|███▋      | 24/65 [00:15<00:18,  2.21it/s][A
Training:  40%|████      | 26/65 [00:17<00:25,  1.51it/s][A
Training:  43%|████▎     | 28/65 [00:17<00:18,  2.04it/s][A
Training:  46%|████▌     | 30/65 [00:20<00:23,  1.47it/s][A
Training:  49%|████▉     | 32/65 [00:20<00:16,  2.01it/s][A
Training:  52%|█████▏    | 34/65 [00

Epoch: 39/77 - Loss: 13.3230 - Accuracy: 0.9429



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:02<00:20,  2.57s/it][A
 33%|███▎      | 3/9 [00:02<00:04,  1.42it/s][A
 56%|█████▌    | 5/9 [00:04<00:03,  1.12it/s][A
100%|██████████| 9/9 [00:05<00:00,  1.79it/s][A
Epochs:  51%|█████     | 39/77 [29:47<29:05, 45.94s/it]

Val Loss: 12.4990 - Val Accuracy: 0.9353



Training:   0%|          | 0/65 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/65 [00:02<03:02,  2.86s/it][A
Training:   5%|▍         | 3/65 [00:02<00:48,  1.28it/s][A
Training:   8%|▊         | 5/65 [00:05<00:57,  1.05it/s][A
Training:  11%|█         | 7/65 [00:05<00:33,  1.75it/s][A
Training:  14%|█▍        | 9/65 [00:07<00:45,  1.23it/s][A
Training:  18%|█▊        | 12/65 [00:07<00:24,  2.13it/s][A
Training:  22%|██▏       | 14/65 [00:10<00:33,  1.50it/s][A
Training:  25%|██▍       | 16/65 [00:10<00:23,  2.07it/s][A
Training:  28%|██▊       | 18/65 [00:12<00:32,  1.43it/s][A
Training:  31%|███       | 20/65 [00:12<00:22,  1.99it/s][A
Training:  34%|███▍      | 22/65 [00:14<00:29,  1.45it/s][A
Training:  37%|███▋      | 24/65 [00:15<00:20,  2.01it/s][A
Training:  40%|████      | 26/65 [00:17<00:27,  1.40it/s][A
Training:  45%|████▍     | 29/65 [00:19<00:26,  1.34it/s][A
Training:  49%|████▉     | 32/65 [00:20<00:16,  2.02it/s][A
Training:  52%|█████▏    | 34/65 [00:

Epoch: 40/77 - Loss: 12.6314 - Accuracy: 0.9419



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:02<00:21,  2.66s/it][A
 44%|████▍     | 4/9 [00:02<00:02,  1.86it/s][A
 67%|██████▋   | 6/9 [00:04<00:02,  1.33it/s][A
100%|██████████| 9/9 [00:05<00:00,  1.80it/s][A
Epochs:  52%|█████▏    | 40/77 [30:33<28:21, 45.97s/it]

Val Loss: 13.7615 - Val Accuracy: 0.9312



Training:   0%|          | 0/65 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/65 [00:02<03:02,  2.85s/it][A
Training:   5%|▍         | 3/65 [00:02<00:48,  1.29it/s][A
Training:   8%|▊         | 5/65 [00:05<00:58,  1.03it/s][A
Training:  12%|█▏        | 8/65 [00:05<00:27,  2.05it/s][A
Training:  15%|█▌        | 10/65 [00:07<00:39,  1.39it/s][A
Training:  18%|█▊        | 12/65 [00:07<00:26,  1.98it/s][A
Training:  22%|██▏       | 14/65 [00:10<00:35,  1.42it/s][A
Training:  26%|██▌       | 17/65 [00:12<00:35,  1.34it/s][A
Training:  29%|██▉       | 19/65 [00:12<00:25,  1.81it/s][A
Training:  32%|███▏      | 21/65 [00:14<00:31,  1.39it/s][A
Training:  35%|███▌      | 23/65 [00:15<00:22,  1.89it/s][A
Training:  38%|███▊      | 25/65 [00:17<00:28,  1.39it/s][A
Training:  42%|████▏     | 27/65 [00:17<00:19,  1.91it/s][A
Training:  45%|████▍     | 29/65 [00:19<00:24,  1.44it/s][A
Training:  48%|████▊     | 31/65 [00:19<00:17,  1.97it/s][A
Training:  51%|█████     | 33/65 [00

Epoch: 41/77 - Loss: 13.2519 - Accuracy: 0.9426



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:02<00:20,  2.58s/it][A
 33%|███▎      | 3/9 [00:02<00:04,  1.41it/s][A
 56%|█████▌    | 5/9 [00:04<00:03,  1.14it/s][A
100%|██████████| 9/9 [00:04<00:00,  1.80it/s][A
Epochs:  53%|█████▎    | 41/77 [31:19<27:32, 45.91s/it]

Val Loss: 15.8129 - Val Accuracy: 0.9343



Training:   0%|          | 0/65 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/65 [00:02<02:58,  2.78s/it][A
Training:   3%|▎         | 2/65 [00:02<01:16,  1.21s/it][A
Training:   8%|▊         | 5/65 [00:05<00:53,  1.12it/s][A
Training:  11%|█         | 7/65 [00:05<00:32,  1.81it/s][A
Training:  14%|█▍        | 9/65 [00:07<00:43,  1.28it/s][A
Training:  17%|█▋        | 11/65 [00:07<00:28,  1.89it/s][A
Training:  20%|██        | 13/65 [00:10<00:39,  1.33it/s][A
Training:  23%|██▎       | 15/65 [00:10<00:26,  1.88it/s][A
Training:  26%|██▌       | 17/65 [00:12<00:34,  1.40it/s][A
Training:  29%|██▉       | 19/65 [00:12<00:23,  1.96it/s][A
Training:  32%|███▏      | 21/65 [00:15<00:31,  1.39it/s][A
Training:  35%|███▌      | 23/65 [00:15<00:21,  1.94it/s][A
Training:  38%|███▊      | 25/65 [00:17<00:28,  1.41it/s][A
Training:  42%|████▏     | 27/65 [00:17<00:19,  1.97it/s][A
Training:  45%|████▍     | 29/65 [00:19<00:25,  1.41it/s][A
Training:  48%|████▊     | 31/65 [00:

Epoch: 42/77 - Loss: 13.7438 - Accuracy: 0.9390



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:02<00:19,  2.49s/it][A
 33%|███▎      | 3/9 [00:02<00:04,  1.46it/s][A
 56%|█████▌    | 5/9 [00:04<00:03,  1.13it/s][A
100%|██████████| 9/9 [00:04<00:00,  1.80it/s][A
Epochs:  55%|█████▍    | 42/77 [32:05<26:47, 45.94s/it]

Val Loss: 13.1582 - Val Accuracy: 0.9348



Training:   0%|          | 0/65 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/65 [00:02<03:02,  2.85s/it][A
Training:   6%|▌         | 4/65 [00:03<00:35,  1.72it/s][A
Training:   9%|▉         | 6/65 [00:05<00:48,  1.21it/s][A
Training:  12%|█▏        | 8/65 [00:05<00:30,  1.88it/s][A
Training:  15%|█▌        | 10/65 [00:07<00:42,  1.31it/s][A
Training:  18%|█▊        | 12/65 [00:07<00:27,  1.91it/s][A
Training:  22%|██▏       | 14/65 [00:10<00:37,  1.38it/s][A
Training:  25%|██▍       | 16/65 [00:10<00:25,  1.95it/s][A
Training:  28%|██▊       | 18/65 [00:12<00:33,  1.41it/s][A
Training:  31%|███       | 20/65 [00:12<00:22,  1.97it/s][A
Training:  34%|███▍      | 22/65 [00:15<00:30,  1.40it/s][A
Training:  37%|███▋      | 24/65 [00:15<00:21,  1.95it/s][A
Training:  40%|████      | 26/65 [00:17<00:27,  1.42it/s][A
Training:  43%|████▎     | 28/65 [00:17<00:18,  1.97it/s][A
Training:  46%|████▌     | 30/65 [00:19<00:24,  1.41it/s][A
Training:  49%|████▉     | 32/65 [00

Epoch: 43/77 - Loss: 12.9905 - Accuracy: 0.9389



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:02<00:20,  2.52s/it][A
 33%|███▎      | 3/9 [00:02<00:04,  1.44it/s][A
 56%|█████▌    | 5/9 [00:04<00:03,  1.10it/s][A
100%|██████████| 9/9 [00:05<00:00,  1.76it/s][A
Epochs:  56%|█████▌    | 43/77 [32:51<26:03, 45.99s/it]

Val Loss: 15.0182 - Val Accuracy: 0.9352



Training:   0%|          | 0/65 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/65 [00:02<02:54,  2.73s/it][A
Training:   5%|▍         | 3/65 [00:02<00:46,  1.34it/s][A
Training:   8%|▊         | 5/65 [00:05<00:58,  1.02it/s][A
Training:  12%|█▏        | 8/65 [00:05<00:27,  2.05it/s][A
Training:  15%|█▌        | 10/65 [00:07<00:38,  1.42it/s][A
Training:  18%|█▊        | 12/65 [00:07<00:26,  2.02it/s][A
Training:  22%|██▏       | 14/65 [00:10<00:36,  1.39it/s][A
Training:  26%|██▌       | 17/65 [00:12<00:35,  1.36it/s][A
Training:  29%|██▉       | 19/65 [00:12<00:25,  1.84it/s][A
Training:  32%|███▏      | 21/65 [00:14<00:31,  1.38it/s][A
Training:  37%|███▋      | 24/65 [00:15<00:19,  2.14it/s][A
Training:  40%|████      | 26/65 [00:17<00:25,  1.55it/s][A
Training:  45%|████▍     | 29/65 [00:19<00:24,  1.44it/s][A
Training:  48%|████▊     | 31/65 [00:19<00:17,  1.89it/s][A
Training:  51%|█████     | 33/65 [00:22<00:22,  1.42it/s][A
Training:  54%|█████▍    | 35/65 [00

Epoch: 44/77 - Loss: 12.8312 - Accuracy: 0.9443



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:02<00:20,  2.57s/it][A
 44%|████▍     | 4/9 [00:02<00:02,  1.92it/s][A
 67%|██████▋   | 6/9 [00:04<00:02,  1.35it/s][A
100%|██████████| 9/9 [00:04<00:00,  1.83it/s][A
Epochs:  57%|█████▋    | 44/77 [33:37<25:14, 45.90s/it]

Val Loss: 10.2883 - Val Accuracy: 0.9455



Training:   0%|          | 0/65 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/65 [00:02<02:56,  2.75s/it][A
Training:   5%|▍         | 3/65 [00:02<00:46,  1.33it/s][A
Training:   8%|▊         | 5/65 [00:05<00:58,  1.03it/s][A
Training:  12%|█▏        | 8/65 [00:05<00:27,  2.06it/s][A
Training:  15%|█▌        | 10/65 [00:07<00:38,  1.43it/s][A
Training:  18%|█▊        | 12/65 [00:07<00:25,  2.04it/s][A
Training:  22%|██▏       | 14/65 [00:10<00:35,  1.42it/s][A
Training:  25%|██▍       | 16/65 [00:10<00:24,  1.98it/s][A
Training:  28%|██▊       | 18/65 [00:12<00:33,  1.39it/s][A
Training:  31%|███       | 20/65 [00:12<00:23,  1.94it/s][A
Training:  34%|███▍      | 22/65 [00:15<00:30,  1.40it/s][A
Training:  37%|███▋      | 24/65 [00:15<00:21,  1.94it/s][A
Training:  40%|████      | 26/65 [00:17<00:27,  1.42it/s][A
Training:  43%|████▎     | 28/65 [00:17<00:18,  1.96it/s][A
Training:  46%|████▌     | 30/65 [00:19<00:24,  1.42it/s][A
Training:  51%|█████     | 33/65 [00

Epoch: 45/77 - Loss: 12.6402 - Accuracy: 0.9411



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:02<00:20,  2.61s/it][A
 44%|████▍     | 4/9 [00:02<00:02,  1.88it/s][A
 67%|██████▋   | 6/9 [00:04<00:02,  1.29it/s][A
100%|██████████| 9/9 [00:05<00:00,  1.75it/s][A
Epochs:  58%|█████▊    | 45/77 [34:23<24:29, 45.91s/it]

Val Loss: 12.5060 - Val Accuracy: 0.9388



Training:   0%|          | 0/65 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/65 [00:02<02:56,  2.75s/it][A
Training:   6%|▌         | 4/65 [00:02<00:34,  1.78it/s][A
Training:   9%|▉         | 6/65 [00:05<00:48,  1.21it/s][A
Training:  14%|█▍        | 9/65 [00:07<00:44,  1.25it/s][A
Training:  17%|█▋        | 11/65 [00:07<00:30,  1.77it/s][A
Training:  20%|██        | 13/65 [00:10<00:39,  1.31it/s][A
Training:  23%|██▎       | 15/65 [00:10<00:27,  1.84it/s][A
Training:  26%|██▌       | 17/65 [00:12<00:34,  1.40it/s][A
Training:  29%|██▉       | 19/65 [00:12<00:23,  1.94it/s][A
Training:  32%|███▏      | 21/65 [00:14<00:32,  1.37it/s][A
Training:  35%|███▌      | 23/65 [00:15<00:22,  1.91it/s][A
Training:  38%|███▊      | 25/65 [00:17<00:28,  1.41it/s][A
Training:  43%|████▎     | 28/65 [00:17<00:16,  2.22it/s][A
Training:  46%|████▌     | 30/65 [00:19<00:22,  1.53it/s][A
Training:  51%|█████     | 33/65 [00:22<00:22,  1.44it/s][A
Training:  54%|█████▍    | 35/65 [00

Epoch: 46/77 - Loss: 13.0210 - Accuracy: 0.9392



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:02<00:19,  2.45s/it][A
 33%|███▎      | 3/9 [00:02<00:04,  1.48it/s][A
 56%|█████▌    | 5/9 [00:04<00:03,  1.14it/s][A
100%|██████████| 9/9 [00:04<00:00,  1.81it/s][A
Epochs:  60%|█████▉    | 46/77 [35:09<23:42, 45.88s/it]

Val Loss: 12.4830 - Val Accuracy: 0.9398



Training:   0%|          | 0/65 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/65 [00:02<02:53,  2.71s/it][A
Training:   5%|▍         | 3/65 [00:02<00:46,  1.33it/s][A
Training:   8%|▊         | 5/65 [00:05<00:57,  1.03it/s][A
Training:  11%|█         | 7/65 [00:05<00:33,  1.72it/s][A
Training:  14%|█▍        | 9/65 [00:07<00:43,  1.28it/s][A
Training:  17%|█▋        | 11/65 [00:07<00:28,  1.88it/s][A
Training:  20%|██        | 13/65 [00:10<00:39,  1.33it/s][A
Training:  23%|██▎       | 15/65 [00:10<00:26,  1.90it/s][A
Training:  26%|██▌       | 17/65 [00:12<00:34,  1.39it/s][A
Training:  29%|██▉       | 19/65 [00:12<00:23,  1.95it/s][A
Training:  32%|███▏      | 21/65 [00:14<00:31,  1.38it/s][A
Training:  35%|███▌      | 23/65 [00:15<00:21,  1.93it/s][A
Training:  38%|███▊      | 25/65 [00:17<00:28,  1.41it/s][A
Training:  42%|████▏     | 27/65 [00:17<00:19,  1.96it/s][A
Training:  45%|████▍     | 29/65 [00:19<00:26,  1.38it/s][A
Training:  49%|████▉     | 32/65 [00:

Epoch: 47/77 - Loss: 13.9210 - Accuracy: 0.9426



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:02<00:19,  2.49s/it][A
 33%|███▎      | 3/9 [00:02<00:04,  1.45it/s][A
 56%|█████▌    | 5/9 [00:04<00:03,  1.13it/s][A
100%|██████████| 9/9 [00:04<00:00,  1.81it/s][A
Epochs:  61%|██████    | 47/77 [35:55<22:56, 45.89s/it]

Val Loss: 13.8206 - Val Accuracy: 0.9424



Training:   0%|          | 0/65 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/65 [00:02<02:55,  2.74s/it][A
Training:   5%|▍         | 3/65 [00:02<00:46,  1.33it/s][A
Training:   8%|▊         | 5/65 [00:05<00:57,  1.04it/s][A
Training:  11%|█         | 7/65 [00:05<00:33,  1.73it/s][A
Training:  14%|█▍        | 9/65 [00:07<00:44,  1.27it/s][A
Training:  18%|█▊        | 12/65 [00:07<00:24,  2.20it/s][A
Training:  22%|██▏       | 14/65 [00:10<00:34,  1.48it/s][A
Training:  26%|██▌       | 17/65 [00:12<00:34,  1.41it/s][A
Training:  31%|███       | 20/65 [00:12<00:21,  2.12it/s][A
Training:  34%|███▍      | 22/65 [00:14<00:28,  1.51it/s][A
Training:  38%|███▊      | 25/65 [00:17<00:28,  1.41it/s][A
Training:  43%|████▎     | 28/65 [00:17<00:18,  2.05it/s][A
Training:  46%|████▌     | 30/65 [00:19<00:23,  1.51it/s][A
Training:  51%|█████     | 33/65 [00:22<00:22,  1.44it/s][A
Training:  55%|█████▌    | 36/65 [00:22<00:14,  2.07it/s][A
Training:  58%|█████▊    | 38/65 [00:

Epoch: 48/77 - Loss: 13.2497 - Accuracy: 0.9411



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:02<00:20,  2.52s/it][A
 33%|███▎      | 3/9 [00:02<00:04,  1.45it/s][A
 56%|█████▌    | 5/9 [00:04<00:03,  1.11it/s][A
100%|██████████| 9/9 [00:05<00:00,  1.79it/s][A
Epochs:  62%|██████▏   | 48/77 [36:40<22:10, 45.87s/it]

Val Loss: 16.1571 - Val Accuracy: 0.9347



Training:   0%|          | 0/65 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/65 [00:02<03:00,  2.82s/it][A
Training:   5%|▍         | 3/65 [00:02<00:47,  1.30it/s][A
Training:   8%|▊         | 5/65 [00:05<00:57,  1.05it/s][A
Training:  11%|█         | 7/65 [00:05<00:33,  1.74it/s][A
Training:  14%|█▍        | 9/65 [00:07<00:45,  1.24it/s][A
Training:  17%|█▋        | 11/65 [00:07<00:29,  1.84it/s][A
Training:  20%|██        | 13/65 [00:10<00:38,  1.34it/s][A
Training:  25%|██▍       | 16/65 [00:10<00:22,  2.19it/s][A
Training:  28%|██▊       | 18/65 [00:12<00:31,  1.51it/s][A
Training:  32%|███▏      | 21/65 [00:14<00:30,  1.42it/s][A
Training:  37%|███▋      | 24/65 [00:15<00:19,  2.12it/s][A
Training:  40%|████      | 26/65 [00:17<00:25,  1.55it/s][A
Training:  45%|████▍     | 29/65 [00:19<00:25,  1.41it/s][A
Training:  48%|████▊     | 31/65 [00:19<00:18,  1.83it/s][A
Training:  51%|█████     | 33/65 [00:22<00:22,  1.43it/s][A
Training:  54%|█████▍    | 35/65 [00:

Epoch: 49/77 - Loss: 13.5202 - Accuracy: 0.9407



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:02<00:20,  2.58s/it][A
 44%|████▍     | 4/9 [00:02<00:02,  1.90it/s][A
 67%|██████▋   | 6/9 [00:04<00:02,  1.31it/s][A
100%|██████████| 9/9 [00:05<00:00,  1.78it/s][A
Epochs:  64%|██████▎   | 49/77 [37:26<21:24, 45.89s/it]

Val Loss: 13.4926 - Val Accuracy: 0.9408



Training:   0%|          | 0/65 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/65 [00:02<03:01,  2.83s/it][A
Training:   5%|▍         | 3/65 [00:02<00:48,  1.28it/s][A
Training:   8%|▊         | 5/65 [00:05<00:57,  1.04it/s][A
Training:  11%|█         | 7/65 [00:05<00:33,  1.71it/s][A
Training:  14%|█▍        | 9/65 [00:07<00:45,  1.24it/s][A
Training:  17%|█▋        | 11/65 [00:07<00:29,  1.84it/s][A
Training:  20%|██        | 13/65 [00:10<00:38,  1.36it/s][A
Training:  23%|██▎       | 15/65 [00:10<00:25,  1.95it/s][A
Training:  26%|██▌       | 17/65 [00:12<00:35,  1.37it/s][A
Training:  31%|███       | 20/65 [00:12<00:20,  2.19it/s][A
Training:  34%|███▍      | 22/65 [00:14<00:27,  1.55it/s][A
Training:  37%|███▋      | 24/65 [00:15<00:19,  2.10it/s][A
Training:  40%|████      | 26/65 [00:17<00:26,  1.47it/s][A
Training:  43%|████▎     | 28/65 [00:17<00:18,  2.01it/s][A
Training:  46%|████▌     | 30/65 [00:19<00:23,  1.47it/s][A
Training:  49%|████▉     | 32/65 [00:

Epoch: 50/77 - Loss: 14.0773 - Accuracy: 0.9391



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:02<00:20,  2.54s/it][A
 33%|███▎      | 3/9 [00:02<00:04,  1.44it/s][A
 56%|█████▌    | 5/9 [00:04<00:03,  1.11it/s][A
100%|██████████| 9/9 [00:05<00:00,  1.78it/s][A
Epochs:  65%|██████▍   | 50/77 [38:12<20:40, 45.95s/it]

Val Loss: 13.3031 - Val Accuracy: 0.9374



Training:   0%|          | 0/65 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/65 [00:02<02:55,  2.74s/it][A
Training:   5%|▍         | 3/65 [00:02<00:46,  1.33it/s][A
Training:   8%|▊         | 5/65 [00:05<00:58,  1.02it/s][A
Training:  11%|█         | 7/65 [00:05<00:33,  1.71it/s][A
Training:  14%|█▍        | 9/65 [00:07<00:44,  1.27it/s][A
Training:  17%|█▋        | 11/65 [00:07<00:28,  1.88it/s][A
Training:  20%|██        | 13/65 [00:10<00:38,  1.35it/s][A
Training:  23%|██▎       | 15/65 [00:10<00:25,  1.92it/s][A
Training:  26%|██▌       | 17/65 [00:12<00:34,  1.39it/s][A
Training:  29%|██▉       | 19/65 [00:12<00:23,  1.95it/s][A
Training:  32%|███▏      | 21/65 [00:14<00:31,  1.41it/s][A
Training:  35%|███▌      | 23/65 [00:14<00:21,  1.95it/s][A
Training:  38%|███▊      | 25/65 [00:17<00:28,  1.40it/s][A
Training:  42%|████▏     | 27/65 [00:17<00:19,  1.95it/s][A
Training:  45%|████▍     | 29/65 [00:19<00:25,  1.42it/s][A
Training:  48%|████▊     | 31/65 [00:

Epoch: 51/77 - Loss: 13.1765 - Accuracy: 0.9411



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:02<00:19,  2.49s/it][A
 33%|███▎      | 3/9 [00:02<00:04,  1.46it/s][A
 56%|█████▌    | 5/9 [00:04<00:03,  1.13it/s][A
100%|██████████| 9/9 [00:04<00:00,  1.80it/s][A
Epochs:  66%|██████▌   | 51/77 [38:58<19:55, 45.96s/it]

Val Loss: 13.0644 - Val Accuracy: 0.9317



Training:   0%|          | 0/65 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/65 [00:02<02:55,  2.75s/it][A
Training:   5%|▍         | 3/65 [00:02<00:46,  1.33it/s][A
Training:   8%|▊         | 5/65 [00:05<00:58,  1.03it/s][A
Training:  12%|█▏        | 8/65 [00:05<00:27,  2.05it/s][A
Training:  15%|█▌        | 10/65 [00:07<00:38,  1.43it/s][A
Training:  18%|█▊        | 12/65 [00:07<00:26,  2.04it/s][A
Training:  22%|██▏       | 14/65 [00:10<00:36,  1.40it/s][A
Training:  26%|██▌       | 17/65 [00:12<00:35,  1.34it/s][A
Training:  31%|███       | 20/65 [00:12<00:22,  2.04it/s][A
Training:  34%|███▍      | 22/65 [00:15<00:28,  1.49it/s][A
Training:  37%|███▋      | 24/65 [00:15<00:20,  1.98it/s][A
Training:  40%|████      | 26/65 [00:17<00:26,  1.48it/s][A
Training:  45%|████▍     | 29/65 [00:19<00:26,  1.37it/s][A
Training:  49%|████▉     | 32/65 [00:19<00:16,  2.02it/s][A
Training:  52%|█████▏    | 34/65 [00:22<00:20,  1.53it/s][A
Training:  55%|█████▌    | 36/65 [00

Epoch: 52/77 - Loss: 13.7599 - Accuracy: 0.9437



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:02<00:20,  2.53s/it][A
 44%|████▍     | 4/9 [00:02<00:02,  1.94it/s][A
 67%|██████▋   | 6/9 [00:04<00:02,  1.29it/s][A
100%|██████████| 9/9 [00:05<00:00,  1.78it/s][A
Epochs:  68%|██████▊   | 52/77 [39:44<19:08, 45.95s/it]

Val Loss: 15.1352 - Val Accuracy: 0.9369



Training:   0%|          | 0/65 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/65 [00:02<02:58,  2.78s/it][A
Training:   5%|▍         | 3/65 [00:02<00:47,  1.30it/s][A
Training:   8%|▊         | 5/65 [00:05<00:58,  1.03it/s][A
Training:  11%|█         | 7/65 [00:05<00:33,  1.71it/s][A
Training:  14%|█▍        | 9/65 [00:07<00:45,  1.24it/s][A
Training:  17%|█▋        | 11/65 [00:07<00:29,  1.84it/s][A
Training:  20%|██        | 13/65 [00:10<00:39,  1.32it/s][A
Training:  23%|██▎       | 15/65 [00:10<00:26,  1.89it/s][A
Training:  26%|██▌       | 17/65 [00:12<00:34,  1.37it/s][A
Training:  29%|██▉       | 19/65 [00:12<00:23,  1.92it/s][A
Training:  32%|███▏      | 21/65 [00:15<00:31,  1.39it/s][A
Training:  35%|███▌      | 23/65 [00:15<00:21,  1.94it/s][A
Training:  38%|███▊      | 25/65 [00:17<00:28,  1.40it/s][A
Training:  42%|████▏     | 27/65 [00:17<00:19,  1.95it/s][A
Training:  45%|████▍     | 29/65 [00:19<00:25,  1.41it/s][A
Training:  49%|████▉     | 32/65 [00:

Epoch: 53/77 - Loss: 13.5800 - Accuracy: 0.9418



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:02<00:21,  2.63s/it][A
 44%|████▍     | 4/9 [00:02<00:02,  1.87it/s][A
 67%|██████▋   | 6/9 [00:04<00:02,  1.29it/s][A
100%|██████████| 9/9 [00:05<00:00,  1.76it/s][A
Epochs:  69%|██████▉   | 53/77 [40:31<18:24, 46.01s/it]

Val Loss: 11.9559 - Val Accuracy: 0.9347



Training:   0%|          | 0/65 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/65 [00:02<03:00,  2.82s/it][A
Training:   5%|▍         | 3/65 [00:02<00:47,  1.30it/s][A
Training:   8%|▊         | 5/65 [00:05<00:57,  1.04it/s][A
Training:  11%|█         | 7/65 [00:05<00:33,  1.73it/s][A
Training:  14%|█▍        | 9/65 [00:07<00:45,  1.24it/s][A
Training:  17%|█▋        | 11/65 [00:07<00:29,  1.85it/s][A
Training:  20%|██        | 13/65 [00:10<00:38,  1.34it/s][A
Training:  23%|██▎       | 15/65 [00:10<00:26,  1.91it/s][A
Training:  26%|██▌       | 17/65 [00:12<00:35,  1.36it/s][A
Training:  29%|██▉       | 19/65 [00:12<00:24,  1.91it/s][A
Training:  32%|███▏      | 21/65 [00:14<00:31,  1.40it/s][A
Training:  37%|███▋      | 24/65 [00:15<00:18,  2.23it/s][A
Training:  40%|████      | 26/65 [00:17<00:25,  1.52it/s][A
Training:  45%|████▍     | 29/65 [00:19<00:25,  1.43it/s][A
Training:  49%|████▉     | 32/65 [00:19<00:15,  2.12it/s][A
Training:  52%|█████▏    | 34/65 [00:

Epoch: 54/77 - Loss: 13.4174 - Accuracy: 0.9401



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:02<00:20,  2.58s/it][A
 33%|███▎      | 3/9 [00:02<00:04,  1.42it/s][A
 56%|█████▌    | 5/9 [00:04<00:03,  1.14it/s][A
100%|██████████| 9/9 [00:04<00:00,  1.80it/s][A
Epochs:  70%|███████   | 54/77 [41:16<17:37, 45.97s/it]

Val Loss: 14.3327 - Val Accuracy: 0.9331



Training:   0%|          | 0/65 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/65 [00:02<02:58,  2.80s/it][A
Training:   5%|▍         | 3/65 [00:02<00:47,  1.31it/s][A
Training:   8%|▊         | 5/65 [00:05<00:57,  1.05it/s][A
Training:  12%|█▏        | 8/65 [00:05<00:27,  2.09it/s][A
Training:  15%|█▌        | 10/65 [00:07<00:40,  1.36it/s][A
Training:  20%|██        | 13/65 [00:10<00:38,  1.33it/s][A
Training:  25%|██▍       | 16/65 [00:10<00:23,  2.05it/s][A
Training:  28%|██▊       | 18/65 [00:12<00:31,  1.48it/s][A
Training:  32%|███▏      | 21/65 [00:15<00:31,  1.40it/s][A
Training:  37%|███▋      | 24/65 [00:15<00:19,  2.05it/s][A
Training:  40%|████      | 26/65 [00:17<00:25,  1.52it/s][A
Training:  43%|████▎     | 28/65 [00:17<00:18,  2.00it/s][A
Training:  46%|████▌     | 30/65 [00:19<00:23,  1.49it/s][A
Training:  49%|████▉     | 32/65 [00:19<00:16,  2.00it/s][A
Training:  52%|█████▏    | 34/65 [00:22<00:21,  1.43it/s][A
Training:  55%|█████▌    | 36/65 [00

Epoch: 55/77 - Loss: 13.3767 - Accuracy: 0.9431



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:02<00:20,  2.53s/it][A
 33%|███▎      | 3/9 [00:02<00:04,  1.44it/s][A
 56%|█████▌    | 5/9 [00:04<00:03,  1.12it/s][A
100%|██████████| 9/9 [00:05<00:00,  1.78it/s][A
Epochs:  71%|███████▏  | 55/77 [42:03<16:52, 46.01s/it]

Val Loss: 14.0614 - Val Accuracy: 0.9460



Training:   0%|          | 0/65 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/65 [00:02<02:50,  2.67s/it][A
Training:   5%|▍         | 3/65 [00:02<00:46,  1.35it/s][A
Training:   8%|▊         | 5/65 [00:05<00:58,  1.03it/s][A
Training:  11%|█         | 7/65 [00:05<00:33,  1.71it/s][A
Training:  14%|█▍        | 9/65 [00:07<00:44,  1.27it/s][A
Training:  17%|█▋        | 11/65 [00:07<00:28,  1.88it/s][A
Training:  20%|██        | 13/65 [00:10<00:39,  1.33it/s][A
Training:  23%|██▎       | 15/65 [00:10<00:26,  1.90it/s][A
Training:  26%|██▌       | 17/65 [00:12<00:34,  1.41it/s][A
Training:  29%|██▉       | 19/65 [00:12<00:23,  1.98it/s][A
Training:  32%|███▏      | 21/65 [00:14<00:31,  1.42it/s][A
Training:  34%|███▍      | 22/65 [00:14<00:26,  1.65it/s][A
Training:  38%|███▊      | 25/65 [00:17<00:26,  1.50it/s][A
Training:  40%|████      | 26/65 [00:17<00:22,  1.75it/s][A
Training:  45%|████▍     | 29/65 [00:19<00:23,  1.52it/s][A
Training:  48%|████▊     | 31/65 [00:

Epoch: 56/77 - Loss: 12.9772 - Accuracy: 0.9417



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:02<00:19,  2.50s/it][A
 44%|████▍     | 4/9 [00:02<00:02,  1.96it/s][A
 67%|██████▋   | 6/9 [00:04<00:02,  1.30it/s][A
100%|██████████| 9/9 [00:05<00:00,  1.78it/s][A
Epochs:  73%|███████▎  | 56/77 [42:48<16:05, 45.99s/it]

Val Loss: 15.9994 - Val Accuracy: 0.9384



Training:   0%|          | 0/65 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/65 [00:02<02:54,  2.73s/it][A
Training:   5%|▍         | 3/65 [00:02<00:46,  1.34it/s][A
Training:   8%|▊         | 5/65 [00:05<00:58,  1.02it/s][A
Training:  11%|█         | 7/65 [00:05<00:33,  1.71it/s][A
Training:  14%|█▍        | 9/65 [00:07<00:44,  1.27it/s][A
Training:  17%|█▋        | 11/65 [00:07<00:28,  1.89it/s][A
Training:  20%|██        | 13/65 [00:10<00:39,  1.32it/s][A
Training:  23%|██▎       | 15/65 [00:10<00:26,  1.89it/s][A
Training:  26%|██▌       | 17/65 [00:12<00:34,  1.38it/s][A
Training:  29%|██▉       | 19/65 [00:12<00:23,  1.94it/s][A
Training:  32%|███▏      | 21/65 [00:14<00:31,  1.38it/s][A
Training:  35%|███▌      | 23/65 [00:15<00:21,  1.93it/s][A
Training:  38%|███▊      | 25/65 [00:17<00:28,  1.42it/s][A
Training:  43%|████▎     | 28/65 [00:17<00:16,  2.24it/s][A
Training:  46%|████▌     | 30/65 [00:19<00:22,  1.53it/s][A
Training:  51%|█████     | 33/65 [00:

Epoch: 57/77 - Loss: 13.5644 - Accuracy: 0.9446



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:02<00:20,  2.59s/it][A
 44%|████▍     | 4/9 [00:02<00:02,  1.89it/s][A
 67%|██████▋   | 6/9 [00:04<00:02,  1.30it/s][A
100%|██████████| 9/9 [00:05<00:00,  1.76it/s][A
Epochs:  74%|███████▍  | 57/77 [43:35<15:20, 46.02s/it]

Val Loss: 13.0811 - Val Accuracy: 0.9369



Training:   0%|          | 0/65 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/65 [00:02<02:56,  2.76s/it][A
Training:   5%|▍         | 3/65 [00:02<00:47,  1.32it/s][A
Training:   8%|▊         | 5/65 [00:05<00:58,  1.02it/s][A
Training:  12%|█▏        | 8/65 [00:05<00:27,  2.05it/s][A
Training:  15%|█▌        | 10/65 [00:07<00:39,  1.39it/s][A
Training:  18%|█▊        | 12/65 [00:07<00:26,  1.98it/s][A
Training:  22%|██▏       | 14/65 [00:10<00:36,  1.41it/s][A
Training:  26%|██▌       | 17/65 [00:12<00:36,  1.32it/s][A
Training:  29%|██▉       | 19/65 [00:12<00:25,  1.79it/s][A
Training:  32%|███▏      | 21/65 [00:15<00:32,  1.36it/s][A
Training:  37%|███▋      | 24/65 [00:15<00:19,  2.11it/s][A
Training:  40%|████      | 26/65 [00:17<00:25,  1.50it/s][A
Training:  43%|████▎     | 28/65 [00:17<00:18,  2.01it/s][A
Training:  46%|████▌     | 30/65 [00:20<00:24,  1.45it/s][A
Training:  51%|█████     | 33/65 [00:22<00:23,  1.38it/s][A
Training:  55%|█████▌    | 36/65 [00

Epoch: 58/77 - Loss: 14.6045 - Accuracy: 0.9417



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:02<00:21,  2.65s/it][A
 33%|███▎      | 3/9 [00:02<00:04,  1.37it/s][A
 56%|█████▌    | 5/9 [00:04<00:03,  1.15it/s][A
100%|██████████| 9/9 [00:05<00:00,  1.79it/s][A
Epochs:  75%|███████▌  | 58/77 [44:21<14:35, 46.07s/it]

Val Loss: 13.8332 - Val Accuracy: 0.9419



Training:   0%|          | 0/65 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/65 [00:02<02:55,  2.74s/it][A
Training:   5%|▍         | 3/65 [00:02<00:46,  1.33it/s][A
Training:   8%|▊         | 5/65 [00:05<00:57,  1.04it/s][A
Training:  11%|█         | 7/65 [00:05<00:33,  1.71it/s][A
Training:  14%|█▍        | 9/65 [00:07<00:44,  1.24it/s][A
Training:  17%|█▋        | 11/65 [00:07<00:29,  1.85it/s][A
Training:  20%|██        | 13/65 [00:10<00:39,  1.33it/s][A
Training:  23%|██▎       | 15/65 [00:10<00:26,  1.90it/s][A
Training:  26%|██▌       | 17/65 [00:12<00:34,  1.38it/s][A
Training:  29%|██▉       | 19/65 [00:12<00:23,  1.94it/s][A
Training:  32%|███▏      | 21/65 [00:14<00:31,  1.40it/s][A
Training:  35%|███▌      | 23/65 [00:15<00:21,  1.94it/s][A
Training:  38%|███▊      | 25/65 [00:17<00:27,  1.43it/s][A
Training:  42%|████▏     | 27/65 [00:17<00:19,  1.98it/s][A
Training:  45%|████▍     | 29/65 [00:19<00:25,  1.39it/s][A
Training:  46%|████▌     | 30/65 [00:

Epoch: 59/77 - Loss: 13.8478 - Accuracy: 0.9436



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:02<00:20,  2.54s/it][A
 33%|███▎      | 3/9 [00:02<00:04,  1.41it/s][A
 56%|█████▌    | 5/9 [00:04<00:03,  1.12it/s][A
100%|██████████| 9/9 [00:05<00:00,  1.79it/s][A
Epochs:  77%|███████▋  | 59/77 [45:07<13:49, 46.11s/it]

Val Loss: 14.8312 - Val Accuracy: 0.9429



Training:   0%|          | 0/65 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/65 [00:02<03:02,  2.85s/it][A
Training:   5%|▍         | 3/65 [00:02<00:48,  1.29it/s][A
Training:   8%|▊         | 5/65 [00:05<00:57,  1.05it/s][A
Training:  12%|█▏        | 8/65 [00:05<00:27,  2.09it/s][A
Training:  15%|█▌        | 10/65 [00:07<00:39,  1.39it/s][A
Training:  20%|██        | 13/65 [00:10<00:38,  1.35it/s][A
Training:  25%|██▍       | 16/65 [00:10<00:23,  2.07it/s][A
Training:  28%|██▊       | 18/65 [00:12<00:31,  1.49it/s][A
Training:  31%|███       | 20/65 [00:12<00:22,  1.99it/s][A
Training:  34%|███▍      | 22/65 [00:14<00:29,  1.47it/s][A
Training:  37%|███▋      | 24/65 [00:15<00:20,  2.00it/s][A
Training:  40%|████      | 26/65 [00:17<00:27,  1.41it/s][A
Training:  45%|████▍     | 29/65 [00:19<00:26,  1.36it/s][A
Training:  48%|████▊     | 31/65 [00:19<00:18,  1.81it/s][A
Training:  51%|█████     | 33/65 [00:22<00:23,  1.39it/s][A
Training:  55%|█████▌    | 36/65 [00

Epoch: 60/77 - Loss: 13.7129 - Accuracy: 0.9439



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:02<00:21,  2.67s/it][A
 33%|███▎      | 3/9 [00:02<00:04,  1.35it/s][A
 56%|█████▌    | 5/9 [00:04<00:03,  1.10it/s][A
100%|██████████| 9/9 [00:05<00:00,  1.75it/s][A
Epochs:  78%|███████▊  | 60/77 [45:53<13:04, 46.14s/it]

Val Loss: 13.1789 - Val Accuracy: 0.9388



Training:   0%|          | 0/65 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/65 [00:02<02:59,  2.80s/it][A
Training:   5%|▍         | 3/65 [00:02<00:47,  1.30it/s][A
Training:   8%|▊         | 5/65 [00:05<00:58,  1.03it/s][A
Training:  12%|█▏        | 8/65 [00:05<00:27,  2.06it/s][A
Training:  15%|█▌        | 10/65 [00:07<00:40,  1.37it/s][A
Training:  20%|██        | 13/65 [00:10<00:38,  1.34it/s][A
Training:  23%|██▎       | 15/65 [00:10<00:27,  1.81it/s][A
Training:  26%|██▌       | 17/65 [00:12<00:35,  1.34it/s][A
Training:  29%|██▉       | 19/65 [00:12<00:24,  1.84it/s][A
Training:  32%|███▏      | 21/65 [00:15<00:31,  1.40it/s][A
Training:  35%|███▌      | 23/65 [00:15<00:21,  1.92it/s][A
Training:  38%|███▊      | 25/65 [00:17<00:29,  1.37it/s][A
Training:  42%|████▏     | 27/65 [00:17<00:20,  1.89it/s][A
Training:  45%|████▍     | 29/65 [00:20<00:25,  1.40it/s][A
Training:  48%|████▊     | 31/65 [00:20<00:17,  1.94it/s][A
Training:  51%|█████     | 33/65 [00

Epoch: 61/77 - Loss: 13.9704 - Accuracy: 0.9367



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:02<00:20,  2.58s/it][A
 33%|███▎      | 3/9 [00:02<00:04,  1.40it/s][A
 56%|█████▌    | 5/9 [00:04<00:03,  1.10it/s][A
100%|██████████| 9/9 [00:05<00:00,  1.76it/s][A
Epochs:  79%|███████▉  | 61/77 [46:40<12:19, 46.23s/it]

Val Loss: 13.1710 - Val Accuracy: 0.9348



Training:   0%|          | 0/65 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/65 [00:02<03:00,  2.82s/it][A
Training:   5%|▍         | 3/65 [00:02<00:48,  1.29it/s][A
Training:   8%|▊         | 5/65 [00:05<00:57,  1.04it/s][A
Training:  11%|█         | 7/65 [00:05<00:33,  1.73it/s][A
Training:  14%|█▍        | 9/65 [00:07<00:45,  1.24it/s][A
Training:  17%|█▋        | 11/65 [00:07<00:29,  1.84it/s][A
Training:  20%|██        | 13/65 [00:10<00:38,  1.33it/s][A
Training:  23%|██▎       | 15/65 [00:10<00:26,  1.90it/s][A
Training:  26%|██▌       | 17/65 [00:12<00:34,  1.38it/s][A
Training:  29%|██▉       | 19/65 [00:12<00:24,  1.91it/s][A
Training:  32%|███▏      | 21/65 [00:15<00:31,  1.40it/s][A
Training:  35%|███▌      | 23/65 [00:15<00:21,  1.94it/s][A
Training:  38%|███▊      | 25/65 [00:17<00:28,  1.40it/s][A
Training:  43%|████▎     | 28/65 [00:17<00:16,  2.22it/s][A
Training:  46%|████▌     | 30/65 [00:19<00:22,  1.53it/s][A
Training:  51%|█████     | 33/65 [00:

Epoch: 62/77 - Loss: 13.9942 - Accuracy: 0.9395



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:02<00:20,  2.60s/it][A
 33%|███▎      | 3/9 [00:02<00:04,  1.39it/s][A
 56%|█████▌    | 5/9 [00:04<00:03,  1.14it/s][A
100%|██████████| 9/9 [00:05<00:00,  1.80it/s][A
Epochs:  81%|████████  | 62/77 [47:25<11:32, 46.13s/it]

Val Loss: 17.1964 - Val Accuracy: 0.9170



Training:   0%|          | 0/65 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/65 [00:02<02:58,  2.80s/it][A
Training:   5%|▍         | 3/65 [00:02<00:47,  1.31it/s][A
Training:   8%|▊         | 5/65 [00:05<00:58,  1.03it/s][A
Training:  11%|█         | 7/65 [00:05<00:33,  1.71it/s][A
Training:  14%|█▍        | 9/65 [00:07<00:44,  1.25it/s][A
Training:  17%|█▋        | 11/65 [00:07<00:29,  1.85it/s][A
Training:  20%|██        | 13/65 [00:10<00:38,  1.36it/s][A
Training:  25%|██▍       | 16/65 [00:10<00:22,  2.22it/s][A
Training:  28%|██▊       | 18/65 [00:12<00:30,  1.52it/s][A
Training:  31%|███       | 20/65 [00:12<00:21,  2.06it/s][A
Training:  34%|███▍      | 22/65 [00:14<00:29,  1.47it/s][A
Training:  37%|███▋      | 24/65 [00:15<00:20,  2.02it/s][A
Training:  40%|████      | 26/65 [00:17<00:26,  1.45it/s][A
Training:  43%|████▎     | 28/65 [00:17<00:18,  2.00it/s][A
Training:  46%|████▌     | 30/65 [00:19<00:24,  1.43it/s][A
Training:  51%|█████     | 33/65 [00:

Epoch: 63/77 - Loss: 13.1681 - Accuracy: 0.9410



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:02<00:21,  2.66s/it][A
 44%|████▍     | 4/9 [00:02<00:02,  1.86it/s][A
 67%|██████▋   | 6/9 [00:04<00:02,  1.32it/s][A
100%|██████████| 9/9 [00:05<00:00,  1.78it/s][A
Epochs:  82%|████████▏ | 63/77 [48:12<10:45, 46.12s/it]

Val Loss: 13.1549 - Val Accuracy: 0.9226



Training:   0%|          | 0/65 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/65 [00:02<02:53,  2.71s/it][A
Training:   5%|▍         | 3/65 [00:02<00:46,  1.34it/s][A
Training:   8%|▊         | 5/65 [00:05<00:57,  1.04it/s][A
Training:  11%|█         | 7/65 [00:05<00:33,  1.73it/s][A
Training:  14%|█▍        | 9/65 [00:07<00:43,  1.28it/s][A
Training:  17%|█▋        | 11/65 [00:07<00:28,  1.90it/s][A
Training:  20%|██        | 13/65 [00:09<00:38,  1.35it/s][A
Training:  23%|██▎       | 15/65 [00:10<00:25,  1.94it/s][A
Training:  26%|██▌       | 17/65 [00:12<00:34,  1.38it/s][A
Training:  31%|███       | 20/65 [00:12<00:20,  2.22it/s][A
Training:  34%|███▍      | 22/65 [00:14<00:27,  1.55it/s][A
Training:  37%|███▋      | 24/65 [00:14<00:19,  2.10it/s][A
Training:  40%|████      | 26/65 [00:17<00:26,  1.48it/s][A
Training:  45%|████▍     | 29/65 [00:19<00:25,  1.41it/s][A
Training:  48%|████▊     | 31/65 [00:19<00:18,  1.88it/s][A
Training:  51%|█████     | 33/65 [00:

Epoch: 64/77 - Loss: 12.8562 - Accuracy: 0.9407



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:02<00:20,  2.55s/it][A
 44%|████▍     | 4/9 [00:02<00:02,  1.92it/s][A
 67%|██████▋   | 6/9 [00:04<00:02,  1.34it/s][A
100%|██████████| 9/9 [00:04<00:00,  1.81it/s][A
Epochs:  83%|████████▎ | 64/77 [48:57<09:57, 45.93s/it]

Val Loss: 13.0261 - Val Accuracy: 0.9364



Training:   0%|          | 0/65 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/65 [00:02<02:58,  2.80s/it][A
Training:   5%|▍         | 3/65 [00:02<00:47,  1.31it/s][A
Training:   8%|▊         | 5/65 [00:05<00:58,  1.03it/s][A
Training:  11%|█         | 7/65 [00:05<00:33,  1.71it/s][A
Training:  14%|█▍        | 9/65 [00:07<00:44,  1.26it/s][A
Training:  18%|█▊        | 12/65 [00:07<00:24,  2.17it/s][A
Training:  22%|██▏       | 14/65 [00:09<00:33,  1.53it/s][A
Training:  25%|██▍       | 16/65 [00:10<00:23,  2.11it/s][A
Training:  28%|██▊       | 18/65 [00:12<00:32,  1.46it/s][A
Training:  32%|███▏      | 21/65 [00:14<00:31,  1.40it/s][A
Training:  35%|███▌      | 23/65 [00:14<00:22,  1.87it/s][A
Training:  38%|███▊      | 25/65 [00:17<00:28,  1.40it/s][A
Training:  42%|████▏     | 27/65 [00:17<00:20,  1.88it/s][A
Training:  45%|████▍     | 29/65 [00:19<00:24,  1.45it/s][A
Training:  46%|████▌     | 30/65 [00:19<00:20,  1.68it/s][A
Training:  51%|█████     | 33/65 [00:

Epoch: 65/77 - Loss: 13.5660 - Accuracy: 0.9415



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:02<00:20,  2.61s/it][A
 33%|███▎      | 3/9 [00:02<00:04,  1.40it/s][A
 56%|█████▌    | 5/9 [00:04<00:03,  1.14it/s][A
100%|██████████| 9/9 [00:05<00:00,  1.80it/s][A
Epochs:  84%|████████▍ | 65/77 [49:43<09:09, 45.79s/it]

Val Loss: 15.5346 - Val Accuracy: 0.9312



Training:   0%|          | 0/65 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/65 [00:02<02:59,  2.80s/it][A
Training:   6%|▌         | 4/65 [00:02<00:34,  1.76it/s][A
Training:   9%|▉         | 6/65 [00:05<00:49,  1.19it/s][A
Training:  12%|█▏        | 8/65 [00:05<00:30,  1.86it/s][A
Training:  15%|█▌        | 10/65 [00:07<00:41,  1.31it/s][A
Training:  20%|██        | 13/65 [00:10<00:39,  1.32it/s][A
Training:  23%|██▎       | 15/65 [00:10<00:27,  1.82it/s][A
Training:  26%|██▌       | 17/65 [00:12<00:35,  1.34it/s][A
Training:  31%|███       | 20/65 [00:12<00:21,  2.10it/s][A
Training:  34%|███▍      | 22/65 [00:14<00:27,  1.56it/s][A
Training:  37%|███▋      | 24/65 [00:14<00:19,  2.10it/s][A
Training:  40%|████      | 26/65 [00:17<00:26,  1.46it/s][A
Training:  43%|████▎     | 28/65 [00:17<00:18,  1.99it/s][A
Training:  46%|████▌     | 30/65 [00:19<00:23,  1.47it/s][A
Training:  49%|████▉     | 32/65 [00:19<00:16,  2.01it/s][A
Training:  52%|█████▏    | 34/65 [00

Epoch: 66/77 - Loss: 13.0704 - Accuracy: 0.9428



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:02<00:20,  2.51s/it][A
 44%|████▍     | 4/9 [00:02<00:02,  1.96it/s][A
 67%|██████▋   | 6/9 [00:04<00:02,  1.32it/s][A
100%|██████████| 9/9 [00:05<00:00,  1.80it/s][A
Epochs:  86%|████████▌ | 66/77 [50:28<08:23, 45.75s/it]

Val Loss: 12.9803 - Val Accuracy: 0.9431



Training:   0%|          | 0/65 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/65 [00:02<02:53,  2.71s/it][A
Training:   5%|▍         | 3/65 [00:02<00:45,  1.35it/s][A
Training:   8%|▊         | 5/65 [00:05<00:57,  1.04it/s][A
Training:  11%|█         | 7/65 [00:05<00:33,  1.74it/s][A
Training:  14%|█▍        | 9/65 [00:07<00:43,  1.28it/s][A
Training:  17%|█▋        | 11/65 [00:07<00:28,  1.89it/s][A
Training:  20%|██        | 13/65 [00:09<00:38,  1.35it/s][A
Training:  23%|██▎       | 15/65 [00:10<00:25,  1.93it/s][A
Training:  26%|██▌       | 17/65 [00:12<00:34,  1.40it/s][A
Training:  29%|██▉       | 19/65 [00:12<00:23,  1.96it/s][A
Training:  32%|███▏      | 21/65 [00:14<00:31,  1.39it/s][A
Training:  35%|███▌      | 23/65 [00:14<00:21,  1.94it/s][A
Training:  38%|███▊      | 25/65 [00:17<00:27,  1.43it/s][A
Training:  42%|████▏     | 27/65 [00:17<00:19,  1.99it/s][A
Training:  45%|████▍     | 29/65 [00:19<00:25,  1.42it/s][A
Training:  48%|████▊     | 31/65 [00:

Epoch: 67/77 - Loss: 13.0023 - Accuracy: 0.9419



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:02<00:20,  2.57s/it][A
 33%|███▎      | 3/9 [00:02<00:04,  1.41it/s][A
 56%|█████▌    | 5/9 [00:04<00:03,  1.15it/s][A
100%|██████████| 9/9 [00:04<00:00,  1.80it/s][A
Epochs:  87%|████████▋ | 67/77 [51:14<07:36, 45.64s/it]

Val Loss: 12.6821 - Val Accuracy: 0.9465



Training:   0%|          | 0/65 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/65 [00:02<02:52,  2.70s/it][A
Training:   5%|▍         | 3/65 [00:02<00:45,  1.35it/s][A
Training:   8%|▊         | 5/65 [00:05<00:57,  1.04it/s][A
Training:  11%|█         | 7/65 [00:05<00:33,  1.73it/s][A
Training:  14%|█▍        | 9/65 [00:07<00:44,  1.26it/s][A
Training:  17%|█▋        | 11/65 [00:07<00:28,  1.88it/s][A
Training:  20%|██        | 13/65 [00:09<00:38,  1.36it/s][A
Training:  25%|██▍       | 16/65 [00:10<00:22,  2.22it/s][A
Training:  28%|██▊       | 18/65 [00:12<00:30,  1.52it/s][A
Training:  32%|███▏      | 21/65 [00:14<00:30,  1.44it/s][A
Training:  35%|███▌      | 23/65 [00:14<00:22,  1.90it/s][A
Training:  38%|███▊      | 25/65 [00:17<00:28,  1.40it/s][A
Training:  43%|████▎     | 28/65 [00:17<00:17,  2.14it/s][A
Training:  46%|████▌     | 30/65 [00:19<00:22,  1.57it/s][A
Training:  51%|█████     | 33/65 [00:22<00:22,  1.43it/s][A
Training:  55%|█████▌    | 36/65 [00:

Epoch: 68/77 - Loss: 14.0527 - Accuracy: 0.9443



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:02<00:20,  2.50s/it][A
 44%|████▍     | 4/9 [00:02<00:02,  1.97it/s][A
 67%|██████▋   | 6/9 [00:04<00:02,  1.32it/s][A
100%|██████████| 9/9 [00:04<00:00,  1.81it/s][A
Epochs:  88%|████████▊ | 68/77 [51:59<06:50, 45.64s/it]

Val Loss: 13.3395 - Val Accuracy: 0.9374



Training:   0%|          | 0/65 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/65 [00:02<02:57,  2.77s/it][A
Training:   6%|▌         | 4/65 [00:02<00:34,  1.77it/s][A
Training:   9%|▉         | 6/65 [00:05<00:48,  1.22it/s][A
Training:  14%|█▍        | 9/65 [00:07<00:44,  1.25it/s][A
Training:  18%|█▊        | 12/65 [00:07<00:26,  2.03it/s][A
Training:  22%|██▏       | 14/65 [00:10<00:35,  1.45it/s][A
Training:  26%|██▌       | 17/65 [00:12<00:34,  1.38it/s][A
Training:  31%|███       | 20/65 [00:12<00:21,  2.05it/s][A
Training:  34%|███▍      | 22/65 [00:14<00:28,  1.51it/s][A
Training:  38%|███▊      | 25/65 [00:17<00:27,  1.45it/s][A
Training:  42%|████▏     | 27/65 [00:17<00:20,  1.88it/s][A
Training:  45%|████▍     | 29/65 [00:19<00:25,  1.42it/s][A
Training:  48%|████▊     | 31/65 [00:19<00:17,  1.90it/s][A
Training:  51%|█████     | 33/65 [00:22<00:22,  1.43it/s][A
Training:  54%|█████▍    | 35/65 [00:22<00:15,  1.94it/s][A
Training:  57%|█████▋    | 37/65 [00

Epoch: 69/77 - Loss: 13.6844 - Accuracy: 0.9434



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:02<00:19,  2.43s/it][A
 33%|███▎      | 3/9 [00:02<00:04,  1.48it/s][A
 56%|█████▌    | 5/9 [00:04<00:03,  1.14it/s][A
100%|██████████| 9/9 [00:04<00:00,  1.83it/s][A
Epochs:  90%|████████▉ | 69/77 [52:45<06:04, 45.61s/it]

Val Loss: 15.2014 - Val Accuracy: 0.9379



Training:   0%|          | 0/65 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/65 [00:02<02:56,  2.76s/it][A
Training:   6%|▌         | 4/65 [00:02<00:34,  1.78it/s][A
Training:   9%|▉         | 6/65 [00:05<00:49,  1.20it/s][A
Training:  12%|█▏        | 8/65 [00:05<00:30,  1.87it/s][A
Training:  15%|█▌        | 10/65 [00:07<00:41,  1.32it/s][A
Training:  18%|█▊        | 12/65 [00:07<00:27,  1.93it/s][A
Training:  22%|██▏       | 14/65 [00:10<00:36,  1.38it/s][A
Training:  26%|██▌       | 17/65 [00:12<00:35,  1.33it/s][A
Training:  31%|███       | 20/65 [00:12<00:22,  2.04it/s][A
Training:  34%|███▍      | 22/65 [00:14<00:28,  1.51it/s][A
Training:  38%|███▊      | 25/65 [00:17<00:27,  1.44it/s][A
Training:  43%|████▎     | 28/65 [00:17<00:17,  2.10it/s][A
Training:  46%|████▌     | 30/65 [00:19<00:22,  1.53it/s][A
Training:  49%|████▉     | 32/65 [00:19<00:16,  2.01it/s][A
Training:  52%|█████▏    | 34/65 [00:22<00:20,  1.49it/s][A
Training:  57%|█████▋    | 37/65 [00

Epoch: 70/77 - Loss: 13.9037 - Accuracy: 0.9374



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:02<00:20,  2.52s/it][A
 33%|███▎      | 3/9 [00:02<00:04,  1.45it/s][A
 56%|█████▌    | 5/9 [00:04<00:03,  1.12it/s][A
100%|██████████| 9/9 [00:05<00:00,  1.79it/s][A
Epochs:  91%|█████████ | 70/77 [53:30<05:19, 45.64s/it]

Val Loss: 16.5725 - Val Accuracy: 0.9317



Training:   0%|          | 0/65 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/65 [00:02<02:57,  2.77s/it][A
Training:   5%|▍         | 3/65 [00:02<00:47,  1.32it/s][A
Training:   8%|▊         | 5/65 [00:05<00:57,  1.04it/s][A
Training:  11%|█         | 7/65 [00:05<00:33,  1.74it/s][A
Training:  14%|█▍        | 9/65 [00:07<00:44,  1.26it/s][A
Training:  17%|█▋        | 11/65 [00:07<00:28,  1.87it/s][A
Training:  20%|██        | 13/65 [00:10<00:38,  1.34it/s][A
Training:  23%|██▎       | 15/65 [00:10<00:26,  1.91it/s][A
Training:  26%|██▌       | 17/65 [00:12<00:34,  1.40it/s][A
Training:  31%|███       | 20/65 [00:12<00:20,  2.24it/s][A
Training:  34%|███▍      | 22/65 [00:14<00:27,  1.54it/s][A
Training:  37%|███▋      | 24/65 [00:15<00:19,  2.09it/s][A
Training:  40%|████      | 26/65 [00:17<00:26,  1.49it/s][A
Training:  43%|████▎     | 28/65 [00:17<00:18,  2.04it/s][A
Training:  46%|████▌     | 30/65 [00:19<00:24,  1.42it/s][A
Training:  49%|████▉     | 32/65 [00:

Epoch: 71/77 - Loss: 12.9655 - Accuracy: 0.9439



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:02<00:19,  2.46s/it][A
 33%|███▎      | 3/9 [00:02<00:04,  1.47it/s][A
 56%|█████▌    | 5/9 [00:04<00:03,  1.15it/s][A
100%|██████████| 9/9 [00:04<00:00,  1.83it/s][A
Epochs:  92%|█████████▏| 71/77 [54:16<04:33, 45.63s/it]

Val Loss: 14.2358 - Val Accuracy: 0.9297



Training:   0%|          | 0/65 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/65 [00:02<02:52,  2.69s/it][A
Training:   5%|▍         | 3/65 [00:02<00:45,  1.35it/s][A
Training:   8%|▊         | 5/65 [00:05<00:58,  1.02it/s][A
Training:  11%|█         | 7/65 [00:05<00:33,  1.71it/s][A
Training:  14%|█▍        | 9/65 [00:07<00:44,  1.27it/s][A
Training:  17%|█▋        | 11/65 [00:07<00:28,  1.89it/s][A
Training:  20%|██        | 13/65 [00:09<00:38,  1.36it/s][A
Training:  25%|██▍       | 16/65 [00:10<00:22,  2.22it/s][A
Training:  28%|██▊       | 18/65 [00:12<00:30,  1.53it/s][A
Training:  31%|███       | 20/65 [00:12<00:21,  2.08it/s][A
Training:  34%|███▍      | 22/65 [00:14<00:28,  1.50it/s][A
Training:  37%|███▋      | 24/65 [00:14<00:19,  2.06it/s][A
Training:  40%|████      | 26/65 [00:17<00:26,  1.45it/s][A
Training:  45%|████▍     | 29/65 [00:19<00:25,  1.40it/s][A
Training:  48%|████▊     | 31/65 [00:19<00:18,  1.86it/s][A
Training:  51%|█████     | 33/65 [00:

Epoch: 72/77 - Loss: 12.8171 - Accuracy: 0.9438



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:02<00:20,  2.62s/it][A
 44%|████▍     | 4/9 [00:02<00:02,  1.88it/s][A
 67%|██████▋   | 6/9 [00:04<00:02,  1.32it/s][A
100%|██████████| 9/9 [00:05<00:00,  1.79it/s][A
Epochs:  94%|█████████▎| 72/77 [55:02<03:47, 45.58s/it]

Val Loss: 14.1848 - Val Accuracy: 0.9353



Training:   0%|          | 0/65 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/65 [00:02<03:00,  2.82s/it][A
Training:   5%|▍         | 3/65 [00:02<00:47,  1.29it/s][A
Training:   8%|▊         | 5/65 [00:05<00:57,  1.04it/s][A
Training:  12%|█▏        | 8/65 [00:05<00:27,  2.07it/s][A
Training:  15%|█▌        | 10/65 [00:07<00:39,  1.41it/s][A
Training:  18%|█▊        | 12/65 [00:07<00:26,  2.01it/s][A
Training:  22%|██▏       | 14/65 [00:10<00:36,  1.41it/s][A
Training:  25%|██▍       | 16/65 [00:10<00:24,  1.98it/s][A
Training:  28%|██▊       | 18/65 [00:12<00:33,  1.41it/s][A
Training:  31%|███       | 20/65 [00:12<00:22,  1.96it/s][A
Training:  34%|███▍      | 22/65 [00:14<00:29,  1.44it/s][A
Training:  38%|███▊      | 25/65 [00:17<00:29,  1.35it/s][A
Training:  42%|████▏     | 27/65 [00:17<00:20,  1.81it/s][A
Training:  45%|████▍     | 29/65 [00:19<00:25,  1.39it/s][A
Training:  49%|████▉     | 32/65 [00:19<00:15,  2.14it/s][A
Training:  52%|█████▏    | 34/65 [00

Epoch: 73/77 - Loss: 13.5156 - Accuracy: 0.9408



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:02<00:21,  2.64s/it][A
 44%|████▍     | 4/9 [00:02<00:02,  1.86it/s][A
 67%|██████▋   | 6/9 [00:04<00:02,  1.29it/s][A
100%|██████████| 9/9 [00:05<00:00,  1.76it/s][A
Epochs:  95%|█████████▍| 73/77 [55:47<03:02, 45.67s/it]

Val Loss: 14.4453 - Val Accuracy: 0.9292



Training:   0%|          | 0/65 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/65 [00:02<02:58,  2.78s/it][A
Training:   5%|▍         | 3/65 [00:02<00:47,  1.31it/s][A
Training:   8%|▊         | 5/65 [00:05<00:57,  1.05it/s][A
Training:  11%|█         | 7/65 [00:05<00:33,  1.72it/s][A
Training:  14%|█▍        | 9/65 [00:07<00:44,  1.25it/s][A
Training:  17%|█▋        | 11/65 [00:07<00:29,  1.85it/s][A
Training:  20%|██        | 13/65 [00:10<00:38,  1.35it/s][A
Training:  23%|██▎       | 15/65 [00:10<00:26,  1.92it/s][A
Training:  26%|██▌       | 17/65 [00:12<00:34,  1.38it/s][A
Training:  29%|██▉       | 19/65 [00:12<00:23,  1.94it/s][A
Training:  32%|███▏      | 21/65 [00:14<00:31,  1.41it/s][A
Training:  35%|███▌      | 23/65 [00:14<00:21,  1.96it/s][A
Training:  38%|███▊      | 25/65 [00:17<00:28,  1.41it/s][A
Training:  42%|████▏     | 27/65 [00:17<00:19,  1.96it/s][A
Training:  45%|████▍     | 29/65 [00:19<00:24,  1.45it/s][A
Training:  48%|████▊     | 31/65 [00:

Epoch: 74/77 - Loss: 13.7002 - Accuracy: 0.9437



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:02<00:20,  2.57s/it][A
 33%|███▎      | 3/9 [00:02<00:04,  1.42it/s][A
 56%|█████▌    | 5/9 [00:04<00:03,  1.11it/s][A
100%|██████████| 9/9 [00:05<00:00,  1.77it/s][A
Epochs:  96%|█████████▌| 74/77 [56:33<02:17, 45.71s/it]

Val Loss: 17.9518 - Val Accuracy: 0.9333



Training:   0%|          | 0/65 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/65 [00:02<02:56,  2.76s/it][A
Training:   5%|▍         | 3/65 [00:02<00:46,  1.32it/s][A
Training:   8%|▊         | 5/65 [00:05<00:57,  1.04it/s][A
Training:  11%|█         | 7/65 [00:05<00:33,  1.72it/s][A
Training:  14%|█▍        | 9/65 [00:07<00:44,  1.26it/s][A
Training:  15%|█▌        | 10/65 [00:07<00:35,  1.55it/s][A
Training:  18%|█▊        | 12/65 [00:07<00:22,  2.36it/s][A
Training:  22%|██▏       | 14/65 [00:10<00:34,  1.46it/s][A
Training:  25%|██▍       | 16/65 [00:10<00:23,  2.12it/s][A
Training:  28%|██▊       | 18/65 [00:12<00:32,  1.45it/s][A
Training:  31%|███       | 20/65 [00:12<00:22,  2.05it/s][A
Training:  34%|███▍      | 22/65 [00:15<00:30,  1.42it/s][A
Training:  37%|███▋      | 24/65 [00:15<00:20,  1.99it/s][A
Training:  40%|████      | 26/65 [00:17<00:27,  1.43it/s][A
Training:  43%|████▎     | 28/65 [00:17<00:18,  1.99it/s][A
Training:  46%|████▌     | 30/65 [00:

Epoch: 75/77 - Loss: 13.3690 - Accuracy: 0.9380



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:02<00:20,  2.57s/it][A
 44%|████▍     | 4/9 [00:02<00:02,  1.91it/s][A
 67%|██████▋   | 6/9 [00:04<00:02,  1.30it/s][A
100%|██████████| 9/9 [00:05<00:00,  1.78it/s][A
Epochs:  97%|█████████▋| 75/77 [57:19<01:31, 45.81s/it]

Val Loss: 11.3973 - Val Accuracy: 0.9470



Training:   0%|          | 0/65 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/65 [00:02<03:06,  2.91s/it][A
Training:   6%|▌         | 4/65 [00:03<00:35,  1.70it/s][A
Training:   9%|▉         | 6/65 [00:05<00:48,  1.21it/s][A
Training:  12%|█▏        | 8/65 [00:05<00:30,  1.90it/s][A
Training:  15%|█▌        | 10/65 [00:07<00:42,  1.29it/s][A
Training:  20%|██        | 13/65 [00:10<00:40,  1.28it/s][A
Training:  23%|██▎       | 15/65 [00:10<00:28,  1.76it/s][A
Training:  26%|██▌       | 17/65 [00:12<00:35,  1.34it/s][A
Training:  29%|██▉       | 19/65 [00:12<00:24,  1.84it/s][A
Training:  32%|███▏      | 21/65 [00:15<00:31,  1.40it/s][A
Training:  35%|███▌      | 23/65 [00:15<00:21,  1.92it/s][A
Training:  38%|███▊      | 25/65 [00:17<00:28,  1.40it/s][A
Training:  42%|████▏     | 27/65 [00:17<00:19,  1.94it/s][A
Training:  45%|████▍     | 29/65 [00:19<00:25,  1.43it/s][A
Training:  48%|████▊     | 31/65 [00:19<00:17,  1.97it/s][A
Training:  51%|█████     | 33/65 [00

Epoch: 76/77 - Loss: 13.4752 - Accuracy: 0.9442



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:02<00:19,  2.50s/it][A
 44%|████▍     | 4/9 [00:02<00:02,  1.97it/s][A
 67%|██████▋   | 6/9 [00:04<00:02,  1.33it/s][A
100%|██████████| 9/9 [00:04<00:00,  1.81it/s][A
Epochs:  99%|█████████▊| 76/77 [58:05<00:45, 45.90s/it]

Val Loss: 16.2288 - Val Accuracy: 0.9414



Training:   0%|          | 0/65 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/65 [00:02<02:53,  2.71s/it][A
Training:   5%|▍         | 3/65 [00:02<00:46,  1.34it/s][A
Training:   8%|▊         | 5/65 [00:05<00:58,  1.03it/s][A
Training:  12%|█▏        | 8/65 [00:05<00:27,  2.05it/s][A
Training:  15%|█▌        | 10/65 [00:07<00:38,  1.42it/s][A
Training:  18%|█▊        | 12/65 [00:07<00:26,  2.02it/s][A
Training:  22%|██▏       | 14/65 [00:10<00:36,  1.42it/s][A
Training:  25%|██▍       | 16/65 [00:10<00:24,  1.99it/s][A
Training:  28%|██▊       | 18/65 [00:12<00:32,  1.45it/s][A
Training:  31%|███       | 20/65 [00:12<00:22,  2.01it/s][A
Training:  34%|███▍      | 22/65 [00:14<00:30,  1.39it/s][A
Training:  38%|███▊      | 25/65 [00:17<00:29,  1.36it/s][A
Training:  43%|████▎     | 28/65 [00:17<00:18,  2.05it/s][A
Training:  46%|████▌     | 30/65 [00:19<00:23,  1.49it/s][A
Training:  49%|████▉     | 32/65 [00:19<00:16,  1.98it/s][A
Training:  52%|█████▏    | 34/65 [00

Epoch: 77/77 - Loss: 14.4034 - Accuracy: 0.9376



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:02<00:20,  2.60s/it][A
 33%|███▎      | 3/9 [00:02<00:04,  1.41it/s][A
 56%|█████▌    | 5/9 [00:04<00:03,  1.13it/s][A
100%|██████████| 9/9 [00:05<00:00,  1.79it/s][A
Epochs: 100%|██████████| 77/77 [58:51<00:00, 45.86s/it]
[32m[I 2023-12-15 03:45:29,050][0m Trial 4 finished with value: 0.929314911365509 and parameters: {'learning_rate': 0.005636386581730127, 'weight_decay': 0.002103450540847856, 'epsilon': 9.093448187942482e-09, 'batch_size': 216, 'epochs': 77}. Best is trial 2 with value: 0.9405519962310791.[0m


Val Loss: 13.8939 - Val Accuracy: 0.9293
Learning rate: 0.003886358253060439
Weight decay: 0.0008526891911782017
Epsilon: 1.245899493377082e-08
Batch size: 148
Number of epochs: 25


Epochs:   0%|          | 0/25 [00:00<?, ?it/s]
Training:   0%|          | 0/95 [00:00<?, ?it/s][A
Training:   1%|          | 1/95 [00:02<03:08,  2.01s/it][A
Training:   4%|▍         | 4/95 [00:02<00:37,  2.43it/s][A
Training:   6%|▋         | 6/95 [00:03<00:50,  1.78it/s][A
Training:   9%|▉         | 9/95 [00:05<00:47,  1.80it/s][A
Training:  13%|█▎        | 12/95 [00:05<00:28,  2.89it/s][A
Training:  15%|█▍        | 14/95 [00:06<00:37,  2.16it/s][A
Training:  17%|█▋        | 16/95 [00:07<00:27,  2.87it/s][A
Training:  19%|█▉        | 18/95 [00:08<00:36,  2.11it/s][A
Training:  22%|██▏       | 21/95 [00:10<00:37,  2.00it/s][A
Training:  24%|██▍       | 23/95 [00:10<00:27,  2.62it/s][A
Training:  26%|██▋       | 25/95 [00:11<00:33,  2.08it/s][A
Training:  28%|██▊       | 27/95 [00:11<00:24,  2.78it/s][A
Training:  31%|███       | 29/95 [00:13<00:31,  2.06it/s][A
Training:  34%|███▎      | 32/95 [00:13<00:20,  3.14it/s][A
Training:  36%|███▌      | 34/95 [00:15<00:27,  2.2

Epoch: 1/25 - Loss: 7.1214 - Accuracy: 0.8409



  0%|          | 0/12 [00:00<?, ?it/s][A
  8%|▊         | 1/12 [00:01<00:19,  1.81s/it][A
 33%|███▎      | 4/12 [00:01<00:02,  2.68it/s][A
 50%|█████     | 6/12 [00:03<00:03,  1.88it/s][A
100%|██████████| 12/12 [00:05<00:00,  2.39it/s][A
Epochs:   0%|          | 0/25 [00:45<?, ?it/s]
[32m[I 2023-12-15 03:46:14,606][0m Trial 5 pruned. [0m


Val Loss: 5.5159 - Val Accuracy: 0.8949
Learning rate: 0.01582111238388192
Weight decay: 0.004824567100704621
Epsilon: 4.6928002671499806e-09
Batch size: 145
Number of epochs: 53


Epochs:   0%|          | 0/53 [00:00<?, ?it/s]
Training:   0%|          | 0/97 [00:00<?, ?it/s][A
Training:   1%|          | 1/97 [00:01<03:04,  1.92s/it][A
Training:   4%|▍         | 4/97 [00:02<00:36,  2.52it/s][A
Training:   6%|▌         | 6/97 [00:03<00:51,  1.76it/s][A
Training:   9%|▉         | 9/97 [00:05<00:49,  1.79it/s][A
Training:  12%|█▏        | 12/97 [00:05<00:29,  2.88it/s][A
Training:  14%|█▍        | 14/97 [00:06<00:38,  2.14it/s][A
Training:  18%|█▊        | 17/97 [00:08<00:39,  2.04it/s][A
Training:  21%|██        | 20/97 [00:08<00:25,  3.01it/s][A
Training:  23%|██▎       | 22/97 [00:10<00:33,  2.24it/s][A
Training:  26%|██▌       | 25/97 [00:11<00:34,  2.07it/s][A
Training:  29%|██▉       | 28/97 [00:11<00:23,  2.99it/s][A
Training:  31%|███       | 30/97 [00:13<00:29,  2.24it/s][A
Training:  34%|███▍      | 33/97 [00:15<00:31,  2.06it/s][A
Training:  37%|███▋      | 36/97 [00:15<00:20,  2.95it/s][A
Training:  39%|███▉      | 38/97 [00:16<00:26,  2.2

Epoch: 1/53 - Loss: 75.1551 - Accuracy: 0.8436



  0%|          | 0/13 [00:00<?, ?it/s][A
  8%|▊         | 1/13 [00:01<00:21,  1.83s/it][A
 31%|███       | 4/13 [00:01<00:03,  2.65it/s][A
 46%|████▌     | 6/13 [00:03<00:03,  1.92it/s][A
 69%|██████▉   | 9/13 [00:04<00:01,  2.09it/s][A
100%|██████████| 13/13 [00:04<00:00,  2.68it/s][A
Epochs:   0%|          | 0/53 [00:45<?, ?it/s]
[32m[I 2023-12-15 03:47:00,136][0m Trial 6 pruned. [0m


Val Loss: 108.1581 - Val Accuracy: 0.8902
Learning rate: 5.454745933133334e-05
Weight decay: 0.005275943553828053
Epsilon: 7.658475817508726e-08
Batch size: 273
Number of epochs: 74


Epochs:   0%|          | 0/74 [00:00<?, ?it/s]
Training:   0%|          | 0/52 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/52 [00:03<02:56,  3.46s/it][A
Training:   6%|▌         | 3/52 [00:03<00:46,  1.06it/s][A
Training:  10%|▉         | 5/52 [00:06<00:57,  1.21s/it][A
Training:  13%|█▎        | 7/52 [00:06<00:32,  1.38it/s][A
Training:  17%|█▋        | 9/52 [00:09<00:42,  1.00it/s][A
Training:  21%|██        | 11/52 [00:09<00:27,  1.49it/s][A
Training:  25%|██▌       | 13/52 [00:12<00:36,  1.08it/s][A
Training:  29%|██▉       | 15/52 [00:12<00:24,  1.53it/s][A
Training:  33%|███▎      | 17/52 [00:15<00:31,  1.10it/s][A
Training:  37%|███▋      | 19/52 [00:15<00:21,  1.55it/s][A
Training:  40%|████      | 21/52 [00:18<00:28,  1.10it/s][A
Training:  44%|████▍     | 23/52 [00:18<00:18,  1.54it/s][A
Training:  48%|████▊     | 25/52 [00:21<00:24,  1.10it/s][A
Training:  52%|█████▏    | 27/52 [00:22<00:16,  1.53it/s][A
Training:  56%|█████▌    | 29/52 [00:25<00:20,  1.10

Epoch: 1/74 - Loss: 6.9302 - Accuracy: 0.5647



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:03<00:18,  3.10s/it][A
 43%|████▎     | 3/7 [00:03<00:03,  1.18it/s][A
 71%|███████▏  | 5/7 [00:05<00:02,  1.06s/it][A
100%|██████████| 7/7 [00:05<00:00,  1.18it/s][A
Epochs:   0%|          | 0/74 [00:46<?, ?it/s]
[32m[I 2023-12-15 03:47:46,805][0m Trial 7 pruned. [0m


Val Loss: 5.1598 - Val Accuracy: 0.6331
Learning rate: 0.0029188373717898906
Weight decay: 0.005180504916971047
Epsilon: 1.160123268963261e-08
Batch size: 285
Number of epochs: 51


Epochs:   0%|          | 0/51 [00:00<?, ?it/s]
Training:   0%|          | 0/50 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/50 [00:03<02:55,  3.59s/it][A
Training:   6%|▌         | 3/50 [00:03<00:46,  1.02it/s][A
Training:  10%|█         | 5/50 [00:06<00:56,  1.26s/it][A
Training:  14%|█▍        | 7/50 [00:06<00:32,  1.33it/s][A
Training:  18%|█▊        | 9/50 [00:09<00:43,  1.05s/it][A
Training:  22%|██▏       | 11/50 [00:10<00:27,  1.42it/s][A
Training:  26%|██▌       | 13/50 [00:13<00:36,  1.02it/s][A
Training:  30%|███       | 15/50 [00:13<00:23,  1.46it/s][A
Training:  34%|███▍      | 17/50 [00:16<00:31,  1.06it/s][A
Training:  38%|███▊      | 19/50 [00:16<00:20,  1.48it/s][A
Training:  42%|████▏     | 21/50 [00:19<00:27,  1.07it/s][A
Training:  46%|████▌     | 23/50 [00:19<00:18,  1.50it/s][A
Training:  50%|█████     | 25/50 [00:22<00:23,  1.07it/s][A
Training:  54%|█████▍    | 27/50 [00:22<00:15,  1.49it/s][A
Training:  58%|█████▊    | 29/50 [00:25<00:19,  1.08

Epoch: 1/51 - Loss: 4.4280 - Accuracy: 0.8398



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:03<00:20,  3.35s/it][A
 43%|████▎     | 3/7 [00:03<00:03,  1.10it/s][A
100%|██████████| 7/7 [00:06<00:00,  1.11it/s][A
Epochs:   2%|▏         | 1/51 [00:48<40:05, 48.12s/it]

Val Loss: 3.9297 - Val Accuracy: 0.9066



Training:   0%|          | 0/50 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/50 [00:03<02:55,  3.59s/it][A
Training:   6%|▌         | 3/50 [00:03<00:46,  1.02it/s][A
Training:  10%|█         | 5/50 [00:06<00:55,  1.24s/it][A
Training:  12%|█▏        | 6/50 [00:06<00:41,  1.07it/s][A
Training:  16%|█▌        | 8/50 [00:06<00:23,  1.80it/s][A
Training:  18%|█▊        | 9/50 [00:09<00:46,  1.13s/it][A
Training:  20%|██        | 10/50 [00:10<00:35,  1.13it/s][A
Training:  24%|██▍       | 12/50 [00:10<00:20,  1.84it/s][A
Training:  26%|██▌       | 13/50 [00:13<00:39,  1.08s/it][A
Training:  28%|██▊       | 14/50 [00:13<00:30,  1.17it/s][A
Training:  32%|███▏      | 16/50 [00:13<00:17,  1.90it/s][A
Training:  34%|███▍      | 17/50 [00:16<00:35,  1.07s/it][A
Training:  36%|███▌      | 18/50 [00:16<00:26,  1.19it/s][A
Training:  40%|████      | 20/50 [00:16<00:15,  1.92it/s][A
Training:  42%|████▏     | 21/50 [00:19<00:31,  1.07s/it][A
Training:  44%|████▍     | 22/50 [00:1

Epoch: 2/51 - Loss: 3.7140 - Accuracy: 0.9129



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:03<00:19,  3.30s/it][A
 43%|████▎     | 3/7 [00:03<00:03,  1.11it/s][A
100%|██████████| 7/7 [00:06<00:00,  1.11it/s][A
Epochs:   4%|▍         | 2/51 [01:36<39:21, 48.19s/it]

Val Loss: 2.5814 - Val Accuracy: 0.9080



Training:   0%|          | 0/50 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/50 [00:03<02:59,  3.67s/it][A
Training:   6%|▌         | 3/50 [00:03<00:47,  1.00s/it][A
Training:  10%|█         | 5/50 [00:06<00:57,  1.29s/it][A
Training:  14%|█▍        | 7/50 [00:07<00:33,  1.30it/s][A
Training:  18%|█▊        | 9/50 [00:10<00:42,  1.04s/it][A
Training:  22%|██▏       | 11/50 [00:10<00:27,  1.42it/s][A
Training:  26%|██▌       | 13/50 [00:13<00:35,  1.04it/s][A
Training:  30%|███       | 15/50 [00:13<00:23,  1.49it/s][A
Training:  34%|███▍      | 17/50 [00:16<00:31,  1.05it/s][A
Training:  38%|███▊      | 19/50 [00:16<00:20,  1.48it/s][A
Training:  42%|████▏     | 21/50 [00:19<00:27,  1.06it/s][A
Training:  46%|████▌     | 23/50 [00:19<00:18,  1.48it/s][A
Training:  50%|█████     | 25/50 [00:22<00:23,  1.06it/s][A
Training:  54%|█████▍    | 27/50 [00:22<00:15,  1.48it/s][A
Training:  58%|█████▊    | 29/50 [00:26<00:19,  1.07it/s][A
Training:  62%|██████▏   | 31/50 [00:

Epoch: 3/51 - Loss: 3.0189 - Accuracy: 0.9245



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:03<00:19,  3.30s/it][A
 43%|████▎     | 3/7 [00:03<00:03,  1.11it/s][A
100%|██████████| 7/7 [00:06<00:00,  1.12it/s][A
Epochs:   6%|▌         | 3/51 [02:24<38:33, 48.20s/it]

Val Loss: 2.6529 - Val Accuracy: 0.9407



Training:   0%|          | 0/50 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/50 [00:03<02:49,  3.47s/it][A
Training:   6%|▌         | 3/50 [00:03<00:44,  1.05it/s][A
Training:  10%|█         | 5/50 [00:06<00:56,  1.25s/it][A
Training:  14%|█▍        | 7/50 [00:06<00:32,  1.34it/s][A
Training:  18%|█▊        | 9/50 [00:09<00:42,  1.04s/it][A
Training:  22%|██▏       | 11/50 [00:09<00:27,  1.44it/s][A
Training:  26%|██▌       | 13/50 [00:13<00:36,  1.02it/s][A
Training:  30%|███       | 15/50 [00:13<00:23,  1.46it/s][A
Training:  34%|███▍      | 17/50 [00:16<00:31,  1.04it/s][A
Training:  38%|███▊      | 19/50 [00:16<00:21,  1.46it/s][A
Training:  42%|████▏     | 21/50 [00:19<00:27,  1.06it/s][A
Training:  46%|████▌     | 23/50 [00:19<00:18,  1.48it/s][A
Training:  50%|█████     | 25/50 [00:22<00:23,  1.06it/s][A
Training:  54%|█████▍    | 27/50 [00:22<00:15,  1.48it/s][A
Training:  58%|█████▊    | 29/50 [00:25<00:19,  1.07it/s][A
Training:  62%|██████▏   | 31/50 [00:

Epoch: 4/51 - Loss: 3.1170 - Accuracy: 0.9197



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:03<00:19,  3.29s/it][A
 43%|████▎     | 3/7 [00:03<00:03,  1.11it/s][A
100%|██████████| 7/7 [00:06<00:00,  1.12it/s][A
Epochs:   8%|▊         | 4/51 [03:12<37:38, 48.06s/it]

Val Loss: 2.6209 - Val Accuracy: 0.9044



Training:   0%|          | 0/50 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/50 [00:03<02:52,  3.52s/it][A
Training:   6%|▌         | 3/50 [00:03<00:45,  1.03it/s][A
Training:  10%|█         | 5/50 [00:06<00:56,  1.25s/it][A
Training:  14%|█▍        | 7/50 [00:06<00:32,  1.34it/s][A
Training:  18%|█▊        | 9/50 [00:09<00:43,  1.06s/it][A
Training:  22%|██▏       | 11/50 [00:10<00:27,  1.41it/s][A
Training:  26%|██▌       | 13/50 [00:13<00:36,  1.01it/s][A
Training:  30%|███       | 15/50 [00:13<00:24,  1.45it/s][A
Training:  34%|███▍      | 17/50 [00:16<00:31,  1.05it/s][A
Training:  38%|███▊      | 19/50 [00:16<00:20,  1.48it/s][A
Training:  42%|████▏     | 21/50 [00:19<00:27,  1.06it/s][A
Training:  46%|████▌     | 23/50 [00:19<00:18,  1.49it/s][A
Training:  50%|█████     | 25/50 [00:22<00:23,  1.08it/s][A
Training:  54%|█████▍    | 27/50 [00:22<00:15,  1.51it/s][A
Training:  58%|█████▊    | 29/50 [00:25<00:19,  1.08it/s][A
Training:  62%|██████▏   | 31/50 [00:

Epoch: 5/51 - Loss: 4.3392 - Accuracy: 0.9057



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:03<00:19,  3.28s/it][A
 43%|████▎     | 3/7 [00:03<00:03,  1.12it/s][A
100%|██████████| 7/7 [00:06<00:00,  1.11it/s][A
Epochs:  10%|▉         | 5/51 [04:00<36:51, 48.08s/it]

Val Loss: 3.5280 - Val Accuracy: 0.9152



Training:   0%|          | 0/50 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/50 [00:03<02:53,  3.55s/it][A
Training:   6%|▌         | 3/50 [00:03<00:45,  1.03it/s][A
Training:  10%|█         | 5/50 [00:06<00:57,  1.28s/it][A
Training:  14%|█▍        | 7/50 [00:06<00:33,  1.30it/s][A
Training:  18%|█▊        | 9/50 [00:10<00:43,  1.06s/it][A
Training:  22%|██▏       | 11/50 [00:10<00:27,  1.41it/s][A
Training:  26%|██▌       | 13/50 [00:13<00:36,  1.02it/s][A
Training:  30%|███       | 15/50 [00:13<00:24,  1.46it/s][A
Training:  34%|███▍      | 17/50 [00:16<00:31,  1.06it/s][A
Training:  38%|███▊      | 19/50 [00:16<00:20,  1.49it/s][A
Training:  42%|████▏     | 21/50 [00:19<00:27,  1.07it/s][A
Training:  46%|████▌     | 23/50 [00:19<00:18,  1.49it/s][A
Training:  50%|█████     | 25/50 [00:22<00:23,  1.08it/s][A
Training:  54%|█████▍    | 27/50 [00:22<00:15,  1.50it/s][A
Training:  58%|█████▊    | 29/50 [00:25<00:19,  1.08it/s][A
Training:  62%|██████▏   | 31/50 [00:

Epoch: 6/51 - Loss: 3.4743 - Accuracy: 0.8994



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:03<00:19,  3.29s/it][A
 43%|████▎     | 3/7 [00:03<00:03,  1.11it/s][A
100%|██████████| 7/7 [00:06<00:00,  1.12it/s][A
Epochs:  12%|█▏        | 6/51 [04:48<36:06, 48.14s/it]

Val Loss: 3.1104 - Val Accuracy: 0.8216



Training:   0%|          | 0/50 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/50 [00:03<02:58,  3.64s/it][A
Training:   6%|▌         | 3/50 [00:03<00:46,  1.01it/s][A
Training:  10%|█         | 5/50 [00:06<00:56,  1.26s/it][A
Training:  14%|█▍        | 7/50 [00:06<00:32,  1.33it/s][A
Training:  18%|█▊        | 9/50 [00:09<00:42,  1.05s/it][A
Training:  22%|██▏       | 11/50 [00:10<00:27,  1.42it/s][A
Training:  26%|██▌       | 13/50 [00:13<00:36,  1.01it/s][A
Training:  30%|███       | 15/50 [00:13<00:24,  1.45it/s][A
Training:  34%|███▍      | 17/50 [00:16<00:31,  1.05it/s][A
Training:  38%|███▊      | 19/50 [00:16<00:21,  1.48it/s][A
Training:  42%|████▏     | 21/50 [00:19<00:27,  1.07it/s][A
Training:  46%|████▌     | 23/50 [00:19<00:18,  1.49it/s][A
Training:  50%|█████     | 25/50 [00:22<00:23,  1.07it/s][A
Training:  54%|█████▍    | 27/50 [00:22<00:15,  1.50it/s][A
Training:  58%|█████▊    | 29/50 [00:25<00:19,  1.08it/s][A
Training:  62%|██████▏   | 31/50 [00:

Epoch: 7/51 - Loss: 3.8530 - Accuracy: 0.9020



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:03<00:20,  3.34s/it][A
 43%|████▎     | 3/7 [00:03<00:03,  1.10it/s][A
100%|██████████| 7/7 [00:06<00:00,  1.12it/s][A
Epochs:  14%|█▎        | 7/51 [05:36<35:18, 48.14s/it]

Val Loss: 3.4756 - Val Accuracy: 0.9242



Training:   0%|          | 0/50 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/50 [00:03<02:57,  3.63s/it][A
Training:   6%|▌         | 3/50 [00:03<00:46,  1.01it/s][A
Training:  10%|█         | 5/50 [00:06<00:57,  1.29s/it][A
Training:  14%|█▍        | 7/50 [00:07<00:33,  1.30it/s][A
Training:  18%|█▊        | 9/50 [00:10<00:43,  1.06s/it][A
Training:  22%|██▏       | 11/50 [00:10<00:27,  1.41it/s][A
Training:  26%|██▌       | 13/50 [00:13<00:36,  1.01it/s][A
Training:  30%|███       | 15/50 [00:13<00:24,  1.46it/s][A
Training:  34%|███▍      | 17/50 [00:16<00:31,  1.04it/s][A
Training:  38%|███▊      | 19/50 [00:16<00:21,  1.47it/s][A
Training:  42%|████▏     | 21/50 [00:19<00:27,  1.06it/s][A
Training:  46%|████▌     | 23/50 [00:19<00:18,  1.48it/s][A
Training:  50%|█████     | 25/50 [00:22<00:23,  1.06it/s][A
Training:  54%|█████▍    | 27/50 [00:23<00:15,  1.48it/s][A
Training:  58%|█████▊    | 29/50 [00:26<00:19,  1.07it/s][A
Training:  62%|██████▏   | 31/50 [00:

Epoch: 8/51 - Loss: 3.6623 - Accuracy: 0.9106



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:03<00:19,  3.32s/it][A
 43%|████▎     | 3/7 [00:03<00:03,  1.10it/s][A
100%|██████████| 7/7 [00:06<00:00,  1.11it/s][A
Epochs:  16%|█▌        | 8/51 [06:25<34:32, 48.19s/it]

Val Loss: 3.1129 - Val Accuracy: 0.9388



Training:   0%|          | 0/50 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/50 [00:03<02:56,  3.60s/it][A
Training:   6%|▌         | 3/50 [00:03<00:46,  1.02it/s][A
Training:  10%|█         | 5/50 [00:06<00:56,  1.25s/it][A
Training:  14%|█▍        | 7/50 [00:06<00:32,  1.34it/s][A
Training:  18%|█▊        | 9/50 [00:09<00:42,  1.05s/it][A
Training:  22%|██▏       | 11/50 [00:10<00:27,  1.42it/s][A
Training:  26%|██▌       | 13/50 [00:13<00:36,  1.00it/s][A
Training:  30%|███       | 15/50 [00:13<00:24,  1.43it/s][A
Training:  34%|███▍      | 17/50 [00:16<00:32,  1.02it/s][A
Training:  38%|███▊      | 19/50 [00:16<00:21,  1.44it/s][A
Training:  42%|████▏     | 21/50 [00:19<00:27,  1.05it/s][A
Training:  46%|████▌     | 23/50 [00:19<00:18,  1.47it/s][A
Training:  50%|█████     | 25/50 [00:22<00:23,  1.06it/s][A
Training:  54%|█████▍    | 27/50 [00:23<00:15,  1.48it/s][A
Training:  58%|█████▊    | 29/50 [00:26<00:19,  1.07it/s][A
Training:  62%|██████▏   | 31/50 [00:

Epoch: 9/51 - Loss: 3.8618 - Accuracy: 0.9220



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:03<00:19,  3.33s/it][A
 43%|████▎     | 3/7 [00:03<00:03,  1.10it/s][A
100%|██████████| 7/7 [00:06<00:00,  1.12it/s][A
Epochs:  18%|█▊        | 9/51 [07:13<33:48, 48.29s/it]

Val Loss: 3.5101 - Val Accuracy: 0.8920



Training:   0%|          | 0/50 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/50 [00:03<02:57,  3.63s/it][A
Training:   6%|▌         | 3/50 [00:03<00:46,  1.01it/s][A
Training:  10%|█         | 5/50 [00:06<00:56,  1.26s/it][A
Training:  14%|█▍        | 7/50 [00:06<00:32,  1.32it/s][A
Training:  18%|█▊        | 9/50 [00:10<00:43,  1.05s/it][A
Training:  22%|██▏       | 11/50 [00:10<00:27,  1.41it/s][A
Training:  26%|██▌       | 13/50 [00:13<00:36,  1.02it/s][A
Training:  30%|███       | 15/50 [00:13<00:24,  1.46it/s][A
Training:  34%|███▍      | 17/50 [00:16<00:31,  1.05it/s][A
Training:  38%|███▊      | 19/50 [00:16<00:21,  1.48it/s][A
Training:  42%|████▏     | 21/50 [00:19<00:27,  1.06it/s][A
Training:  46%|████▌     | 23/50 [00:19<00:18,  1.49it/s][A
Training:  50%|█████     | 25/50 [00:22<00:23,  1.06it/s][A
Training:  54%|█████▍    | 27/50 [00:22<00:15,  1.48it/s][A
Training:  58%|█████▊    | 29/50 [00:26<00:19,  1.07it/s][A
Training:  62%|██████▏   | 31/50 [00:

Epoch: 10/51 - Loss: 4.1593 - Accuracy: 0.9260



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:03<00:19,  3.31s/it][A
 43%|████▎     | 3/7 [00:03<00:03,  1.11it/s][A
100%|██████████| 7/7 [00:06<00:00,  1.11it/s][A
Epochs:  20%|█▉        | 10/51 [08:02<33:02, 48.36s/it]

Val Loss: 4.1283 - Val Accuracy: 0.8213



Training:   0%|          | 0/50 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/50 [00:03<02:57,  3.62s/it][A
Training:   6%|▌         | 3/50 [00:03<00:46,  1.01it/s][A
Training:  10%|█         | 5/50 [00:06<00:56,  1.26s/it][A
Training:  14%|█▍        | 7/50 [00:06<00:32,  1.32it/s][A
Training:  18%|█▊        | 9/50 [00:10<00:43,  1.06s/it][A
Training:  22%|██▏       | 11/50 [00:10<00:27,  1.41it/s][A
Training:  26%|██▌       | 13/50 [00:13<00:36,  1.02it/s][A
Training:  30%|███       | 15/50 [00:13<00:24,  1.45it/s][A
Training:  34%|███▍      | 17/50 [00:16<00:31,  1.04it/s][A
Training:  38%|███▊      | 19/50 [00:16<00:21,  1.46it/s][A
Training:  42%|████▏     | 21/50 [00:19<00:27,  1.05it/s][A
Training:  46%|████▌     | 23/50 [00:19<00:18,  1.46it/s][A
Training:  50%|█████     | 25/50 [00:22<00:23,  1.07it/s][A
Training:  54%|█████▍    | 27/50 [00:23<00:15,  1.48it/s][A
Training:  58%|█████▊    | 29/50 [00:26<00:19,  1.07it/s][A
Training:  62%|██████▏   | 31/50 [00:

Epoch: 11/51 - Loss: 3.9676 - Accuracy: 0.9047



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:03<00:19,  3.33s/it][A
 43%|████▎     | 3/7 [00:03<00:03,  1.10it/s][A
100%|██████████| 7/7 [00:06<00:00,  1.12it/s][A
Epochs:  22%|██▏       | 11/51 [08:50<32:15, 48.38s/it]

Val Loss: 3.8410 - Val Accuracy: 0.9055



Training:   0%|          | 0/50 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/50 [00:03<02:54,  3.57s/it][A
Training:   6%|▌         | 3/50 [00:03<00:45,  1.02it/s][A
Training:  10%|█         | 5/50 [00:06<00:55,  1.23s/it][A
Training:  14%|█▍        | 7/50 [00:06<00:31,  1.36it/s][A
Training:  18%|█▊        | 9/50 [00:09<00:42,  1.03s/it][A
Training:  22%|██▏       | 11/50 [00:09<00:27,  1.43it/s][A
Training:  26%|██▌       | 13/50 [00:13<00:36,  1.02it/s][A
Training:  30%|███       | 15/50 [00:13<00:23,  1.46it/s][A
Training:  34%|███▍      | 17/50 [00:16<00:31,  1.05it/s][A
Training:  38%|███▊      | 19/50 [00:16<00:21,  1.47it/s][A
Training:  42%|████▏     | 21/50 [00:19<00:27,  1.06it/s][A
Training:  46%|████▌     | 23/50 [00:19<00:18,  1.49it/s][A
Training:  50%|█████     | 25/50 [00:22<00:23,  1.07it/s][A
Training:  54%|█████▍    | 27/50 [00:22<00:15,  1.49it/s][A
Training:  58%|█████▊    | 29/50 [00:25<00:19,  1.08it/s][A
Training:  62%|██████▏   | 31/50 [00:

Epoch: 12/51 - Loss: 6.3873 - Accuracy: 0.9225



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:03<00:19,  3.30s/it][A
 43%|████▎     | 3/7 [00:03<00:03,  1.11it/s][A
100%|██████████| 7/7 [00:06<00:00,  1.13it/s][A
Epochs:  24%|██▎       | 12/51 [09:38<31:23, 48.30s/it]

Val Loss: 5.9419 - Val Accuracy: 0.8929



Training:   0%|          | 0/50 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/50 [00:03<02:57,  3.63s/it][A
Training:   6%|▌         | 3/50 [00:03<00:46,  1.01it/s][A
Training:  10%|█         | 5/50 [00:06<00:56,  1.27s/it][A
Training:  14%|█▍        | 7/50 [00:06<00:32,  1.33it/s][A
Training:  18%|█▊        | 9/50 [00:09<00:42,  1.04s/it][A
Training:  22%|██▏       | 11/50 [00:10<00:27,  1.43it/s][A
Training:  26%|██▌       | 13/50 [00:13<00:36,  1.02it/s][A
Training:  30%|███       | 15/50 [00:13<00:23,  1.46it/s][A
Training:  34%|███▍      | 17/50 [00:16<00:31,  1.06it/s][A
Training:  38%|███▊      | 19/50 [00:16<00:20,  1.49it/s][A
Training:  42%|████▏     | 21/50 [00:19<00:27,  1.07it/s][A
Training:  46%|████▌     | 23/50 [00:19<00:18,  1.49it/s][A
Training:  50%|█████     | 25/50 [00:22<00:23,  1.07it/s][A
Training:  54%|█████▍    | 27/50 [00:22<00:15,  1.50it/s][A
Training:  58%|█████▊    | 29/50 [00:25<00:19,  1.07it/s][A
Training:  62%|██████▏   | 31/50 [00:

Epoch: 13/51 - Loss: 5.8898 - Accuracy: 0.8819



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:03<00:19,  3.18s/it][A
 43%|████▎     | 3/7 [00:03<00:03,  1.15it/s][A
100%|██████████| 7/7 [00:06<00:00,  1.16it/s][A
Epochs:  25%|██▌       | 13/51 [10:26<30:30, 48.18s/it]

Val Loss: 6.6722 - Val Accuracy: 0.8110



Training:   0%|          | 0/50 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/50 [00:03<02:55,  3.58s/it][A
Training:   6%|▌         | 3/50 [00:03<00:46,  1.01it/s][A
Training:  10%|█         | 5/50 [00:06<00:57,  1.27s/it][A
Training:  14%|█▍        | 7/50 [00:06<00:32,  1.31it/s][A
Training:  18%|█▊        | 9/50 [00:10<00:43,  1.05s/it][A
Training:  22%|██▏       | 11/50 [00:10<00:27,  1.42it/s][A
Training:  26%|██▌       | 13/50 [00:13<00:36,  1.00it/s][A
Training:  30%|███       | 15/50 [00:13<00:24,  1.43it/s][A
Training:  34%|███▍      | 17/50 [00:16<00:31,  1.04it/s][A
Training:  38%|███▊      | 19/50 [00:16<00:21,  1.46it/s][A
Training:  42%|████▏     | 21/50 [00:19<00:27,  1.05it/s][A
Training:  46%|████▌     | 23/50 [00:19<00:18,  1.47it/s][A
Training:  50%|█████     | 25/50 [00:22<00:23,  1.07it/s][A
Training:  54%|█████▍    | 27/50 [00:23<00:15,  1.49it/s][A
Training:  58%|█████▊    | 29/50 [00:26<00:19,  1.06it/s][A
Training:  62%|██████▏   | 31/50 [00:

Epoch: 14/51 - Loss: 8.0465 - Accuracy: 0.8929



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:03<00:19,  3.28s/it][A
 43%|████▎     | 3/7 [00:03<00:03,  1.11it/s][A
100%|██████████| 7/7 [00:06<00:00,  1.13it/s][A
Epochs:  27%|██▋       | 14/51 [11:15<29:44, 48.22s/it]

Val Loss: 3.9353 - Val Accuracy: 0.9235



Training:   0%|          | 0/50 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/50 [00:03<02:58,  3.64s/it][A
Training:   6%|▌         | 3/50 [00:03<00:46,  1.00it/s][A
Training:  10%|█         | 5/50 [00:06<00:58,  1.30s/it][A
Training:  14%|█▍        | 7/50 [00:07<00:33,  1.29it/s][A
Training:  18%|█▊        | 9/50 [00:10<00:42,  1.04s/it][A
Training:  20%|██        | 10/50 [00:10<00:33,  1.18it/s][A
Training:  24%|██▍       | 12/50 [00:10<00:21,  1.81it/s][A
Training:  26%|██▌       | 13/50 [00:13<00:39,  1.06s/it][A
Training:  28%|██▊       | 14/50 [00:13<00:30,  1.19it/s][A
Training:  32%|███▏      | 16/50 [00:13<00:18,  1.88it/s][A
Training:  34%|███▍      | 17/50 [00:16<00:35,  1.07s/it][A
Training:  36%|███▌      | 18/50 [00:16<00:27,  1.18it/s][A
Training:  40%|████      | 20/50 [00:16<00:15,  1.89it/s][A
Training:  42%|████▏     | 21/50 [00:19<00:31,  1.08s/it][A
Training:  46%|████▌     | 23/50 [00:19<00:18,  1.46it/s][A
Training:  50%|█████     | 25/50 [00:

Epoch: 15/51 - Loss: 4.5011 - Accuracy: 0.9284



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:03<00:19,  3.25s/it][A
 43%|████▎     | 3/7 [00:03<00:03,  1.13it/s][A
100%|██████████| 7/7 [00:06<00:00,  1.13it/s][A
Epochs:  29%|██▉       | 15/51 [12:03<28:55, 48.22s/it]

Val Loss: 3.9912 - Val Accuracy: 0.9352



Training:   0%|          | 0/50 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/50 [00:03<02:51,  3.51s/it][A
Training:   6%|▌         | 3/50 [00:03<00:45,  1.04it/s][A
Training:  10%|█         | 5/50 [00:06<00:55,  1.24s/it][A
Training:  12%|█▏        | 6/50 [00:06<00:41,  1.05it/s][A
Training:  16%|█▌        | 8/50 [00:06<00:23,  1.78it/s][A
Training:  18%|█▊        | 9/50 [00:09<00:46,  1.13s/it][A
Training:  22%|██▏       | 11/50 [00:10<00:27,  1.42it/s][A
Training:  26%|██▌       | 13/50 [00:13<00:36,  1.00it/s][A
Training:  30%|███       | 15/50 [00:13<00:23,  1.46it/s][A
Training:  34%|███▍      | 17/50 [00:16<00:31,  1.05it/s][A
Training:  38%|███▊      | 19/50 [00:16<00:20,  1.49it/s][A
Training:  42%|████▏     | 21/50 [00:19<00:27,  1.06it/s][A
Training:  46%|████▌     | 23/50 [00:19<00:18,  1.49it/s][A
Training:  50%|█████     | 25/50 [00:22<00:23,  1.08it/s][A
Training:  54%|█████▍    | 27/50 [00:22<00:15,  1.50it/s][A
Training:  58%|█████▊    | 29/50 [00:2

Epoch: 16/51 - Loss: 3.6750 - Accuracy: 0.9411



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:03<00:18,  3.17s/it][A
 43%|████▎     | 3/7 [00:03<00:03,  1.14it/s][A
100%|██████████| 7/7 [00:06<00:00,  1.15it/s][A
Epochs:  31%|███▏      | 16/51 [12:51<28:04, 48.12s/it]

Val Loss: 2.8725 - Val Accuracy: 0.9392



Training:   0%|          | 0/50 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/50 [00:03<02:55,  3.57s/it][A
Training:   6%|▌         | 3/50 [00:03<00:45,  1.03it/s][A
Training:  10%|█         | 5/50 [00:06<00:56,  1.26s/it][A
Training:  14%|█▍        | 7/50 [00:06<00:32,  1.33it/s][A
Training:  18%|█▊        | 9/50 [00:09<00:42,  1.05s/it][A
Training:  22%|██▏       | 11/50 [00:10<00:27,  1.43it/s][A
Training:  26%|██▌       | 13/50 [00:13<00:36,  1.02it/s][A
Training:  30%|███       | 15/50 [00:13<00:23,  1.47it/s][A
Training:  34%|███▍      | 17/50 [00:16<00:31,  1.05it/s][A
Training:  38%|███▊      | 19/50 [00:16<00:20,  1.48it/s][A
Training:  42%|████▏     | 21/50 [00:19<00:27,  1.07it/s][A
Training:  46%|████▌     | 23/50 [00:19<00:18,  1.50it/s][A
Training:  50%|█████     | 25/50 [00:22<00:23,  1.06it/s][A
Training:  54%|█████▍    | 27/50 [00:22<00:15,  1.48it/s][A
Training:  58%|█████▊    | 29/50 [00:25<00:19,  1.08it/s][A
Training:  62%|██████▏   | 31/50 [00:

Epoch: 17/51 - Loss: 2.9516 - Accuracy: 0.9374



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:03<00:19,  3.22s/it][A
 43%|████▎     | 3/7 [00:03<00:03,  1.14it/s][A
100%|██████████| 7/7 [00:06<00:00,  1.16it/s][A
Epochs:  33%|███▎      | 17/51 [13:39<27:14, 48.08s/it]

Val Loss: 2.9747 - Val Accuracy: 0.9287



Training:   0%|          | 0/50 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/50 [00:03<02:54,  3.57s/it][A
Training:   6%|▌         | 3/50 [00:03<00:45,  1.03it/s][A
Training:  10%|█         | 5/50 [00:06<00:57,  1.27s/it][A
Training:  14%|█▍        | 7/50 [00:06<00:32,  1.32it/s][A
Training:  18%|█▊        | 9/50 [00:10<00:43,  1.05s/it][A
Training:  22%|██▏       | 11/50 [00:10<00:27,  1.41it/s][A
Training:  26%|██▌       | 13/50 [00:13<00:36,  1.01it/s][A
Training:  30%|███       | 15/50 [00:13<00:24,  1.44it/s][A
Training:  34%|███▍      | 17/50 [00:16<00:32,  1.03it/s][A
Training:  38%|███▊      | 19/50 [00:16<00:21,  1.45it/s][A
Training:  42%|████▏     | 21/50 [00:19<00:27,  1.05it/s][A
Training:  46%|████▌     | 23/50 [00:19<00:18,  1.46it/s][A
Training:  50%|█████     | 25/50 [00:23<00:24,  1.04it/s][A
Training:  54%|█████▍    | 27/50 [00:23<00:15,  1.45it/s][A
Training:  58%|█████▊    | 29/50 [00:26<00:19,  1.06it/s][A
Training:  62%|██████▏   | 31/50 [00:

Epoch: 18/51 - Loss: 3.6170 - Accuracy: 0.9327



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:03<00:19,  3.23s/it][A
 43%|████▎     | 3/7 [00:03<00:03,  1.13it/s][A
100%|██████████| 7/7 [00:06<00:00,  1.15it/s][A
Epochs:  35%|███▌      | 18/51 [14:27<26:31, 48.22s/it]

Val Loss: 3.3966 - Val Accuracy: 0.9301



Training:   0%|          | 0/50 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/50 [00:03<02:57,  3.62s/it][A
Training:   6%|▌         | 3/50 [00:03<00:46,  1.01it/s][A
Training:  10%|█         | 5/50 [00:06<00:57,  1.28s/it][A
Training:  14%|█▍        | 7/50 [00:06<00:32,  1.31it/s][A
Training:  18%|█▊        | 9/50 [00:10<00:43,  1.06s/it][A
Training:  22%|██▏       | 11/50 [00:10<00:27,  1.41it/s][A
Training:  26%|██▌       | 13/50 [00:13<00:37,  1.01s/it][A
Training:  30%|███       | 15/50 [00:13<00:24,  1.42it/s][A
Training:  34%|███▍      | 17/50 [00:16<00:32,  1.02it/s][A
Training:  38%|███▊      | 19/50 [00:16<00:21,  1.43it/s][A
Training:  42%|████▏     | 21/50 [00:19<00:27,  1.06it/s][A
Training:  44%|████▍     | 22/50 [00:20<00:22,  1.24it/s][A
Training:  48%|████▊     | 24/50 [00:20<00:14,  1.81it/s][A
Training:  50%|█████     | 25/50 [00:23<00:25,  1.01s/it][A
Training:  52%|█████▏    | 26/50 [00:23<00:19,  1.20it/s][A
Training:  56%|█████▌    | 28/50 [00:

Epoch: 19/51 - Loss: 5.3872 - Accuracy: 0.9318



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:03<00:19,  3.26s/it][A
 43%|████▎     | 3/7 [00:03<00:03,  1.12it/s][A
100%|██████████| 7/7 [00:06<00:00,  1.15it/s][A
Epochs:  37%|███▋      | 19/51 [15:15<25:43, 48.23s/it]

Val Loss: 4.4629 - Val Accuracy: 0.9261



Training:   0%|          | 0/50 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/50 [00:03<02:57,  3.61s/it][A
Training:   6%|▌         | 3/50 [00:03<00:46,  1.02it/s][A
Training:  10%|█         | 5/50 [00:06<00:57,  1.28s/it][A
Training:  14%|█▍        | 7/50 [00:06<00:32,  1.31it/s][A
Training:  18%|█▊        | 9/50 [00:10<00:43,  1.06s/it][A
Training:  22%|██▏       | 11/50 [00:10<00:27,  1.41it/s][A
Training:  26%|██▌       | 13/50 [00:13<00:36,  1.01it/s][A
Training:  30%|███       | 15/50 [00:13<00:24,  1.44it/s][A
Training:  34%|███▍      | 17/50 [00:16<00:31,  1.04it/s][A
Training:  38%|███▊      | 19/50 [00:16<00:21,  1.47it/s][A
Training:  42%|████▏     | 21/50 [00:19<00:27,  1.06it/s][A
Training:  46%|████▌     | 23/50 [00:19<00:18,  1.49it/s][A
Training:  50%|█████     | 25/50 [00:22<00:23,  1.07it/s][A
Training:  54%|█████▍    | 27/50 [00:23<00:15,  1.49it/s][A
Training:  58%|█████▊    | 29/50 [00:26<00:19,  1.07it/s][A
Training:  62%|██████▏   | 31/50 [00:

Epoch: 20/51 - Loss: 4.9949 - Accuracy: 0.9325



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:03<00:19,  3.26s/it][A
 43%|████▎     | 3/7 [00:03<00:03,  1.12it/s][A
100%|██████████| 7/7 [00:06<00:00,  1.13it/s][A
Epochs:  39%|███▉      | 20/51 [16:04<24:55, 48.25s/it]

Val Loss: 3.9341 - Val Accuracy: 0.9387



Training:   0%|          | 0/50 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/50 [00:03<02:52,  3.52s/it][A
Training:   6%|▌         | 3/50 [00:03<00:45,  1.04it/s][A
Training:  10%|█         | 5/50 [00:06<00:57,  1.28s/it][A
Training:  14%|█▍        | 7/50 [00:06<00:32,  1.31it/s][A
Training:  18%|█▊        | 9/50 [00:10<00:43,  1.06s/it][A
Training:  22%|██▏       | 11/50 [00:10<00:27,  1.40it/s][A
Training:  26%|██▌       | 13/50 [00:13<00:36,  1.01it/s][A
Training:  30%|███       | 15/50 [00:13<00:24,  1.45it/s][A
Training:  34%|███▍      | 17/50 [00:16<00:32,  1.03it/s][A
Training:  38%|███▊      | 19/50 [00:16<00:21,  1.45it/s][A
Training:  42%|████▏     | 21/50 [00:19<00:27,  1.05it/s][A
Training:  46%|████▌     | 23/50 [00:19<00:18,  1.47it/s][A
Training:  50%|█████     | 25/50 [00:22<00:23,  1.06it/s][A
Training:  54%|█████▍    | 27/50 [00:23<00:15,  1.48it/s][A
Training:  58%|█████▊    | 29/50 [00:26<00:19,  1.06it/s][A
Training:  62%|██████▏   | 31/50 [00:

Epoch: 21/51 - Loss: 3.4673 - Accuracy: 0.9370



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:03<00:19,  3.30s/it][A
 43%|████▎     | 3/7 [00:03<00:03,  1.12it/s][A
100%|██████████| 7/7 [00:06<00:00,  1.13it/s][A
Epochs:  41%|████      | 21/51 [16:52<24:10, 48.35s/it]

Val Loss: 3.0553 - Val Accuracy: 0.9312



Training:   0%|          | 0/50 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/50 [00:03<02:54,  3.57s/it][A
Training:   6%|▌         | 3/50 [00:03<00:45,  1.03it/s][A
Training:  10%|█         | 5/50 [00:06<00:57,  1.27s/it][A
Training:  14%|█▍        | 7/50 [00:06<00:32,  1.31it/s][A
Training:  18%|█▊        | 9/50 [00:10<00:43,  1.05s/it][A
Training:  22%|██▏       | 11/50 [00:10<00:27,  1.41it/s][A
Training:  26%|██▌       | 13/50 [00:13<00:36,  1.02it/s][A
Training:  30%|███       | 15/50 [00:13<00:24,  1.46it/s][A
Training:  34%|███▍      | 17/50 [00:16<00:31,  1.05it/s][A
Training:  38%|███▊      | 19/50 [00:16<00:20,  1.48it/s][A
Training:  42%|████▏     | 21/50 [00:19<00:26,  1.08it/s][A
Training:  46%|████▌     | 23/50 [00:19<00:17,  1.50it/s][A
Training:  50%|█████     | 25/50 [00:22<00:23,  1.08it/s][A
Training:  54%|█████▍    | 27/50 [00:22<00:15,  1.50it/s][A
Training:  58%|█████▊    | 29/50 [00:25<00:19,  1.07it/s][A
Training:  62%|██████▏   | 31/50 [00:

Epoch: 22/51 - Loss: 3.7755 - Accuracy: 0.9333



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:03<00:18,  3.15s/it][A
 43%|████▎     | 3/7 [00:03<00:03,  1.15it/s][A
100%|██████████| 7/7 [00:06<00:00,  1.16it/s][A
Epochs:  43%|████▎     | 22/51 [17:40<23:19, 48.26s/it]

Val Loss: 3.4414 - Val Accuracy: 0.9261



Training:   0%|          | 0/50 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/50 [00:03<02:55,  3.58s/it][A
Training:   6%|▌         | 3/50 [00:03<00:45,  1.02it/s][A
Training:  10%|█         | 5/50 [00:06<00:56,  1.26s/it][A
Training:  14%|█▍        | 7/50 [00:06<00:32,  1.33it/s][A
Training:  18%|█▊        | 9/50 [00:09<00:43,  1.05s/it][A
Training:  20%|██        | 10/50 [00:10<00:34,  1.17it/s][A
Training:  24%|██▍       | 12/50 [00:10<00:21,  1.80it/s][A
Training:  26%|██▌       | 13/50 [00:13<00:39,  1.06s/it][A
Training:  30%|███       | 15/50 [00:13<00:24,  1.45it/s][A
Training:  34%|███▍      | 17/50 [00:16<00:32,  1.01it/s][A
Training:  38%|███▊      | 19/50 [00:16<00:21,  1.47it/s][A
Training:  42%|████▏     | 21/50 [00:19<00:27,  1.04it/s][A
Training:  46%|████▌     | 23/50 [00:19<00:18,  1.47it/s][A
Training:  50%|█████     | 25/50 [00:22<00:23,  1.06it/s][A
Training:  54%|█████▍    | 27/50 [00:22<00:15,  1.49it/s][A
Training:  58%|█████▊    | 29/50 [00:

Epoch: 23/51 - Loss: 3.3793 - Accuracy: 0.9420



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:03<00:18,  3.15s/it][A
 43%|████▎     | 3/7 [00:03<00:03,  1.16it/s][A
100%|██████████| 7/7 [00:05<00:00,  1.17it/s][A
Epochs:  43%|████▎     | 22/51 [18:28<24:21, 50.40s/it]
[32m[I 2023-12-15 04:06:15,775][0m Trial 8 pruned. [0m


Val Loss: 3.2549 - Val Accuracy: 0.9272
Learning rate: 0.01581821468524964
Weight decay: 0.0009021648335101662
Epsilon: 2.385849272257235e-09
Batch size: 203
Number of epochs: 85


Epochs:   0%|          | 0/85 [00:00<?, ?it/s]
Training:   0%|          | 0/69 [00:00<?, ?it/s][A
Training:   1%|▏         | 1/69 [00:02<02:57,  2.61s/it][A
Training:   4%|▍         | 3/69 [00:02<00:47,  1.40it/s][A
Training:   7%|▋         | 5/69 [00:04<00:57,  1.11it/s][A
Training:  12%|█▏        | 8/69 [00:05<00:27,  2.20it/s][A
Training:  14%|█▍        | 10/69 [00:07<00:38,  1.53it/s][A
Training:  19%|█▉        | 13/69 [00:09<00:39,  1.42it/s][A
Training:  23%|██▎       | 16/69 [00:09<00:24,  2.18it/s][A
Training:  26%|██▌       | 18/69 [00:11<00:32,  1.58it/s][A
Training:  30%|███       | 21/69 [00:14<00:31,  1.50it/s][A
Training:  33%|███▎      | 23/69 [00:14<00:23,  1.94it/s][A
Training:  36%|███▌      | 25/69 [00:16<00:29,  1.49it/s][A
Training:  39%|███▉      | 27/69 [00:16<00:21,  2.00it/s][A
Training:  42%|████▏     | 29/69 [00:18<00:26,  1.51it/s][A
Training:  45%|████▍     | 31/69 [00:18<00:18,  2.05it/s][A
Training:  48%|████▊     | 33/69 [00:20<00:23,  1.5

Epoch: 1/85 - Loss: 52.8115 - Accuracy: 0.7548



  0%|          | 0/9 [00:00<?, ?it/s][A
 11%|█         | 1/9 [00:02<00:19,  2.46s/it][A
 44%|████▍     | 4/9 [00:02<00:02,  2.01it/s][A
 67%|██████▋   | 6/9 [00:04<00:02,  1.42it/s][A
100%|██████████| 9/9 [00:05<00:00,  1.59it/s][A
Epochs:   0%|          | 0/85 [00:46<?, ?it/s]
[32m[I 2023-12-15 04:07:02,751][0m Trial 9 pruned. [0m


Val Loss: 50.1088 - Val Accuracy: 0.8850
Learning rate: 1.4539371411801274e-05
Weight decay: 0.00022165882053756236
Epsilon: 1.6952800184100311e-09
Batch size: 103
Number of epochs: 99


Epochs:   0%|          | 0/99 [00:00<?, ?it/s]
Training:   0%|          | 0/136 [00:00<?, ?it/s][A
Training:   1%|          | 1/136 [00:01<03:24,  1.52s/it][A
Training:   4%|▎         | 5/136 [00:02<01:01,  2.15it/s][A
Training:   7%|▋         | 9/136 [00:03<00:46,  2.72it/s][A
Training:  10%|▉         | 13/136 [00:05<00:41,  2.95it/s][A
Training:  12%|█▎        | 17/136 [00:06<00:38,  3.08it/s][A
Training:  15%|█▌        | 21/136 [00:07<00:35,  3.23it/s][A
Training:  18%|█▊        | 25/136 [00:08<00:33,  3.32it/s][A
Training:  21%|██▏       | 29/136 [00:09<00:32,  3.34it/s][A
Training:  24%|██▍       | 33/136 [00:10<00:30,  3.40it/s][A
Training:  27%|██▋       | 37/136 [00:11<00:28,  3.47it/s][A
Training:  30%|███       | 41/136 [00:13<00:27,  3.42it/s][A
Training:  33%|███▎      | 45/136 [00:14<00:26,  3.42it/s][A
Training:  36%|███▌      | 49/136 [00:15<00:24,  3.50it/s][A
Training:  39%|███▉      | 53/136 [00:16<00:23,  3.48it/s][A
Training:  42%|████▏     | 57/136 [

Epoch: 1/99 - Loss: 7.8706 - Accuracy: 0.5479



  0%|          | 0/17 [00:00<?, ?it/s][A
  6%|▌         | 1/17 [00:01<00:21,  1.36s/it][A
 29%|██▉       | 5/17 [00:02<00:04,  2.50it/s][A
 53%|█████▎    | 9/17 [00:03<00:02,  3.07it/s][A
 76%|███████▋  | 13/17 [00:04<00:01,  3.38it/s][A
100%|██████████| 17/17 [00:05<00:00,  3.18it/s][A
Epochs:   0%|          | 0/99 [00:45<?, ?it/s]
[32m[I 2023-12-15 04:07:48,053][0m Trial 10 pruned. [0m


Val Loss: 6.6390 - Val Accuracy: 0.6113
Learning rate: 0.0002823858251405799
Weight decay: 0.00036934903983322265
Epsilon: 4.3482407552971556e-09
Batch size: 89
Number of epochs: 38


Epochs:   0%|          | 0/38 [00:00<?, ?it/s]
Training:   0%|          | 0/157 [00:00<?, ?it/s][A
Training:   1%|          | 1/157 [00:01<03:14,  1.25s/it][A
Training:   3%|▎         | 5/157 [00:02<01:02,  2.43it/s][A
Training:   6%|▌         | 9/157 [00:03<00:46,  3.17it/s][A
Training:   8%|▊         | 13/157 [00:04<00:41,  3.48it/s][A
Training:  11%|█         | 17/157 [00:05<00:38,  3.62it/s][A
Training:  13%|█▎        | 21/157 [00:06<00:35,  3.81it/s][A
Training:  16%|█▌        | 25/157 [00:07<00:34,  3.80it/s][A
Training:  18%|█▊        | 29/157 [00:08<00:33,  3.87it/s][A
Training:  21%|██        | 33/157 [00:09<00:31,  3.91it/s][A
Training:  24%|██▎       | 37/157 [00:10<00:31,  3.86it/s][A
Training:  26%|██▌       | 41/157 [00:11<00:29,  3.91it/s][A
Training:  29%|██▊       | 45/157 [00:12<00:28,  3.91it/s][A
Training:  31%|███       | 49/157 [00:13<00:27,  3.87it/s][A
Training:  34%|███▍      | 53/157 [00:14<00:26,  4.00it/s][A
Training:  36%|███▋      | 57/157 [

Epoch: 1/38 - Loss: 3.6341 - Accuracy: 0.8224



  0%|          | 0/20 [00:00<?, ?it/s][A
  5%|▌         | 1/20 [00:01<00:22,  1.16s/it][A
 25%|██▌       | 5/20 [00:02<00:05,  2.70it/s][A
 45%|████▌     | 9/20 [00:02<00:03,  3.55it/s][A
 65%|██████▌   | 13/20 [00:03<00:01,  3.83it/s][A
100%|██████████| 20/20 [00:04<00:00,  4.17it/s][A
Epochs:   3%|▎         | 1/38 [00:45<27:53, 45.24s/it]

Val Loss: 2.2281 - Val Accuracy: 0.9012



Training:   0%|          | 0/157 [00:00<?, ?it/s][A
Training:   1%|          | 1/157 [00:01<03:11,  1.22s/it][A
Training:   3%|▎         | 5/157 [00:02<01:02,  2.42it/s][A
Training:   6%|▌         | 9/157 [00:03<00:47,  3.10it/s][A
Training:   8%|▊         | 13/157 [00:04<00:41,  3.43it/s][A
Training:  11%|█         | 17/157 [00:05<00:39,  3.55it/s][A
Training:  13%|█▎        | 21/157 [00:06<00:36,  3.77it/s][A
Training:  16%|█▌        | 25/157 [00:07<00:34,  3.79it/s][A
Training:  18%|█▊        | 29/157 [00:08<00:33,  3.82it/s][A
Training:  21%|██        | 33/157 [00:09<00:31,  3.95it/s][A
Training:  24%|██▎       | 37/157 [00:10<00:31,  3.84it/s][A
Training:  26%|██▌       | 41/157 [00:11<00:29,  3.95it/s][A
Training:  29%|██▊       | 45/157 [00:12<00:28,  3.94it/s][A
Training:  31%|███       | 49/157 [00:13<00:27,  3.91it/s][A
Training:  34%|███▍      | 53/157 [00:14<00:25,  4.00it/s][A
Training:  36%|███▋      | 57/157 [00:15<00:25,  3.90it/s][A
Training:  39%|███▉

Epoch: 2/38 - Loss: 1.8041 - Accuracy: 0.9138



  0%|          | 0/20 [00:00<?, ?it/s][A
  5%|▌         | 1/20 [00:01<00:23,  1.23s/it][A
 25%|██▌       | 5/20 [00:02<00:05,  2.70it/s][A
 45%|████▌     | 9/20 [00:03<00:03,  3.46it/s][A
 65%|██████▌   | 13/20 [00:03<00:01,  3.82it/s][A
100%|██████████| 20/20 [00:04<00:00,  4.11it/s][A
Epochs:   5%|▌         | 2/38 [01:30<27:12, 45.34s/it]

Val Loss: 1.6194 - Val Accuracy: 0.9169



Training:   0%|          | 0/157 [00:00<?, ?it/s][A
Training:   1%|          | 1/157 [00:01<03:28,  1.34s/it][A
Training:   3%|▎         | 5/157 [00:02<01:03,  2.40it/s][A
Training:   6%|▌         | 9/157 [00:03<00:47,  3.13it/s][A
Training:   8%|▊         | 13/157 [00:04<00:42,  3.39it/s][A
Training:  11%|█         | 17/157 [00:05<00:38,  3.64it/s][A
Training:  13%|█▎        | 21/157 [00:06<00:35,  3.79it/s][A
Training:  16%|█▌        | 25/157 [00:07<00:34,  3.79it/s][A
Training:  18%|█▊        | 29/157 [00:08<00:32,  3.92it/s][A
Training:  21%|██        | 33/157 [00:09<00:32,  3.84it/s][A
Training:  24%|██▎       | 37/157 [00:10<00:30,  3.96it/s][A
Training:  26%|██▌       | 41/157 [00:11<00:29,  3.97it/s][A
Training:  29%|██▊       | 45/157 [00:12<00:28,  3.92it/s][A
Training:  31%|███       | 49/157 [00:13<00:26,  4.04it/s][A
Training:  34%|███▍      | 53/157 [00:14<00:26,  3.97it/s][A
Training:  36%|███▋      | 57/157 [00:15<00:24,  4.12it/s][A
Training:  38%|███▊

Epoch: 3/38 - Loss: 1.4450 - Accuracy: 0.9248



  0%|          | 0/20 [00:00<?, ?it/s][A
  5%|▌         | 1/20 [00:01<00:22,  1.19s/it][A
 25%|██▌       | 5/20 [00:02<00:05,  2.81it/s][A
 45%|████▌     | 9/20 [00:02<00:03,  3.42it/s][A
 65%|██████▌   | 13/20 [00:03<00:01,  3.92it/s][A
100%|██████████| 20/20 [00:04<00:00,  4.12it/s][A
Epochs:   8%|▊         | 3/38 [02:15<26:26, 45.33s/it]

Val Loss: 1.2606 - Val Accuracy: 0.9321



Training:   0%|          | 0/157 [00:00<?, ?it/s][A
Training:   1%|          | 1/157 [00:01<03:30,  1.35s/it][A
Training:   3%|▎         | 5/157 [00:02<01:01,  2.47it/s][A
Training:   6%|▌         | 9/157 [00:03<00:47,  3.11it/s][A
Training:   8%|▊         | 13/157 [00:04<00:42,  3.37it/s][A
Training:  11%|█         | 17/157 [00:05<00:37,  3.69it/s][A
Training:  13%|█▎        | 20/157 [00:05<00:27,  4.96it/s][A
Training:  14%|█▍        | 22/157 [00:06<00:35,  3.80it/s][A
Training:  16%|█▌        | 25/157 [00:07<00:37,  3.56it/s][A
Training:  18%|█▊        | 29/157 [00:08<00:34,  3.72it/s][A
Training:  21%|██        | 33/157 [00:09<00:32,  3.76it/s][A
Training:  24%|██▎       | 37/157 [00:10<00:30,  3.96it/s][A
Training:  26%|██▌       | 41/157 [00:11<00:29,  3.92it/s][A
Training:  29%|██▊       | 45/157 [00:12<00:28,  3.93it/s][A
Training:  30%|██▉       | 47/157 [00:12<00:23,  4.61it/s][A
Training:  31%|███       | 49/157 [00:13<00:28,  3.80it/s][A
Training:  34%|███▍

Epoch: 4/38 - Loss: 1.1630 - Accuracy: 0.9351



  0%|          | 0/20 [00:00<?, ?it/s][A
  5%|▌         | 1/20 [00:01<00:22,  1.17s/it][A
 25%|██▌       | 5/20 [00:02<00:05,  2.69it/s][A
 45%|████▌     | 9/20 [00:02<00:03,  3.48it/s][A
 65%|██████▌   | 13/20 [00:03<00:01,  3.82it/s][A
100%|██████████| 20/20 [00:04<00:00,  4.10it/s][A
Epochs:  11%|█         | 4/38 [03:01<25:40, 45.31s/it]

Val Loss: 1.2331 - Val Accuracy: 0.9309



Training:   0%|          | 0/157 [00:00<?, ?it/s][A
Training:   1%|          | 1/157 [00:01<03:21,  1.29s/it][A
Training:   3%|▎         | 5/157 [00:02<01:03,  2.39it/s][A
Training:   6%|▌         | 9/157 [00:03<00:46,  3.21it/s][A
Training:   8%|▊         | 12/157 [00:03<00:30,  4.77it/s][A
Training:   9%|▉         | 14/157 [00:04<00:39,  3.59it/s][A
Training:  11%|█         | 17/157 [00:05<00:41,  3.40it/s][A
Training:  12%|█▏        | 19/157 [00:05<00:32,  4.26it/s][A
Training:  13%|█▎        | 21/157 [00:06<00:38,  3.56it/s][A
Training:  15%|█▍        | 23/157 [00:06<00:29,  4.52it/s][A
Training:  16%|█▌        | 25/157 [00:07<00:38,  3.43it/s][A
Training:  18%|█▊        | 28/157 [00:07<00:25,  5.10it/s][A
Training:  19%|█▉        | 30/157 [00:08<00:32,  3.88it/s][A
Training:  21%|██        | 33/157 [00:09<00:34,  3.59it/s][A
Training:  22%|██▏       | 35/157 [00:09<00:27,  4.41it/s][A
Training:  24%|██▎       | 37/157 [00:10<00:32,  3.67it/s][A
Training:  24%|██▍ 

Epoch: 5/38 - Loss: 1.0796 - Accuracy: 0.9356



  0%|          | 0/20 [00:00<?, ?it/s][A
  5%|▌         | 1/20 [00:01<00:23,  1.25s/it][A
 25%|██▌       | 5/20 [00:02<00:05,  2.80it/s][A
 40%|████      | 8/20 [00:02<00:02,  4.91it/s][A
 50%|█████     | 10/20 [00:03<00:02,  3.65it/s][A
 65%|██████▌   | 13/20 [00:03<00:01,  3.62it/s][A
100%|██████████| 20/20 [00:04<00:00,  4.14it/s][A
Epochs:  13%|█▎        | 5/38 [03:46<24:53, 45.24s/it]

Val Loss: 1.0444 - Val Accuracy: 0.9280



Training:   0%|          | 0/157 [00:00<?, ?it/s][A
Training:   1%|          | 1/157 [00:01<03:31,  1.36s/it][A
Training:   3%|▎         | 5/157 [00:02<01:03,  2.40it/s][A
Training:   6%|▌         | 9/157 [00:03<00:47,  3.10it/s][A
Training:   8%|▊         | 13/157 [00:04<00:43,  3.34it/s][A
Training:  11%|█         | 17/157 [00:05<00:38,  3.61it/s][A
Training:  13%|█▎        | 21/157 [00:06<00:36,  3.70it/s][A
Training:  16%|█▌        | 25/157 [00:07<00:35,  3.76it/s][A
Training:  18%|█▊        | 29/157 [00:08<00:32,  3.91it/s][A
Training:  21%|██        | 33/157 [00:09<00:32,  3.87it/s][A
Training:  24%|██▎       | 37/157 [00:10<00:30,  3.98it/s][A
Training:  26%|██▌       | 41/157 [00:11<00:29,  3.95it/s][A
Training:  29%|██▊       | 45/157 [00:12<00:29,  3.85it/s][A
Training:  31%|███       | 49/157 [00:13<00:27,  3.96it/s][A
Training:  34%|███▍      | 53/157 [00:14<00:26,  3.91it/s][A
Training:  36%|███▋      | 57/157 [00:15<00:25,  3.99it/s][A
Training:  39%|███▉

Epoch: 6/38 - Loss: 0.9692 - Accuracy: 0.9396



  0%|          | 0/20 [00:00<?, ?it/s][A
  5%|▌         | 1/20 [00:01<00:22,  1.19s/it][A
 25%|██▌       | 5/20 [00:02<00:05,  2.74it/s][A
 45%|████▌     | 9/20 [00:02<00:03,  3.48it/s][A
 65%|██████▌   | 13/20 [00:03<00:01,  3.90it/s][A
100%|██████████| 20/20 [00:04<00:00,  4.10it/s][A
Epochs:  16%|█▌        | 6/38 [04:31<24:09, 45.30s/it]

Val Loss: 1.0458 - Val Accuracy: 0.9337



Training:   0%|          | 0/157 [00:00<?, ?it/s][A
Training:   1%|          | 1/157 [00:01<03:19,  1.28s/it][A
Training:   3%|▎         | 5/157 [00:02<01:00,  2.53it/s][A
Training:   6%|▌         | 9/157 [00:03<00:47,  3.11it/s][A
Training:   8%|▊         | 13/157 [00:04<00:40,  3.59it/s][A
Training:  11%|█         | 17/157 [00:05<00:38,  3.65it/s][A
Training:  13%|█▎        | 21/157 [00:06<00:36,  3.69it/s][A
Training:  16%|█▌        | 25/157 [00:07<00:34,  3.84it/s][A
Training:  18%|█▊        | 28/157 [00:07<00:25,  4.99it/s][A
Training:  19%|█▉        | 30/157 [00:08<00:32,  3.86it/s][A
Training:  21%|██        | 33/157 [00:09<00:33,  3.65it/s][A
Training:  24%|██▎       | 37/157 [00:10<00:31,  3.80it/s][A
Training:  26%|██▌       | 41/157 [00:11<00:30,  3.83it/s][A
Training:  28%|██▊       | 44/157 [00:11<00:22,  4.92it/s][A
Training:  29%|██▉       | 46/157 [00:12<00:27,  4.02it/s][A
Training:  31%|███       | 49/157 [00:13<00:29,  3.61it/s][A
Training:  33%|███▎

Epoch: 7/38 - Loss: 0.9244 - Accuracy: 0.9392



  0%|          | 0/20 [00:00<?, ?it/s][A
  5%|▌         | 1/20 [00:01<00:22,  1.17s/it][A
 25%|██▌       | 5/20 [00:02<00:05,  2.76it/s][A
 45%|████▌     | 9/20 [00:02<00:03,  3.43it/s][A
 65%|██████▌   | 13/20 [00:03<00:01,  3.92it/s][A
100%|██████████| 20/20 [00:04<00:00,  4.11it/s][A
Epochs:  18%|█▊        | 7/38 [05:17<23:25, 45.33s/it]

Val Loss: 0.9215 - Val Accuracy: 0.9360



Training:   0%|          | 0/157 [00:00<?, ?it/s][A
Training:   1%|          | 1/157 [00:01<03:23,  1.31s/it][A
Training:   3%|▎         | 5/157 [00:02<01:00,  2.50it/s][A
Training:   6%|▌         | 9/157 [00:03<00:48,  3.05it/s][A
Training:   8%|▊         | 13/157 [00:04<00:41,  3.49it/s][A
Training:  11%|█         | 17/157 [00:05<00:37,  3.69it/s][A
Training:  13%|█▎        | 21/157 [00:06<00:36,  3.76it/s][A
Training:  16%|█▌        | 25/157 [00:07<00:33,  3.94it/s][A
Training:  18%|█▊        | 29/157 [00:08<00:32,  3.90it/s][A
Training:  21%|██        | 33/157 [00:09<00:31,  3.99it/s][A
Training:  23%|██▎       | 36/157 [00:09<00:23,  5.07it/s][A
Training:  24%|██▍       | 38/157 [00:10<00:29,  4.02it/s][A
Training:  26%|██▌       | 41/157 [00:11<00:31,  3.65it/s][A
Training:  28%|██▊       | 44/157 [00:11<00:23,  4.87it/s][A
Training:  29%|██▉       | 46/157 [00:12<00:29,  3.80it/s][A
Training:  31%|███       | 49/157 [00:13<00:31,  3.48it/s][A
Training:  34%|███▍

Epoch: 8/38 - Loss: 0.8752 - Accuracy: 0.9422



  0%|          | 0/20 [00:00<?, ?it/s][A
  5%|▌         | 1/20 [00:01<00:22,  1.19s/it][A
 25%|██▌       | 5/20 [00:02<00:05,  2.63it/s][A
 45%|████▌     | 9/20 [00:02<00:03,  3.52it/s][A
 65%|██████▌   | 13/20 [00:03<00:01,  3.77it/s][A
100%|██████████| 20/20 [00:04<00:00,  4.10it/s][A
Epochs:  21%|██        | 8/38 [06:02<22:38, 45.30s/it]

Val Loss: 0.9111 - Val Accuracy: 0.9360



Training:   0%|          | 0/157 [00:00<?, ?it/s][A
Training:   1%|          | 1/157 [00:01<03:14,  1.25s/it][A
Training:   3%|▎         | 5/157 [00:02<01:01,  2.47it/s][A
Training:   6%|▌         | 9/157 [00:03<00:47,  3.09it/s][A
Training:   8%|▊         | 12/157 [00:03<00:31,  4.61it/s][A
Training:   9%|▉         | 14/157 [00:04<00:39,  3.60it/s][A
Training:  11%|█         | 17/157 [00:05<00:42,  3.30it/s][A
Training:  13%|█▎        | 21/157 [00:06<00:37,  3.62it/s][A
Training:  16%|█▌        | 25/157 [00:07<00:35,  3.75it/s][A
Training:  18%|█▊        | 29/157 [00:08<00:33,  3.80it/s][A
Training:  20%|██        | 32/157 [00:08<00:25,  4.96it/s][A
Training:  22%|██▏       | 34/157 [00:09<00:31,  3.96it/s][A
Training:  24%|██▎       | 37/157 [00:10<00:34,  3.53it/s][A
Training:  26%|██▌       | 41/157 [00:11<00:30,  3.74it/s][A
Training:  29%|██▊       | 45/157 [00:12<00:29,  3.82it/s][A
Training:  31%|███       | 49/157 [00:13<00:28,  3.77it/s][A
Training:  34%|███▍

Epoch: 9/38 - Loss: 0.7991 - Accuracy: 0.9412



  0%|          | 0/20 [00:00<?, ?it/s][A
  5%|▌         | 1/20 [00:01<00:21,  1.15s/it][A
 25%|██▌       | 5/20 [00:02<00:05,  2.64it/s][A
 45%|████▌     | 9/20 [00:02<00:03,  3.51it/s][A
 65%|██████▌   | 13/20 [00:03<00:01,  3.78it/s][A
100%|██████████| 20/20 [00:04<00:00,  4.12it/s][A
Epochs:  24%|██▎       | 9/38 [06:47<21:56, 45.38s/it]

Val Loss: 0.7912 - Val Accuracy: 0.9384



Training:   0%|          | 0/157 [00:00<?, ?it/s][A
Training:   1%|          | 1/157 [00:01<03:22,  1.30s/it][A
Training:   3%|▎         | 5/157 [00:02<01:04,  2.36it/s][A
Training:   6%|▌         | 9/157 [00:03<00:47,  3.10it/s][A
Training:   8%|▊         | 13/157 [00:04<00:42,  3.42it/s][A
Training:  11%|█         | 17/157 [00:05<00:39,  3.58it/s][A
Training:  13%|█▎        | 21/157 [00:06<00:35,  3.79it/s][A
Training:  16%|█▌        | 25/157 [00:07<00:34,  3.79it/s][A
Training:  18%|█▊        | 29/157 [00:08<00:33,  3.82it/s][A
Training:  21%|██        | 33/157 [00:09<00:31,  3.92it/s][A
Training:  24%|██▎       | 37/157 [00:10<00:31,  3.86it/s][A
Training:  26%|██▌       | 41/157 [00:11<00:28,  4.01it/s][A
Training:  29%|██▊       | 45/157 [00:12<00:28,  3.91it/s][A
Training:  31%|███       | 49/157 [00:13<00:27,  3.92it/s][A
Training:  34%|███▍      | 53/157 [00:14<00:26,  3.98it/s][A
Training:  36%|███▋      | 57/157 [00:15<00:25,  3.92it/s][A
Training:  39%|███▉

Epoch: 10/38 - Loss: 0.7939 - Accuracy: 0.9369



  0%|          | 0/20 [00:00<?, ?it/s][A
  5%|▌         | 1/20 [00:01<00:24,  1.29s/it][A
 25%|██▌       | 5/20 [00:02<00:05,  2.71it/s][A
 45%|████▌     | 9/20 [00:03<00:03,  3.35it/s][A
 65%|██████▌   | 13/20 [00:04<00:01,  3.72it/s][A
100%|██████████| 20/20 [00:04<00:00,  4.00it/s][A
Epochs:  26%|██▋       | 10/38 [07:33<21:11, 45.43s/it]

Val Loss: 0.8685 - Val Accuracy: 0.9371



Training:   0%|          | 0/157 [00:00<?, ?it/s][A
Training:   1%|          | 1/157 [00:01<03:31,  1.35s/it][A
Training:   3%|▎         | 5/157 [00:02<01:02,  2.44it/s][A
Training:   6%|▌         | 9/157 [00:03<00:47,  3.14it/s][A
Training:   8%|▊         | 13/157 [00:04<00:42,  3.38it/s][A
Training:  11%|█         | 17/157 [00:05<00:39,  3.59it/s][A
Training:  13%|█▎        | 21/157 [00:06<00:36,  3.74it/s][A
Training:  16%|█▌        | 25/157 [00:07<00:35,  3.73it/s][A
Training:  18%|█▊        | 29/157 [00:08<00:32,  3.93it/s][A
Training:  21%|██        | 33/157 [00:09<00:32,  3.87it/s][A
Training:  24%|██▎       | 37/157 [00:10<00:30,  3.93it/s][A
Training:  26%|██▌       | 41/157 [00:11<00:29,  3.99it/s][A
Training:  29%|██▊       | 45/157 [00:12<00:28,  3.92it/s][A
Training:  31%|███       | 49/157 [00:13<00:26,  4.05it/s][A
Training:  34%|███▍      | 53/157 [00:14<00:26,  3.92it/s][A
Training:  36%|███▋      | 57/157 [00:15<00:25,  3.93it/s][A
Training:  38%|███▊

Epoch: 11/38 - Loss: 0.7709 - Accuracy: 0.9438



  0%|          | 0/20 [00:00<?, ?it/s][A
  5%|▌         | 1/20 [00:01<00:21,  1.13s/it][A
 25%|██▌       | 5/20 [00:02<00:05,  2.72it/s][A
 45%|████▌     | 9/20 [00:02<00:03,  3.59it/s][A
 65%|██████▌   | 13/20 [00:03<00:01,  3.86it/s][A
100%|██████████| 20/20 [00:04<00:00,  4.18it/s][A
Epochs:  29%|██▉       | 11/38 [08:19<20:28, 45.49s/it]

Val Loss: 0.8403 - Val Accuracy: 0.9369



Training:   0%|          | 0/157 [00:00<?, ?it/s][A
Training:   1%|          | 1/157 [00:01<03:08,  1.21s/it][A
Training:   3%|▎         | 5/157 [00:02<01:01,  2.46it/s][A
Training:   6%|▌         | 9/157 [00:03<00:47,  3.13it/s][A
Training:   8%|▊         | 13/157 [00:04<00:41,  3.49it/s][A
Training:  11%|█         | 17/157 [00:05<00:39,  3.58it/s][A
Training:  13%|█▎        | 21/157 [00:06<00:35,  3.81it/s][A
Training:  15%|█▌        | 24/157 [00:06<00:26,  5.02it/s][A
Training:  17%|█▋        | 26/157 [00:07<00:33,  3.92it/s][A
Training:  18%|█▊        | 29/157 [00:08<00:36,  3.53it/s][A
Training:  21%|██        | 33/157 [00:09<00:32,  3.76it/s][A
Training:  24%|██▎       | 37/157 [00:10<00:32,  3.71it/s][A
Training:  26%|██▌       | 41/157 [00:11<00:29,  3.87it/s][A
Training:  29%|██▊       | 45/157 [00:12<00:28,  3.87it/s][A
Training:  31%|███       | 49/157 [00:13<00:28,  3.82it/s][A
Training:  34%|███▍      | 53/157 [00:14<00:26,  3.95it/s][A
Training:  36%|███▋

Epoch: 12/38 - Loss: 0.7280 - Accuracy: 0.9437



  0%|          | 0/20 [00:00<?, ?it/s][A
  5%|▌         | 1/20 [00:01<00:21,  1.14s/it][A
 25%|██▌       | 5/20 [00:02<00:05,  2.65it/s][A
 45%|████▌     | 9/20 [00:02<00:03,  3.53it/s][A
 65%|██████▌   | 13/20 [00:03<00:01,  3.83it/s][A
100%|██████████| 20/20 [00:04<00:00,  4.08it/s][A
Epochs:  32%|███▏      | 12/38 [09:04<19:43, 45.52s/it]

Val Loss: 0.8812 - Val Accuracy: 0.9302



Training:   0%|          | 0/157 [00:00<?, ?it/s][A
Training:   1%|          | 1/157 [00:01<03:20,  1.29s/it][A
Training:   3%|▎         | 5/157 [00:02<01:00,  2.50it/s][A
Training:   6%|▌         | 9/157 [00:03<00:47,  3.11it/s][A
Training:   8%|▊         | 13/157 [00:04<00:41,  3.48it/s][A
Training:  11%|█         | 17/157 [00:05<00:38,  3.61it/s][A
Training:  13%|█▎        | 21/157 [00:06<00:36,  3.71it/s][A
Training:  16%|█▌        | 25/157 [00:07<00:34,  3.86it/s][A
Training:  18%|█▊        | 29/157 [00:08<00:33,  3.82it/s][A
Training:  21%|██        | 33/157 [00:09<00:32,  3.86it/s][A
Training:  24%|██▎       | 37/157 [00:10<00:30,  3.90it/s][A
Training:  26%|██▌       | 41/157 [00:11<00:30,  3.85it/s][A
Training:  29%|██▊       | 45/157 [00:12<00:27,  4.01it/s][A
Training:  31%|███       | 49/157 [00:13<00:27,  3.91it/s][A
Training:  34%|███▍      | 53/157 [00:14<00:26,  3.91it/s][A
Training:  36%|███▋      | 57/157 [00:15<00:25,  3.88it/s][A
Training:  39%|███▉

Epoch: 13/38 - Loss: 0.6897 - Accuracy: 0.9428



  0%|          | 0/20 [00:00<?, ?it/s][A
  5%|▌         | 1/20 [00:01<00:22,  1.21s/it][A
 25%|██▌       | 5/20 [00:02<00:05,  2.84it/s][A
 45%|████▌     | 9/20 [00:03<00:03,  3.40it/s][A
 65%|██████▌   | 13/20 [00:03<00:01,  3.87it/s][A
100%|██████████| 20/20 [00:04<00:00,  4.07it/s][A
Epochs:  34%|███▍      | 13/38 [09:50<18:58, 45.56s/it]

Val Loss: 0.7664 - Val Accuracy: 0.9392



Training:   0%|          | 0/157 [00:00<?, ?it/s][A
Training:   1%|          | 1/157 [00:01<03:30,  1.35s/it][A
Training:   3%|▎         | 5/157 [00:02<01:03,  2.40it/s][A
Training:   6%|▌         | 9/157 [00:03<00:47,  3.13it/s][A
Training:   8%|▊         | 13/157 [00:04<00:43,  3.32it/s][A
Training:  11%|█         | 17/157 [00:05<00:38,  3.66it/s][A
Training:  13%|█▎        | 20/157 [00:05<00:27,  4.90it/s][A
Training:  14%|█▍        | 22/157 [00:06<00:35,  3.77it/s][A
Training:  16%|█▌        | 25/157 [00:07<00:37,  3.53it/s][A
Training:  18%|█▊        | 29/157 [00:08<00:34,  3.72it/s][A
Training:  21%|██        | 33/157 [00:09<00:33,  3.68it/s][A
Training:  24%|██▎       | 37/157 [00:10<00:32,  3.75it/s][A
Training:  26%|██▌       | 41/157 [00:11<00:30,  3.83it/s][A
Training:  29%|██▊       | 45/157 [00:12<00:29,  3.82it/s][A
Training:  31%|███       | 49/157 [00:13<00:27,  3.94it/s][A
Training:  34%|███▍      | 53/157 [00:14<00:26,  3.94it/s][A
Training:  36%|███▋

Epoch: 14/38 - Loss: 0.7095 - Accuracy: 0.9420



  0%|          | 0/20 [00:00<?, ?it/s][A
  5%|▌         | 1/20 [00:01<00:23,  1.26s/it][A
 25%|██▌       | 5/20 [00:02<00:05,  2.78it/s][A
 45%|████▌     | 9/20 [00:03<00:03,  3.42it/s][A
 65%|██████▌   | 13/20 [00:03<00:01,  3.84it/s][A
100%|██████████| 20/20 [00:04<00:00,  4.09it/s][A
Epochs:  37%|███▋      | 14/38 [10:36<18:14, 45.59s/it]

Val Loss: 0.7896 - Val Accuracy: 0.9332



Training:   0%|          | 0/157 [00:00<?, ?it/s][A
Training:   1%|          | 1/157 [00:01<03:38,  1.40s/it][A
Training:   3%|▎         | 5/157 [00:02<01:06,  2.29it/s][A
Training:   5%|▌         | 8/157 [00:02<00:36,  4.08it/s][A
Training:   6%|▋         | 10/157 [00:03<00:45,  3.25it/s][A
Training:   8%|▊         | 13/157 [00:04<00:45,  3.15it/s][A
Training:  10%|█         | 16/157 [00:04<00:30,  4.64it/s][A
Training:  11%|█▏        | 18/157 [00:05<00:39,  3.54it/s][A
Training:  13%|█▎        | 21/157 [00:06<00:39,  3.45it/s][A
Training:  15%|█▌        | 24/157 [00:06<00:27,  4.86it/s][A
Training:  17%|█▋        | 26/157 [00:07<00:36,  3.58it/s][A
Training:  18%|█▊        | 29/157 [00:08<00:36,  3.49it/s][A
Training:  21%|██        | 33/157 [00:09<00:34,  3.60it/s][A
Training:  24%|██▎       | 37/157 [00:10<00:32,  3.74it/s][A
Training:  25%|██▌       | 40/157 [00:10<00:23,  4.93it/s][A
Training:  27%|██▋       | 42/157 [00:11<00:29,  3.91it/s][A
Training:  29%|██▊ 

Epoch: 15/38 - Loss: 0.7048 - Accuracy: 0.9440



  0%|          | 0/20 [00:00<?, ?it/s][A
  5%|▌         | 1/20 [00:01<00:23,  1.25s/it][A
 25%|██▌       | 5/20 [00:02<00:05,  2.65it/s][A
 45%|████▌     | 9/20 [00:03<00:03,  3.41it/s][A
 65%|██████▌   | 13/20 [00:03<00:01,  3.75it/s][A
100%|██████████| 20/20 [00:04<00:00,  4.04it/s][A
Epochs:  39%|███▉      | 15/38 [11:22<17:31, 45.71s/it]

Val Loss: 0.6618 - Val Accuracy: 0.9431



Training:   0%|          | 0/157 [00:00<?, ?it/s][A
Training:   1%|          | 1/157 [00:01<03:28,  1.33s/it][A
Training:   3%|▎         | 5/157 [00:02<01:03,  2.40it/s][A
Training:   6%|▌         | 9/157 [00:03<00:46,  3.20it/s][A
Training:   8%|▊         | 13/157 [00:04<00:41,  3.46it/s][A
Training:  11%|█         | 17/157 [00:05<00:38,  3.68it/s][A
Training:  13%|█▎        | 20/157 [00:05<00:27,  4.92it/s][A
Training:  14%|█▍        | 22/157 [00:06<00:34,  3.87it/s][A
Training:  16%|█▌        | 25/157 [00:07<00:37,  3.52it/s][A
Training:  18%|█▊        | 28/157 [00:07<00:26,  4.83it/s][A
Training:  19%|█▉        | 30/157 [00:08<00:33,  3.84it/s][A
Training:  21%|██        | 33/157 [00:09<00:35,  3.53it/s][A
Training:  24%|██▎       | 37/157 [00:10<00:32,  3.67it/s][A
Training:  26%|██▌       | 41/157 [00:11<00:30,  3.85it/s][A
Training:  29%|██▊       | 45/157 [00:12<00:29,  3.77it/s][A
Training:  31%|███       | 49/157 [00:13<00:27,  3.91it/s][A
Training:  33%|███▎

Epoch: 16/38 - Loss: 0.6626 - Accuracy: 0.9437



  0%|          | 0/20 [00:00<?, ?it/s][A
  5%|▌         | 1/20 [00:01<00:23,  1.23s/it][A
 25%|██▌       | 5/20 [00:02<00:05,  2.72it/s][A
 35%|███▌      | 7/20 [00:02<00:03,  3.97it/s][A
 45%|████▌     | 9/20 [00:02<00:03,  3.34it/s][A
 60%|██████    | 12/20 [00:03<00:01,  5.36it/s][A
 70%|███████   | 14/20 [00:03<00:01,  3.90it/s][A
100%|██████████| 20/20 [00:04<00:00,  4.07it/s][A
Epochs:  42%|████▏     | 16/38 [12:07<16:44, 45.64s/it]

Val Loss: 0.7190 - Val Accuracy: 0.9362



Training:   0%|          | 0/157 [00:00<?, ?it/s][A
Training:   1%|          | 1/157 [00:01<03:37,  1.40s/it][A
Training:   3%|▎         | 5/157 [00:02<01:04,  2.36it/s][A
Training:   6%|▌         | 9/157 [00:03<00:47,  3.08it/s][A
Training:   8%|▊         | 13/157 [00:04<00:43,  3.32it/s][A
Training:  11%|█         | 17/157 [00:05<00:38,  3.66it/s][A
Training:  13%|█▎        | 21/157 [00:06<00:36,  3.70it/s][A
Training:  16%|█▌        | 25/157 [00:07<00:34,  3.78it/s][A
Training:  18%|█▊        | 29/157 [00:08<00:33,  3.88it/s][A
Training:  21%|██        | 33/157 [00:09<00:32,  3.85it/s][A
Training:  24%|██▎       | 37/157 [00:10<00:30,  3.97it/s][A
Training:  25%|██▌       | 40/157 [00:10<00:23,  5.05it/s][A
Training:  27%|██▋       | 42/157 [00:11<00:30,  3.77it/s][A
Training:  29%|██▊       | 45/157 [00:12<00:31,  3.60it/s][A
Training:  31%|███       | 49/157 [00:13<00:29,  3.72it/s][A
Training:  34%|███▍      | 53/157 [00:14<00:27,  3.78it/s][A
Training:  36%|███▋

Epoch: 17/38 - Loss: 0.6588 - Accuracy: 0.9428



  0%|          | 0/20 [00:00<?, ?it/s][A
  5%|▌         | 1/20 [00:01<00:22,  1.18s/it][A
 25%|██▌       | 5/20 [00:02<00:05,  2.70it/s][A
 45%|████▌     | 9/20 [00:03<00:03,  3.36it/s][A
 65%|██████▌   | 13/20 [00:03<00:01,  3.85it/s][A
100%|██████████| 20/20 [00:04<00:00,  4.02it/s][A
Epochs:  45%|████▍     | 17/38 [12:53<15:59, 45.67s/it]

Val Loss: 0.7315 - Val Accuracy: 0.9317



Training:   0%|          | 0/157 [00:00<?, ?it/s][A
Training:   1%|          | 1/157 [00:01<03:20,  1.29s/it][A
Training:   3%|▎         | 4/157 [00:01<00:41,  3.66it/s][A
Training:   4%|▍         | 6/157 [00:02<00:51,  2.96it/s][A
Training:   6%|▌         | 9/157 [00:03<00:50,  2.95it/s][A
Training:   8%|▊         | 13/157 [00:04<00:42,  3.40it/s][A
Training:  11%|█         | 17/157 [00:05<00:38,  3.63it/s][A
Training:  13%|█▎        | 21/157 [00:06<00:36,  3.72it/s][A
Training:  16%|█▌        | 25/157 [00:07<00:34,  3.80it/s][A
Training:  18%|█▊        | 29/157 [00:08<00:34,  3.76it/s][A
Training:  21%|██        | 33/157 [00:09<00:31,  3.94it/s][A
Training:  24%|██▎       | 37/157 [00:10<00:30,  3.91it/s][A
Training:  26%|██▌       | 41/157 [00:11<00:29,  3.87it/s][A
Training:  29%|██▊       | 45/157 [00:12<00:28,  3.98it/s][A
Training:  31%|███       | 49/157 [00:13<00:27,  3.86it/s][A
Training:  34%|███▍      | 53/157 [00:14<00:26,  3.91it/s][A
Training:  36%|███▋ 

Epoch: 18/38 - Loss: 0.6723 - Accuracy: 0.9425



  0%|          | 0/20 [00:00<?, ?it/s][A
  5%|▌         | 1/20 [00:01<00:21,  1.13s/it][A
 25%|██▌       | 5/20 [00:02<00:05,  2.67it/s][A
 45%|████▌     | 9/20 [00:02<00:03,  3.54it/s][A
 65%|██████▌   | 13/20 [00:03<00:01,  3.82it/s][A
100%|██████████| 20/20 [00:04<00:00,  4.11it/s][A
Epochs:  47%|████▋     | 18/38 [13:38<15:11, 45.58s/it]

Val Loss: 0.7093 - Val Accuracy: 0.9392



Training:   0%|          | 0/157 [00:00<?, ?it/s][A
Training:   1%|          | 1/157 [00:01<03:21,  1.29s/it][A
Training:   3%|▎         | 5/157 [00:02<01:04,  2.36it/s][A
Training:   6%|▌         | 9/157 [00:03<00:47,  3.10it/s][A
Training:   8%|▊         | 13/157 [00:04<00:42,  3.43it/s][A
Training:  11%|█         | 17/157 [00:05<00:38,  3.66it/s][A
Training:  13%|█▎        | 21/157 [00:06<00:35,  3.81it/s][A
Training:  16%|█▌        | 25/157 [00:07<00:35,  3.74it/s][A
Training:  18%|█▊        | 29/157 [00:08<00:32,  3.92it/s][A
Training:  21%|██        | 33/157 [00:09<00:31,  3.89it/s][A
Training:  24%|██▎       | 37/157 [00:10<00:30,  3.92it/s][A
Training:  26%|██▌       | 41/157 [00:11<00:28,  4.00it/s][A
Training:  29%|██▊       | 45/157 [00:12<00:28,  3.90it/s][A
Training:  31%|███       | 49/157 [00:13<00:26,  4.01it/s][A
Training:  34%|███▍      | 53/157 [00:14<00:26,  3.92it/s][A
Training:  36%|███▋      | 57/157 [00:15<00:25,  3.96it/s][A
Training:  39%|███▉

Epoch: 19/38 - Loss: 0.6542 - Accuracy: 0.9437



  0%|          | 0/20 [00:00<?, ?it/s][A
  5%|▌         | 1/20 [00:01<00:23,  1.22s/it][A
 25%|██▌       | 5/20 [00:02<00:05,  2.67it/s][A
 45%|████▌     | 9/20 [00:02<00:03,  3.47it/s][A
 65%|██████▌   | 13/20 [00:03<00:01,  3.80it/s][A
100%|██████████| 20/20 [00:04<00:00,  4.08it/s][A
Epochs:  50%|█████     | 19/38 [14:24<14:26, 45.61s/it]

Val Loss: 0.7156 - Val Accuracy: 0.9453



Training:   0%|          | 0/157 [00:00<?, ?it/s][A
Training:   1%|          | 1/157 [00:01<03:22,  1.30s/it][A
Training:   3%|▎         | 5/157 [00:02<01:03,  2.39it/s][A
Training:   6%|▌         | 9/157 [00:03<00:46,  3.17it/s][A
Training:   8%|▊         | 13/157 [00:04<00:41,  3.44it/s][A
Training:  10%|█         | 16/157 [00:04<00:29,  4.79it/s][A
Training:  11%|█▏        | 18/157 [00:05<00:37,  3.72it/s][A
Training:  13%|█▎        | 21/157 [00:06<00:38,  3.49it/s][A
Training:  15%|█▌        | 24/157 [00:06<00:27,  4.87it/s][A
Training:  17%|█▋        | 26/157 [00:07<00:35,  3.67it/s][A
Training:  18%|█▊        | 28/157 [00:07<00:27,  4.61it/s][A
Training:  19%|█▉        | 30/157 [00:08<00:33,  3.75it/s][A
Training:  20%|█▉        | 31/157 [00:08<00:31,  4.04it/s][A
Training:  21%|██        | 33/157 [00:09<00:38,  3.25it/s][A
Training:  23%|██▎       | 36/157 [00:09<00:24,  5.01it/s][A
Training:  24%|██▍       | 38/157 [00:10<00:32,  3.61it/s][A
Training:  26%|██▌ 

Epoch: 20/38 - Loss: 0.6426 - Accuracy: 0.9399



  0%|          | 0/20 [00:00<?, ?it/s][A
  5%|▌         | 1/20 [00:01<00:23,  1.24s/it][A
 25%|██▌       | 5/20 [00:02<00:05,  2.76it/s][A
 45%|████▌     | 9/20 [00:03<00:03,  3.44it/s][A
 65%|██████▌   | 13/20 [00:03<00:01,  3.83it/s][A
100%|██████████| 20/20 [00:04<00:00,  4.05it/s][A
Epochs:  53%|█████▎    | 20/38 [15:09<13:41, 45.64s/it]

Val Loss: 0.6383 - Val Accuracy: 0.9382



Training:   0%|          | 0/157 [00:00<?, ?it/s][A
Training:   1%|          | 1/157 [00:01<03:32,  1.36s/it][A
Training:   3%|▎         | 5/157 [00:02<01:03,  2.38it/s][A
Training:   6%|▌         | 9/157 [00:03<00:47,  3.10it/s][A
Training:   8%|▊         | 13/157 [00:04<00:42,  3.38it/s][A
Training:  11%|█         | 17/157 [00:05<00:38,  3.61it/s][A
Training:  13%|█▎        | 21/157 [00:06<00:36,  3.73it/s][A
Training:  16%|█▌        | 25/157 [00:07<00:35,  3.77it/s][A
Training:  18%|█▊        | 29/157 [00:08<00:32,  3.92it/s][A
Training:  20%|██        | 32/157 [00:08<00:24,  5.03it/s][A
Training:  22%|██▏       | 34/157 [00:09<00:31,  3.86it/s][A
Training:  24%|██▎       | 37/157 [00:10<00:33,  3.55it/s][A
Training:  26%|██▌       | 41/157 [00:11<00:30,  3.76it/s][A
Training:  29%|██▊       | 45/157 [00:12<00:29,  3.74it/s][A
Training:  31%|███       | 49/157 [00:13<00:28,  3.81it/s][A
Training:  34%|███▍      | 53/157 [00:14<00:27,  3.85it/s][A
Training:  36%|███▋

Epoch: 21/38 - Loss: 0.6428 - Accuracy: 0.9445



  0%|          | 0/20 [00:00<?, ?it/s][A
  5%|▌         | 1/20 [00:01<00:23,  1.26s/it][A
 25%|██▌       | 5/20 [00:02<00:05,  2.75it/s][A
 45%|████▌     | 9/20 [00:03<00:03,  3.45it/s][A
 65%|██████▌   | 13/20 [00:03<00:01,  3.86it/s][A
 75%|███████▌  | 15/20 [00:03<00:01,  4.77it/s][A
100%|██████████| 20/20 [00:04<00:00,  4.04it/s][A
Epochs:  55%|█████▌    | 21/38 [15:55<12:56, 45.67s/it]

Val Loss: 0.7192 - Val Accuracy: 0.9337



Training:   0%|          | 0/157 [00:00<?, ?it/s][A
Training:   1%|          | 1/157 [00:01<03:25,  1.32s/it][A
Training:   3%|▎         | 5/157 [00:02<01:02,  2.43it/s][A
Training:   6%|▌         | 9/157 [00:03<00:46,  3.15it/s][A
Training:   8%|▊         | 13/157 [00:04<00:42,  3.39it/s][A
Training:  10%|█         | 16/157 [00:04<00:30,  4.69it/s][A
Training:  11%|█▏        | 18/157 [00:05<00:36,  3.83it/s][A
Training:  13%|█▎        | 20/157 [00:05<00:28,  4.76it/s][A
Training:  14%|█▍        | 22/157 [00:06<00:37,  3.63it/s][A
Training:  16%|█▌        | 25/157 [00:07<00:38,  3.39it/s][A
Training:  17%|█▋        | 27/157 [00:07<00:30,  4.23it/s][A
Training:  18%|█▊        | 29/157 [00:08<00:35,  3.56it/s][A
Training:  20%|██        | 32/157 [00:08<00:23,  5.23it/s][A
Training:  22%|██▏       | 34/157 [00:09<00:33,  3.67it/s][A
Training:  24%|██▎       | 37/157 [00:10<00:34,  3.47it/s][A
Training:  25%|██▍       | 39/157 [00:10<00:27,  4.35it/s][A
Training:  26%|██▌ 

Epoch: 22/38 - Loss: 0.6368 - Accuracy: 0.9454



  0%|          | 0/20 [00:00<?, ?it/s][A
  5%|▌         | 1/20 [00:01<00:23,  1.21s/it][A
 25%|██▌       | 5/20 [00:02<00:05,  2.69it/s][A
 45%|████▌     | 9/20 [00:03<00:03,  3.43it/s][A
 65%|██████▌   | 13/20 [00:03<00:01,  3.80it/s][A
100%|██████████| 20/20 [00:04<00:00,  4.03it/s][A
Epochs:  58%|█████▊    | 22/38 [16:41<12:11, 45.70s/it]

Val Loss: 0.7566 - Val Accuracy: 0.9341



Training:   0%|          | 0/157 [00:00<?, ?it/s][A
Training:   1%|          | 1/157 [00:01<03:31,  1.35s/it][A
Training:   3%|▎         | 5/157 [00:02<00:59,  2.54it/s][A
Training:   5%|▌         | 8/157 [00:02<00:33,  4.40it/s][A
Training:   6%|▋         | 10/157 [00:03<00:45,  3.27it/s][A
Training:   8%|▊         | 13/157 [00:04<00:44,  3.27it/s][A
Training:  11%|█         | 17/157 [00:05<00:39,  3.51it/s][A
Training:  13%|█▎        | 21/157 [00:06<00:36,  3.72it/s][A
Training:  15%|█▌        | 24/157 [00:06<00:26,  4.96it/s][A
Training:  17%|█▋        | 26/157 [00:07<00:34,  3.83it/s][A
Training:  18%|█▊        | 29/157 [00:08<00:37,  3.46it/s][A
Training:  21%|██        | 33/157 [00:09<00:33,  3.66it/s][A
Training:  24%|██▎       | 37/157 [00:10<00:32,  3.75it/s][A
Training:  26%|██▌       | 41/157 [00:11<00:31,  3.74it/s][A
Training:  29%|██▊       | 45/157 [00:12<00:28,  3.94it/s][A
Training:  31%|███       | 49/157 [00:13<00:27,  3.92it/s][A
Training:  34%|███▍

Epoch: 23/38 - Loss: 0.6238 - Accuracy: 0.9432



  0%|          | 0/20 [00:00<?, ?it/s][A
  5%|▌         | 1/20 [00:01<00:23,  1.23s/it][A
 25%|██▌       | 5/20 [00:02<00:05,  2.77it/s][A
 45%|████▌     | 9/20 [00:03<00:03,  3.42it/s][A
 65%|██████▌   | 13/20 [00:03<00:01,  3.94it/s][A
100%|██████████| 20/20 [00:04<00:00,  4.08it/s][A
Epochs:  61%|██████    | 23/38 [17:27<11:25, 45.71s/it]

Val Loss: 0.6204 - Val Accuracy: 0.9399



Training:   0%|          | 0/157 [00:00<?, ?it/s][A
Training:   1%|          | 1/157 [00:01<03:37,  1.40s/it][A
Training:   3%|▎         | 5/157 [00:02<01:04,  2.37it/s][A
Training:   6%|▌         | 9/157 [00:03<00:48,  3.08it/s][A
Training:   8%|▊         | 13/157 [00:04<00:43,  3.35it/s][A
Training:  11%|█         | 17/157 [00:05<00:38,  3.68it/s][A
Training:  13%|█▎        | 21/157 [00:06<00:36,  3.73it/s][A
Training:  16%|█▌        | 25/157 [00:07<00:34,  3.78it/s][A
Training:  18%|█▊        | 29/157 [00:08<00:32,  3.93it/s][A
Training:  21%|██        | 33/157 [00:09<00:31,  3.91it/s][A
Training:  24%|██▎       | 37/157 [00:10<00:30,  3.98it/s][A
Training:  26%|██▌       | 41/157 [00:11<00:29,  3.91it/s][A
Training:  29%|██▊       | 45/157 [00:12<00:29,  3.85it/s][A
Training:  31%|███       | 49/157 [00:13<00:27,  3.99it/s][A
Training:  34%|███▍      | 53/157 [00:14<00:26,  3.90it/s][A
Training:  36%|███▋      | 57/157 [00:15<00:25,  3.94it/s][A
Training:  39%|███▉

Epoch: 24/38 - Loss: 0.6410 - Accuracy: 0.9412



  0%|          | 0/20 [00:00<?, ?it/s][A
  5%|▌         | 1/20 [00:01<00:22,  1.20s/it][A
 25%|██▌       | 5/20 [00:02<00:05,  2.73it/s][A
 45%|████▌     | 9/20 [00:03<00:03,  3.43it/s][A
 65%|██████▌   | 13/20 [00:03<00:01,  3.94it/s][A
100%|██████████| 20/20 [00:04<00:00,  4.04it/s][A
Epochs:  63%|██████▎   | 24/38 [18:12<10:39, 45.71s/it]

Val Loss: 0.7263 - Val Accuracy: 0.9281



Training:   0%|          | 0/157 [00:00<?, ?it/s][A
Training:   1%|          | 1/157 [00:01<03:34,  1.38s/it][A
Training:   3%|▎         | 5/157 [00:02<01:01,  2.48it/s][A
Training:   6%|▌         | 9/157 [00:03<00:48,  3.03it/s][A
Training:   8%|▊         | 13/157 [00:04<00:42,  3.42it/s][A
Training:  11%|█         | 17/157 [00:05<00:38,  3.65it/s][A
Training:  13%|█▎        | 21/157 [00:06<00:36,  3.68it/s][A
Training:  16%|█▌        | 25/157 [00:07<00:34,  3.83it/s][A
Training:  18%|█▊        | 28/157 [00:07<00:26,  4.96it/s][A
Training:  19%|█▉        | 30/157 [00:08<00:32,  3.88it/s][A
Training:  21%|██        | 33/157 [00:09<00:35,  3.51it/s][A
Training:  24%|██▎       | 37/157 [00:10<00:32,  3.73it/s][A
Training:  26%|██▌       | 41/157 [00:11<00:30,  3.79it/s][A
Training:  29%|██▊       | 45/157 [00:12<00:29,  3.85it/s][A
Training:  31%|███       | 49/157 [00:13<00:27,  3.94it/s][A
Training:  34%|███▍      | 53/157 [00:14<00:26,  3.89it/s][A
Training:  36%|███▋

Epoch: 25/38 - Loss: 0.6251 - Accuracy: 0.9406



  0%|          | 0/20 [00:00<?, ?it/s][A
  5%|▌         | 1/20 [00:01<00:23,  1.22s/it][A
 25%|██▌       | 5/20 [00:02<00:05,  2.84it/s][A
 45%|████▌     | 9/20 [00:02<00:03,  3.44it/s][A
 65%|██████▌   | 13/20 [00:03<00:01,  3.92it/s][A
100%|██████████| 20/20 [00:04<00:00,  4.09it/s][A
Epochs:  66%|██████▌   | 25/38 [18:58<09:54, 45.72s/it]

Val Loss: 0.6856 - Val Accuracy: 0.9365



Training:   0%|          | 0/157 [00:00<?, ?it/s][A
Training:   1%|          | 1/157 [00:01<03:27,  1.33s/it][A
Training:   3%|▎         | 5/157 [00:02<01:02,  2.42it/s][A
Training:   5%|▌         | 8/157 [00:02<00:34,  4.27it/s][A
Training:   6%|▋         | 10/157 [00:03<00:45,  3.26it/s][A
Training:   8%|▊         | 13/157 [00:04<00:46,  3.10it/s][A
Training:  10%|█         | 16/157 [00:04<00:30,  4.60it/s][A
Training:  11%|█▏        | 18/157 [00:05<00:37,  3.66it/s][A
Training:  13%|█▎        | 21/157 [00:06<00:40,  3.38it/s][A
Training:  15%|█▍        | 23/157 [00:06<00:31,  4.26it/s][A
Training:  16%|█▌        | 25/157 [00:07<00:38,  3.45it/s][A
Training:  17%|█▋        | 26/157 [00:07<00:34,  3.84it/s][A
Training:  18%|█▊        | 29/157 [00:08<00:35,  3.64it/s][A
Training:  20%|██        | 32/157 [00:08<00:23,  5.36it/s][A
Training:  22%|██▏       | 34/157 [00:09<00:34,  3.55it/s][A
Training:  24%|██▎       | 37/157 [00:10<00:34,  3.51it/s][A
Training:  25%|██▌ 

Epoch: 26/38 - Loss: 0.6248 - Accuracy: 0.9413



  0%|          | 0/20 [00:00<?, ?it/s][A
  5%|▌         | 1/20 [00:01<00:22,  1.18s/it][A
 25%|██▌       | 5/20 [00:02<00:05,  2.78it/s][A
 45%|████▌     | 9/20 [00:02<00:03,  3.51it/s][A
 65%|██████▌   | 13/20 [00:03<00:01,  3.92it/s][A
100%|██████████| 20/20 [00:04<00:00,  4.10it/s][A
Epochs:  68%|██████▊   | 26/38 [19:44<09:08, 45.74s/it]

Val Loss: 0.7282 - Val Accuracy: 0.9323



Training:   0%|          | 0/157 [00:00<?, ?it/s][A
Training:   1%|          | 1/157 [00:01<03:30,  1.35s/it][A
Training:   3%|▎         | 5/157 [00:02<01:00,  2.52it/s][A
Training:   6%|▌         | 9/157 [00:03<00:47,  3.13it/s][A
Training:   8%|▊         | 13/157 [00:04<00:41,  3.44it/s][A
Training:  11%|█         | 17/157 [00:05<00:38,  3.62it/s][A
Training:  13%|█▎        | 21/157 [00:06<00:37,  3.65it/s][A
Training:  16%|█▌        | 25/157 [00:07<00:34,  3.86it/s][A
Training:  17%|█▋        | 27/157 [00:07<00:28,  4.58it/s][A
Training:  18%|█▊        | 29/157 [00:08<00:34,  3.71it/s][A
Training:  20%|██        | 32/157 [00:08<00:24,  5.13it/s][A
Training:  22%|██▏       | 34/157 [00:09<00:32,  3.77it/s][A
Training:  24%|██▎       | 37/157 [00:10<00:32,  3.65it/s][A
Training:  25%|██▌       | 40/157 [00:10<00:23,  5.04it/s][A
Training:  27%|██▋       | 42/157 [00:11<00:30,  3.72it/s][A
Training:  29%|██▊       | 45/157 [00:12<00:31,  3.55it/s][A
Training:  31%|███ 

Epoch: 27/38 - Loss: 0.6214 - Accuracy: 0.9435



  0%|          | 0/20 [00:00<?, ?it/s][A
  5%|▌         | 1/20 [00:01<00:22,  1.20s/it][A
 25%|██▌       | 5/20 [00:02<00:05,  2.73it/s][A
 45%|████▌     | 9/20 [00:03<00:03,  3.39it/s][A
 65%|██████▌   | 13/20 [00:03<00:01,  3.88it/s][A
100%|██████████| 20/20 [00:04<00:00,  4.02it/s][A
Epochs:  71%|███████   | 27/38 [20:30<08:22, 45.71s/it]

Val Loss: 0.6993 - Val Accuracy: 0.9349



Training:   0%|          | 0/157 [00:00<?, ?it/s][A
Training:   1%|          | 1/157 [00:01<03:19,  1.28s/it][A
Training:   3%|▎         | 4/157 [00:01<00:41,  3.70it/s][A
Training:   4%|▍         | 6/157 [00:02<00:52,  2.85it/s][A
Training:   6%|▌         | 9/157 [00:03<00:51,  2.85it/s][A
Training:   8%|▊         | 13/157 [00:04<00:41,  3.44it/s][A
Training:  11%|█         | 17/157 [00:05<00:39,  3.58it/s][A
Training:  13%|█▎        | 21/157 [00:06<00:37,  3.66it/s][A
Training:  16%|█▌        | 25/157 [00:07<00:35,  3.76it/s][A
Training:  18%|█▊        | 29/157 [00:08<00:34,  3.74it/s][A
Training:  21%|██        | 33/157 [00:09<00:32,  3.80it/s][A
Training:  24%|██▎       | 37/157 [00:10<00:30,  3.87it/s][A
Training:  26%|██▌       | 41/157 [00:11<00:30,  3.81it/s][A
Training:  29%|██▊       | 45/157 [00:12<00:28,  3.95it/s][A
Training:  31%|███       | 49/157 [00:13<00:27,  3.95it/s][A
Training:  34%|███▍      | 53/157 [00:14<00:26,  3.92it/s][A
Training:  36%|███▋ 

Epoch: 28/38 - Loss: 0.6258 - Accuracy: 0.9397



  0%|          | 0/20 [00:00<?, ?it/s][A
  5%|▌         | 1/20 [00:01<00:23,  1.22s/it][A
 25%|██▌       | 5/20 [00:02<00:05,  2.74it/s][A
 45%|████▌     | 9/20 [00:03<00:03,  3.37it/s][A
 65%|██████▌   | 13/20 [00:03<00:01,  3.90it/s][A
100%|██████████| 20/20 [00:04<00:00,  4.07it/s][A
Epochs:  74%|███████▎  | 28/38 [21:15<07:37, 45.72s/it]

Val Loss: 0.6673 - Val Accuracy: 0.9386



Training:   0%|          | 0/157 [00:00<?, ?it/s][A
Training:   1%|          | 1/157 [00:01<03:31,  1.35s/it][A
Training:   3%|▎         | 5/157 [00:02<01:01,  2.49it/s][A
Training:   6%|▌         | 9/157 [00:03<00:48,  3.07it/s][A
Training:   8%|▊         | 13/157 [00:04<00:41,  3.44it/s][A
Training:  11%|█         | 17/157 [00:05<00:38,  3.68it/s][A
Training:  13%|█▎        | 20/157 [00:05<00:27,  4.94it/s][A
Training:  14%|█▍        | 22/157 [00:06<00:36,  3.70it/s][A
Training:  16%|█▌        | 25/157 [00:07<00:36,  3.61it/s][A
Training:  17%|█▋        | 26/157 [00:07<00:33,  3.87it/s][A
Training:  18%|█▊        | 29/157 [00:08<00:34,  3.71it/s][A
Training:  19%|█▉        | 30/157 [00:08<00:31,  4.01it/s][A
Training:  21%|██        | 33/157 [00:09<00:32,  3.81it/s][A
Training:  22%|██▏       | 34/157 [00:09<00:31,  3.91it/s][A
Training:  24%|██▎       | 37/157 [00:10<00:30,  3.99it/s][A
Training:  24%|██▍       | 38/157 [00:10<00:28,  4.14it/s][A
Training:  26%|██▌ 

Epoch: 29/38 - Loss: 0.5880 - Accuracy: 0.9445



  0%|          | 0/20 [00:00<?, ?it/s][A
  5%|▌         | 1/20 [00:01<00:21,  1.12s/it][A
 25%|██▌       | 5/20 [00:02<00:05,  2.70it/s][A
 45%|████▌     | 9/20 [00:02<00:03,  3.43it/s][A
 65%|██████▌   | 13/20 [00:03<00:01,  3.86it/s][A
100%|██████████| 20/20 [00:04<00:00,  4.05it/s][A
Epochs:  76%|███████▋  | 29/38 [22:01<06:51, 45.68s/it]

Val Loss: 0.7082 - Val Accuracy: 0.9358



Training:   0%|          | 0/157 [00:00<?, ?it/s][A
Training:   1%|          | 1/157 [00:01<03:25,  1.31s/it][A
Training:   3%|▎         | 5/157 [00:02<00:59,  2.54it/s][A
Training:   6%|▌         | 9/157 [00:03<00:47,  3.10it/s][A
Training:   8%|▊         | 13/157 [00:04<00:41,  3.44it/s][A
Training:  11%|█         | 17/157 [00:05<00:38,  3.65it/s][A
Training:  13%|█▎        | 21/157 [00:06<00:36,  3.70it/s][A
Training:  16%|█▌        | 25/157 [00:07<00:33,  3.89it/s][A
Training:  18%|█▊        | 29/157 [00:08<00:33,  3.84it/s][A
Training:  21%|██        | 33/157 [00:09<00:31,  3.90it/s][A
Training:  23%|██▎       | 36/157 [00:09<00:24,  5.00it/s][A
Training:  24%|██▍       | 38/157 [00:10<00:29,  4.03it/s][A
Training:  26%|██▌       | 41/157 [00:11<00:32,  3.62it/s][A
Training:  29%|██▊       | 45/157 [00:12<00:29,  3.80it/s][A
Training:  31%|███       | 48/157 [00:12<00:21,  5.00it/s][A
Training:  32%|███▏      | 50/157 [00:13<00:27,  3.95it/s][A
Training:  34%|███▍

Epoch: 30/38 - Loss: 0.5976 - Accuracy: 0.9432



  0%|          | 0/20 [00:00<?, ?it/s][A
  5%|▌         | 1/20 [00:01<00:21,  1.12s/it][A
 25%|██▌       | 5/20 [00:02<00:05,  2.65it/s][A
 45%|████▌     | 9/20 [00:03<00:03,  3.35it/s][A
 65%|██████▌   | 13/20 [00:03<00:01,  3.81it/s][A
100%|██████████| 20/20 [00:04<00:00,  4.05it/s][A
Epochs:  79%|███████▉  | 30/38 [22:46<06:05, 45.63s/it]

Val Loss: 0.6659 - Val Accuracy: 0.9371



Training:   0%|          | 0/157 [00:00<?, ?it/s][A
Training:   1%|          | 1/157 [00:01<03:17,  1.27s/it][A
Training:   3%|▎         | 5/157 [00:02<00:59,  2.55it/s][A
Training:   6%|▌         | 9/157 [00:03<00:48,  3.06it/s][A
Training:   8%|▊         | 13/157 [00:04<00:41,  3.45it/s][A
Training:  11%|█         | 17/157 [00:05<00:38,  3.64it/s][A
Training:  13%|█▎        | 21/157 [00:06<00:36,  3.68it/s][A
Training:  16%|█▌        | 25/157 [00:07<00:33,  3.88it/s][A
Training:  18%|█▊        | 29/157 [00:08<00:32,  3.91it/s][A
Training:  21%|██        | 33/157 [00:09<00:31,  3.99it/s][A
Training:  23%|██▎       | 36/157 [00:09<00:23,  5.08it/s][A
Training:  24%|██▍       | 38/157 [00:10<00:29,  4.04it/s][A
Training:  26%|██▌       | 41/157 [00:11<00:32,  3.58it/s][A
Training:  29%|██▊       | 45/157 [00:12<00:29,  3.80it/s][A
Training:  31%|███       | 49/157 [00:13<00:28,  3.82it/s][A
Training:  34%|███▍      | 53/157 [00:14<00:26,  3.89it/s][A
Training:  36%|███▋

Epoch: 31/38 - Loss: 0.5808 - Accuracy: 0.9430



  0%|          | 0/20 [00:00<?, ?it/s][A
  5%|▌         | 1/20 [00:01<00:22,  1.21s/it][A
 25%|██▌       | 5/20 [00:02<00:05,  2.65it/s][A
 45%|████▌     | 9/20 [00:03<00:03,  3.43it/s][A
 65%|██████▌   | 13/20 [00:03<00:01,  3.70it/s][A
100%|██████████| 20/20 [00:04<00:00,  4.08it/s][A
Epochs:  82%|████████▏ | 31/38 [23:32<05:18, 45.57s/it]

Val Loss: 0.6463 - Val Accuracy: 0.9380



Training:   0%|          | 0/157 [00:00<?, ?it/s][A
Training:   1%|          | 1/157 [00:01<03:12,  1.23s/it][A
Training:   3%|▎         | 4/157 [00:01<00:40,  3.82it/s][A
Training:   4%|▍         | 6/157 [00:02<00:54,  2.79it/s][A
Training:   6%|▌         | 9/157 [00:03<00:50,  2.95it/s][A
Training:   8%|▊         | 13/157 [00:04<00:42,  3.42it/s][A
Training:  11%|█         | 17/157 [00:05<00:39,  3.58it/s][A
Training:  13%|█▎        | 20/157 [00:05<00:28,  4.87it/s][A
Training:  14%|█▍        | 22/157 [00:06<00:34,  3.88it/s][A
Training:  16%|█▌        | 25/157 [00:07<00:37,  3.54it/s][A
Training:  18%|█▊        | 29/157 [00:08<00:34,  3.67it/s][A
Training:  21%|██        | 33/157 [00:09<00:32,  3.83it/s][A
Training:  24%|██▎       | 37/157 [00:10<00:31,  3.80it/s][A
Training:  26%|██▌       | 41/157 [00:11<00:29,  3.97it/s][A
Training:  28%|██▊       | 44/157 [00:11<00:22,  5.09it/s][A
Training:  29%|██▉       | 46/157 [00:12<00:28,  3.92it/s][A
Training:  31%|███  

Epoch: 32/38 - Loss: 0.5921 - Accuracy: 0.9450



  0%|          | 0/20 [00:00<?, ?it/s][A
  5%|▌         | 1/20 [00:01<00:22,  1.21s/it][A
 25%|██▌       | 5/20 [00:02<00:05,  2.69it/s][A
 40%|████      | 8/20 [00:02<00:02,  4.70it/s][A
 50%|█████     | 10/20 [00:03<00:02,  3.69it/s][A
 65%|██████▌   | 13/20 [00:03<00:01,  3.54it/s][A
 80%|████████  | 16/20 [00:04<00:00,  5.15it/s][A
100%|██████████| 20/20 [00:04<00:00,  4.09it/s][A
Epochs:  84%|████████▍ | 32/38 [24:17<04:32, 45.50s/it]

Val Loss: 0.6295 - Val Accuracy: 0.9431



Training:   0%|          | 0/157 [00:00<?, ?it/s][A
Training:   1%|          | 1/157 [00:01<03:19,  1.28s/it][A
Training:   3%|▎         | 5/157 [00:02<01:02,  2.42it/s][A
Training:   6%|▌         | 9/157 [00:03<00:47,  3.13it/s][A
Training:   8%|▊         | 13/157 [00:04<00:41,  3.47it/s][A
Training:  11%|█         | 17/157 [00:05<00:39,  3.57it/s][A
Training:  13%|█▎        | 21/157 [00:06<00:36,  3.77it/s][A
Training:  16%|█▌        | 25/157 [00:07<00:34,  3.80it/s][A
Training:  18%|█▊        | 29/157 [00:08<00:33,  3.83it/s][A
Training:  21%|██        | 33/157 [00:09<00:31,  3.95it/s][A
Training:  24%|██▎       | 37/157 [00:10<00:31,  3.87it/s][A
Training:  26%|██▌       | 41/157 [00:11<00:29,  3.89it/s][A
Training:  29%|██▊       | 45/157 [00:12<00:28,  3.95it/s][A
Training:  31%|███       | 49/157 [00:13<00:27,  3.90it/s][A
Training:  34%|███▍      | 53/157 [00:14<00:26,  3.95it/s][A
Training:  36%|███▋      | 57/157 [00:15<00:25,  3.94it/s][A
Training:  39%|███▉

Epoch: 33/38 - Loss: 0.5843 - Accuracy: 0.9439



  0%|          | 0/20 [00:00<?, ?it/s][A
  5%|▌         | 1/20 [00:01<00:23,  1.24s/it][A
 25%|██▌       | 5/20 [00:02<00:05,  2.68it/s][A
 45%|████▌     | 9/20 [00:03<00:03,  3.45it/s][A
 65%|██████▌   | 13/20 [00:03<00:01,  3.73it/s][A
100%|██████████| 20/20 [00:04<00:00,  4.07it/s][A
Epochs:  87%|████████▋ | 33/38 [25:03<03:47, 45.59s/it]

Val Loss: 0.7057 - Val Accuracy: 0.9365



Training:   0%|          | 0/157 [00:00<?, ?it/s][A
Training:   1%|          | 1/157 [00:01<03:19,  1.28s/it][A
Training:   3%|▎         | 4/157 [00:01<00:41,  3.72it/s][A
Training:   4%|▍         | 6/157 [00:02<00:56,  2.66it/s][A
Training:   6%|▌         | 9/157 [00:03<00:50,  2.94it/s][A
Training:   8%|▊         | 13/157 [00:04<00:43,  3.31it/s][A
Training:  11%|█         | 17/157 [00:05<00:39,  3.55it/s][A
Training:  13%|█▎        | 21/157 [00:06<00:36,  3.72it/s][A
Training:  16%|█▌        | 25/157 [00:07<00:35,  3.70it/s][A
Training:  18%|█▊        | 29/157 [00:08<00:33,  3.85it/s][A
Training:  21%|██        | 33/157 [00:09<00:31,  3.88it/s][A
Training:  24%|██▎       | 37/157 [00:10<00:31,  3.84it/s][A
Training:  25%|██▌       | 40/157 [00:10<00:23,  4.90it/s][A
Training:  27%|██▋       | 42/157 [00:11<00:28,  3.97it/s][A
Training:  29%|██▊       | 45/157 [00:12<00:30,  3.63it/s][A
Training:  31%|███       | 49/157 [00:13<00:29,  3.71it/s][A
Training:  34%|███▍ 

Epoch: 34/38 - Loss: 0.5873 - Accuracy: 0.9460



  0%|          | 0/20 [00:00<?, ?it/s][A
  5%|▌         | 1/20 [00:01<00:23,  1.24s/it][A
 25%|██▌       | 5/20 [00:02<00:05,  2.67it/s][A
 45%|████▌     | 9/20 [00:03<00:03,  3.47it/s][A
 65%|██████▌   | 13/20 [00:03<00:01,  3.73it/s][A
100%|██████████| 20/20 [00:04<00:00,  4.07it/s][A
Epochs:  89%|████████▉ | 34/38 [25:49<03:02, 45.63s/it]

Val Loss: 0.6250 - Val Accuracy: 0.9356



Training:   0%|          | 0/157 [00:00<?, ?it/s][A
Training:   1%|          | 1/157 [00:01<03:21,  1.29s/it][A
Training:   3%|▎         | 5/157 [00:02<01:04,  2.37it/s][A
Training:   6%|▌         | 9/157 [00:03<00:48,  3.02it/s][A
Training:   8%|▊         | 13/157 [00:04<00:41,  3.44it/s][A
Training:  11%|█         | 17/157 [00:05<00:38,  3.59it/s][A
Training:  13%|█▎        | 20/157 [00:05<00:28,  4.82it/s][A
Training:  14%|█▍        | 22/157 [00:06<00:34,  3.89it/s][A
Training:  16%|█▌        | 25/157 [00:07<00:38,  3.44it/s][A
Training:  18%|█▊        | 29/157 [00:08<00:34,  3.72it/s][A
Training:  21%|██        | 33/157 [00:09<00:33,  3.71it/s][A
Training:  24%|██▎       | 37/157 [00:10<00:31,  3.83it/s][A
Training:  25%|██▍       | 39/157 [00:10<00:26,  4.50it/s][A
Training:  26%|██▌       | 41/157 [00:11<00:30,  3.76it/s][A
Training:  27%|██▋       | 43/157 [00:11<00:24,  4.62it/s][A
Training:  29%|██▊       | 45/157 [00:12<00:31,  3.52it/s][A
Training:  30%|██▉ 

Epoch: 35/38 - Loss: 0.5915 - Accuracy: 0.9399



  0%|          | 0/20 [00:00<?, ?it/s][A
  5%|▌         | 1/20 [00:01<00:24,  1.27s/it][A
 25%|██▌       | 5/20 [00:02<00:05,  2.67it/s][A
 45%|████▌     | 9/20 [00:03<00:03,  3.37it/s][A
 65%|██████▌   | 13/20 [00:03<00:01,  3.79it/s][A
100%|██████████| 20/20 [00:04<00:00,  4.00it/s][A
Epochs:  92%|█████████▏| 35/38 [26:35<02:17, 45.73s/it]

Val Loss: 0.6913 - Val Accuracy: 0.9328



Training:   0%|          | 0/157 [00:00<?, ?it/s][A
Training:   1%|          | 1/157 [00:01<03:26,  1.33s/it][A
Training:   3%|▎         | 5/157 [00:02<01:04,  2.37it/s][A
Training:   5%|▌         | 8/157 [00:02<00:35,  4.22it/s][A
Training:   6%|▋         | 10/157 [00:03<00:45,  3.22it/s][A
Training:   8%|▊         | 13/157 [00:04<00:47,  3.03it/s][A
Training:  11%|█         | 17/157 [00:05<00:40,  3.43it/s][A
Training:  13%|█▎        | 21/157 [00:06<00:37,  3.60it/s][A
Training:  16%|█▌        | 25/157 [00:07<00:35,  3.73it/s][A
Training:  18%|█▊        | 29/157 [00:08<00:33,  3.87it/s][A
Training:  21%|██        | 33/157 [00:09<00:32,  3.81it/s][A
Training:  24%|██▎       | 37/157 [00:10<00:30,  3.97it/s][A
Training:  26%|██▌       | 41/157 [00:11<00:29,  3.92it/s][A
Training:  29%|██▊       | 45/157 [00:12<00:28,  3.91it/s][A
Training:  31%|███       | 49/157 [00:13<00:27,  3.96it/s][A
Training:  34%|███▍      | 53/157 [00:14<00:27,  3.85it/s][A
Training:  36%|███▋

Epoch: 36/38 - Loss: 0.5903 - Accuracy: 0.9448



  0%|          | 0/20 [00:00<?, ?it/s][A
  5%|▌         | 1/20 [00:01<00:21,  1.12s/it][A
 25%|██▌       | 5/20 [00:02<00:05,  2.71it/s][A
 45%|████▌     | 9/20 [00:02<00:03,  3.49it/s][A
 65%|██████▌   | 13/20 [00:03<00:01,  3.68it/s][A
100%|██████████| 20/20 [00:04<00:00,  4.08it/s][A
Epochs:  95%|█████████▍| 36/38 [27:20<01:31, 45.73s/it]

Val Loss: 0.6662 - Val Accuracy: 0.9311



Training:   0%|          | 0/157 [00:00<?, ?it/s][A
Training:   1%|          | 1/157 [00:01<03:15,  1.25s/it][A
Training:   3%|▎         | 4/157 [00:01<00:40,  3.74it/s][A
Training:   4%|▍         | 6/157 [00:02<00:54,  2.76it/s][A
Training:   6%|▌         | 9/157 [00:03<00:50,  2.94it/s][A
Training:   8%|▊         | 13/157 [00:04<00:42,  3.37it/s][A
Training:  11%|█         | 17/157 [00:05<00:39,  3.54it/s][A
Training:  13%|█▎        | 21/157 [00:06<00:36,  3.74it/s][A
Training:  16%|█▌        | 25/157 [00:07<00:35,  3.71it/s][A
Training:  18%|█▊        | 29/157 [00:08<00:34,  3.75it/s][A
Training:  21%|██        | 33/157 [00:09<00:32,  3.83it/s][A
Training:  24%|██▎       | 37/157 [00:10<00:31,  3.81it/s][A
Training:  26%|██▌       | 41/157 [00:11<00:29,  3.96it/s][A
Training:  29%|██▊       | 45/157 [00:12<00:28,  3.87it/s][A
Training:  31%|███       | 49/157 [00:13<00:27,  3.88it/s][A
Training:  34%|███▍      | 53/157 [00:14<00:26,  3.98it/s][A
Training:  36%|███▋ 

Epoch: 37/38 - Loss: 0.5887 - Accuracy: 0.9435



  0%|          | 0/20 [00:00<?, ?it/s][A
  5%|▌         | 1/20 [00:01<00:23,  1.21s/it][A
 25%|██▌       | 5/20 [00:02<00:05,  2.70it/s][A
 45%|████▌     | 9/20 [00:02<00:03,  3.46it/s][A
 65%|██████▌   | 13/20 [00:03<00:01,  3.81it/s][A
100%|██████████| 20/20 [00:04<00:00,  4.12it/s][A
Epochs:  97%|█████████▋| 37/38 [28:06<00:45, 45.70s/it]

Val Loss: 0.7027 - Val Accuracy: 0.9354



Training:   0%|          | 0/157 [00:00<?, ?it/s][A
Training:   1%|          | 1/157 [00:01<03:21,  1.29s/it][A
Training:   3%|▎         | 4/157 [00:01<00:41,  3.66it/s][A
Training:   4%|▍         | 6/157 [00:02<00:57,  2.63it/s][A
Training:   6%|▌         | 9/157 [00:03<00:49,  2.98it/s][A
Training:   6%|▋         | 10/157 [00:03<00:43,  3.41it/s][A
Training:   8%|▊         | 13/157 [00:04<00:44,  3.26it/s][A
Training:  10%|▉         | 15/157 [00:04<00:32,  4.32it/s][A
Training:  11%|█         | 17/157 [00:05<00:41,  3.39it/s][A
Training:  11%|█▏        | 18/157 [00:05<00:37,  3.72it/s][A
Training:  13%|█▎        | 21/157 [00:06<00:36,  3.68it/s][A
Training:  14%|█▍        | 22/157 [00:06<00:33,  4.03it/s][A
Training:  16%|█▌        | 25/157 [00:07<00:36,  3.61it/s][A
Training:  17%|█▋        | 27/157 [00:07<00:27,  4.67it/s][A
Training:  18%|█▊        | 29/157 [00:08<00:34,  3.76it/s][A
Training:  19%|█▉        | 30/157 [00:08<00:32,  3.93it/s][A
Training:  21%|██   

Epoch: 38/38 - Loss: 0.5766 - Accuracy: 0.9450



  0%|          | 0/20 [00:00<?, ?it/s][A
  5%|▌         | 1/20 [00:01<00:22,  1.20s/it][A
 25%|██▌       | 5/20 [00:02<00:05,  2.61it/s][A
 45%|████▌     | 9/20 [00:02<00:03,  3.48it/s][A
 65%|██████▌   | 13/20 [00:03<00:01,  3.76it/s][A
100%|██████████| 20/20 [00:04<00:00,  4.05it/s][A
Epochs: 100%|██████████| 38/38 [28:52<00:00, 45.59s/it]
[32m[I 2023-12-15 04:36:40,876][0m Trial 11 finished with value: 0.9303684234619141 and parameters: {'learning_rate': 0.0002823858251405799, 'weight_decay': 0.00036934903983322265, 'epsilon': 4.3482407552971556e-09, 'batch_size': 89, 'epochs': 38}. Best is trial 2 with value: 0.9405519962310791.[0m


Val Loss: 0.6827 - Val Accuracy: 0.9304
Learning rate: 0.00020661369754506833
Weight decay: 0.001854784109648099
Epsilon: 1.1302129242663285e-09
Batch size: 123
Number of epochs: 63


Epochs:   0%|          | 0/63 [00:00<?, ?it/s]
Training:   0%|          | 0/114 [00:00<?, ?it/s][A
Training:   1%|          | 1/114 [00:01<03:10,  1.68s/it][A
Training:   4%|▎         | 4/114 [00:01<00:38,  2.87it/s][A
Training:   5%|▌         | 6/114 [00:03<00:52,  2.05it/s][A
Training:   8%|▊         | 9/114 [00:04<00:48,  2.17it/s][A
Training:  11%|█         | 12/114 [00:04<00:29,  3.47it/s][A
Training:  12%|█▏        | 14/114 [00:05<00:38,  2.58it/s][A
Training:  15%|█▍        | 17/114 [00:07<00:39,  2.44it/s][A
Training:  18%|█▊        | 20/114 [00:07<00:26,  3.55it/s][A
Training:  19%|█▉        | 22/114 [00:08<00:34,  2.64it/s][A
Training:  22%|██▏       | 25/114 [00:10<00:36,  2.46it/s][A
Training:  24%|██▎       | 27/114 [00:10<00:27,  3.13it/s][A
Training:  25%|██▌       | 29/114 [00:11<00:34,  2.46it/s][A
Training:  26%|██▋       | 30/114 [00:11<00:30,  2.77it/s][A
Training:  29%|██▉       | 33/114 [00:12<00:31,  2.58it/s][A
Training:  30%|██▉       | 34/114 [0

Epoch: 1/63 - Loss: 4.1571 - Accuracy: 0.7800



  0%|          | 0/15 [00:00<?, ?it/s][A
  7%|▋         | 1/15 [00:01<00:22,  1.60s/it][A
 33%|███▎      | 5/15 [00:02<00:05,  1.95it/s][A
 60%|██████    | 9/15 [00:04<00:02,  2.53it/s][A
100%|██████████| 15/15 [00:05<00:00,  2.79it/s][A
Epochs:   0%|          | 0/63 [00:46<?, ?it/s]
[32m[I 2023-12-15 04:37:27,317][0m Trial 12 pruned. [0m


Val Loss: 2.8852 - Val Accuracy: 0.8937
Learning rate: 0.000596159547334826
Weight decay: 0.0003996636985332951
Epsilon: 5.074725794249708e-09
Batch size: 67
Number of epochs: 65


Epochs:   0%|          | 0/65 [00:00<?, ?it/s]
Training:   0%|          | 0/209 [00:00<?, ?it/s][A
Training:   0%|          | 1/209 [00:01<03:27,  1.00it/s][A
Training:   2%|▏         | 5/209 [00:01<01:06,  3.07it/s][A
Training:   4%|▍         | 9/209 [00:02<00:48,  4.16it/s][A
Training:   6%|▌         | 13/209 [00:03<00:44,  4.38it/s][A
Training:   8%|▊         | 17/209 [00:04<00:39,  4.83it/s][A
Training:  10%|█         | 21/209 [00:04<00:39,  4.78it/s][A
Training:  12%|█▏        | 25/209 [00:05<00:35,  5.13it/s][A
Training:  14%|█▍        | 29/209 [00:06<00:35,  5.00it/s][A
Training:  16%|█▌        | 33/209 [00:07<00:33,  5.19it/s][A
Training:  18%|█▊        | 37/209 [00:07<00:32,  5.24it/s][A
Training:  20%|█▉        | 41/209 [00:08<00:32,  5.20it/s][A
Training:  22%|██▏       | 45/209 [00:09<00:30,  5.35it/s][A
Training:  23%|██▎       | 49/209 [00:10<00:30,  5.24it/s][A
Training:  25%|██▌       | 53/209 [00:10<00:29,  5.33it/s][A
Training:  27%|██▋       | 57/209 [

Epoch: 1/65 - Loss: 2.9321 - Accuracy: 0.8661



  0%|          | 0/27 [00:00<?, ?it/s][A
  4%|▎         | 1/27 [00:00<00:25,  1.01it/s][A
 19%|█▊        | 5/27 [00:01<00:06,  3.39it/s][A
 33%|███▎      | 9/27 [00:02<00:03,  4.61it/s][A
 48%|████▊     | 13/27 [00:03<00:02,  4.87it/s][A
 63%|██████▎   | 17/27 [00:03<00:01,  5.45it/s][A
 78%|███████▊  | 21/27 [00:04<00:01,  5.49it/s][A
100%|██████████| 27/27 [00:05<00:00,  5.31it/s][A
Epochs:   0%|          | 0/65 [00:45<?, ?it/s]
[32m[I 2023-12-15 04:38:13,076][0m Trial 13 pruned. [0m


Val Loss: 2.1333 - Val Accuracy: 0.9003
Learning rate: 7.43105201067417e-05
Weight decay: 0.0018632437914117503
Epsilon: 2.880140018685109e-09
Batch size: 168
Number of epochs: 41


Epochs:   0%|          | 0/41 [00:00<?, ?it/s]
Training:   0%|          | 0/84 [00:00<?, ?it/s][A
Training:   1%|          | 1/84 [00:02<03:08,  2.27s/it][A
Training:   5%|▍         | 4/84 [00:02<00:37,  2.15it/s][A
Training:   7%|▋         | 6/84 [00:04<00:50,  1.53it/s][A
Training:  11%|█         | 9/84 [00:06<00:47,  1.57it/s][A
Training:  14%|█▍        | 12/84 [00:06<00:28,  2.54it/s][A
Training:  17%|█▋        | 14/84 [00:07<00:37,  1.88it/s][A
Training:  20%|██        | 17/84 [00:09<00:37,  1.78it/s][A
Training:  24%|██▍       | 20/84 [00:09<00:24,  2.62it/s][A
Training:  26%|██▌       | 22/84 [00:11<00:31,  1.94it/s][A
Training:  30%|██▉       | 25/84 [00:13<00:33,  1.78it/s][A
Training:  33%|███▎      | 28/84 [00:13<00:21,  2.57it/s][A
Training:  36%|███▌      | 30/84 [00:15<00:28,  1.93it/s][A
Training:  39%|███▉      | 33/84 [00:17<00:28,  1.81it/s][A
Training:  43%|████▎     | 36/84 [00:17<00:18,  2.59it/s][A
Training:  45%|████▌     | 38/84 [00:19<00:23,  1.9

Epoch: 1/41 - Loss: 6.1369 - Accuracy: 0.5781



  0%|          | 0/11 [00:00<?, ?it/s][A
  9%|▉         | 1/11 [00:01<00:19,  1.96s/it][A
 36%|███▋      | 4/11 [00:02<00:02,  2.47it/s][A
 55%|█████▍    | 6/11 [00:03<00:02,  1.71it/s][A
100%|██████████| 11/11 [00:05<00:00,  2.01it/s][A
Epochs:   0%|          | 0/41 [00:45<?, ?it/s]
[32m[I 2023-12-15 04:38:59,196][0m Trial 14 pruned. [0m


Val Loss: 4.8257 - Val Accuracy: 0.6898
Learning rate: 0.0007965009741028532
Weight decay: 0.0004238400381991029
Epsilon: 2.4426663175115657e-08
Batch size: 117
Number of epochs: 85


Epochs:   0%|          | 0/85 [00:00<?, ?it/s]
Training:   0%|          | 0/120 [00:00<?, ?it/s][A
Training:   1%|          | 1/120 [00:01<03:16,  1.65s/it][A
Training:   3%|▎         | 4/120 [00:01<00:39,  2.94it/s][A
Training:   5%|▌         | 6/120 [00:02<00:52,  2.16it/s][A
Training:   8%|▊         | 9/120 [00:04<00:48,  2.28it/s][A
Training:  10%|█         | 12/120 [00:04<00:29,  3.64it/s][A
Training:  12%|█▏        | 14/120 [00:05<00:39,  2.70it/s][A
Training:  14%|█▍        | 17/120 [00:06<00:41,  2.49it/s][A
Training:  18%|█▊        | 21/120 [00:08<00:37,  2.66it/s][A
Training:  21%|██        | 25/120 [00:09<00:34,  2.74it/s][A
Training:  24%|██▍       | 29/120 [00:10<00:31,  2.85it/s][A
Training:  28%|██▊       | 33/120 [00:12<00:29,  2.95it/s][A
Training:  31%|███       | 37/120 [00:13<00:28,  2.95it/s][A
Training:  33%|███▎      | 40/120 [00:13<00:20,  3.83it/s][A
Training:  35%|███▌      | 42/120 [00:15<00:26,  2.91it/s][A
Training:  38%|███▊      | 45/120 [0

Epoch: 1/85 - Loss: 3.0044 - Accuracy: 0.8565



  0%|          | 0/15 [00:00<?, ?it/s][A
  7%|▋         | 1/15 [00:01<00:21,  1.53s/it][A
 33%|███▎      | 5/15 [00:02<00:04,  2.07it/s][A
 60%|██████    | 9/15 [00:03<00:02,  2.66it/s][A
100%|██████████| 15/15 [00:05<00:00,  2.96it/s][A
Epochs:   1%|          | 1/85 [00:45<1:03:31, 45.38s/it]

Val Loss: 1.8123 - Val Accuracy: 0.9193



Training:   0%|          | 0/120 [00:00<?, ?it/s][A
Training:   1%|          | 1/120 [00:01<03:16,  1.65s/it][A
Training:   3%|▎         | 4/120 [00:01<00:39,  2.93it/s][A
Training:   5%|▌         | 6/120 [00:02<00:51,  2.19it/s][A
Training:   8%|▊         | 9/120 [00:04<00:49,  2.24it/s][A
Training:  11%|█         | 13/120 [00:05<00:41,  2.55it/s][A
Training:  14%|█▍        | 17/120 [00:06<00:37,  2.77it/s][A
Training:  18%|█▊        | 21/120 [00:08<00:33,  2.93it/s][A
Training:  19%|█▉        | 23/120 [00:08<00:27,  3.52it/s][A
Training:  21%|██        | 25/120 [00:09<00:33,  2.85it/s][A
Training:  23%|██▎       | 28/120 [00:09<00:22,  4.02it/s][A
Training:  25%|██▌       | 30/120 [00:10<00:30,  2.92it/s][A
Training:  28%|██▊       | 33/120 [00:12<00:32,  2.69it/s][A
Training:  29%|██▉       | 35/120 [00:12<00:25,  3.40it/s][A
Training:  31%|███       | 37/120 [00:13<00:31,  2.67it/s][A
Training:  33%|███▎      | 40/120 [00:13<00:20,  3.90it/s][A
Training:  35%|███▌ 

Epoch: 2/85 - Loss: 1.6333 - Accuracy: 0.9228



  0%|          | 0/15 [00:00<?, ?it/s][A
  7%|▋         | 1/15 [00:01<00:22,  1.58s/it][A
 33%|███▎      | 5/15 [00:02<00:04,  2.10it/s][A
 60%|██████    | 9/15 [00:03<00:02,  2.65it/s][A
100%|██████████| 15/15 [00:05<00:00,  2.90it/s][A
Epochs:   2%|▏         | 2/85 [01:30<1:02:32, 45.21s/it]

Val Loss: 1.4580 - Val Accuracy: 0.9267



Training:   0%|          | 0/120 [00:00<?, ?it/s][A
Training:   1%|          | 1/120 [00:01<03:14,  1.63s/it][A
Training:   4%|▍         | 5/120 [00:02<01:01,  1.88it/s][A
Training:   8%|▊         | 9/120 [00:04<00:45,  2.43it/s][A
Training:  10%|█         | 12/120 [00:04<00:29,  3.68it/s][A
Training:  12%|█▏        | 14/120 [00:05<00:37,  2.82it/s][A
Training:  14%|█▍        | 17/120 [00:06<00:40,  2.55it/s][A
Training:  18%|█▊        | 21/120 [00:08<00:36,  2.74it/s][A
Training:  20%|██        | 24/120 [00:08<00:25,  3.76it/s][A
Training:  22%|██▏       | 26/120 [00:09<00:31,  2.95it/s][A
Training:  24%|██▍       | 29/120 [00:10<00:32,  2.80it/s][A
Training:  27%|██▋       | 32/120 [00:10<00:22,  3.90it/s][A
Training:  28%|██▊       | 34/120 [00:12<00:29,  2.91it/s][A
Training:  31%|███       | 37/120 [00:13<00:30,  2.70it/s][A
Training:  32%|███▎      | 39/120 [00:13<00:23,  3.39it/s][A
Training:  34%|███▍      | 41/120 [00:14<00:29,  2.71it/s][A
Training:  36%|███▌

Epoch: 3/85 - Loss: 1.4241 - Accuracy: 0.9284



  0%|          | 0/15 [00:00<?, ?it/s][A
  7%|▋         | 1/15 [00:01<00:21,  1.51s/it][A
 33%|███▎      | 5/15 [00:02<00:04,  2.07it/s][A
 60%|██████    | 9/15 [00:03<00:02,  2.68it/s][A
100%|██████████| 15/15 [00:05<00:00,  2.97it/s][A
Epochs:   4%|▎         | 3/85 [02:15<1:01:37, 45.09s/it]

Val Loss: 1.3667 - Val Accuracy: 0.9107



Training:   0%|          | 0/120 [00:00<?, ?it/s][A
Training:   1%|          | 1/120 [00:01<03:11,  1.61s/it][A
Training:   3%|▎         | 4/120 [00:01<00:38,  3.00it/s][A
Training:   5%|▌         | 6/120 [00:02<00:52,  2.17it/s][A
Training:   8%|▊         | 9/120 [00:04<00:49,  2.22it/s][A
Training:  11%|█         | 13/120 [00:05<00:42,  2.52it/s][A
Training:  14%|█▍        | 17/120 [00:06<00:37,  2.74it/s][A
Training:  18%|█▊        | 21/120 [00:08<00:34,  2.87it/s][A
Training:  21%|██        | 25/120 [00:09<00:32,  2.92it/s][A
Training:  24%|██▍       | 29/120 [00:10<00:31,  2.93it/s][A
Training:  28%|██▊       | 33/120 [00:12<00:29,  2.94it/s][A
Training:  31%|███       | 37/120 [00:13<00:27,  2.99it/s][A
Training:  34%|███▍      | 41/120 [00:14<00:25,  3.04it/s][A
Training:  38%|███▊      | 45/120 [00:16<00:24,  3.05it/s][A
Training:  41%|████      | 49/120 [00:17<00:23,  3.01it/s][A
Training:  44%|████▍     | 53/120 [00:18<00:22,  2.99it/s][A
Training:  48%|████▊

Epoch: 4/85 - Loss: 1.2376 - Accuracy: 0.9303



  0%|          | 0/15 [00:00<?, ?it/s][A
  7%|▋         | 1/15 [00:01<00:20,  1.44s/it][A
 27%|██▋       | 4/15 [00:01<00:03,  3.29it/s][A
 40%|████      | 6/15 [00:02<00:03,  2.51it/s][A
 53%|█████▎    | 8/15 [00:02<00:01,  3.76it/s][A
 67%|██████▋   | 10/15 [00:03<00:01,  2.61it/s][A
100%|██████████| 15/15 [00:05<00:00,  2.95it/s][A
Epochs:   5%|▍         | 4/85 [03:00<1:00:55, 45.13s/it]

Val Loss: 1.1185 - Val Accuracy: 0.9386



Training:   0%|          | 0/120 [00:00<?, ?it/s][A
Training:   1%|          | 1/120 [00:01<03:07,  1.58s/it][A
Training:   3%|▎         | 4/120 [00:01<00:37,  3.06it/s][A
Training:   5%|▌         | 6/120 [00:02<00:50,  2.25it/s][A
Training:   8%|▊         | 9/120 [00:04<00:46,  2.36it/s][A
Training:   9%|▉         | 11/120 [00:04<00:33,  3.26it/s][A
Training:  11%|█         | 13/120 [00:05<00:42,  2.49it/s][A
Training:  13%|█▎        | 16/120 [00:05<00:26,  3.92it/s][A
Training:  15%|█▌        | 18/120 [00:06<00:36,  2.76it/s][A
Training:  18%|█▊        | 21/120 [00:08<00:38,  2.59it/s][A
Training:  20%|██        | 24/120 [00:08<00:25,  3.78it/s][A
Training:  22%|██▏       | 26/120 [00:09<00:32,  2.86it/s][A
Training:  24%|██▍       | 29/120 [00:10<00:33,  2.69it/s][A
Training:  27%|██▋       | 32/120 [00:10<00:22,  3.85it/s][A
Training:  28%|██▊       | 34/120 [00:12<00:30,  2.86it/s][A
Training:  31%|███       | 37/120 [00:13<00:31,  2.61it/s][A
Training:  34%|███▍ 

Epoch: 5/85 - Loss: 1.1629 - Accuracy: 0.9325



  0%|          | 0/15 [00:00<?, ?it/s][A
  7%|▋         | 1/15 [00:01<00:21,  1.51s/it][A
 27%|██▋       | 4/15 [00:01<00:03,  3.19it/s][A
 40%|████      | 6/15 [00:02<00:03,  2.43it/s][A
 60%|██████    | 9/15 [00:03<00:02,  2.57it/s][A
100%|██████████| 15/15 [00:05<00:00,  2.98it/s][A
Epochs:   6%|▌         | 5/85 [03:45<1:00:06, 45.09s/it]

Val Loss: 1.1087 - Val Accuracy: 0.9326



Training:   0%|          | 0/120 [00:00<?, ?it/s][A
Training:   1%|          | 1/120 [00:01<03:21,  1.69s/it][A
Training:   4%|▍         | 5/120 [00:03<01:02,  1.85it/s][A
Training:   8%|▊         | 9/120 [00:04<00:47,  2.33it/s][A
Training:  11%|█         | 13/120 [00:05<00:40,  2.64it/s][A
Training:  13%|█▎        | 16/120 [00:05<00:27,  3.72it/s][A
Training:  15%|█▌        | 18/120 [00:06<00:35,  2.91it/s][A
Training:  18%|█▊        | 21/120 [00:08<00:37,  2.67it/s][A
Training:  20%|██        | 24/120 [00:08<00:25,  3.79it/s][A
Training:  22%|██▏       | 26/120 [00:09<00:32,  2.85it/s][A
Training:  24%|██▍       | 29/120 [00:10<00:34,  2.63it/s][A
Training:  28%|██▊       | 33/120 [00:12<00:31,  2.79it/s][A
Training:  31%|███       | 37/120 [00:13<00:28,  2.91it/s][A
Training:  34%|███▍      | 41/120 [00:14<00:27,  2.90it/s][A
Training:  38%|███▊      | 45/120 [00:16<00:25,  2.93it/s][A
Training:  40%|████      | 48/120 [00:16<00:18,  3.82it/s][A
Training:  42%|████

Epoch: 6/85 - Loss: 1.1435 - Accuracy: 0.9305



  0%|          | 0/15 [00:00<?, ?it/s][A
  7%|▋         | 1/15 [00:01<00:20,  1.44s/it][A
 33%|███▎      | 5/15 [00:02<00:04,  2.08it/s][A
 60%|██████    | 9/15 [00:03<00:02,  2.64it/s][A
100%|██████████| 15/15 [00:05<00:00,  2.96it/s][A
Epochs:   7%|▋         | 6/85 [04:30<59:25, 45.14s/it]  

Val Loss: 1.1764 - Val Accuracy: 0.9331



Training:   0%|          | 0/120 [00:00<?, ?it/s][A
Training:   1%|          | 1/120 [00:01<03:09,  1.59s/it][A
Training:   3%|▎         | 4/120 [00:01<00:38,  2.98it/s][A
Training:   5%|▌         | 6/120 [00:02<00:51,  2.23it/s][A
Training:   8%|▊         | 9/120 [00:04<00:48,  2.28it/s][A
Training:  10%|█         | 12/120 [00:04<00:29,  3.65it/s][A
Training:  12%|█▏        | 14/120 [00:05<00:40,  2.64it/s][A
Training:  14%|█▍        | 17/120 [00:06<00:39,  2.59it/s][A
Training:  15%|█▌        | 18/120 [00:06<00:35,  2.84it/s][A
Training:  18%|█▊        | 21/120 [00:08<00:35,  2.79it/s][A
Training:  18%|█▊        | 22/120 [00:08<00:31,  3.08it/s][A
Training:  21%|██        | 25/120 [00:09<00:33,  2.84it/s][A
Training:  22%|██▏       | 26/120 [00:09<00:29,  3.21it/s][A
Training:  24%|██▍       | 29/120 [00:10<00:32,  2.81it/s][A
Training:  25%|██▌       | 30/120 [00:10<00:28,  3.12it/s][A
Training:  28%|██▊       | 33/120 [00:12<00:30,  2.82it/s][A
Training:  28%|██▊  

Epoch: 7/85 - Loss: 1.0362 - Accuracy: 0.9346



  0%|          | 0/15 [00:00<?, ?it/s][A
  7%|▋         | 1/15 [00:01<00:20,  1.49s/it][A
 33%|███▎      | 5/15 [00:02<00:04,  2.04it/s][A
 60%|██████    | 9/15 [00:03<00:02,  2.67it/s][A
100%|██████████| 15/15 [00:05<00:00,  2.95it/s][A
Epochs:   8%|▊         | 7/85 [05:15<58:31, 45.02s/it]

Val Loss: 1.0123 - Val Accuracy: 0.9352



Training:   0%|          | 0/120 [00:00<?, ?it/s][A
Training:   1%|          | 1/120 [00:01<03:14,  1.63s/it][A
Training:   3%|▎         | 4/120 [00:01<00:39,  2.96it/s][A
Training:   5%|▌         | 6/120 [00:02<00:50,  2.24it/s][A
Training:   8%|▊         | 9/120 [00:04<00:48,  2.27it/s][A
Training:  11%|█         | 13/120 [00:05<00:41,  2.58it/s][A
Training:  14%|█▍        | 17/120 [00:06<00:37,  2.75it/s][A
Training:  18%|█▊        | 21/120 [00:08<00:34,  2.90it/s][A
Training:  20%|██        | 24/120 [00:08<00:24,  3.85it/s][A
Training:  22%|██▏       | 26/120 [00:09<00:30,  3.05it/s][A
Training:  24%|██▍       | 29/120 [00:10<00:33,  2.70it/s][A
Training:  28%|██▊       | 33/120 [00:12<00:31,  2.79it/s][A
Training:  30%|███       | 36/120 [00:12<00:22,  3.76it/s][A
Training:  32%|███▏      | 38/120 [00:13<00:28,  2.92it/s][A
Training:  34%|███▍      | 41/120 [00:14<00:28,  2.73it/s][A
Training:  37%|███▋      | 44/120 [00:14<00:20,  3.77it/s][A
Training:  38%|███▊ 

Epoch: 8/85 - Loss: 1.0753 - Accuracy: 0.9347



  0%|          | 0/15 [00:00<?, ?it/s][A
  7%|▋         | 1/15 [00:01<00:20,  1.48s/it][A
 33%|███▎      | 5/15 [00:02<00:04,  2.18it/s][A
 60%|██████    | 9/15 [00:03<00:02,  2.66it/s][A
100%|██████████| 15/15 [00:05<00:00,  2.94it/s][A
Epochs:   9%|▉         | 8/85 [06:00<57:45, 45.00s/it]

Val Loss: 1.0392 - Val Accuracy: 0.9392



Training:   0%|          | 0/120 [00:00<?, ?it/s][A
Training:   1%|          | 1/120 [00:01<03:12,  1.62s/it][A
Training:   3%|▎         | 4/120 [00:01<00:38,  3.00it/s][A
Training:   5%|▌         | 6/120 [00:03<00:53,  2.14it/s][A
Training:   8%|▊         | 9/120 [00:04<00:48,  2.28it/s][A
Training:  10%|█         | 12/120 [00:04<00:29,  3.64it/s][A
Training:  12%|█▏        | 14/120 [00:05<00:38,  2.73it/s][A
Training:  14%|█▍        | 17/120 [00:06<00:39,  2.59it/s][A
Training:  16%|█▌        | 19/120 [00:06<00:30,  3.34it/s][A
Training:  18%|█▊        | 21/120 [00:08<00:38,  2.59it/s][A
Training:  18%|█▊        | 22/120 [00:08<00:33,  2.95it/s][A
Training:  21%|██        | 25/120 [00:09<00:35,  2.71it/s][A
Training:  22%|██▏       | 26/120 [00:09<00:30,  3.06it/s][A
Training:  24%|██▍       | 29/120 [00:10<00:31,  2.92it/s][A
Training:  25%|██▌       | 30/120 [00:10<00:27,  3.24it/s][A
Training:  28%|██▊       | 33/120 [00:11<00:29,  2.92it/s][A
Training:  29%|██▉  

Epoch: 9/85 - Loss: 1.0948 - Accuracy: 0.9348



  0%|          | 0/15 [00:00<?, ?it/s][A
  7%|▋         | 1/15 [00:01<00:20,  1.49s/it][A
 27%|██▋       | 4/15 [00:01<00:03,  3.22it/s][A
 40%|████      | 6/15 [00:02<00:03,  2.34it/s][A
 60%|██████    | 9/15 [00:03<00:02,  2.49it/s][A
100%|██████████| 15/15 [00:05<00:00,  2.98it/s][A
Epochs:  11%|█         | 9/85 [06:45<56:56, 44.96s/it]

Val Loss: 1.1038 - Val Accuracy: 0.9319



Training:   0%|          | 0/120 [00:00<?, ?it/s][A
Training:   1%|          | 1/120 [00:01<03:10,  1.60s/it][A
Training:   3%|▎         | 4/120 [00:01<00:38,  2.99it/s][A
Training:   5%|▌         | 6/120 [00:02<00:51,  2.23it/s][A
Training:   8%|▊         | 9/120 [00:04<00:49,  2.25it/s][A
Training:  10%|█         | 12/120 [00:04<00:29,  3.61it/s][A
Training:  12%|█▏        | 14/120 [00:05<00:39,  2.67it/s][A
Training:  14%|█▍        | 17/120 [00:06<00:39,  2.58it/s][A
Training:  17%|█▋        | 20/120 [00:06<00:26,  3.77it/s][A
Training:  18%|█▊        | 22/120 [00:08<00:34,  2.85it/s][A
Training:  21%|██        | 25/120 [00:09<00:35,  2.64it/s][A
Training:  24%|██▍       | 29/120 [00:10<00:33,  2.74it/s][A
Training:  28%|██▊       | 33/120 [00:12<00:30,  2.82it/s][A
Training:  31%|███       | 37/120 [00:13<00:28,  2.92it/s][A
Training:  33%|███▎      | 40/120 [00:13<00:20,  3.82it/s][A
Training:  35%|███▌      | 42/120 [00:14<00:25,  3.07it/s][A
Training:  38%|███▊ 

Epoch: 10/85 - Loss: 1.0547 - Accuracy: 0.9382



  0%|          | 0/15 [00:00<?, ?it/s][A
  7%|▋         | 1/15 [00:01<00:20,  1.44s/it][A
 33%|███▎      | 5/15 [00:02<00:04,  2.20it/s][A
 60%|██████    | 9/15 [00:03<00:02,  2.67it/s][A
 87%|████████▋ | 13/15 [00:04<00:00,  2.96it/s][A
100%|██████████| 15/15 [00:05<00:00,  2.91it/s][A
Epochs:  12%|█▏        | 10/85 [07:30<56:17, 45.03s/it]

Val Loss: 0.9146 - Val Accuracy: 0.9393



Training:   0%|          | 0/120 [00:00<?, ?it/s][A
Training:   1%|          | 1/120 [00:01<03:18,  1.67s/it][A
Training:   3%|▎         | 4/120 [00:01<00:39,  2.92it/s][A
Training:   5%|▌         | 6/120 [00:03<00:54,  2.09it/s][A
Training:   8%|▊         | 9/120 [00:04<00:49,  2.24it/s][A
Training:  11%|█         | 13/120 [00:05<00:40,  2.62it/s][A
Training:  14%|█▍        | 17/120 [00:06<00:37,  2.75it/s][A
Training:  18%|█▊        | 21/120 [00:08<00:35,  2.82it/s][A
Training:  21%|██        | 25/120 [00:09<00:33,  2.85it/s][A
Training:  24%|██▍       | 29/120 [00:10<00:31,  2.90it/s][A
Training:  28%|██▊       | 33/120 [00:12<00:29,  3.00it/s][A
Training:  30%|███       | 36/120 [00:12<00:21,  3.89it/s][A
Training:  32%|███▏      | 38/120 [00:13<00:26,  3.06it/s][A
Training:  34%|███▍      | 41/120 [00:14<00:28,  2.77it/s][A
Training:  38%|███▊      | 45/120 [00:16<00:26,  2.84it/s][A
Training:  41%|████      | 49/120 [00:17<00:24,  2.89it/s][A
Training:  44%|████▍

Epoch: 11/85 - Loss: 1.0197 - Accuracy: 0.9372



  0%|          | 0/15 [00:00<?, ?it/s][A
  7%|▋         | 1/15 [00:01<00:20,  1.49s/it][A
 27%|██▋       | 4/15 [00:01<00:03,  3.22it/s][A
 40%|████      | 6/15 [00:02<00:03,  2.50it/s][A
 60%|██████    | 9/15 [00:03<00:02,  2.53it/s][A
100%|██████████| 15/15 [00:05<00:00,  2.96it/s][A
Epochs:  13%|█▎        | 11/85 [08:15<55:36, 45.09s/it]

Val Loss: 0.9321 - Val Accuracy: 0.9394



Training:   0%|          | 0/120 [00:00<?, ?it/s][A
Training:   1%|          | 1/120 [00:01<03:17,  1.66s/it][A
Training:   3%|▎         | 4/120 [00:01<00:40,  2.90it/s][A
Training:   5%|▌         | 6/120 [00:03<00:54,  2.09it/s][A
Training:   8%|▊         | 9/120 [00:04<00:49,  2.24it/s][A
Training:  10%|█         | 12/120 [00:04<00:30,  3.58it/s][A
Training:  12%|█▏        | 14/120 [00:05<00:39,  2.70it/s][A
Training:  14%|█▍        | 17/120 [00:06<00:40,  2.53it/s][A
Training:  18%|█▊        | 21/120 [00:08<00:36,  2.69it/s][A
Training:  21%|██        | 25/120 [00:09<00:33,  2.81it/s][A
Training:  24%|██▍       | 29/120 [00:10<00:31,  2.91it/s][A
Training:  26%|██▌       | 31/120 [00:10<00:25,  3.50it/s][A
Training:  28%|██▊       | 33/120 [00:12<00:31,  2.77it/s][A
Training:  30%|███       | 36/120 [00:12<00:21,  3.88it/s][A
Training:  32%|███▏      | 38/120 [00:13<00:28,  2.88it/s][A
Training:  34%|███▍      | 41/120 [00:14<00:29,  2.66it/s][A
Training:  36%|███▌ 

Epoch: 12/85 - Loss: 0.9837 - Accuracy: 0.9380



  0%|          | 0/15 [00:00<?, ?it/s][A
  7%|▋         | 1/15 [00:01<00:21,  1.57s/it][A
 33%|███▎      | 5/15 [00:02<00:04,  2.01it/s][A
 60%|██████    | 9/15 [00:03<00:02,  2.64it/s][A
100%|██████████| 15/15 [00:05<00:00,  2.92it/s][A
Epochs:  14%|█▍        | 12/85 [09:01<54:55, 45.15s/it]

Val Loss: 1.1425 - Val Accuracy: 0.9319



Training:   0%|          | 0/120 [00:00<?, ?it/s][A
Training:   1%|          | 1/120 [00:01<03:12,  1.62s/it][A
Training:   3%|▎         | 4/120 [00:01<00:39,  2.96it/s][A
Training:   5%|▌         | 6/120 [00:02<00:52,  2.17it/s][A
Training:   8%|▊         | 9/120 [00:04<00:49,  2.25it/s][A
Training:  10%|█         | 12/120 [00:04<00:29,  3.60it/s][A
Training:  12%|█▏        | 14/120 [00:05<00:40,  2.62it/s][A
Training:  14%|█▍        | 17/120 [00:06<00:40,  2.51it/s][A
Training:  17%|█▋        | 20/120 [00:07<00:27,  3.66it/s][A
Training:  18%|█▊        | 22/120 [00:08<00:35,  2.77it/s][A
Training:  21%|██        | 25/120 [00:09<00:36,  2.62it/s][A
Training:  23%|██▎       | 28/120 [00:09<00:24,  3.73it/s][A
Training:  25%|██▌       | 30/120 [00:10<00:32,  2.80it/s][A
Training:  28%|██▊       | 33/120 [00:12<00:33,  2.57it/s][A
Training:  31%|███       | 37/120 [00:13<00:30,  2.70it/s][A
Training:  34%|███▍      | 41/120 [00:14<00:27,  2.86it/s][A
Training:  38%|███▊ 

Epoch: 13/85 - Loss: 1.0738 - Accuracy: 0.9340



  0%|          | 0/15 [00:00<?, ?it/s][A
  7%|▋         | 1/15 [00:01<00:21,  1.57s/it][A
 33%|███▎      | 5/15 [00:02<00:04,  2.04it/s][A
 60%|██████    | 9/15 [00:03<00:02,  2.68it/s][A
100%|██████████| 15/15 [00:05<00:00,  2.94it/s][A
Epochs:  15%|█▌        | 13/85 [09:46<54:20, 45.28s/it]

Val Loss: 1.0782 - Val Accuracy: 0.9312



Training:   0%|          | 0/120 [00:00<?, ?it/s][A
Training:   1%|          | 1/120 [00:01<03:15,  1.64s/it][A
Training:   2%|▎         | 3/120 [00:01<00:54,  2.14it/s][A
Training:   4%|▍         | 5/120 [00:03<01:04,  1.77it/s][A
Training:   8%|▊         | 9/120 [00:04<00:47,  2.34it/s][A
Training:  11%|█         | 13/120 [00:05<00:40,  2.64it/s][A
Training:  14%|█▍        | 17/120 [00:06<00:36,  2.82it/s][A
Training:  18%|█▊        | 21/120 [00:08<00:34,  2.91it/s][A
Training:  21%|██        | 25/120 [00:09<00:32,  2.96it/s][A
Training:  23%|██▎       | 28/120 [00:09<00:23,  3.87it/s][A
Training:  25%|██▌       | 30/120 [00:10<00:30,  2.97it/s][A
Training:  28%|██▊       | 33/120 [00:12<00:31,  2.79it/s][A
Training:  29%|██▉       | 35/120 [00:12<00:24,  3.42it/s][A
Training:  31%|███       | 37/120 [00:13<00:30,  2.76it/s][A
Training:  32%|███▎      | 39/120 [00:13<00:23,  3.50it/s][A
Training:  34%|███▍      | 41/120 [00:14<00:29,  2.67it/s][A
Training:  38%|███▊ 

Epoch: 14/85 - Loss: 1.0453 - Accuracy: 0.9366



  0%|          | 0/15 [00:00<?, ?it/s][A
  7%|▋         | 1/15 [00:01<00:20,  1.45s/it][A
 27%|██▋       | 4/15 [00:01<00:03,  3.30it/s][A
 40%|████      | 6/15 [00:02<00:03,  2.41it/s][A
 60%|██████    | 9/15 [00:03<00:02,  2.48it/s][A
 80%|████████  | 12/15 [00:03<00:00,  3.95it/s][A
100%|██████████| 15/15 [00:05<00:00,  2.94it/s][A
Epochs:  16%|█▋        | 14/85 [10:31<53:30, 45.21s/it]

Val Loss: 1.0340 - Val Accuracy: 0.9330



Training:   0%|          | 0/120 [00:00<?, ?it/s][A
Training:   1%|          | 1/120 [00:01<03:18,  1.67s/it][A
Training:   4%|▍         | 5/120 [00:02<01:00,  1.90it/s][A
Training:   7%|▋         | 8/120 [00:03<00:32,  3.43it/s][A
Training:   8%|▊         | 10/120 [00:04<00:42,  2.58it/s][A
Training:  11%|█         | 13/120 [00:05<00:43,  2.46it/s][A
Training:  14%|█▍        | 17/120 [00:06<00:38,  2.66it/s][A
Training:  17%|█▋        | 20/120 [00:07<00:26,  3.73it/s][A
Training:  18%|█▊        | 22/120 [00:08<00:34,  2.82it/s][A
Training:  21%|██        | 25/120 [00:09<00:36,  2.64it/s][A
Training:  23%|██▎       | 28/120 [00:09<00:24,  3.71it/s][A
Training:  25%|██▌       | 30/120 [00:10<00:31,  2.86it/s][A
Training:  28%|██▊       | 33/120 [00:12<00:32,  2.69it/s][A
Training:  31%|███       | 37/120 [00:13<00:29,  2.77it/s][A
Training:  34%|███▍      | 41/120 [00:14<00:27,  2.84it/s][A
Training:  37%|███▋      | 44/120 [00:15<00:20,  3.79it/s][A
Training:  38%|███▊

Epoch: 15/85 - Loss: 1.0288 - Accuracy: 0.9353



  0%|          | 0/15 [00:00<?, ?it/s][A
  7%|▋         | 1/15 [00:01<00:21,  1.51s/it][A
 33%|███▎      | 5/15 [00:02<00:04,  2.08it/s][A
 60%|██████    | 9/15 [00:03<00:02,  2.65it/s][A
100%|██████████| 15/15 [00:05<00:00,  2.94it/s][A
Epochs:  18%|█▊        | 15/85 [11:17<52:46, 45.24s/it]

Val Loss: 1.0549 - Val Accuracy: 0.9314



Training:   0%|          | 0/120 [00:00<?, ?it/s][A
Training:   1%|          | 1/120 [00:01<03:14,  1.64s/it][A
Training:   3%|▎         | 4/120 [00:01<00:39,  2.97it/s][A
Training:   5%|▌         | 6/120 [00:02<00:52,  2.19it/s][A
Training:   8%|▊         | 9/120 [00:04<00:49,  2.22it/s][A
Training:  11%|█         | 13/120 [00:05<00:42,  2.49it/s][A
Training:  14%|█▍        | 17/120 [00:06<00:37,  2.73it/s][A
Training:  18%|█▊        | 21/120 [00:08<00:34,  2.85it/s][A
Training:  21%|██        | 25/120 [00:09<00:33,  2.85it/s][A
Training:  24%|██▍       | 29/120 [00:11<00:31,  2.85it/s][A
Training:  28%|██▊       | 33/120 [00:12<00:30,  2.89it/s][A
Training:  31%|███       | 37/120 [00:13<00:28,  2.94it/s][A
Training:  33%|███▎      | 40/120 [00:13<00:21,  3.80it/s][A
Training:  35%|███▌      | 42/120 [00:15<00:25,  3.04it/s][A
Training:  38%|███▊      | 45/120 [00:16<00:26,  2.78it/s][A
Training:  41%|████      | 49/120 [00:17<00:25,  2.84it/s][A
Training:  44%|████▍

Epoch: 16/85 - Loss: 1.0324 - Accuracy: 0.9335



  0%|          | 0/15 [00:00<?, ?it/s][A
  7%|▋         | 1/15 [00:01<00:20,  1.49s/it][A
 33%|███▎      | 5/15 [00:02<00:04,  2.19it/s][A
 60%|██████    | 9/15 [00:03<00:02,  2.71it/s][A
100%|██████████| 15/15 [00:05<00:00,  2.97it/s][A
Epochs:  19%|█▉        | 16/85 [12:02<52:04, 45.28s/it]

Val Loss: 1.0583 - Val Accuracy: 0.9313



Training:   0%|          | 0/120 [00:00<?, ?it/s][A
Training:   1%|          | 1/120 [00:01<03:19,  1.67s/it][A
Training:   4%|▍         | 5/120 [00:03<01:01,  1.86it/s][A
Training:   8%|▊         | 9/120 [00:04<00:47,  2.33it/s][A
Training:  11%|█         | 13/120 [00:05<00:41,  2.61it/s][A
Training:  14%|█▍        | 17/120 [00:06<00:36,  2.79it/s][A
Training:  17%|█▋        | 20/120 [00:07<00:26,  3.80it/s][A
Training:  18%|█▊        | 22/120 [00:08<00:34,  2.88it/s][A
Training:  21%|██        | 25/120 [00:09<00:35,  2.65it/s][A
Training:  24%|██▍       | 29/120 [00:11<00:32,  2.77it/s][A
Training:  28%|██▊       | 33/120 [00:12<00:29,  2.91it/s][A
Training:  30%|███       | 36/120 [00:12<00:21,  3.85it/s][A
Training:  32%|███▏      | 38/120 [00:13<00:27,  3.03it/s][A
Training:  34%|███▍      | 41/120 [00:14<00:28,  2.77it/s][A
Training:  38%|███▊      | 45/120 [00:16<00:26,  2.83it/s][A
Training:  41%|████      | 49/120 [00:17<00:24,  2.89it/s][A
Training:  44%|████

Epoch: 17/85 - Loss: 1.0189 - Accuracy: 0.9367



  0%|          | 0/15 [00:00<?, ?it/s][A
  7%|▋         | 1/15 [00:01<00:20,  1.46s/it][A
 33%|███▎      | 5/15 [00:02<00:04,  2.14it/s][A
 60%|██████    | 9/15 [00:03<00:02,  2.64it/s][A
100%|██████████| 15/15 [00:05<00:00,  2.94it/s][A
Epochs:  20%|██        | 17/85 [12:47<51:19, 45.28s/it]

Val Loss: 1.0587 - Val Accuracy: 0.9324



Training:   0%|          | 0/120 [00:00<?, ?it/s][A
Training:   1%|          | 1/120 [00:01<03:16,  1.65s/it][A
Training:   3%|▎         | 4/120 [00:01<00:39,  2.93it/s][A
Training:   5%|▌         | 6/120 [00:03<00:52,  2.15it/s][A
Training:   8%|▊         | 9/120 [00:04<00:47,  2.35it/s][A
Training:   9%|▉         | 11/120 [00:04<00:33,  3.22it/s][A
Training:  11%|█         | 13/120 [00:05<00:43,  2.48it/s][A
Training:  12%|█▏        | 14/120 [00:05<00:37,  2.86it/s][A
Training:  14%|█▍        | 17/120 [00:06<00:39,  2.64it/s][A
Training:  16%|█▌        | 19/120 [00:06<00:28,  3.49it/s][A
Training:  18%|█▊        | 21/120 [00:08<00:37,  2.63it/s][A
Training:  19%|█▉        | 23/120 [00:08<00:27,  3.50it/s][A
Training:  21%|██        | 25/120 [00:09<00:35,  2.70it/s][A
Training:  22%|██▏       | 26/120 [00:09<00:31,  3.00it/s][A
Training:  24%|██▍       | 29/120 [00:10<00:32,  2.82it/s][A
Training:  25%|██▌       | 30/120 [00:10<00:28,  3.14it/s][A
Training:  28%|██▊  

Epoch: 18/85 - Loss: 1.0274 - Accuracy: 0.9355



  0%|          | 0/15 [00:00<?, ?it/s][A
  7%|▋         | 1/15 [00:01<00:20,  1.48s/it][A
 33%|███▎      | 5/15 [00:02<00:04,  2.07it/s][A
 60%|██████    | 9/15 [00:03<00:02,  2.68it/s][A
100%|██████████| 15/15 [00:05<00:00,  2.97it/s][A
Epochs:  21%|██        | 18/85 [13:32<50:29, 45.22s/it]

Val Loss: 1.1124 - Val Accuracy: 0.9353



Training:   0%|          | 0/120 [00:00<?, ?it/s][A
Training:   1%|          | 1/120 [00:01<03:10,  1.60s/it][A
Training:   3%|▎         | 4/120 [00:01<00:38,  3.03it/s][A
Training:   5%|▌         | 6/120 [00:02<00:51,  2.19it/s][A
Training:   8%|▊         | 9/120 [00:04<00:49,  2.23it/s][A
Training:  11%|█         | 13/120 [00:05<00:41,  2.55it/s][A
Training:  13%|█▎        | 16/120 [00:05<00:28,  3.68it/s][A
Training:  15%|█▌        | 18/120 [00:06<00:36,  2.78it/s][A
Training:  18%|█▊        | 21/120 [00:08<00:37,  2.62it/s][A
Training:  21%|██        | 25/120 [00:09<00:34,  2.77it/s][A
Training:  24%|██▍       | 29/120 [00:10<00:32,  2.83it/s][A
Training:  28%|██▊       | 33/120 [00:12<00:30,  2.89it/s][A
Training:  31%|███       | 37/120 [00:13<00:28,  2.94it/s][A
Training:  34%|███▍      | 41/120 [00:14<00:26,  3.00it/s][A
Training:  38%|███▊      | 45/120 [00:16<00:24,  3.01it/s][A
Training:  40%|████      | 48/120 [00:16<00:18,  3.88it/s][A
Training:  42%|████▏

Epoch: 19/85 - Loss: 0.9759 - Accuracy: 0.9369



  0%|          | 0/15 [00:00<?, ?it/s][A
  7%|▋         | 1/15 [00:01<00:21,  1.51s/it][A
 33%|███▎      | 5/15 [00:02<00:04,  2.16it/s][A
 60%|██████    | 9/15 [00:03<00:02,  2.72it/s][A
100%|██████████| 15/15 [00:05<00:00,  2.97it/s][A
Epochs:  21%|██        | 18/85 [14:18<53:14, 47.68s/it]
[32m[I 2023-12-15 04:53:17,614][0m Trial 15 pruned. [0m


Val Loss: 1.0703 - Val Accuracy: 0.9312
Learning rate: 1.1378392517976528e-05
Weight decay: 0.0028178470992172165
Epsilon: 6.893632083019577e-09
Batch size: 75
Number of epochs: 36


Epochs:   0%|          | 0/36 [00:00<?, ?it/s]
Training:   0%|          | 0/187 [00:00<?, ?it/s][A
Training:   1%|          | 1/187 [00:01<03:36,  1.17s/it][A
Training:   3%|▎         | 5/187 [00:01<01:03,  2.88it/s][A
Training:   5%|▍         | 9/187 [00:02<00:49,  3.61it/s][A
Training:   7%|▋         | 13/187 [00:03<00:42,  4.05it/s][A
Training:   9%|▉         | 17/187 [00:04<00:40,  4.23it/s][A
Training:  11%|█         | 21/187 [00:05<00:36,  4.51it/s][A
Training:  13%|█▎        | 25/187 [00:06<00:35,  4.54it/s][A
Training:  16%|█▌        | 29/187 [00:07<00:34,  4.59it/s][A
Training:  18%|█▊        | 33/187 [00:07<00:33,  4.63it/s][A
Training:  20%|█▉        | 37/187 [00:08<00:32,  4.61it/s][A
Training:  22%|██▏       | 41/187 [00:09<00:31,  4.64it/s][A
Training:  24%|██▍       | 45/187 [00:10<00:30,  4.63it/s][A
Training:  26%|██▌       | 49/187 [00:11<00:29,  4.68it/s][A
Training:  28%|██▊       | 53/187 [00:12<00:28,  4.67it/s][A
Training:  29%|██▉       | 54/187 [

Epoch: 1/36 - Loss: 7.7978 - Accuracy: 0.5601



  0%|          | 0/24 [00:00<?, ?it/s][A
  4%|▍         | 1/24 [00:01<00:24,  1.07s/it][A
 21%|██        | 5/24 [00:01<00:05,  3.26it/s][A
 38%|███▊      | 9/24 [00:02<00:03,  4.12it/s][A
 54%|█████▍    | 13/24 [00:03<00:02,  4.60it/s][A
 71%|███████   | 17/24 [00:04<00:01,  4.78it/s][A
100%|██████████| 24/24 [00:04<00:00,  4.90it/s][A
Epochs:   0%|          | 0/36 [00:45<?, ?it/s]
[32m[I 2023-12-15 04:54:03,113][0m Trial 16 pruned. [0m


Val Loss: 6.3883 - Val Accuracy: 0.6019
Learning rate: 7.956120865746836e-05
Weight decay: 0.009533171835060042
Epsilon: 1.7418908039386952e-08
Batch size: 254
Number of epochs: 63


Epochs:   0%|          | 0/63 [00:00<?, ?it/s]
Training:   0%|          | 0/56 [00:00<?, ?it/s][A
Training:   2%|▏         | 1/56 [00:03<02:55,  3.19s/it][A
Training:   5%|▌         | 3/56 [00:03<00:46,  1.14it/s][A
Training:   9%|▉         | 5/56 [00:06<00:58,  1.14s/it][A
Training:  12%|█▎        | 7/56 [00:06<00:33,  1.46it/s][A
Training:  16%|█▌        | 9/56 [00:09<00:44,  1.05it/s][A
Training:  20%|█▉        | 11/56 [00:09<00:28,  1.56it/s][A
Training:  23%|██▎       | 13/56 [00:11<00:37,  1.15it/s][A
Training:  27%|██▋       | 15/56 [00:11<00:24,  1.65it/s][A
Training:  30%|███       | 17/56 [00:14<00:33,  1.17it/s][A
Training:  34%|███▍      | 19/56 [00:14<00:22,  1.65it/s][A
Training:  38%|███▊      | 21/56 [00:17<00:29,  1.18it/s][A
Training:  41%|████      | 23/56 [00:17<00:20,  1.65it/s][A
Training:  45%|████▍     | 25/56 [00:20<00:25,  1.21it/s][A
Training:  48%|████▊     | 27/56 [00:20<00:17,  1.68it/s][A
Training:  52%|█████▏    | 29/56 [00:23<00:22,  1.20

Epoch: 1/63 - Loss: 6.2949 - Accuracy: 0.6886



  0%|          | 0/7 [00:00<?, ?it/s][A
 14%|█▍        | 1/7 [00:02<00:17,  2.89s/it][A
 43%|████▎     | 3/7 [00:03<00:03,  1.26it/s][A
100%|██████████| 7/7 [00:05<00:00,  1.27it/s][A
Epochs:   0%|          | 0/63 [00:46<?, ?it/s]
[32m[I 2023-12-15 04:54:49,501][0m Trial 17 pruned. [0m


Val Loss: 4.7690 - Val Accuracy: 0.7708
Learning rate: 0.001500408021994709
Weight decay: 0.0005897407305513715
Epsilon: 3.127923040073714e-09
Batch size: 145
Number of epochs: 23


Epochs:   0%|          | 0/23 [00:00<?, ?it/s]
Training:   0%|          | 0/97 [00:00<?, ?it/s][A
Training:   1%|          | 1/97 [00:01<03:03,  1.91s/it][A
Training:   4%|▍         | 4/97 [00:02<00:36,  2.53it/s][A
Training:   6%|▌         | 6/97 [00:03<00:51,  1.78it/s][A
Training:   9%|▉         | 9/97 [00:05<00:48,  1.83it/s][A
Training:  12%|█▏        | 12/97 [00:05<00:28,  2.96it/s][A
Training:  14%|█▍        | 14/97 [00:06<00:38,  2.17it/s][A
Training:  18%|█▊        | 17/97 [00:08<00:39,  2.04it/s][A
Training:  21%|██        | 20/97 [00:08<00:25,  3.02it/s][A
Training:  23%|██▎       | 22/97 [00:10<00:33,  2.26it/s][A
Training:  26%|██▌       | 25/97 [00:11<00:34,  2.12it/s][A
Training:  29%|██▉       | 28/97 [00:11<00:22,  3.05it/s][A
Training:  31%|███       | 30/97 [00:13<00:29,  2.30it/s][A
Training:  34%|███▍      | 33/97 [00:14<00:29,  2.15it/s][A
Training:  37%|███▋      | 36/97 [00:15<00:19,  3.07it/s][A
Training:  39%|███▉      | 38/97 [00:16<00:25,  2.3

Epoch: 1/23 - Loss: 3.1386 - Accuracy: 0.8686



  0%|          | 0/13 [00:00<?, ?it/s][A
  8%|▊         | 1/13 [00:01<00:21,  1.76s/it][A
 31%|███       | 4/13 [00:01<00:03,  2.76it/s][A
 46%|████▌     | 6/13 [00:03<00:03,  1.95it/s][A
 69%|██████▉   | 9/13 [00:04<00:02,  2.00it/s][A
100%|██████████| 13/13 [00:04<00:00,  2.64it/s][A
Epochs:   4%|▍         | 1/23 [00:45<16:33, 45.17s/it]

Val Loss: 2.3339 - Val Accuracy: 0.9337



Training:   0%|          | 0/97 [00:00<?, ?it/s][A
Training:   1%|          | 1/97 [00:02<03:12,  2.01s/it][A
Training:   4%|▍         | 4/97 [00:02<00:38,  2.44it/s][A
Training:   6%|▌         | 6/97 [00:03<00:52,  1.74it/s][A
Training:   9%|▉         | 9/97 [00:05<00:48,  1.81it/s][A
Training:  12%|█▏        | 12/97 [00:05<00:29,  2.91it/s][A
Training:  14%|█▍        | 14/97 [00:06<00:38,  2.16it/s][A
Training:  18%|█▊        | 17/97 [00:08<00:39,  2.04it/s][A
Training:  21%|██        | 20/97 [00:08<00:25,  3.02it/s][A
Training:  23%|██▎       | 22/97 [00:10<00:32,  2.28it/s][A
Training:  26%|██▌       | 25/97 [00:11<00:33,  2.13it/s][A
Training:  29%|██▉       | 28/97 [00:11<00:22,  3.06it/s][A
Training:  31%|███       | 30/97 [00:13<00:29,  2.30it/s][A
Training:  34%|███▍      | 33/97 [00:15<00:29,  2.15it/s][A
Training:  36%|███▌      | 35/97 [00:15<00:22,  2.74it/s][A
Training:  38%|███▊      | 37/97 [00:16<00:27,  2.14it/s][A
Training:  41%|████      | 40/97 [00

Epoch: 2/23 - Loss: 2.0790 - Accuracy: 0.9184



  0%|          | 0/13 [00:00<?, ?it/s][A
  8%|▊         | 1/13 [00:01<00:21,  1.75s/it][A
 31%|███       | 4/13 [00:01<00:03,  2.78it/s][A
 46%|████▌     | 6/13 [00:03<00:03,  2.02it/s][A
 69%|██████▉   | 9/13 [00:04<00:01,  2.11it/s][A
100%|██████████| 13/13 [00:04<00:00,  2.75it/s][A
Epochs:   9%|▊         | 2/23 [01:30<15:45, 45.04s/it]

Val Loss: 1.9053 - Val Accuracy: 0.9077



Training:   0%|          | 0/97 [00:00<?, ?it/s][A
Training:   1%|          | 1/97 [00:01<03:04,  1.92s/it][A
Training:   4%|▍         | 4/97 [00:02<00:36,  2.54it/s][A
Training:   6%|▌         | 6/97 [00:03<00:51,  1.77it/s][A
Training:   9%|▉         | 9/97 [00:05<00:48,  1.82it/s][A
Training:  12%|█▏        | 12/97 [00:05<00:29,  2.93it/s][A
Training:  14%|█▍        | 14/97 [00:06<00:39,  2.12it/s][A
Training:  18%|█▊        | 17/97 [00:08<00:39,  2.02it/s][A
Training:  21%|██        | 20/97 [00:08<00:25,  2.98it/s][A
Training:  23%|██▎       | 22/97 [00:10<00:33,  2.23it/s][A
Training:  26%|██▌       | 25/97 [00:11<00:34,  2.08it/s][A
Training:  29%|██▉       | 28/97 [00:11<00:23,  2.99it/s][A
Training:  31%|███       | 30/97 [00:13<00:29,  2.26it/s][A
Training:  34%|███▍      | 33/97 [00:15<00:30,  2.12it/s][A
Training:  37%|███▋      | 36/97 [00:15<00:20,  3.04it/s][A
Training:  39%|███▉      | 38/97 [00:16<00:25,  2.29it/s][A
Training:  42%|████▏     | 41/97 [00

Epoch: 3/23 - Loss: 1.8879 - Accuracy: 0.9236



  0%|          | 0/13 [00:00<?, ?it/s][A
  8%|▊         | 1/13 [00:01<00:21,  1.82s/it][A
 31%|███       | 4/13 [00:01<00:03,  2.67it/s][A
 46%|████▌     | 6/13 [00:03<00:03,  1.98it/s][A
 69%|██████▉   | 9/13 [00:04<00:01,  2.03it/s][A
100%|██████████| 13/13 [00:04<00:00,  2.65it/s][A
Epochs:  13%|█▎        | 3/23 [02:15<15:04, 45.23s/it]

Val Loss: 1.9387 - Val Accuracy: 0.9369



Training:   0%|          | 0/97 [00:00<?, ?it/s][A
Training:   1%|          | 1/97 [00:01<03:09,  1.98s/it][A
Training:   4%|▍         | 4/97 [00:02<00:37,  2.45it/s][A
Training:   6%|▌         | 6/97 [00:03<00:50,  1.79it/s][A
Training:   9%|▉         | 9/97 [00:05<00:47,  1.84it/s][A
Training:  12%|█▏        | 12/97 [00:05<00:28,  2.96it/s][A
Training:  14%|█▍        | 14/97 [00:06<00:38,  2.16it/s][A
Training:  18%|█▊        | 17/97 [00:08<00:38,  2.06it/s][A
Training:  21%|██        | 20/97 [00:08<00:25,  3.03it/s][A
Training:  23%|██▎       | 22/97 [00:10<00:33,  2.26it/s][A
Training:  26%|██▌       | 25/97 [00:11<00:34,  2.10it/s][A
Training:  29%|██▉       | 28/97 [00:11<00:22,  3.03it/s][A
Training:  31%|███       | 30/97 [00:13<00:29,  2.29it/s][A
Training:  34%|███▍      | 33/97 [00:14<00:29,  2.13it/s][A
Training:  36%|███▌      | 35/97 [00:15<00:22,  2.70it/s][A
Training:  38%|███▊      | 37/97 [00:16<00:28,  2.11it/s][A
Training:  40%|████      | 39/97 [00

Epoch: 4/23 - Loss: 1.8311 - Accuracy: 0.9248



  0%|          | 0/13 [00:00<?, ?it/s][A
  8%|▊         | 1/13 [00:01<00:21,  1.77s/it][A
 38%|███▊      | 5/13 [00:03<00:04,  1.70it/s][A
 69%|██████▉   | 9/13 [00:04<00:01,  2.16it/s][A
100%|██████████| 13/13 [00:04<00:00,  2.65it/s][A
Epochs:  17%|█▋        | 4/23 [03:00<14:18, 45.20s/it]

Val Loss: 1.8277 - Val Accuracy: 0.9088



Training:   0%|          | 0/97 [00:00<?, ?it/s][A
Training:   1%|          | 1/97 [00:01<03:06,  1.94s/it][A
Training:   4%|▍         | 4/97 [00:02<00:37,  2.51it/s][A
Training:   6%|▌         | 6/97 [00:03<00:51,  1.78it/s][A
Training:   9%|▉         | 9/97 [00:05<00:48,  1.82it/s][A
Training:  12%|█▏        | 12/97 [00:05<00:28,  2.94it/s][A
Training:  14%|█▍        | 14/97 [00:06<00:38,  2.14it/s][A
Training:  18%|█▊        | 17/97 [00:08<00:39,  2.02it/s][A
Training:  21%|██        | 20/97 [00:08<00:25,  2.98it/s][A
Training:  23%|██▎       | 22/97 [00:10<00:33,  2.24it/s][A
Training:  26%|██▌       | 25/97 [00:11<00:34,  2.10it/s][A
Training:  30%|██▉       | 29/97 [00:13<00:30,  2.22it/s][A
Training:  33%|███▎      | 32/97 [00:13<00:21,  3.07it/s][A
Training:  35%|███▌      | 34/97 [00:15<00:26,  2.34it/s][A
Training:  38%|███▊      | 37/97 [00:16<00:27,  2.16it/s][A
Training:  42%|████▏     | 41/97 [00:18<00:24,  2.25it/s][A
Training:  45%|████▌     | 44/97 [00

Epoch: 5/23 - Loss: 1.7532 - Accuracy: 0.9260



  0%|          | 0/13 [00:00<?, ?it/s][A
  8%|▊         | 1/13 [00:01<00:21,  1.76s/it][A
 31%|███       | 4/13 [00:01<00:03,  2.75it/s][A
 46%|████▌     | 6/13 [00:03<00:03,  2.01it/s][A
 69%|██████▉   | 9/13 [00:04<00:01,  2.11it/s][A
100%|██████████| 13/13 [00:04<00:00,  2.73it/s][A
Epochs:  22%|██▏       | 5/23 [03:46<13:34, 45.25s/it]

Val Loss: 1.6812 - Val Accuracy: 0.9390



Training:   0%|          | 0/97 [00:00<?, ?it/s][A
Training:   1%|          | 1/97 [00:01<03:11,  1.99s/it][A
Training:   4%|▍         | 4/97 [00:02<00:38,  2.42it/s][A
Training:   6%|▌         | 6/97 [00:03<00:53,  1.71it/s][A
Training:   9%|▉         | 9/97 [00:05<00:49,  1.79it/s][A
Training:  12%|█▏        | 12/97 [00:05<00:29,  2.88it/s][A
Training:  14%|█▍        | 14/97 [00:07<00:39,  2.13it/s][A
Training:  18%|█▊        | 17/97 [00:08<00:39,  2.03it/s][A
Training:  21%|██        | 20/97 [00:08<00:25,  2.99it/s][A
Training:  23%|██▎       | 22/97 [00:10<00:33,  2.22it/s][A
Training:  26%|██▌       | 25/97 [00:11<00:34,  2.09it/s][A
Training:  29%|██▉       | 28/97 [00:12<00:23,  2.99it/s][A
Training:  31%|███       | 30/97 [00:13<00:29,  2.27it/s][A
Training:  34%|███▍      | 33/97 [00:15<00:30,  2.12it/s][A
Training:  37%|███▋      | 36/97 [00:15<00:20,  3.04it/s][A
Training:  39%|███▉      | 38/97 [00:16<00:25,  2.29it/s][A
Training:  42%|████▏     | 41/97 [00

Epoch: 6/23 - Loss: 1.8021 - Accuracy: 0.9293



  0%|          | 0/13 [00:00<?, ?it/s][A
  8%|▊         | 1/13 [00:01<00:21,  1.76s/it][A
 31%|███       | 4/13 [00:01<00:03,  2.73it/s][A
 46%|████▌     | 6/13 [00:03<00:03,  1.94it/s][A
 69%|██████▉   | 9/13 [00:04<00:01,  2.12it/s][A
100%|██████████| 13/13 [00:04<00:00,  2.69it/s][A
Epochs:  26%|██▌       | 6/23 [04:31<12:49, 45.26s/it]

Val Loss: 1.6058 - Val Accuracy: 0.9332



Training:   0%|          | 0/97 [00:00<?, ?it/s][A
Training:   1%|          | 1/97 [00:01<03:02,  1.90s/it][A
Training:   4%|▍         | 4/97 [00:02<00:36,  2.55it/s][A
Training:   6%|▌         | 6/97 [00:03<00:51,  1.77it/s][A
Training:   9%|▉         | 9/97 [00:05<00:48,  1.82it/s][A
Training:  12%|█▏        | 12/97 [00:05<00:28,  2.94it/s][A
Training:  14%|█▍        | 14/97 [00:06<00:38,  2.16it/s][A
Training:  18%|█▊        | 17/97 [00:08<00:39,  2.02it/s][A
Training:  21%|██        | 20/97 [00:08<00:25,  2.99it/s][A
Training:  23%|██▎       | 22/97 [00:10<00:33,  2.24it/s][A
Training:  26%|██▌       | 25/97 [00:11<00:34,  2.09it/s][A
Training:  29%|██▉       | 28/97 [00:11<00:22,  3.02it/s][A
Training:  31%|███       | 30/97 [00:13<00:29,  2.27it/s][A
Training:  34%|███▍      | 33/97 [00:15<00:29,  2.14it/s][A
Training:  37%|███▋      | 36/97 [00:15<00:19,  3.06it/s][A
Training:  39%|███▉      | 38/97 [00:16<00:25,  2.30it/s][A
Training:  42%|████▏     | 41/97 [00

Epoch: 7/23 - Loss: 1.8104 - Accuracy: 0.9304



  0%|          | 0/13 [00:00<?, ?it/s][A
  8%|▊         | 1/13 [00:01<00:21,  1.76s/it][A
 31%|███       | 4/13 [00:01<00:03,  2.75it/s][A
 46%|████▌     | 6/13 [00:03<00:03,  1.98it/s][A
 69%|██████▉   | 9/13 [00:04<00:01,  2.06it/s][A
100%|██████████| 13/13 [00:04<00:00,  2.70it/s][A
Epochs:  30%|███       | 7/23 [05:16<12:02, 45.18s/it]

Val Loss: 1.8504 - Val Accuracy: 0.9379



Training:   0%|          | 0/97 [00:00<?, ?it/s][A
Training:   1%|          | 1/97 [00:01<03:11,  1.99s/it][A
Training:   4%|▍         | 4/97 [00:02<00:37,  2.47it/s][A
Training:   6%|▌         | 6/97 [00:03<00:53,  1.72it/s][A
Training:   9%|▉         | 9/97 [00:05<00:49,  1.79it/s][A
Training:  13%|█▎        | 13/97 [00:06<00:40,  2.08it/s][A
Training:  16%|█▋        | 16/97 [00:07<00:26,  3.04it/s][A
Training:  19%|█▊        | 18/97 [00:08<00:34,  2.27it/s][A
Training:  22%|██▏       | 21/97 [00:10<00:35,  2.13it/s][A
Training:  25%|██▍       | 24/97 [00:10<00:23,  3.06it/s][A
Training:  27%|██▋       | 26/97 [00:11<00:31,  2.28it/s][A
Training:  30%|██▉       | 29/97 [00:13<00:32,  2.12it/s][A
Training:  33%|███▎      | 32/97 [00:13<00:21,  3.03it/s][A
Training:  35%|███▌      | 34/97 [00:15<00:27,  2.29it/s][A
Training:  38%|███▊      | 37/97 [00:16<00:28,  2.12it/s][A
Training:  41%|████      | 40/97 [00:16<00:18,  3.03it/s][A
Training:  43%|████▎     | 42/97 [00

Epoch: 8/23 - Loss: 1.7075 - Accuracy: 0.9318



  0%|          | 0/13 [00:00<?, ?it/s][A
  8%|▊         | 1/13 [00:01<00:21,  1.78s/it][A
 31%|███       | 4/13 [00:01<00:03,  2.72it/s][A
 46%|████▌     | 6/13 [00:03<00:03,  1.99it/s][A
 69%|██████▉   | 9/13 [00:04<00:01,  2.07it/s][A
100%|██████████| 13/13 [00:04<00:00,  2.69it/s][A
Epochs:  35%|███▍      | 8/23 [06:01<11:18, 45.23s/it]

Val Loss: 1.9398 - Val Accuracy: 0.9236



Training:   0%|          | 0/97 [00:00<?, ?it/s][A
Training:   1%|          | 1/97 [00:01<03:06,  1.94s/it][A
Training:   4%|▍         | 4/97 [00:02<00:36,  2.52it/s][A
Training:   6%|▌         | 6/97 [00:03<00:51,  1.77it/s][A
Training:   9%|▉         | 9/97 [00:05<00:48,  1.81it/s][A
Training:  12%|█▏        | 12/97 [00:05<00:29,  2.93it/s][A
Training:  14%|█▍        | 14/97 [00:06<00:38,  2.13it/s][A
Training:  18%|█▊        | 17/97 [00:08<00:39,  2.04it/s][A
Training:  21%|██        | 20/97 [00:08<00:25,  3.01it/s][A
Training:  23%|██▎       | 22/97 [00:10<00:33,  2.26it/s][A
Training:  26%|██▌       | 25/97 [00:11<00:34,  2.07it/s][A
Training:  29%|██▉       | 28/97 [00:11<00:23,  3.00it/s][A
Training:  31%|███       | 30/97 [00:13<00:29,  2.28it/s][A
Training:  34%|███▍      | 33/97 [00:15<00:29,  2.14it/s][A
Training:  37%|███▋      | 36/97 [00:15<00:19,  3.05it/s][A
Training:  39%|███▉      | 38/97 [00:16<00:25,  2.31it/s][A
Training:  42%|████▏     | 41/97 [00

Epoch: 9/23 - Loss: 1.8707 - Accuracy: 0.9253



  0%|          | 0/13 [00:00<?, ?it/s][A
  8%|▊         | 1/13 [00:01<00:21,  1.79s/it][A
 38%|███▊      | 5/13 [00:03<00:04,  1.73it/s][A
 69%|██████▉   | 9/13 [00:04<00:01,  2.18it/s][A
100%|██████████| 13/13 [00:04<00:00,  2.67it/s][A
Epochs:  39%|███▉      | 9/23 [06:46<10:32, 45.18s/it]

Val Loss: 1.8235 - Val Accuracy: 0.9072



Training:   0%|          | 0/97 [00:00<?, ?it/s][A
Training:   1%|          | 1/97 [00:01<03:11,  1.99s/it][A
Training:   4%|▍         | 4/97 [00:02<00:38,  2.43it/s][A
Training:   6%|▌         | 6/97 [00:03<00:51,  1.77it/s][A
Training:   9%|▉         | 9/97 [00:05<00:48,  1.83it/s][A
Training:  12%|█▏        | 12/97 [00:05<00:28,  2.94it/s][A
Training:  14%|█▍        | 14/97 [00:06<00:38,  2.16it/s][A
Training:  18%|█▊        | 17/97 [00:08<00:39,  2.04it/s][A
Training:  21%|██        | 20/97 [00:08<00:25,  3.00it/s][A
Training:  23%|██▎       | 22/97 [00:10<00:33,  2.22it/s][A
Training:  26%|██▌       | 25/97 [00:11<00:34,  2.08it/s][A
Training:  28%|██▊       | 27/97 [00:11<00:26,  2.68it/s][A
Training:  30%|██▉       | 29/97 [00:13<00:32,  2.11it/s][A
Training:  33%|███▎      | 32/97 [00:13<00:20,  3.14it/s][A
Training:  35%|███▌      | 34/97 [00:15<00:27,  2.28it/s][A
Training:  38%|███▊      | 37/97 [00:16<00:28,  2.10it/s][A
Training:  41%|████      | 40/97 [00

Epoch: 10/23 - Loss: 1.8306 - Accuracy: 0.9291



  0%|          | 0/13 [00:00<?, ?it/s][A
  8%|▊         | 1/13 [00:01<00:21,  1.77s/it][A
 38%|███▊      | 5/13 [00:03<00:04,  1.73it/s][A
100%|██████████| 13/13 [00:04<00:00,  2.68it/s][A
Epochs:  43%|████▎     | 10/23 [07:32<09:48, 45.24s/it]

Val Loss: 1.9421 - Val Accuracy: 0.9247



Training:   0%|          | 0/97 [00:00<?, ?it/s][A
Training:   1%|          | 1/97 [00:01<03:05,  1.94s/it][A
Training:   4%|▍         | 4/97 [00:02<00:37,  2.50it/s][A
Training:   6%|▌         | 6/97 [00:03<00:54,  1.67it/s][A
Training:   9%|▉         | 9/97 [00:05<00:49,  1.76it/s][A
Training:  12%|█▏        | 12/97 [00:05<00:29,  2.84it/s][A
Training:  14%|█▍        | 14/97 [00:07<00:39,  2.12it/s][A
Training:  18%|█▊        | 17/97 [00:08<00:39,  2.03it/s][A
Training:  20%|█▉        | 19/97 [00:08<00:29,  2.64it/s][A
Training:  22%|██▏       | 21/97 [00:10<00:36,  2.08it/s][A
Training:  24%|██▎       | 23/97 [00:10<00:26,  2.75it/s][A
Training:  26%|██▌       | 25/97 [00:11<00:33,  2.12it/s][A
Training:  27%|██▋       | 26/97 [00:11<00:28,  2.45it/s][A
Training:  30%|██▉       | 29/97 [00:13<00:31,  2.19it/s][A
Training:  33%|███▎      | 32/97 [00:13<00:19,  3.31it/s][A
Training:  35%|███▌      | 34/97 [00:15<00:27,  2.31it/s][A
Training:  38%|███▊      | 37/97 [00

Epoch: 11/23 - Loss: 1.9612 - Accuracy: 0.9289



  0%|          | 0/13 [00:00<?, ?it/s][A
  8%|▊         | 1/13 [00:01<00:21,  1.81s/it][A
 23%|██▎       | 3/13 [00:01<00:05,  1.95it/s][A
 38%|███▊      | 5/13 [00:03<00:04,  1.69it/s][A
 69%|██████▉   | 9/13 [00:04<00:01,  2.22it/s][A
100%|██████████| 13/13 [00:04<00:00,  2.67it/s][A
Epochs:  48%|████▊     | 11/23 [08:17<09:02, 45.19s/it]

Val Loss: 1.8132 - Val Accuracy: 0.9363



Training:   0%|          | 0/97 [00:00<?, ?it/s][A
Training:   1%|          | 1/97 [00:01<03:10,  1.99s/it][A
Training:   4%|▍         | 4/97 [00:02<00:37,  2.46it/s][A
Training:   6%|▌         | 6/97 [00:03<00:51,  1.77it/s][A
Training:   9%|▉         | 9/97 [00:05<00:48,  1.82it/s][A
Training:  12%|█▏        | 12/97 [00:05<00:28,  2.94it/s][A
Training:  14%|█▍        | 14/97 [00:06<00:38,  2.16it/s][A
Training:  18%|█▊        | 17/97 [00:08<00:39,  2.03it/s][A
Training:  21%|██        | 20/97 [00:08<00:25,  3.00it/s][A
Training:  23%|██▎       | 22/97 [00:10<00:33,  2.27it/s][A
Training:  26%|██▌       | 25/97 [00:11<00:34,  2.10it/s][A
Training:  29%|██▉       | 28/97 [00:11<00:22,  3.02it/s][A
Training:  31%|███       | 30/97 [00:13<00:29,  2.29it/s][A
Training:  34%|███▍      | 33/97 [00:15<00:30,  2.12it/s][A
Training:  37%|███▋      | 36/97 [00:15<00:20,  3.03it/s][A
Training:  39%|███▉      | 38/97 [00:16<00:25,  2.31it/s][A
Training:  42%|████▏     | 41/97 [00

Epoch: 12/23 - Loss: 1.7840 - Accuracy: 0.9389



  0%|          | 0/13 [00:00<?, ?it/s][A
  8%|▊         | 1/13 [00:01<00:21,  1.77s/it][A
 31%|███       | 4/13 [00:01<00:03,  2.74it/s][A
 46%|████▌     | 6/13 [00:03<00:03,  1.96it/s][A
 69%|██████▉   | 9/13 [00:04<00:01,  2.04it/s][A
100%|██████████| 13/13 [00:04<00:00,  2.67it/s][A
Epochs:  52%|█████▏    | 12/23 [09:02<08:16, 45.14s/it]

Val Loss: 2.0095 - Val Accuracy: 0.8912



Training:   0%|          | 0/97 [00:00<?, ?it/s][A
Training:   1%|          | 1/97 [00:01<03:02,  1.91s/it][A
Training:   4%|▍         | 4/97 [00:02<00:36,  2.54it/s][A
Training:   6%|▌         | 6/97 [00:03<00:51,  1.77it/s][A
Training:   9%|▉         | 9/97 [00:05<00:48,  1.80it/s][A
Training:  13%|█▎        | 13/97 [00:06<00:40,  2.06it/s][A
Training:  16%|█▋        | 16/97 [00:06<00:27,  3.00it/s][A
Training:  19%|█▊        | 18/97 [00:08<00:35,  2.25it/s][A
Training:  22%|██▏       | 21/97 [00:10<00:36,  2.11it/s][A
Training:  25%|██▍       | 24/97 [00:10<00:24,  3.04it/s][A
Training:  27%|██▋       | 26/97 [00:11<00:30,  2.30it/s][A
Training:  30%|██▉       | 29/97 [00:13<00:31,  2.13it/s][A
Training:  33%|███▎      | 32/97 [00:13<00:21,  3.04it/s][A
Training:  35%|███▌      | 34/97 [00:15<00:27,  2.28it/s][A
Training:  38%|███▊      | 37/97 [00:16<00:28,  2.14it/s][A
Training:  41%|████      | 40/97 [00:16<00:18,  3.05it/s][A
Training:  43%|████▎     | 42/97 [00

Epoch: 13/23 - Loss: 1.8951 - Accuracy: 0.9297



  0%|          | 0/13 [00:00<?, ?it/s][A
  8%|▊         | 1/13 [00:01<00:21,  1.75s/it][A
 31%|███       | 4/13 [00:01<00:03,  2.73it/s][A
 46%|████▌     | 6/13 [00:03<00:03,  1.98it/s][A
 69%|██████▉   | 9/13 [00:04<00:01,  2.05it/s][A
100%|██████████| 13/13 [00:04<00:00,  2.69it/s][A
Epochs:  57%|█████▋    | 13/23 [09:47<07:31, 45.16s/it]

Val Loss: 1.6582 - Val Accuracy: 0.9135



Training:   0%|          | 0/97 [00:00<?, ?it/s][A
Training:   1%|          | 1/97 [00:01<03:05,  1.93s/it][A
Training:   3%|▎         | 3/97 [00:02<00:51,  1.84it/s][A
Training:   5%|▌         | 5/97 [00:03<01:00,  1.51it/s][A
Training:   7%|▋         | 7/97 [00:03<00:36,  2.46it/s][A
Training:   9%|▉         | 9/97 [00:05<00:47,  1.85it/s][A
Training:  12%|█▏        | 12/97 [00:05<00:27,  3.15it/s][A
Training:  14%|█▍        | 14/97 [00:06<00:37,  2.21it/s][A
Training:  18%|█▊        | 17/97 [00:08<00:38,  2.07it/s][A
Training:  21%|██        | 20/97 [00:08<00:25,  3.08it/s][A
Training:  23%|██▎       | 22/97 [00:10<00:32,  2.33it/s][A
Training:  24%|██▎       | 23/97 [00:10<00:28,  2.57it/s][A
Training:  26%|██▌       | 25/97 [00:11<00:34,  2.07it/s][A
Training:  28%|██▊       | 27/97 [00:11<00:26,  2.68it/s][A
Training:  30%|██▉       | 29/97 [00:13<00:31,  2.15it/s][A
Training:  32%|███▏      | 31/97 [00:13<00:24,  2.71it/s][A
Training:  34%|███▍      | 33/97 [00:

Epoch: 14/23 - Loss: 1.8477 - Accuracy: 0.9334



  0%|          | 0/13 [00:00<?, ?it/s][A
  8%|▊         | 1/13 [00:01<00:21,  1.77s/it][A
 38%|███▊      | 5/13 [00:03<00:04,  1.74it/s][A
 69%|██████▉   | 9/13 [00:04<00:01,  2.23it/s][A
100%|██████████| 13/13 [00:04<00:00,  2.70it/s][A
Epochs:  61%|██████    | 14/23 [10:32<06:45, 45.08s/it]

Val Loss: 1.7911 - Val Accuracy: 0.9358



Training:   0%|          | 0/97 [00:00<?, ?it/s][A
Training:   1%|          | 1/97 [00:01<03:05,  1.93s/it][A
Training:   3%|▎         | 3/97 [00:02<00:50,  1.85it/s][A
Training:   5%|▌         | 5/97 [00:03<01:00,  1.53it/s][A
Training:   7%|▋         | 7/97 [00:03<00:36,  2.47it/s][A
Training:   9%|▉         | 9/97 [00:05<00:47,  1.87it/s][A
Training:  10%|█         | 10/97 [00:05<00:38,  2.24it/s][A
Training:  13%|█▎        | 13/97 [00:06<00:39,  2.10it/s][A
Training:  14%|█▍        | 14/97 [00:06<00:34,  2.44it/s][A
Training:  18%|█▊        | 17/97 [00:08<00:36,  2.18it/s][A
Training:  20%|█▉        | 19/97 [00:08<00:26,  2.93it/s][A
Training:  22%|██▏       | 21/97 [00:10<00:35,  2.14it/s][A
Training:  25%|██▍       | 24/97 [00:10<00:22,  3.30it/s][A
Training:  27%|██▋       | 26/97 [00:11<00:30,  2.30it/s][A
Training:  30%|██▉       | 29/97 [00:13<00:32,  2.12it/s][A
Training:  33%|███▎      | 32/97 [00:13<00:21,  3.09it/s][A
Training:  35%|███▌      | 34/97 [00:

Epoch: 15/23 - Loss: 1.9457 - Accuracy: 0.9338



  0%|          | 0/13 [00:00<?, ?it/s][A
  8%|▊         | 1/13 [00:01<00:21,  1.77s/it][A
 23%|██▎       | 3/13 [00:01<00:04,  2.01it/s][A
 38%|███▊      | 5/13 [00:03<00:04,  1.67it/s][A
 62%|██████▏   | 8/13 [00:03<00:01,  3.31it/s][A
100%|██████████| 13/13 [00:04<00:00,  2.64it/s][A
Epochs:  65%|██████▌   | 15/23 [11:17<06:01, 45.19s/it]

Val Loss: 1.6553 - Val Accuracy: 0.9390



Training:   0%|          | 0/97 [00:00<?, ?it/s][A
Training:   1%|          | 1/97 [00:02<03:14,  2.02s/it][A
Training:   4%|▍         | 4/97 [00:02<00:38,  2.40it/s][A
Training:   6%|▌         | 6/97 [00:03<00:50,  1.79it/s][A
Training:   9%|▉         | 9/97 [00:05<00:47,  1.85it/s][A
Training:  12%|█▏        | 12/97 [00:05<00:28,  2.96it/s][A
Training:  14%|█▍        | 14/97 [00:06<00:37,  2.20it/s][A
Training:  18%|█▊        | 17/97 [00:08<00:38,  2.10it/s][A
Training:  20%|█▉        | 19/97 [00:08<00:28,  2.72it/s][A
Training:  22%|██▏       | 21/97 [00:10<00:35,  2.12it/s][A
Training:  24%|██▎       | 23/97 [00:10<00:26,  2.78it/s][A
Training:  26%|██▌       | 25/97 [00:11<00:33,  2.15it/s][A
Training:  28%|██▊       | 27/97 [00:11<00:24,  2.83it/s][A
Training:  30%|██▉       | 29/97 [00:13<00:31,  2.18it/s][A
Training:  32%|███▏      | 31/97 [00:13<00:23,  2.83it/s][A
Training:  34%|███▍      | 33/97 [00:14<00:29,  2.16it/s][A
Training:  36%|███▌      | 35/97 [00

Epoch: 16/23 - Loss: 1.8320 - Accuracy: 0.9371



  0%|          | 0/13 [00:00<?, ?it/s][A
  8%|▊         | 1/13 [00:01<00:21,  1.79s/it][A
 31%|███       | 4/13 [00:01<00:03,  2.70it/s][A
 46%|████▌     | 6/13 [00:03<00:03,  1.92it/s][A
100%|██████████| 13/13 [00:04<00:00,  2.64it/s][A
Epochs:  70%|██████▉   | 16/23 [12:03<05:16, 45.24s/it]

Val Loss: 2.0373 - Val Accuracy: 0.9395



Training:   0%|          | 0/97 [00:00<?, ?it/s][A
Training:   1%|          | 1/97 [00:01<03:03,  1.91s/it][A
Training:   4%|▍         | 4/97 [00:02<00:36,  2.52it/s][A
Training:   6%|▌         | 6/97 [00:03<00:51,  1.77it/s][A
Training:   9%|▉         | 9/97 [00:05<00:48,  1.81it/s][A
Training:  12%|█▏        | 12/97 [00:05<00:29,  2.92it/s][A
Training:  14%|█▍        | 14/97 [00:06<00:39,  2.11it/s][A
Training:  18%|█▊        | 17/97 [00:08<00:39,  2.02it/s][A
Training:  21%|██        | 20/97 [00:08<00:25,  2.98it/s][A
Training:  23%|██▎       | 22/97 [00:10<00:33,  2.25it/s][A
Training:  26%|██▌       | 25/97 [00:11<00:33,  2.12it/s][A
Training:  29%|██▉       | 28/97 [00:11<00:22,  3.04it/s][A
Training:  31%|███       | 30/97 [00:13<00:29,  2.29it/s][A
Training:  33%|███▎      | 32/97 [00:13<00:22,  2.93it/s][A
Training:  35%|███▌      | 34/97 [00:15<00:28,  2.18it/s][A
Training:  37%|███▋      | 36/97 [00:15<00:21,  2.83it/s][A
Training:  38%|███▊      | 37/97 [00

Epoch: 17/23 - Loss: 1.8967 - Accuracy: 0.9357



  0%|          | 0/13 [00:00<?, ?it/s][A
  8%|▊         | 1/13 [00:01<00:21,  1.77s/it][A
 31%|███       | 4/13 [00:01<00:03,  2.75it/s][A
 46%|████▌     | 6/13 [00:03<00:03,  1.99it/s][A
 69%|██████▉   | 9/13 [00:04<00:01,  2.08it/s][A
100%|██████████| 13/13 [00:04<00:00,  2.71it/s][A
Epochs:  74%|███████▍  | 17/23 [12:48<04:31, 45.24s/it]

Val Loss: 1.6293 - Val Accuracy: 0.9427



Training:   0%|          | 0/97 [00:00<?, ?it/s][A
Training:   1%|          | 1/97 [00:01<03:07,  1.95s/it][A
Training:   4%|▍         | 4/97 [00:02<00:37,  2.49it/s][A
Training:   6%|▌         | 6/97 [00:03<00:51,  1.76it/s][A
Training:   9%|▉         | 9/97 [00:05<00:48,  1.83it/s][A
Training:  13%|█▎        | 13/97 [00:06<00:40,  2.08it/s][A
Training:  16%|█▋        | 16/97 [00:06<00:26,  3.04it/s][A
Training:  19%|█▊        | 18/97 [00:08<00:34,  2.28it/s][A
Training:  22%|██▏       | 21/97 [00:10<00:35,  2.13it/s][A
Training:  25%|██▍       | 24/97 [00:10<00:23,  3.05it/s][A
Training:  27%|██▋       | 26/97 [00:11<00:30,  2.30it/s][A
Training:  30%|██▉       | 29/97 [00:13<00:31,  2.16it/s][A
Training:  32%|███▏      | 31/97 [00:13<00:24,  2.75it/s][A
Training:  34%|███▍      | 33/97 [00:15<00:30,  2.10it/s][A
Training:  36%|███▌      | 35/97 [00:15<00:22,  2.75it/s][A
Training:  38%|███▊      | 37/97 [00:16<00:28,  2.12it/s][A
Training:  40%|████      | 39/97 [00

Epoch: 18/23 - Loss: 1.8824 - Accuracy: 0.9361



  0%|          | 0/13 [00:00<?, ?it/s][A
  8%|▊         | 1/13 [00:01<00:21,  1.79s/it][A
 31%|███       | 4/13 [00:01<00:03,  2.71it/s][A
 46%|████▌     | 6/13 [00:03<00:03,  1.98it/s][A
 69%|██████▉   | 9/13 [00:04<00:01,  2.05it/s][A
100%|██████████| 13/13 [00:04<00:00,  2.67it/s][A
Epochs:  78%|███████▊  | 18/23 [13:33<03:46, 45.27s/it]

Val Loss: 1.9640 - Val Accuracy: 0.9300



Training:   0%|          | 0/97 [00:00<?, ?it/s][A
Training:   1%|          | 1/97 [00:01<03:11,  1.99s/it][A
Training:   4%|▍         | 4/97 [00:02<00:38,  2.44it/s][A
Training:   6%|▌         | 6/97 [00:03<00:52,  1.73it/s][A
Training:   9%|▉         | 9/97 [00:05<00:49,  1.79it/s][A
Training:  12%|█▏        | 12/97 [00:05<00:29,  2.89it/s][A
Training:  14%|█▍        | 14/97 [00:06<00:38,  2.17it/s][A
Training:  18%|█▊        | 17/97 [00:08<00:39,  2.02it/s][A
Training:  21%|██        | 20/97 [00:08<00:25,  2.97it/s][A
Training:  23%|██▎       | 22/97 [00:10<00:33,  2.22it/s][A
Training:  26%|██▌       | 25/97 [00:11<00:34,  2.09it/s][A
Training:  29%|██▉       | 28/97 [00:12<00:22,  3.01it/s][A
Training:  31%|███       | 30/97 [00:13<00:29,  2.26it/s][A
Training:  34%|███▍      | 33/97 [00:15<00:30,  2.10it/s][A
Training:  38%|███▊      | 37/97 [00:16<00:27,  2.21it/s][A
Training:  41%|████      | 40/97 [00:16<00:18,  3.05it/s][A
Training:  43%|████▎     | 42/97 [00

Epoch: 19/23 - Loss: 1.9001 - Accuracy: 0.9377



  0%|          | 0/13 [00:00<?, ?it/s][A
  8%|▊         | 1/13 [00:01<00:21,  1.77s/it][A
 31%|███       | 4/13 [00:01<00:03,  2.71it/s][A
 46%|████▌     | 6/13 [00:03<00:03,  1.92it/s][A
 69%|██████▉   | 9/13 [00:04<00:02,  1.98it/s][A
100%|██████████| 13/13 [00:05<00:00,  2.60it/s][A
Epochs:  83%|████████▎ | 19/23 [14:19<03:01, 45.35s/it]

Val Loss: 2.1567 - Val Accuracy: 0.9300



Training:   0%|          | 0/97 [00:00<?, ?it/s][A
Training:   1%|          | 1/97 [00:02<03:12,  2.00s/it][A
Training:   3%|▎         | 3/97 [00:02<00:52,  1.78it/s][A
Training:   5%|▌         | 5/97 [00:03<01:00,  1.51it/s][A
Training:   7%|▋         | 7/97 [00:03<00:36,  2.48it/s][A
Training:   9%|▉         | 9/97 [00:05<00:46,  1.87it/s][A
Training:  11%|█▏        | 11/97 [00:05<00:31,  2.72it/s][A
Training:  13%|█▎        | 13/97 [00:06<00:42,  1.96it/s][A
Training:  16%|█▋        | 16/97 [00:07<00:25,  3.20it/s][A
Training:  19%|█▊        | 18/97 [00:08<00:35,  2.22it/s][A
Training:  22%|██▏       | 21/97 [00:10<00:36,  2.09it/s][A
Training:  25%|██▍       | 24/97 [00:10<00:23,  3.09it/s][A
Training:  27%|██▋       | 26/97 [00:11<00:31,  2.29it/s][A
Training:  30%|██▉       | 29/97 [00:13<00:32,  2.12it/s][A
Training:  32%|███▏      | 31/97 [00:13<00:24,  2.73it/s][A
Training:  34%|███▍      | 33/97 [00:15<00:30,  2.12it/s][A
Training:  36%|███▌      | 35/97 [00:

Epoch: 20/23 - Loss: 1.8072 - Accuracy: 0.9352



  0%|          | 0/13 [00:00<?, ?it/s][A
  8%|▊         | 1/13 [00:01<00:20,  1.75s/it][A
 31%|███       | 4/13 [00:01<00:03,  2.78it/s][A
 46%|████▌     | 6/13 [00:03<00:03,  1.95it/s][A
 69%|██████▉   | 9/13 [00:04<00:01,  2.04it/s][A
100%|██████████| 13/13 [00:04<00:00,  2.67it/s][A
Epochs:  87%|████████▋ | 20/23 [15:04<02:16, 45.39s/it]

Val Loss: 2.0948 - Val Accuracy: 0.9284



Training:   0%|          | 0/97 [00:00<?, ?it/s][A
Training:   1%|          | 1/97 [00:01<03:09,  1.98s/it][A
Training:   4%|▍         | 4/97 [00:02<00:37,  2.46it/s][A
Training:   6%|▌         | 6/97 [00:03<00:52,  1.74it/s][A
Training:   9%|▉         | 9/97 [00:05<00:48,  1.80it/s][A
Training:  12%|█▏        | 12/97 [00:05<00:29,  2.91it/s][A
Training:  14%|█▍        | 14/97 [00:06<00:38,  2.14it/s][A
Training:  18%|█▊        | 17/97 [00:08<00:39,  2.03it/s][A
Training:  21%|██        | 20/97 [00:08<00:25,  2.99it/s][A
Training:  23%|██▎       | 22/97 [00:10<00:33,  2.27it/s][A
Training:  26%|██▌       | 25/97 [00:11<00:34,  2.08it/s][A
Training:  29%|██▉       | 28/97 [00:12<00:23,  2.98it/s][A
Training:  31%|███       | 30/97 [00:13<00:30,  2.22it/s][A
Training:  34%|███▍      | 33/97 [00:15<00:30,  2.10it/s][A
Training:  37%|███▋      | 36/97 [00:15<00:20,  3.00it/s][A
Training:  39%|███▉      | 38/97 [00:16<00:25,  2.28it/s][A
Training:  42%|████▏     | 41/97 [00

Epoch: 21/23 - Loss: 1.8687 - Accuracy: 0.9371



  0%|          | 0/13 [00:00<?, ?it/s][A
  8%|▊         | 1/13 [00:01<00:21,  1.78s/it][A
 31%|███       | 4/13 [00:01<00:03,  2.74it/s][A
 46%|████▌     | 6/13 [00:03<00:03,  1.96it/s][A
 69%|██████▉   | 9/13 [00:04<00:01,  2.03it/s][A
100%|██████████| 13/13 [00:04<00:00,  2.66it/s][A
Epochs:  91%|█████████▏| 21/23 [15:50<01:30, 45.39s/it]

Val Loss: 2.1749 - Val Accuracy: 0.9369



Training:   0%|          | 0/97 [00:00<?, ?it/s][A
Training:   1%|          | 1/97 [00:02<03:15,  2.03s/it][A
Training:   4%|▍         | 4/97 [00:02<00:38,  2.41it/s][A
Training:   6%|▌         | 6/97 [00:03<00:52,  1.73it/s][A
Training:   9%|▉         | 9/97 [00:05<00:48,  1.82it/s][A
Training:  12%|█▏        | 12/97 [00:05<00:28,  2.95it/s][A
Training:  14%|█▍        | 14/97 [00:06<00:38,  2.15it/s][A
Training:  18%|█▊        | 17/97 [00:08<00:39,  2.04it/s][A
Training:  21%|██        | 20/97 [00:08<00:25,  2.99it/s][A
Training:  23%|██▎       | 22/97 [00:10<00:33,  2.24it/s][A
Training:  26%|██▌       | 25/97 [00:11<00:33,  2.13it/s][A
Training:  28%|██▊       | 27/97 [00:11<00:25,  2.73it/s][A
Training:  30%|██▉       | 29/97 [00:13<00:31,  2.16it/s][A
Training:  32%|███▏      | 31/97 [00:13<00:23,  2.84it/s][A
Training:  34%|███▍      | 33/97 [00:14<00:29,  2.16it/s][A
Training:  36%|███▌      | 35/97 [00:15<00:21,  2.88it/s][A
Training:  38%|███▊      | 37/97 [00

Epoch: 22/23 - Loss: 1.8830 - Accuracy: 0.9397



  0%|          | 0/13 [00:00<?, ?it/s][A
  8%|▊         | 1/13 [00:01<00:21,  1.80s/it][A
 31%|███       | 4/13 [00:01<00:03,  2.71it/s][A
 46%|████▌     | 6/13 [00:03<00:03,  1.95it/s][A
 69%|██████▉   | 9/13 [00:04<00:01,  2.02it/s][A
100%|██████████| 13/13 [00:04<00:00,  2.64it/s][A
Epochs:  96%|█████████▌| 22/23 [16:35<00:45, 45.32s/it]

Val Loss: 1.7816 - Val Accuracy: 0.9279



Training:   0%|          | 0/97 [00:00<?, ?it/s][A
Training:   1%|          | 1/97 [00:01<03:09,  1.97s/it][A
Training:   4%|▍         | 4/97 [00:02<00:37,  2.48it/s][A
Training:   6%|▌         | 6/97 [00:03<00:50,  1.79it/s][A
Training:   9%|▉         | 9/97 [00:05<00:48,  1.83it/s][A
Training:  12%|█▏        | 12/97 [00:05<00:28,  2.95it/s][A
Training:  14%|█▍        | 14/97 [00:06<00:38,  2.17it/s][A
Training:  18%|█▊        | 17/97 [00:08<00:39,  2.05it/s][A
Training:  21%|██        | 20/97 [00:08<00:25,  3.03it/s][A
Training:  23%|██▎       | 22/97 [00:10<00:33,  2.26it/s][A
Training:  26%|██▌       | 25/97 [00:11<00:34,  2.11it/s][A
Training:  29%|██▉       | 28/97 [00:11<00:22,  3.04it/s][A
Training:  31%|███       | 30/97 [00:13<00:29,  2.28it/s][A
Training:  34%|███▍      | 33/97 [00:14<00:29,  2.14it/s][A
Training:  37%|███▋      | 36/97 [00:15<00:19,  3.06it/s][A
Training:  39%|███▉      | 38/97 [00:16<00:25,  2.29it/s][A
Training:  42%|████▏     | 41/97 [00

Epoch: 23/23 - Loss: 1.8749 - Accuracy: 0.9381



  0%|          | 0/13 [00:00<?, ?it/s][A
  8%|▊         | 1/13 [00:01<00:21,  1.77s/it][A
 31%|███       | 4/13 [00:01<00:03,  2.76it/s][A
 46%|████▌     | 6/13 [00:03<00:03,  1.95it/s][A
 69%|██████▉   | 9/13 [00:04<00:01,  2.01it/s][A
100%|██████████| 13/13 [00:04<00:00,  2.65it/s][A
Epochs: 100%|██████████| 23/23 [17:20<00:00, 45.23s/it]
[32m[I 2023-12-15 05:12:10,034][0m Trial 18 finished with value: 0.9368699789047241 and parameters: {'learning_rate': 0.001500408021994709, 'weight_decay': 0.0005897407305513715, 'epsilon': 3.127923040073714e-09, 'batch_size': 145, 'epochs': 23}. Best is trial 2 with value: 0.9405519962310791.[0m


Val Loss: 2.1457 - Val Accuracy: 0.9369
Learning rate: 0.00024125614085284403
Weight decay: 0.0013256086878026582
Epsilon: 2.613211238494921e-08
Batch size: 173
Number of epochs: 86


Epochs:   0%|          | 0/86 [00:00<?, ?it/s]
Training:   0%|          | 0/81 [00:00<?, ?it/s][A
Training:   1%|          | 1/81 [00:02<02:58,  2.23s/it][A
Training:   5%|▍         | 4/81 [00:02<00:35,  2.17it/s][A
Training:   7%|▋         | 6/81 [00:04<00:48,  1.54it/s][A
Training:  11%|█         | 9/81 [00:06<00:46,  1.56it/s][A
Training:  15%|█▍        | 12/81 [00:06<00:27,  2.52it/s][A
Training:  17%|█▋        | 14/81 [00:08<00:37,  1.80it/s][A
Training:  21%|██        | 17/81 [00:10<00:37,  1.69it/s][A
Training:  25%|██▍       | 20/81 [00:10<00:24,  2.50it/s][A
Training:  27%|██▋       | 22/81 [00:12<00:31,  1.89it/s][A
Training:  31%|███       | 25/81 [00:13<00:31,  1.78it/s][A
Training:  35%|███▍      | 28/81 [00:14<00:20,  2.58it/s][A
Training:  37%|███▋      | 30/81 [00:15<00:26,  1.90it/s][A
Training:  41%|████      | 33/81 [00:17<00:27,  1.77it/s][A
Training:  44%|████▍     | 36/81 [00:17<00:17,  2.54it/s][A
Training:  47%|████▋     | 38/81 [00:19<00:22,  1.9

Epoch: 1/86 - Loss: 4.3779 - Accuracy: 0.7825



  0%|          | 0/11 [00:00<?, ?it/s][A
  9%|▉         | 1/11 [00:02<00:20,  2.07s/it][A
 36%|███▋      | 4/11 [00:02<00:02,  2.37it/s][A
 55%|█████▍    | 6/11 [00:03<00:02,  1.70it/s][A
100%|██████████| 11/11 [00:05<00:00,  2.00it/s][A
Epochs:   0%|          | 0/86 [00:46<?, ?it/s]
[32m[I 2023-12-15 05:12:56,486][0m Trial 19 pruned. [0m


Val Loss: 3.0306 - Val Accuracy: 0.8757

Study statistics: 
  Number of finished trials:  20
  Number of pruned trials:  13
  Number of complete trials:  7


In [23]:
# Report the study's best trial: its value first, then each of its parameters.
print("Best trial:")
trial = study.best_trial

# Two spaces after the colon reproduce print()'s default separator.
print(f"  Value:  {trial.value}")

print("  Params: ")
for key, value in trial.params.items():
    print(f"    {key}: {value}")

Best trial:
  Value:  0.9405519962310791
  Params: 
    batch_size: 157
    epochs: 89
    epsilon: 6.582574844800083e-09
    learning_rate: 0.00014936159954798418
    weight_decay: 0.000648991059773433


In [None]:
# ViT P12-S8 Triplet Mean
#
# Recorded result of the hyperparameter search, kept as comments so this cell
# is valid Python and does not raise a SyntaxError when the notebook is run.
#
# Best trial:
#   Value:  0.9405519962310791
#   Params:
#     batch_size: 157
#     epochs: 89
#     epsilon: 6.582574844800083e-09
#     learning_rate: 0.00014936159954798418
#     weight_decay: 0.000648991059773433