In [1]:
import pandas as pd
import numpy as np
import torch
import torch.nn as nn
from torch.utils.data import TensorDataset, DataLoader
from torch import Tensor
import torch.nn.functional as F
from torch.optim.lr_scheduler import MultiStepLR
from torch.utils.tensorboard import SummaryWriter

In [2]:
writer = SummaryWriter()

In [3]:
train_set = pd.read_csv("data/final_format/train_set.csv",header=None).to_numpy()
train_label = pd.read_csv("data/final_format/train_label.csv",header=None).to_numpy()
test_set = pd.read_csv("data/final_format/test_set.csv",header=None).to_numpy()
test_label = pd.read_csv("data/final_format/test_label.csv",header=None).to_numpy()

In [4]:
print(train_set.shape, train_label.shape, test_set.shape, test_label.shape)

(14393, 4096) (14393, 1) (3599, 4096) (3599, 1)


In [5]:
#delet first row data
train_set = train_set[1:]
train_label = train_label[1:]
test_set = test_set[1:]
test_label = test_label[1:]
print(train_set.shape, train_label.shape, test_set.shape, test_label.shape)

(14392, 4096) (14392, 1) (3598, 4096) (3598, 1)


In [6]:
train_set = train_set.reshape((-1,1,64,64))
test_set = test_set.reshape((-1,1,64,64))
print(train_set.shape, train_label.shape, test_set.shape, test_label.shape)

(14392, 1, 64, 64) (14392, 1) (3598, 1, 64, 64) (3598, 1)


In [7]:
train_label = train_label.reshape(-1)
test_label = test_label.reshape(-1)

print(train_set.shape, train_label.shape, test_set.shape, test_label.shape)

(14392, 1, 64, 64) (14392,) (3598, 1, 64, 64) (3598,)


In [8]:
# Hyper parameters
num_epochs = 300
num_classes = 4
batch_size = 64
learning_rate = 1e-3

In [9]:
train_set_tensor = Tensor(train_set) 
train_label_tensor = Tensor(train_label).type(torch.LongTensor)

train_dataset = TensorDataset(train_set_tensor,train_label_tensor) 
train_loader = DataLoader(train_dataset, batch_size=batch_size) 

test_set_tensor = Tensor(test_set) 
test_label_tensor = Tensor(test_label).type(torch.LongTensor)

test_dataset = TensorDataset(test_set_tensor,test_label_tensor) 
test_loader = DataLoader(test_dataset, batch_size=batch_size) 

In [10]:
# Device configuration
device = torch.device('cuda:0' if torch.cuda.is_available() else 'cpu')
device

device(type='cuda', index=0)

In [31]:
# Convolutional neural network (two convolutional layers)
class ResNet(nn.Module):
    def __init__(self, num_classes=4):
        super(ResNet, self).__init__()
        self.c1 = nn.Conv2d(1, 48, kernel_size=1, padding='same')
        self.c2 = nn.Conv2d(48, 48, kernel_size=3,padding='same')
        self.c3 = nn.Conv2d(48, 96, kernel_size=1,padding='same') 
        self.c4 = nn.Conv2d(97, 96, kernel_size=1, padding='same')
        self.c5 = nn.Conv2d(96, 96, kernel_size=3,padding='same')
        self.c6 = nn.Conv2d(96, 128, kernel_size=1, padding='same')
        self.c7 = nn.Conv2d(225, 128, kernel_size=3, padding='same')
        self.c8 = nn.Conv2d(128, 128, kernel_size=3,padding='same')
        self.c9 = nn.Conv2d(128, 256, kernel_size=3, padding='same')
        
        self.d1 = nn.Dropout(p=0.25)
        self.d2 = nn.Dropout(p=0.25)
        self.d3 = nn.Dropout(p=0.25)
        self.d4 = nn.Dropout(p=0.25)
        self.d5 = nn.Dropout(p=0.25)
        self.d6 = nn.Dropout(p=0.25) 
        self.d7 = nn.Dropout(p=0.25)
        self.d8 = nn.Dropout(p=0.25)
        self.d9 = nn.Dropout(p=0.25) 
        
        self.bn1 =  nn.BatchNorm2d(1)
        self.bn2 =  nn.BatchNorm2d(48)
        self.bn3 =  nn.BatchNorm2d(48)
        self.bn4 =  nn.BatchNorm2d(97)
        self.bn5 =  nn.BatchNorm2d(96)
        self.bn6 =  nn.BatchNorm2d(96)
        self.bn7 =  nn.BatchNorm2d(225)
        self.bn8 =  nn.BatchNorm2d(128)
        self.bn9 =  nn.BatchNorm2d(256)
        
        self.fc1 = nn.Linear(481*8*8, 512)
        self.fc2 = nn.Linear(512, num_classes)
        
        
    def forward(self, x):
        C1 = self.c1(self.bn1(x))
        C1 = F.leaky_relu(C1,0.2)
        C1 = self.d1(C1)
        C2 = self.c2(self.bn2(C1))
        C2 = F.leaky_relu(C2,0.2)
        C2 = self.d2(C2)
        C3 = self.c3(self.bn3(C2))
        sum1 = torch.cat((x, C3), dim=1)
        sum1 = F.leaky_relu(sum1,0.2)
        sum1 = self.d3(sum1)
        M1 = F.max_pool2d(sum1, kernel_size=2, stride=2)
         
        C4 = self.c4(self.bn4(M1))
        C4 = F.leaky_relu(C4,0.2)
        C4 = self.d4(C4)
        C5 = self.c5(self.bn5(C4))
        C5 = F.leaky_relu(C5,0.2)
        C5 = self.d5(C5)
        C6 = self.c6(self.bn6(C5))
        sum2 = torch.cat((M1, C6), dim=1)
        sum2 = F.leaky_relu(sum2,0.2)
        sum2 = self.d6(sum2)
        M2 = F.max_pool2d(sum2, kernel_size=2, stride=2)
        
        C7 = self.c7(self.bn7(M2))
        C7 = F.leaky_relu(C7,0.2)
        C7 = self.d7(C7)
        C8 = self.c8(self.bn8(C7))
        C8 = F.leaky_relu(C8,0.2)
        C8 = self.d8(C8)
        C9 = self.c9(self.bn9(C8))
        sum3 = torch.cat((M2, C9), dim=1)
        sum3 = F.leaky_relu(sum3,0.2)
        sum3 = self.d9(sum3)
        M3 = F.max_pool2d(sum3, kernel_size=2, stride=2)
        

        F1 = M3.reshape(M3.size(0), -1)
        Fc1 = self.fc1(F1)
        Fc2 = self.fc2(Fc1)
       
        return Fc2
    


In [32]:
model = ResNet(num_classes).to(device)

In [33]:
# Loss and optimizer
criterion = nn.CrossEntropyLoss()
optimizer = torch.optim.Adam(model.parameters(), lr=learning_rate, weight_decay=1e-3) 
#optimizer = torch.optim.Adam(model.parameters(), lr=learning_rate) 
milestones = [50,100,150,200,250]
milestones = [a * len(train_loader) for a in milestones]
scheduler = MultiStepLR(optimizer, milestones=milestones, gamma=0.5)

In [None]:
# Train the model
total_step = len(train_loader)
for epoch in range(num_epochs):
    correct=0
    total=0
    running_loss = 0
    for i, (X, Y) in enumerate(train_loader):
        X = X.to(device)
        Y = Y.to(device)
        
        
        # Forward pass
        outputs = model(X)
        loss = criterion(outputs, Y)
        
        # Backward and optimize
        optimizer.zero_grad()
        loss.backward()
        #scheduler.step() 
        #print(scheduler.get_last_lr()[0])
      
        optimizer.step()
        scheduler.step() 
        #print(optimizer.param_groups[0]["lr"])
        
        _, predicted = outputs.max(1)
        total += Y.size(0)
        correct += predicted.eq(Y).sum().item()
        running_loss += loss.item()
        accu=100.*correct/total
        train_loss = running_loss/(i+1)
        print ('Epoch [{}/{}], Step [{}/{}], Training Accuracy: {:.4f}%, Training Loss: {:.4f}%'.format(epoch+1, num_epochs, i+1, total_step, accu, train_loss))
    
   
        #writer.add_scalar(f'train/accuracy', accu, epoch)
        #writer.add_scalar(f'train/loss', train_loss, epoch)
        writer.add_scalars(f'train/accuracy_loss', {
            'accuracy': accu,
            'loss': train_loss,
        }, epoch)
        
        

Epoch [1/300], Step [1/225], Training Accuracy: 28.1250%, Training Loss: 1.5506%
Epoch [1/300], Step [2/225], Training Accuracy: 28.9062%, Training Loss: 56.4850%
Epoch [1/300], Step [3/225], Training Accuracy: 27.0833%, Training Loss: 61.9703%
Epoch [1/300], Step [4/225], Training Accuracy: 27.3438%, Training Loss: 51.3761%
Epoch [1/300], Step [5/225], Training Accuracy: 25.9375%, Training Loss: 47.2340%
Epoch [1/300], Step [6/225], Training Accuracy: 26.0417%, Training Loss: 43.9296%
Epoch [1/300], Step [7/225], Training Accuracy: 25.0000%, Training Loss: 43.5640%
Epoch [1/300], Step [8/225], Training Accuracy: 25.1953%, Training Loss: 40.9122%
Epoch [1/300], Step [9/225], Training Accuracy: 25.0000%, Training Loss: 39.9092%
Epoch [1/300], Step [10/225], Training Accuracy: 25.9375%, Training Loss: 38.0317%
Epoch [1/300], Step [11/225], Training Accuracy: 26.1364%, Training Loss: 37.0273%
Epoch [1/300], Step [12/225], Training Accuracy: 26.0417%, Training Loss: 35.8446%
Epoch [1/300],

Epoch [1/300], Step [108/225], Training Accuracy: 27.3582%, Training Loss: 6.8720%
Epoch [1/300], Step [109/225], Training Accuracy: 27.4943%, Training Loss: 6.8235%
Epoch [1/300], Step [110/225], Training Accuracy: 27.4716%, Training Loss: 6.7821%
Epoch [1/300], Step [111/225], Training Accuracy: 27.5056%, Training Loss: 6.7357%
Epoch [1/300], Step [112/225], Training Accuracy: 27.5251%, Training Loss: 6.6899%
Epoch [1/300], Step [113/225], Training Accuracy: 27.5581%, Training Loss: 6.6462%
Epoch [1/300], Step [114/225], Training Accuracy: 27.5630%, Training Loss: 6.6014%
Epoch [1/300], Step [115/225], Training Accuracy: 27.5408%, Training Loss: 6.5603%
Epoch [1/300], Step [116/225], Training Accuracy: 27.6401%, Training Loss: 6.5169%
Epoch [1/300], Step [117/225], Training Accuracy: 27.5507%, Training Loss: 6.4766%
Epoch [1/300], Step [118/225], Training Accuracy: 27.5291%, Training Loss: 6.4370%
Epoch [1/300], Step [119/225], Training Accuracy: 27.5867%, Training Loss: 6.3982%
Epoc

Epoch [1/300], Step [208/225], Training Accuracy: 28.1100%, Training Loss: 4.4127%
Epoch [1/300], Step [209/225], Training Accuracy: 28.1175%, Training Loss: 4.3985%
Epoch [1/300], Step [210/225], Training Accuracy: 28.0804%, Training Loss: 4.3853%
Epoch [1/300], Step [211/225], Training Accuracy: 28.0880%, Training Loss: 4.3711%
Epoch [1/300], Step [212/225], Training Accuracy: 28.0808%, Training Loss: 4.3570%
Epoch [1/300], Step [213/225], Training Accuracy: 28.1030%, Training Loss: 4.3435%
Epoch [1/300], Step [214/225], Training Accuracy: 28.0958%, Training Loss: 4.3301%
Epoch [1/300], Step [215/225], Training Accuracy: 28.0160%, Training Loss: 4.3178%
Epoch [1/300], Step [216/225], Training Accuracy: 28.0744%, Training Loss: 4.3042%
Epoch [1/300], Step [217/225], Training Accuracy: 28.1250%, Training Loss: 4.2902%
Epoch [1/300], Step [218/225], Training Accuracy: 28.1537%, Training Loss: 4.2781%
Epoch [1/300], Step [219/225], Training Accuracy: 28.1393%, Training Loss: 4.2661%
Epoc

Epoch [2/300], Step [83/225], Training Accuracy: 30.4405%, Training Loss: 1.4179%
Epoch [2/300], Step [84/225], Training Accuracy: 30.4688%, Training Loss: 1.4166%
Epoch [2/300], Step [85/225], Training Accuracy: 30.4963%, Training Loss: 1.4166%
Epoch [2/300], Step [86/225], Training Accuracy: 30.5414%, Training Loss: 1.4155%
Epoch [2/300], Step [87/225], Training Accuracy: 30.5496%, Training Loss: 1.4170%
Epoch [2/300], Step [88/225], Training Accuracy: 30.4510%, Training Loss: 1.4179%
Epoch [2/300], Step [89/225], Training Accuracy: 30.4249%, Training Loss: 1.4185%
Epoch [2/300], Step [90/225], Training Accuracy: 30.4167%, Training Loss: 1.4185%
Epoch [2/300], Step [91/225], Training Accuracy: 30.3400%, Training Loss: 1.4253%
Epoch [2/300], Step [92/225], Training Accuracy: 30.2310%, Training Loss: 1.4305%
Epoch [2/300], Step [93/225], Training Accuracy: 30.2923%, Training Loss: 1.4323%
Epoch [2/300], Step [94/225], Training Accuracy: 30.3191%, Training Loss: 1.4309%
Epoch [2/300], S

Epoch [2/300], Step [189/225], Training Accuracy: 31.5972%, Training Loss: 1.4062%
Epoch [2/300], Step [190/225], Training Accuracy: 31.5461%, Training Loss: 1.4068%
Epoch [2/300], Step [191/225], Training Accuracy: 31.4791%, Training Loss: 1.4076%
Epoch [2/300], Step [192/225], Training Accuracy: 31.4860%, Training Loss: 1.4072%
Epoch [2/300], Step [193/225], Training Accuracy: 31.5253%, Training Loss: 1.4066%
Epoch [2/300], Step [194/225], Training Accuracy: 31.5802%, Training Loss: 1.4060%
Epoch [2/300], Step [195/225], Training Accuracy: 31.5785%, Training Loss: 1.4058%
Epoch [2/300], Step [196/225], Training Accuracy: 31.5370%, Training Loss: 1.4061%
Epoch [2/300], Step [197/225], Training Accuracy: 31.4959%, Training Loss: 1.4067%
Epoch [2/300], Step [198/225], Training Accuracy: 31.5025%, Training Loss: 1.4058%
Epoch [2/300], Step [199/225], Training Accuracy: 31.4777%, Training Loss: 1.4057%
Epoch [2/300], Step [200/225], Training Accuracy: 31.4844%, Training Loss: 1.4054%
Epoc

Epoch [3/300], Step [72/225], Training Accuracy: 34.1146%, Training Loss: 1.3496%
Epoch [3/300], Step [73/225], Training Accuracy: 34.1182%, Training Loss: 1.3496%
Epoch [3/300], Step [74/225], Training Accuracy: 34.2483%, Training Loss: 1.3481%
Epoch [3/300], Step [75/225], Training Accuracy: 34.2917%, Training Loss: 1.3466%
Epoch [3/300], Step [76/225], Training Accuracy: 34.2722%, Training Loss: 1.3469%
Epoch [3/300], Step [77/225], Training Accuracy: 34.2532%, Training Loss: 1.3474%
Epoch [3/300], Step [78/225], Training Accuracy: 34.3149%, Training Loss: 1.3463%
Epoch [3/300], Step [79/225], Training Accuracy: 34.3157%, Training Loss: 1.3462%
Epoch [3/300], Step [80/225], Training Accuracy: 34.1602%, Training Loss: 1.3463%
Epoch [3/300], Step [81/225], Training Accuracy: 34.2014%, Training Loss: 1.3460%
Epoch [3/300], Step [82/225], Training Accuracy: 34.1845%, Training Loss: 1.3480%
Epoch [3/300], Step [83/225], Training Accuracy: 34.1303%, Training Loss: 1.3486%
Epoch [3/300], S

Epoch [3/300], Step [172/225], Training Accuracy: 34.9110%, Training Loss: 1.3308%
Epoch [3/300], Step [173/225], Training Accuracy: 34.9530%, Training Loss: 1.3304%
Epoch [3/300], Step [174/225], Training Accuracy: 34.9048%, Training Loss: 1.3301%
Epoch [3/300], Step [175/225], Training Accuracy: 34.9375%, Training Loss: 1.3301%
Epoch [3/300], Step [176/225], Training Accuracy: 34.9254%, Training Loss: 1.3303%
Epoch [3/300], Step [177/225], Training Accuracy: 34.9311%, Training Loss: 1.3305%
Epoch [3/300], Step [178/225], Training Accuracy: 34.9368%, Training Loss: 1.3302%
Epoch [3/300], Step [179/225], Training Accuracy: 34.9511%, Training Loss: 1.3299%
Epoch [3/300], Step [180/225], Training Accuracy: 35.0174%, Training Loss: 1.3292%
Epoch [3/300], Step [181/225], Training Accuracy: 34.9879%, Training Loss: 1.3290%
Epoch [3/300], Step [182/225], Training Accuracy: 34.9760%, Training Loss: 1.3286%
Epoch [3/300], Step [183/225], Training Accuracy: 34.9556%, Training Loss: 1.3286%
Epoc

Epoch [4/300], Step [50/225], Training Accuracy: 37.4688%, Training Loss: 1.2841%
Epoch [4/300], Step [51/225], Training Accuracy: 37.6225%, Training Loss: 1.2836%
Epoch [4/300], Step [52/225], Training Accuracy: 37.7404%, Training Loss: 1.2834%
Epoch [4/300], Step [53/225], Training Accuracy: 37.7358%, Training Loss: 1.2827%
Epoch [4/300], Step [54/225], Training Accuracy: 37.8472%, Training Loss: 1.2819%
Epoch [4/300], Step [55/225], Training Accuracy: 37.7557%, Training Loss: 1.2823%
Epoch [4/300], Step [56/225], Training Accuracy: 37.6395%, Training Loss: 1.2823%
Epoch [4/300], Step [57/225], Training Accuracy: 37.7741%, Training Loss: 1.2801%
Epoch [4/300], Step [58/225], Training Accuracy: 37.7694%, Training Loss: 1.2794%
Epoch [4/300], Step [59/225], Training Accuracy: 37.9237%, Training Loss: 1.2777%
Epoch [4/300], Step [60/225], Training Accuracy: 37.8646%, Training Loss: 1.2768%
Epoch [4/300], Step [61/225], Training Accuracy: 37.8330%, Training Loss: 1.2764%
Epoch [4/300], S

Epoch [4/300], Step [155/225], Training Accuracy: 38.5585%, Training Loss: 1.2678%
Epoch [4/300], Step [156/225], Training Accuracy: 38.5216%, Training Loss: 1.2686%
Epoch [4/300], Step [157/225], Training Accuracy: 38.5052%, Training Loss: 1.2686%
Epoch [4/300], Step [158/225], Training Accuracy: 38.5384%, Training Loss: 1.2680%
Epoch [4/300], Step [159/225], Training Accuracy: 38.5613%, Training Loss: 1.2680%
Epoch [4/300], Step [160/225], Training Accuracy: 38.5840%, Training Loss: 1.2681%
Epoch [4/300], Step [161/225], Training Accuracy: 38.6549%, Training Loss: 1.2675%
Epoch [4/300], Step [162/225], Training Accuracy: 38.6671%, Training Loss: 1.2671%
Epoch [4/300], Step [163/225], Training Accuracy: 38.7270%, Training Loss: 1.2663%
Epoch [4/300], Step [164/225], Training Accuracy: 38.7671%, Training Loss: 1.2656%
Epoch [4/300], Step [165/225], Training Accuracy: 38.7405%, Training Loss: 1.2667%
Epoch [4/300], Step [166/225], Training Accuracy: 38.7707%, Training Loss: 1.2662%
Epoc

Epoch [5/300], Step [33/225], Training Accuracy: 40.8617%, Training Loss: 1.2221%
Epoch [5/300], Step [34/225], Training Accuracy: 40.8548%, Training Loss: 1.2229%
Epoch [5/300], Step [35/225], Training Accuracy: 40.7589%, Training Loss: 1.2225%
Epoch [5/300], Step [36/225], Training Accuracy: 40.5816%, Training Loss: 1.2228%
Epoch [5/300], Step [37/225], Training Accuracy: 40.6672%, Training Loss: 1.2217%
Epoch [5/300], Step [38/225], Training Accuracy: 40.8717%, Training Loss: 1.2201%
Epoch [5/300], Step [39/225], Training Accuracy: 41.0657%, Training Loss: 1.2178%
Epoch [5/300], Step [40/225], Training Accuracy: 40.8203%, Training Loss: 1.2181%
Epoch [5/300], Step [41/225], Training Accuracy: 40.8155%, Training Loss: 1.2172%
Epoch [5/300], Step [42/225], Training Accuracy: 40.8854%, Training Loss: 1.2167%
Epoch [5/300], Step [43/225], Training Accuracy: 40.9157%, Training Loss: 1.2157%
Epoch [5/300], Step [44/225], Training Accuracy: 41.1222%, Training Loss: 1.2129%
Epoch [5/300], S

Epoch [5/300], Step [138/225], Training Accuracy: 41.0892%, Training Loss: 1.2045%
Epoch [5/300], Step [139/225], Training Accuracy: 41.0746%, Training Loss: 1.2047%
Epoch [5/300], Step [140/225], Training Accuracy: 41.0938%, Training Loss: 1.2052%
Epoch [5/300], Step [141/225], Training Accuracy: 41.0793%, Training Loss: 1.2051%
Epoch [5/300], Step [142/225], Training Accuracy: 41.1312%, Training Loss: 1.2048%
Epoch [5/300], Step [143/225], Training Accuracy: 41.1713%, Training Loss: 1.2043%
Epoch [5/300], Step [144/225], Training Accuracy: 41.2435%, Training Loss: 1.2042%
Epoch [5/300], Step [145/225], Training Accuracy: 41.2392%, Training Loss: 1.2043%
Epoch [5/300], Step [146/225], Training Accuracy: 41.2136%, Training Loss: 1.2047%
Epoch [5/300], Step [147/225], Training Accuracy: 41.2521%, Training Loss: 1.2045%
Epoch [5/300], Step [148/225], Training Accuracy: 41.3640%, Training Loss: 1.2038%
Epoch [5/300], Step [149/225], Training Accuracy: 41.3591%, Training Loss: 1.2036%
Epoc

Epoch [6/300], Step [16/225], Training Accuracy: 45.0195%, Training Loss: 1.1631%
Epoch [6/300], Step [17/225], Training Accuracy: 45.4044%, Training Loss: 1.1557%
Epoch [6/300], Step [18/225], Training Accuracy: 44.7917%, Training Loss: 1.1565%
Epoch [6/300], Step [19/225], Training Accuracy: 44.9836%, Training Loss: 1.1548%
Epoch [6/300], Step [20/225], Training Accuracy: 44.7656%, Training Loss: 1.1560%
Epoch [6/300], Step [21/225], Training Accuracy: 45.1637%, Training Loss: 1.1498%
Epoch [6/300], Step [22/225], Training Accuracy: 45.0284%, Training Loss: 1.1507%
Epoch [6/300], Step [23/225], Training Accuracy: 45.1087%, Training Loss: 1.1462%
Epoch [6/300], Step [24/225], Training Accuracy: 45.1823%, Training Loss: 1.1446%
Epoch [6/300], Step [25/225], Training Accuracy: 45.4375%, Training Loss: 1.1385%
Epoch [6/300], Step [26/225], Training Accuracy: 45.4928%, Training Loss: 1.1371%
Epoch [6/300], Step [27/225], Training Accuracy: 44.9653%, Training Loss: 1.1414%
Epoch [6/300], S

Epoch [6/300], Step [117/225], Training Accuracy: 45.3392%, Training Loss: 1.1243%
Epoch [6/300], Step [118/225], Training Accuracy: 45.3655%, Training Loss: 1.1237%
Epoch [6/300], Step [119/225], Training Accuracy: 45.3388%, Training Loss: 1.1231%
Epoch [6/300], Step [120/225], Training Accuracy: 45.3646%, Training Loss: 1.1235%
Epoch [6/300], Step [121/225], Training Accuracy: 45.3642%, Training Loss: 1.1238%
Epoch [6/300], Step [122/225], Training Accuracy: 45.3765%, Training Loss: 1.1236%
Epoch [6/300], Step [123/225], Training Accuracy: 45.3760%, Training Loss: 1.1232%
Epoch [6/300], Step [124/225], Training Accuracy: 45.4007%, Training Loss: 1.1224%
Epoch [6/300], Step [125/225], Training Accuracy: 45.4125%, Training Loss: 1.1230%
Epoch [6/300], Step [126/225], Training Accuracy: 45.3745%, Training Loss: 1.1238%
Epoch [6/300], Step [127/225], Training Accuracy: 45.2756%, Training Loss: 1.1242%
Epoch [6/300], Step [128/225], Training Accuracy: 45.2393%, Training Loss: 1.1245%
Epoc

Epoch [6/300], Step [218/225], Training Accuracy: 45.9576%, Training Loss: 1.1093%
Epoch [6/300], Step [219/225], Training Accuracy: 45.9618%, Training Loss: 1.1088%
Epoch [6/300], Step [220/225], Training Accuracy: 46.0014%, Training Loss: 1.1086%
Epoch [6/300], Step [221/225], Training Accuracy: 45.9771%, Training Loss: 1.1089%
Epoch [6/300], Step [222/225], Training Accuracy: 45.9882%, Training Loss: 1.1084%
Epoch [6/300], Step [223/225], Training Accuracy: 45.9851%, Training Loss: 1.1085%
Epoch [6/300], Step [224/225], Training Accuracy: 45.9961%, Training Loss: 1.1078%
Epoch [6/300], Step [225/225], Training Accuracy: 45.9700%, Training Loss: 1.1080%
Epoch [7/300], Step [1/225], Training Accuracy: 57.8125%, Training Loss: 0.9899%
Epoch [7/300], Step [2/225], Training Accuracy: 53.9062%, Training Loss: 1.1048%
Epoch [7/300], Step [3/225], Training Accuracy: 50.0000%, Training Loss: 1.1208%
Epoch [7/300], Step [4/225], Training Accuracy: 49.2188%, Training Loss: 1.1041%
Epoch [7/300

Epoch [7/300], Step [99/225], Training Accuracy: 48.6269%, Training Loss: 1.0534%
Epoch [7/300], Step [100/225], Training Accuracy: 48.6250%, Training Loss: 1.0533%
Epoch [7/300], Step [101/225], Training Accuracy: 48.6850%, Training Loss: 1.0526%
Epoch [7/300], Step [102/225], Training Accuracy: 48.6520%, Training Loss: 1.0536%
Epoch [7/300], Step [103/225], Training Accuracy: 48.6802%, Training Loss: 1.0542%
Epoch [7/300], Step [104/225], Training Accuracy: 48.7230%, Training Loss: 1.0543%
Epoch [7/300], Step [105/225], Training Accuracy: 48.9286%, Training Loss: 1.0531%
Epoch [7/300], Step [106/225], Training Accuracy: 48.9387%, Training Loss: 1.0527%
Epoch [7/300], Step [107/225], Training Accuracy: 48.8756%, Training Loss: 1.0530%
Epoch [7/300], Step [108/225], Training Accuracy: 48.8137%, Training Loss: 1.0529%
Epoch [7/300], Step [109/225], Training Accuracy: 48.8245%, Training Loss: 1.0522%
Epoch [7/300], Step [110/225], Training Accuracy: 48.7784%, Training Loss: 1.0522%
Epoch

Epoch [7/300], Step [198/225], Training Accuracy: 49.2977%, Training Loss: 1.0403%
Epoch [7/300], Step [199/225], Training Accuracy: 49.2541%, Training Loss: 1.0403%
Epoch [7/300], Step [200/225], Training Accuracy: 49.2656%, Training Loss: 1.0406%
Epoch [7/300], Step [201/225], Training Accuracy: 49.2304%, Training Loss: 1.0413%
Epoch [7/300], Step [202/225], Training Accuracy: 49.2265%, Training Loss: 1.0413%
Epoch [7/300], Step [203/225], Training Accuracy: 49.2380%, Training Loss: 1.0412%
Epoch [7/300], Step [204/225], Training Accuracy: 49.2494%, Training Loss: 1.0414%
Epoch [7/300], Step [205/225], Training Accuracy: 49.2530%, Training Loss: 1.0414%
Epoch [7/300], Step [206/225], Training Accuracy: 49.2036%, Training Loss: 1.0419%
Epoch [7/300], Step [207/225], Training Accuracy: 49.1923%, Training Loss: 1.0423%
Epoch [7/300], Step [208/225], Training Accuracy: 49.1962%, Training Loss: 1.0420%
Epoch [7/300], Step [209/225], Training Accuracy: 49.2001%, Training Loss: 1.0424%
Epoc

Epoch [8/300], Step [74/225], Training Accuracy: 50.5068%, Training Loss: 1.0085%
Epoch [8/300], Step [75/225], Training Accuracy: 50.6458%, Training Loss: 1.0069%
Epoch [8/300], Step [76/225], Training Accuracy: 50.5345%, Training Loss: 1.0067%
Epoch [8/300], Step [77/225], Training Accuracy: 50.5885%, Training Loss: 1.0071%
Epoch [8/300], Step [78/225], Training Accuracy: 50.5609%, Training Loss: 1.0068%
Epoch [8/300], Step [79/225], Training Accuracy: 50.4747%, Training Loss: 1.0075%
Epoch [8/300], Step [80/225], Training Accuracy: 50.3906%, Training Loss: 1.0080%
Epoch [8/300], Step [81/225], Training Accuracy: 50.3858%, Training Loss: 1.0087%
Epoch [8/300], Step [82/225], Training Accuracy: 50.4192%, Training Loss: 1.0074%
Epoch [8/300], Step [83/225], Training Accuracy: 50.4142%, Training Loss: 1.0066%
Epoch [8/300], Step [84/225], Training Accuracy: 50.4278%, Training Loss: 1.0058%
Epoch [8/300], Step [85/225], Training Accuracy: 50.4779%, Training Loss: 1.0052%
Epoch [8/300], S

Epoch [8/300], Step [176/225], Training Accuracy: 50.9322%, Training Loss: 1.0016%
Epoch [8/300], Step [177/225], Training Accuracy: 51.0152%, Training Loss: 1.0006%
Epoch [8/300], Step [178/225], Training Accuracy: 50.9744%, Training Loss: 1.0010%
Epoch [8/300], Step [179/225], Training Accuracy: 51.0213%, Training Loss: 1.0002%
Epoch [8/300], Step [180/225], Training Accuracy: 51.1285%, Training Loss: 0.9992%
Epoch [8/300], Step [181/225], Training Accuracy: 51.0791%, Training Loss: 1.0002%
Epoch [8/300], Step [182/225], Training Accuracy: 51.1075%, Training Loss: 0.9997%
Epoch [8/300], Step [183/225], Training Accuracy: 51.0758%, Training Loss: 0.9999%
Epoch [8/300], Step [184/225], Training Accuracy: 51.0954%, Training Loss: 0.9992%
Epoch [8/300], Step [185/225], Training Accuracy: 51.0895%, Training Loss: 0.9989%
Epoch [8/300], Step [186/225], Training Accuracy: 51.1425%, Training Loss: 0.9979%
Epoch [8/300], Step [187/225], Training Accuracy: 51.1531%, Training Loss: 0.9976%
Epoc

Epoch [9/300], Step [57/225], Training Accuracy: 53.6732%, Training Loss: 0.9474%
Epoch [9/300], Step [58/225], Training Accuracy: 53.6369%, Training Loss: 0.9481%
Epoch [9/300], Step [59/225], Training Accuracy: 53.7341%, Training Loss: 0.9468%
Epoch [9/300], Step [60/225], Training Accuracy: 53.6979%, Training Loss: 0.9493%
Epoch [9/300], Step [61/225], Training Accuracy: 53.6885%, Training Loss: 0.9483%
Epoch [9/300], Step [62/225], Training Accuracy: 53.6290%, Training Loss: 0.9493%
Epoch [9/300], Step [63/225], Training Accuracy: 53.5714%, Training Loss: 0.9509%
Epoch [9/300], Step [64/225], Training Accuracy: 53.4180%, Training Loss: 0.9554%
Epoch [9/300], Step [65/225], Training Accuracy: 53.4135%, Training Loss: 0.9562%
Epoch [9/300], Step [66/225], Training Accuracy: 53.5038%, Training Loss: 0.9555%
Epoch [9/300], Step [67/225], Training Accuracy: 53.5215%, Training Loss: 0.9564%
Epoch [9/300], Step [68/225], Training Accuracy: 53.4926%, Training Loss: 0.9575%
Epoch [9/300], S

Epoch [9/300], Step [165/225], Training Accuracy: 52.9072%, Training Loss: 0.9576%
Epoch [9/300], Step [166/225], Training Accuracy: 52.8897%, Training Loss: 0.9571%
Epoch [9/300], Step [167/225], Training Accuracy: 52.9566%, Training Loss: 0.9563%
Epoch [9/300], Step [168/225], Training Accuracy: 52.9762%, Training Loss: 0.9560%
Epoch [9/300], Step [169/225], Training Accuracy: 53.0325%, Training Loss: 0.9548%
Epoch [9/300], Step [170/225], Training Accuracy: 53.0331%, Training Loss: 0.9545%
Epoch [9/300], Step [171/225], Training Accuracy: 53.0154%, Training Loss: 0.9545%
Epoch [9/300], Step [172/225], Training Accuracy: 52.9615%, Training Loss: 0.9551%
Epoch [9/300], Step [173/225], Training Accuracy: 52.9444%, Training Loss: 0.9551%
Epoch [9/300], Step [174/225], Training Accuracy: 52.9903%, Training Loss: 0.9546%
Epoch [9/300], Step [175/225], Training Accuracy: 53.0714%, Training Loss: 0.9540%
Epoch [9/300], Step [176/225], Training Accuracy: 53.1161%, Training Loss: 0.9537%
Epoc

Epoch [10/300], Step [40/225], Training Accuracy: 55.0391%, Training Loss: 0.9174%
Epoch [10/300], Step [41/225], Training Accuracy: 54.8018%, Training Loss: 0.9197%
Epoch [10/300], Step [42/225], Training Accuracy: 54.7991%, Training Loss: 0.9184%
Epoch [10/300], Step [43/225], Training Accuracy: 54.6875%, Training Loss: 0.9175%
Epoch [10/300], Step [44/225], Training Accuracy: 54.7940%, Training Loss: 0.9167%
Epoch [10/300], Step [45/225], Training Accuracy: 54.6875%, Training Loss: 0.9168%
Epoch [10/300], Step [46/225], Training Accuracy: 54.9932%, Training Loss: 0.9131%
Epoch [10/300], Step [47/225], Training Accuracy: 54.7872%, Training Loss: 0.9151%
Epoch [10/300], Step [48/225], Training Accuracy: 54.7526%, Training Loss: 0.9172%
Epoch [10/300], Step [49/225], Training Accuracy: 54.7832%, Training Loss: 0.9184%
Epoch [10/300], Step [50/225], Training Accuracy: 54.8438%, Training Loss: 0.9176%
Epoch [10/300], Step [51/225], Training Accuracy: 54.8100%, Training Loss: 0.9182%
Epoc

Epoch [10/300], Step [143/225], Training Accuracy: 54.7531%, Training Loss: 0.9266%
Epoch [10/300], Step [144/225], Training Accuracy: 54.7092%, Training Loss: 0.9268%
Epoch [10/300], Step [145/225], Training Accuracy: 54.6444%, Training Loss: 0.9270%
Epoch [10/300], Step [146/225], Training Accuracy: 54.6554%, Training Loss: 0.9277%
Epoch [10/300], Step [147/225], Training Accuracy: 54.6237%, Training Loss: 0.9282%
Epoch [10/300], Step [148/225], Training Accuracy: 54.6242%, Training Loss: 0.9281%
Epoch [10/300], Step [149/225], Training Accuracy: 54.6036%, Training Loss: 0.9283%
Epoch [10/300], Step [150/225], Training Accuracy: 54.6042%, Training Loss: 0.9278%
Epoch [10/300], Step [151/225], Training Accuracy: 54.6254%, Training Loss: 0.9271%
Epoch [10/300], Step [152/225], Training Accuracy: 54.6669%, Training Loss: 0.9266%
Epoch [10/300], Step [153/225], Training Accuracy: 54.6977%, Training Loss: 0.9259%
Epoch [10/300], Step [154/225], Training Accuracy: 54.7179%, Training Loss: 

Epoch [11/300], Step [20/225], Training Accuracy: 58.2031%, Training Loss: 0.8899%
Epoch [11/300], Step [21/225], Training Accuracy: 57.7381%, Training Loss: 0.8871%
Epoch [11/300], Step [22/225], Training Accuracy: 57.1023%, Training Loss: 0.8890%
Epoch [11/300], Step [23/225], Training Accuracy: 56.9973%, Training Loss: 0.8891%
Epoch [11/300], Step [24/225], Training Accuracy: 57.0964%, Training Loss: 0.8893%
Epoch [11/300], Step [25/225], Training Accuracy: 57.2500%, Training Loss: 0.8870%
Epoch [11/300], Step [26/225], Training Accuracy: 57.2115%, Training Loss: 0.8844%
Epoch [11/300], Step [27/225], Training Accuracy: 57.4653%, Training Loss: 0.8848%
Epoch [11/300], Step [28/225], Training Accuracy: 57.5893%, Training Loss: 0.8798%
Epoch [11/300], Step [29/225], Training Accuracy: 57.9203%, Training Loss: 0.8754%
Epoch [11/300], Step [30/225], Training Accuracy: 57.7604%, Training Loss: 0.8740%
Epoch [11/300], Step [31/225], Training Accuracy: 57.7621%, Training Loss: 0.8733%
Epoc

Epoch [11/300], Step [120/225], Training Accuracy: 56.5365%, Training Loss: 0.9081%
Epoch [11/300], Step [121/225], Training Accuracy: 56.4824%, Training Loss: 0.9083%
Epoch [11/300], Step [122/225], Training Accuracy: 56.5574%, Training Loss: 0.9076%
Epoch [11/300], Step [123/225], Training Accuracy: 56.6184%, Training Loss: 0.9065%
Epoch [11/300], Step [124/225], Training Accuracy: 56.6154%, Training Loss: 0.9059%
Epoch [11/300], Step [125/225], Training Accuracy: 56.6750%, Training Loss: 0.9083%
Epoch [11/300], Step [126/225], Training Accuracy: 56.7212%, Training Loss: 0.9078%
Epoch [11/300], Step [127/225], Training Accuracy: 56.7052%, Training Loss: 0.9080%
Epoch [11/300], Step [128/225], Training Accuracy: 56.7139%, Training Loss: 0.9080%
Epoch [11/300], Step [129/225], Training Accuracy: 56.6134%, Training Loss: 0.9098%
Epoch [11/300], Step [130/225], Training Accuracy: 56.5385%, Training Loss: 0.9110%
Epoch [11/300], Step [131/225], Training Accuracy: 56.5482%, Training Loss: 

Epoch [11/300], Step [222/225], Training Accuracy: 57.2424%, Training Loss: 0.8971%
Epoch [11/300], Step [223/225], Training Accuracy: 57.2520%, Training Loss: 0.8971%
Epoch [11/300], Step [224/225], Training Accuracy: 57.2614%, Training Loss: 0.8967%
Epoch [11/300], Step [225/225], Training Accuracy: 57.2610%, Training Loss: 0.8971%
Epoch [12/300], Step [1/225], Training Accuracy: 64.0625%, Training Loss: 0.7767%
Epoch [12/300], Step [2/225], Training Accuracy: 58.5938%, Training Loss: 0.8148%
Epoch [12/300], Step [3/225], Training Accuracy: 58.3333%, Training Loss: 0.9088%
Epoch [12/300], Step [4/225], Training Accuracy: 57.4219%, Training Loss: 0.9008%
Epoch [12/300], Step [5/225], Training Accuracy: 59.0625%, Training Loss: 0.8737%
Epoch [12/300], Step [6/225], Training Accuracy: 60.6771%, Training Loss: 0.8774%
Epoch [12/300], Step [7/225], Training Accuracy: 58.9286%, Training Loss: 0.8821%
Epoch [12/300], Step [8/225], Training Accuracy: 58.3984%, Training Loss: 0.8857%
Epoch [1

Epoch [12/300], Step [98/225], Training Accuracy: 58.1792%, Training Loss: 0.8692%
Epoch [12/300], Step [99/225], Training Accuracy: 58.2071%, Training Loss: 0.8690%
Epoch [12/300], Step [100/225], Training Accuracy: 58.1406%, Training Loss: 0.8705%
Epoch [12/300], Step [101/225], Training Accuracy: 58.0600%, Training Loss: 0.8704%
Epoch [12/300], Step [102/225], Training Accuracy: 58.0576%, Training Loss: 0.8720%
Epoch [12/300], Step [103/225], Training Accuracy: 58.0552%, Training Loss: 0.8726%
Epoch [12/300], Step [104/225], Training Accuracy: 57.9928%, Training Loss: 0.8730%
Epoch [12/300], Step [105/225], Training Accuracy: 58.0506%, Training Loss: 0.8726%
Epoch [12/300], Step [106/225], Training Accuracy: 58.0483%, Training Loss: 0.8723%
Epoch [12/300], Step [107/225], Training Accuracy: 57.9585%, Training Loss: 0.8735%
Epoch [12/300], Step [108/225], Training Accuracy: 57.8559%, Training Loss: 0.8732%
Epoch [12/300], Step [109/225], Training Accuracy: 57.8842%, Training Loss: 0.

Epoch [12/300], Step [198/225], Training Accuracy: 58.2702%, Training Loss: 0.8673%
Epoch [12/300], Step [199/225], Training Accuracy: 58.2836%, Training Loss: 0.8666%
Epoch [12/300], Step [200/225], Training Accuracy: 58.2891%, Training Loss: 0.8667%
Epoch [12/300], Step [201/225], Training Accuracy: 58.2867%, Training Loss: 0.8666%
Epoch [12/300], Step [202/225], Training Accuracy: 58.2766%, Training Loss: 0.8667%
Epoch [12/300], Step [203/225], Training Accuracy: 58.3359%, Training Loss: 0.8662%
Epoch [12/300], Step [204/225], Training Accuracy: 58.3487%, Training Loss: 0.8670%
Epoch [12/300], Step [205/225], Training Accuracy: 58.3765%, Training Loss: 0.8669%
Epoch [12/300], Step [206/225], Training Accuracy: 58.3359%, Training Loss: 0.8673%
Epoch [12/300], Step [207/225], Training Accuracy: 58.3484%, Training Loss: 0.8675%
Epoch [12/300], Step [208/225], Training Accuracy: 58.3984%, Training Loss: 0.8668%
Epoch [12/300], Step [209/225], Training Accuracy: 58.3882%, Training Loss: 

Epoch [13/300], Step [74/225], Training Accuracy: 60.2829%, Training Loss: 0.8360%
Epoch [13/300], Step [75/225], Training Accuracy: 60.2083%, Training Loss: 0.8362%
Epoch [13/300], Step [76/225], Training Accuracy: 60.0535%, Training Loss: 0.8379%
Epoch [13/300], Step [77/225], Training Accuracy: 60.0244%, Training Loss: 0.8393%
Epoch [13/300], Step [78/225], Training Accuracy: 59.9960%, Training Loss: 0.8397%
Epoch [13/300], Step [79/225], Training Accuracy: 59.9684%, Training Loss: 0.8399%
Epoch [13/300], Step [80/225], Training Accuracy: 59.8047%, Training Loss: 0.8405%
Epoch [13/300], Step [81/225], Training Accuracy: 59.7608%, Training Loss: 0.8417%
Epoch [13/300], Step [82/225], Training Accuracy: 59.7180%, Training Loss: 0.8416%
Epoch [13/300], Step [83/225], Training Accuracy: 59.7515%, Training Loss: 0.8416%
Epoch [13/300], Step [84/225], Training Accuracy: 59.8214%, Training Loss: 0.8411%
Epoch [13/300], Step [85/225], Training Accuracy: 59.9265%, Training Loss: 0.8398%
Epoc

Epoch [13/300], Step [175/225], Training Accuracy: 59.7768%, Training Loss: 0.8431%
Epoch [13/300], Step [176/225], Training Accuracy: 59.8011%, Training Loss: 0.8425%
Epoch [13/300], Step [177/225], Training Accuracy: 59.8694%, Training Loss: 0.8418%
Epoch [13/300], Step [178/225], Training Accuracy: 59.8315%, Training Loss: 0.8422%
Epoch [13/300], Step [179/225], Training Accuracy: 59.8638%, Training Loss: 0.8412%
Epoch [13/300], Step [180/225], Training Accuracy: 59.9306%, Training Loss: 0.8406%
Epoch [13/300], Step [181/225], Training Accuracy: 59.9275%, Training Loss: 0.8409%
Epoch [13/300], Step [182/225], Training Accuracy: 59.9330%, Training Loss: 0.8403%
Epoch [13/300], Step [183/225], Training Accuracy: 59.8702%, Training Loss: 0.8419%
Epoch [13/300], Step [184/225], Training Accuracy: 59.9100%, Training Loss: 0.8413%
Epoch [13/300], Step [185/225], Training Accuracy: 59.9324%, Training Loss: 0.8417%
Epoch [13/300], Step [186/225], Training Accuracy: 59.9378%, Training Loss: 

Epoch [14/300], Step [52/225], Training Accuracy: 61.6286%, Training Loss: 0.8120%
Epoch [14/300], Step [53/225], Training Accuracy: 61.5271%, Training Loss: 0.8122%
Epoch [14/300], Step [54/225], Training Accuracy: 61.3137%, Training Loss: 0.8142%
Epoch [14/300], Step [55/225], Training Accuracy: 61.3068%, Training Loss: 0.8151%
Epoch [14/300], Step [56/225], Training Accuracy: 61.2444%, Training Loss: 0.8147%
Epoch [14/300], Step [57/225], Training Accuracy: 61.2664%, Training Loss: 0.8132%
Epoch [14/300], Step [58/225], Training Accuracy: 61.2608%, Training Loss: 0.8141%
Epoch [14/300], Step [59/225], Training Accuracy: 61.2818%, Training Loss: 0.8132%
Epoch [14/300], Step [60/225], Training Accuracy: 61.4323%, Training Loss: 0.8124%
Epoch [14/300], Step [61/225], Training Accuracy: 61.3473%, Training Loss: 0.8134%
Epoch [14/300], Step [62/225], Training Accuracy: 61.4415%, Training Loss: 0.8122%
Epoch [14/300], Step [63/225], Training Accuracy: 61.2847%, Training Loss: 0.8127%
Epoc

Epoch [14/300], Step [152/225], Training Accuracy: 60.6086%, Training Loss: 0.8420%
Epoch [14/300], Step [153/225], Training Accuracy: 60.6107%, Training Loss: 0.8414%
Epoch [14/300], Step [154/225], Training Accuracy: 60.6027%, Training Loss: 0.8413%
Epoch [14/300], Step [155/225], Training Accuracy: 60.5444%, Training Loss: 0.8418%
Epoch [14/300], Step [156/225], Training Accuracy: 60.5369%, Training Loss: 0.8427%
Epoch [14/300], Step [157/225], Training Accuracy: 60.5593%, Training Loss: 0.8422%
Epoch [14/300], Step [158/225], Training Accuracy: 60.5024%, Training Loss: 0.8428%
Epoch [14/300], Step [159/225], Training Accuracy: 60.5248%, Training Loss: 0.8429%
Epoch [14/300], Step [160/225], Training Accuracy: 60.5762%, Training Loss: 0.8423%
Epoch [14/300], Step [161/225], Training Accuracy: 60.5784%, Training Loss: 0.8423%
Epoch [14/300], Step [162/225], Training Accuracy: 60.5324%, Training Loss: 0.8421%
Epoch [14/300], Step [163/225], Training Accuracy: 60.5445%, Training Loss: 

Epoch [15/300], Step [33/225], Training Accuracy: 63.7311%, Training Loss: 0.8087%
Epoch [15/300], Step [34/225], Training Accuracy: 63.4191%, Training Loss: 0.8129%
Epoch [15/300], Step [35/225], Training Accuracy: 63.1696%, Training Loss: 0.8130%
Epoch [15/300], Step [36/225], Training Accuracy: 63.0642%, Training Loss: 0.8160%
Epoch [15/300], Step [37/225], Training Accuracy: 62.9645%, Training Loss: 0.8167%
Epoch [15/300], Step [38/225], Training Accuracy: 62.9523%, Training Loss: 0.8156%
Epoch [15/300], Step [39/225], Training Accuracy: 62.9006%, Training Loss: 0.8171%
Epoch [15/300], Step [40/225], Training Accuracy: 63.0469%, Training Loss: 0.8170%
Epoch [15/300], Step [41/225], Training Accuracy: 62.8811%, Training Loss: 0.8183%
Epoch [15/300], Step [42/225], Training Accuracy: 62.8720%, Training Loss: 0.8173%
Epoch [15/300], Step [43/225], Training Accuracy: 62.7907%, Training Loss: 0.8177%
Epoch [15/300], Step [44/225], Training Accuracy: 62.7841%, Training Loss: 0.8187%
Epoc

Epoch [15/300], Step [135/225], Training Accuracy: 63.1597%, Training Loss: 0.8102%
Epoch [15/300], Step [136/225], Training Accuracy: 63.1664%, Training Loss: 0.8101%
Epoch [15/300], Step [137/225], Training Accuracy: 63.1843%, Training Loss: 0.8104%
Epoch [15/300], Step [138/225], Training Accuracy: 63.3039%, Training Loss: 0.8089%
Epoch [15/300], Step [139/225], Training Accuracy: 63.2756%, Training Loss: 0.8090%
Epoch [15/300], Step [140/225], Training Accuracy: 63.3036%, Training Loss: 0.8082%
Epoch [15/300], Step [141/225], Training Accuracy: 63.3311%, Training Loss: 0.8082%
Epoch [15/300], Step [142/225], Training Accuracy: 63.3693%, Training Loss: 0.8082%
Epoch [15/300], Step [143/225], Training Accuracy: 63.4288%, Training Loss: 0.8071%
Epoch [15/300], Step [144/225], Training Accuracy: 63.4006%, Training Loss: 0.8069%
Epoch [15/300], Step [145/225], Training Accuracy: 63.3728%, Training Loss: 0.8077%
Epoch [15/300], Step [146/225], Training Accuracy: 63.3776%, Training Loss: 

Epoch [16/300], Step [10/225], Training Accuracy: 64.8438%, Training Loss: 0.7977%
Epoch [16/300], Step [11/225], Training Accuracy: 64.4886%, Training Loss: 0.7971%
Epoch [16/300], Step [12/225], Training Accuracy: 64.0625%, Training Loss: 0.8002%
Epoch [16/300], Step [13/225], Training Accuracy: 65.0240%, Training Loss: 0.7839%
Epoch [16/300], Step [14/225], Training Accuracy: 64.8438%, Training Loss: 0.7881%
Epoch [16/300], Step [15/225], Training Accuracy: 64.5833%, Training Loss: 0.7943%
Epoch [16/300], Step [16/225], Training Accuracy: 65.0391%, Training Loss: 0.7911%
Epoch [16/300], Step [17/225], Training Accuracy: 65.1654%, Training Loss: 0.7856%
Epoch [16/300], Step [18/225], Training Accuracy: 64.9306%, Training Loss: 0.7897%
Epoch [16/300], Step [19/225], Training Accuracy: 65.2138%, Training Loss: 0.7852%
Epoch [16/300], Step [20/225], Training Accuracy: 65.3906%, Training Loss: 0.7829%
Epoch [16/300], Step [21/225], Training Accuracy: 65.2530%, Training Loss: 0.7797%
Epoc

Epoch [16/300], Step [111/225], Training Accuracy: 64.8930%, Training Loss: 0.7691%
Epoch [16/300], Step [112/225], Training Accuracy: 64.9554%, Training Loss: 0.7683%
Epoch [16/300], Step [113/225], Training Accuracy: 64.9475%, Training Loss: 0.7684%
Epoch [16/300], Step [114/225], Training Accuracy: 64.8986%, Training Loss: 0.7684%
Epoch [16/300], Step [115/225], Training Accuracy: 65.0136%, Training Loss: 0.7671%
Epoch [16/300], Step [116/225], Training Accuracy: 65.0323%, Training Loss: 0.7668%
Epoch [16/300], Step [117/225], Training Accuracy: 64.9038%, Training Loss: 0.7697%
Epoch [16/300], Step [118/225], Training Accuracy: 64.9364%, Training Loss: 0.7685%
Epoch [16/300], Step [119/225], Training Accuracy: 64.9422%, Training Loss: 0.7681%
Epoch [16/300], Step [120/225], Training Accuracy: 64.9349%, Training Loss: 0.7684%
Epoch [16/300], Step [121/225], Training Accuracy: 64.8760%, Training Loss: 0.7686%
Epoch [16/300], Step [122/225], Training Accuracy: 64.8181%, Training Loss: 

Epoch [16/300], Step [212/225], Training Accuracy: 65.7282%, Training Loss: 0.7552%
Epoch [16/300], Step [213/225], Training Accuracy: 65.6910%, Training Loss: 0.7568%
Epoch [16/300], Step [214/225], Training Accuracy: 65.7126%, Training Loss: 0.7565%
Epoch [16/300], Step [215/225], Training Accuracy: 65.6686%, Training Loss: 0.7583%
Epoch [16/300], Step [216/225], Training Accuracy: 65.6467%, Training Loss: 0.7583%
Epoch [16/300], Step [217/225], Training Accuracy: 65.6394%, Training Loss: 0.7585%
Epoch [16/300], Step [218/225], Training Accuracy: 65.6035%, Training Loss: 0.7588%
Epoch [16/300], Step [219/225], Training Accuracy: 65.6036%, Training Loss: 0.7592%
Epoch [16/300], Step [220/225], Training Accuracy: 65.6250%, Training Loss: 0.7589%
Epoch [16/300], Step [221/225], Training Accuracy: 65.6391%, Training Loss: 0.7590%
Epoch [16/300], Step [222/225], Training Accuracy: 65.6180%, Training Loss: 0.7589%
Epoch [16/300], Step [223/225], Training Accuracy: 65.6250%, Training Loss: 

Epoch [17/300], Step [91/225], Training Accuracy: 65.7624%, Training Loss: 0.7519%
Epoch [17/300], Step [92/225], Training Accuracy: 65.7269%, Training Loss: 0.7520%
Epoch [17/300], Step [93/225], Training Accuracy: 65.7426%, Training Loss: 0.7517%
Epoch [17/300], Step [94/225], Training Accuracy: 65.8910%, Training Loss: 0.7492%
Epoch [17/300], Step [95/225], Training Accuracy: 65.9211%, Training Loss: 0.7492%
Epoch [17/300], Step [96/225], Training Accuracy: 66.0807%, Training Loss: 0.7473%
Epoch [17/300], Step [97/225], Training Accuracy: 66.0921%, Training Loss: 0.7480%
Epoch [17/300], Step [98/225], Training Accuracy: 66.0714%, Training Loss: 0.7483%
Epoch [17/300], Step [99/225], Training Accuracy: 66.0196%, Training Loss: 0.7498%
Epoch [17/300], Step [100/225], Training Accuracy: 65.9844%, Training Loss: 0.7501%
Epoch [17/300], Step [101/225], Training Accuracy: 66.0427%, Training Loss: 0.7500%
Epoch [17/300], Step [102/225], Training Accuracy: 65.9926%, Training Loss: 0.7499%
E

Epoch [17/300], Step [195/225], Training Accuracy: 66.5705%, Training Loss: 0.7473%
Epoch [17/300], Step [196/225], Training Accuracy: 66.5896%, Training Loss: 0.7471%
Epoch [17/300], Step [197/225], Training Accuracy: 66.5530%, Training Loss: 0.7471%
Epoch [17/300], Step [198/225], Training Accuracy: 66.6035%, Training Loss: 0.7458%
Epoch [17/300], Step [199/225], Training Accuracy: 66.6457%, Training Loss: 0.7453%
Epoch [17/300], Step [200/225], Training Accuracy: 66.6953%, Training Loss: 0.7449%
Epoch [17/300], Step [201/225], Training Accuracy: 66.6822%, Training Loss: 0.7446%
Epoch [17/300], Step [202/225], Training Accuracy: 66.6925%, Training Loss: 0.7451%
Epoch [17/300], Step [203/225], Training Accuracy: 66.7411%, Training Loss: 0.7440%
Epoch [17/300], Step [204/225], Training Accuracy: 66.7279%, Training Loss: 0.7440%
Epoch [17/300], Step [205/225], Training Accuracy: 66.7530%, Training Loss: 0.7441%
Epoch [17/300], Step [206/225], Training Accuracy: 66.7476%, Training Loss: 

Epoch [18/300], Step [72/225], Training Accuracy: 68.1207%, Training Loss: 0.7278%
Epoch [18/300], Step [73/225], Training Accuracy: 68.1721%, Training Loss: 0.7271%
Epoch [18/300], Step [74/225], Training Accuracy: 68.2432%, Training Loss: 0.7243%
Epoch [18/300], Step [75/225], Training Accuracy: 68.1875%, Training Loss: 0.7241%
Epoch [18/300], Step [76/225], Training Accuracy: 68.0921%, Training Loss: 0.7262%
Epoch [18/300], Step [77/225], Training Accuracy: 68.0601%, Training Loss: 0.7273%
Epoch [18/300], Step [78/225], Training Accuracy: 67.9888%, Training Loss: 0.7284%
Epoch [18/300], Step [79/225], Training Accuracy: 67.9391%, Training Loss: 0.7288%
Epoch [18/300], Step [80/225], Training Accuracy: 67.8125%, Training Loss: 0.7308%
Epoch [18/300], Step [81/225], Training Accuracy: 67.6505%, Training Loss: 0.7316%
Epoch [18/300], Step [82/225], Training Accuracy: 67.6639%, Training Loss: 0.7310%
Epoch [18/300], Step [83/225], Training Accuracy: 67.5452%, Training Loss: 0.7317%
Epoc

Epoch [18/300], Step [175/225], Training Accuracy: 67.5982%, Training Loss: 0.7303%
Epoch [18/300], Step [176/225], Training Accuracy: 67.5337%, Training Loss: 0.7304%
Epoch [18/300], Step [177/225], Training Accuracy: 67.5318%, Training Loss: 0.7305%
Epoch [18/300], Step [178/225], Training Accuracy: 67.6001%, Training Loss: 0.7297%
Epoch [18/300], Step [179/225], Training Accuracy: 67.6763%, Training Loss: 0.7286%
Epoch [18/300], Step [180/225], Training Accuracy: 67.6910%, Training Loss: 0.7283%
Epoch [18/300], Step [181/225], Training Accuracy: 67.7055%, Training Loss: 0.7284%
Epoch [18/300], Step [182/225], Training Accuracy: 67.7026%, Training Loss: 0.7279%
Epoch [18/300], Step [183/225], Training Accuracy: 67.7254%, Training Loss: 0.7274%
Epoch [18/300], Step [184/225], Training Accuracy: 67.7055%, Training Loss: 0.7278%
Epoch [18/300], Step [185/225], Training Accuracy: 67.7365%, Training Loss: 0.7273%
Epoch [18/300], Step [186/225], Training Accuracy: 67.7755%, Training Loss: 

Epoch [19/300], Step [54/225], Training Accuracy: 68.3449%, Training Loss: 0.7340%
Epoch [19/300], Step [55/225], Training Accuracy: 68.2955%, Training Loss: 0.7346%
Epoch [19/300], Step [56/225], Training Accuracy: 68.2478%, Training Loss: 0.7343%
Epoch [19/300], Step [57/225], Training Accuracy: 68.2840%, Training Loss: 0.7330%
Epoch [19/300], Step [58/225], Training Accuracy: 68.2112%, Training Loss: 0.7337%
Epoch [19/300], Step [59/225], Training Accuracy: 68.2998%, Training Loss: 0.7316%
Epoch [19/300], Step [60/225], Training Accuracy: 68.2552%, Training Loss: 0.7330%
Epoch [19/300], Step [61/225], Training Accuracy: 68.2377%, Training Loss: 0.7343%
Epoch [19/300], Step [62/225], Training Accuracy: 68.4476%, Training Loss: 0.7317%
Epoch [19/300], Step [63/225], Training Accuracy: 68.5764%, Training Loss: 0.7296%
Epoch [19/300], Step [64/225], Training Accuracy: 68.6279%, Training Loss: 0.7296%
Epoch [19/300], Step [65/225], Training Accuracy: 68.6298%, Training Loss: 0.7318%
Epoc

Epoch [19/300], Step [157/225], Training Accuracy: 68.5709%, Training Loss: 0.7203%
Epoch [19/300], Step [158/225], Training Accuracy: 68.4929%, Training Loss: 0.7216%
Epoch [19/300], Step [159/225], Training Accuracy: 68.4847%, Training Loss: 0.7217%
Epoch [19/300], Step [160/225], Training Accuracy: 68.4961%, Training Loss: 0.7219%
Epoch [19/300], Step [161/225], Training Accuracy: 68.5074%, Training Loss: 0.7217%
Epoch [19/300], Step [162/225], Training Accuracy: 68.5571%, Training Loss: 0.7207%
Epoch [19/300], Step [163/225], Training Accuracy: 68.5679%, Training Loss: 0.7198%
Epoch [19/300], Step [164/225], Training Accuracy: 68.5976%, Training Loss: 0.7192%
Epoch [19/300], Step [165/225], Training Accuracy: 68.6174%, Training Loss: 0.7187%
Epoch [19/300], Step [166/225], Training Accuracy: 68.6465%, Training Loss: 0.7181%
Epoch [19/300], Step [167/225], Training Accuracy: 68.6845%, Training Loss: 0.7173%
Epoch [19/300], Step [168/225], Training Accuracy: 68.7035%, Training Loss: 

Epoch [20/300], Step [35/225], Training Accuracy: 69.0625%, Training Loss: 0.7114%
Epoch [20/300], Step [36/225], Training Accuracy: 68.9670%, Training Loss: 0.7131%
Epoch [20/300], Step [37/225], Training Accuracy: 69.2145%, Training Loss: 0.7105%
Epoch [20/300], Step [38/225], Training Accuracy: 69.2434%, Training Loss: 0.7078%
Epoch [20/300], Step [39/225], Training Accuracy: 69.4311%, Training Loss: 0.7044%
Epoch [20/300], Step [40/225], Training Accuracy: 69.4141%, Training Loss: 0.7059%
Epoch [20/300], Step [41/225], Training Accuracy: 69.0549%, Training Loss: 0.7118%
Epoch [20/300], Step [42/225], Training Accuracy: 68.7500%, Training Loss: 0.7138%
Epoch [20/300], Step [43/225], Training Accuracy: 68.6410%, Training Loss: 0.7156%
Epoch [20/300], Step [44/225], Training Accuracy: 68.7500%, Training Loss: 0.7145%
Epoch [20/300], Step [45/225], Training Accuracy: 68.8889%, Training Loss: 0.7138%
Epoch [20/300], Step [46/225], Training Accuracy: 69.1236%, Training Loss: 0.7103%
Epoc

Epoch [20/300], Step [139/225], Training Accuracy: 68.7950%, Training Loss: 0.7188%
Epoch [20/300], Step [140/225], Training Accuracy: 68.7500%, Training Loss: 0.7187%
Epoch [20/300], Step [141/225], Training Accuracy: 68.7832%, Training Loss: 0.7176%
Epoch [20/300], Step [142/225], Training Accuracy: 68.7500%, Training Loss: 0.7183%
Epoch [20/300], Step [143/225], Training Accuracy: 68.7609%, Training Loss: 0.7181%
Epoch [20/300], Step [144/225], Training Accuracy: 68.7826%, Training Loss: 0.7172%
Epoch [20/300], Step [145/225], Training Accuracy: 68.7284%, Training Loss: 0.7171%
Epoch [20/300], Step [146/225], Training Accuracy: 68.7179%, Training Loss: 0.7171%
Epoch [20/300], Step [147/225], Training Accuracy: 68.7181%, Training Loss: 0.7175%
Epoch [20/300], Step [148/225], Training Accuracy: 68.8028%, Training Loss: 0.7163%
Epoch [20/300], Step [149/225], Training Accuracy: 68.7815%, Training Loss: 0.7163%
Epoch [20/300], Step [150/225], Training Accuracy: 68.8333%, Training Loss: 

Epoch [21/300], Step [18/225], Training Accuracy: 70.9201%, Training Loss: 0.6509%
Epoch [21/300], Step [19/225], Training Accuracy: 71.1349%, Training Loss: 0.6456%
Epoch [21/300], Step [20/225], Training Accuracy: 71.4062%, Training Loss: 0.6365%
Epoch [21/300], Step [21/225], Training Accuracy: 71.5774%, Training Loss: 0.6347%
Epoch [21/300], Step [22/225], Training Accuracy: 71.0227%, Training Loss: 0.6391%
Epoch [21/300], Step [23/225], Training Accuracy: 71.0598%, Training Loss: 0.6372%
Epoch [21/300], Step [24/225], Training Accuracy: 71.0938%, Training Loss: 0.6379%
Epoch [21/300], Step [25/225], Training Accuracy: 71.4375%, Training Loss: 0.6324%
Epoch [21/300], Step [26/225], Training Accuracy: 71.3942%, Training Loss: 0.6288%
Epoch [21/300], Step [27/225], Training Accuracy: 71.4699%, Training Loss: 0.6328%
Epoch [21/300], Step [28/225], Training Accuracy: 71.9308%, Training Loss: 0.6245%
Epoch [21/300], Step [29/225], Training Accuracy: 72.1983%, Training Loss: 0.6208%
Epoc

Epoch [21/300], Step [122/225], Training Accuracy: 70.0435%, Training Loss: 0.6799%
Epoch [21/300], Step [123/225], Training Accuracy: 70.0457%, Training Loss: 0.6791%
Epoch [21/300], Step [124/225], Training Accuracy: 70.1109%, Training Loss: 0.6780%
Epoch [21/300], Step [125/225], Training Accuracy: 70.1250%, Training Loss: 0.6783%
Epoch [21/300], Step [126/225], Training Accuracy: 70.1389%, Training Loss: 0.6779%
Epoch [21/300], Step [127/225], Training Accuracy: 70.1403%, Training Loss: 0.6781%
Epoch [21/300], Step [128/225], Training Accuracy: 70.1294%, Training Loss: 0.6778%
Epoch [21/300], Step [129/225], Training Accuracy: 70.1550%, Training Loss: 0.6776%
Epoch [21/300], Step [130/225], Training Accuracy: 70.1322%, Training Loss: 0.6781%
Epoch [21/300], Step [131/225], Training Accuracy: 70.0859%, Training Loss: 0.6787%
Epoch [21/300], Step [132/225], Training Accuracy: 70.1113%, Training Loss: 0.6780%
Epoch [21/300], Step [133/225], Training Accuracy: 70.1480%, Training Loss: 

Epoch [21/300], Step [225/225], Training Accuracy: 71.4355%, Training Loss: 0.6520%
Epoch [22/300], Step [1/225], Training Accuracy: 79.6875%, Training Loss: 0.4935%
Epoch [22/300], Step [2/225], Training Accuracy: 75.0000%, Training Loss: 0.5689%
Epoch [22/300], Step [3/225], Training Accuracy: 72.3958%, Training Loss: 0.6526%
Epoch [22/300], Step [4/225], Training Accuracy: 71.8750%, Training Loss: 0.6621%
Epoch [22/300], Step [5/225], Training Accuracy: 70.3125%, Training Loss: 0.7123%
Epoch [22/300], Step [6/225], Training Accuracy: 71.8750%, Training Loss: 0.6741%
Epoch [22/300], Step [7/225], Training Accuracy: 71.6518%, Training Loss: 0.6622%
Epoch [22/300], Step [8/225], Training Accuracy: 73.0469%, Training Loss: 0.6487%
Epoch [22/300], Step [9/225], Training Accuracy: 73.0903%, Training Loss: 0.6388%
Epoch [22/300], Step [10/225], Training Accuracy: 72.6562%, Training Loss: 0.6510%
Epoch [22/300], Step [11/225], Training Accuracy: 72.8693%, Training Loss: 0.6503%
Epoch [22/30

Epoch [22/300], Step [105/225], Training Accuracy: 71.9494%, Training Loss: 0.6612%
Epoch [22/300], Step [106/225], Training Accuracy: 71.8603%, Training Loss: 0.6626%
Epoch [22/300], Step [107/225], Training Accuracy: 71.8750%, Training Loss: 0.6634%
Epoch [22/300], Step [108/225], Training Accuracy: 71.8461%, Training Loss: 0.6637%
Epoch [22/300], Step [109/225], Training Accuracy: 71.8033%, Training Loss: 0.6636%
Epoch [22/300], Step [110/225], Training Accuracy: 71.8182%, Training Loss: 0.6629%
Epoch [22/300], Step [111/225], Training Accuracy: 71.7765%, Training Loss: 0.6645%
Epoch [22/300], Step [112/225], Training Accuracy: 71.7773%, Training Loss: 0.6634%
Epoch [22/300], Step [113/225], Training Accuracy: 71.7782%, Training Loss: 0.6634%
Epoch [22/300], Step [114/225], Training Accuracy: 71.7516%, Training Loss: 0.6631%
Epoch [22/300], Step [115/225], Training Accuracy: 71.7935%, Training Loss: 0.6623%
Epoch [22/300], Step [116/225], Training Accuracy: 71.8211%, Training Loss: 

Epoch [22/300], Step [203/225], Training Accuracy: 72.6678%, Training Loss: 0.6445%
Epoch [22/300], Step [204/225], Training Accuracy: 72.6869%, Training Loss: 0.6440%
Epoch [22/300], Step [205/225], Training Accuracy: 72.7287%, Training Loss: 0.6433%
Epoch [22/300], Step [206/225], Training Accuracy: 72.7093%, Training Loss: 0.6431%
Epoch [22/300], Step [207/225], Training Accuracy: 72.7431%, Training Loss: 0.6423%
Epoch [22/300], Step [208/225], Training Accuracy: 72.7239%, Training Loss: 0.6421%
Epoch [22/300], Step [209/225], Training Accuracy: 72.6824%, Training Loss: 0.6422%
Epoch [22/300], Step [210/225], Training Accuracy: 72.6414%, Training Loss: 0.6425%
Epoch [22/300], Step [211/225], Training Accuracy: 72.6748%, Training Loss: 0.6421%
Epoch [22/300], Step [212/225], Training Accuracy: 72.7226%, Training Loss: 0.6412%
Epoch [22/300], Step [213/225], Training Accuracy: 72.7039%, Training Loss: 0.6412%
Epoch [22/300], Step [214/225], Training Accuracy: 72.7074%, Training Loss: 

Epoch [23/300], Step [78/225], Training Accuracy: 73.5577%, Training Loss: 0.6016%
Epoch [23/300], Step [79/225], Training Accuracy: 73.5759%, Training Loss: 0.6006%
Epoch [23/300], Step [80/225], Training Accuracy: 73.5742%, Training Loss: 0.5993%
Epoch [23/300], Step [81/225], Training Accuracy: 73.5725%, Training Loss: 0.5985%
Epoch [23/300], Step [82/225], Training Accuracy: 73.6662%, Training Loss: 0.5976%
Epoch [23/300], Step [83/225], Training Accuracy: 73.5881%, Training Loss: 0.5995%
Epoch [23/300], Step [84/225], Training Accuracy: 73.6793%, Training Loss: 0.5978%
Epoch [23/300], Step [85/225], Training Accuracy: 73.6765%, Training Loss: 0.5966%
Epoch [23/300], Step [86/225], Training Accuracy: 73.7282%, Training Loss: 0.5958%
Epoch [23/300], Step [87/225], Training Accuracy: 73.6710%, Training Loss: 0.5968%
Epoch [23/300], Step [88/225], Training Accuracy: 73.6683%, Training Loss: 0.5974%
Epoch [23/300], Step [89/225], Training Accuracy: 73.7008%, Training Loss: 0.5972%
Epoc

Epoch [23/300], Step [177/225], Training Accuracy: 73.1815%, Training Loss: 0.6185%
Epoch [23/300], Step [178/225], Training Accuracy: 73.2268%, Training Loss: 0.6175%
Epoch [23/300], Step [179/225], Training Accuracy: 73.2455%, Training Loss: 0.6173%
Epoch [23/300], Step [180/225], Training Accuracy: 73.2726%, Training Loss: 0.6166%
Epoch [23/300], Step [181/225], Training Accuracy: 73.2907%, Training Loss: 0.6166%
Epoch [23/300], Step [182/225], Training Accuracy: 73.2830%, Training Loss: 0.6165%
Epoch [23/300], Step [183/225], Training Accuracy: 73.2838%, Training Loss: 0.6164%
Epoch [23/300], Step [184/225], Training Accuracy: 73.2931%, Training Loss: 0.6160%
Epoch [23/300], Step [185/225], Training Accuracy: 73.3361%, Training Loss: 0.6156%
Epoch [23/300], Step [186/225], Training Accuracy: 73.4039%, Training Loss: 0.6147%
Epoch [23/300], Step [187/225], Training Accuracy: 73.4041%, Training Loss: 0.6147%
Epoch [23/300], Step [188/225], Training Accuracy: 73.4707%, Training Loss: 

Epoch [24/300], Step [51/225], Training Accuracy: 74.3566%, Training Loss: 0.5772%
Epoch [24/300], Step [52/225], Training Accuracy: 74.5793%, Training Loss: 0.5739%
Epoch [24/300], Step [53/225], Training Accuracy: 74.3219%, Training Loss: 0.5773%
Epoch [24/300], Step [54/225], Training Accuracy: 74.3924%, Training Loss: 0.5777%
Epoch [24/300], Step [55/225], Training Accuracy: 74.3182%, Training Loss: 0.5787%
Epoch [24/300], Step [56/225], Training Accuracy: 74.4699%, Training Loss: 0.5754%
Epoch [24/300], Step [57/225], Training Accuracy: 74.4243%, Training Loss: 0.5744%
Epoch [24/300], Step [58/225], Training Accuracy: 74.4343%, Training Loss: 0.5752%
Epoch [24/300], Step [59/225], Training Accuracy: 74.3114%, Training Loss: 0.5768%
Epoch [24/300], Step [60/225], Training Accuracy: 74.2969%, Training Loss: 0.5775%
Epoch [24/300], Step [61/225], Training Accuracy: 74.2059%, Training Loss: 0.5794%
Epoch [24/300], Step [62/225], Training Accuracy: 74.2692%, Training Loss: 0.5786%
Epoc

Epoch [24/300], Step [150/225], Training Accuracy: 74.4062%, Training Loss: 0.5942%
Epoch [24/300], Step [151/225], Training Accuracy: 74.3791%, Training Loss: 0.5946%
Epoch [24/300], Step [152/225], Training Accuracy: 74.4346%, Training Loss: 0.5947%
Epoch [24/300], Step [153/225], Training Accuracy: 74.4587%, Training Loss: 0.5942%
Epoch [24/300], Step [154/225], Training Accuracy: 74.4014%, Training Loss: 0.5954%
Epoch [24/300], Step [155/225], Training Accuracy: 74.3649%, Training Loss: 0.5957%
Epoch [24/300], Step [156/225], Training Accuracy: 74.3189%, Training Loss: 0.5968%
Epoch [24/300], Step [157/225], Training Accuracy: 74.2834%, Training Loss: 0.5968%
Epoch [24/300], Step [158/225], Training Accuracy: 74.1990%, Training Loss: 0.5989%
Epoch [24/300], Step [159/225], Training Accuracy: 74.1942%, Training Loss: 0.5989%
Epoch [24/300], Step [160/225], Training Accuracy: 74.1992%, Training Loss: 0.5985%
Epoch [24/300], Step [161/225], Training Accuracy: 74.1654%, Training Loss: 

Epoch [25/300], Step [27/225], Training Accuracy: 75.5787%, Training Loss: 0.5767%
Epoch [25/300], Step [28/225], Training Accuracy: 75.8929%, Training Loss: 0.5713%
Epoch [25/300], Step [29/225], Training Accuracy: 75.9698%, Training Loss: 0.5736%
Epoch [25/300], Step [30/225], Training Accuracy: 76.0938%, Training Loss: 0.5742%
Epoch [25/300], Step [31/225], Training Accuracy: 75.9073%, Training Loss: 0.5787%
Epoch [25/300], Step [32/225], Training Accuracy: 75.7324%, Training Loss: 0.5794%
Epoch [25/300], Step [33/225], Training Accuracy: 75.7102%, Training Loss: 0.5814%
Epoch [25/300], Step [34/225], Training Accuracy: 75.3676%, Training Loss: 0.5916%
Epoch [25/300], Step [35/225], Training Accuracy: 75.4464%, Training Loss: 0.5889%
Epoch [25/300], Step [36/225], Training Accuracy: 75.2604%, Training Loss: 0.5916%
Epoch [25/300], Step [37/225], Training Accuracy: 75.1689%, Training Loss: 0.5908%
Epoch [25/300], Step [38/225], Training Accuracy: 75.1645%, Training Loss: 0.5903%
Epoc

Epoch [25/300], Step [127/225], Training Accuracy: 75.0861%, Training Loss: 0.5903%
Epoch [25/300], Step [128/225], Training Accuracy: 75.0732%, Training Loss: 0.5904%
Epoch [25/300], Step [129/225], Training Accuracy: 75.0242%, Training Loss: 0.5908%
Epoch [25/300], Step [130/225], Training Accuracy: 75.0120%, Training Loss: 0.5915%
Epoch [25/300], Step [131/225], Training Accuracy: 75.0239%, Training Loss: 0.5919%
Epoch [25/300], Step [132/225], Training Accuracy: 75.0473%, Training Loss: 0.5918%
Epoch [25/300], Step [133/225], Training Accuracy: 75.0705%, Training Loss: 0.5921%
Epoch [25/300], Step [134/225], Training Accuracy: 75.0233%, Training Loss: 0.5927%
Epoch [25/300], Step [135/225], Training Accuracy: 75.0347%, Training Loss: 0.5937%
Epoch [25/300], Step [136/225], Training Accuracy: 75.0345%, Training Loss: 0.5945%
Epoch [25/300], Step [137/225], Training Accuracy: 75.0000%, Training Loss: 0.5950%
Epoch [25/300], Step [138/225], Training Accuracy: 75.0566%, Training Loss: 

Epoch [26/300], Step [5/225], Training Accuracy: 74.6875%, Training Loss: 0.5854%
Epoch [26/300], Step [6/225], Training Accuracy: 75.5208%, Training Loss: 0.5665%
Epoch [26/300], Step [7/225], Training Accuracy: 76.5625%, Training Loss: 0.5681%
Epoch [26/300], Step [8/225], Training Accuracy: 76.3672%, Training Loss: 0.5720%
Epoch [26/300], Step [9/225], Training Accuracy: 75.6944%, Training Loss: 0.5751%
Epoch [26/300], Step [10/225], Training Accuracy: 75.3125%, Training Loss: 0.5917%
Epoch [26/300], Step [11/225], Training Accuracy: 75.2841%, Training Loss: 0.5973%
Epoch [26/300], Step [12/225], Training Accuracy: 76.1719%, Training Loss: 0.5790%
Epoch [26/300], Step [13/225], Training Accuracy: 76.9231%, Training Loss: 0.5654%
Epoch [26/300], Step [14/225], Training Accuracy: 77.3438%, Training Loss: 0.5610%
Epoch [26/300], Step [15/225], Training Accuracy: 77.2917%, Training Loss: 0.5577%
Epoch [26/300], Step [16/225], Training Accuracy: 77.1484%, Training Loss: 0.5586%
Epoch [26

Epoch [26/300], Step [108/225], Training Accuracy: 76.5191%, Training Loss: 0.5603%
Epoch [26/300], Step [109/225], Training Accuracy: 76.5625%, Training Loss: 0.5599%
Epoch [26/300], Step [110/225], Training Accuracy: 76.5625%, Training Loss: 0.5588%
Epoch [26/300], Step [111/225], Training Accuracy: 76.5343%, Training Loss: 0.5597%
Epoch [26/300], Step [112/225], Training Accuracy: 76.5206%, Training Loss: 0.5608%
Epoch [26/300], Step [113/225], Training Accuracy: 76.4934%, Training Loss: 0.5631%
Epoch [26/300], Step [114/225], Training Accuracy: 76.4940%, Training Loss: 0.5629%
Epoch [26/300], Step [115/225], Training Accuracy: 76.5217%, Training Loss: 0.5625%
Epoch [26/300], Step [116/225], Training Accuracy: 76.4817%, Training Loss: 0.5633%
Epoch [26/300], Step [117/225], Training Accuracy: 76.4156%, Training Loss: 0.5650%
Epoch [26/300], Step [118/225], Training Accuracy: 76.4036%, Training Loss: 0.5653%
Epoch [26/300], Step [119/225], Training Accuracy: 76.4181%, Training Loss: 

Epoch [26/300], Step [214/225], Training Accuracy: 76.8546%, Training Loss: 0.5590%
Epoch [26/300], Step [215/225], Training Accuracy: 76.8750%, Training Loss: 0.5586%
Epoch [26/300], Step [216/225], Training Accuracy: 76.9097%, Training Loss: 0.5581%
Epoch [26/300], Step [217/225], Training Accuracy: 76.8793%, Training Loss: 0.5582%
Epoch [26/300], Step [218/225], Training Accuracy: 76.8349%, Training Loss: 0.5595%
Epoch [26/300], Step [219/225], Training Accuracy: 76.8408%, Training Loss: 0.5596%
Epoch [26/300], Step [220/225], Training Accuracy: 76.8963%, Training Loss: 0.5588%
Epoch [26/300], Step [221/225], Training Accuracy: 76.9089%, Training Loss: 0.5580%
Epoch [26/300], Step [222/225], Training Accuracy: 76.8792%, Training Loss: 0.5580%
Epoch [26/300], Step [223/225], Training Accuracy: 76.8708%, Training Loss: 0.5583%
Epoch [26/300], Step [224/225], Training Accuracy: 76.8834%, Training Loss: 0.5578%
Epoch [26/300], Step [225/225], Training Accuracy: 76.8830%, Training Loss: 

Epoch [27/300], Step [92/225], Training Accuracy: 76.4946%, Training Loss: 0.5534%
Epoch [27/300], Step [93/225], Training Accuracy: 76.5289%, Training Loss: 0.5526%
Epoch [27/300], Step [94/225], Training Accuracy: 76.5625%, Training Loss: 0.5508%
Epoch [27/300], Step [95/225], Training Accuracy: 76.6118%, Training Loss: 0.5502%
Epoch [27/300], Step [96/225], Training Accuracy: 76.6602%, Training Loss: 0.5483%
Epoch [27/300], Step [97/225], Training Accuracy: 76.5464%, Training Loss: 0.5502%
Epoch [27/300], Step [98/225], Training Accuracy: 76.5944%, Training Loss: 0.5505%
Epoch [27/300], Step [99/225], Training Accuracy: 76.6414%, Training Loss: 0.5502%
Epoch [27/300], Step [100/225], Training Accuracy: 76.5156%, Training Loss: 0.5526%
Epoch [27/300], Step [101/225], Training Accuracy: 76.5625%, Training Loss: 0.5513%
Epoch [27/300], Step [102/225], Training Accuracy: 76.6391%, Training Loss: 0.5508%
Epoch [27/300], Step [103/225], Training Accuracy: 76.7294%, Training Loss: 0.5498%


Epoch [27/300], Step [196/225], Training Accuracy: 77.5590%, Training Loss: 0.5355%
Epoch [27/300], Step [197/225], Training Accuracy: 77.5857%, Training Loss: 0.5354%
Epoch [27/300], Step [198/225], Training Accuracy: 77.6121%, Training Loss: 0.5348%
Epoch [27/300], Step [199/225], Training Accuracy: 77.6382%, Training Loss: 0.5341%
Epoch [27/300], Step [200/225], Training Accuracy: 77.6641%, Training Loss: 0.5337%
Epoch [27/300], Step [201/225], Training Accuracy: 77.7052%, Training Loss: 0.5328%
Epoch [27/300], Step [202/225], Training Accuracy: 77.7537%, Training Loss: 0.5320%
Epoch [27/300], Step [203/225], Training Accuracy: 77.7709%, Training Loss: 0.5323%
Epoch [27/300], Step [204/225], Training Accuracy: 77.7956%, Training Loss: 0.5316%
Epoch [27/300], Step [205/225], Training Accuracy: 77.7973%, Training Loss: 0.5316%
Epoch [27/300], Step [206/225], Training Accuracy: 77.7988%, Training Loss: 0.5314%
Epoch [27/300], Step [207/225], Training Accuracy: 77.7853%, Training Loss: 

Epoch [28/300], Step [75/225], Training Accuracy: 77.6875%, Training Loss: 0.5387%
Epoch [28/300], Step [76/225], Training Accuracy: 77.6727%, Training Loss: 0.5386%
Epoch [28/300], Step [77/225], Training Accuracy: 77.6583%, Training Loss: 0.5390%
Epoch [28/300], Step [78/225], Training Accuracy: 77.7043%, Training Loss: 0.5386%
Epoch [28/300], Step [79/225], Training Accuracy: 77.7888%, Training Loss: 0.5363%
Epoch [28/300], Step [80/225], Training Accuracy: 77.8906%, Training Loss: 0.5350%
Epoch [28/300], Step [81/225], Training Accuracy: 78.0093%, Training Loss: 0.5331%
Epoch [28/300], Step [82/225], Training Accuracy: 78.0869%, Training Loss: 0.5312%
Epoch [28/300], Step [83/225], Training Accuracy: 78.1062%, Training Loss: 0.5308%
Epoch [28/300], Step [84/225], Training Accuracy: 78.1808%, Training Loss: 0.5294%
Epoch [28/300], Step [85/225], Training Accuracy: 78.2904%, Training Loss: 0.5272%
Epoch [28/300], Step [86/225], Training Accuracy: 78.3612%, Training Loss: 0.5261%
Epoc

Epoch [28/300], Step [179/225], Training Accuracy: 77.6100%, Training Loss: 0.5390%
Epoch [28/300], Step [180/225], Training Accuracy: 77.6562%, Training Loss: 0.5383%
Epoch [28/300], Step [181/225], Training Accuracy: 77.6416%, Training Loss: 0.5385%
Epoch [28/300], Step [182/225], Training Accuracy: 77.5498%, Training Loss: 0.5398%
Epoch [28/300], Step [183/225], Training Accuracy: 77.5529%, Training Loss: 0.5404%
Epoch [28/300], Step [184/225], Training Accuracy: 77.5645%, Training Loss: 0.5408%
Epoch [28/300], Step [185/225], Training Accuracy: 77.5929%, Training Loss: 0.5398%
Epoch [28/300], Step [186/225], Training Accuracy: 77.6042%, Training Loss: 0.5392%
Epoch [28/300], Step [187/225], Training Accuracy: 77.5902%, Training Loss: 0.5395%
Epoch [28/300], Step [188/225], Training Accuracy: 77.6180%, Training Loss: 0.5390%
Epoch [28/300], Step [189/225], Training Accuracy: 77.6290%, Training Loss: 0.5386%
Epoch [28/300], Step [190/225], Training Accuracy: 77.6234%, Training Loss: 

Epoch [29/300], Step [55/225], Training Accuracy: 78.2102%, Training Loss: 0.5131%
Epoch [29/300], Step [56/225], Training Accuracy: 78.2645%, Training Loss: 0.5105%
Epoch [29/300], Step [57/225], Training Accuracy: 78.2072%, Training Loss: 0.5109%
Epoch [29/300], Step [58/225], Training Accuracy: 78.2328%, Training Loss: 0.5109%
Epoch [29/300], Step [59/225], Training Accuracy: 78.1250%, Training Loss: 0.5118%
Epoch [29/300], Step [60/225], Training Accuracy: 78.0208%, Training Loss: 0.5136%
Epoch [29/300], Step [61/225], Training Accuracy: 77.9969%, Training Loss: 0.5132%
Epoch [29/300], Step [62/225], Training Accuracy: 78.1250%, Training Loss: 0.5123%
Epoch [29/300], Step [63/225], Training Accuracy: 78.0754%, Training Loss: 0.5129%
Epoch [29/300], Step [64/225], Training Accuracy: 78.1738%, Training Loss: 0.5112%
Epoch [29/300], Step [65/225], Training Accuracy: 78.1731%, Training Loss: 0.5129%
Epoch [29/300], Step [66/225], Training Accuracy: 78.2907%, Training Loss: 0.5106%
Epoc

Epoch [29/300], Step [154/225], Training Accuracy: 78.0641%, Training Loss: 0.5154%
Epoch [29/300], Step [155/225], Training Accuracy: 78.0343%, Training Loss: 0.5154%
Epoch [29/300], Step [156/225], Training Accuracy: 78.0148%, Training Loss: 0.5155%
Epoch [29/300], Step [157/225], Training Accuracy: 78.0653%, Training Loss: 0.5149%
Epoch [29/300], Step [158/225], Training Accuracy: 78.0459%, Training Loss: 0.5160%
Epoch [29/300], Step [159/225], Training Accuracy: 77.9579%, Training Loss: 0.5174%
Epoch [29/300], Step [160/225], Training Accuracy: 77.9883%, Training Loss: 0.5170%
Epoch [29/300], Step [161/225], Training Accuracy: 77.9988%, Training Loss: 0.5168%
Epoch [29/300], Step [162/225], Training Accuracy: 78.0285%, Training Loss: 0.5163%
Epoch [29/300], Step [163/225], Training Accuracy: 78.0483%, Training Loss: 0.5159%
Epoch [29/300], Step [164/225], Training Accuracy: 78.0488%, Training Loss: 0.5155%
Epoch [29/300], Step [165/225], Training Accuracy: 78.0114%, Training Loss: 

Epoch [30/300], Step [28/225], Training Accuracy: 79.6317%, Training Loss: 0.4771%
Epoch [30/300], Step [29/225], Training Accuracy: 79.7953%, Training Loss: 0.4740%
Epoch [30/300], Step [30/225], Training Accuracy: 79.7917%, Training Loss: 0.4754%
Epoch [30/300], Step [31/225], Training Accuracy: 79.6875%, Training Loss: 0.4790%
Epoch [30/300], Step [32/225], Training Accuracy: 79.4922%, Training Loss: 0.4810%
Epoch [30/300], Step [33/225], Training Accuracy: 79.4034%, Training Loss: 0.4858%
Epoch [30/300], Step [34/225], Training Accuracy: 79.2739%, Training Loss: 0.4938%
Epoch [30/300], Step [35/225], Training Accuracy: 79.2411%, Training Loss: 0.4948%
Epoch [30/300], Step [36/225], Training Accuracy: 79.4271%, Training Loss: 0.4908%
Epoch [30/300], Step [37/225], Training Accuracy: 79.3919%, Training Loss: 0.4893%
Epoch [30/300], Step [38/225], Training Accuracy: 79.4408%, Training Loss: 0.4883%
Epoch [30/300], Step [39/225], Training Accuracy: 79.2869%, Training Loss: 0.4905%
Epoc

Epoch [30/300], Step [127/225], Training Accuracy: 79.2077%, Training Loss: 0.4985%
Epoch [30/300], Step [128/225], Training Accuracy: 79.1992%, Training Loss: 0.4987%
Epoch [30/300], Step [129/225], Training Accuracy: 79.1182%, Training Loss: 0.4998%
Epoch [30/300], Step [130/225], Training Accuracy: 79.0986%, Training Loss: 0.5002%
Epoch [30/300], Step [131/225], Training Accuracy: 79.0792%, Training Loss: 0.5007%
Epoch [30/300], Step [132/225], Training Accuracy: 79.0246%, Training Loss: 0.5011%
Epoch [30/300], Step [133/225], Training Accuracy: 78.9944%, Training Loss: 0.5018%
Epoch [30/300], Step [134/225], Training Accuracy: 78.9995%, Training Loss: 0.5027%
Epoch [30/300], Step [135/225], Training Accuracy: 79.0162%, Training Loss: 0.5021%
Epoch [30/300], Step [136/225], Training Accuracy: 79.0211%, Training Loss: 0.5015%
Epoch [30/300], Step [137/225], Training Accuracy: 78.9462%, Training Loss: 0.5025%
Epoch [30/300], Step [138/225], Training Accuracy: 78.9742%, Training Loss: 

Epoch [30/300], Step [225/225], Training Accuracy: 79.4469%, Training Loss: 0.4911%
Epoch [31/300], Step [1/225], Training Accuracy: 82.8125%, Training Loss: 0.3733%
Epoch [31/300], Step [2/225], Training Accuracy: 80.4688%, Training Loss: 0.4747%
Epoch [31/300], Step [3/225], Training Accuracy: 80.7292%, Training Loss: 0.4705%
Epoch [31/300], Step [4/225], Training Accuracy: 79.2969%, Training Loss: 0.4727%
Epoch [31/300], Step [5/225], Training Accuracy: 78.7500%, Training Loss: 0.4914%
Epoch [31/300], Step [6/225], Training Accuracy: 79.9479%, Training Loss: 0.4870%
Epoch [31/300], Step [7/225], Training Accuracy: 79.9107%, Training Loss: 0.4832%
Epoch [31/300], Step [8/225], Training Accuracy: 80.0781%, Training Loss: 0.4826%
Epoch [31/300], Step [9/225], Training Accuracy: 79.8611%, Training Loss: 0.4882%
Epoch [31/300], Step [10/225], Training Accuracy: 80.1562%, Training Loss: 0.4922%
Epoch [31/300], Step [11/225], Training Accuracy: 80.3977%, Training Loss: 0.4841%
Epoch [31/30

Epoch [31/300], Step [99/225], Training Accuracy: 79.8453%, Training Loss: 0.4893%
Epoch [31/300], Step [100/225], Training Accuracy: 79.7969%, Training Loss: 0.4904%
Epoch [31/300], Step [101/225], Training Accuracy: 79.8113%, Training Loss: 0.4892%
Epoch [31/300], Step [102/225], Training Accuracy: 79.8407%, Training Loss: 0.4888%
Epoch [31/300], Step [103/225], Training Accuracy: 79.8392%, Training Loss: 0.4884%
Epoch [31/300], Step [104/225], Training Accuracy: 79.8227%, Training Loss: 0.4879%
Epoch [31/300], Step [105/225], Training Accuracy: 79.8214%, Training Loss: 0.4871%
Epoch [31/300], Step [106/225], Training Accuracy: 79.8939%, Training Loss: 0.4865%
Epoch [31/300], Step [107/225], Training Accuracy: 79.8189%, Training Loss: 0.4881%
Epoch [31/300], Step [108/225], Training Accuracy: 79.8032%, Training Loss: 0.4893%
Epoch [31/300], Step [109/225], Training Accuracy: 79.8165%, Training Loss: 0.4891%
Epoch [31/300], Step [110/225], Training Accuracy: 79.8153%, Training Loss: 0

Epoch [31/300], Step [198/225], Training Accuracy: 79.8848%, Training Loss: 0.4831%
Epoch [31/300], Step [199/225], Training Accuracy: 79.9152%, Training Loss: 0.4825%
Epoch [31/300], Step [200/225], Training Accuracy: 79.9141%, Training Loss: 0.4822%
Epoch [31/300], Step [201/225], Training Accuracy: 79.9285%, Training Loss: 0.4815%
Epoch [31/300], Step [202/225], Training Accuracy: 79.9582%, Training Loss: 0.4811%
Epoch [31/300], Step [203/225], Training Accuracy: 79.9492%, Training Loss: 0.4812%
Epoch [31/300], Step [204/225], Training Accuracy: 79.9326%, Training Loss: 0.4815%
Epoch [31/300], Step [205/225], Training Accuracy: 79.9619%, Training Loss: 0.4811%
Epoch [31/300], Step [206/225], Training Accuracy: 79.9606%, Training Loss: 0.4813%
Epoch [31/300], Step [207/225], Training Accuracy: 80.0121%, Training Loss: 0.4805%
Epoch [31/300], Step [208/225], Training Accuracy: 80.0180%, Training Loss: 0.4804%
Epoch [31/300], Step [209/225], Training Accuracy: 80.0314%, Training Loss: 

Epoch [32/300], Step [80/225], Training Accuracy: 80.3125%, Training Loss: 0.4862%
Epoch [32/300], Step [81/225], Training Accuracy: 80.3434%, Training Loss: 0.4854%
Epoch [32/300], Step [82/225], Training Accuracy: 80.3354%, Training Loss: 0.4851%
Epoch [32/300], Step [83/225], Training Accuracy: 80.2899%, Training Loss: 0.4850%
Epoch [32/300], Step [84/225], Training Accuracy: 80.3571%, Training Loss: 0.4831%
Epoch [32/300], Step [85/225], Training Accuracy: 80.3125%, Training Loss: 0.4832%
Epoch [32/300], Step [86/225], Training Accuracy: 80.3597%, Training Loss: 0.4819%
Epoch [32/300], Step [87/225], Training Accuracy: 80.3341%, Training Loss: 0.4834%
Epoch [32/300], Step [88/225], Training Accuracy: 80.2202%, Training Loss: 0.4845%
Epoch [32/300], Step [89/225], Training Accuracy: 80.2142%, Training Loss: 0.4859%
Epoch [32/300], Step [90/225], Training Accuracy: 80.2083%, Training Loss: 0.4860%
Epoch [32/300], Step [91/225], Training Accuracy: 80.1168%, Training Loss: 0.4866%
Epoc

Epoch [32/300], Step [178/225], Training Accuracy: 80.0650%, Training Loss: 0.4791%
Epoch [32/300], Step [179/225], Training Accuracy: 80.0541%, Training Loss: 0.4789%
Epoch [32/300], Step [180/225], Training Accuracy: 80.1042%, Training Loss: 0.4781%
Epoch [32/300], Step [181/225], Training Accuracy: 80.1105%, Training Loss: 0.4781%
Epoch [32/300], Step [182/225], Training Accuracy: 80.1425%, Training Loss: 0.4780%
Epoch [32/300], Step [183/225], Training Accuracy: 80.1998%, Training Loss: 0.4776%
Epoch [32/300], Step [184/225], Training Accuracy: 80.2395%, Training Loss: 0.4771%
Epoch [32/300], Step [185/225], Training Accuracy: 80.2534%, Training Loss: 0.4764%
Epoch [32/300], Step [186/225], Training Accuracy: 80.2839%, Training Loss: 0.4755%
Epoch [32/300], Step [187/225], Training Accuracy: 80.3058%, Training Loss: 0.4749%
Epoch [32/300], Step [188/225], Training Accuracy: 80.2942%, Training Loss: 0.4749%
Epoch [32/300], Step [189/225], Training Accuracy: 80.3241%, Training Loss: 

Epoch [33/300], Step [53/225], Training Accuracy: 81.0142%, Training Loss: 0.4625%
Epoch [33/300], Step [54/225], Training Accuracy: 80.9606%, Training Loss: 0.4640%
Epoch [33/300], Step [55/225], Training Accuracy: 81.0511%, Training Loss: 0.4627%
Epoch [33/300], Step [56/225], Training Accuracy: 81.1942%, Training Loss: 0.4603%
Epoch [33/300], Step [57/225], Training Accuracy: 81.1678%, Training Loss: 0.4603%
Epoch [33/300], Step [58/225], Training Accuracy: 81.1692%, Training Loss: 0.4602%
Epoch [33/300], Step [59/225], Training Accuracy: 81.1706%, Training Loss: 0.4598%
Epoch [33/300], Step [60/225], Training Accuracy: 81.1719%, Training Loss: 0.4588%
Epoch [33/300], Step [61/225], Training Accuracy: 81.2244%, Training Loss: 0.4583%
Epoch [33/300], Step [62/225], Training Accuracy: 81.2752%, Training Loss: 0.4560%
Epoch [33/300], Step [63/225], Training Accuracy: 81.3244%, Training Loss: 0.4540%
Epoch [33/300], Step [64/225], Training Accuracy: 81.1768%, Training Loss: 0.4554%
Epoc

Epoch [33/300], Step [156/225], Training Accuracy: 80.5188%, Training Loss: 0.4770%
Epoch [33/300], Step [157/225], Training Accuracy: 80.4837%, Training Loss: 0.4781%
Epoch [33/300], Step [158/225], Training Accuracy: 80.4490%, Training Loss: 0.4783%
Epoch [33/300], Step [159/225], Training Accuracy: 80.4442%, Training Loss: 0.4784%
Epoch [33/300], Step [160/225], Training Accuracy: 80.4492%, Training Loss: 0.4781%
Epoch [33/300], Step [161/225], Training Accuracy: 80.4445%, Training Loss: 0.4782%
Epoch [33/300], Step [162/225], Training Accuracy: 80.4784%, Training Loss: 0.4775%
Epoch [33/300], Step [163/225], Training Accuracy: 80.4544%, Training Loss: 0.4771%
Epoch [33/300], Step [164/225], Training Accuracy: 80.4783%, Training Loss: 0.4764%
Epoch [33/300], Step [165/225], Training Accuracy: 80.4830%, Training Loss: 0.4761%
Epoch [33/300], Step [166/225], Training Accuracy: 80.5064%, Training Loss: 0.4754%
Epoch [33/300], Step [167/225], Training Accuracy: 80.5109%, Training Loss: 

Epoch [34/300], Step [29/225], Training Accuracy: 82.0043%, Training Loss: 0.4432%
Epoch [34/300], Step [30/225], Training Accuracy: 81.7708%, Training Loss: 0.4471%
Epoch [34/300], Step [31/225], Training Accuracy: 81.6532%, Training Loss: 0.4521%
Epoch [34/300], Step [32/225], Training Accuracy: 81.5918%, Training Loss: 0.4535%
Epoch [34/300], Step [33/225], Training Accuracy: 81.5814%, Training Loss: 0.4533%
Epoch [34/300], Step [34/225], Training Accuracy: 81.2960%, Training Loss: 0.4567%
Epoch [34/300], Step [35/225], Training Accuracy: 81.2500%, Training Loss: 0.4597%
Epoch [34/300], Step [36/225], Training Accuracy: 81.2066%, Training Loss: 0.4600%
Epoch [34/300], Step [37/225], Training Accuracy: 81.2078%, Training Loss: 0.4602%
Epoch [34/300], Step [38/225], Training Accuracy: 81.2911%, Training Loss: 0.4586%
Epoch [34/300], Step [39/225], Training Accuracy: 81.2500%, Training Loss: 0.4631%
Epoch [34/300], Step [40/225], Training Accuracy: 81.2109%, Training Loss: 0.4643%
Epoc

Epoch [34/300], Step [128/225], Training Accuracy: 81.3721%, Training Loss: 0.4620%
Epoch [34/300], Step [129/225], Training Accuracy: 81.3469%, Training Loss: 0.4621%
Epoch [34/300], Step [130/225], Training Accuracy: 81.2981%, Training Loss: 0.4625%
Epoch [34/300], Step [131/225], Training Accuracy: 81.2739%, Training Loss: 0.4624%
Epoch [34/300], Step [132/225], Training Accuracy: 81.2737%, Training Loss: 0.4625%
Epoch [34/300], Step [133/225], Training Accuracy: 81.2617%, Training Loss: 0.4633%
Epoch [34/300], Step [134/225], Training Accuracy: 81.1217%, Training Loss: 0.4655%
Epoch [34/300], Step [135/225], Training Accuracy: 81.0995%, Training Loss: 0.4653%
Epoch [34/300], Step [136/225], Training Accuracy: 81.0662%, Training Loss: 0.4660%
Epoch [34/300], Step [137/225], Training Accuracy: 81.0561%, Training Loss: 0.4658%
Epoch [34/300], Step [138/225], Training Accuracy: 81.1028%, Training Loss: 0.4646%
Epoch [34/300], Step [139/225], Training Accuracy: 81.0926%, Training Loss: 

Epoch [35/300], Step [1/225], Training Accuracy: 84.3750%, Training Loss: 0.4041%
Epoch [35/300], Step [2/225], Training Accuracy: 83.5938%, Training Loss: 0.4310%
Epoch [35/300], Step [3/225], Training Accuracy: 82.2917%, Training Loss: 0.4125%
Epoch [35/300], Step [4/225], Training Accuracy: 83.2031%, Training Loss: 0.4070%
Epoch [35/300], Step [5/225], Training Accuracy: 83.1250%, Training Loss: 0.4233%
Epoch [35/300], Step [6/225], Training Accuracy: 84.3750%, Training Loss: 0.4066%
Epoch [35/300], Step [7/225], Training Accuracy: 84.1518%, Training Loss: 0.4120%
Epoch [35/300], Step [8/225], Training Accuracy: 82.6172%, Training Loss: 0.4301%
Epoch [35/300], Step [9/225], Training Accuracy: 82.6389%, Training Loss: 0.4366%
Epoch [35/300], Step [10/225], Training Accuracy: 81.8750%, Training Loss: 0.4542%
Epoch [35/300], Step [11/225], Training Accuracy: 81.6761%, Training Loss: 0.4561%
Epoch [35/300], Step [12/225], Training Accuracy: 81.5104%, Training Loss: 0.4525%
Epoch [35/300

Epoch [35/300], Step [100/225], Training Accuracy: 82.5469%, Training Loss: 0.4283%
Epoch [35/300], Step [101/225], Training Accuracy: 82.4876%, Training Loss: 0.4286%
Epoch [35/300], Step [102/225], Training Accuracy: 82.4755%, Training Loss: 0.4284%
Epoch [35/300], Step [103/225], Training Accuracy: 82.4636%, Training Loss: 0.4289%
Epoch [35/300], Step [104/225], Training Accuracy: 82.4669%, Training Loss: 0.4289%
Epoch [35/300], Step [105/225], Training Accuracy: 82.5446%, Training Loss: 0.4273%
Epoch [35/300], Step [106/225], Training Accuracy: 82.5619%, Training Loss: 0.4273%
Epoch [35/300], Step [107/225], Training Accuracy: 82.6373%, Training Loss: 0.4264%
Epoch [35/300], Step [108/225], Training Accuracy: 82.5810%, Training Loss: 0.4271%
Epoch [35/300], Step [109/225], Training Accuracy: 82.5258%, Training Loss: 0.4281%
Epoch [35/300], Step [110/225], Training Accuracy: 82.5994%, Training Loss: 0.4270%
Epoch [35/300], Step [111/225], Training Accuracy: 82.5310%, Training Loss: 

Epoch [35/300], Step [199/225], Training Accuracy: 82.2550%, Training Loss: 0.4354%
Epoch [35/300], Step [200/225], Training Accuracy: 82.2422%, Training Loss: 0.4360%
Epoch [35/300], Step [201/225], Training Accuracy: 82.2761%, Training Loss: 0.4355%
Epoch [35/300], Step [202/225], Training Accuracy: 82.2710%, Training Loss: 0.4352%
Epoch [35/300], Step [203/225], Training Accuracy: 82.2968%, Training Loss: 0.4349%
Epoch [35/300], Step [204/225], Training Accuracy: 82.2763%, Training Loss: 0.4351%
Epoch [35/300], Step [205/225], Training Accuracy: 82.3171%, Training Loss: 0.4344%
Epoch [35/300], Step [206/225], Training Accuracy: 82.3498%, Training Loss: 0.4336%
Epoch [35/300], Step [207/225], Training Accuracy: 82.3143%, Training Loss: 0.4347%
Epoch [35/300], Step [208/225], Training Accuracy: 82.3092%, Training Loss: 0.4347%
Epoch [35/300], Step [209/225], Training Accuracy: 82.2667%, Training Loss: 0.4356%
Epoch [35/300], Step [210/225], Training Accuracy: 82.2693%, Training Loss: 

Epoch [36/300], Step [73/225], Training Accuracy: 81.6353%, Training Loss: 0.4446%
Epoch [36/300], Step [74/225], Training Accuracy: 81.5878%, Training Loss: 0.4438%
Epoch [36/300], Step [75/225], Training Accuracy: 81.6458%, Training Loss: 0.4424%
Epoch [36/300], Step [76/225], Training Accuracy: 81.5995%, Training Loss: 0.4429%
Epoch [36/300], Step [77/225], Training Accuracy: 81.5544%, Training Loss: 0.4454%
Epoch [36/300], Step [78/225], Training Accuracy: 81.5104%, Training Loss: 0.4455%
Epoch [36/300], Step [79/225], Training Accuracy: 81.5269%, Training Loss: 0.4453%
Epoch [36/300], Step [80/225], Training Accuracy: 81.4844%, Training Loss: 0.4457%
Epoch [36/300], Step [81/225], Training Accuracy: 81.5008%, Training Loss: 0.4451%
Epoch [36/300], Step [82/225], Training Accuracy: 81.4977%, Training Loss: 0.4452%
Epoch [36/300], Step [83/225], Training Accuracy: 81.5324%, Training Loss: 0.4444%
Epoch [36/300], Step [84/225], Training Accuracy: 81.6034%, Training Loss: 0.4426%
Epoc

Epoch [36/300], Step [172/225], Training Accuracy: 81.4135%, Training Loss: 0.4535%
Epoch [36/300], Step [173/225], Training Accuracy: 81.4216%, Training Loss: 0.4542%
Epoch [36/300], Step [174/225], Training Accuracy: 81.4655%, Training Loss: 0.4538%
Epoch [36/300], Step [175/225], Training Accuracy: 81.4554%, Training Loss: 0.4537%
Epoch [36/300], Step [176/225], Training Accuracy: 81.4808%, Training Loss: 0.4528%
Epoch [36/300], Step [177/225], Training Accuracy: 81.5501%, Training Loss: 0.4514%
Epoch [36/300], Step [178/225], Training Accuracy: 81.5572%, Training Loss: 0.4511%
Epoch [36/300], Step [179/225], Training Accuracy: 81.5817%, Training Loss: 0.4507%
Epoch [36/300], Step [180/225], Training Accuracy: 81.5885%, Training Loss: 0.4515%
Epoch [36/300], Step [181/225], Training Accuracy: 81.6126%, Training Loss: 0.4512%
Epoch [36/300], Step [182/225], Training Accuracy: 81.6192%, Training Loss: 0.4506%
Epoch [36/300], Step [183/225], Training Accuracy: 81.6257%, Training Loss: 

Epoch [37/300], Step [54/225], Training Accuracy: 82.2917%, Training Loss: 0.4374%
Epoch [37/300], Step [55/225], Training Accuracy: 82.2159%, Training Loss: 0.4389%
Epoch [37/300], Step [56/225], Training Accuracy: 82.2545%, Training Loss: 0.4391%
Epoch [37/300], Step [57/225], Training Accuracy: 82.2094%, Training Loss: 0.4389%
Epoch [37/300], Step [58/225], Training Accuracy: 82.1121%, Training Loss: 0.4403%
Epoch [37/300], Step [59/225], Training Accuracy: 81.8856%, Training Loss: 0.4423%
Epoch [37/300], Step [60/225], Training Accuracy: 81.8229%, Training Loss: 0.4437%
Epoch [37/300], Step [61/225], Training Accuracy: 81.7111%, Training Loss: 0.4453%
Epoch [37/300], Step [62/225], Training Accuracy: 81.8044%, Training Loss: 0.4421%
Epoch [37/300], Step [63/225], Training Accuracy: 81.8948%, Training Loss: 0.4428%
Epoch [37/300], Step [64/225], Training Accuracy: 81.9336%, Training Loss: 0.4423%
Epoch [37/300], Step [65/225], Training Accuracy: 81.9471%, Training Loss: 0.4427%
Epoc

Epoch [37/300], Step [153/225], Training Accuracy: 82.4551%, Training Loss: 0.4289%
Epoch [37/300], Step [154/225], Training Accuracy: 82.4574%, Training Loss: 0.4286%
Epoch [37/300], Step [155/225], Training Accuracy: 82.3992%, Training Loss: 0.4296%
Epoch [37/300], Step [156/225], Training Accuracy: 82.4018%, Training Loss: 0.4303%
Epoch [37/300], Step [157/225], Training Accuracy: 82.3746%, Training Loss: 0.4307%
Epoch [37/300], Step [158/225], Training Accuracy: 82.3477%, Training Loss: 0.4322%
Epoch [37/300], Step [159/225], Training Accuracy: 82.3211%, Training Loss: 0.4325%
Epoch [37/300], Step [160/225], Training Accuracy: 82.3145%, Training Loss: 0.4327%
Epoch [37/300], Step [161/225], Training Accuracy: 82.3467%, Training Loss: 0.4326%
Epoch [37/300], Step [162/225], Training Accuracy: 82.3592%, Training Loss: 0.4323%
Epoch [37/300], Step [163/225], Training Accuracy: 82.3332%, Training Loss: 0.4324%
Epoch [37/300], Step [164/225], Training Accuracy: 82.3742%, Training Loss: 

Epoch [38/300], Step [27/225], Training Accuracy: 82.9282%, Training Loss: 0.4200%
Epoch [38/300], Step [28/225], Training Accuracy: 83.1473%, Training Loss: 0.4164%
Epoch [38/300], Step [29/225], Training Accuracy: 83.3513%, Training Loss: 0.4113%
Epoch [38/300], Step [30/225], Training Accuracy: 83.4896%, Training Loss: 0.4087%
Epoch [38/300], Step [31/225], Training Accuracy: 83.3669%, Training Loss: 0.4123%
Epoch [38/300], Step [32/225], Training Accuracy: 83.3984%, Training Loss: 0.4140%
Epoch [38/300], Step [33/225], Training Accuracy: 83.4754%, Training Loss: 0.4115%
Epoch [38/300], Step [34/225], Training Accuracy: 83.1801%, Training Loss: 0.4167%
Epoch [38/300], Step [35/225], Training Accuracy: 83.3036%, Training Loss: 0.4135%
Epoch [38/300], Step [36/225], Training Accuracy: 83.3333%, Training Loss: 0.4130%
Epoch [38/300], Step [37/225], Training Accuracy: 83.4459%, Training Loss: 0.4094%
Epoch [38/300], Step [38/225], Training Accuracy: 83.3059%, Training Loss: 0.4110%
Epoc

Epoch [38/300], Step [126/225], Training Accuracy: 81.8824%, Training Loss: 0.4442%
Epoch [38/300], Step [127/225], Training Accuracy: 81.9144%, Training Loss: 0.4432%
Epoch [38/300], Step [128/225], Training Accuracy: 81.9580%, Training Loss: 0.4424%
Epoch [38/300], Step [129/225], Training Accuracy: 81.9404%, Training Loss: 0.4421%
Epoch [38/300], Step [130/225], Training Accuracy: 81.9471%, Training Loss: 0.4417%
Epoch [38/300], Step [131/225], Training Accuracy: 81.8822%, Training Loss: 0.4428%
Epoch [38/300], Step [132/225], Training Accuracy: 81.8537%, Training Loss: 0.4456%
Epoch [38/300], Step [133/225], Training Accuracy: 81.8257%, Training Loss: 0.4463%
Epoch [38/300], Step [134/225], Training Accuracy: 81.7980%, Training Loss: 0.4473%
Epoch [38/300], Step [135/225], Training Accuracy: 81.8056%, Training Loss: 0.4465%
Epoch [38/300], Step [136/225], Training Accuracy: 81.7900%, Training Loss: 0.4462%
Epoch [38/300], Step [137/225], Training Accuracy: 81.7974%, Training Loss: 

Epoch [38/300], Step [225/225], Training Accuracy: 82.5528%, Training Loss: 0.4269%
Epoch [39/300], Step [1/225], Training Accuracy: 81.2500%, Training Loss: 0.4503%
Epoch [39/300], Step [2/225], Training Accuracy: 82.0312%, Training Loss: 0.3878%
Epoch [39/300], Step [3/225], Training Accuracy: 84.3750%, Training Loss: 0.3542%
Epoch [39/300], Step [4/225], Training Accuracy: 84.3750%, Training Loss: 0.3582%
Epoch [39/300], Step [5/225], Training Accuracy: 84.0625%, Training Loss: 0.3534%
Epoch [39/300], Step [6/225], Training Accuracy: 85.1562%, Training Loss: 0.3436%
Epoch [39/300], Step [7/225], Training Accuracy: 85.9375%, Training Loss: 0.3396%
Epoch [39/300], Step [8/225], Training Accuracy: 85.9375%, Training Loss: 0.3361%
Epoch [39/300], Step [9/225], Training Accuracy: 85.4167%, Training Loss: 0.3437%
Epoch [39/300], Step [10/225], Training Accuracy: 84.6875%, Training Loss: 0.3679%
Epoch [39/300], Step [11/225], Training Accuracy: 84.3750%, Training Loss: 0.3743%
Epoch [39/30

Epoch [39/300], Step [99/225], Training Accuracy: 83.0966%, Training Loss: 0.4142%
Epoch [39/300], Step [100/225], Training Accuracy: 83.0781%, Training Loss: 0.4154%
Epoch [39/300], Step [101/225], Training Accuracy: 83.0755%, Training Loss: 0.4156%
Epoch [39/300], Step [102/225], Training Accuracy: 83.0423%, Training Loss: 0.4177%
Epoch [39/300], Step [103/225], Training Accuracy: 83.1311%, Training Loss: 0.4161%
Epoch [39/300], Step [104/225], Training Accuracy: 82.9928%, Training Loss: 0.4179%
Epoch [39/300], Step [105/225], Training Accuracy: 83.0208%, Training Loss: 0.4175%
Epoch [39/300], Step [106/225], Training Accuracy: 83.0631%, Training Loss: 0.4169%
Epoch [39/300], Step [107/225], Training Accuracy: 83.0169%, Training Loss: 0.4181%
Epoch [39/300], Step [108/225], Training Accuracy: 82.9282%, Training Loss: 0.4194%
Epoch [39/300], Step [109/225], Training Accuracy: 82.8698%, Training Loss: 0.4197%
Epoch [39/300], Step [110/225], Training Accuracy: 82.8977%, Training Loss: 0

Epoch [39/300], Step [198/225], Training Accuracy: 82.9624%, Training Loss: 0.4131%
Epoch [39/300], Step [199/225], Training Accuracy: 82.9852%, Training Loss: 0.4125%
Epoch [39/300], Step [200/225], Training Accuracy: 83.0078%, Training Loss: 0.4118%
Epoch [39/300], Step [201/225], Training Accuracy: 83.0068%, Training Loss: 0.4117%
Epoch [39/300], Step [202/225], Training Accuracy: 83.0213%, Training Loss: 0.4116%
Epoch [39/300], Step [203/225], Training Accuracy: 83.0588%, Training Loss: 0.4112%
Epoch [39/300], Step [204/225], Training Accuracy: 83.0806%, Training Loss: 0.4107%
Epoch [39/300], Step [205/225], Training Accuracy: 83.0945%, Training Loss: 0.4104%
Epoch [39/300], Step [206/225], Training Accuracy: 83.0400%, Training Loss: 0.4116%
Epoch [39/300], Step [207/225], Training Accuracy: 83.0163%, Training Loss: 0.4124%
Epoch [39/300], Step [208/225], Training Accuracy: 83.0003%, Training Loss: 0.4124%
Epoch [39/300], Step [209/225], Training Accuracy: 82.9994%, Training Loss: 

Epoch [40/300], Step [72/225], Training Accuracy: 83.8976%, Training Loss: 0.4038%
Epoch [40/300], Step [73/225], Training Accuracy: 83.9683%, Training Loss: 0.4019%
Epoch [40/300], Step [74/225], Training Accuracy: 83.9738%, Training Loss: 0.4015%
Epoch [40/300], Step [75/225], Training Accuracy: 84.0208%, Training Loss: 0.4002%
Epoch [40/300], Step [76/225], Training Accuracy: 83.9433%, Training Loss: 0.4015%
Epoch [40/300], Step [77/225], Training Accuracy: 83.8880%, Training Loss: 0.4017%
Epoch [40/300], Step [78/225], Training Accuracy: 83.8542%, Training Loss: 0.4011%
Epoch [40/300], Step [79/225], Training Accuracy: 83.9003%, Training Loss: 0.3999%
Epoch [40/300], Step [80/225], Training Accuracy: 83.8672%, Training Loss: 0.4003%
Epoch [40/300], Step [81/225], Training Accuracy: 83.9120%, Training Loss: 0.3989%
Epoch [40/300], Step [82/225], Training Accuracy: 83.9558%, Training Loss: 0.3978%
Epoch [40/300], Step [83/225], Training Accuracy: 83.9608%, Training Loss: 0.3968%
Epoc

Epoch [40/300], Step [171/225], Training Accuracy: 83.9547%, Training Loss: 0.4002%
Epoch [40/300], Step [172/225], Training Accuracy: 83.9390%, Training Loss: 0.4000%
Epoch [40/300], Step [173/225], Training Accuracy: 83.9505%, Training Loss: 0.3996%
Epoch [40/300], Step [174/225], Training Accuracy: 84.0068%, Training Loss: 0.3987%
Epoch [40/300], Step [175/225], Training Accuracy: 84.0179%, Training Loss: 0.3986%
Epoch [40/300], Step [176/225], Training Accuracy: 84.0288%, Training Loss: 0.3986%
Epoch [40/300], Step [177/225], Training Accuracy: 84.0307%, Training Loss: 0.3984%
Epoch [40/300], Step [178/225], Training Accuracy: 84.0327%, Training Loss: 0.3978%
Epoch [40/300], Step [179/225], Training Accuracy: 84.0433%, Training Loss: 0.3972%
Epoch [40/300], Step [180/225], Training Accuracy: 84.0712%, Training Loss: 0.3972%
Epoch [40/300], Step [181/225], Training Accuracy: 84.0642%, Training Loss: 0.3974%
Epoch [40/300], Step [182/225], Training Accuracy: 84.1003%, Training Loss: 

Epoch [41/300], Step [45/225], Training Accuracy: 82.7083%, Training Loss: 0.4344%
Epoch [41/300], Step [46/225], Training Accuracy: 82.7785%, Training Loss: 0.4310%
Epoch [41/300], Step [47/225], Training Accuracy: 82.7128%, Training Loss: 0.4304%
Epoch [41/300], Step [48/225], Training Accuracy: 82.5521%, Training Loss: 0.4326%
Epoch [41/300], Step [49/225], Training Accuracy: 82.5893%, Training Loss: 0.4315%
Epoch [41/300], Step [50/225], Training Accuracy: 82.5000%, Training Loss: 0.4339%
Epoch [41/300], Step [51/225], Training Accuracy: 82.5061%, Training Loss: 0.4309%
Epoch [41/300], Step [52/225], Training Accuracy: 82.6923%, Training Loss: 0.4281%
Epoch [41/300], Step [53/225], Training Accuracy: 82.7830%, Training Loss: 0.4271%
Epoch [41/300], Step [54/225], Training Accuracy: 82.7836%, Training Loss: 0.4284%
Epoch [41/300], Step [55/225], Training Accuracy: 82.6420%, Training Loss: 0.4307%
Epoch [41/300], Step [56/225], Training Accuracy: 82.7009%, Training Loss: 0.4292%
Epoc

Epoch [41/300], Step [144/225], Training Accuracy: 82.9210%, Training Loss: 0.4168%
Epoch [41/300], Step [145/225], Training Accuracy: 82.9095%, Training Loss: 0.4164%
Epoch [41/300], Step [146/225], Training Accuracy: 82.8874%, Training Loss: 0.4167%
Epoch [41/300], Step [147/225], Training Accuracy: 82.9507%, Training Loss: 0.4157%
Epoch [41/300], Step [148/225], Training Accuracy: 83.0025%, Training Loss: 0.4144%
Epoch [41/300], Step [149/225], Training Accuracy: 82.9279%, Training Loss: 0.4152%
Epoch [41/300], Step [150/225], Training Accuracy: 82.9792%, Training Loss: 0.4149%
Epoch [41/300], Step [151/225], Training Accuracy: 83.0195%, Training Loss: 0.4136%
Epoch [41/300], Step [152/225], Training Accuracy: 83.0284%, Training Loss: 0.4138%
Epoch [41/300], Step [153/225], Training Accuracy: 83.0678%, Training Loss: 0.4136%
Epoch [41/300], Step [154/225], Training Accuracy: 83.0357%, Training Loss: 0.4155%
Epoch [41/300], Step [155/225], Training Accuracy: 83.0444%, Training Loss: 

Epoch [42/300], Step [18/225], Training Accuracy: 87.3264%, Training Loss: 0.3515%
Epoch [42/300], Step [19/225], Training Accuracy: 87.4178%, Training Loss: 0.3484%
Epoch [42/300], Step [20/225], Training Accuracy: 87.3438%, Training Loss: 0.3522%
Epoch [42/300], Step [21/225], Training Accuracy: 87.4256%, Training Loss: 0.3478%
Epoch [42/300], Step [22/225], Training Accuracy: 87.0739%, Training Loss: 0.3561%
Epoch [42/300], Step [23/225], Training Accuracy: 87.2962%, Training Loss: 0.3545%
Epoch [42/300], Step [24/225], Training Accuracy: 87.3698%, Training Loss: 0.3602%
Epoch [42/300], Step [25/225], Training Accuracy: 87.5000%, Training Loss: 0.3534%
Epoch [42/300], Step [26/225], Training Accuracy: 87.3197%, Training Loss: 0.3565%
Epoch [42/300], Step [27/225], Training Accuracy: 87.2685%, Training Loss: 0.3573%
Epoch [42/300], Step [28/225], Training Accuracy: 87.1652%, Training Loss: 0.3596%
Epoch [42/300], Step [29/225], Training Accuracy: 87.1228%, Training Loss: 0.3587%
Epoc

Epoch [42/300], Step [117/225], Training Accuracy: 85.4701%, Training Loss: 0.3764%
Epoch [42/300], Step [118/225], Training Accuracy: 85.4873%, Training Loss: 0.3768%
Epoch [42/300], Step [119/225], Training Accuracy: 85.4779%, Training Loss: 0.3762%
Epoch [42/300], Step [120/225], Training Accuracy: 85.4427%, Training Loss: 0.3760%
Epoch [42/300], Step [121/225], Training Accuracy: 85.4210%, Training Loss: 0.3773%
Epoch [42/300], Step [122/225], Training Accuracy: 85.3996%, Training Loss: 0.3781%
Epoch [42/300], Step [123/225], Training Accuracy: 85.4167%, Training Loss: 0.3779%
Epoch [42/300], Step [124/225], Training Accuracy: 85.4209%, Training Loss: 0.3777%
Epoch [42/300], Step [125/225], Training Accuracy: 85.4125%, Training Loss: 0.3789%
Epoch [42/300], Step [126/225], Training Accuracy: 85.3547%, Training Loss: 0.3789%
Epoch [42/300], Step [127/225], Training Accuracy: 85.3100%, Training Loss: 0.3795%
Epoch [42/300], Step [128/225], Training Accuracy: 85.3027%, Training Loss: 

Epoch [42/300], Step [216/225], Training Accuracy: 85.0984%, Training Loss: 0.3826%
Epoch [42/300], Step [217/225], Training Accuracy: 85.1022%, Training Loss: 0.3820%
Epoch [42/300], Step [218/225], Training Accuracy: 85.0989%, Training Loss: 0.3822%
Epoch [42/300], Step [219/225], Training Accuracy: 85.1027%, Training Loss: 0.3825%
Epoch [42/300], Step [220/225], Training Accuracy: 85.1420%, Training Loss: 0.3817%
Epoch [42/300], Step [221/225], Training Accuracy: 85.1669%, Training Loss: 0.3810%
Epoch [42/300], Step [222/225], Training Accuracy: 85.1492%, Training Loss: 0.3809%
Epoch [42/300], Step [223/225], Training Accuracy: 85.1247%, Training Loss: 0.3806%
Epoch [42/300], Step [224/225], Training Accuracy: 85.1214%, Training Loss: 0.3805%
Epoch [42/300], Step [225/225], Training Accuracy: 85.1306%, Training Loss: 0.3799%
Epoch [43/300], Step [1/225], Training Accuracy: 75.0000%, Training Loss: 0.6372%
Epoch [43/300], Step [2/225], Training Accuracy: 78.9062%, Training Loss: 0.51

Epoch [43/300], Step [98/225], Training Accuracy: 84.2793%, Training Loss: 0.3985%
Epoch [43/300], Step [99/225], Training Accuracy: 84.2961%, Training Loss: 0.3990%
Epoch [43/300], Step [100/225], Training Accuracy: 84.1719%, Training Loss: 0.4012%
Epoch [43/300], Step [101/225], Training Accuracy: 84.1894%, Training Loss: 0.4004%
Epoch [43/300], Step [102/225], Training Accuracy: 84.2218%, Training Loss: 0.4006%
Epoch [43/300], Step [103/225], Training Accuracy: 84.2840%, Training Loss: 0.3988%
Epoch [43/300], Step [104/225], Training Accuracy: 84.1797%, Training Loss: 0.4003%
Epoch [43/300], Step [105/225], Training Accuracy: 84.2113%, Training Loss: 0.3998%
Epoch [43/300], Step [106/225], Training Accuracy: 84.1834%, Training Loss: 0.4002%
Epoch [43/300], Step [107/225], Training Accuracy: 84.1852%, Training Loss: 0.4003%
Epoch [43/300], Step [108/225], Training Accuracy: 84.2159%, Training Loss: 0.4000%
Epoch [43/300], Step [109/225], Training Accuracy: 84.1743%, Training Loss: 0.

Epoch [43/300], Step [197/225], Training Accuracy: 84.3591%, Training Loss: 0.3935%
Epoch [43/300], Step [198/225], Training Accuracy: 84.3513%, Training Loss: 0.3937%
Epoch [43/300], Step [199/225], Training Accuracy: 84.3436%, Training Loss: 0.3934%
Epoch [43/300], Step [200/225], Training Accuracy: 84.3359%, Training Loss: 0.3935%
Epoch [43/300], Step [201/225], Training Accuracy: 84.3439%, Training Loss: 0.3935%
Epoch [43/300], Step [202/225], Training Accuracy: 84.3827%, Training Loss: 0.3926%
Epoch [43/300], Step [203/225], Training Accuracy: 84.4212%, Training Loss: 0.3922%
Epoch [43/300], Step [204/225], Training Accuracy: 84.4669%, Training Loss: 0.3913%
Epoch [43/300], Step [205/225], Training Accuracy: 84.4741%, Training Loss: 0.3912%
Epoch [43/300], Step [206/225], Training Accuracy: 84.4812%, Training Loss: 0.3906%
Epoch [43/300], Step [207/225], Training Accuracy: 84.4807%, Training Loss: 0.3908%
Epoch [43/300], Step [208/225], Training Accuracy: 84.4802%, Training Loss: 

Epoch [44/300], Step [71/225], Training Accuracy: 85.3213%, Training Loss: 0.3750%
Epoch [44/300], Step [72/225], Training Accuracy: 85.3299%, Training Loss: 0.3733%
Epoch [44/300], Step [73/225], Training Accuracy: 85.2740%, Training Loss: 0.3756%
Epoch [44/300], Step [74/225], Training Accuracy: 85.2407%, Training Loss: 0.3758%
Epoch [44/300], Step [75/225], Training Accuracy: 85.2292%, Training Loss: 0.3751%
Epoch [44/300], Step [76/225], Training Accuracy: 85.1974%, Training Loss: 0.3758%
Epoch [44/300], Step [77/225], Training Accuracy: 85.2273%, Training Loss: 0.3749%
Epoch [44/300], Step [78/225], Training Accuracy: 85.2364%, Training Loss: 0.3755%
Epoch [44/300], Step [79/225], Training Accuracy: 85.2255%, Training Loss: 0.3759%
Epoch [44/300], Step [80/225], Training Accuracy: 85.1562%, Training Loss: 0.3769%
Epoch [44/300], Step [81/225], Training Accuracy: 85.1852%, Training Loss: 0.3760%
Epoch [44/300], Step [82/225], Training Accuracy: 85.2325%, Training Loss: 0.3746%
Epoc

Epoch [44/300], Step [170/225], Training Accuracy: 84.5221%, Training Loss: 0.3859%
Epoch [44/300], Step [171/225], Training Accuracy: 84.5029%, Training Loss: 0.3860%
Epoch [44/300], Step [172/225], Training Accuracy: 84.5022%, Training Loss: 0.3868%
Epoch [44/300], Step [173/225], Training Accuracy: 84.5014%, Training Loss: 0.3874%
Epoch [44/300], Step [174/225], Training Accuracy: 84.5456%, Training Loss: 0.3871%
Epoch [44/300], Step [175/225], Training Accuracy: 84.5625%, Training Loss: 0.3869%
Epoch [44/300], Step [176/225], Training Accuracy: 84.5526%, Training Loss: 0.3863%
Epoch [44/300], Step [177/225], Training Accuracy: 84.5692%, Training Loss: 0.3855%
Epoch [44/300], Step [178/225], Training Accuracy: 84.5593%, Training Loss: 0.3855%
Epoch [44/300], Step [179/225], Training Accuracy: 84.5670%, Training Loss: 0.3850%
Epoch [44/300], Step [180/225], Training Accuracy: 84.5660%, Training Loss: 0.3853%
Epoch [44/300], Step [181/225], Training Accuracy: 84.5477%, Training Loss: 

Epoch [45/300], Step [44/225], Training Accuracy: 84.7301%, Training Loss: 0.3886%
Epoch [45/300], Step [45/225], Training Accuracy: 84.6875%, Training Loss: 0.3877%
Epoch [45/300], Step [46/225], Training Accuracy: 84.7826%, Training Loss: 0.3842%
Epoch [45/300], Step [47/225], Training Accuracy: 84.8072%, Training Loss: 0.3829%
Epoch [45/300], Step [48/225], Training Accuracy: 84.5378%, Training Loss: 0.3884%
Epoch [45/300], Step [49/225], Training Accuracy: 84.6620%, Training Loss: 0.3862%
Epoch [45/300], Step [50/225], Training Accuracy: 84.5625%, Training Loss: 0.3865%
Epoch [45/300], Step [51/225], Training Accuracy: 84.6201%, Training Loss: 0.3855%
Epoch [45/300], Step [52/225], Training Accuracy: 84.7356%, Training Loss: 0.3834%
Epoch [45/300], Step [53/225], Training Accuracy: 84.9057%, Training Loss: 0.3801%
Epoch [45/300], Step [54/225], Training Accuracy: 84.8958%, Training Loss: 0.3796%
Epoch [45/300], Step [55/225], Training Accuracy: 84.8295%, Training Loss: 0.3825%
Epoc

Epoch [45/300], Step [143/225], Training Accuracy: 83.9270%, Training Loss: 0.4158%
Epoch [45/300], Step [144/225], Training Accuracy: 83.9193%, Training Loss: 0.4158%
Epoch [45/300], Step [145/225], Training Accuracy: 83.8901%, Training Loss: 0.4165%
Epoch [45/300], Step [146/225], Training Accuracy: 83.9148%, Training Loss: 0.4156%
Epoch [45/300], Step [147/225], Training Accuracy: 83.9605%, Training Loss: 0.4148%
Epoch [45/300], Step [148/225], Training Accuracy: 83.9949%, Training Loss: 0.4147%
Epoch [45/300], Step [149/225], Training Accuracy: 83.9765%, Training Loss: 0.4146%
Epoch [45/300], Step [150/225], Training Accuracy: 83.9583%, Training Loss: 0.4145%
Epoch [45/300], Step [151/225], Training Accuracy: 83.9921%, Training Loss: 0.4139%
Epoch [45/300], Step [152/225], Training Accuracy: 84.0255%, Training Loss: 0.4128%
Epoch [45/300], Step [153/225], Training Accuracy: 83.9869%, Training Loss: 0.4130%
Epoch [45/300], Step [154/225], Training Accuracy: 84.0199%, Training Loss: 

Epoch [46/300], Step [17/225], Training Accuracy: 84.8346%, Training Loss: 0.3730%
Epoch [46/300], Step [18/225], Training Accuracy: 84.4618%, Training Loss: 0.3820%
Epoch [46/300], Step [19/225], Training Accuracy: 84.3750%, Training Loss: 0.3858%
Epoch [46/300], Step [20/225], Training Accuracy: 84.8438%, Training Loss: 0.3789%
Epoch [46/300], Step [21/225], Training Accuracy: 85.3423%, Training Loss: 0.3690%
Epoch [46/300], Step [22/225], Training Accuracy: 84.9432%, Training Loss: 0.3699%
Epoch [46/300], Step [23/225], Training Accuracy: 84.9864%, Training Loss: 0.3669%
Epoch [46/300], Step [24/225], Training Accuracy: 84.8307%, Training Loss: 0.3647%
Epoch [46/300], Step [25/225], Training Accuracy: 84.9375%, Training Loss: 0.3663%
Epoch [46/300], Step [26/225], Training Accuracy: 84.9159%, Training Loss: 0.3665%
Epoch [46/300], Step [27/225], Training Accuracy: 84.9537%, Training Loss: 0.3647%
Epoch [46/300], Step [28/225], Training Accuracy: 84.9888%, Training Loss: 0.3621%
Epoc

Epoch [46/300], Step [116/225], Training Accuracy: 84.7656%, Training Loss: 0.3796%
Epoch [46/300], Step [117/225], Training Accuracy: 84.6554%, Training Loss: 0.3823%
Epoch [46/300], Step [118/225], Training Accuracy: 84.6796%, Training Loss: 0.3821%
Epoch [46/300], Step [119/225], Training Accuracy: 84.6901%, Training Loss: 0.3817%
Epoch [46/300], Step [120/225], Training Accuracy: 84.6875%, Training Loss: 0.3818%
Epoch [46/300], Step [121/225], Training Accuracy: 84.6333%, Training Loss: 0.3832%
Epoch [46/300], Step [122/225], Training Accuracy: 84.6440%, Training Loss: 0.3830%
Epoch [46/300], Step [123/225], Training Accuracy: 84.6672%, Training Loss: 0.3831%
Epoch [46/300], Step [124/225], Training Accuracy: 84.6900%, Training Loss: 0.3822%
Epoch [46/300], Step [125/225], Training Accuracy: 84.6750%, Training Loss: 0.3823%
Epoch [46/300], Step [126/225], Training Accuracy: 84.5734%, Training Loss: 0.3842%
Epoch [46/300], Step [127/225], Training Accuracy: 84.5472%, Training Loss: 

Epoch [46/300], Step [215/225], Training Accuracy: 84.8038%, Training Loss: 0.3802%
Epoch [46/300], Step [216/225], Training Accuracy: 84.8452%, Training Loss: 0.3796%
Epoch [46/300], Step [217/225], Training Accuracy: 84.8358%, Training Loss: 0.3794%
Epoch [46/300], Step [218/225], Training Accuracy: 84.8337%, Training Loss: 0.3795%
Epoch [46/300], Step [219/225], Training Accuracy: 84.8602%, Training Loss: 0.3791%
Epoch [46/300], Step [220/225], Training Accuracy: 84.8651%, Training Loss: 0.3795%
Epoch [46/300], Step [221/225], Training Accuracy: 84.8840%, Training Loss: 0.3792%
Epoch [46/300], Step [222/225], Training Accuracy: 84.9099%, Training Loss: 0.3791%
Epoch [46/300], Step [223/225], Training Accuracy: 84.8655%, Training Loss: 0.3800%
Epoch [46/300], Step [224/225], Training Accuracy: 84.8703%, Training Loss: 0.3799%
Epoch [46/300], Step [225/225], Training Accuracy: 84.8874%, Training Loss: 0.3799%
Epoch [47/300], Step [1/225], Training Accuracy: 75.0000%, Training Loss: 0.

Epoch [47/300], Step [89/225], Training Accuracy: 85.6917%, Training Loss: 0.3669%
Epoch [47/300], Step [90/225], Training Accuracy: 85.5729%, Training Loss: 0.3693%
Epoch [47/300], Step [91/225], Training Accuracy: 85.5941%, Training Loss: 0.3684%
Epoch [47/300], Step [92/225], Training Accuracy: 85.5808%, Training Loss: 0.3687%
Epoch [47/300], Step [93/225], Training Accuracy: 85.6519%, Training Loss: 0.3676%
Epoch [47/300], Step [94/225], Training Accuracy: 85.6549%, Training Loss: 0.3672%
Epoch [47/300], Step [95/225], Training Accuracy: 85.6743%, Training Loss: 0.3664%
Epoch [47/300], Step [96/225], Training Accuracy: 85.6934%, Training Loss: 0.3647%
Epoch [47/300], Step [97/225], Training Accuracy: 85.7603%, Training Loss: 0.3640%
Epoch [47/300], Step [98/225], Training Accuracy: 85.7621%, Training Loss: 0.3639%
Epoch [47/300], Step [99/225], Training Accuracy: 85.7323%, Training Loss: 0.3654%
Epoch [47/300], Step [100/225], Training Accuracy: 85.6562%, Training Loss: 0.3666%
Epo

Epoch [47/300], Step [188/225], Training Accuracy: 85.2975%, Training Loss: 0.3723%
Epoch [47/300], Step [189/225], Training Accuracy: 85.3257%, Training Loss: 0.3717%
Epoch [47/300], Step [190/225], Training Accuracy: 85.3207%, Training Loss: 0.3716%
Epoch [47/300], Step [191/225], Training Accuracy: 85.3485%, Training Loss: 0.3713%
Epoch [47/300], Step [192/225], Training Accuracy: 85.3678%, Training Loss: 0.3708%
Epoch [47/300], Step [193/225], Training Accuracy: 85.3546%, Training Loss: 0.3716%
Epoch [47/300], Step [194/225], Training Accuracy: 85.3576%, Training Loss: 0.3718%
Epoch [47/300], Step [195/225], Training Accuracy: 85.3686%, Training Loss: 0.3712%
Epoch [47/300], Step [196/225], Training Accuracy: 85.3555%, Training Loss: 0.3717%
Epoch [47/300], Step [197/225], Training Accuracy: 85.3585%, Training Loss: 0.3720%
Epoch [47/300], Step [198/225], Training Accuracy: 85.3851%, Training Loss: 0.3717%
Epoch [47/300], Step [199/225], Training Accuracy: 85.4036%, Training Loss: 

Epoch [48/300], Step [62/225], Training Accuracy: 85.0050%, Training Loss: 0.3608%
Epoch [48/300], Step [63/225], Training Accuracy: 84.9206%, Training Loss: 0.3627%
Epoch [48/300], Step [64/225], Training Accuracy: 84.9365%, Training Loss: 0.3619%
Epoch [48/300], Step [65/225], Training Accuracy: 84.8798%, Training Loss: 0.3643%
Epoch [48/300], Step [66/225], Training Accuracy: 84.8722%, Training Loss: 0.3655%
Epoch [48/300], Step [67/225], Training Accuracy: 84.9114%, Training Loss: 0.3654%
Epoch [48/300], Step [68/225], Training Accuracy: 84.7886%, Training Loss: 0.3671%
Epoch [48/300], Step [69/225], Training Accuracy: 84.8279%, Training Loss: 0.3655%
Epoch [48/300], Step [70/225], Training Accuracy: 84.9107%, Training Loss: 0.3645%
Epoch [48/300], Step [71/225], Training Accuracy: 84.8371%, Training Loss: 0.3646%
Epoch [48/300], Step [72/225], Training Accuracy: 84.7656%, Training Loss: 0.3668%
Epoch [48/300], Step [73/225], Training Accuracy: 84.7603%, Training Loss: 0.3671%
Epoc

Epoch [48/300], Step [161/225], Training Accuracy: 85.3552%, Training Loss: 0.3638%
Epoch [48/300], Step [162/225], Training Accuracy: 85.3588%, Training Loss: 0.3639%
Epoch [48/300], Step [163/225], Training Accuracy: 85.3623%, Training Loss: 0.3638%
Epoch [48/300], Step [164/225], Training Accuracy: 85.3849%, Training Loss: 0.3637%
Epoch [48/300], Step [165/225], Training Accuracy: 85.3883%, Training Loss: 0.3635%
Epoch [48/300], Step [166/225], Training Accuracy: 85.3727%, Training Loss: 0.3634%
Epoch [48/300], Step [167/225], Training Accuracy: 85.3948%, Training Loss: 0.3628%
Epoch [48/300], Step [168/225], Training Accuracy: 85.3981%, Training Loss: 0.3637%
Epoch [48/300], Step [169/225], Training Accuracy: 85.4290%, Training Loss: 0.3630%
Epoch [48/300], Step [170/225], Training Accuracy: 85.4228%, Training Loss: 0.3629%
Epoch [48/300], Step [171/225], Training Accuracy: 85.3710%, Training Loss: 0.3639%
Epoch [48/300], Step [172/225], Training Accuracy: 85.3834%, Training Loss: 

Epoch [49/300], Step [35/225], Training Accuracy: 86.5179%, Training Loss: 0.3409%
Epoch [49/300], Step [36/225], Training Accuracy: 86.5451%, Training Loss: 0.3417%
Epoch [49/300], Step [37/225], Training Accuracy: 86.5709%, Training Loss: 0.3423%
Epoch [49/300], Step [38/225], Training Accuracy: 86.5543%, Training Loss: 0.3412%
Epoch [49/300], Step [39/225], Training Accuracy: 86.4183%, Training Loss: 0.3424%
Epoch [49/300], Step [40/225], Training Accuracy: 86.4844%, Training Loss: 0.3417%
Epoch [49/300], Step [41/225], Training Accuracy: 86.3186%, Training Loss: 0.3465%
Epoch [49/300], Step [42/225], Training Accuracy: 86.4583%, Training Loss: 0.3442%
Epoch [49/300], Step [43/225], Training Accuracy: 86.4826%, Training Loss: 0.3458%
Epoch [49/300], Step [44/225], Training Accuracy: 86.5057%, Training Loss: 0.3461%
Epoch [49/300], Step [45/225], Training Accuracy: 86.5278%, Training Loss: 0.3458%
Epoch [49/300], Step [46/225], Training Accuracy: 86.6168%, Training Loss: 0.3432%
Epoc

Epoch [49/300], Step [134/225], Training Accuracy: 85.8559%, Training Loss: 0.3578%
Epoch [49/300], Step [135/225], Training Accuracy: 85.8681%, Training Loss: 0.3580%
Epoch [49/300], Step [136/225], Training Accuracy: 85.8456%, Training Loss: 0.3588%
Epoch [49/300], Step [137/225], Training Accuracy: 85.8349%, Training Loss: 0.3586%
Epoch [49/300], Step [138/225], Training Accuracy: 85.9035%, Training Loss: 0.3571%
Epoch [49/300], Step [139/225], Training Accuracy: 85.8588%, Training Loss: 0.3590%
Epoch [49/300], Step [140/225], Training Accuracy: 85.8482%, Training Loss: 0.3587%
Epoch [49/300], Step [141/225], Training Accuracy: 85.8156%, Training Loss: 0.3591%
Epoch [49/300], Step [142/225], Training Accuracy: 85.8385%, Training Loss: 0.3585%
Epoch [49/300], Step [143/225], Training Accuracy: 85.8282%, Training Loss: 0.3590%
Epoch [49/300], Step [144/225], Training Accuracy: 85.8398%, Training Loss: 0.3584%
Epoch [49/300], Step [145/225], Training Accuracy: 85.8190%, Training Loss: 

Epoch [50/300], Step [7/225], Training Accuracy: 83.9286%, Training Loss: 0.3951%
Epoch [50/300], Step [8/225], Training Accuracy: 84.1797%, Training Loss: 0.4001%
Epoch [50/300], Step [9/225], Training Accuracy: 83.6806%, Training Loss: 0.4067%
Epoch [50/300], Step [10/225], Training Accuracy: 83.9062%, Training Loss: 0.4015%
Epoch [50/300], Step [11/225], Training Accuracy: 83.8068%, Training Loss: 0.4110%
Epoch [50/300], Step [12/225], Training Accuracy: 83.9844%, Training Loss: 0.3995%
Epoch [50/300], Step [13/225], Training Accuracy: 84.9760%, Training Loss: 0.3761%
Epoch [50/300], Step [14/225], Training Accuracy: 85.7143%, Training Loss: 0.3613%
Epoch [50/300], Step [15/225], Training Accuracy: 86.0417%, Training Loss: 0.3517%
Epoch [50/300], Step [16/225], Training Accuracy: 86.0352%, Training Loss: 0.3508%
Epoch [50/300], Step [17/225], Training Accuracy: 86.0294%, Training Loss: 0.3488%
Epoch [50/300], Step [18/225], Training Accuracy: 86.1979%, Training Loss: 0.3444%
Epoch [

Epoch [50/300], Step [106/225], Training Accuracy: 86.2323%, Training Loss: 0.3512%
Epoch [50/300], Step [107/225], Training Accuracy: 86.2880%, Training Loss: 0.3513%
Epoch [50/300], Step [108/225], Training Accuracy: 86.2847%, Training Loss: 0.3511%
Epoch [50/300], Step [109/225], Training Accuracy: 86.2242%, Training Loss: 0.3517%
Epoch [50/300], Step [110/225], Training Accuracy: 86.2358%, Training Loss: 0.3519%
Epoch [50/300], Step [111/225], Training Accuracy: 86.2613%, Training Loss: 0.3522%
Epoch [50/300], Step [112/225], Training Accuracy: 86.3002%, Training Loss: 0.3514%
Epoch [50/300], Step [113/225], Training Accuracy: 86.2970%, Training Loss: 0.3508%
Epoch [50/300], Step [114/225], Training Accuracy: 86.3213%, Training Loss: 0.3506%
Epoch [50/300], Step [115/225], Training Accuracy: 86.2908%, Training Loss: 0.3501%
Epoch [50/300], Step [116/225], Training Accuracy: 86.2204%, Training Loss: 0.3525%
Epoch [50/300], Step [117/225], Training Accuracy: 86.1378%, Training Loss: 

Epoch [50/300], Step [205/225], Training Accuracy: 86.2881%, Training Loss: 0.3467%
Epoch [50/300], Step [206/225], Training Accuracy: 86.2940%, Training Loss: 0.3467%
Epoch [50/300], Step [207/225], Training Accuracy: 86.2621%, Training Loss: 0.3474%
Epoch [50/300], Step [208/225], Training Accuracy: 86.2605%, Training Loss: 0.3475%
Epoch [50/300], Step [209/225], Training Accuracy: 86.2515%, Training Loss: 0.3476%
Epoch [50/300], Step [210/225], Training Accuracy: 86.2574%, Training Loss: 0.3471%
Epoch [50/300], Step [211/225], Training Accuracy: 86.2633%, Training Loss: 0.3471%
Epoch [50/300], Step [212/225], Training Accuracy: 86.2544%, Training Loss: 0.3470%
Epoch [50/300], Step [213/225], Training Accuracy: 86.2823%, Training Loss: 0.3465%
Epoch [50/300], Step [214/225], Training Accuracy: 86.2953%, Training Loss: 0.3462%
Epoch [50/300], Step [215/225], Training Accuracy: 86.2791%, Training Loss: 0.3461%
Epoch [50/300], Step [216/225], Training Accuracy: 86.2775%, Training Loss: 

Epoch [51/300], Step [79/225], Training Accuracy: 87.7769%, Training Loss: 0.3032%
Epoch [51/300], Step [80/225], Training Accuracy: 87.7734%, Training Loss: 0.3032%
Epoch [51/300], Step [81/225], Training Accuracy: 87.8086%, Training Loss: 0.3025%
Epoch [51/300], Step [82/225], Training Accuracy: 87.8811%, Training Loss: 0.3011%
Epoch [51/300], Step [83/225], Training Accuracy: 87.9330%, Training Loss: 0.3001%
Epoch [51/300], Step [84/225], Training Accuracy: 87.9278%, Training Loss: 0.3003%
Epoch [51/300], Step [85/225], Training Accuracy: 87.9596%, Training Loss: 0.2991%
Epoch [51/300], Step [86/225], Training Accuracy: 88.0087%, Training Loss: 0.2981%
Epoch [51/300], Step [87/225], Training Accuracy: 87.9310%, Training Loss: 0.2995%
Epoch [51/300], Step [88/225], Training Accuracy: 87.8906%, Training Loss: 0.3000%
Epoch [51/300], Step [89/225], Training Accuracy: 87.9213%, Training Loss: 0.2993%
Epoch [51/300], Step [90/225], Training Accuracy: 87.8299%, Training Loss: 0.3010%
Epoc

Epoch [51/300], Step [178/225], Training Accuracy: 89.1591%, Training Loss: 0.2712%
Epoch [51/300], Step [179/225], Training Accuracy: 89.1760%, Training Loss: 0.2706%
Epoch [51/300], Step [180/225], Training Accuracy: 89.2014%, Training Loss: 0.2702%
Epoch [51/300], Step [181/225], Training Accuracy: 89.1920%, Training Loss: 0.2702%
Epoch [51/300], Step [182/225], Training Accuracy: 89.2170%, Training Loss: 0.2702%
Epoch [51/300], Step [183/225], Training Accuracy: 89.2333%, Training Loss: 0.2699%
Epoch [51/300], Step [184/225], Training Accuracy: 89.2323%, Training Loss: 0.2698%
Epoch [51/300], Step [185/225], Training Accuracy: 89.2821%, Training Loss: 0.2687%
Epoch [51/300], Step [186/225], Training Accuracy: 89.3313%, Training Loss: 0.2677%
Epoch [51/300], Step [187/225], Training Accuracy: 89.3717%, Training Loss: 0.2668%
Epoch [51/300], Step [188/225], Training Accuracy: 89.3949%, Training Loss: 0.2665%
Epoch [51/300], Step [189/225], Training Accuracy: 89.3932%, Training Loss: 

Epoch [52/300], Step [52/225], Training Accuracy: 90.8353%, Training Loss: 0.2343%
Epoch [52/300], Step [53/225], Training Accuracy: 90.7429%, Training Loss: 0.2339%
Epoch [52/300], Step [54/225], Training Accuracy: 90.7697%, Training Loss: 0.2329%
Epoch [52/300], Step [55/225], Training Accuracy: 90.6818%, Training Loss: 0.2334%
Epoch [52/300], Step [56/225], Training Accuracy: 90.6808%, Training Loss: 0.2332%
Epoch [52/300], Step [57/225], Training Accuracy: 90.5428%, Training Loss: 0.2353%
Epoch [52/300], Step [58/225], Training Accuracy: 90.5711%, Training Loss: 0.2350%
Epoch [52/300], Step [59/225], Training Accuracy: 90.6515%, Training Loss: 0.2343%
Epoch [52/300], Step [60/225], Training Accuracy: 90.6250%, Training Loss: 0.2343%
Epoch [52/300], Step [61/225], Training Accuracy: 90.6762%, Training Loss: 0.2343%
Epoch [52/300], Step [62/225], Training Accuracy: 90.7762%, Training Loss: 0.2325%
Epoch [52/300], Step [63/225], Training Accuracy: 90.8234%, Training Loss: 0.2314%
Epoc

Epoch [52/300], Step [151/225], Training Accuracy: 91.2148%, Training Loss: 0.2193%
Epoch [52/300], Step [152/225], Training Accuracy: 91.2212%, Training Loss: 0.2195%
Epoch [52/300], Step [153/225], Training Accuracy: 91.2071%, Training Loss: 0.2194%
Epoch [52/300], Step [154/225], Training Accuracy: 91.2135%, Training Loss: 0.2194%
Epoch [52/300], Step [155/225], Training Accuracy: 91.2097%, Training Loss: 0.2195%
Epoch [52/300], Step [156/225], Training Accuracy: 91.2059%, Training Loss: 0.2195%
Epoch [52/300], Step [157/225], Training Accuracy: 91.2221%, Training Loss: 0.2193%
Epoch [52/300], Step [158/225], Training Accuracy: 91.2678%, Training Loss: 0.2186%
Epoch [52/300], Step [159/225], Training Accuracy: 91.2539%, Training Loss: 0.2186%
Epoch [52/300], Step [160/225], Training Accuracy: 91.2207%, Training Loss: 0.2186%
Epoch [52/300], Step [161/225], Training Accuracy: 91.2170%, Training Loss: 0.2190%
Epoch [52/300], Step [162/225], Training Accuracy: 91.2326%, Training Loss: 

Epoch [53/300], Step [25/225], Training Accuracy: 90.3750%, Training Loss: 0.2502%
Epoch [53/300], Step [26/225], Training Accuracy: 90.5048%, Training Loss: 0.2454%
Epoch [53/300], Step [27/225], Training Accuracy: 90.6250%, Training Loss: 0.2424%
Epoch [53/300], Step [28/225], Training Accuracy: 90.8482%, Training Loss: 0.2372%
Epoch [53/300], Step [29/225], Training Accuracy: 90.8405%, Training Loss: 0.2358%
Epoch [53/300], Step [30/225], Training Accuracy: 90.9896%, Training Loss: 0.2338%
Epoch [53/300], Step [31/225], Training Accuracy: 90.8266%, Training Loss: 0.2435%
Epoch [53/300], Step [32/225], Training Accuracy: 90.9180%, Training Loss: 0.2418%
Epoch [53/300], Step [33/225], Training Accuracy: 90.9091%, Training Loss: 0.2435%
Epoch [53/300], Step [34/225], Training Accuracy: 90.9007%, Training Loss: 0.2433%
Epoch [53/300], Step [35/225], Training Accuracy: 91.0268%, Training Loss: 0.2404%
Epoch [53/300], Step [36/225], Training Accuracy: 91.1458%, Training Loss: 0.2376%
Epoc

Epoch [53/300], Step [124/225], Training Accuracy: 90.7888%, Training Loss: 0.2310%
Epoch [53/300], Step [125/225], Training Accuracy: 90.8000%, Training Loss: 0.2304%
Epoch [53/300], Step [126/225], Training Accuracy: 90.8110%, Training Loss: 0.2303%
Epoch [53/300], Step [127/225], Training Accuracy: 90.8095%, Training Loss: 0.2303%
Epoch [53/300], Step [128/225], Training Accuracy: 90.8447%, Training Loss: 0.2297%
Epoch [53/300], Step [129/225], Training Accuracy: 90.8672%, Training Loss: 0.2296%
Epoch [53/300], Step [130/225], Training Accuracy: 90.8774%, Training Loss: 0.2298%
Epoch [53/300], Step [131/225], Training Accuracy: 90.8397%, Training Loss: 0.2308%
Epoch [53/300], Step [132/225], Training Accuracy: 90.8736%, Training Loss: 0.2304%
Epoch [53/300], Step [133/225], Training Accuracy: 90.8365%, Training Loss: 0.2307%
Epoch [53/300], Step [134/225], Training Accuracy: 90.8582%, Training Loss: 0.2304%
Epoch [53/300], Step [135/225], Training Accuracy: 90.8449%, Training Loss: 

Epoch [53/300], Step [223/225], Training Accuracy: 91.5779%, Training Loss: 0.2132%
Epoch [53/300], Step [224/225], Training Accuracy: 91.5876%, Training Loss: 0.2130%
Epoch [53/300], Step [225/225], Training Accuracy: 91.5717%, Training Loss: 0.2134%
Epoch [54/300], Step [1/225], Training Accuracy: 90.6250%, Training Loss: 0.2466%
Epoch [54/300], Step [2/225], Training Accuracy: 89.0625%, Training Loss: 0.2698%
Epoch [54/300], Step [3/225], Training Accuracy: 89.5833%, Training Loss: 0.2821%
Epoch [54/300], Step [4/225], Training Accuracy: 89.8438%, Training Loss: 0.2891%
Epoch [54/300], Step [5/225], Training Accuracy: 90.3125%, Training Loss: 0.2685%
Epoch [54/300], Step [6/225], Training Accuracy: 90.8854%, Training Loss: 0.2524%
Epoch [54/300], Step [7/225], Training Accuracy: 90.8482%, Training Loss: 0.2461%
Epoch [54/300], Step [8/225], Training Accuracy: 90.4297%, Training Loss: 0.2489%
Epoch [54/300], Step [9/225], Training Accuracy: 90.6250%, Training Loss: 0.2466%
Epoch [54/

Epoch [54/300], Step [97/225], Training Accuracy: 92.5258%, Training Loss: 0.1947%
Epoch [54/300], Step [98/225], Training Accuracy: 92.5383%, Training Loss: 0.1938%
Epoch [54/300], Step [99/225], Training Accuracy: 92.5663%, Training Loss: 0.1933%
Epoch [54/300], Step [100/225], Training Accuracy: 92.5000%, Training Loss: 0.1945%
Epoch [54/300], Step [101/225], Training Accuracy: 92.4660%, Training Loss: 0.1952%
Epoch [54/300], Step [102/225], Training Accuracy: 92.4020%, Training Loss: 0.1958%
Epoch [54/300], Step [103/225], Training Accuracy: 92.4302%, Training Loss: 0.1953%
Epoch [54/300], Step [104/225], Training Accuracy: 92.4429%, Training Loss: 0.1953%
Epoch [54/300], Step [105/225], Training Accuracy: 92.4405%, Training Loss: 0.1954%
Epoch [54/300], Step [106/225], Training Accuracy: 92.4381%, Training Loss: 0.1957%
Epoch [54/300], Step [107/225], Training Accuracy: 92.4650%, Training Loss: 0.1955%
Epoch [54/300], Step [108/225], Training Accuracy: 92.4479%, Training Loss: 0.1

Epoch [54/300], Step [196/225], Training Accuracy: 92.2114%, Training Loss: 0.2007%
Epoch [54/300], Step [197/225], Training Accuracy: 92.2272%, Training Loss: 0.2003%
Epoch [54/300], Step [198/225], Training Accuracy: 92.2506%, Training Loss: 0.1997%
Epoch [54/300], Step [199/225], Training Accuracy: 92.2346%, Training Loss: 0.2000%
Epoch [54/300], Step [200/225], Training Accuracy: 92.2656%, Training Loss: 0.1995%
Epoch [54/300], Step [201/225], Training Accuracy: 92.2886%, Training Loss: 0.1993%
Epoch [54/300], Step [202/225], Training Accuracy: 92.2881%, Training Loss: 0.1993%
Epoch [54/300], Step [203/225], Training Accuracy: 92.3183%, Training Loss: 0.1988%
Epoch [54/300], Step [204/225], Training Accuracy: 92.3330%, Training Loss: 0.1986%
Epoch [54/300], Step [205/225], Training Accuracy: 92.3476%, Training Loss: 0.1983%
Epoch [54/300], Step [206/225], Training Accuracy: 92.3544%, Training Loss: 0.1985%
Epoch [54/300], Step [207/225], Training Accuracy: 92.3385%, Training Loss: 

Epoch [55/300], Step [70/225], Training Accuracy: 92.4107%, Training Loss: 0.1951%
Epoch [55/300], Step [71/225], Training Accuracy: 92.3856%, Training Loss: 0.1946%
Epoch [55/300], Step [72/225], Training Accuracy: 92.3394%, Training Loss: 0.1945%
Epoch [55/300], Step [73/225], Training Accuracy: 92.3801%, Training Loss: 0.1942%
Epoch [55/300], Step [74/225], Training Accuracy: 92.3353%, Training Loss: 0.1949%
Epoch [55/300], Step [75/225], Training Accuracy: 92.3958%, Training Loss: 0.1941%
Epoch [55/300], Step [76/225], Training Accuracy: 92.3520%, Training Loss: 0.1950%
Epoch [55/300], Step [77/225], Training Accuracy: 92.4107%, Training Loss: 0.1939%
Epoch [55/300], Step [78/225], Training Accuracy: 92.4279%, Training Loss: 0.1943%
Epoch [55/300], Step [79/225], Training Accuracy: 92.4842%, Training Loss: 0.1929%
Epoch [55/300], Step [80/225], Training Accuracy: 92.4414%, Training Loss: 0.1935%
Epoch [55/300], Step [81/225], Training Accuracy: 92.4576%, Training Loss: 0.1928%
Epoc

Epoch [55/300], Step [169/225], Training Accuracy: 92.4649%, Training Loss: 0.1920%
Epoch [55/300], Step [170/225], Training Accuracy: 92.4449%, Training Loss: 0.1921%
Epoch [55/300], Step [171/225], Training Accuracy: 92.4159%, Training Loss: 0.1926%
Epoch [55/300], Step [172/225], Training Accuracy: 92.3874%, Training Loss: 0.1932%
Epoch [55/300], Step [173/225], Training Accuracy: 92.4043%, Training Loss: 0.1928%
Epoch [55/300], Step [174/225], Training Accuracy: 92.3940%, Training Loss: 0.1927%
Epoch [55/300], Step [175/225], Training Accuracy: 92.3929%, Training Loss: 0.1927%
Epoch [55/300], Step [176/225], Training Accuracy: 92.4183%, Training Loss: 0.1920%
Epoch [55/300], Step [177/225], Training Accuracy: 92.4258%, Training Loss: 0.1919%
Epoch [55/300], Step [178/225], Training Accuracy: 92.4421%, Training Loss: 0.1916%
Epoch [55/300], Step [179/225], Training Accuracy: 92.3883%, Training Loss: 0.1921%
Epoch [55/300], Step [180/225], Training Accuracy: 92.3872%, Training Loss: 

Epoch [56/300], Step [43/225], Training Accuracy: 92.3328%, Training Loss: 0.1989%
Epoch [56/300], Step [44/225], Training Accuracy: 92.2940%, Training Loss: 0.1988%
Epoch [56/300], Step [45/225], Training Accuracy: 92.3264%, Training Loss: 0.1971%
Epoch [56/300], Step [46/225], Training Accuracy: 92.4253%, Training Loss: 0.1959%
Epoch [56/300], Step [47/225], Training Accuracy: 92.4535%, Training Loss: 0.1950%
Epoch [56/300], Step [48/225], Training Accuracy: 92.3503%, Training Loss: 0.1954%
Epoch [56/300], Step [49/225], Training Accuracy: 92.4426%, Training Loss: 0.1942%
Epoch [56/300], Step [50/225], Training Accuracy: 92.5000%, Training Loss: 0.1932%
Epoch [56/300], Step [51/225], Training Accuracy: 92.4632%, Training Loss: 0.1936%
Epoch [56/300], Step [52/225], Training Accuracy: 92.4880%, Training Loss: 0.1928%
Epoch [56/300], Step [53/225], Training Accuracy: 92.4528%, Training Loss: 0.1930%
Epoch [56/300], Step [54/225], Training Accuracy: 92.5347%, Training Loss: 0.1923%
Epoc

Epoch [56/300], Step [142/225], Training Accuracy: 92.6937%, Training Loss: 0.1901%
Epoch [56/300], Step [143/225], Training Accuracy: 92.7120%, Training Loss: 0.1900%
Epoch [56/300], Step [144/225], Training Accuracy: 92.7300%, Training Loss: 0.1908%
Epoch [56/300], Step [145/225], Training Accuracy: 92.7371%, Training Loss: 0.1906%
Epoch [56/300], Step [146/225], Training Accuracy: 92.7654%, Training Loss: 0.1902%
Epoch [56/300], Step [147/225], Training Accuracy: 92.7721%, Training Loss: 0.1901%
Epoch [56/300], Step [148/225], Training Accuracy: 92.7682%, Training Loss: 0.1899%
Epoch [56/300], Step [149/225], Training Accuracy: 92.7328%, Training Loss: 0.1905%
Epoch [56/300], Step [150/225], Training Accuracy: 92.7708%, Training Loss: 0.1896%
Epoch [56/300], Step [151/225], Training Accuracy: 92.7877%, Training Loss: 0.1891%
Epoch [56/300], Step [152/225], Training Accuracy: 92.8043%, Training Loss: 0.1887%
Epoch [56/300], Step [153/225], Training Accuracy: 92.8105%, Training Loss: 

Epoch [57/300], Step [16/225], Training Accuracy: 92.9688%, Training Loss: 0.1975%
Epoch [57/300], Step [17/225], Training Accuracy: 92.8309%, Training Loss: 0.2008%
Epoch [57/300], Step [18/225], Training Accuracy: 92.6215%, Training Loss: 0.2049%
Epoch [57/300], Step [19/225], Training Accuracy: 92.6809%, Training Loss: 0.2022%
Epoch [57/300], Step [20/225], Training Accuracy: 92.7344%, Training Loss: 0.1997%
Epoch [57/300], Step [21/225], Training Accuracy: 92.7083%, Training Loss: 0.1991%
Epoch [57/300], Step [22/225], Training Accuracy: 92.5426%, Training Loss: 0.2039%
Epoch [57/300], Step [23/225], Training Accuracy: 92.5272%, Training Loss: 0.2015%
Epoch [57/300], Step [24/225], Training Accuracy: 92.4479%, Training Loss: 0.2033%
Epoch [57/300], Step [25/225], Training Accuracy: 92.3125%, Training Loss: 0.2031%
Epoch [57/300], Step [26/225], Training Accuracy: 92.4279%, Training Loss: 0.2023%
Epoch [57/300], Step [27/225], Training Accuracy: 92.5347%, Training Loss: 0.2005%
Epoc

Epoch [57/300], Step [115/225], Training Accuracy: 92.5679%, Training Loss: 0.1971%
Epoch [57/300], Step [116/225], Training Accuracy: 92.5377%, Training Loss: 0.1976%
Epoch [57/300], Step [117/225], Training Accuracy: 92.5481%, Training Loss: 0.1977%
Epoch [57/300], Step [118/225], Training Accuracy: 92.5450%, Training Loss: 0.1979%
Epoch [57/300], Step [119/225], Training Accuracy: 92.5551%, Training Loss: 0.1978%
Epoch [57/300], Step [120/225], Training Accuracy: 92.5781%, Training Loss: 0.1979%
Epoch [57/300], Step [121/225], Training Accuracy: 92.5878%, Training Loss: 0.1976%
Epoch [57/300], Step [122/225], Training Accuracy: 92.5717%, Training Loss: 0.1977%
Epoch [57/300], Step [123/225], Training Accuracy: 92.6067%, Training Loss: 0.1973%
Epoch [57/300], Step [124/225], Training Accuracy: 92.6411%, Training Loss: 0.1969%
Epoch [57/300], Step [125/225], Training Accuracy: 92.6750%, Training Loss: 0.1963%
Epoch [57/300], Step [126/225], Training Accuracy: 92.6711%, Training Loss: 

Epoch [57/300], Step [214/225], Training Accuracy: 92.5672%, Training Loss: 0.1963%
Epoch [57/300], Step [215/225], Training Accuracy: 92.5945%, Training Loss: 0.1958%
Epoch [57/300], Step [216/225], Training Accuracy: 92.6071%, Training Loss: 0.1957%
Epoch [57/300], Step [217/225], Training Accuracy: 92.6339%, Training Loss: 0.1954%
Epoch [57/300], Step [218/225], Training Accuracy: 92.6319%, Training Loss: 0.1956%
Epoch [57/300], Step [219/225], Training Accuracy: 92.6370%, Training Loss: 0.1954%
Epoch [57/300], Step [220/225], Training Accuracy: 92.6634%, Training Loss: 0.1950%
Epoch [57/300], Step [221/225], Training Accuracy: 92.6541%, Training Loss: 0.1947%
Epoch [57/300], Step [222/225], Training Accuracy: 92.6309%, Training Loss: 0.1952%
Epoch [57/300], Step [223/225], Training Accuracy: 92.6079%, Training Loss: 0.1958%
Epoch [57/300], Step [224/225], Training Accuracy: 92.6130%, Training Loss: 0.1957%
Epoch [57/300], Step [225/225], Training Accuracy: 92.6140%, Training Loss: 

Epoch [58/300], Step [88/225], Training Accuracy: 92.0277%, Training Loss: 0.2088%
Epoch [58/300], Step [89/225], Training Accuracy: 92.0646%, Training Loss: 0.2085%
Epoch [58/300], Step [90/225], Training Accuracy: 92.0312%, Training Loss: 0.2084%
Epoch [58/300], Step [91/225], Training Accuracy: 92.0158%, Training Loss: 0.2083%
Epoch [58/300], Step [92/225], Training Accuracy: 92.0177%, Training Loss: 0.2091%
Epoch [58/300], Step [93/225], Training Accuracy: 92.0363%, Training Loss: 0.2089%
Epoch [58/300], Step [94/225], Training Accuracy: 91.9548%, Training Loss: 0.2099%
Epoch [58/300], Step [95/225], Training Accuracy: 91.9408%, Training Loss: 0.2097%
Epoch [58/300], Step [96/225], Training Accuracy: 91.9596%, Training Loss: 0.2092%
Epoch [58/300], Step [97/225], Training Accuracy: 91.9620%, Training Loss: 0.2095%
Epoch [58/300], Step [98/225], Training Accuracy: 91.8846%, Training Loss: 0.2100%
Epoch [58/300], Step [99/225], Training Accuracy: 91.9034%, Training Loss: 0.2099%
Epoc

Epoch [58/300], Step [187/225], Training Accuracy: 91.9786%, Training Loss: 0.2054%
Epoch [58/300], Step [188/225], Training Accuracy: 92.0047%, Training Loss: 0.2051%
Epoch [58/300], Step [189/225], Training Accuracy: 92.0304%, Training Loss: 0.2046%
Epoch [58/300], Step [190/225], Training Accuracy: 92.0148%, Training Loss: 0.2046%
Epoch [58/300], Step [191/225], Training Accuracy: 91.9912%, Training Loss: 0.2048%
Epoch [58/300], Step [192/225], Training Accuracy: 92.0166%, Training Loss: 0.2043%
Epoch [58/300], Step [193/225], Training Accuracy: 92.0256%, Training Loss: 0.2041%
Epoch [58/300], Step [194/225], Training Accuracy: 92.0184%, Training Loss: 0.2043%
Epoch [58/300], Step [195/225], Training Accuracy: 92.0433%, Training Loss: 0.2038%
Epoch [58/300], Step [196/225], Training Accuracy: 92.0360%, Training Loss: 0.2037%
Epoch [58/300], Step [197/225], Training Accuracy: 92.0606%, Training Loss: 0.2030%
Epoch [58/300], Step [198/225], Training Accuracy: 92.0770%, Training Loss: 

Epoch [59/300], Step [61/225], Training Accuracy: 92.2643%, Training Loss: 0.2045%
Epoch [59/300], Step [62/225], Training Accuracy: 92.2883%, Training Loss: 0.2056%
Epoch [59/300], Step [63/225], Training Accuracy: 92.3115%, Training Loss: 0.2052%
Epoch [59/300], Step [64/225], Training Accuracy: 92.3828%, Training Loss: 0.2040%
Epoch [59/300], Step [65/225], Training Accuracy: 92.2596%, Training Loss: 0.2075%
Epoch [59/300], Step [66/225], Training Accuracy: 92.2348%, Training Loss: 0.2071%
Epoch [59/300], Step [67/225], Training Accuracy: 92.0709%, Training Loss: 0.2091%
Epoch [59/300], Step [68/225], Training Accuracy: 92.0037%, Training Loss: 0.2098%
Epoch [59/300], Step [69/225], Training Accuracy: 92.0516%, Training Loss: 0.2094%
Epoch [59/300], Step [70/225], Training Accuracy: 92.0759%, Training Loss: 0.2091%
Epoch [59/300], Step [71/225], Training Accuracy: 92.0775%, Training Loss: 0.2089%
Epoch [59/300], Step [72/225], Training Accuracy: 92.1007%, Training Loss: 0.2083%
Epoc

Epoch [59/300], Step [160/225], Training Accuracy: 92.1582%, Training Loss: 0.2012%
Epoch [59/300], Step [161/225], Training Accuracy: 92.1293%, Training Loss: 0.2018%
Epoch [59/300], Step [162/225], Training Accuracy: 92.1296%, Training Loss: 0.2016%
Epoch [59/300], Step [163/225], Training Accuracy: 92.1300%, Training Loss: 0.2015%
Epoch [59/300], Step [164/225], Training Accuracy: 92.1589%, Training Loss: 0.2012%
Epoch [59/300], Step [165/225], Training Accuracy: 92.1875%, Training Loss: 0.2008%
Epoch [59/300], Step [166/225], Training Accuracy: 92.1969%, Training Loss: 0.2008%
Epoch [59/300], Step [167/225], Training Accuracy: 92.2062%, Training Loss: 0.2006%
Epoch [59/300], Step [168/225], Training Accuracy: 92.1410%, Training Loss: 0.2018%
Epoch [59/300], Step [169/225], Training Accuracy: 92.1690%, Training Loss: 0.2013%
Epoch [59/300], Step [170/225], Training Accuracy: 92.1324%, Training Loss: 0.2020%
Epoch [59/300], Step [171/225], Training Accuracy: 92.1235%, Training Loss: 

Epoch [60/300], Step [34/225], Training Accuracy: 90.6250%, Training Loss: 0.2157%
Epoch [60/300], Step [35/225], Training Accuracy: 90.8036%, Training Loss: 0.2149%
Epoch [60/300], Step [36/225], Training Accuracy: 90.9722%, Training Loss: 0.2107%
Epoch [60/300], Step [37/225], Training Accuracy: 91.1318%, Training Loss: 0.2076%
Epoch [60/300], Step [38/225], Training Accuracy: 91.0773%, Training Loss: 0.2096%
Epoch [60/300], Step [39/225], Training Accuracy: 91.2260%, Training Loss: 0.2098%
Epoch [60/300], Step [40/225], Training Accuracy: 91.2891%, Training Loss: 0.2090%
Epoch [60/300], Step [41/225], Training Accuracy: 91.1966%, Training Loss: 0.2100%
Epoch [60/300], Step [42/225], Training Accuracy: 91.2946%, Training Loss: 0.2081%
Epoch [60/300], Step [43/225], Training Accuracy: 91.3517%, Training Loss: 0.2086%
Epoch [60/300], Step [44/225], Training Accuracy: 91.4418%, Training Loss: 0.2074%
Epoch [60/300], Step [45/225], Training Accuracy: 91.4931%, Training Loss: 0.2060%
Epoc

Epoch [60/300], Step [133/225], Training Accuracy: 91.8233%, Training Loss: 0.2075%
Epoch [60/300], Step [134/225], Training Accuracy: 91.8027%, Training Loss: 0.2077%
Epoch [60/300], Step [135/225], Training Accuracy: 91.8171%, Training Loss: 0.2075%
Epoch [60/300], Step [136/225], Training Accuracy: 91.7969%, Training Loss: 0.2076%
Epoch [60/300], Step [137/225], Training Accuracy: 91.8339%, Training Loss: 0.2072%
Epoch [60/300], Step [138/225], Training Accuracy: 91.8478%, Training Loss: 0.2066%
Epoch [60/300], Step [139/225], Training Accuracy: 91.8952%, Training Loss: 0.2059%
Epoch [60/300], Step [140/225], Training Accuracy: 91.8973%, Training Loss: 0.2061%
Epoch [60/300], Step [141/225], Training Accuracy: 91.9215%, Training Loss: 0.2059%
Epoch [60/300], Step [142/225], Training Accuracy: 91.9344%, Training Loss: 0.2055%
Epoch [60/300], Step [143/225], Training Accuracy: 91.9471%, Training Loss: 0.2050%
Epoch [60/300], Step [144/225], Training Accuracy: 91.9705%, Training Loss: 

Epoch [61/300], Step [7/225], Training Accuracy: 93.0804%, Training Loss: 0.1967%
Epoch [61/300], Step [8/225], Training Accuracy: 93.1641%, Training Loss: 0.1937%
Epoch [61/300], Step [9/225], Training Accuracy: 93.0556%, Training Loss: 0.1960%
Epoch [61/300], Step [10/225], Training Accuracy: 93.2812%, Training Loss: 0.1946%
Epoch [61/300], Step [11/225], Training Accuracy: 92.8977%, Training Loss: 0.2032%
Epoch [61/300], Step [12/225], Training Accuracy: 92.9688%, Training Loss: 0.1979%
Epoch [61/300], Step [13/225], Training Accuracy: 93.1490%, Training Loss: 0.1952%
Epoch [61/300], Step [14/225], Training Accuracy: 93.0804%, Training Loss: 0.1936%
Epoch [61/300], Step [15/225], Training Accuracy: 93.0208%, Training Loss: 0.1987%
Epoch [61/300], Step [16/225], Training Accuracy: 92.6758%, Training Loss: 0.2089%
Epoch [61/300], Step [17/225], Training Accuracy: 92.9228%, Training Loss: 0.2027%
Epoch [61/300], Step [18/225], Training Accuracy: 92.7083%, Training Loss: 0.2087%
Epoch [

Epoch [61/300], Step [106/225], Training Accuracy: 92.9098%, Training Loss: 0.1926%
Epoch [61/300], Step [107/225], Training Accuracy: 92.8592%, Training Loss: 0.1932%
Epoch [61/300], Step [108/225], Training Accuracy: 92.8675%, Training Loss: 0.1931%
Epoch [61/300], Step [109/225], Training Accuracy: 92.8756%, Training Loss: 0.1937%
Epoch [61/300], Step [110/225], Training Accuracy: 92.9119%, Training Loss: 0.1933%
Epoch [61/300], Step [111/225], Training Accuracy: 92.9054%, Training Loss: 0.1937%
Epoch [61/300], Step [112/225], Training Accuracy: 92.9129%, Training Loss: 0.1931%
Epoch [61/300], Step [113/225], Training Accuracy: 92.8650%, Training Loss: 0.1933%
Epoch [61/300], Step [114/225], Training Accuracy: 92.8865%, Training Loss: 0.1931%
Epoch [61/300], Step [115/225], Training Accuracy: 92.9348%, Training Loss: 0.1926%
Epoch [61/300], Step [116/225], Training Accuracy: 92.9014%, Training Loss: 0.1935%
Epoch [61/300], Step [117/225], Training Accuracy: 92.9087%, Training Loss: 

Epoch [61/300], Step [205/225], Training Accuracy: 92.9192%, Training Loss: 0.1892%
Epoch [61/300], Step [206/225], Training Accuracy: 92.9005%, Training Loss: 0.1893%
Epoch [61/300], Step [207/225], Training Accuracy: 92.8895%, Training Loss: 0.1892%
Epoch [61/300], Step [208/225], Training Accuracy: 92.9087%, Training Loss: 0.1890%
Epoch [61/300], Step [209/225], Training Accuracy: 92.8977%, Training Loss: 0.1891%
Epoch [61/300], Step [210/225], Training Accuracy: 92.8869%, Training Loss: 0.1892%
Epoch [61/300], Step [211/225], Training Accuracy: 92.8614%, Training Loss: 0.1895%
Epoch [61/300], Step [212/225], Training Accuracy: 92.8435%, Training Loss: 0.1898%
Epoch [61/300], Step [213/225], Training Accuracy: 92.8330%, Training Loss: 0.1905%
Epoch [61/300], Step [214/225], Training Accuracy: 92.8300%, Training Loss: 0.1905%
Epoch [61/300], Step [215/225], Training Accuracy: 92.8416%, Training Loss: 0.1900%
Epoch [61/300], Step [216/225], Training Accuracy: 92.8530%, Training Loss: 

Epoch [62/300], Step [79/225], Training Accuracy: 92.9786%, Training Loss: 0.1877%
Epoch [62/300], Step [80/225], Training Accuracy: 92.9883%, Training Loss: 0.1872%
Epoch [62/300], Step [81/225], Training Accuracy: 93.0363%, Training Loss: 0.1864%
Epoch [62/300], Step [82/225], Training Accuracy: 93.1021%, Training Loss: 0.1847%
Epoch [62/300], Step [83/225], Training Accuracy: 93.0723%, Training Loss: 0.1851%
Epoch [62/300], Step [84/225], Training Accuracy: 93.0990%, Training Loss: 0.1845%
Epoch [62/300], Step [85/225], Training Accuracy: 93.1066%, Training Loss: 0.1841%
Epoch [62/300], Step [86/225], Training Accuracy: 93.1868%, Training Loss: 0.1829%
Epoch [62/300], Step [87/225], Training Accuracy: 93.0855%, Training Loss: 0.1841%
Epoch [62/300], Step [88/225], Training Accuracy: 93.0220%, Training Loss: 0.1849%
Epoch [62/300], Step [89/225], Training Accuracy: 93.0478%, Training Loss: 0.1840%
Epoch [62/300], Step [90/225], Training Accuracy: 93.0556%, Training Loss: 0.1837%
Epoc

Epoch [62/300], Step [178/225], Training Accuracy: 92.6615%, Training Loss: 0.1921%
Epoch [62/300], Step [179/225], Training Accuracy: 92.6414%, Training Loss: 0.1925%
Epoch [62/300], Step [180/225], Training Accuracy: 92.6302%, Training Loss: 0.1927%
Epoch [62/300], Step [181/225], Training Accuracy: 92.5932%, Training Loss: 0.1934%
Epoch [62/300], Step [182/225], Training Accuracy: 92.5996%, Training Loss: 0.1933%
Epoch [62/300], Step [183/225], Training Accuracy: 92.6059%, Training Loss: 0.1934%
Epoch [62/300], Step [184/225], Training Accuracy: 92.6461%, Training Loss: 0.1926%
Epoch [62/300], Step [185/225], Training Accuracy: 92.6689%, Training Loss: 0.1922%
Epoch [62/300], Step [186/225], Training Accuracy: 92.6831%, Training Loss: 0.1916%
Epoch [62/300], Step [187/225], Training Accuracy: 92.6721%, Training Loss: 0.1917%
Epoch [62/300], Step [188/225], Training Accuracy: 92.6695%, Training Loss: 0.1916%
Epoch [62/300], Step [189/225], Training Accuracy: 92.6670%, Training Loss: 

Epoch [63/300], Step [54/225], Training Accuracy: 93.2870%, Training Loss: 0.1748%
Epoch [63/300], Step [55/225], Training Accuracy: 93.2670%, Training Loss: 0.1749%
Epoch [63/300], Step [56/225], Training Accuracy: 93.3036%, Training Loss: 0.1742%
Epoch [63/300], Step [57/225], Training Accuracy: 93.2566%, Training Loss: 0.1751%
Epoch [63/300], Step [58/225], Training Accuracy: 93.2920%, Training Loss: 0.1748%
Epoch [63/300], Step [59/225], Training Accuracy: 93.1144%, Training Loss: 0.1784%
Epoch [63/300], Step [60/225], Training Accuracy: 93.1771%, Training Loss: 0.1779%
Epoch [63/300], Step [61/225], Training Accuracy: 93.1352%, Training Loss: 0.1786%
Epoch [63/300], Step [62/225], Training Accuracy: 93.1452%, Training Loss: 0.1795%
Epoch [63/300], Step [63/225], Training Accuracy: 93.1548%, Training Loss: 0.1791%
Epoch [63/300], Step [64/225], Training Accuracy: 93.1641%, Training Loss: 0.1785%
Epoch [63/300], Step [65/225], Training Accuracy: 93.2212%, Training Loss: 0.1782%
Epoc

Epoch [63/300], Step [153/225], Training Accuracy: 92.9432%, Training Loss: 0.1822%
Epoch [63/300], Step [154/225], Training Accuracy: 92.9485%, Training Loss: 0.1822%
Epoch [63/300], Step [155/225], Training Accuracy: 92.9435%, Training Loss: 0.1820%
Epoch [63/300], Step [156/225], Training Accuracy: 92.9387%, Training Loss: 0.1819%
Epoch [63/300], Step [157/225], Training Accuracy: 92.9339%, Training Loss: 0.1822%
Epoch [63/300], Step [158/225], Training Accuracy: 92.9292%, Training Loss: 0.1819%
Epoch [63/300], Step [159/225], Training Accuracy: 92.8950%, Training Loss: 0.1823%
Epoch [63/300], Step [160/225], Training Accuracy: 92.8711%, Training Loss: 0.1827%
Epoch [63/300], Step [161/225], Training Accuracy: 92.8960%, Training Loss: 0.1822%
Epoch [63/300], Step [162/225], Training Accuracy: 92.9205%, Training Loss: 0.1817%
Epoch [63/300], Step [163/225], Training Accuracy: 92.9160%, Training Loss: 0.1821%
Epoch [63/300], Step [164/225], Training Accuracy: 92.9402%, Training Loss: 

Epoch [64/300], Step [26/225], Training Accuracy: 91.6466%, Training Loss: 0.2184%
Epoch [64/300], Step [27/225], Training Accuracy: 91.6667%, Training Loss: 0.2174%
Epoch [64/300], Step [28/225], Training Accuracy: 91.7411%, Training Loss: 0.2129%
Epoch [64/300], Step [29/225], Training Accuracy: 91.8642%, Training Loss: 0.2088%
Epoch [64/300], Step [30/225], Training Accuracy: 91.9792%, Training Loss: 0.2116%
Epoch [64/300], Step [31/225], Training Accuracy: 91.9355%, Training Loss: 0.2121%
Epoch [64/300], Step [32/225], Training Accuracy: 91.9434%, Training Loss: 0.2127%
Epoch [64/300], Step [33/225], Training Accuracy: 92.0928%, Training Loss: 0.2103%
Epoch [64/300], Step [34/225], Training Accuracy: 92.0496%, Training Loss: 0.2114%
Epoch [64/300], Step [35/225], Training Accuracy: 92.0536%, Training Loss: 0.2104%
Epoch [64/300], Step [36/225], Training Accuracy: 92.1441%, Training Loss: 0.2074%
Epoch [64/300], Step [37/225], Training Accuracy: 92.1030%, Training Loss: 0.2059%
Epoc

Epoch [64/300], Step [125/225], Training Accuracy: 92.8250%, Training Loss: 0.1877%
Epoch [64/300], Step [126/225], Training Accuracy: 92.8075%, Training Loss: 0.1879%
Epoch [64/300], Step [127/225], Training Accuracy: 92.7781%, Training Loss: 0.1882%
Epoch [64/300], Step [128/225], Training Accuracy: 92.7856%, Training Loss: 0.1881%
Epoch [64/300], Step [129/225], Training Accuracy: 92.7568%, Training Loss: 0.1891%
Epoch [64/300], Step [130/225], Training Accuracy: 92.8005%, Training Loss: 0.1886%
Epoch [64/300], Step [131/225], Training Accuracy: 92.7958%, Training Loss: 0.1890%
Epoch [64/300], Step [132/225], Training Accuracy: 92.8149%, Training Loss: 0.1888%
Epoch [64/300], Step [133/225], Training Accuracy: 92.8102%, Training Loss: 0.1886%
Epoch [64/300], Step [134/225], Training Accuracy: 92.7705%, Training Loss: 0.1899%
Epoch [64/300], Step [135/225], Training Accuracy: 92.7662%, Training Loss: 0.1898%
Epoch [64/300], Step [136/225], Training Accuracy: 92.7619%, Training Loss: 

Epoch [64/300], Step [224/225], Training Accuracy: 92.8990%, Training Loss: 0.1852%
Epoch [64/300], Step [225/225], Training Accuracy: 92.9127%, Training Loss: 0.1848%
Epoch [65/300], Step [1/225], Training Accuracy: 92.1875%, Training Loss: 0.1767%
Epoch [65/300], Step [2/225], Training Accuracy: 94.5312%, Training Loss: 0.1781%
Epoch [65/300], Step [3/225], Training Accuracy: 95.3125%, Training Loss: 0.1588%
Epoch [65/300], Step [4/225], Training Accuracy: 94.5312%, Training Loss: 0.1929%
Epoch [65/300], Step [5/225], Training Accuracy: 92.8125%, Training Loss: 0.2239%
Epoch [65/300], Step [6/225], Training Accuracy: 92.9688%, Training Loss: 0.2137%
Epoch [65/300], Step [7/225], Training Accuracy: 92.8571%, Training Loss: 0.2062%
Epoch [65/300], Step [8/225], Training Accuracy: 93.3594%, Training Loss: 0.1919%
Epoch [65/300], Step [9/225], Training Accuracy: 93.0556%, Training Loss: 0.1990%
Epoch [65/300], Step [10/225], Training Accuracy: 92.9688%, Training Loss: 0.1986%
Epoch [65/3

Epoch [65/300], Step [98/225], Training Accuracy: 93.0325%, Training Loss: 0.1780%
Epoch [65/300], Step [99/225], Training Accuracy: 93.0398%, Training Loss: 0.1778%
Epoch [65/300], Step [100/225], Training Accuracy: 93.0000%, Training Loss: 0.1784%
Epoch [65/300], Step [101/225], Training Accuracy: 92.9920%, Training Loss: 0.1783%
Epoch [65/300], Step [102/225], Training Accuracy: 92.9534%, Training Loss: 0.1796%
Epoch [65/300], Step [103/225], Training Accuracy: 92.8701%, Training Loss: 0.1819%
Epoch [65/300], Step [104/225], Training Accuracy: 92.8185%, Training Loss: 0.1835%
Epoch [65/300], Step [105/225], Training Accuracy: 92.8720%, Training Loss: 0.1827%
Epoch [65/300], Step [106/225], Training Accuracy: 92.8656%, Training Loss: 0.1828%
Epoch [65/300], Step [107/225], Training Accuracy: 92.8884%, Training Loss: 0.1823%
Epoch [65/300], Step [108/225], Training Accuracy: 92.9543%, Training Loss: 0.1816%
Epoch [65/300], Step [109/225], Training Accuracy: 92.9616%, Training Loss: 0.

Epoch [65/300], Step [197/225], Training Accuracy: 93.3058%, Training Loss: 0.1744%
Epoch [65/300], Step [198/225], Training Accuracy: 93.3160%, Training Loss: 0.1742%
Epoch [65/300], Step [199/225], Training Accuracy: 93.3182%, Training Loss: 0.1741%
Epoch [65/300], Step [200/225], Training Accuracy: 93.3047%, Training Loss: 0.1740%
Epoch [65/300], Step [201/225], Training Accuracy: 93.2836%, Training Loss: 0.1745%
Epoch [65/300], Step [202/225], Training Accuracy: 93.2782%, Training Loss: 0.1745%
Epoch [65/300], Step [203/225], Training Accuracy: 93.2959%, Training Loss: 0.1741%
Epoch [65/300], Step [204/225], Training Accuracy: 93.2981%, Training Loss: 0.1739%
Epoch [65/300], Step [205/225], Training Accuracy: 93.3232%, Training Loss: 0.1733%
Epoch [65/300], Step [206/225], Training Accuracy: 93.3177%, Training Loss: 0.1734%
Epoch [65/300], Step [207/225], Training Accuracy: 93.2971%, Training Loss: 0.1736%
Epoch [65/300], Step [208/225], Training Accuracy: 93.2918%, Training Loss: 

Epoch [66/300], Step [71/225], Training Accuracy: 93.8820%, Training Loss: 0.1684%
Epoch [66/300], Step [72/225], Training Accuracy: 93.7717%, Training Loss: 0.1708%
Epoch [66/300], Step [73/225], Training Accuracy: 93.7286%, Training Loss: 0.1709%
Epoch [66/300], Step [74/225], Training Accuracy: 93.7078%, Training Loss: 0.1708%
Epoch [66/300], Step [75/225], Training Accuracy: 93.7500%, Training Loss: 0.1699%
Epoch [66/300], Step [76/225], Training Accuracy: 93.7706%, Training Loss: 0.1701%
Epoch [66/300], Step [77/225], Training Accuracy: 93.7297%, Training Loss: 0.1709%
Epoch [66/300], Step [78/225], Training Accuracy: 93.6699%, Training Loss: 0.1719%
Epoch [66/300], Step [79/225], Training Accuracy: 93.7302%, Training Loss: 0.1705%
Epoch [66/300], Step [80/225], Training Accuracy: 93.6719%, Training Loss: 0.1713%
Epoch [66/300], Step [81/225], Training Accuracy: 93.6535%, Training Loss: 0.1710%
Epoch [66/300], Step [82/225], Training Accuracy: 93.6738%, Training Loss: 0.1703%
Epoc

Epoch [66/300], Step [170/225], Training Accuracy: 93.1618%, Training Loss: 0.1817%
Epoch [66/300], Step [171/225], Training Accuracy: 93.1743%, Training Loss: 0.1815%
Epoch [66/300], Step [172/225], Training Accuracy: 93.1686%, Training Loss: 0.1817%
Epoch [66/300], Step [173/225], Training Accuracy: 93.1629%, Training Loss: 0.1815%
Epoch [66/300], Step [174/225], Training Accuracy: 93.1573%, Training Loss: 0.1818%
Epoch [66/300], Step [175/225], Training Accuracy: 93.1339%, Training Loss: 0.1819%
Epoch [66/300], Step [176/225], Training Accuracy: 93.1374%, Training Loss: 0.1818%
Epoch [66/300], Step [177/225], Training Accuracy: 93.1585%, Training Loss: 0.1812%
Epoch [66/300], Step [178/225], Training Accuracy: 93.1970%, Training Loss: 0.1807%
Epoch [66/300], Step [179/225], Training Accuracy: 93.1652%, Training Loss: 0.1811%
Epoch [66/300], Step [180/225], Training Accuracy: 93.1510%, Training Loss: 0.1817%
Epoch [66/300], Step [181/225], Training Accuracy: 93.1371%, Training Loss: 

Epoch [67/300], Step [44/225], Training Accuracy: 93.5014%, Training Loss: 0.1705%
Epoch [67/300], Step [45/225], Training Accuracy: 93.5069%, Training Loss: 0.1709%
Epoch [67/300], Step [46/225], Training Accuracy: 93.4783%, Training Loss: 0.1701%
Epoch [67/300], Step [47/225], Training Accuracy: 93.4508%, Training Loss: 0.1719%
Epoch [67/300], Step [48/225], Training Accuracy: 93.5221%, Training Loss: 0.1714%
Epoch [67/300], Step [49/225], Training Accuracy: 93.5906%, Training Loss: 0.1700%
Epoch [67/300], Step [50/225], Training Accuracy: 93.6562%, Training Loss: 0.1693%
Epoch [67/300], Step [51/225], Training Accuracy: 93.7194%, Training Loss: 0.1679%
Epoch [67/300], Step [52/225], Training Accuracy: 93.7500%, Training Loss: 0.1667%
Epoch [67/300], Step [53/225], Training Accuracy: 93.8090%, Training Loss: 0.1657%
Epoch [67/300], Step [54/225], Training Accuracy: 93.7211%, Training Loss: 0.1669%
Epoch [67/300], Step [55/225], Training Accuracy: 93.7216%, Training Loss: 0.1665%
Epoc

Epoch [67/300], Step [143/225], Training Accuracy: 93.6517%, Training Loss: 0.1687%
Epoch [67/300], Step [144/225], Training Accuracy: 93.6632%, Training Loss: 0.1686%
Epoch [67/300], Step [145/225], Training Accuracy: 93.6315%, Training Loss: 0.1693%
Epoch [67/300], Step [146/225], Training Accuracy: 93.6644%, Training Loss: 0.1686%
Epoch [67/300], Step [147/225], Training Accuracy: 93.6437%, Training Loss: 0.1688%
Epoch [67/300], Step [148/225], Training Accuracy: 93.6444%, Training Loss: 0.1685%
Epoch [67/300], Step [149/225], Training Accuracy: 93.6346%, Training Loss: 0.1684%
Epoch [67/300], Step [150/225], Training Accuracy: 93.6354%, Training Loss: 0.1682%
Epoch [67/300], Step [151/225], Training Accuracy: 93.6569%, Training Loss: 0.1677%
Epoch [67/300], Step [152/225], Training Accuracy: 93.6472%, Training Loss: 0.1682%
Epoch [67/300], Step [153/225], Training Accuracy: 93.6377%, Training Loss: 0.1684%
Epoch [67/300], Step [154/225], Training Accuracy: 93.6485%, Training Loss: 

Epoch [68/300], Step [17/225], Training Accuracy: 92.0956%, Training Loss: 0.1895%
Epoch [68/300], Step [18/225], Training Accuracy: 92.3611%, Training Loss: 0.1892%
Epoch [68/300], Step [19/225], Training Accuracy: 92.4342%, Training Loss: 0.1906%
Epoch [68/300], Step [20/225], Training Accuracy: 92.4219%, Training Loss: 0.1875%
Epoch [68/300], Step [21/225], Training Accuracy: 92.6339%, Training Loss: 0.1815%
Epoch [68/300], Step [22/225], Training Accuracy: 92.5426%, Training Loss: 0.1872%
Epoch [68/300], Step [23/225], Training Accuracy: 92.5272%, Training Loss: 0.1885%
Epoch [68/300], Step [24/225], Training Accuracy: 92.5130%, Training Loss: 0.1883%
Epoch [68/300], Step [25/225], Training Accuracy: 92.6875%, Training Loss: 0.1833%
Epoch [68/300], Step [26/225], Training Accuracy: 92.7885%, Training Loss: 0.1803%
Epoch [68/300], Step [27/225], Training Accuracy: 92.8241%, Training Loss: 0.1782%
Epoch [68/300], Step [28/225], Training Accuracy: 92.8571%, Training Loss: 0.1755%
Epoc

Epoch [68/300], Step [116/225], Training Accuracy: 93.0765%, Training Loss: 0.1939%
Epoch [68/300], Step [117/225], Training Accuracy: 93.1357%, Training Loss: 0.1928%
Epoch [68/300], Step [118/225], Training Accuracy: 93.1144%, Training Loss: 0.1933%
Epoch [68/300], Step [119/225], Training Accuracy: 93.1329%, Training Loss: 0.1928%
Epoch [68/300], Step [120/225], Training Accuracy: 93.0729%, Training Loss: 0.1935%
Epoch [68/300], Step [121/225], Training Accuracy: 93.1043%, Training Loss: 0.1932%
Epoch [68/300], Step [122/225], Training Accuracy: 93.1096%, Training Loss: 0.1929%
Epoch [68/300], Step [123/225], Training Accuracy: 93.1021%, Training Loss: 0.1929%
Epoch [68/300], Step [124/225], Training Accuracy: 93.0570%, Training Loss: 0.1943%
Epoch [68/300], Step [125/225], Training Accuracy: 93.1000%, Training Loss: 0.1936%
Epoch [68/300], Step [126/225], Training Accuracy: 93.0804%, Training Loss: 0.1938%
Epoch [68/300], Step [127/225], Training Accuracy: 93.0487%, Training Loss: 

Epoch [68/300], Step [215/225], Training Accuracy: 92.9651%, Training Loss: 0.1935%
Epoch [68/300], Step [216/225], Training Accuracy: 92.9832%, Training Loss: 0.1930%
Epoch [68/300], Step [217/225], Training Accuracy: 92.9724%, Training Loss: 0.1931%
Epoch [68/300], Step [218/225], Training Accuracy: 92.9544%, Training Loss: 0.1935%
Epoch [68/300], Step [219/225], Training Accuracy: 92.9580%, Training Loss: 0.1936%
Epoch [68/300], Step [220/225], Training Accuracy: 92.9616%, Training Loss: 0.1934%
Epoch [68/300], Step [221/225], Training Accuracy: 92.9794%, Training Loss: 0.1928%
Epoch [68/300], Step [222/225], Training Accuracy: 92.9617%, Training Loss: 0.1934%
Epoch [68/300], Step [223/225], Training Accuracy: 92.9442%, Training Loss: 0.1936%
Epoch [68/300], Step [224/225], Training Accuracy: 92.9060%, Training Loss: 0.1944%
Epoch [68/300], Step [225/225], Training Accuracy: 92.9266%, Training Loss: 0.1942%
Epoch [69/300], Step [1/225], Training Accuracy: 90.6250%, Training Loss: 0.

Epoch [69/300], Step [89/225], Training Accuracy: 93.1706%, Training Loss: 0.1808%
Epoch [69/300], Step [90/225], Training Accuracy: 93.1771%, Training Loss: 0.1803%
Epoch [69/300], Step [91/225], Training Accuracy: 93.2005%, Training Loss: 0.1793%
Epoch [69/300], Step [92/225], Training Accuracy: 93.1895%, Training Loss: 0.1793%
Epoch [69/300], Step [93/225], Training Accuracy: 93.2292%, Training Loss: 0.1783%
Epoch [69/300], Step [94/225], Training Accuracy: 93.2181%, Training Loss: 0.1779%
Epoch [69/300], Step [95/225], Training Accuracy: 93.2401%, Training Loss: 0.1772%
Epoch [69/300], Step [96/225], Training Accuracy: 93.2943%, Training Loss: 0.1761%
Epoch [69/300], Step [97/225], Training Accuracy: 93.2990%, Training Loss: 0.1760%
Epoch [69/300], Step [98/225], Training Accuracy: 93.2876%, Training Loss: 0.1771%
Epoch [69/300], Step [99/225], Training Accuracy: 93.2765%, Training Loss: 0.1775%
Epoch [69/300], Step [100/225], Training Accuracy: 93.2500%, Training Loss: 0.1785%
Epo

Epoch [69/300], Step [188/225], Training Accuracy: 92.9937%, Training Loss: 0.1828%
Epoch [69/300], Step [189/225], Training Accuracy: 92.9894%, Training Loss: 0.1830%
Epoch [69/300], Step [190/225], Training Accuracy: 92.9770%, Training Loss: 0.1833%
Epoch [69/300], Step [191/225], Training Accuracy: 92.9647%, Training Loss: 0.1836%
Epoch [69/300], Step [192/225], Training Accuracy: 92.9606%, Training Loss: 0.1834%
Epoch [69/300], Step [193/225], Training Accuracy: 92.9809%, Training Loss: 0.1832%
Epoch [69/300], Step [194/225], Training Accuracy: 92.9849%, Training Loss: 0.1832%
Epoch [69/300], Step [195/225], Training Accuracy: 93.0048%, Training Loss: 0.1829%
Epoch [69/300], Step [196/225], Training Accuracy: 93.0006%, Training Loss: 0.1832%
Epoch [69/300], Step [197/225], Training Accuracy: 92.9965%, Training Loss: 0.1833%
Epoch [69/300], Step [198/225], Training Accuracy: 93.0003%, Training Loss: 0.1833%
Epoch [69/300], Step [199/225], Training Accuracy: 92.9884%, Training Loss: 

Epoch [70/300], Step [62/225], Training Accuracy: 93.6240%, Training Loss: 0.1671%
Epoch [70/300], Step [63/225], Training Accuracy: 93.6260%, Training Loss: 0.1673%
Epoch [70/300], Step [64/225], Training Accuracy: 93.6523%, Training Loss: 0.1665%
Epoch [70/300], Step [65/225], Training Accuracy: 93.5817%, Training Loss: 0.1674%
Epoch [70/300], Step [66/225], Training Accuracy: 93.6316%, Training Loss: 0.1674%
Epoch [70/300], Step [67/225], Training Accuracy: 93.6567%, Training Loss: 0.1670%
Epoch [70/300], Step [68/225], Training Accuracy: 93.6811%, Training Loss: 0.1673%
Epoch [70/300], Step [69/225], Training Accuracy: 93.6594%, Training Loss: 0.1672%
Epoch [70/300], Step [70/225], Training Accuracy: 93.6830%, Training Loss: 0.1661%
Epoch [70/300], Step [71/225], Training Accuracy: 93.7060%, Training Loss: 0.1661%
Epoch [70/300], Step [72/225], Training Accuracy: 93.7066%, Training Loss: 0.1663%
Epoch [70/300], Step [73/225], Training Accuracy: 93.7286%, Training Loss: 0.1662%
Epoc

Epoch [70/300], Step [161/225], Training Accuracy: 93.6530%, Training Loss: 0.1667%
Epoch [70/300], Step [162/225], Training Accuracy: 93.6535%, Training Loss: 0.1667%
Epoch [70/300], Step [163/225], Training Accuracy: 93.6541%, Training Loss: 0.1665%
Epoch [70/300], Step [164/225], Training Accuracy: 93.6738%, Training Loss: 0.1659%
Epoch [70/300], Step [165/225], Training Accuracy: 93.6458%, Training Loss: 0.1661%
Epoch [70/300], Step [166/225], Training Accuracy: 93.6653%, Training Loss: 0.1661%
Epoch [70/300], Step [167/225], Training Accuracy: 93.6845%, Training Loss: 0.1656%
Epoch [70/300], Step [168/225], Training Accuracy: 93.7035%, Training Loss: 0.1652%
Epoch [70/300], Step [169/225], Training Accuracy: 93.7130%, Training Loss: 0.1648%
Epoch [70/300], Step [170/225], Training Accuracy: 93.7224%, Training Loss: 0.1646%
Epoch [70/300], Step [171/225], Training Accuracy: 93.7500%, Training Loss: 0.1642%
Epoch [70/300], Step [172/225], Training Accuracy: 93.7227%, Training Loss: 

In [None]:
# Test the model
model.eval()  # eval mode (batchnorm uses moving mean/variance instead of mini-batch mean/variance)
with torch.no_grad():
    correct = 0
    total = 0
    for X, Y in test_loader:
        X = X.to(device)
        Y = Y.to(device)
        outputs = model(X)
        _, predicted = torch.max(outputs.data, 1)
        total += Y.size(0)
        correct += (predicted == Y).sum().item()

    print('Test Accuracy : {} %'.format(100 * correct / total))

# Save the model checkpoint
#torch.save(model.state_dict(), 'model.ckpt')