In [1]:
import pandas as pd
import numpy as np
import torch
import torch.nn as nn
from torch.utils.data import TensorDataset, DataLoader
from torch import Tensor
import torch.nn.functional as F
from torch.optim.lr_scheduler import MultiStepLR
from torch.utils.tensorboard import SummaryWriter

![image.png](attachment:image.png)

In [2]:
writer = SummaryWriter()

In [3]:
train_set = pd.read_csv("data/final_format/train_set.csv",header=None).to_numpy()
train_label = pd.read_csv("data/final_format/train_label.csv",header=None).to_numpy()
test_set = pd.read_csv("data/final_format/test_set.csv",header=None).to_numpy()
test_label = pd.read_csv("data/final_format/test_label.csv",header=None).to_numpy()

In [4]:
print(train_set.shape, train_label.shape, test_set.shape, test_label.shape)

(14393, 4096) (14393, 1) (3599, 4096) (3599, 1)


In [5]:
#delet first row data
train_set = train_set[1:]
train_label = train_label[1:]
test_set = test_set[1:]
test_label = test_label[1:]
print(train_set.shape, train_label.shape, test_set.shape, test_label.shape)

(14392, 4096) (14392, 1) (3598, 4096) (3598, 1)


In [6]:
train_set = train_set.reshape((-1,64,64))
test_set = test_set.reshape((-1,64,64))
print(train_set.shape, train_label.shape, test_set.shape, test_label.shape)

(14392, 64, 64) (14392, 1) (3598, 64, 64) (3598, 1)


In [7]:
train_label = train_label.reshape(-1)
test_label = test_label.reshape(-1)

print(train_set.shape, train_label.shape, test_set.shape, test_label.shape)

(14392, 64, 64) (14392,) (3598, 64, 64) (3598,)


In [8]:
# Hyper parameters
num_epochs = 300
num_classes = 4
batch_size = 64
learning_rate = 1e-4

In [9]:
train_set_tensor = Tensor(train_set) 
train_label_tensor = Tensor(train_label).type(torch.LongTensor)

train_dataset = TensorDataset(train_set_tensor,train_label_tensor) 
train_loader = DataLoader(train_dataset, batch_size=batch_size) 

test_set_tensor = Tensor(test_set) 
test_label_tensor = Tensor(test_label).type(torch.LongTensor)

test_dataset = TensorDataset(test_set_tensor,test_label_tensor) 
test_loader = DataLoader(test_dataset, batch_size=batch_size) 

In [10]:
# Device configuration
device = torch.device('cuda:0' if torch.cuda.is_available() else 'cpu')
device

device(type='cuda', index=0)

In [11]:
# Authors: Patryk Chrabaszcz
#          Lukas Gemein <l.gemein@gmail.com>
#
# License: BSD-3

from torch import nn
from torch.nn import init
from torch.nn.utils import weight_norm

from function.modules import Ensure4d, Expression
from function.functions import squeeze_final_output


class TCN(nn.Module):
    """Temporal Convolutional Network (TCN) from Bai et al 2018.

    See [Bai2018]_ for details.

    Code adapted from https://github.com/locuslab/TCN/blob/master/TCN/tcn.py

    Parameters
    ---------- 
    n_in_chans: int
        number of input EEG channels
    n_outputs: int
        number of outputs of the decoding task (for example number of classes in
        classification)
    n_filters: int
        number of output filters of each convolution
    n_blocks: int
        number of temporal blocks in the network
    kernel_size: int
        kernel size of the convolutions
    drop_prob: float
        dropout probability
    add_log_softmax: bool
        whether to add a log softmax layer

    References
    ----------
    .. [Bai2018] Bai, S., Kolter, J. Z., & Koltun, V. (2018).
       An empirical evaluation of generic convolutional and recurrent networks
       for sequence modeling.
       arXiv preprint arXiv:1803.01271.
    """
    def __init__(self, n_in_chans=64, n_outputs=4, n_blocks=4
                 , n_filters=24, kernel_size=3,
                 drop_prob=0.25, add_log_softmax=False):
        super().__init__()
        self.ensuredims = Ensure4d()
        t_blocks = nn.Sequential()
        for i in range(n_blocks):
            n_inputs = n_in_chans if i == 0 else n_filters
            dilation_size = 2 ** i
            t_blocks.add_module("temporal_block_{:d}".format(i), TemporalBlock(
                n_inputs=n_inputs,
                n_outputs=n_filters,
                kernel_size=kernel_size,
                stride=1,
                dilation=dilation_size,
                padding=(kernel_size - 1) * dilation_size,
                drop_prob=drop_prob
            ))
        self.temporal_blocks = t_blocks
        self.fc = nn.Linear(in_features=n_filters, out_features=n_outputs)
        self.fc_last = nn.Linear(4*4, out_features=n_outputs)
        if add_log_softmax:
            self.log_softmax = nn.LogSoftmax(dim=1)
        self.squeeze = Expression(squeeze_final_output)

        self.min_len = 1
        for i in range(n_blocks):
            dilation = 2 ** i
            self.min_len += 2 * (kernel_size - 1) * dilation

        # start in eval mode
        self.eval()

    def forward(self, x):
        """Forward pass.

        Parameters
        ----------
        x: torch.Tensor
            Batch of EEG windows of shape (batch_size, n_channels, n_times).
        """
        # b 64 64
        x = self.ensuredims(x)
        # x is in format: B x C x T x 1
        (batch_size, _, time_size, _) = x.size()
        
        assert time_size >= self.min_len
        # remove empty trailing dimension
        x = x.squeeze(3)
        # b 64 64
        x = self.temporal_blocks(x)
        #  if n_blocks = 2 -> b 20 64
        # Convert to: B x T x C
        x = x.transpose(1, 2).contiguous()
        # b 64 20
        fc_out = self.fc(x.view(batch_size * time_size, x.size(2)))
        # b*64 4
        fc_out = fc_out.view(batch_size, time_size, fc_out.size(1))
        #b 64 4
        out_size = 1 + max(0, time_size - self.min_len)
        out = fc_out[:, -out_size:, :].transpose(1, 2)
        #b 4 52
        out = self.fc_last(out.reshape(out.size(0),-1))
       
        return out


class TemporalBlock(nn.Module):
    def __init__(self, n_inputs, n_outputs, kernel_size, stride, dilation,
                 padding, drop_prob):
        super().__init__()
        self.conv1 = weight_norm(nn.Conv1d(
            n_inputs, n_outputs, kernel_size,
            stride=stride, padding=padding, dilation=dilation))
        self.chomp1 = Chomp1d(padding)
        self.relu1 = nn.ReLU()
        self.dropout1 = nn.Dropout2d(drop_prob)

        self.conv2 = weight_norm(nn.Conv1d(
            n_outputs, n_outputs, kernel_size,
            stride=stride, padding=padding, dilation=dilation))
        self.chomp2 = Chomp1d(padding)
        self.relu2 = nn.ReLU()
        self.dropout2 = nn.Dropout2d(drop_prob)

        self.downsample = (nn.Conv1d(n_inputs, n_outputs, 1)
                           if n_inputs != n_outputs else None)
        self.relu = nn.ReLU()

        init.normal_(self.conv1.weight, 0, 0.01)
        init.normal_(self.conv2.weight, 0, 0.01)
        if self.downsample is not None:
            init.normal_(self.downsample.weight, 0, 0.01)

    def forward(self, x):
        #b 64 64, b 20 64 
        out = self.conv1(x)
        #b 20 66, b 20 68
        out = self.chomp1(out)
        #b 20 64, b 20 64
        out = self.relu1(out)
        out = self.dropout1(out)
        out = self.conv2(out)
        #b 20 66, b 20 68 
        out = self.chomp2(out)
        #b 20 64, b 20 64
        out = self.relu2(out)
        out = self.dropout2(out)
        res = x if self.downsample is None else self.downsample(x)# b 20 64
        return self.relu(out + res)


class Chomp1d(nn.Module):
    def __init__(self, chomp_size):
        super().__init__()
        self.chomp_size = chomp_size

    def extra_repr(self):
        return 'chomp_size={}'.format(self.chomp_size)

    def forward(self, x):
        return x[:, :, :-self.chomp_size].contiguous()


In [12]:
test = torch.randn((64,1,10))
test[None,:,:].shape

torch.Size([1, 64, 1, 10])

In [13]:
a = torch.randn((10,64,64))
model = TCN()
b = model(a)
b.shape

torch.Size([10, 4])

In [14]:
print(model)

TCN(
  (ensuredims): Ensure4d()
  (temporal_blocks): Sequential(
    (temporal_block_0): TemporalBlock(
      (conv1): Conv1d(64, 24, kernel_size=(3,), stride=(1,), padding=(2,))
      (chomp1): Chomp1d(chomp_size=2)
      (relu1): ReLU()
      (dropout1): Dropout2d(p=0.25, inplace=False)
      (conv2): Conv1d(24, 24, kernel_size=(3,), stride=(1,), padding=(2,))
      (chomp2): Chomp1d(chomp_size=2)
      (relu2): ReLU()
      (dropout2): Dropout2d(p=0.25, inplace=False)
      (downsample): Conv1d(64, 24, kernel_size=(1,), stride=(1,))
      (relu): ReLU()
    )
    (temporal_block_1): TemporalBlock(
      (conv1): Conv1d(24, 24, kernel_size=(3,), stride=(1,), padding=(4,), dilation=(2,))
      (chomp1): Chomp1d(chomp_size=4)
      (relu1): ReLU()
      (dropout1): Dropout2d(p=0.25, inplace=False)
      (conv2): Conv1d(24, 24, kernel_size=(3,), stride=(1,), padding=(4,), dilation=(2,))
      (chomp2): Chomp1d(chomp_size=4)
      (relu2): ReLU()
      (dropout2): Dropout2d(p=0.25, inpla

In [15]:
model = TCN().to(device)

In [16]:
# Loss and optimizer
criterion = nn.CrossEntropyLoss()
optimizer = torch.optim.Adam(model.parameters(), lr=learning_rate, weight_decay=1e-3) 
#optimizer = torch.optim.Adam(model.parameters(), lr=learning_rate) 
milestones = [50,100,150,200,250]
milestones = [a * len(train_loader) for a in milestones]
scheduler = MultiStepLR(optimizer, milestones=milestones, gamma=0.5)

In [None]:

# Train the model
total_step = len(train_loader)
for epoch in range(num_epochs):
    correct=0
    total=0
    running_loss = 0
    for i, (X, Y) in enumerate(train_loader):
        X = X.to(device)
        Y = Y.to(device)


        # Forward pass
        outputs = model(X)
        loss = criterion(outputs, Y)

        # Backward and optimize
        optimizer.zero_grad()
        loss.backward()
        #scheduler.step() 
        #print(scheduler.get_last_lr()[0])

        optimizer.step()
        scheduler.step() 
        #print(optimizer.param_groups[0]["lr"])

        _, predicted = outputs.max(1)
        total += Y.size(0)
        correct += predicted.eq(Y).sum().item()
        running_loss += loss.item()
        accu=100.*correct/total
        train_loss = running_loss/(i+1)
        print ('Epoch [{}/{}], Step [{}/{}], Training Accuracy: {:.4f}%, Training Loss: {:.4f}%'.format(epoch+1, num_epochs, i+1, total_step, accu, train_loss))


        #writer.add_scalar(f'train/accuracy', accu, epoch)
        #writer.add_scalar(f'train/loss', train_loss, epoch)
        writer.add_scalars(f'train/accuracy_loss', {
            'accuracy': accu,
            'loss': train_loss,
        }, epoch)



Epoch [1/300], Step [1/225], Training Accuracy: 26.5625%, Training Loss: 1.3893%
Epoch [1/300], Step [2/225], Training Accuracy: 25.0000%, Training Loss: 1.3875%
Epoch [1/300], Step [3/225], Training Accuracy: 23.4375%, Training Loss: 1.3872%
Epoch [1/300], Step [4/225], Training Accuracy: 24.2188%, Training Loss: 1.3865%
Epoch [1/300], Step [5/225], Training Accuracy: 22.1875%, Training Loss: 1.3896%
Epoch [1/300], Step [6/225], Training Accuracy: 24.2188%, Training Loss: 1.3875%
Epoch [1/300], Step [7/225], Training Accuracy: 24.1071%, Training Loss: 1.3869%
Epoch [1/300], Step [8/225], Training Accuracy: 25.0000%, Training Loss: 1.3859%
Epoch [1/300], Step [9/225], Training Accuracy: 25.1736%, Training Loss: 1.3864%
Epoch [1/300], Step [10/225], Training Accuracy: 25.4688%, Training Loss: 1.3854%
Epoch [1/300], Step [11/225], Training Accuracy: 26.1364%, Training Loss: 1.3859%
Epoch [1/300], Step [12/225], Training Accuracy: 26.3021%, Training Loss: 1.3852%
Epoch [1/300], Step [13/2

Epoch [1/300], Step [109/225], Training Accuracy: 26.4908%, Training Loss: 1.3857%
Epoch [1/300], Step [110/225], Training Accuracy: 26.5909%, Training Loss: 1.3856%
Epoch [1/300], Step [111/225], Training Accuracy: 26.6188%, Training Loss: 1.3855%
Epoch [1/300], Step [112/225], Training Accuracy: 26.6323%, Training Loss: 1.3855%
Epoch [1/300], Step [113/225], Training Accuracy: 26.6316%, Training Loss: 1.3855%
Epoch [1/300], Step [114/225], Training Accuracy: 26.6721%, Training Loss: 1.3854%
Epoch [1/300], Step [115/225], Training Accuracy: 26.6984%, Training Loss: 1.3854%
Epoch [1/300], Step [116/225], Training Accuracy: 26.7915%, Training Loss: 1.3853%
Epoch [1/300], Step [117/225], Training Accuracy: 26.7228%, Training Loss: 1.3854%
Epoch [1/300], Step [118/225], Training Accuracy: 26.7744%, Training Loss: 1.3853%
Epoch [1/300], Step [119/225], Training Accuracy: 26.8251%, Training Loss: 1.3852%
Epoch [1/300], Step [120/225], Training Accuracy: 26.8099%, Training Loss: 1.3853%
Epoc

Epoch [1/300], Step [220/225], Training Accuracy: 27.7841%, Training Loss: 1.3833%
Epoch [1/300], Step [221/225], Training Accuracy: 27.7574%, Training Loss: 1.3833%
Epoch [1/300], Step [222/225], Training Accuracy: 27.7942%, Training Loss: 1.3833%
Epoch [1/300], Step [223/225], Training Accuracy: 27.7536%, Training Loss: 1.3833%
Epoch [1/300], Step [224/225], Training Accuracy: 27.7204%, Training Loss: 1.3834%
Epoch [1/300], Step [225/225], Training Accuracy: 27.6959%, Training Loss: 1.3835%
Epoch [2/300], Step [1/225], Training Accuracy: 35.9375%, Training Loss: 1.3715%
Epoch [2/300], Step [2/225], Training Accuracy: 33.5938%, Training Loss: 1.3712%
Epoch [2/300], Step [3/225], Training Accuracy: 31.2500%, Training Loss: 1.3718%
Epoch [2/300], Step [4/225], Training Accuracy: 31.6406%, Training Loss: 1.3709%
Epoch [2/300], Step [5/225], Training Accuracy: 28.7500%, Training Loss: 1.3751%
Epoch [2/300], Step [6/225], Training Accuracy: 28.6458%, Training Loss: 1.3761%
Epoch [2/300], S

Epoch [2/300], Step [106/225], Training Accuracy: 30.9994%, Training Loss: 1.3755%
Epoch [2/300], Step [107/225], Training Accuracy: 30.9725%, Training Loss: 1.3755%
Epoch [2/300], Step [108/225], Training Accuracy: 30.9896%, Training Loss: 1.3755%
Epoch [2/300], Step [109/225], Training Accuracy: 30.9776%, Training Loss: 1.3754%
Epoch [2/300], Step [110/225], Training Accuracy: 31.0227%, Training Loss: 1.3752%
Epoch [2/300], Step [111/225], Training Accuracy: 31.0670%, Training Loss: 1.3751%
Epoch [2/300], Step [112/225], Training Accuracy: 31.1523%, Training Loss: 1.3749%
Epoch [2/300], Step [113/225], Training Accuracy: 31.1117%, Training Loss: 1.3751%
Epoch [2/300], Step [114/225], Training Accuracy: 31.0992%, Training Loss: 1.3749%
Epoch [2/300], Step [115/225], Training Accuracy: 31.0870%, Training Loss: 1.3748%
Epoch [2/300], Step [116/225], Training Accuracy: 31.1422%, Training Loss: 1.3746%
Epoch [2/300], Step [117/225], Training Accuracy: 31.0897%, Training Loss: 1.3749%
Epoc

Epoch [2/300], Step [221/225], Training Accuracy: 31.6035%, Training Loss: 1.3705%
Epoch [2/300], Step [222/225], Training Accuracy: 31.6512%, Training Loss: 1.3704%
Epoch [2/300], Step [223/225], Training Accuracy: 31.6284%, Training Loss: 1.3705%
Epoch [2/300], Step [224/225], Training Accuracy: 31.5918%, Training Loss: 1.3706%
Epoch [2/300], Step [225/225], Training Accuracy: 31.6078%, Training Loss: 1.3707%
Epoch [3/300], Step [1/225], Training Accuracy: 32.8125%, Training Loss: 1.3550%
Epoch [3/300], Step [2/225], Training Accuracy: 32.8125%, Training Loss: 1.3526%
Epoch [3/300], Step [3/225], Training Accuracy: 30.7292%, Training Loss: 1.3554%
Epoch [3/300], Step [4/225], Training Accuracy: 31.2500%, Training Loss: 1.3507%
Epoch [3/300], Step [5/225], Training Accuracy: 31.2500%, Training Loss: 1.3586%
Epoch [3/300], Step [6/225], Training Accuracy: 30.4688%, Training Loss: 1.3606%
Epoch [3/300], Step [7/225], Training Accuracy: 31.0268%, Training Loss: 1.3587%
Epoch [3/300], Ste

Epoch [3/300], Step [109/225], Training Accuracy: 33.0275%, Training Loss: 1.3470%
Epoch [3/300], Step [110/225], Training Accuracy: 33.0966%, Training Loss: 1.3466%
Epoch [3/300], Step [111/225], Training Accuracy: 33.1222%, Training Loss: 1.3463%
Epoch [3/300], Step [112/225], Training Accuracy: 33.1613%, Training Loss: 1.3460%
Epoch [3/300], Step [113/225], Training Accuracy: 33.1444%, Training Loss: 1.3463%
Epoch [3/300], Step [114/225], Training Accuracy: 33.1689%, Training Loss: 1.3457%
Epoch [3/300], Step [115/225], Training Accuracy: 33.1658%, Training Loss: 1.3455%
Epoch [3/300], Step [116/225], Training Accuracy: 33.2435%, Training Loss: 1.3450%
Epoch [3/300], Step [117/225], Training Accuracy: 33.1998%, Training Loss: 1.3457%
Epoch [3/300], Step [118/225], Training Accuracy: 33.2495%, Training Loss: 1.3455%
Epoch [3/300], Step [119/225], Training Accuracy: 33.2589%, Training Loss: 1.3455%
Epoch [3/300], Step [120/225], Training Accuracy: 33.2943%, Training Loss: 1.3456%
Epoc

Epoch [3/300], Step [222/225], Training Accuracy: 34.6847%, Training Loss: 1.3285%
Epoch [3/300], Step [223/225], Training Accuracy: 34.6623%, Training Loss: 1.3284%
Epoch [3/300], Step [224/225], Training Accuracy: 34.6191%, Training Loss: 1.3283%
Epoch [3/300], Step [225/225], Training Accuracy: 34.6304%, Training Loss: 1.3283%
Epoch [4/300], Step [1/225], Training Accuracy: 40.6250%, Training Loss: 1.3006%
Epoch [4/300], Step [2/225], Training Accuracy: 39.8438%, Training Loss: 1.3168%
Epoch [4/300], Step [3/225], Training Accuracy: 35.9375%, Training Loss: 1.3237%
Epoch [4/300], Step [4/225], Training Accuracy: 38.2812%, Training Loss: 1.3030%
Epoch [4/300], Step [5/225], Training Accuracy: 39.0625%, Training Loss: 1.3097%
Epoch [4/300], Step [6/225], Training Accuracy: 38.8021%, Training Loss: 1.3192%
Epoch [4/300], Step [7/225], Training Accuracy: 38.1696%, Training Loss: 1.3141%
Epoch [4/300], Step [8/225], Training Accuracy: 36.5234%, Training Loss: 1.3103%
Epoch [4/300], Step 

Epoch [4/300], Step [108/225], Training Accuracy: 37.1238%, Training Loss: 1.2820%
Epoch [4/300], Step [109/225], Training Accuracy: 37.0700%, Training Loss: 1.2820%
Epoch [4/300], Step [110/225], Training Accuracy: 37.0739%, Training Loss: 1.2822%
Epoch [4/300], Step [111/225], Training Accuracy: 37.0636%, Training Loss: 1.2822%
Epoch [4/300], Step [112/225], Training Accuracy: 37.0675%, Training Loss: 1.2819%
Epoch [4/300], Step [113/225], Training Accuracy: 37.0299%, Training Loss: 1.2826%
Epoch [4/300], Step [114/225], Training Accuracy: 36.9929%, Training Loss: 1.2820%
Epoch [4/300], Step [115/225], Training Accuracy: 36.9701%, Training Loss: 1.2820%
Epoch [4/300], Step [116/225], Training Accuracy: 37.0286%, Training Loss: 1.2813%
Epoch [4/300], Step [117/225], Training Accuracy: 36.9525%, Training Loss: 1.2822%
Epoch [4/300], Step [118/225], Training Accuracy: 36.9836%, Training Loss: 1.2821%
Epoch [4/300], Step [119/225], Training Accuracy: 36.9879%, Training Loss: 1.2822%
Epoc

Epoch [4/300], Step [219/225], Training Accuracy: 37.7212%, Training Loss: 1.2688%
Epoch [4/300], Step [220/225], Training Accuracy: 37.7273%, Training Loss: 1.2684%
Epoch [4/300], Step [221/225], Training Accuracy: 37.7121%, Training Loss: 1.2684%
Epoch [4/300], Step [222/225], Training Accuracy: 37.7252%, Training Loss: 1.2684%
Epoch [4/300], Step [223/225], Training Accuracy: 37.6682%, Training Loss: 1.2684%
Epoch [4/300], Step [224/225], Training Accuracy: 37.6186%, Training Loss: 1.2684%
Epoch [4/300], Step [225/225], Training Accuracy: 37.6181%, Training Loss: 1.2687%
Epoch [5/300], Step [1/225], Training Accuracy: 50.0000%, Training Loss: 1.2485%
Epoch [5/300], Step [2/225], Training Accuracy: 46.0938%, Training Loss: 1.2749%
Epoch [5/300], Step [3/225], Training Accuracy: 40.6250%, Training Loss: 1.2901%
Epoch [5/300], Step [4/225], Training Accuracy: 39.4531%, Training Loss: 1.2633%
Epoch [5/300], Step [5/225], Training Accuracy: 39.6875%, Training Loss: 1.2637%
Epoch [5/300],

Epoch [5/300], Step [109/225], Training Accuracy: 39.2775%, Training Loss: 1.2405%
Epoch [5/300], Step [110/225], Training Accuracy: 39.2898%, Training Loss: 1.2408%
Epoch [5/300], Step [111/225], Training Accuracy: 39.2877%, Training Loss: 1.2407%
Epoch [5/300], Step [112/225], Training Accuracy: 39.3276%, Training Loss: 1.2405%
Epoch [5/300], Step [113/225], Training Accuracy: 39.3252%, Training Loss: 1.2414%
Epoch [5/300], Step [114/225], Training Accuracy: 39.3092%, Training Loss: 1.2408%
Epoch [5/300], Step [115/225], Training Accuracy: 39.2527%, Training Loss: 1.2408%
Epoch [5/300], Step [116/225], Training Accuracy: 39.3588%, Training Loss: 1.2400%
Epoch [5/300], Step [117/225], Training Accuracy: 39.2762%, Training Loss: 1.2410%
Epoch [5/300], Step [118/225], Training Accuracy: 39.3008%, Training Loss: 1.2411%
Epoch [5/300], Step [119/225], Training Accuracy: 39.3251%, Training Loss: 1.2409%
Epoch [5/300], Step [120/225], Training Accuracy: 39.2969%, Training Loss: 1.2410%
Epoc

Epoch [5/300], Step [220/225], Training Accuracy: 39.7230%, Training Loss: 1.2314%
Epoch [5/300], Step [221/225], Training Accuracy: 39.7059%, Training Loss: 1.2314%
Epoch [5/300], Step [222/225], Training Accuracy: 39.7523%, Training Loss: 1.2314%
Epoch [5/300], Step [223/225], Training Accuracy: 39.6861%, Training Loss: 1.2315%
Epoch [5/300], Step [224/225], Training Accuracy: 39.6345%, Training Loss: 1.2317%
Epoch [5/300], Step [225/225], Training Accuracy: 39.6331%, Training Loss: 1.2321%
Epoch [6/300], Step [1/225], Training Accuracy: 53.1250%, Training Loss: 1.2046%
Epoch [6/300], Step [2/225], Training Accuracy: 43.7500%, Training Loss: 1.2484%
Epoch [6/300], Step [3/225], Training Accuracy: 39.5833%, Training Loss: 1.2656%
Epoch [6/300], Step [4/225], Training Accuracy: 39.4531%, Training Loss: 1.2381%
Epoch [6/300], Step [5/225], Training Accuracy: 40.9375%, Training Loss: 1.2351%
Epoch [6/300], Step [6/225], Training Accuracy: 42.1875%, Training Loss: 1.2437%
Epoch [6/300], S

Epoch [6/300], Step [108/225], Training Accuracy: 40.4803%, Training Loss: 1.2125%
Epoch [6/300], Step [109/225], Training Accuracy: 40.4243%, Training Loss: 1.2126%
Epoch [6/300], Step [110/225], Training Accuracy: 40.4545%, Training Loss: 1.2130%
Epoch [6/300], Step [111/225], Training Accuracy: 40.4702%, Training Loss: 1.2128%
Epoch [6/300], Step [112/225], Training Accuracy: 40.5552%, Training Loss: 1.2124%
Epoch [6/300], Step [113/225], Training Accuracy: 40.5282%, Training Loss: 1.2133%
Epoch [6/300], Step [114/225], Training Accuracy: 40.5428%, Training Loss: 1.2126%
Epoch [6/300], Step [115/225], Training Accuracy: 40.5299%, Training Loss: 1.2125%
Epoch [6/300], Step [116/225], Training Accuracy: 40.6115%, Training Loss: 1.2116%
Epoch [6/300], Step [117/225], Training Accuracy: 40.5582%, Training Loss: 1.2128%
Epoch [6/300], Step [118/225], Training Accuracy: 40.5323%, Training Loss: 1.2129%
Epoch [6/300], Step [119/225], Training Accuracy: 40.5593%, Training Loss: 1.2125%
Epoc

Epoch [6/300], Step [212/225], Training Accuracy: 41.0083%, Training Loss: 1.2051%
Epoch [6/300], Step [213/225], Training Accuracy: 40.9844%, Training Loss: 1.2053%
Epoch [6/300], Step [214/225], Training Accuracy: 40.9828%, Training Loss: 1.2052%
Epoch [6/300], Step [215/225], Training Accuracy: 41.0320%, Training Loss: 1.2048%
Epoch [6/300], Step [216/225], Training Accuracy: 40.9939%, Training Loss: 1.2051%
Epoch [6/300], Step [217/225], Training Accuracy: 40.9850%, Training Loss: 1.2049%
Epoch [6/300], Step [218/225], Training Accuracy: 40.9619%, Training Loss: 1.2052%
Epoch [6/300], Step [219/225], Training Accuracy: 40.9461%, Training Loss: 1.2050%
Epoch [6/300], Step [220/225], Training Accuracy: 40.9517%, Training Loss: 1.2046%
Epoch [6/300], Step [221/225], Training Accuracy: 40.9290%, Training Loss: 1.2047%
Epoch [6/300], Step [222/225], Training Accuracy: 40.9628%, Training Loss: 1.2046%
Epoch [6/300], Step [223/225], Training Accuracy: 40.8842%, Training Loss: 1.2049%
Epoc

Epoch [7/300], Step [99/225], Training Accuracy: 42.3295%, Training Loss: 1.1881%
Epoch [7/300], Step [100/225], Training Accuracy: 42.2500%, Training Loss: 1.1880%
Epoch [7/300], Step [101/225], Training Accuracy: 42.1875%, Training Loss: 1.1877%
Epoch [7/300], Step [102/225], Training Accuracy: 42.2488%, Training Loss: 1.1872%
Epoch [7/300], Step [103/225], Training Accuracy: 42.1875%, Training Loss: 1.1880%
Epoch [7/300], Step [104/225], Training Accuracy: 42.2476%, Training Loss: 1.1873%
Epoch [7/300], Step [105/225], Training Accuracy: 42.1875%, Training Loss: 1.1874%
Epoch [7/300], Step [106/225], Training Accuracy: 42.1138%, Training Loss: 1.1874%
Epoch [7/300], Step [107/225], Training Accuracy: 42.1437%, Training Loss: 1.1872%
Epoch [7/300], Step [108/225], Training Accuracy: 42.0862%, Training Loss: 1.1877%
Epoch [7/300], Step [109/225], Training Accuracy: 42.0155%, Training Loss: 1.1878%
Epoch [7/300], Step [110/225], Training Accuracy: 42.0028%, Training Loss: 1.1883%
Epoch

Epoch [7/300], Step [217/225], Training Accuracy: 42.5187%, Training Loss: 1.1809%
Epoch [7/300], Step [218/225], Training Accuracy: 42.4742%, Training Loss: 1.1812%
Epoch [7/300], Step [219/225], Training Accuracy: 42.4586%, Training Loss: 1.1810%
Epoch [7/300], Step [220/225], Training Accuracy: 42.4716%, Training Loss: 1.1807%
Epoch [7/300], Step [221/225], Training Accuracy: 42.4491%, Training Loss: 1.1808%
Epoch [7/300], Step [222/225], Training Accuracy: 42.4901%, Training Loss: 1.1807%
Epoch [7/300], Step [223/225], Training Accuracy: 42.4187%, Training Loss: 1.1811%
Epoch [7/300], Step [224/225], Training Accuracy: 42.3619%, Training Loss: 1.1813%
Epoch [7/300], Step [225/225], Training Accuracy: 42.3360%, Training Loss: 1.1818%
Epoch [8/300], Step [1/225], Training Accuracy: 54.6875%, Training Loss: 1.1408%
Epoch [8/300], Step [2/225], Training Accuracy: 45.3125%, Training Loss: 1.2074%
Epoch [8/300], Step [3/225], Training Accuracy: 41.1458%, Training Loss: 1.2238%
Epoch [8/3

Epoch [8/300], Step [102/225], Training Accuracy: 42.9841%, Training Loss: 1.1661%
Epoch [8/300], Step [103/225], Training Accuracy: 42.9005%, Training Loss: 1.1669%
Epoch [8/300], Step [104/225], Training Accuracy: 42.9537%, Training Loss: 1.1661%
Epoch [8/300], Step [105/225], Training Accuracy: 42.9315%, Training Loss: 1.1660%
Epoch [8/300], Step [106/225], Training Accuracy: 42.8361%, Training Loss: 1.1661%
Epoch [8/300], Step [107/225], Training Accuracy: 42.8300%, Training Loss: 1.1659%
Epoch [8/300], Step [108/225], Training Accuracy: 42.7662%, Training Loss: 1.1664%
Epoch [8/300], Step [109/225], Training Accuracy: 42.7036%, Training Loss: 1.1666%
Epoch [8/300], Step [110/225], Training Accuracy: 42.6847%, Training Loss: 1.1670%
Epoch [8/300], Step [111/225], Training Accuracy: 42.7646%, Training Loss: 1.1669%
Epoch [8/300], Step [112/225], Training Accuracy: 42.8432%, Training Loss: 1.1664%
Epoch [8/300], Step [113/225], Training Accuracy: 42.8097%, Training Loss: 1.1675%
Epoc

Epoch [8/300], Step [211/225], Training Accuracy: 43.3575%, Training Loss: 1.1591%
Epoch [8/300], Step [212/225], Training Accuracy: 43.3373%, Training Loss: 1.1593%
Epoch [8/300], Step [213/225], Training Accuracy: 43.3319%, Training Loss: 1.1596%
Epoch [8/300], Step [214/225], Training Accuracy: 43.3557%, Training Loss: 1.1595%
Epoch [8/300], Step [215/225], Training Accuracy: 43.3866%, Training Loss: 1.1590%
Epoch [8/300], Step [216/225], Training Accuracy: 43.3594%, Training Loss: 1.1594%
Epoch [8/300], Step [217/225], Training Accuracy: 43.3540%, Training Loss: 1.1594%
Epoch [8/300], Step [218/225], Training Accuracy: 43.3128%, Training Loss: 1.1598%
Epoch [8/300], Step [219/225], Training Accuracy: 43.2791%, Training Loss: 1.1596%
Epoch [8/300], Step [220/225], Training Accuracy: 43.2955%, Training Loss: 1.1593%
Epoch [8/300], Step [221/225], Training Accuracy: 43.2834%, Training Loss: 1.1594%
Epoch [8/300], Step [222/225], Training Accuracy: 43.3066%, Training Loss: 1.1593%
Epoc

Epoch [9/300], Step [98/225], Training Accuracy: 43.7500%, Training Loss: 1.1463%
Epoch [9/300], Step [99/225], Training Accuracy: 43.7973%, Training Loss: 1.1466%
Epoch [9/300], Step [100/225], Training Accuracy: 43.7031%, Training Loss: 1.1465%
Epoch [9/300], Step [101/225], Training Accuracy: 43.6726%, Training Loss: 1.1465%
Epoch [9/300], Step [102/225], Training Accuracy: 43.7040%, Training Loss: 1.1462%
Epoch [9/300], Step [103/225], Training Accuracy: 43.6590%, Training Loss: 1.1471%
Epoch [9/300], Step [104/225], Training Accuracy: 43.7049%, Training Loss: 1.1462%
Epoch [9/300], Step [105/225], Training Accuracy: 43.6905%, Training Loss: 1.1460%
Epoch [9/300], Step [106/225], Training Accuracy: 43.6026%, Training Loss: 1.1462%
Epoch [9/300], Step [107/225], Training Accuracy: 43.6186%, Training Loss: 1.1460%
Epoch [9/300], Step [108/225], Training Accuracy: 43.5619%, Training Loss: 1.1465%
Epoch [9/300], Step [109/225], Training Accuracy: 43.4920%, Training Loss: 1.1467%
Epoch 

Epoch [9/300], Step [209/225], Training Accuracy: 44.2434%, Training Loss: 1.1391%
Epoch [9/300], Step [210/225], Training Accuracy: 44.2411%, Training Loss: 1.1388%
Epoch [9/300], Step [211/225], Training Accuracy: 44.2758%, Training Loss: 1.1386%
Epoch [9/300], Step [212/225], Training Accuracy: 44.2438%, Training Loss: 1.1390%
Epoch [9/300], Step [213/225], Training Accuracy: 44.2268%, Training Loss: 1.1394%
Epoch [9/300], Step [214/225], Training Accuracy: 44.2465%, Training Loss: 1.1392%
Epoch [9/300], Step [215/225], Training Accuracy: 44.2878%, Training Loss: 1.1388%
Epoch [9/300], Step [216/225], Training Accuracy: 44.2708%, Training Loss: 1.1391%
Epoch [9/300], Step [217/225], Training Accuracy: 44.2468%, Training Loss: 1.1391%
Epoch [9/300], Step [218/225], Training Accuracy: 44.2087%, Training Loss: 1.1396%
Epoch [9/300], Step [219/225], Training Accuracy: 44.1781%, Training Loss: 1.1395%
Epoch [9/300], Step [220/225], Training Accuracy: 44.2116%, Training Loss: 1.1392%
Epoc

Epoch [10/300], Step [96/225], Training Accuracy: 44.4499%, Training Loss: 1.1282%
Epoch [10/300], Step [97/225], Training Accuracy: 44.4749%, Training Loss: 1.1280%
Epoch [10/300], Step [98/225], Training Accuracy: 44.4515%, Training Loss: 1.1271%
Epoch [10/300], Step [99/225], Training Accuracy: 44.5076%, Training Loss: 1.1274%
Epoch [10/300], Step [100/225], Training Accuracy: 44.3906%, Training Loss: 1.1273%
Epoch [10/300], Step [101/225], Training Accuracy: 44.3379%, Training Loss: 1.1274%
Epoch [10/300], Step [102/225], Training Accuracy: 44.3321%, Training Loss: 1.1273%
Epoch [10/300], Step [103/225], Training Accuracy: 44.3113%, Training Loss: 1.1281%
Epoch [10/300], Step [104/225], Training Accuracy: 44.3359%, Training Loss: 1.1273%
Epoch [10/300], Step [105/225], Training Accuracy: 44.3452%, Training Loss: 1.1270%
Epoch [10/300], Step [106/225], Training Accuracy: 44.2512%, Training Loss: 1.1273%
Epoch [10/300], Step [107/225], Training Accuracy: 44.2465%, Training Loss: 1.12

Epoch [10/300], Step [209/225], Training Accuracy: 44.9387%, Training Loss: 1.1201%
Epoch [10/300], Step [210/225], Training Accuracy: 44.9330%, Training Loss: 1.1197%
Epoch [10/300], Step [211/225], Training Accuracy: 44.9719%, Training Loss: 1.1196%
Epoch [10/300], Step [212/225], Training Accuracy: 44.9219%, Training Loss: 1.1200%
Epoch [10/300], Step [213/225], Training Accuracy: 44.8944%, Training Loss: 1.1205%
Epoch [10/300], Step [214/225], Training Accuracy: 44.9182%, Training Loss: 1.1203%
Epoch [10/300], Step [215/225], Training Accuracy: 44.9491%, Training Loss: 1.1200%
Epoch [10/300], Step [216/225], Training Accuracy: 44.9363%, Training Loss: 1.1202%
Epoch [10/300], Step [217/225], Training Accuracy: 44.9093%, Training Loss: 1.1202%
Epoch [10/300], Step [218/225], Training Accuracy: 44.8753%, Training Loss: 1.1208%
Epoch [10/300], Step [219/225], Training Accuracy: 44.8416%, Training Loss: 1.1207%
Epoch [10/300], Step [220/225], Training Accuracy: 44.8935%, Training Loss: 

Epoch [11/300], Step [95/225], Training Accuracy: 45.4605%, Training Loss: 1.1105%
Epoch [11/300], Step [96/225], Training Accuracy: 45.4915%, Training Loss: 1.1101%
Epoch [11/300], Step [97/225], Training Accuracy: 45.5058%, Training Loss: 1.1098%
Epoch [11/300], Step [98/225], Training Accuracy: 45.5038%, Training Loss: 1.1089%
Epoch [11/300], Step [99/225], Training Accuracy: 45.5335%, Training Loss: 1.1092%
Epoch [11/300], Step [100/225], Training Accuracy: 45.4062%, Training Loss: 1.1092%
Epoch [11/300], Step [101/225], Training Accuracy: 45.3280%, Training Loss: 1.1093%
Epoch [11/300], Step [102/225], Training Accuracy: 45.3125%, Training Loss: 1.1094%
Epoch [11/300], Step [103/225], Training Accuracy: 45.2973%, Training Loss: 1.1103%
Epoch [11/300], Step [104/225], Training Accuracy: 45.2825%, Training Loss: 1.1095%
Epoch [11/300], Step [105/225], Training Accuracy: 45.2976%, Training Loss: 1.1090%
Epoch [11/300], Step [106/225], Training Accuracy: 45.1946%, Training Loss: 1.109

Epoch [11/300], Step [208/225], Training Accuracy: 45.7782%, Training Loss: 1.1025%
Epoch [11/300], Step [209/225], Training Accuracy: 45.7461%, Training Loss: 1.1025%
Epoch [11/300], Step [210/225], Training Accuracy: 45.7217%, Training Loss: 1.1022%
Epoch [11/300], Step [211/225], Training Accuracy: 45.7346%, Training Loss: 1.1020%
Epoch [11/300], Step [212/225], Training Accuracy: 45.6810%, Training Loss: 1.1025%
Epoch [11/300], Step [213/225], Training Accuracy: 45.6279%, Training Loss: 1.1031%
Epoch [11/300], Step [214/225], Training Accuracy: 45.6484%, Training Loss: 1.1028%
Epoch [11/300], Step [215/225], Training Accuracy: 45.6759%, Training Loss: 1.1026%
Epoch [11/300], Step [216/225], Training Accuracy: 45.6742%, Training Loss: 1.1028%
Epoch [11/300], Step [217/225], Training Accuracy: 45.6581%, Training Loss: 1.1028%
Epoch [11/300], Step [218/225], Training Accuracy: 45.6064%, Training Loss: 1.1034%
Epoch [11/300], Step [219/225], Training Accuracy: 45.5693%, Training Loss: 

Epoch [12/300], Step [92/225], Training Accuracy: 46.2126%, Training Loss: 1.0939%
Epoch [12/300], Step [93/225], Training Accuracy: 46.2030%, Training Loss: 1.0940%
Epoch [12/300], Step [94/225], Training Accuracy: 46.3098%, Training Loss: 1.0929%
Epoch [12/300], Step [95/225], Training Accuracy: 46.1842%, Training Loss: 1.0941%
Epoch [12/300], Step [96/225], Training Accuracy: 46.2565%, Training Loss: 1.0937%
Epoch [12/300], Step [97/225], Training Accuracy: 46.2790%, Training Loss: 1.0933%
Epoch [12/300], Step [98/225], Training Accuracy: 46.2691%, Training Loss: 1.0926%
Epoch [12/300], Step [99/225], Training Accuracy: 46.2753%, Training Loss: 1.0929%
Epoch [12/300], Step [100/225], Training Accuracy: 46.1406%, Training Loss: 1.0930%
Epoch [12/300], Step [101/225], Training Accuracy: 46.0860%, Training Loss: 1.0933%
Epoch [12/300], Step [102/225], Training Accuracy: 46.0784%, Training Loss: 1.0935%
Epoch [12/300], Step [103/225], Training Accuracy: 46.0407%, Training Loss: 1.0943%


Epoch [12/300], Step [207/225], Training Accuracy: 46.3466%, Training Loss: 1.0875%
Epoch [12/300], Step [208/225], Training Accuracy: 46.3942%, Training Loss: 1.0870%
Epoch [12/300], Step [209/225], Training Accuracy: 46.3367%, Training Loss: 1.0870%
Epoch [12/300], Step [210/225], Training Accuracy: 46.3244%, Training Loss: 1.0867%
Epoch [12/300], Step [211/225], Training Accuracy: 46.3270%, Training Loss: 1.0866%
Epoch [12/300], Step [212/225], Training Accuracy: 46.2854%, Training Loss: 1.0871%
Epoch [12/300], Step [213/225], Training Accuracy: 46.2295%, Training Loss: 1.0877%
Epoch [12/300], Step [214/225], Training Accuracy: 46.2471%, Training Loss: 1.0874%
Epoch [12/300], Step [215/225], Training Accuracy: 46.2791%, Training Loss: 1.0873%
Epoch [12/300], Step [216/225], Training Accuracy: 46.2674%, Training Loss: 1.0874%
Epoch [12/300], Step [217/225], Training Accuracy: 46.2486%, Training Loss: 1.0874%
Epoch [12/300], Step [218/225], Training Accuracy: 46.2013%, Training Loss: 

Epoch [13/300], Step [91/225], Training Accuracy: 47.0295%, Training Loss: 1.0786%
Epoch [13/300], Step [92/225], Training Accuracy: 46.9939%, Training Loss: 1.0787%
Epoch [13/300], Step [93/225], Training Accuracy: 46.9422%, Training Loss: 1.0788%
Epoch [13/300], Step [94/225], Training Accuracy: 47.0745%, Training Loss: 1.0776%
Epoch [13/300], Step [95/225], Training Accuracy: 46.9243%, Training Loss: 1.0788%
Epoch [13/300], Step [96/225], Training Accuracy: 46.9889%, Training Loss: 1.0784%
Epoch [13/300], Step [97/225], Training Accuracy: 47.0039%, Training Loss: 1.0779%
Epoch [13/300], Step [98/225], Training Accuracy: 46.9707%, Training Loss: 1.0772%
Epoch [13/300], Step [99/225], Training Accuracy: 46.9855%, Training Loss: 1.0774%
Epoch [13/300], Step [100/225], Training Accuracy: 46.8750%, Training Loss: 1.0775%
Epoch [13/300], Step [101/225], Training Accuracy: 46.8441%, Training Loss: 1.0778%
Epoch [13/300], Step [102/225], Training Accuracy: 46.8444%, Training Loss: 1.0781%
E

Epoch [13/300], Step [201/225], Training Accuracy: 46.9139%, Training Loss: 1.0723%
Epoch [13/300], Step [202/225], Training Accuracy: 46.9446%, Training Loss: 1.0720%
Epoch [13/300], Step [203/225], Training Accuracy: 46.9443%, Training Loss: 1.0723%
Epoch [13/300], Step [204/225], Training Accuracy: 46.9899%, Training Loss: 1.0721%
Epoch [13/300], Step [205/225], Training Accuracy: 47.0046%, Training Loss: 1.0723%
Epoch [13/300], Step [206/225], Training Accuracy: 47.0419%, Training Loss: 1.0726%
Epoch [13/300], Step [207/225], Training Accuracy: 47.0033%, Training Loss: 1.0730%
Epoch [13/300], Step [208/225], Training Accuracy: 47.0628%, Training Loss: 1.0725%
Epoch [13/300], Step [209/225], Training Accuracy: 47.0320%, Training Loss: 1.0726%
Epoch [13/300], Step [210/225], Training Accuracy: 47.0089%, Training Loss: 1.0723%
Epoch [13/300], Step [211/225], Training Accuracy: 47.0157%, Training Loss: 1.0722%
Epoch [13/300], Step [212/225], Training Accuracy: 46.9708%, Training Loss: 

Epoch [14/300], Step [84/225], Training Accuracy: 47.3586%, Training Loss: 1.0664%
Epoch [14/300], Step [85/225], Training Accuracy: 47.3897%, Training Loss: 1.0659%
Epoch [14/300], Step [86/225], Training Accuracy: 47.4201%, Training Loss: 1.0663%
Epoch [14/300], Step [87/225], Training Accuracy: 47.4856%, Training Loss: 1.0659%
Epoch [14/300], Step [88/225], Training Accuracy: 47.3899%, Training Loss: 1.0658%
Epoch [14/300], Step [89/225], Training Accuracy: 47.4192%, Training Loss: 1.0668%
Epoch [14/300], Step [90/225], Training Accuracy: 47.3438%, Training Loss: 1.0669%
Epoch [14/300], Step [91/225], Training Accuracy: 47.4416%, Training Loss: 1.0652%
Epoch [14/300], Step [92/225], Training Accuracy: 47.4015%, Training Loss: 1.0652%
Epoch [14/300], Step [93/225], Training Accuracy: 47.3790%, Training Loss: 1.0654%
Epoch [14/300], Step [94/225], Training Accuracy: 47.4900%, Training Loss: 1.0641%
Epoch [14/300], Step [95/225], Training Accuracy: 47.3520%, Training Loss: 1.0653%
Epoc

Epoch [14/300], Step [200/225], Training Accuracy: 47.4062%, Training Loss: 1.0590%
Epoch [14/300], Step [201/225], Training Accuracy: 47.4114%, Training Loss: 1.0593%
Epoch [14/300], Step [202/225], Training Accuracy: 47.4551%, Training Loss: 1.0590%
Epoch [14/300], Step [203/225], Training Accuracy: 47.4446%, Training Loss: 1.0593%
Epoch [14/300], Step [204/225], Training Accuracy: 47.4954%, Training Loss: 1.0592%
Epoch [14/300], Step [205/225], Training Accuracy: 47.5000%, Training Loss: 1.0592%
Epoch [14/300], Step [206/225], Training Accuracy: 47.5501%, Training Loss: 1.0597%
Epoch [14/300], Step [207/225], Training Accuracy: 47.5242%, Training Loss: 1.0601%
Epoch [14/300], Step [208/225], Training Accuracy: 47.5886%, Training Loss: 1.0596%
Epoch [14/300], Step [209/225], Training Accuracy: 47.5628%, Training Loss: 1.0596%
Epoch [14/300], Step [210/225], Training Accuracy: 47.5521%, Training Loss: 1.0594%
Epoch [14/300], Step [211/225], Training Accuracy: 47.5711%, Training Loss: 

Epoch [15/300], Step [87/225], Training Accuracy: 48.1322%, Training Loss: 1.0529%
Epoch [15/300], Step [88/225], Training Accuracy: 48.0114%, Training Loss: 1.0530%
Epoch [15/300], Step [89/225], Training Accuracy: 48.0337%, Training Loss: 1.0541%
Epoch [15/300], Step [90/225], Training Accuracy: 47.9340%, Training Loss: 1.0543%
Epoch [15/300], Step [91/225], Training Accuracy: 48.0254%, Training Loss: 1.0525%
Epoch [15/300], Step [92/225], Training Accuracy: 48.0129%, Training Loss: 1.0525%
Epoch [15/300], Step [93/225], Training Accuracy: 48.0007%, Training Loss: 1.0527%
Epoch [15/300], Step [94/225], Training Accuracy: 48.0884%, Training Loss: 1.0514%
Epoch [15/300], Step [95/225], Training Accuracy: 47.9770%, Training Loss: 1.0525%
Epoch [15/300], Step [96/225], Training Accuracy: 48.0143%, Training Loss: 1.0521%
Epoch [15/300], Step [97/225], Training Accuracy: 48.0509%, Training Loss: 1.0514%
Epoch [15/300], Step [98/225], Training Accuracy: 48.0389%, Training Loss: 1.0507%
Epoc

Epoch [15/300], Step [196/225], Training Accuracy: 48.0628%, Training Loss: 1.0480%
Epoch [15/300], Step [197/225], Training Accuracy: 48.0489%, Training Loss: 1.0475%
Epoch [15/300], Step [198/225], Training Accuracy: 48.0508%, Training Loss: 1.0469%
Epoch [15/300], Step [199/225], Training Accuracy: 48.0528%, Training Loss: 1.0466%
Epoch [15/300], Step [200/225], Training Accuracy: 48.0703%, Training Loss: 1.0468%
Epoch [15/300], Step [201/225], Training Accuracy: 48.0721%, Training Loss: 1.0472%
Epoch [15/300], Step [202/225], Training Accuracy: 48.1126%, Training Loss: 1.0468%
Epoch [15/300], Step [203/225], Training Accuracy: 48.0911%, Training Loss: 1.0471%
Epoch [15/300], Step [204/225], Training Accuracy: 48.1235%, Training Loss: 1.0470%
Epoch [15/300], Step [205/225], Training Accuracy: 48.1174%, Training Loss: 1.0471%
Epoch [15/300], Step [206/225], Training Accuracy: 48.1644%, Training Loss: 1.0475%
Epoch [15/300], Step [207/225], Training Accuracy: 48.1431%, Training Loss: 

Epoch [16/300], Step [78/225], Training Accuracy: 48.7981%, Training Loss: 1.0402%
Epoch [16/300], Step [79/225], Training Accuracy: 48.8133%, Training Loss: 1.0411%
Epoch [16/300], Step [80/225], Training Accuracy: 48.7695%, Training Loss: 1.0412%
Epoch [16/300], Step [81/225], Training Accuracy: 48.8040%, Training Loss: 1.0420%
Epoch [16/300], Step [82/225], Training Accuracy: 48.8758%, Training Loss: 1.0411%
Epoch [16/300], Step [83/225], Training Accuracy: 48.8517%, Training Loss: 1.0411%
Epoch [16/300], Step [84/225], Training Accuracy: 48.8281%, Training Loss: 1.0418%
Epoch [16/300], Step [85/225], Training Accuracy: 48.8603%, Training Loss: 1.0413%
Epoch [16/300], Step [86/225], Training Accuracy: 48.9099%, Training Loss: 1.0416%
Epoch [16/300], Step [87/225], Training Accuracy: 48.9224%, Training Loss: 1.0413%
Epoch [16/300], Step [88/225], Training Accuracy: 48.7926%, Training Loss: 1.0415%
Epoch [16/300], Step [89/225], Training Accuracy: 48.8062%, Training Loss: 1.0427%
Epoc

Epoch [16/300], Step [193/225], Training Accuracy: 48.5832%, Training Loss: 1.0371%
Epoch [16/300], Step [194/225], Training Accuracy: 48.6227%, Training Loss: 1.0373%
Epoch [16/300], Step [195/225], Training Accuracy: 48.6298%, Training Loss: 1.0368%
Epoch [16/300], Step [196/225], Training Accuracy: 48.6767%, Training Loss: 1.0369%
Epoch [16/300], Step [197/225], Training Accuracy: 48.6675%, Training Loss: 1.0364%
Epoch [16/300], Step [198/225], Training Accuracy: 48.6664%, Training Loss: 1.0358%
Epoch [16/300], Step [199/225], Training Accuracy: 48.6652%, Training Loss: 1.0355%
Epoch [16/300], Step [200/225], Training Accuracy: 48.6875%, Training Loss: 1.0357%
Epoch [16/300], Step [201/225], Training Accuracy: 48.7018%, Training Loss: 1.0360%
Epoch [16/300], Step [202/225], Training Accuracy: 48.7237%, Training Loss: 1.0356%
Epoch [16/300], Step [203/225], Training Accuracy: 48.6992%, Training Loss: 1.0360%
Epoch [16/300], Step [204/225], Training Accuracy: 48.7286%, Training Loss: 

Epoch [17/300], Step [77/225], Training Accuracy: 48.9651%, Training Loss: 1.0280%
Epoch [17/300], Step [78/225], Training Accuracy: 48.9183%, Training Loss: 1.0293%
Epoch [17/300], Step [79/225], Training Accuracy: 48.9320%, Training Loss: 1.0303%
Epoch [17/300], Step [80/225], Training Accuracy: 48.8672%, Training Loss: 1.0304%
Epoch [17/300], Step [81/225], Training Accuracy: 48.8812%, Training Loss: 1.0312%
Epoch [17/300], Step [82/225], Training Accuracy: 48.9329%, Training Loss: 1.0303%
Epoch [17/300], Step [83/225], Training Accuracy: 48.9081%, Training Loss: 1.0303%
Epoch [17/300], Step [84/225], Training Accuracy: 48.9025%, Training Loss: 1.0310%
Epoch [17/300], Step [85/225], Training Accuracy: 48.9338%, Training Loss: 1.0304%
Epoch [17/300], Step [86/225], Training Accuracy: 48.9826%, Training Loss: 1.0307%
Epoch [17/300], Step [87/225], Training Accuracy: 49.0122%, Training Loss: 1.0305%
Epoch [17/300], Step [88/225], Training Accuracy: 48.8991%, Training Loss: 1.0307%
Epoc

Epoch [17/300], Step [188/225], Training Accuracy: 48.7284%, Training Loss: 1.0270%
Epoch [17/300], Step [189/225], Training Accuracy: 48.7930%, Training Loss: 1.0265%
Epoch [17/300], Step [190/225], Training Accuracy: 48.7993%, Training Loss: 1.0269%
Epoch [17/300], Step [191/225], Training Accuracy: 48.7974%, Training Loss: 1.0270%
Epoch [17/300], Step [192/225], Training Accuracy: 48.8363%, Training Loss: 1.0267%
Epoch [17/300], Step [193/225], Training Accuracy: 48.8099%, Training Loss: 1.0267%
Epoch [17/300], Step [194/225], Training Accuracy: 48.8563%, Training Loss: 1.0268%
Epoch [17/300], Step [195/225], Training Accuracy: 48.8622%, Training Loss: 1.0263%
Epoch [17/300], Step [196/225], Training Accuracy: 48.9078%, Training Loss: 1.0264%
Epoch [17/300], Step [197/225], Training Accuracy: 48.9134%, Training Loss: 1.0259%
Epoch [17/300], Step [198/225], Training Accuracy: 48.9189%, Training Loss: 1.0253%
Epoch [17/300], Step [199/225], Training Accuracy: 48.9165%, Training Loss: 

Epoch [18/300], Step [72/225], Training Accuracy: 49.0885%, Training Loss: 1.0182%
Epoch [18/300], Step [73/225], Training Accuracy: 49.0368%, Training Loss: 1.0211%
Epoch [18/300], Step [74/225], Training Accuracy: 49.1343%, Training Loss: 1.0191%
Epoch [18/300], Step [75/225], Training Accuracy: 49.1458%, Training Loss: 1.0184%
Epoch [18/300], Step [76/225], Training Accuracy: 49.2188%, Training Loss: 1.0185%
Epoch [18/300], Step [77/225], Training Accuracy: 49.3304%, Training Loss: 1.0180%
Epoch [18/300], Step [78/225], Training Accuracy: 49.3189%, Training Loss: 1.0193%
Epoch [18/300], Step [79/225], Training Accuracy: 49.3473%, Training Loss: 1.0204%
Epoch [18/300], Step [80/225], Training Accuracy: 49.2773%, Training Loss: 1.0206%
Epoch [18/300], Step [81/225], Training Accuracy: 49.2670%, Training Loss: 1.0213%
Epoch [18/300], Step [82/225], Training Accuracy: 49.3521%, Training Loss: 1.0204%
Epoch [18/300], Step [83/225], Training Accuracy: 49.3411%, Training Loss: 1.0204%
Epoc

Epoch [18/300], Step [185/225], Training Accuracy: 49.1470%, Training Loss: 1.0187%
Epoch [18/300], Step [186/225], Training Accuracy: 49.1851%, Training Loss: 1.0184%
Epoch [18/300], Step [187/225], Training Accuracy: 49.2229%, Training Loss: 1.0178%
Epoch [18/300], Step [188/225], Training Accuracy: 49.2852%, Training Loss: 1.0173%
Epoch [18/300], Step [189/225], Training Accuracy: 49.3386%, Training Loss: 1.0168%
Epoch [18/300], Step [190/225], Training Accuracy: 49.3339%, Training Loss: 1.0172%
Epoch [18/300], Step [191/225], Training Accuracy: 49.3210%, Training Loss: 1.0172%
Epoch [18/300], Step [192/225], Training Accuracy: 49.3571%, Training Loss: 1.0170%
Epoch [18/300], Step [193/225], Training Accuracy: 49.3280%, Training Loss: 1.0169%
Epoch [18/300], Step [194/225], Training Accuracy: 49.3718%, Training Loss: 1.0171%
Epoch [18/300], Step [195/225], Training Accuracy: 49.3910%, Training Loss: 1.0166%
Epoch [18/300], Step [196/225], Training Accuracy: 49.4340%, Training Loss: 

Epoch [19/300], Step [72/225], Training Accuracy: 49.5226%, Training Loss: 1.0090%
Epoch [19/300], Step [73/225], Training Accuracy: 49.4649%, Training Loss: 1.0118%
Epoch [19/300], Step [74/225], Training Accuracy: 49.5566%, Training Loss: 1.0098%
Epoch [19/300], Step [75/225], Training Accuracy: 49.5208%, Training Loss: 1.0092%
Epoch [19/300], Step [76/225], Training Accuracy: 49.5683%, Training Loss: 1.0092%
Epoch [19/300], Step [77/225], Training Accuracy: 49.6753%, Training Loss: 1.0088%
Epoch [19/300], Step [78/225], Training Accuracy: 49.6795%, Training Loss: 1.0101%
Epoch [19/300], Step [79/225], Training Accuracy: 49.7033%, Training Loss: 1.0112%
Epoch [19/300], Step [80/225], Training Accuracy: 49.6289%, Training Loss: 1.0114%
Epoch [19/300], Step [81/225], Training Accuracy: 49.6721%, Training Loss: 1.0121%
Epoch [19/300], Step [82/225], Training Accuracy: 49.7523%, Training Loss: 1.0112%
Epoch [19/300], Step [83/225], Training Accuracy: 49.7364%, Training Loss: 1.0111%
Epoc

Epoch [19/300], Step [184/225], Training Accuracy: 49.6094%, Training Loss: 1.0095%
Epoch [19/300], Step [185/225], Training Accuracy: 49.6030%, Training Loss: 1.0095%
Epoch [19/300], Step [186/225], Training Accuracy: 49.6388%, Training Loss: 1.0093%
Epoch [19/300], Step [187/225], Training Accuracy: 49.6658%, Training Loss: 1.0086%
Epoch [19/300], Step [188/225], Training Accuracy: 49.7257%, Training Loss: 1.0081%
Epoch [19/300], Step [189/225], Training Accuracy: 49.7685%, Training Loss: 1.0076%
Epoch [19/300], Step [190/225], Training Accuracy: 49.7615%, Training Loss: 1.0080%
Epoch [19/300], Step [191/225], Training Accuracy: 49.7300%, Training Loss: 1.0081%
Epoch [19/300], Step [192/225], Training Accuracy: 49.7721%, Training Loss: 1.0078%
Epoch [19/300], Step [193/225], Training Accuracy: 49.7490%, Training Loss: 1.0078%
Epoch [19/300], Step [194/225], Training Accuracy: 49.7906%, Training Loss: 1.0079%
Epoch [19/300], Step [195/225], Training Accuracy: 49.8157%, Training Loss: 

Epoch [20/300], Step [65/225], Training Accuracy: 49.8798%, Training Loss: 1.0000%
Epoch [20/300], Step [66/225], Training Accuracy: 50.0710%, Training Loss: 0.9983%
Epoch [20/300], Step [67/225], Training Accuracy: 49.9767%, Training Loss: 0.9985%
Epoch [20/300], Step [68/225], Training Accuracy: 49.8851%, Training Loss: 0.9983%
Epoch [20/300], Step [69/225], Training Accuracy: 49.8188%, Training Loss: 0.9985%
Epoch [20/300], Step [70/225], Training Accuracy: 49.7321%, Training Loss: 0.9999%
Epoch [20/300], Step [71/225], Training Accuracy: 49.8019%, Training Loss: 0.9988%
Epoch [20/300], Step [72/225], Training Accuracy: 49.6962%, Training Loss: 1.0008%
Epoch [20/300], Step [73/225], Training Accuracy: 49.6361%, Training Loss: 1.0034%
Epoch [20/300], Step [74/225], Training Accuracy: 49.6622%, Training Loss: 1.0015%
Epoch [20/300], Step [75/225], Training Accuracy: 49.6250%, Training Loss: 1.0009%
Epoch [20/300], Step [76/225], Training Accuracy: 49.6916%, Training Loss: 1.0008%
Epoc

Epoch [20/300], Step [166/225], Training Accuracy: 49.7929%, Training Loss: 1.0015%
Epoch [20/300], Step [167/225], Training Accuracy: 49.8129%, Training Loss: 1.0008%
Epoch [20/300], Step [168/225], Training Accuracy: 49.8047%, Training Loss: 1.0010%
Epoch [20/300], Step [169/225], Training Accuracy: 49.8151%, Training Loss: 1.0010%
Epoch [20/300], Step [170/225], Training Accuracy: 49.7978%, Training Loss: 1.0016%
Epoch [20/300], Step [171/225], Training Accuracy: 49.7990%, Training Loss: 1.0014%
Epoch [20/300], Step [172/225], Training Accuracy: 49.7366%, Training Loss: 1.0021%
Epoch [20/300], Step [173/225], Training Accuracy: 49.7471%, Training Loss: 1.0017%
Epoch [20/300], Step [174/225], Training Accuracy: 49.7665%, Training Loss: 1.0017%
Epoch [20/300], Step [175/225], Training Accuracy: 49.7500%, Training Loss: 1.0017%
Epoch [20/300], Step [176/225], Training Accuracy: 49.7603%, Training Loss: 1.0016%
Epoch [20/300], Step [177/225], Training Accuracy: 49.7440%, Training Loss: 

Epoch [21/300], Step [48/225], Training Accuracy: 50.1953%, Training Loss: 0.9926%
Epoch [21/300], Step [49/225], Training Accuracy: 50.0000%, Training Loss: 0.9941%
Epoch [21/300], Step [50/225], Training Accuracy: 50.1562%, Training Loss: 0.9926%
Epoch [21/300], Step [51/225], Training Accuracy: 50.2145%, Training Loss: 0.9905%
Epoch [21/300], Step [52/225], Training Accuracy: 50.3606%, Training Loss: 0.9886%
Epoch [21/300], Step [53/225], Training Accuracy: 50.1769%, Training Loss: 0.9886%
Epoch [21/300], Step [54/225], Training Accuracy: 49.9711%, Training Loss: 0.9903%
Epoch [21/300], Step [55/225], Training Accuracy: 49.8295%, Training Loss: 0.9920%
Epoch [21/300], Step [56/225], Training Accuracy: 49.8047%, Training Loss: 0.9932%
Epoch [21/300], Step [57/225], Training Accuracy: 50.0548%, Training Loss: 0.9901%
Epoch [21/300], Step [58/225], Training Accuracy: 50.0000%, Training Loss: 0.9906%
Epoch [21/300], Step [59/225], Training Accuracy: 50.1059%, Training Loss: 0.9900%
Epoc

Epoch [21/300], Step [164/225], Training Accuracy: 50.1620%, Training Loss: 0.9931%
Epoch [21/300], Step [165/225], Training Accuracy: 50.1799%, Training Loss: 0.9930%
Epoch [21/300], Step [166/225], Training Accuracy: 50.1788%, Training Loss: 0.9931%
Epoch [21/300], Step [167/225], Training Accuracy: 50.1965%, Training Loss: 0.9924%
Epoch [21/300], Step [168/225], Training Accuracy: 50.1860%, Training Loss: 0.9927%
Epoch [21/300], Step [169/225], Training Accuracy: 50.1849%, Training Loss: 0.9926%
Epoch [21/300], Step [170/225], Training Accuracy: 50.1746%, Training Loss: 0.9932%
Epoch [21/300], Step [171/225], Training Accuracy: 50.1645%, Training Loss: 0.9931%
Epoch [21/300], Step [172/225], Training Accuracy: 50.0999%, Training Loss: 0.9937%
Epoch [21/300], Step [173/225], Training Accuracy: 50.0993%, Training Loss: 0.9934%
Epoch [21/300], Step [174/225], Training Accuracy: 50.1167%, Training Loss: 0.9933%
Epoch [21/300], Step [175/225], Training Accuracy: 50.0982%, Training Loss: 

Epoch [22/300], Step [52/225], Training Accuracy: 50.8413%, Training Loss: 0.9814%
Epoch [22/300], Step [53/225], Training Accuracy: 50.6781%, Training Loss: 0.9814%
Epoch [22/300], Step [54/225], Training Accuracy: 50.4340%, Training Loss: 0.9832%
Epoch [22/300], Step [55/225], Training Accuracy: 50.2841%, Training Loss: 0.9850%
Epoch [22/300], Step [56/225], Training Accuracy: 50.2511%, Training Loss: 0.9861%
Epoch [22/300], Step [57/225], Training Accuracy: 50.4934%, Training Loss: 0.9830%
Epoch [22/300], Step [58/225], Training Accuracy: 50.4310%, Training Loss: 0.9834%
Epoch [22/300], Step [59/225], Training Accuracy: 50.5561%, Training Loss: 0.9828%
Epoch [22/300], Step [60/225], Training Accuracy: 50.5208%, Training Loss: 0.9830%
Epoch [22/300], Step [61/225], Training Accuracy: 50.6404%, Training Loss: 0.9826%
Epoch [22/300], Step [62/225], Training Accuracy: 50.5796%, Training Loss: 0.9831%
Epoch [22/300], Step [63/225], Training Accuracy: 50.4464%, Training Loss: 0.9843%
Epoc

Epoch [22/300], Step [166/225], Training Accuracy: 50.6683%, Training Loss: 0.9851%
Epoch [22/300], Step [167/225], Training Accuracy: 50.6830%, Training Loss: 0.9844%
Epoch [22/300], Step [168/225], Training Accuracy: 50.6603%, Training Loss: 0.9847%
Epoch [22/300], Step [169/225], Training Accuracy: 50.6564%, Training Loss: 0.9847%
Epoch [22/300], Step [170/225], Training Accuracy: 50.6342%, Training Loss: 0.9852%
Epoch [22/300], Step [171/225], Training Accuracy: 50.6213%, Training Loss: 0.9851%
Epoch [22/300], Step [172/225], Training Accuracy: 50.5723%, Training Loss: 0.9858%
Epoch [22/300], Step [173/225], Training Accuracy: 50.5690%, Training Loss: 0.9854%
Epoch [22/300], Step [174/225], Training Accuracy: 50.5837%, Training Loss: 0.9854%
Epoch [22/300], Step [175/225], Training Accuracy: 50.5625%, Training Loss: 0.9855%
Epoch [22/300], Step [176/225], Training Accuracy: 50.5859%, Training Loss: 0.9853%
Epoch [22/300], Step [177/225], Training Accuracy: 50.5473%, Training Loss: 

Epoch [23/300], Step [47/225], Training Accuracy: 50.7979%, Training Loss: 0.9777%
Epoch [23/300], Step [48/225], Training Accuracy: 50.8464%, Training Loss: 0.9785%
Epoch [23/300], Step [49/225], Training Accuracy: 50.7334%, Training Loss: 0.9801%
Epoch [23/300], Step [50/225], Training Accuracy: 50.8750%, Training Loss: 0.9786%
Epoch [23/300], Step [51/225], Training Accuracy: 50.9498%, Training Loss: 0.9760%
Epoch [23/300], Step [52/225], Training Accuracy: 51.0817%, Training Loss: 0.9739%
Epoch [23/300], Step [53/225], Training Accuracy: 50.9434%, Training Loss: 0.9739%
Epoch [23/300], Step [54/225], Training Accuracy: 50.6944%, Training Loss: 0.9758%
Epoch [23/300], Step [55/225], Training Accuracy: 50.5398%, Training Loss: 0.9776%
Epoch [23/300], Step [56/225], Training Accuracy: 50.4743%, Training Loss: 0.9788%
Epoch [23/300], Step [57/225], Training Accuracy: 50.7127%, Training Loss: 0.9756%
Epoch [23/300], Step [58/225], Training Accuracy: 50.6466%, Training Loss: 0.9760%
Epoc

Epoch [23/300], Step [156/225], Training Accuracy: 50.9415%, Training Loss: 0.9792%
Epoch [23/300], Step [157/225], Training Accuracy: 50.9455%, Training Loss: 0.9797%
Epoch [23/300], Step [158/225], Training Accuracy: 50.9691%, Training Loss: 0.9798%
Epoch [23/300], Step [159/225], Training Accuracy: 50.9631%, Training Loss: 0.9795%
Epoch [23/300], Step [160/225], Training Accuracy: 50.9180%, Training Loss: 0.9795%
Epoch [23/300], Step [161/225], Training Accuracy: 51.0093%, Training Loss: 0.9785%
Epoch [23/300], Step [162/225], Training Accuracy: 51.0417%, Training Loss: 0.9787%
Epoch [23/300], Step [163/225], Training Accuracy: 50.9778%, Training Loss: 0.9784%
Epoch [23/300], Step [164/225], Training Accuracy: 51.0290%, Training Loss: 0.9774%
Epoch [23/300], Step [165/225], Training Accuracy: 51.0322%, Training Loss: 0.9772%
Epoch [23/300], Step [166/225], Training Accuracy: 51.0354%, Training Loss: 0.9774%
Epoch [23/300], Step [167/225], Training Accuracy: 51.0479%, Training Loss: 

Epoch [24/300], Step [46/225], Training Accuracy: 51.2908%, Training Loss: 0.9687%
Epoch [24/300], Step [47/225], Training Accuracy: 51.2965%, Training Loss: 0.9703%
Epoch [24/300], Step [48/225], Training Accuracy: 51.3021%, Training Loss: 0.9712%
Epoch [24/300], Step [49/225], Training Accuracy: 51.1798%, Training Loss: 0.9727%
Epoch [24/300], Step [50/225], Training Accuracy: 51.2812%, Training Loss: 0.9713%
Epoch [24/300], Step [51/225], Training Accuracy: 51.3480%, Training Loss: 0.9686%
Epoch [24/300], Step [52/225], Training Accuracy: 51.4724%, Training Loss: 0.9664%
Epoch [24/300], Step [53/225], Training Accuracy: 51.3267%, Training Loss: 0.9664%
Epoch [24/300], Step [54/225], Training Accuracy: 51.0127%, Training Loss: 0.9684%
Epoch [24/300], Step [55/225], Training Accuracy: 50.8807%, Training Loss: 0.9703%
Epoch [24/300], Step [56/225], Training Accuracy: 50.8371%, Training Loss: 0.9714%
Epoch [24/300], Step [57/225], Training Accuracy: 51.0417%, Training Loss: 0.9683%
Epoc

Epoch [24/300], Step [162/225], Training Accuracy: 51.2635%, Training Loss: 0.9713%
Epoch [24/300], Step [163/225], Training Accuracy: 51.1982%, Training Loss: 0.9710%
Epoch [24/300], Step [164/225], Training Accuracy: 51.2481%, Training Loss: 0.9700%
Epoch [24/300], Step [165/225], Training Accuracy: 51.2500%, Training Loss: 0.9698%
Epoch [24/300], Step [166/225], Training Accuracy: 51.2519%, Training Loss: 0.9699%
Epoch [24/300], Step [167/225], Training Accuracy: 51.2725%, Training Loss: 0.9692%
Epoch [24/300], Step [168/225], Training Accuracy: 51.2463%, Training Loss: 0.9694%
Epoch [24/300], Step [169/225], Training Accuracy: 51.2389%, Training Loss: 0.9694%
Epoch [24/300], Step [170/225], Training Accuracy: 51.2040%, Training Loss: 0.9700%
Epoch [24/300], Step [171/225], Training Accuracy: 51.2061%, Training Loss: 0.9699%
Epoch [24/300], Step [172/225], Training Accuracy: 51.1719%, Training Loss: 0.9705%
Epoch [24/300], Step [173/225], Training Accuracy: 51.1832%, Training Loss: 

Epoch [25/300], Step [46/225], Training Accuracy: 51.6304%, Training Loss: 0.9616%
Epoch [25/300], Step [47/225], Training Accuracy: 51.6290%, Training Loss: 0.9633%
Epoch [25/300], Step [48/225], Training Accuracy: 51.6276%, Training Loss: 0.9643%
Epoch [25/300], Step [49/225], Training Accuracy: 51.4987%, Training Loss: 0.9658%
Epoch [25/300], Step [50/225], Training Accuracy: 51.5625%, Training Loss: 0.9643%
Epoch [25/300], Step [51/225], Training Accuracy: 51.7157%, Training Loss: 0.9614%
Epoch [25/300], Step [52/225], Training Accuracy: 51.8329%, Training Loss: 0.9593%
Epoch [25/300], Step [53/225], Training Accuracy: 51.7394%, Training Loss: 0.9592%
Epoch [25/300], Step [54/225], Training Accuracy: 51.4468%, Training Loss: 0.9613%
Epoch [25/300], Step [55/225], Training Accuracy: 51.3636%, Training Loss: 0.9634%
Epoch [25/300], Step [56/225], Training Accuracy: 51.3672%, Training Loss: 0.9644%
Epoch [25/300], Step [57/225], Training Accuracy: 51.5625%, Training Loss: 0.9613%
Epoc

Epoch [25/300], Step [156/225], Training Accuracy: 51.4223%, Training Loss: 0.9648%
Epoch [25/300], Step [157/225], Training Accuracy: 51.4232%, Training Loss: 0.9652%
Epoch [25/300], Step [158/225], Training Accuracy: 51.4537%, Training Loss: 0.9654%
Epoch [25/300], Step [159/225], Training Accuracy: 51.4642%, Training Loss: 0.9650%
Epoch [25/300], Step [160/225], Training Accuracy: 51.4160%, Training Loss: 0.9650%
Epoch [25/300], Step [161/225], Training Accuracy: 51.5043%, Training Loss: 0.9640%
Epoch [25/300], Step [162/225], Training Accuracy: 51.5336%, Training Loss: 0.9642%
Epoch [25/300], Step [163/225], Training Accuracy: 51.4762%, Training Loss: 0.9639%
Epoch [25/300], Step [164/225], Training Accuracy: 51.5339%, Training Loss: 0.9629%
Epoch [25/300], Step [165/225], Training Accuracy: 51.5436%, Training Loss: 0.9627%
Epoch [25/300], Step [166/225], Training Accuracy: 51.5437%, Training Loss: 0.9628%
Epoch [25/300], Step [167/225], Training Accuracy: 51.5719%, Training Loss: 

Epoch [26/300], Step [40/225], Training Accuracy: 52.0703%, Training Loss: 0.9600%
Epoch [26/300], Step [41/225], Training Accuracy: 51.7912%, Training Loss: 0.9620%
Epoch [26/300], Step [42/225], Training Accuracy: 51.9345%, Training Loss: 0.9606%
Epoch [26/300], Step [43/225], Training Accuracy: 51.8532%, Training Loss: 0.9599%
Epoch [26/300], Step [44/225], Training Accuracy: 51.9176%, Training Loss: 0.9587%
Epoch [26/300], Step [45/225], Training Accuracy: 51.8403%, Training Loss: 0.9587%
Epoch [26/300], Step [46/225], Training Accuracy: 52.1399%, Training Loss: 0.9553%
Epoch [26/300], Step [47/225], Training Accuracy: 52.1609%, Training Loss: 0.9570%
Epoch [26/300], Step [48/225], Training Accuracy: 52.1810%, Training Loss: 0.9582%
Epoch [26/300], Step [49/225], Training Accuracy: 51.9770%, Training Loss: 0.9597%
Epoch [26/300], Step [50/225], Training Accuracy: 52.0000%, Training Loss: 0.9583%
Epoch [26/300], Step [51/225], Training Accuracy: 52.1446%, Training Loss: 0.9553%
Epoc

Epoch [26/300], Step [150/225], Training Accuracy: 51.9167%, Training Loss: 0.9586%
Epoch [26/300], Step [151/225], Training Accuracy: 51.9350%, Training Loss: 0.9580%
Epoch [26/300], Step [152/225], Training Accuracy: 51.9120%, Training Loss: 0.9580%
Epoch [26/300], Step [153/225], Training Accuracy: 51.9404%, Training Loss: 0.9575%
Epoch [26/300], Step [154/225], Training Accuracy: 51.9278%, Training Loss: 0.9570%
Epoch [26/300], Step [155/225], Training Accuracy: 51.8851%, Training Loss: 0.9581%
Epoch [26/300], Step [156/225], Training Accuracy: 51.8429%, Training Loss: 0.9583%
Epoch [26/300], Step [157/225], Training Accuracy: 51.8412%, Training Loss: 0.9586%
Epoch [26/300], Step [158/225], Training Accuracy: 51.8592%, Training Loss: 0.9588%
Epoch [26/300], Step [159/225], Training Accuracy: 51.8770%, Training Loss: 0.9585%
Epoch [26/300], Step [160/225], Training Accuracy: 51.8359%, Training Loss: 0.9584%
Epoch [26/300], Step [161/225], Training Accuracy: 51.9313%, Training Loss: 

Epoch [27/300], Step [36/225], Training Accuracy: 52.0833%, Training Loss: 0.9580%
Epoch [27/300], Step [37/225], Training Accuracy: 52.3649%, Training Loss: 0.9552%
Epoch [27/300], Step [38/225], Training Accuracy: 52.5905%, Training Loss: 0.9536%
Epoch [27/300], Step [39/225], Training Accuracy: 52.6442%, Training Loss: 0.9530%
Epoch [27/300], Step [40/225], Training Accuracy: 52.5781%, Training Loss: 0.9530%
Epoch [27/300], Step [41/225], Training Accuracy: 52.1723%, Training Loss: 0.9551%
Epoch [27/300], Step [42/225], Training Accuracy: 52.3065%, Training Loss: 0.9539%
Epoch [27/300], Step [43/225], Training Accuracy: 52.1802%, Training Loss: 0.9531%
Epoch [27/300], Step [44/225], Training Accuracy: 52.2372%, Training Loss: 0.9521%
Epoch [27/300], Step [45/225], Training Accuracy: 52.1875%, Training Loss: 0.9521%
Epoch [27/300], Step [46/225], Training Accuracy: 52.5136%, Training Loss: 0.9488%
Epoch [27/300], Step [47/225], Training Accuracy: 52.5266%, Training Loss: 0.9506%
Epoc

Epoch [27/300], Step [149/225], Training Accuracy: 52.2966%, Training Loss: 0.9518%
Epoch [27/300], Step [150/225], Training Accuracy: 52.2604%, Training Loss: 0.9523%
Epoch [27/300], Step [151/225], Training Accuracy: 52.2868%, Training Loss: 0.9517%
Epoch [27/300], Step [152/225], Training Accuracy: 52.2615%, Training Loss: 0.9517%
Epoch [27/300], Step [153/225], Training Accuracy: 52.2774%, Training Loss: 0.9512%
Epoch [27/300], Step [154/225], Training Accuracy: 52.2727%, Training Loss: 0.9506%
Epoch [27/300], Step [155/225], Training Accuracy: 52.2278%, Training Loss: 0.9517%
Epoch [27/300], Step [156/225], Training Accuracy: 52.1835%, Training Loss: 0.9520%
Epoch [27/300], Step [157/225], Training Accuracy: 52.1895%, Training Loss: 0.9523%
Epoch [27/300], Step [158/225], Training Accuracy: 52.1954%, Training Loss: 0.9525%
Epoch [27/300], Step [159/225], Training Accuracy: 52.2209%, Training Loss: 0.9522%
Epoch [27/300], Step [160/225], Training Accuracy: 52.2070%, Training Loss: 

Epoch [28/300], Step [33/225], Training Accuracy: 52.2727%, Training Loss: 0.9490%
Epoch [28/300], Step [34/225], Training Accuracy: 52.2978%, Training Loss: 0.9510%
Epoch [28/300], Step [35/225], Training Accuracy: 52.1875%, Training Loss: 0.9513%
Epoch [28/300], Step [36/225], Training Accuracy: 52.1701%, Training Loss: 0.9513%
Epoch [28/300], Step [37/225], Training Accuracy: 52.4493%, Training Loss: 0.9486%
Epoch [28/300], Step [38/225], Training Accuracy: 52.6727%, Training Loss: 0.9470%
Epoch [28/300], Step [39/225], Training Accuracy: 52.7644%, Training Loss: 0.9464%
Epoch [28/300], Step [40/225], Training Accuracy: 52.6953%, Training Loss: 0.9465%
Epoch [28/300], Step [41/225], Training Accuracy: 52.2866%, Training Loss: 0.9487%
Epoch [28/300], Step [42/225], Training Accuracy: 52.4182%, Training Loss: 0.9477%
Epoch [28/300], Step [43/225], Training Accuracy: 52.3256%, Training Loss: 0.9468%
Epoch [28/300], Step [44/225], Training Accuracy: 52.3793%, Training Loss: 0.9459%
Epoc

Epoch [28/300], Step [148/225], Training Accuracy: 52.4388%, Training Loss: 0.9457%
Epoch [28/300], Step [149/225], Training Accuracy: 52.4119%, Training Loss: 0.9458%
Epoch [28/300], Step [150/225], Training Accuracy: 52.3750%, Training Loss: 0.9463%
Epoch [28/300], Step [151/225], Training Accuracy: 52.4007%, Training Loss: 0.9457%
Epoch [28/300], Step [152/225], Training Accuracy: 52.3746%, Training Loss: 0.9457%
Epoch [28/300], Step [153/225], Training Accuracy: 52.3795%, Training Loss: 0.9452%
Epoch [28/300], Step [154/225], Training Accuracy: 52.3742%, Training Loss: 0.9446%
Epoch [28/300], Step [155/225], Training Accuracy: 52.3185%, Training Loss: 0.9458%
Epoch [28/300], Step [156/225], Training Accuracy: 52.2736%, Training Loss: 0.9460%
Epoch [28/300], Step [157/225], Training Accuracy: 52.2791%, Training Loss: 0.9464%
Epoch [28/300], Step [158/225], Training Accuracy: 52.2844%, Training Loss: 0.9466%
Epoch [28/300], Step [159/225], Training Accuracy: 52.3192%, Training Loss: 

Epoch [29/300], Step [34/225], Training Accuracy: 52.6195%, Training Loss: 0.9442%
Epoch [29/300], Step [35/225], Training Accuracy: 52.4554%, Training Loss: 0.9449%
Epoch [29/300], Step [36/225], Training Accuracy: 52.3872%, Training Loss: 0.9450%
Epoch [29/300], Step [37/225], Training Accuracy: 52.7027%, Training Loss: 0.9423%
Epoch [29/300], Step [38/225], Training Accuracy: 52.8783%, Training Loss: 0.9408%
Epoch [29/300], Step [39/225], Training Accuracy: 52.9247%, Training Loss: 0.9402%
Epoch [29/300], Step [40/225], Training Accuracy: 52.8906%, Training Loss: 0.9402%
Epoch [29/300], Step [41/225], Training Accuracy: 52.4771%, Training Loss: 0.9424%
Epoch [29/300], Step [42/225], Training Accuracy: 52.5670%, Training Loss: 0.9416%
Epoch [29/300], Step [43/225], Training Accuracy: 52.4709%, Training Loss: 0.9407%
Epoch [29/300], Step [44/225], Training Accuracy: 52.5213%, Training Loss: 0.9399%
Epoch [29/300], Step [45/225], Training Accuracy: 52.5000%, Training Loss: 0.9401%
Epoc

Epoch [29/300], Step [135/225], Training Accuracy: 52.6042%, Training Loss: 0.9434%
Epoch [29/300], Step [136/225], Training Accuracy: 52.5965%, Training Loss: 0.9427%
Epoch [29/300], Step [137/225], Training Accuracy: 52.6574%, Training Loss: 0.9419%
Epoch [29/300], Step [138/225], Training Accuracy: 52.7174%, Training Loss: 0.9407%
Epoch [29/300], Step [139/225], Training Accuracy: 52.6866%, Training Loss: 0.9409%
Epoch [29/300], Step [140/225], Training Accuracy: 52.7455%, Training Loss: 0.9407%
Epoch [29/300], Step [141/225], Training Accuracy: 52.7704%, Training Loss: 0.9404%
Epoch [29/300], Step [142/225], Training Accuracy: 52.8169%, Training Loss: 0.9404%
Epoch [29/300], Step [143/225], Training Accuracy: 52.8846%, Training Loss: 0.9399%
Epoch [29/300], Step [144/225], Training Accuracy: 52.8754%, Training Loss: 0.9397%
Epoch [29/300], Step [145/225], Training Accuracy: 52.9203%, Training Loss: 0.9389%
Epoch [29/300], Step [146/225], Training Accuracy: 52.9217%, Training Loss: 

Epoch [30/300], Step [22/225], Training Accuracy: 24.4318%, Training Loss: nan%
Epoch [30/300], Step [23/225], Training Accuracy: 24.4565%, Training Loss: nan%
Epoch [30/300], Step [24/225], Training Accuracy: 24.7396%, Training Loss: nan%
Epoch [30/300], Step [25/225], Training Accuracy: 24.7500%, Training Loss: nan%
Epoch [30/300], Step [26/225], Training Accuracy: 24.9399%, Training Loss: nan%
Epoch [30/300], Step [27/225], Training Accuracy: 24.7106%, Training Loss: nan%
Epoch [30/300], Step [28/225], Training Accuracy: 24.4978%, Training Loss: nan%
Epoch [30/300], Step [29/225], Training Accuracy: 24.7306%, Training Loss: nan%
Epoch [30/300], Step [30/225], Training Accuracy: 24.8438%, Training Loss: nan%
Epoch [30/300], Step [31/225], Training Accuracy: 24.6976%, Training Loss: nan%
Epoch [30/300], Step [32/225], Training Accuracy: 24.7559%, Training Loss: nan%
Epoch [30/300], Step [33/225], Training Accuracy: 24.7159%, Training Loss: nan%
Epoch [30/300], Step [34/225], Training 

Epoch [30/300], Step [128/225], Training Accuracy: 25.5737%, Training Loss: nan%
Epoch [30/300], Step [129/225], Training Accuracy: 25.6298%, Training Loss: nan%
Epoch [30/300], Step [130/225], Training Accuracy: 25.6370%, Training Loss: nan%
Epoch [30/300], Step [131/225], Training Accuracy: 25.6202%, Training Loss: nan%
Epoch [30/300], Step [132/225], Training Accuracy: 25.5682%, Training Loss: nan%
Epoch [30/300], Step [133/225], Training Accuracy: 25.5757%, Training Loss: nan%
Epoch [30/300], Step [134/225], Training Accuracy: 25.6297%, Training Loss: nan%
Epoch [30/300], Step [135/225], Training Accuracy: 25.6366%, Training Loss: nan%
Epoch [30/300], Step [136/225], Training Accuracy: 25.6893%, Training Loss: nan%
Epoch [30/300], Step [137/225], Training Accuracy: 25.6615%, Training Loss: nan%
Epoch [30/300], Step [138/225], Training Accuracy: 25.6567%, Training Loss: nan%
Epoch [30/300], Step [139/225], Training Accuracy: 25.6520%, Training Loss: nan%
Epoch [30/300], Step [140/22

Epoch [31/300], Step [17/225], Training Accuracy: 23.1618%, Training Loss: nan%
Epoch [31/300], Step [18/225], Training Accuracy: 23.6111%, Training Loss: nan%
Epoch [31/300], Step [19/225], Training Accuracy: 24.0954%, Training Loss: nan%
Epoch [31/300], Step [20/225], Training Accuracy: 24.5312%, Training Loss: nan%
Epoch [31/300], Step [21/225], Training Accuracy: 24.1815%, Training Loss: nan%
Epoch [31/300], Step [22/225], Training Accuracy: 24.4318%, Training Loss: nan%
Epoch [31/300], Step [23/225], Training Accuracy: 24.4565%, Training Loss: nan%
Epoch [31/300], Step [24/225], Training Accuracy: 24.7396%, Training Loss: nan%
Epoch [31/300], Step [25/225], Training Accuracy: 24.7500%, Training Loss: nan%
Epoch [31/300], Step [26/225], Training Accuracy: 24.9399%, Training Loss: nan%
Epoch [31/300], Step [27/225], Training Accuracy: 24.7106%, Training Loss: nan%
Epoch [31/300], Step [28/225], Training Accuracy: 24.4978%, Training Loss: nan%
Epoch [31/300], Step [29/225], Training 

Epoch [31/300], Step [130/225], Training Accuracy: 25.6370%, Training Loss: nan%
Epoch [31/300], Step [131/225], Training Accuracy: 25.6202%, Training Loss: nan%
Epoch [31/300], Step [132/225], Training Accuracy: 25.5682%, Training Loss: nan%
Epoch [31/300], Step [133/225], Training Accuracy: 25.5757%, Training Loss: nan%
Epoch [31/300], Step [134/225], Training Accuracy: 25.6297%, Training Loss: nan%
Epoch [31/300], Step [135/225], Training Accuracy: 25.6366%, Training Loss: nan%
Epoch [31/300], Step [136/225], Training Accuracy: 25.6893%, Training Loss: nan%
Epoch [31/300], Step [137/225], Training Accuracy: 25.6615%, Training Loss: nan%
Epoch [31/300], Step [138/225], Training Accuracy: 25.6567%, Training Loss: nan%
Epoch [31/300], Step [139/225], Training Accuracy: 25.6520%, Training Loss: nan%
Epoch [31/300], Step [140/225], Training Accuracy: 25.6138%, Training Loss: nan%
Epoch [31/300], Step [141/225], Training Accuracy: 25.5208%, Training Loss: nan%
Epoch [31/300], Step [142/22

Epoch [32/300], Step [19/225], Training Accuracy: 24.0954%, Training Loss: nan%
Epoch [32/300], Step [20/225], Training Accuracy: 24.5312%, Training Loss: nan%
Epoch [32/300], Step [21/225], Training Accuracy: 24.1815%, Training Loss: nan%
Epoch [32/300], Step [22/225], Training Accuracy: 24.4318%, Training Loss: nan%
Epoch [32/300], Step [23/225], Training Accuracy: 24.4565%, Training Loss: nan%
Epoch [32/300], Step [24/225], Training Accuracy: 24.7396%, Training Loss: nan%
Epoch [32/300], Step [25/225], Training Accuracy: 24.7500%, Training Loss: nan%
Epoch [32/300], Step [26/225], Training Accuracy: 24.9399%, Training Loss: nan%
Epoch [32/300], Step [27/225], Training Accuracy: 24.7106%, Training Loss: nan%
Epoch [32/300], Step [28/225], Training Accuracy: 24.4978%, Training Loss: nan%
Epoch [32/300], Step [29/225], Training Accuracy: 24.7306%, Training Loss: nan%
Epoch [32/300], Step [30/225], Training Accuracy: 24.8438%, Training Loss: nan%
Epoch [32/300], Step [31/225], Training 

Epoch [32/300], Step [124/225], Training Accuracy: 25.5418%, Training Loss: nan%
Epoch [32/300], Step [125/225], Training Accuracy: 25.5875%, Training Loss: nan%
Epoch [32/300], Step [126/225], Training Accuracy: 25.5580%, Training Loss: nan%
Epoch [32/300], Step [127/225], Training Accuracy: 25.5290%, Training Loss: nan%
Epoch [32/300], Step [128/225], Training Accuracy: 25.5737%, Training Loss: nan%
Epoch [32/300], Step [129/225], Training Accuracy: 25.6298%, Training Loss: nan%
Epoch [32/300], Step [130/225], Training Accuracy: 25.6370%, Training Loss: nan%
Epoch [32/300], Step [131/225], Training Accuracy: 25.6202%, Training Loss: nan%
Epoch [32/300], Step [132/225], Training Accuracy: 25.5682%, Training Loss: nan%
Epoch [32/300], Step [133/225], Training Accuracy: 25.5757%, Training Loss: nan%
Epoch [32/300], Step [134/225], Training Accuracy: 25.6297%, Training Loss: nan%
Epoch [32/300], Step [135/225], Training Accuracy: 25.6366%, Training Loss: nan%
Epoch [32/300], Step [136/22

Epoch [33/300], Step [15/225], Training Accuracy: 23.1250%, Training Loss: nan%
Epoch [33/300], Step [16/225], Training Accuracy: 23.3398%, Training Loss: nan%
Epoch [33/300], Step [17/225], Training Accuracy: 23.1618%, Training Loss: nan%
Epoch [33/300], Step [18/225], Training Accuracy: 23.6111%, Training Loss: nan%
Epoch [33/300], Step [19/225], Training Accuracy: 24.0954%, Training Loss: nan%
Epoch [33/300], Step [20/225], Training Accuracy: 24.5312%, Training Loss: nan%
Epoch [33/300], Step [21/225], Training Accuracy: 24.1815%, Training Loss: nan%
Epoch [33/300], Step [22/225], Training Accuracy: 24.4318%, Training Loss: nan%
Epoch [33/300], Step [23/225], Training Accuracy: 24.4565%, Training Loss: nan%
Epoch [33/300], Step [24/225], Training Accuracy: 24.7396%, Training Loss: nan%
Epoch [33/300], Step [25/225], Training Accuracy: 24.7500%, Training Loss: nan%
Epoch [33/300], Step [26/225], Training Accuracy: 24.9399%, Training Loss: nan%
Epoch [33/300], Step [27/225], Training 

Epoch [33/300], Step [125/225], Training Accuracy: 25.5875%, Training Loss: nan%
Epoch [33/300], Step [126/225], Training Accuracy: 25.5580%, Training Loss: nan%
Epoch [33/300], Step [127/225], Training Accuracy: 25.5290%, Training Loss: nan%
Epoch [33/300], Step [128/225], Training Accuracy: 25.5737%, Training Loss: nan%
Epoch [33/300], Step [129/225], Training Accuracy: 25.6298%, Training Loss: nan%
Epoch [33/300], Step [130/225], Training Accuracy: 25.6370%, Training Loss: nan%
Epoch [33/300], Step [131/225], Training Accuracy: 25.6202%, Training Loss: nan%
Epoch [33/300], Step [132/225], Training Accuracy: 25.5682%, Training Loss: nan%
Epoch [33/300], Step [133/225], Training Accuracy: 25.5757%, Training Loss: nan%
Epoch [33/300], Step [134/225], Training Accuracy: 25.6297%, Training Loss: nan%
Epoch [33/300], Step [135/225], Training Accuracy: 25.6366%, Training Loss: nan%
Epoch [33/300], Step [136/225], Training Accuracy: 25.6893%, Training Loss: nan%
Epoch [33/300], Step [137/22

Epoch [34/300], Step [12/225], Training Accuracy: 23.4375%, Training Loss: nan%
Epoch [34/300], Step [13/225], Training Accuracy: 22.5962%, Training Loss: nan%
Epoch [34/300], Step [14/225], Training Accuracy: 22.7679%, Training Loss: nan%
Epoch [34/300], Step [15/225], Training Accuracy: 23.1250%, Training Loss: nan%
Epoch [34/300], Step [16/225], Training Accuracy: 23.3398%, Training Loss: nan%
Epoch [34/300], Step [17/225], Training Accuracy: 23.1618%, Training Loss: nan%
Epoch [34/300], Step [18/225], Training Accuracy: 23.6111%, Training Loss: nan%
Epoch [34/300], Step [19/225], Training Accuracy: 24.0954%, Training Loss: nan%
Epoch [34/300], Step [20/225], Training Accuracy: 24.5312%, Training Loss: nan%
Epoch [34/300], Step [21/225], Training Accuracy: 24.1815%, Training Loss: nan%
Epoch [34/300], Step [22/225], Training Accuracy: 24.4318%, Training Loss: nan%
Epoch [34/300], Step [23/225], Training Accuracy: 24.4565%, Training Loss: nan%
Epoch [34/300], Step [24/225], Training 

Epoch [34/300], Step [123/225], Training Accuracy: 25.5716%, Training Loss: nan%
Epoch [34/300], Step [124/225], Training Accuracy: 25.5418%, Training Loss: nan%
Epoch [34/300], Step [125/225], Training Accuracy: 25.5875%, Training Loss: nan%
Epoch [34/300], Step [126/225], Training Accuracy: 25.5580%, Training Loss: nan%
Epoch [34/300], Step [127/225], Training Accuracy: 25.5290%, Training Loss: nan%
Epoch [34/300], Step [128/225], Training Accuracy: 25.5737%, Training Loss: nan%
Epoch [34/300], Step [129/225], Training Accuracy: 25.6298%, Training Loss: nan%
Epoch [34/300], Step [130/225], Training Accuracy: 25.6370%, Training Loss: nan%
Epoch [34/300], Step [131/225], Training Accuracy: 25.6202%, Training Loss: nan%
Epoch [34/300], Step [132/225], Training Accuracy: 25.5682%, Training Loss: nan%
Epoch [34/300], Step [133/225], Training Accuracy: 25.5757%, Training Loss: nan%
Epoch [34/300], Step [134/225], Training Accuracy: 25.6297%, Training Loss: nan%
Epoch [34/300], Step [135/22

Epoch [35/300], Step [7/225], Training Accuracy: 24.3304%, Training Loss: nan%
Epoch [35/300], Step [8/225], Training Accuracy: 23.8281%, Training Loss: nan%
Epoch [35/300], Step [9/225], Training Accuracy: 23.9583%, Training Loss: nan%
Epoch [35/300], Step [10/225], Training Accuracy: 23.9062%, Training Loss: nan%
Epoch [35/300], Step [11/225], Training Accuracy: 23.8636%, Training Loss: nan%
Epoch [35/300], Step [12/225], Training Accuracy: 23.4375%, Training Loss: nan%
Epoch [35/300], Step [13/225], Training Accuracy: 22.5962%, Training Loss: nan%
Epoch [35/300], Step [14/225], Training Accuracy: 22.7679%, Training Loss: nan%
Epoch [35/300], Step [15/225], Training Accuracy: 23.1250%, Training Loss: nan%
Epoch [35/300], Step [16/225], Training Accuracy: 23.3398%, Training Loss: nan%
Epoch [35/300], Step [17/225], Training Accuracy: 23.1618%, Training Loss: nan%
Epoch [35/300], Step [18/225], Training Accuracy: 23.6111%, Training Loss: nan%
Epoch [35/300], Step [19/225], Training Acc

Epoch [35/300], Step [119/225], Training Accuracy: 25.4596%, Training Loss: nan%
Epoch [35/300], Step [120/225], Training Accuracy: 25.4427%, Training Loss: nan%
Epoch [35/300], Step [121/225], Training Accuracy: 25.5424%, Training Loss: nan%
Epoch [35/300], Step [122/225], Training Accuracy: 25.5251%, Training Loss: nan%
Epoch [35/300], Step [123/225], Training Accuracy: 25.5716%, Training Loss: nan%
Epoch [35/300], Step [124/225], Training Accuracy: 25.5418%, Training Loss: nan%
Epoch [35/300], Step [125/225], Training Accuracy: 25.5875%, Training Loss: nan%
Epoch [35/300], Step [126/225], Training Accuracy: 25.5580%, Training Loss: nan%
Epoch [35/300], Step [127/225], Training Accuracy: 25.5290%, Training Loss: nan%
Epoch [35/300], Step [128/225], Training Accuracy: 25.5737%, Training Loss: nan%
Epoch [35/300], Step [129/225], Training Accuracy: 25.6298%, Training Loss: nan%
Epoch [35/300], Step [130/225], Training Accuracy: 25.6370%, Training Loss: nan%
Epoch [35/300], Step [131/22

Epoch [36/300], Step [7/225], Training Accuracy: 24.3304%, Training Loss: nan%
Epoch [36/300], Step [8/225], Training Accuracy: 23.8281%, Training Loss: nan%
Epoch [36/300], Step [9/225], Training Accuracy: 23.9583%, Training Loss: nan%
Epoch [36/300], Step [10/225], Training Accuracy: 23.9062%, Training Loss: nan%
Epoch [36/300], Step [11/225], Training Accuracy: 23.8636%, Training Loss: nan%
Epoch [36/300], Step [12/225], Training Accuracy: 23.4375%, Training Loss: nan%
Epoch [36/300], Step [13/225], Training Accuracy: 22.5962%, Training Loss: nan%
Epoch [36/300], Step [14/225], Training Accuracy: 22.7679%, Training Loss: nan%
Epoch [36/300], Step [15/225], Training Accuracy: 23.1250%, Training Loss: nan%
Epoch [36/300], Step [16/225], Training Accuracy: 23.3398%, Training Loss: nan%
Epoch [36/300], Step [17/225], Training Accuracy: 23.1618%, Training Loss: nan%
Epoch [36/300], Step [18/225], Training Accuracy: 23.6111%, Training Loss: nan%
Epoch [36/300], Step [19/225], Training Acc

Epoch [36/300], Step [117/225], Training Accuracy: 25.5609%, Training Loss: nan%
Epoch [36/300], Step [118/225], Training Accuracy: 25.4767%, Training Loss: nan%
Epoch [36/300], Step [119/225], Training Accuracy: 25.4596%, Training Loss: nan%
Epoch [36/300], Step [120/225], Training Accuracy: 25.4427%, Training Loss: nan%
Epoch [36/300], Step [121/225], Training Accuracy: 25.5424%, Training Loss: nan%
Epoch [36/300], Step [122/225], Training Accuracy: 25.5251%, Training Loss: nan%
Epoch [36/300], Step [123/225], Training Accuracy: 25.5716%, Training Loss: nan%
Epoch [36/300], Step [124/225], Training Accuracy: 25.5418%, Training Loss: nan%
Epoch [36/300], Step [125/225], Training Accuracy: 25.5875%, Training Loss: nan%
Epoch [36/300], Step [126/225], Training Accuracy: 25.5580%, Training Loss: nan%
Epoch [36/300], Step [127/225], Training Accuracy: 25.5290%, Training Loss: nan%
Epoch [36/300], Step [128/225], Training Accuracy: 25.5737%, Training Loss: nan%
Epoch [36/300], Step [129/22

Epoch [36/300], Step [220/225], Training Accuracy: 25.2699%, Training Loss: nan%
Epoch [36/300], Step [221/225], Training Accuracy: 25.2899%, Training Loss: nan%
Epoch [36/300], Step [222/225], Training Accuracy: 25.2463%, Training Loss: nan%
Epoch [36/300], Step [223/225], Training Accuracy: 25.2733%, Training Loss: nan%
Epoch [36/300], Step [224/225], Training Accuracy: 25.2581%, Training Loss: nan%
Epoch [36/300], Step [225/225], Training Accuracy: 25.2779%, Training Loss: nan%
Epoch [37/300], Step [1/225], Training Accuracy: 23.4375%, Training Loss: nan%
Epoch [37/300], Step [2/225], Training Accuracy: 24.2188%, Training Loss: nan%
Epoch [37/300], Step [3/225], Training Accuracy: 26.0417%, Training Loss: nan%
Epoch [37/300], Step [4/225], Training Accuracy: 24.6094%, Training Loss: nan%
Epoch [37/300], Step [5/225], Training Accuracy: 25.0000%, Training Loss: nan%
Epoch [37/300], Step [6/225], Training Accuracy: 25.2604%, Training Loss: nan%
Epoch [37/300], Step [7/225], Training A

Epoch [37/300], Step [107/225], Training Accuracy: 25.5111%, Training Loss: nan%
Epoch [37/300], Step [108/225], Training Accuracy: 25.6076%, Training Loss: nan%
Epoch [37/300], Step [109/225], Training Accuracy: 25.5447%, Training Loss: nan%
Epoch [37/300], Step [110/225], Training Accuracy: 25.5398%, Training Loss: nan%
Epoch [37/300], Step [111/225], Training Accuracy: 25.4927%, Training Loss: nan%
Epoch [37/300], Step [112/225], Training Accuracy: 25.5441%, Training Loss: nan%
Epoch [37/300], Step [113/225], Training Accuracy: 25.5254%, Training Loss: nan%
Epoch [37/300], Step [114/225], Training Accuracy: 25.6031%, Training Loss: nan%
Epoch [37/300], Step [115/225], Training Accuracy: 25.5842%, Training Loss: nan%
Epoch [37/300], Step [116/225], Training Accuracy: 25.5388%, Training Loss: nan%
Epoch [37/300], Step [117/225], Training Accuracy: 25.5609%, Training Loss: nan%
Epoch [37/300], Step [118/225], Training Accuracy: 25.4767%, Training Loss: nan%
Epoch [37/300], Step [119/22

Epoch [37/300], Step [221/225], Training Accuracy: 25.2899%, Training Loss: nan%
Epoch [37/300], Step [222/225], Training Accuracy: 25.2463%, Training Loss: nan%
Epoch [37/300], Step [223/225], Training Accuracy: 25.2733%, Training Loss: nan%
Epoch [37/300], Step [224/225], Training Accuracy: 25.2581%, Training Loss: nan%
Epoch [37/300], Step [225/225], Training Accuracy: 25.2779%, Training Loss: nan%
Epoch [38/300], Step [1/225], Training Accuracy: 23.4375%, Training Loss: nan%
Epoch [38/300], Step [2/225], Training Accuracy: 24.2188%, Training Loss: nan%
Epoch [38/300], Step [3/225], Training Accuracy: 26.0417%, Training Loss: nan%
Epoch [38/300], Step [4/225], Training Accuracy: 24.6094%, Training Loss: nan%
Epoch [38/300], Step [5/225], Training Accuracy: 25.0000%, Training Loss: nan%
Epoch [38/300], Step [6/225], Training Accuracy: 25.2604%, Training Loss: nan%
Epoch [38/300], Step [7/225], Training Accuracy: 24.3304%, Training Loss: nan%
Epoch [38/300], Step [8/225], Training Acc

Epoch [38/300], Step [106/225], Training Accuracy: 25.4717%, Training Loss: nan%
Epoch [38/300], Step [107/225], Training Accuracy: 25.5111%, Training Loss: nan%
Epoch [38/300], Step [108/225], Training Accuracy: 25.6076%, Training Loss: nan%
Epoch [38/300], Step [109/225], Training Accuracy: 25.5447%, Training Loss: nan%
Epoch [38/300], Step [110/225], Training Accuracy: 25.5398%, Training Loss: nan%
Epoch [38/300], Step [111/225], Training Accuracy: 25.4927%, Training Loss: nan%
Epoch [38/300], Step [112/225], Training Accuracy: 25.5441%, Training Loss: nan%
Epoch [38/300], Step [113/225], Training Accuracy: 25.5254%, Training Loss: nan%
Epoch [38/300], Step [114/225], Training Accuracy: 25.6031%, Training Loss: nan%
Epoch [38/300], Step [115/225], Training Accuracy: 25.5842%, Training Loss: nan%
Epoch [38/300], Step [116/225], Training Accuracy: 25.5388%, Training Loss: nan%
Epoch [38/300], Step [117/225], Training Accuracy: 25.5609%, Training Loss: nan%
Epoch [38/300], Step [118/22

Epoch [38/300], Step [218/225], Training Accuracy: 25.2652%, Training Loss: nan%
Epoch [38/300], Step [219/225], Training Accuracy: 25.2854%, Training Loss: nan%
Epoch [38/300], Step [220/225], Training Accuracy: 25.2699%, Training Loss: nan%
Epoch [38/300], Step [221/225], Training Accuracy: 25.2899%, Training Loss: nan%
Epoch [38/300], Step [222/225], Training Accuracy: 25.2463%, Training Loss: nan%
Epoch [38/300], Step [223/225], Training Accuracy: 25.2733%, Training Loss: nan%
Epoch [38/300], Step [224/225], Training Accuracy: 25.2581%, Training Loss: nan%
Epoch [38/300], Step [225/225], Training Accuracy: 25.2779%, Training Loss: nan%
Epoch [39/300], Step [1/225], Training Accuracy: 23.4375%, Training Loss: nan%
Epoch [39/300], Step [2/225], Training Accuracy: 24.2188%, Training Loss: nan%
Epoch [39/300], Step [3/225], Training Accuracy: 26.0417%, Training Loss: nan%
Epoch [39/300], Step [4/225], Training Accuracy: 24.6094%, Training Loss: nan%
Epoch [39/300], Step [5/225], Traini

Epoch [39/300], Step [102/225], Training Accuracy: 25.3370%, Training Loss: nan%
Epoch [39/300], Step [103/225], Training Accuracy: 25.3792%, Training Loss: nan%
Epoch [39/300], Step [104/225], Training Accuracy: 25.3906%, Training Loss: nan%
Epoch [39/300], Step [105/225], Training Accuracy: 25.3423%, Training Loss: nan%
Epoch [39/300], Step [106/225], Training Accuracy: 25.4717%, Training Loss: nan%
Epoch [39/300], Step [107/225], Training Accuracy: 25.5111%, Training Loss: nan%
Epoch [39/300], Step [108/225], Training Accuracy: 25.6076%, Training Loss: nan%
Epoch [39/300], Step [109/225], Training Accuracy: 25.5447%, Training Loss: nan%
Epoch [39/300], Step [110/225], Training Accuracy: 25.5398%, Training Loss: nan%
Epoch [39/300], Step [111/225], Training Accuracy: 25.4927%, Training Loss: nan%
Epoch [39/300], Step [112/225], Training Accuracy: 25.5441%, Training Loss: nan%
Epoch [39/300], Step [113/225], Training Accuracy: 25.5254%, Training Loss: nan%
Epoch [39/300], Step [114/22

Epoch [39/300], Step [215/225], Training Accuracy: 25.3125%, Training Loss: nan%
Epoch [39/300], Step [216/225], Training Accuracy: 25.2604%, Training Loss: nan%
Epoch [39/300], Step [217/225], Training Accuracy: 25.2592%, Training Loss: nan%
Epoch [39/300], Step [218/225], Training Accuracy: 25.2652%, Training Loss: nan%
Epoch [39/300], Step [219/225], Training Accuracy: 25.2854%, Training Loss: nan%
Epoch [39/300], Step [220/225], Training Accuracy: 25.2699%, Training Loss: nan%
Epoch [39/300], Step [221/225], Training Accuracy: 25.2899%, Training Loss: nan%
Epoch [39/300], Step [222/225], Training Accuracy: 25.2463%, Training Loss: nan%
Epoch [39/300], Step [223/225], Training Accuracy: 25.2733%, Training Loss: nan%
Epoch [39/300], Step [224/225], Training Accuracy: 25.2581%, Training Loss: nan%
Epoch [39/300], Step [225/225], Training Accuracy: 25.2779%, Training Loss: nan%
Epoch [40/300], Step [1/225], Training Accuracy: 23.4375%, Training Loss: nan%
Epoch [40/300], Step [2/225], 

Epoch [40/300], Step [101/225], Training Accuracy: 25.4177%, Training Loss: nan%
Epoch [40/300], Step [102/225], Training Accuracy: 25.3370%, Training Loss: nan%
Epoch [40/300], Step [103/225], Training Accuracy: 25.3792%, Training Loss: nan%
Epoch [40/300], Step [104/225], Training Accuracy: 25.3906%, Training Loss: nan%
Epoch [40/300], Step [105/225], Training Accuracy: 25.3423%, Training Loss: nan%
Epoch [40/300], Step [106/225], Training Accuracy: 25.4717%, Training Loss: nan%
Epoch [40/300], Step [107/225], Training Accuracy: 25.5111%, Training Loss: nan%
Epoch [40/300], Step [108/225], Training Accuracy: 25.6076%, Training Loss: nan%
Epoch [40/300], Step [109/225], Training Accuracy: 25.5447%, Training Loss: nan%
Epoch [40/300], Step [110/225], Training Accuracy: 25.5398%, Training Loss: nan%
Epoch [40/300], Step [111/225], Training Accuracy: 25.4927%, Training Loss: nan%
Epoch [40/300], Step [112/225], Training Accuracy: 25.5441%, Training Loss: nan%
Epoch [40/300], Step [113/22

Epoch [40/300], Step [218/225], Training Accuracy: 25.2652%, Training Loss: nan%
Epoch [40/300], Step [219/225], Training Accuracy: 25.2854%, Training Loss: nan%
Epoch [40/300], Step [220/225], Training Accuracy: 25.2699%, Training Loss: nan%
Epoch [40/300], Step [221/225], Training Accuracy: 25.2899%, Training Loss: nan%
Epoch [40/300], Step [222/225], Training Accuracy: 25.2463%, Training Loss: nan%
Epoch [40/300], Step [223/225], Training Accuracy: 25.2733%, Training Loss: nan%
Epoch [40/300], Step [224/225], Training Accuracy: 25.2581%, Training Loss: nan%
Epoch [40/300], Step [225/225], Training Accuracy: 25.2779%, Training Loss: nan%
Epoch [41/300], Step [1/225], Training Accuracy: 23.4375%, Training Loss: nan%
Epoch [41/300], Step [2/225], Training Accuracy: 24.2188%, Training Loss: nan%
Epoch [41/300], Step [3/225], Training Accuracy: 26.0417%, Training Loss: nan%
Epoch [41/300], Step [4/225], Training Accuracy: 24.6094%, Training Loss: nan%
Epoch [41/300], Step [5/225], Traini

Epoch [41/300], Step [107/225], Training Accuracy: 25.5111%, Training Loss: nan%
Epoch [41/300], Step [108/225], Training Accuracy: 25.6076%, Training Loss: nan%
Epoch [41/300], Step [109/225], Training Accuracy: 25.5447%, Training Loss: nan%
Epoch [41/300], Step [110/225], Training Accuracy: 25.5398%, Training Loss: nan%
Epoch [41/300], Step [111/225], Training Accuracy: 25.4927%, Training Loss: nan%
Epoch [41/300], Step [112/225], Training Accuracy: 25.5441%, Training Loss: nan%
Epoch [41/300], Step [113/225], Training Accuracy: 25.5254%, Training Loss: nan%
Epoch [41/300], Step [114/225], Training Accuracy: 25.6031%, Training Loss: nan%
Epoch [41/300], Step [115/225], Training Accuracy: 25.5842%, Training Loss: nan%
Epoch [41/300], Step [116/225], Training Accuracy: 25.5388%, Training Loss: nan%
Epoch [41/300], Step [117/225], Training Accuracy: 25.5609%, Training Loss: nan%
Epoch [41/300], Step [118/225], Training Accuracy: 25.4767%, Training Loss: nan%
Epoch [41/300], Step [119/22

Epoch [41/300], Step [217/225], Training Accuracy: 25.2592%, Training Loss: nan%
Epoch [41/300], Step [218/225], Training Accuracy: 25.2652%, Training Loss: nan%
Epoch [41/300], Step [219/225], Training Accuracy: 25.2854%, Training Loss: nan%
Epoch [41/300], Step [220/225], Training Accuracy: 25.2699%, Training Loss: nan%
Epoch [41/300], Step [221/225], Training Accuracy: 25.2899%, Training Loss: nan%
Epoch [41/300], Step [222/225], Training Accuracy: 25.2463%, Training Loss: nan%
Epoch [41/300], Step [223/225], Training Accuracy: 25.2733%, Training Loss: nan%
Epoch [41/300], Step [224/225], Training Accuracy: 25.2581%, Training Loss: nan%
Epoch [41/300], Step [225/225], Training Accuracy: 25.2779%, Training Loss: nan%
Epoch [42/300], Step [1/225], Training Accuracy: 23.4375%, Training Loss: nan%
Epoch [42/300], Step [2/225], Training Accuracy: 24.2188%, Training Loss: nan%
Epoch [42/300], Step [3/225], Training Accuracy: 26.0417%, Training Loss: nan%
Epoch [42/300], Step [4/225], Trai

Epoch [42/300], Step [103/225], Training Accuracy: 25.3792%, Training Loss: nan%
Epoch [42/300], Step [104/225], Training Accuracy: 25.3906%, Training Loss: nan%
Epoch [42/300], Step [105/225], Training Accuracy: 25.3423%, Training Loss: nan%
Epoch [42/300], Step [106/225], Training Accuracy: 25.4717%, Training Loss: nan%
Epoch [42/300], Step [107/225], Training Accuracy: 25.5111%, Training Loss: nan%
Epoch [42/300], Step [108/225], Training Accuracy: 25.6076%, Training Loss: nan%
Epoch [42/300], Step [109/225], Training Accuracy: 25.5447%, Training Loss: nan%
Epoch [42/300], Step [110/225], Training Accuracy: 25.5398%, Training Loss: nan%
Epoch [42/300], Step [111/225], Training Accuracy: 25.4927%, Training Loss: nan%
Epoch [42/300], Step [112/225], Training Accuracy: 25.5441%, Training Loss: nan%
Epoch [42/300], Step [113/225], Training Accuracy: 25.5254%, Training Loss: nan%
Epoch [42/300], Step [114/225], Training Accuracy: 25.6031%, Training Loss: nan%
Epoch [42/300], Step [115/22

Epoch [42/300], Step [214/225], Training Accuracy: 25.3724%, Training Loss: nan%
Epoch [42/300], Step [215/225], Training Accuracy: 25.3125%, Training Loss: nan%
Epoch [42/300], Step [216/225], Training Accuracy: 25.2604%, Training Loss: nan%
Epoch [42/300], Step [217/225], Training Accuracy: 25.2592%, Training Loss: nan%
Epoch [42/300], Step [218/225], Training Accuracy: 25.2652%, Training Loss: nan%
Epoch [42/300], Step [219/225], Training Accuracy: 25.2854%, Training Loss: nan%
Epoch [42/300], Step [220/225], Training Accuracy: 25.2699%, Training Loss: nan%
Epoch [42/300], Step [221/225], Training Accuracy: 25.2899%, Training Loss: nan%
Epoch [42/300], Step [222/225], Training Accuracy: 25.2463%, Training Loss: nan%
Epoch [42/300], Step [223/225], Training Accuracy: 25.2733%, Training Loss: nan%
Epoch [42/300], Step [224/225], Training Accuracy: 25.2581%, Training Loss: nan%
Epoch [42/300], Step [225/225], Training Accuracy: 25.2779%, Training Loss: nan%
Epoch [43/300], Step [1/225]

Epoch [43/300], Step [100/225], Training Accuracy: 25.3281%, Training Loss: nan%
Epoch [43/300], Step [101/225], Training Accuracy: 25.4177%, Training Loss: nan%
Epoch [43/300], Step [102/225], Training Accuracy: 25.3370%, Training Loss: nan%
Epoch [43/300], Step [103/225], Training Accuracy: 25.3792%, Training Loss: nan%
Epoch [43/300], Step [104/225], Training Accuracy: 25.3906%, Training Loss: nan%
Epoch [43/300], Step [105/225], Training Accuracy: 25.3423%, Training Loss: nan%
Epoch [43/300], Step [106/225], Training Accuracy: 25.4717%, Training Loss: nan%
Epoch [43/300], Step [107/225], Training Accuracy: 25.5111%, Training Loss: nan%
Epoch [43/300], Step [108/225], Training Accuracy: 25.6076%, Training Loss: nan%
Epoch [43/300], Step [109/225], Training Accuracy: 25.5447%, Training Loss: nan%
Epoch [43/300], Step [110/225], Training Accuracy: 25.5398%, Training Loss: nan%
Epoch [43/300], Step [111/225], Training Accuracy: 25.4927%, Training Loss: nan%
Epoch [43/300], Step [112/22

Epoch [43/300], Step [211/225], Training Accuracy: 25.3406%, Training Loss: nan%
Epoch [43/300], Step [212/225], Training Accuracy: 25.3685%, Training Loss: nan%
Epoch [43/300], Step [213/225], Training Accuracy: 25.3815%, Training Loss: nan%
Epoch [43/300], Step [214/225], Training Accuracy: 25.3724%, Training Loss: nan%
Epoch [43/300], Step [215/225], Training Accuracy: 25.3125%, Training Loss: nan%
Epoch [43/300], Step [216/225], Training Accuracy: 25.2604%, Training Loss: nan%
Epoch [43/300], Step [217/225], Training Accuracy: 25.2592%, Training Loss: nan%
Epoch [43/300], Step [218/225], Training Accuracy: 25.2652%, Training Loss: nan%
Epoch [43/300], Step [219/225], Training Accuracy: 25.2854%, Training Loss: nan%
Epoch [43/300], Step [220/225], Training Accuracy: 25.2699%, Training Loss: nan%
Epoch [43/300], Step [221/225], Training Accuracy: 25.2899%, Training Loss: nan%
Epoch [43/300], Step [222/225], Training Accuracy: 25.2463%, Training Loss: nan%
Epoch [43/300], Step [223/22

Epoch [44/300], Step [97/225], Training Accuracy: 25.1772%, Training Loss: nan%
Epoch [44/300], Step [98/225], Training Accuracy: 25.2073%, Training Loss: nan%
Epoch [44/300], Step [99/225], Training Accuracy: 25.2841%, Training Loss: nan%
Epoch [44/300], Step [100/225], Training Accuracy: 25.3281%, Training Loss: nan%
Epoch [44/300], Step [101/225], Training Accuracy: 25.4177%, Training Loss: nan%
Epoch [44/300], Step [102/225], Training Accuracy: 25.3370%, Training Loss: nan%
Epoch [44/300], Step [103/225], Training Accuracy: 25.3792%, Training Loss: nan%
Epoch [44/300], Step [104/225], Training Accuracy: 25.3906%, Training Loss: nan%
Epoch [44/300], Step [105/225], Training Accuracy: 25.3423%, Training Loss: nan%
Epoch [44/300], Step [106/225], Training Accuracy: 25.4717%, Training Loss: nan%
Epoch [44/300], Step [107/225], Training Accuracy: 25.5111%, Training Loss: nan%
Epoch [44/300], Step [108/225], Training Accuracy: 25.6076%, Training Loss: nan%
Epoch [44/300], Step [109/225],

Epoch [44/300], Step [209/225], Training Accuracy: 25.3514%, Training Loss: nan%
Epoch [44/300], Step [210/225], Training Accuracy: 25.3720%, Training Loss: nan%
Epoch [44/300], Step [211/225], Training Accuracy: 25.3406%, Training Loss: nan%
Epoch [44/300], Step [212/225], Training Accuracy: 25.3685%, Training Loss: nan%
Epoch [44/300], Step [213/225], Training Accuracy: 25.3815%, Training Loss: nan%
Epoch [44/300], Step [214/225], Training Accuracy: 25.3724%, Training Loss: nan%
Epoch [44/300], Step [215/225], Training Accuracy: 25.3125%, Training Loss: nan%
Epoch [44/300], Step [216/225], Training Accuracy: 25.2604%, Training Loss: nan%
Epoch [44/300], Step [217/225], Training Accuracy: 25.2592%, Training Loss: nan%
Epoch [44/300], Step [218/225], Training Accuracy: 25.2652%, Training Loss: nan%
Epoch [44/300], Step [219/225], Training Accuracy: 25.2854%, Training Loss: nan%
Epoch [44/300], Step [220/225], Training Accuracy: 25.2699%, Training Loss: nan%
Epoch [44/300], Step [221/22

Epoch [45/300], Step [101/225], Training Accuracy: 25.4177%, Training Loss: nan%
Epoch [45/300], Step [102/225], Training Accuracy: 25.3370%, Training Loss: nan%
Epoch [45/300], Step [103/225], Training Accuracy: 25.3792%, Training Loss: nan%
Epoch [45/300], Step [104/225], Training Accuracy: 25.3906%, Training Loss: nan%
Epoch [45/300], Step [105/225], Training Accuracy: 25.3423%, Training Loss: nan%
Epoch [45/300], Step [106/225], Training Accuracy: 25.4717%, Training Loss: nan%
Epoch [45/300], Step [107/225], Training Accuracy: 25.5111%, Training Loss: nan%
Epoch [45/300], Step [108/225], Training Accuracy: 25.6076%, Training Loss: nan%
Epoch [45/300], Step [109/225], Training Accuracy: 25.5447%, Training Loss: nan%
Epoch [45/300], Step [110/225], Training Accuracy: 25.5398%, Training Loss: nan%
Epoch [45/300], Step [111/225], Training Accuracy: 25.4927%, Training Loss: nan%
Epoch [45/300], Step [112/225], Training Accuracy: 25.5441%, Training Loss: nan%
Epoch [45/300], Step [113/22

Epoch [45/300], Step [214/225], Training Accuracy: 25.3724%, Training Loss: nan%
Epoch [45/300], Step [215/225], Training Accuracy: 25.3125%, Training Loss: nan%
Epoch [45/300], Step [216/225], Training Accuracy: 25.2604%, Training Loss: nan%
Epoch [45/300], Step [217/225], Training Accuracy: 25.2592%, Training Loss: nan%
Epoch [45/300], Step [218/225], Training Accuracy: 25.2652%, Training Loss: nan%
Epoch [45/300], Step [219/225], Training Accuracy: 25.2854%, Training Loss: nan%
Epoch [45/300], Step [220/225], Training Accuracy: 25.2699%, Training Loss: nan%
Epoch [45/300], Step [221/225], Training Accuracy: 25.2899%, Training Loss: nan%
Epoch [45/300], Step [222/225], Training Accuracy: 25.2463%, Training Loss: nan%
Epoch [45/300], Step [223/225], Training Accuracy: 25.2733%, Training Loss: nan%
Epoch [45/300], Step [224/225], Training Accuracy: 25.2581%, Training Loss: nan%
Epoch [45/300], Step [225/225], Training Accuracy: 25.2779%, Training Loss: nan%
Epoch [46/300], Step [1/225]

Epoch [46/300], Step [95/225], Training Accuracy: 25.1974%, Training Loss: nan%
Epoch [46/300], Step [96/225], Training Accuracy: 25.2279%, Training Loss: nan%
Epoch [46/300], Step [97/225], Training Accuracy: 25.1772%, Training Loss: nan%
Epoch [46/300], Step [98/225], Training Accuracy: 25.2073%, Training Loss: nan%
Epoch [46/300], Step [99/225], Training Accuracy: 25.2841%, Training Loss: nan%
Epoch [46/300], Step [100/225], Training Accuracy: 25.3281%, Training Loss: nan%
Epoch [46/300], Step [101/225], Training Accuracy: 25.4177%, Training Loss: nan%
Epoch [46/300], Step [102/225], Training Accuracy: 25.3370%, Training Loss: nan%
Epoch [46/300], Step [103/225], Training Accuracy: 25.3792%, Training Loss: nan%
Epoch [46/300], Step [104/225], Training Accuracy: 25.3906%, Training Loss: nan%
Epoch [46/300], Step [105/225], Training Accuracy: 25.3423%, Training Loss: nan%
Epoch [46/300], Step [106/225], Training Accuracy: 25.4717%, Training Loss: nan%
Epoch [46/300], Step [107/225], T

Epoch [46/300], Step [208/225], Training Accuracy: 25.3155%, Training Loss: nan%
Epoch [46/300], Step [209/225], Training Accuracy: 25.3514%, Training Loss: nan%
Epoch [46/300], Step [210/225], Training Accuracy: 25.3720%, Training Loss: nan%
Epoch [46/300], Step [211/225], Training Accuracy: 25.3406%, Training Loss: nan%
Epoch [46/300], Step [212/225], Training Accuracy: 25.3685%, Training Loss: nan%
Epoch [46/300], Step [213/225], Training Accuracy: 25.3815%, Training Loss: nan%
Epoch [46/300], Step [214/225], Training Accuracy: 25.3724%, Training Loss: nan%
Epoch [46/300], Step [215/225], Training Accuracy: 25.3125%, Training Loss: nan%
Epoch [46/300], Step [216/225], Training Accuracy: 25.2604%, Training Loss: nan%
Epoch [46/300], Step [217/225], Training Accuracy: 25.2592%, Training Loss: nan%
Epoch [46/300], Step [218/225], Training Accuracy: 25.2652%, Training Loss: nan%
Epoch [46/300], Step [219/225], Training Accuracy: 25.2854%, Training Loss: nan%
Epoch [46/300], Step [220/22

Epoch [47/300], Step [94/225], Training Accuracy: 25.1662%, Training Loss: nan%
Epoch [47/300], Step [95/225], Training Accuracy: 25.1974%, Training Loss: nan%
Epoch [47/300], Step [96/225], Training Accuracy: 25.2279%, Training Loss: nan%
Epoch [47/300], Step [97/225], Training Accuracy: 25.1772%, Training Loss: nan%
Epoch [47/300], Step [98/225], Training Accuracy: 25.2073%, Training Loss: nan%
Epoch [47/300], Step [99/225], Training Accuracy: 25.2841%, Training Loss: nan%
Epoch [47/300], Step [100/225], Training Accuracy: 25.3281%, Training Loss: nan%
Epoch [47/300], Step [101/225], Training Accuracy: 25.4177%, Training Loss: nan%
Epoch [47/300], Step [102/225], Training Accuracy: 25.3370%, Training Loss: nan%
Epoch [47/300], Step [103/225], Training Accuracy: 25.3792%, Training Loss: nan%
Epoch [47/300], Step [104/225], Training Accuracy: 25.3906%, Training Loss: nan%
Epoch [47/300], Step [105/225], Training Accuracy: 25.3423%, Training Loss: nan%
Epoch [47/300], Step [106/225], Tr

Epoch [47/300], Step [210/225], Training Accuracy: 25.3720%, Training Loss: nan%
Epoch [47/300], Step [211/225], Training Accuracy: 25.3406%, Training Loss: nan%
Epoch [47/300], Step [212/225], Training Accuracy: 25.3685%, Training Loss: nan%
Epoch [47/300], Step [213/225], Training Accuracy: 25.3815%, Training Loss: nan%
Epoch [47/300], Step [214/225], Training Accuracy: 25.3724%, Training Loss: nan%
Epoch [47/300], Step [215/225], Training Accuracy: 25.3125%, Training Loss: nan%
Epoch [47/300], Step [216/225], Training Accuracy: 25.2604%, Training Loss: nan%
Epoch [47/300], Step [217/225], Training Accuracy: 25.2592%, Training Loss: nan%
Epoch [47/300], Step [218/225], Training Accuracy: 25.2652%, Training Loss: nan%
Epoch [47/300], Step [219/225], Training Accuracy: 25.2854%, Training Loss: nan%
Epoch [47/300], Step [220/225], Training Accuracy: 25.2699%, Training Loss: nan%
Epoch [47/300], Step [221/225], Training Accuracy: 25.2899%, Training Loss: nan%
Epoch [47/300], Step [222/22

Epoch [48/300], Step [97/225], Training Accuracy: 25.1772%, Training Loss: nan%
Epoch [48/300], Step [98/225], Training Accuracy: 25.2073%, Training Loss: nan%
Epoch [48/300], Step [99/225], Training Accuracy: 25.2841%, Training Loss: nan%
Epoch [48/300], Step [100/225], Training Accuracy: 25.3281%, Training Loss: nan%
Epoch [48/300], Step [101/225], Training Accuracy: 25.4177%, Training Loss: nan%
Epoch [48/300], Step [102/225], Training Accuracy: 25.3370%, Training Loss: nan%
Epoch [48/300], Step [103/225], Training Accuracy: 25.3792%, Training Loss: nan%
Epoch [48/300], Step [104/225], Training Accuracy: 25.3906%, Training Loss: nan%
Epoch [48/300], Step [105/225], Training Accuracy: 25.3423%, Training Loss: nan%
Epoch [48/300], Step [106/225], Training Accuracy: 25.4717%, Training Loss: nan%
Epoch [48/300], Step [107/225], Training Accuracy: 25.5111%, Training Loss: nan%
Epoch [48/300], Step [108/225], Training Accuracy: 25.6076%, Training Loss: nan%
Epoch [48/300], Step [109/225],

Epoch [48/300], Step [203/225], Training Accuracy: 25.2771%, Training Loss: nan%
Epoch [48/300], Step [204/225], Training Accuracy: 25.3217%, Training Loss: nan%
Epoch [48/300], Step [205/225], Training Accuracy: 25.2973%, Training Loss: nan%
Epoch [48/300], Step [206/225], Training Accuracy: 25.3110%, Training Loss: nan%
Epoch [48/300], Step [207/225], Training Accuracy: 25.3170%, Training Loss: nan%
Epoch [48/300], Step [208/225], Training Accuracy: 25.3155%, Training Loss: nan%
Epoch [48/300], Step [209/225], Training Accuracy: 25.3514%, Training Loss: nan%
Epoch [48/300], Step [210/225], Training Accuracy: 25.3720%, Training Loss: nan%
Epoch [48/300], Step [211/225], Training Accuracy: 25.3406%, Training Loss: nan%
Epoch [48/300], Step [212/225], Training Accuracy: 25.3685%, Training Loss: nan%
Epoch [48/300], Step [213/225], Training Accuracy: 25.3815%, Training Loss: nan%
Epoch [48/300], Step [214/225], Training Accuracy: 25.3724%, Training Loss: nan%
Epoch [48/300], Step [215/22

Epoch [49/300], Step [88/225], Training Accuracy: 25.1776%, Training Loss: nan%
Epoch [49/300], Step [89/225], Training Accuracy: 25.1580%, Training Loss: nan%
Epoch [49/300], Step [90/225], Training Accuracy: 25.0694%, Training Loss: nan%
Epoch [49/300], Step [91/225], Training Accuracy: 25.1030%, Training Loss: nan%
Epoch [49/300], Step [92/225], Training Accuracy: 25.0510%, Training Loss: nan%
Epoch [49/300], Step [93/225], Training Accuracy: 25.1176%, Training Loss: nan%
Epoch [49/300], Step [94/225], Training Accuracy: 25.1662%, Training Loss: nan%
Epoch [49/300], Step [95/225], Training Accuracy: 25.1974%, Training Loss: nan%
Epoch [49/300], Step [96/225], Training Accuracy: 25.2279%, Training Loss: nan%
Epoch [49/300], Step [97/225], Training Accuracy: 25.1772%, Training Loss: nan%
Epoch [49/300], Step [98/225], Training Accuracy: 25.2073%, Training Loss: nan%
Epoch [49/300], Step [99/225], Training Accuracy: 25.2841%, Training Loss: nan%
Epoch [49/300], Step [100/225], Training

Epoch [49/300], Step [200/225], Training Accuracy: 25.2734%, Training Loss: nan%
Epoch [49/300], Step [201/225], Training Accuracy: 25.2954%, Training Loss: nan%
Epoch [49/300], Step [202/225], Training Accuracy: 25.2553%, Training Loss: nan%
Epoch [49/300], Step [203/225], Training Accuracy: 25.2771%, Training Loss: nan%
Epoch [49/300], Step [204/225], Training Accuracy: 25.3217%, Training Loss: nan%
Epoch [49/300], Step [205/225], Training Accuracy: 25.2973%, Training Loss: nan%
Epoch [49/300], Step [206/225], Training Accuracy: 25.3110%, Training Loss: nan%
Epoch [49/300], Step [207/225], Training Accuracy: 25.3170%, Training Loss: nan%
Epoch [49/300], Step [208/225], Training Accuracy: 25.3155%, Training Loss: nan%
Epoch [49/300], Step [209/225], Training Accuracy: 25.3514%, Training Loss: nan%
Epoch [49/300], Step [210/225], Training Accuracy: 25.3720%, Training Loss: nan%
Epoch [49/300], Step [211/225], Training Accuracy: 25.3406%, Training Loss: nan%
Epoch [49/300], Step [212/22

Epoch [50/300], Step [86/225], Training Accuracy: 25.1453%, Training Loss: nan%
Epoch [50/300], Step [87/225], Training Accuracy: 25.1616%, Training Loss: nan%
Epoch [50/300], Step [88/225], Training Accuracy: 25.1776%, Training Loss: nan%
Epoch [50/300], Step [89/225], Training Accuracy: 25.1580%, Training Loss: nan%
Epoch [50/300], Step [90/225], Training Accuracy: 25.0694%, Training Loss: nan%
Epoch [50/300], Step [91/225], Training Accuracy: 25.1030%, Training Loss: nan%
Epoch [50/300], Step [92/225], Training Accuracy: 25.0510%, Training Loss: nan%
Epoch [50/300], Step [93/225], Training Accuracy: 25.1176%, Training Loss: nan%
Epoch [50/300], Step [94/225], Training Accuracy: 25.1662%, Training Loss: nan%
Epoch [50/300], Step [95/225], Training Accuracy: 25.1974%, Training Loss: nan%
Epoch [50/300], Step [96/225], Training Accuracy: 25.2279%, Training Loss: nan%
Epoch [50/300], Step [97/225], Training Accuracy: 25.1772%, Training Loss: nan%
Epoch [50/300], Step [98/225], Training 

Epoch [50/300], Step [197/225], Training Accuracy: 25.3569%, Training Loss: nan%
Epoch [50/300], Step [198/225], Training Accuracy: 25.3314%, Training Loss: nan%
Epoch [50/300], Step [199/225], Training Accuracy: 25.3141%, Training Loss: nan%
Epoch [50/300], Step [200/225], Training Accuracy: 25.2734%, Training Loss: nan%
Epoch [50/300], Step [201/225], Training Accuracy: 25.2954%, Training Loss: nan%
Epoch [50/300], Step [202/225], Training Accuracy: 25.2553%, Training Loss: nan%
Epoch [50/300], Step [203/225], Training Accuracy: 25.2771%, Training Loss: nan%
Epoch [50/300], Step [204/225], Training Accuracy: 25.3217%, Training Loss: nan%
Epoch [50/300], Step [205/225], Training Accuracy: 25.2973%, Training Loss: nan%
Epoch [50/300], Step [206/225], Training Accuracy: 25.3110%, Training Loss: nan%
Epoch [50/300], Step [207/225], Training Accuracy: 25.3170%, Training Loss: nan%
Epoch [50/300], Step [208/225], Training Accuracy: 25.3155%, Training Loss: nan%
Epoch [50/300], Step [209/22

Epoch [51/300], Step [80/225], Training Accuracy: 25.1758%, Training Loss: nan%
Epoch [51/300], Step [81/225], Training Accuracy: 25.1157%, Training Loss: nan%
Epoch [51/300], Step [82/225], Training Accuracy: 25.0953%, Training Loss: nan%
Epoch [51/300], Step [83/225], Training Accuracy: 25.0565%, Training Loss: nan%
Epoch [51/300], Step [84/225], Training Accuracy: 25.0930%, Training Loss: nan%
Epoch [51/300], Step [85/225], Training Accuracy: 25.1103%, Training Loss: nan%
Epoch [51/300], Step [86/225], Training Accuracy: 25.1453%, Training Loss: nan%
Epoch [51/300], Step [87/225], Training Accuracy: 25.1616%, Training Loss: nan%
Epoch [51/300], Step [88/225], Training Accuracy: 25.1776%, Training Loss: nan%
Epoch [51/300], Step [89/225], Training Accuracy: 25.1580%, Training Loss: nan%
Epoch [51/300], Step [90/225], Training Accuracy: 25.0694%, Training Loss: nan%
Epoch [51/300], Step [91/225], Training Accuracy: 25.1030%, Training Loss: nan%
Epoch [51/300], Step [92/225], Training 

Epoch [51/300], Step [197/225], Training Accuracy: 25.3569%, Training Loss: nan%
Epoch [51/300], Step [198/225], Training Accuracy: 25.3314%, Training Loss: nan%
Epoch [51/300], Step [199/225], Training Accuracy: 25.3141%, Training Loss: nan%
Epoch [51/300], Step [200/225], Training Accuracy: 25.2734%, Training Loss: nan%
Epoch [51/300], Step [201/225], Training Accuracy: 25.2954%, Training Loss: nan%
Epoch [51/300], Step [202/225], Training Accuracy: 25.2553%, Training Loss: nan%
Epoch [51/300], Step [203/225], Training Accuracy: 25.2771%, Training Loss: nan%
Epoch [51/300], Step [204/225], Training Accuracy: 25.3217%, Training Loss: nan%
Epoch [51/300], Step [205/225], Training Accuracy: 25.2973%, Training Loss: nan%
Epoch [51/300], Step [206/225], Training Accuracy: 25.3110%, Training Loss: nan%
Epoch [51/300], Step [207/225], Training Accuracy: 25.3170%, Training Loss: nan%
Epoch [51/300], Step [208/225], Training Accuracy: 25.3155%, Training Loss: nan%
Epoch [51/300], Step [209/22

Epoch [52/300], Step [83/225], Training Accuracy: 25.0565%, Training Loss: nan%
Epoch [52/300], Step [84/225], Training Accuracy: 25.0930%, Training Loss: nan%
Epoch [52/300], Step [85/225], Training Accuracy: 25.1103%, Training Loss: nan%
Epoch [52/300], Step [86/225], Training Accuracy: 25.1453%, Training Loss: nan%
Epoch [52/300], Step [87/225], Training Accuracy: 25.1616%, Training Loss: nan%
Epoch [52/300], Step [88/225], Training Accuracy: 25.1776%, Training Loss: nan%
Epoch [52/300], Step [89/225], Training Accuracy: 25.1580%, Training Loss: nan%
Epoch [52/300], Step [90/225], Training Accuracy: 25.0694%, Training Loss: nan%
Epoch [52/300], Step [91/225], Training Accuracy: 25.1030%, Training Loss: nan%
Epoch [52/300], Step [92/225], Training Accuracy: 25.0510%, Training Loss: nan%
Epoch [52/300], Step [93/225], Training Accuracy: 25.1176%, Training Loss: nan%
Epoch [52/300], Step [94/225], Training Accuracy: 25.1662%, Training Loss: nan%
Epoch [52/300], Step [95/225], Training 

Epoch [52/300], Step [194/225], Training Accuracy: 25.4269%, Training Loss: nan%
Epoch [52/300], Step [195/225], Training Accuracy: 25.3846%, Training Loss: nan%
Epoch [52/300], Step [196/225], Training Accuracy: 25.3667%, Training Loss: nan%
Epoch [52/300], Step [197/225], Training Accuracy: 25.3569%, Training Loss: nan%
Epoch [52/300], Step [198/225], Training Accuracy: 25.3314%, Training Loss: nan%
Epoch [52/300], Step [199/225], Training Accuracy: 25.3141%, Training Loss: nan%
Epoch [52/300], Step [200/225], Training Accuracy: 25.2734%, Training Loss: nan%
Epoch [52/300], Step [201/225], Training Accuracy: 25.2954%, Training Loss: nan%
Epoch [52/300], Step [202/225], Training Accuracy: 25.2553%, Training Loss: nan%
Epoch [52/300], Step [203/225], Training Accuracy: 25.2771%, Training Loss: nan%
Epoch [52/300], Step [204/225], Training Accuracy: 25.3217%, Training Loss: nan%
Epoch [52/300], Step [205/225], Training Accuracy: 25.2973%, Training Loss: nan%
Epoch [52/300], Step [206/22

Epoch [53/300], Step [78/225], Training Accuracy: 25.1402%, Training Loss: nan%
Epoch [53/300], Step [79/225], Training Accuracy: 25.1187%, Training Loss: nan%
Epoch [53/300], Step [80/225], Training Accuracy: 25.1758%, Training Loss: nan%
Epoch [53/300], Step [81/225], Training Accuracy: 25.1157%, Training Loss: nan%
Epoch [53/300], Step [82/225], Training Accuracy: 25.0953%, Training Loss: nan%
Epoch [53/300], Step [83/225], Training Accuracy: 25.0565%, Training Loss: nan%
Epoch [53/300], Step [84/225], Training Accuracy: 25.0930%, Training Loss: nan%
Epoch [53/300], Step [85/225], Training Accuracy: 25.1103%, Training Loss: nan%
Epoch [53/300], Step [86/225], Training Accuracy: 25.1453%, Training Loss: nan%
Epoch [53/300], Step [87/225], Training Accuracy: 25.1616%, Training Loss: nan%
Epoch [53/300], Step [88/225], Training Accuracy: 25.1776%, Training Loss: nan%
Epoch [53/300], Step [89/225], Training Accuracy: 25.1580%, Training Loss: nan%
Epoch [53/300], Step [90/225], Training 

Epoch [53/300], Step [189/225], Training Accuracy: 25.5787%, Training Loss: nan%
Epoch [53/300], Step [190/225], Training Accuracy: 25.5592%, Training Loss: nan%
Epoch [53/300], Step [191/225], Training Accuracy: 25.5154%, Training Loss: nan%
Epoch [53/300], Step [192/225], Training Accuracy: 25.4720%, Training Loss: nan%
Epoch [53/300], Step [193/225], Training Accuracy: 25.4534%, Training Loss: nan%
Epoch [53/300], Step [194/225], Training Accuracy: 25.4269%, Training Loss: nan%
Epoch [53/300], Step [195/225], Training Accuracy: 25.3846%, Training Loss: nan%
Epoch [53/300], Step [196/225], Training Accuracy: 25.3667%, Training Loss: nan%
Epoch [53/300], Step [197/225], Training Accuracy: 25.3569%, Training Loss: nan%
Epoch [53/300], Step [198/225], Training Accuracy: 25.3314%, Training Loss: nan%
Epoch [53/300], Step [199/225], Training Accuracy: 25.3141%, Training Loss: nan%
Epoch [53/300], Step [200/225], Training Accuracy: 25.2734%, Training Loss: nan%
Epoch [53/300], Step [201/22

Epoch [54/300], Step [80/225], Training Accuracy: 25.1758%, Training Loss: nan%
Epoch [54/300], Step [81/225], Training Accuracy: 25.1157%, Training Loss: nan%
Epoch [54/300], Step [82/225], Training Accuracy: 25.0953%, Training Loss: nan%
Epoch [54/300], Step [83/225], Training Accuracy: 25.0565%, Training Loss: nan%
Epoch [54/300], Step [84/225], Training Accuracy: 25.0930%, Training Loss: nan%
Epoch [54/300], Step [85/225], Training Accuracy: 25.1103%, Training Loss: nan%
Epoch [54/300], Step [86/225], Training Accuracy: 25.1453%, Training Loss: nan%
Epoch [54/300], Step [87/225], Training Accuracy: 25.1616%, Training Loss: nan%
Epoch [54/300], Step [88/225], Training Accuracy: 25.1776%, Training Loss: nan%
Epoch [54/300], Step [89/225], Training Accuracy: 25.1580%, Training Loss: nan%
Epoch [54/300], Step [90/225], Training Accuracy: 25.0694%, Training Loss: nan%
Epoch [54/300], Step [91/225], Training Accuracy: 25.1030%, Training Loss: nan%
Epoch [54/300], Step [92/225], Training 

Epoch [54/300], Step [194/225], Training Accuracy: 25.4269%, Training Loss: nan%
Epoch [54/300], Step [195/225], Training Accuracy: 25.3846%, Training Loss: nan%
Epoch [54/300], Step [196/225], Training Accuracy: 25.3667%, Training Loss: nan%
Epoch [54/300], Step [197/225], Training Accuracy: 25.3569%, Training Loss: nan%
Epoch [54/300], Step [198/225], Training Accuracy: 25.3314%, Training Loss: nan%
Epoch [54/300], Step [199/225], Training Accuracy: 25.3141%, Training Loss: nan%
Epoch [54/300], Step [200/225], Training Accuracy: 25.2734%, Training Loss: nan%
Epoch [54/300], Step [201/225], Training Accuracy: 25.2954%, Training Loss: nan%
Epoch [54/300], Step [202/225], Training Accuracy: 25.2553%, Training Loss: nan%
Epoch [54/300], Step [203/225], Training Accuracy: 25.2771%, Training Loss: nan%
Epoch [54/300], Step [204/225], Training Accuracy: 25.3217%, Training Loss: nan%
Epoch [54/300], Step [205/225], Training Accuracy: 25.2973%, Training Loss: nan%
Epoch [54/300], Step [206/22

Epoch [55/300], Step [84/225], Training Accuracy: 25.0930%, Training Loss: nan%
Epoch [55/300], Step [85/225], Training Accuracy: 25.1103%, Training Loss: nan%
Epoch [55/300], Step [86/225], Training Accuracy: 25.1453%, Training Loss: nan%
Epoch [55/300], Step [87/225], Training Accuracy: 25.1616%, Training Loss: nan%
Epoch [55/300], Step [88/225], Training Accuracy: 25.1776%, Training Loss: nan%
Epoch [55/300], Step [89/225], Training Accuracy: 25.1580%, Training Loss: nan%
Epoch [55/300], Step [90/225], Training Accuracy: 25.0694%, Training Loss: nan%
Epoch [55/300], Step [91/225], Training Accuracy: 25.1030%, Training Loss: nan%
Epoch [55/300], Step [92/225], Training Accuracy: 25.0510%, Training Loss: nan%
Epoch [55/300], Step [93/225], Training Accuracy: 25.1176%, Training Loss: nan%
Epoch [55/300], Step [94/225], Training Accuracy: 25.1662%, Training Loss: nan%
Epoch [55/300], Step [95/225], Training Accuracy: 25.1974%, Training Loss: nan%
Epoch [55/300], Step [96/225], Training 

Epoch [55/300], Step [194/225], Training Accuracy: 25.4269%, Training Loss: nan%
Epoch [55/300], Step [195/225], Training Accuracy: 25.3846%, Training Loss: nan%
Epoch [55/300], Step [196/225], Training Accuracy: 25.3667%, Training Loss: nan%
Epoch [55/300], Step [197/225], Training Accuracy: 25.3569%, Training Loss: nan%
Epoch [55/300], Step [198/225], Training Accuracy: 25.3314%, Training Loss: nan%
Epoch [55/300], Step [199/225], Training Accuracy: 25.3141%, Training Loss: nan%
Epoch [55/300], Step [200/225], Training Accuracy: 25.2734%, Training Loss: nan%
Epoch [55/300], Step [201/225], Training Accuracy: 25.2954%, Training Loss: nan%
Epoch [55/300], Step [202/225], Training Accuracy: 25.2553%, Training Loss: nan%
Epoch [55/300], Step [203/225], Training Accuracy: 25.2771%, Training Loss: nan%
Epoch [55/300], Step [204/225], Training Accuracy: 25.3217%, Training Loss: nan%
Epoch [55/300], Step [205/225], Training Accuracy: 25.2973%, Training Loss: nan%
Epoch [55/300], Step [206/22

Epoch [56/300], Step [80/225], Training Accuracy: 25.1758%, Training Loss: nan%
Epoch [56/300], Step [81/225], Training Accuracy: 25.1157%, Training Loss: nan%
Epoch [56/300], Step [82/225], Training Accuracy: 25.0953%, Training Loss: nan%
Epoch [56/300], Step [83/225], Training Accuracy: 25.0565%, Training Loss: nan%
Epoch [56/300], Step [84/225], Training Accuracy: 25.0930%, Training Loss: nan%
Epoch [56/300], Step [85/225], Training Accuracy: 25.1103%, Training Loss: nan%
Epoch [56/300], Step [86/225], Training Accuracy: 25.1453%, Training Loss: nan%
Epoch [56/300], Step [87/225], Training Accuracy: 25.1616%, Training Loss: nan%
Epoch [56/300], Step [88/225], Training Accuracy: 25.1776%, Training Loss: nan%
Epoch [56/300], Step [89/225], Training Accuracy: 25.1580%, Training Loss: nan%
Epoch [56/300], Step [90/225], Training Accuracy: 25.0694%, Training Loss: nan%
Epoch [56/300], Step [91/225], Training Accuracy: 25.1030%, Training Loss: nan%
Epoch [56/300], Step [92/225], Training 

Epoch [56/300], Step [194/225], Training Accuracy: 25.4269%, Training Loss: nan%
Epoch [56/300], Step [195/225], Training Accuracy: 25.3846%, Training Loss: nan%
Epoch [56/300], Step [196/225], Training Accuracy: 25.3667%, Training Loss: nan%
Epoch [56/300], Step [197/225], Training Accuracy: 25.3569%, Training Loss: nan%
Epoch [56/300], Step [198/225], Training Accuracy: 25.3314%, Training Loss: nan%
Epoch [56/300], Step [199/225], Training Accuracy: 25.3141%, Training Loss: nan%
Epoch [56/300], Step [200/225], Training Accuracy: 25.2734%, Training Loss: nan%
Epoch [56/300], Step [201/225], Training Accuracy: 25.2954%, Training Loss: nan%
Epoch [56/300], Step [202/225], Training Accuracy: 25.2553%, Training Loss: nan%
Epoch [56/300], Step [203/225], Training Accuracy: 25.2771%, Training Loss: nan%
Epoch [56/300], Step [204/225], Training Accuracy: 25.3217%, Training Loss: nan%
Epoch [56/300], Step [205/225], Training Accuracy: 25.2973%, Training Loss: nan%
Epoch [56/300], Step [206/22

Epoch [57/300], Step [81/225], Training Accuracy: 25.1157%, Training Loss: nan%
Epoch [57/300], Step [82/225], Training Accuracy: 25.0953%, Training Loss: nan%
Epoch [57/300], Step [83/225], Training Accuracy: 25.0565%, Training Loss: nan%
Epoch [57/300], Step [84/225], Training Accuracy: 25.0930%, Training Loss: nan%
Epoch [57/300], Step [85/225], Training Accuracy: 25.1103%, Training Loss: nan%
Epoch [57/300], Step [86/225], Training Accuracy: 25.1453%, Training Loss: nan%
Epoch [57/300], Step [87/225], Training Accuracy: 25.1616%, Training Loss: nan%
Epoch [57/300], Step [88/225], Training Accuracy: 25.1776%, Training Loss: nan%
Epoch [57/300], Step [89/225], Training Accuracy: 25.1580%, Training Loss: nan%
Epoch [57/300], Step [90/225], Training Accuracy: 25.0694%, Training Loss: nan%
Epoch [57/300], Step [91/225], Training Accuracy: 25.1030%, Training Loss: nan%
Epoch [57/300], Step [92/225], Training Accuracy: 25.0510%, Training Loss: nan%
Epoch [57/300], Step [93/225], Training 

Epoch [57/300], Step [197/225], Training Accuracy: 25.3569%, Training Loss: nan%
Epoch [57/300], Step [198/225], Training Accuracy: 25.3314%, Training Loss: nan%
Epoch [57/300], Step [199/225], Training Accuracy: 25.3141%, Training Loss: nan%
Epoch [57/300], Step [200/225], Training Accuracy: 25.2734%, Training Loss: nan%
Epoch [57/300], Step [201/225], Training Accuracy: 25.2954%, Training Loss: nan%
Epoch [57/300], Step [202/225], Training Accuracy: 25.2553%, Training Loss: nan%
Epoch [57/300], Step [203/225], Training Accuracy: 25.2771%, Training Loss: nan%
Epoch [57/300], Step [204/225], Training Accuracy: 25.3217%, Training Loss: nan%
Epoch [57/300], Step [205/225], Training Accuracy: 25.2973%, Training Loss: nan%
Epoch [57/300], Step [206/225], Training Accuracy: 25.3110%, Training Loss: nan%
Epoch [57/300], Step [207/225], Training Accuracy: 25.3170%, Training Loss: nan%
Epoch [57/300], Step [208/225], Training Accuracy: 25.3155%, Training Loss: nan%
Epoch [57/300], Step [209/22

Epoch [58/300], Step [81/225], Training Accuracy: 25.1157%, Training Loss: nan%
Epoch [58/300], Step [82/225], Training Accuracy: 25.0953%, Training Loss: nan%
Epoch [58/300], Step [83/225], Training Accuracy: 25.0565%, Training Loss: nan%
Epoch [58/300], Step [84/225], Training Accuracy: 25.0930%, Training Loss: nan%
Epoch [58/300], Step [85/225], Training Accuracy: 25.1103%, Training Loss: nan%
Epoch [58/300], Step [86/225], Training Accuracy: 25.1453%, Training Loss: nan%
Epoch [58/300], Step [87/225], Training Accuracy: 25.1616%, Training Loss: nan%
Epoch [58/300], Step [88/225], Training Accuracy: 25.1776%, Training Loss: nan%
Epoch [58/300], Step [89/225], Training Accuracy: 25.1580%, Training Loss: nan%
Epoch [58/300], Step [90/225], Training Accuracy: 25.0694%, Training Loss: nan%
Epoch [58/300], Step [91/225], Training Accuracy: 25.1030%, Training Loss: nan%
Epoch [58/300], Step [92/225], Training Accuracy: 25.0510%, Training Loss: nan%
Epoch [58/300], Step [93/225], Training 

Epoch [58/300], Step [196/225], Training Accuracy: 25.3667%, Training Loss: nan%
Epoch [58/300], Step [197/225], Training Accuracy: 25.3569%, Training Loss: nan%
Epoch [58/300], Step [198/225], Training Accuracy: 25.3314%, Training Loss: nan%
Epoch [58/300], Step [199/225], Training Accuracy: 25.3141%, Training Loss: nan%
Epoch [58/300], Step [200/225], Training Accuracy: 25.2734%, Training Loss: nan%
Epoch [58/300], Step [201/225], Training Accuracy: 25.2954%, Training Loss: nan%
Epoch [58/300], Step [202/225], Training Accuracy: 25.2553%, Training Loss: nan%
Epoch [58/300], Step [203/225], Training Accuracy: 25.2771%, Training Loss: nan%
Epoch [58/300], Step [204/225], Training Accuracy: 25.3217%, Training Loss: nan%
Epoch [58/300], Step [205/225], Training Accuracy: 25.2973%, Training Loss: nan%
Epoch [58/300], Step [206/225], Training Accuracy: 25.3110%, Training Loss: nan%
Epoch [58/300], Step [207/225], Training Accuracy: 25.3170%, Training Loss: nan%
Epoch [58/300], Step [208/22

Epoch [59/300], Step [83/225], Training Accuracy: 25.0565%, Training Loss: nan%
Epoch [59/300], Step [84/225], Training Accuracy: 25.0930%, Training Loss: nan%
Epoch [59/300], Step [85/225], Training Accuracy: 25.1103%, Training Loss: nan%
Epoch [59/300], Step [86/225], Training Accuracy: 25.1453%, Training Loss: nan%
Epoch [59/300], Step [87/225], Training Accuracy: 25.1616%, Training Loss: nan%
Epoch [59/300], Step [88/225], Training Accuracy: 25.1776%, Training Loss: nan%
Epoch [59/300], Step [89/225], Training Accuracy: 25.1580%, Training Loss: nan%
Epoch [59/300], Step [90/225], Training Accuracy: 25.0694%, Training Loss: nan%
Epoch [59/300], Step [91/225], Training Accuracy: 25.1030%, Training Loss: nan%
Epoch [59/300], Step [92/225], Training Accuracy: 25.0510%, Training Loss: nan%
Epoch [59/300], Step [93/225], Training Accuracy: 25.1176%, Training Loss: nan%
Epoch [59/300], Step [94/225], Training Accuracy: 25.1662%, Training Loss: nan%
Epoch [59/300], Step [95/225], Training 

Epoch [59/300], Step [197/225], Training Accuracy: 25.3569%, Training Loss: nan%
Epoch [59/300], Step [198/225], Training Accuracy: 25.3314%, Training Loss: nan%
Epoch [59/300], Step [199/225], Training Accuracy: 25.3141%, Training Loss: nan%
Epoch [59/300], Step [200/225], Training Accuracy: 25.2734%, Training Loss: nan%
Epoch [59/300], Step [201/225], Training Accuracy: 25.2954%, Training Loss: nan%
Epoch [59/300], Step [202/225], Training Accuracy: 25.2553%, Training Loss: nan%
Epoch [59/300], Step [203/225], Training Accuracy: 25.2771%, Training Loss: nan%
Epoch [59/300], Step [204/225], Training Accuracy: 25.3217%, Training Loss: nan%
Epoch [59/300], Step [205/225], Training Accuracy: 25.2973%, Training Loss: nan%
Epoch [59/300], Step [206/225], Training Accuracy: 25.3110%, Training Loss: nan%
Epoch [59/300], Step [207/225], Training Accuracy: 25.3170%, Training Loss: nan%
Epoch [59/300], Step [208/225], Training Accuracy: 25.3155%, Training Loss: nan%
Epoch [59/300], Step [209/22

Epoch [60/300], Step [76/225], Training Accuracy: 25.1439%, Training Loss: nan%
Epoch [60/300], Step [77/225], Training Accuracy: 25.0609%, Training Loss: nan%
Epoch [60/300], Step [78/225], Training Accuracy: 25.1402%, Training Loss: nan%
Epoch [60/300], Step [79/225], Training Accuracy: 25.1187%, Training Loss: nan%
Epoch [60/300], Step [80/225], Training Accuracy: 25.1758%, Training Loss: nan%
Epoch [60/300], Step [81/225], Training Accuracy: 25.1157%, Training Loss: nan%
Epoch [60/300], Step [82/225], Training Accuracy: 25.0953%, Training Loss: nan%
Epoch [60/300], Step [83/225], Training Accuracy: 25.0565%, Training Loss: nan%
Epoch [60/300], Step [84/225], Training Accuracy: 25.0930%, Training Loss: nan%
Epoch [60/300], Step [85/225], Training Accuracy: 25.1103%, Training Loss: nan%
Epoch [60/300], Step [86/225], Training Accuracy: 25.1453%, Training Loss: nan%
Epoch [60/300], Step [87/225], Training Accuracy: 25.1616%, Training Loss: nan%
Epoch [60/300], Step [88/225], Training 

Epoch [60/300], Step [187/225], Training Accuracy: 25.5765%, Training Loss: nan%
Epoch [60/300], Step [188/225], Training Accuracy: 25.5652%, Training Loss: nan%
Epoch [60/300], Step [189/225], Training Accuracy: 25.5787%, Training Loss: nan%
Epoch [60/300], Step [190/225], Training Accuracy: 25.5592%, Training Loss: nan%
Epoch [60/300], Step [191/225], Training Accuracy: 25.5154%, Training Loss: nan%
Epoch [60/300], Step [192/225], Training Accuracy: 25.4720%, Training Loss: nan%
Epoch [60/300], Step [193/225], Training Accuracy: 25.4534%, Training Loss: nan%
Epoch [60/300], Step [194/225], Training Accuracy: 25.4269%, Training Loss: nan%
Epoch [60/300], Step [195/225], Training Accuracy: 25.3846%, Training Loss: nan%
Epoch [60/300], Step [196/225], Training Accuracy: 25.3667%, Training Loss: nan%
Epoch [60/300], Step [197/225], Training Accuracy: 25.3569%, Training Loss: nan%
Epoch [60/300], Step [198/225], Training Accuracy: 25.3314%, Training Loss: nan%
Epoch [60/300], Step [199/22

Epoch [61/300], Step [77/225], Training Accuracy: 25.0609%, Training Loss: nan%
Epoch [61/300], Step [78/225], Training Accuracy: 25.1402%, Training Loss: nan%
Epoch [61/300], Step [79/225], Training Accuracy: 25.1187%, Training Loss: nan%
Epoch [61/300], Step [80/225], Training Accuracy: 25.1758%, Training Loss: nan%
Epoch [61/300], Step [81/225], Training Accuracy: 25.1157%, Training Loss: nan%
Epoch [61/300], Step [82/225], Training Accuracy: 25.0953%, Training Loss: nan%
Epoch [61/300], Step [83/225], Training Accuracy: 25.0565%, Training Loss: nan%
Epoch [61/300], Step [84/225], Training Accuracy: 25.0930%, Training Loss: nan%
Epoch [61/300], Step [85/225], Training Accuracy: 25.1103%, Training Loss: nan%
Epoch [61/300], Step [86/225], Training Accuracy: 25.1453%, Training Loss: nan%
Epoch [61/300], Step [87/225], Training Accuracy: 25.1616%, Training Loss: nan%
Epoch [61/300], Step [88/225], Training Accuracy: 25.1776%, Training Loss: nan%
Epoch [61/300], Step [89/225], Training 

Epoch [61/300], Step [194/225], Training Accuracy: 25.4269%, Training Loss: nan%
Epoch [61/300], Step [195/225], Training Accuracy: 25.3846%, Training Loss: nan%
Epoch [61/300], Step [196/225], Training Accuracy: 25.3667%, Training Loss: nan%
Epoch [61/300], Step [197/225], Training Accuracy: 25.3569%, Training Loss: nan%
Epoch [61/300], Step [198/225], Training Accuracy: 25.3314%, Training Loss: nan%
Epoch [61/300], Step [199/225], Training Accuracy: 25.3141%, Training Loss: nan%
Epoch [61/300], Step [200/225], Training Accuracy: 25.2734%, Training Loss: nan%
Epoch [61/300], Step [201/225], Training Accuracy: 25.2954%, Training Loss: nan%
Epoch [61/300], Step [202/225], Training Accuracy: 25.2553%, Training Loss: nan%
Epoch [61/300], Step [203/225], Training Accuracy: 25.2771%, Training Loss: nan%
Epoch [61/300], Step [204/225], Training Accuracy: 25.3217%, Training Loss: nan%
Epoch [61/300], Step [205/225], Training Accuracy: 25.2973%, Training Loss: nan%
Epoch [61/300], Step [206/22

Epoch [62/300], Step [82/225], Training Accuracy: 25.0953%, Training Loss: nan%
Epoch [62/300], Step [83/225], Training Accuracy: 25.0565%, Training Loss: nan%
Epoch [62/300], Step [84/225], Training Accuracy: 25.0930%, Training Loss: nan%
Epoch [62/300], Step [85/225], Training Accuracy: 25.1103%, Training Loss: nan%
Epoch [62/300], Step [86/225], Training Accuracy: 25.1453%, Training Loss: nan%
Epoch [62/300], Step [87/225], Training Accuracy: 25.1616%, Training Loss: nan%
Epoch [62/300], Step [88/225], Training Accuracy: 25.1776%, Training Loss: nan%
Epoch [62/300], Step [89/225], Training Accuracy: 25.1580%, Training Loss: nan%
Epoch [62/300], Step [90/225], Training Accuracy: 25.0694%, Training Loss: nan%
Epoch [62/300], Step [91/225], Training Accuracy: 25.1030%, Training Loss: nan%
Epoch [62/300], Step [92/225], Training Accuracy: 25.0510%, Training Loss: nan%
Epoch [62/300], Step [93/225], Training Accuracy: 25.1176%, Training Loss: nan%
Epoch [62/300], Step [94/225], Training 

Epoch [62/300], Step [187/225], Training Accuracy: 25.5765%, Training Loss: nan%
Epoch [62/300], Step [188/225], Training Accuracy: 25.5652%, Training Loss: nan%
Epoch [62/300], Step [189/225], Training Accuracy: 25.5787%, Training Loss: nan%
Epoch [62/300], Step [190/225], Training Accuracy: 25.5592%, Training Loss: nan%
Epoch [62/300], Step [191/225], Training Accuracy: 25.5154%, Training Loss: nan%
Epoch [62/300], Step [192/225], Training Accuracy: 25.4720%, Training Loss: nan%
Epoch [62/300], Step [193/225], Training Accuracy: 25.4534%, Training Loss: nan%
Epoch [62/300], Step [194/225], Training Accuracy: 25.4269%, Training Loss: nan%
Epoch [62/300], Step [195/225], Training Accuracy: 25.3846%, Training Loss: nan%
Epoch [62/300], Step [196/225], Training Accuracy: 25.3667%, Training Loss: nan%
Epoch [62/300], Step [197/225], Training Accuracy: 25.3569%, Training Loss: nan%
Epoch [62/300], Step [198/225], Training Accuracy: 25.3314%, Training Loss: nan%
Epoch [62/300], Step [199/22

Epoch [63/300], Step [72/225], Training Accuracy: 25.1519%, Training Loss: nan%
Epoch [63/300], Step [73/225], Training Accuracy: 25.0856%, Training Loss: nan%
Epoch [63/300], Step [74/225], Training Accuracy: 25.0845%, Training Loss: nan%
Epoch [63/300], Step [75/225], Training Accuracy: 25.0833%, Training Loss: nan%
Epoch [63/300], Step [76/225], Training Accuracy: 25.1439%, Training Loss: nan%
Epoch [63/300], Step [77/225], Training Accuracy: 25.0609%, Training Loss: nan%
Epoch [63/300], Step [78/225], Training Accuracy: 25.1402%, Training Loss: nan%
Epoch [63/300], Step [79/225], Training Accuracy: 25.1187%, Training Loss: nan%
Epoch [63/300], Step [80/225], Training Accuracy: 25.1758%, Training Loss: nan%
Epoch [63/300], Step [81/225], Training Accuracy: 25.1157%, Training Loss: nan%
Epoch [63/300], Step [82/225], Training Accuracy: 25.0953%, Training Loss: nan%
Epoch [63/300], Step [83/225], Training Accuracy: 25.0565%, Training Loss: nan%
Epoch [63/300], Step [84/225], Training 

Epoch [63/300], Step [186/225], Training Accuracy: 25.6048%, Training Loss: nan%
Epoch [63/300], Step [187/225], Training Accuracy: 25.5765%, Training Loss: nan%
Epoch [63/300], Step [188/225], Training Accuracy: 25.5652%, Training Loss: nan%
Epoch [63/300], Step [189/225], Training Accuracy: 25.5787%, Training Loss: nan%
Epoch [63/300], Step [190/225], Training Accuracy: 25.5592%, Training Loss: nan%
Epoch [63/300], Step [191/225], Training Accuracy: 25.5154%, Training Loss: nan%
Epoch [63/300], Step [192/225], Training Accuracy: 25.4720%, Training Loss: nan%
Epoch [63/300], Step [193/225], Training Accuracy: 25.4534%, Training Loss: nan%
Epoch [63/300], Step [194/225], Training Accuracy: 25.4269%, Training Loss: nan%
Epoch [63/300], Step [195/225], Training Accuracy: 25.3846%, Training Loss: nan%
Epoch [63/300], Step [196/225], Training Accuracy: 25.3667%, Training Loss: nan%
Epoch [63/300], Step [197/225], Training Accuracy: 25.3569%, Training Loss: nan%
Epoch [63/300], Step [198/22

Epoch [64/300], Step [78/225], Training Accuracy: 25.1402%, Training Loss: nan%
Epoch [64/300], Step [79/225], Training Accuracy: 25.1187%, Training Loss: nan%
Epoch [64/300], Step [80/225], Training Accuracy: 25.1758%, Training Loss: nan%
Epoch [64/300], Step [81/225], Training Accuracy: 25.1157%, Training Loss: nan%
Epoch [64/300], Step [82/225], Training Accuracy: 25.0953%, Training Loss: nan%
Epoch [64/300], Step [83/225], Training Accuracy: 25.0565%, Training Loss: nan%
Epoch [64/300], Step [84/225], Training Accuracy: 25.0930%, Training Loss: nan%
Epoch [64/300], Step [85/225], Training Accuracy: 25.1103%, Training Loss: nan%
Epoch [64/300], Step [86/225], Training Accuracy: 25.1453%, Training Loss: nan%
Epoch [64/300], Step [87/225], Training Accuracy: 25.1616%, Training Loss: nan%
Epoch [64/300], Step [88/225], Training Accuracy: 25.1776%, Training Loss: nan%
Epoch [64/300], Step [89/225], Training Accuracy: 25.1580%, Training Loss: nan%
Epoch [64/300], Step [90/225], Training 

Epoch [64/300], Step [187/225], Training Accuracy: 25.5765%, Training Loss: nan%
Epoch [64/300], Step [188/225], Training Accuracy: 25.5652%, Training Loss: nan%
Epoch [64/300], Step [189/225], Training Accuracy: 25.5787%, Training Loss: nan%
Epoch [64/300], Step [190/225], Training Accuracy: 25.5592%, Training Loss: nan%
Epoch [64/300], Step [191/225], Training Accuracy: 25.5154%, Training Loss: nan%
Epoch [64/300], Step [192/225], Training Accuracy: 25.4720%, Training Loss: nan%
Epoch [64/300], Step [193/225], Training Accuracy: 25.4534%, Training Loss: nan%
Epoch [64/300], Step [194/225], Training Accuracy: 25.4269%, Training Loss: nan%
Epoch [64/300], Step [195/225], Training Accuracy: 25.3846%, Training Loss: nan%
Epoch [64/300], Step [196/225], Training Accuracy: 25.3667%, Training Loss: nan%
Epoch [64/300], Step [197/225], Training Accuracy: 25.3569%, Training Loss: nan%
Epoch [64/300], Step [198/225], Training Accuracy: 25.3314%, Training Loss: nan%
Epoch [64/300], Step [199/22

Epoch [65/300], Step [65/225], Training Accuracy: 25.1202%, Training Loss: nan%
Epoch [65/300], Step [66/225], Training Accuracy: 25.0947%, Training Loss: nan%
Epoch [65/300], Step [67/225], Training Accuracy: 25.1632%, Training Loss: nan%
Epoch [65/300], Step [68/225], Training Accuracy: 25.2528%, Training Loss: nan%
Epoch [65/300], Step [69/225], Training Accuracy: 25.1812%, Training Loss: nan%
Epoch [65/300], Step [70/225], Training Accuracy: 25.2009%, Training Loss: nan%
Epoch [65/300], Step [71/225], Training Accuracy: 25.1981%, Training Loss: nan%
Epoch [65/300], Step [72/225], Training Accuracy: 25.1519%, Training Loss: nan%
Epoch [65/300], Step [73/225], Training Accuracy: 25.0856%, Training Loss: nan%
Epoch [65/300], Step [74/225], Training Accuracy: 25.0845%, Training Loss: nan%
Epoch [65/300], Step [75/225], Training Accuracy: 25.0833%, Training Loss: nan%
Epoch [65/300], Step [76/225], Training Accuracy: 25.1439%, Training Loss: nan%
Epoch [65/300], Step [77/225], Training 

Epoch [65/300], Step [183/225], Training Accuracy: 25.6660%, Training Loss: nan%
Epoch [65/300], Step [184/225], Training Accuracy: 25.6284%, Training Loss: nan%
Epoch [65/300], Step [185/225], Training Accuracy: 25.6081%, Training Loss: nan%
Epoch [65/300], Step [186/225], Training Accuracy: 25.6048%, Training Loss: nan%
Epoch [65/300], Step [187/225], Training Accuracy: 25.5765%, Training Loss: nan%
Epoch [65/300], Step [188/225], Training Accuracy: 25.5652%, Training Loss: nan%
Epoch [65/300], Step [189/225], Training Accuracy: 25.5787%, Training Loss: nan%
Epoch [65/300], Step [190/225], Training Accuracy: 25.5592%, Training Loss: nan%
Epoch [65/300], Step [191/225], Training Accuracy: 25.5154%, Training Loss: nan%
Epoch [65/300], Step [192/225], Training Accuracy: 25.4720%, Training Loss: nan%
Epoch [65/300], Step [193/225], Training Accuracy: 25.4534%, Training Loss: nan%
Epoch [65/300], Step [194/225], Training Accuracy: 25.4269%, Training Loss: nan%
Epoch [65/300], Step [195/22

Epoch [66/300], Step [67/225], Training Accuracy: 25.1632%, Training Loss: nan%
Epoch [66/300], Step [68/225], Training Accuracy: 25.2528%, Training Loss: nan%
Epoch [66/300], Step [69/225], Training Accuracy: 25.1812%, Training Loss: nan%
Epoch [66/300], Step [70/225], Training Accuracy: 25.2009%, Training Loss: nan%
Epoch [66/300], Step [71/225], Training Accuracy: 25.1981%, Training Loss: nan%
Epoch [66/300], Step [72/225], Training Accuracy: 25.1519%, Training Loss: nan%
Epoch [66/300], Step [73/225], Training Accuracy: 25.0856%, Training Loss: nan%
Epoch [66/300], Step [74/225], Training Accuracy: 25.0845%, Training Loss: nan%
Epoch [66/300], Step [75/225], Training Accuracy: 25.0833%, Training Loss: nan%
Epoch [66/300], Step [76/225], Training Accuracy: 25.1439%, Training Loss: nan%
Epoch [66/300], Step [77/225], Training Accuracy: 25.0609%, Training Loss: nan%
Epoch [66/300], Step [78/225], Training Accuracy: 25.1402%, Training Loss: nan%
Epoch [66/300], Step [79/225], Training 

Epoch [66/300], Step [173/225], Training Accuracy: 25.6774%, Training Loss: nan%
Epoch [66/300], Step [174/225], Training Accuracy: 25.7004%, Training Loss: nan%
Epoch [66/300], Step [175/225], Training Accuracy: 25.7321%, Training Loss: nan%
Epoch [66/300], Step [176/225], Training Accuracy: 25.7369%, Training Loss: nan%
Epoch [66/300], Step [177/225], Training Accuracy: 25.7504%, Training Loss: nan%
Epoch [66/300], Step [178/225], Training Accuracy: 25.7549%, Training Loss: nan%
Epoch [66/300], Step [179/225], Training Accuracy: 25.7332%, Training Loss: nan%
Epoch [66/300], Step [180/225], Training Accuracy: 25.6944%, Training Loss: nan%
Epoch [66/300], Step [181/225], Training Accuracy: 25.6733%, Training Loss: nan%
Epoch [66/300], Step [182/225], Training Accuracy: 25.6439%, Training Loss: nan%
Epoch [66/300], Step [183/225], Training Accuracy: 25.6660%, Training Loss: nan%
Epoch [66/300], Step [184/225], Training Accuracy: 25.6284%, Training Loss: nan%
Epoch [66/300], Step [185/22

Epoch [67/300], Step [56/225], Training Accuracy: 24.8047%, Training Loss: nan%
Epoch [67/300], Step [57/225], Training Accuracy: 24.6436%, Training Loss: nan%
Epoch [67/300], Step [58/225], Training Accuracy: 24.6767%, Training Loss: nan%
Epoch [67/300], Step [59/225], Training Accuracy: 24.9206%, Training Loss: nan%
Epoch [67/300], Step [60/225], Training Accuracy: 24.9219%, Training Loss: nan%
Epoch [67/300], Step [61/225], Training Accuracy: 24.9232%, Training Loss: nan%
Epoch [67/300], Step [62/225], Training Accuracy: 25.0756%, Training Loss: nan%
Epoch [67/300], Step [63/225], Training Accuracy: 25.1984%, Training Loss: nan%
Epoch [67/300], Step [64/225], Training Accuracy: 25.0732%, Training Loss: nan%
Epoch [67/300], Step [65/225], Training Accuracy: 25.1202%, Training Loss: nan%
Epoch [67/300], Step [66/225], Training Accuracy: 25.0947%, Training Loss: nan%
Epoch [67/300], Step [67/225], Training Accuracy: 25.1632%, Training Loss: nan%
Epoch [67/300], Step [68/225], Training 

Epoch [67/300], Step [167/225], Training Accuracy: 25.7391%, Training Loss: nan%
Epoch [67/300], Step [168/225], Training Accuracy: 25.7254%, Training Loss: nan%
Epoch [67/300], Step [169/225], Training Accuracy: 25.6379%, Training Loss: nan%
Epoch [67/300], Step [170/225], Training Accuracy: 25.6250%, Training Loss: nan%
Epoch [67/300], Step [171/225], Training Accuracy: 25.6488%, Training Loss: nan%
Epoch [67/300], Step [172/225], Training Accuracy: 25.6541%, Training Loss: nan%
Epoch [67/300], Step [173/225], Training Accuracy: 25.6774%, Training Loss: nan%
Epoch [67/300], Step [174/225], Training Accuracy: 25.7004%, Training Loss: nan%
Epoch [67/300], Step [175/225], Training Accuracy: 25.7321%, Training Loss: nan%
Epoch [67/300], Step [176/225], Training Accuracy: 25.7369%, Training Loss: nan%
Epoch [67/300], Step [177/225], Training Accuracy: 25.7504%, Training Loss: nan%
Epoch [67/300], Step [178/225], Training Accuracy: 25.7549%, Training Loss: nan%
Epoch [67/300], Step [179/22

Epoch [68/300], Step [54/225], Training Accuracy: 24.5370%, Training Loss: nan%
Epoch [68/300], Step [55/225], Training Accuracy: 24.6307%, Training Loss: nan%
Epoch [68/300], Step [56/225], Training Accuracy: 24.8047%, Training Loss: nan%
Epoch [68/300], Step [57/225], Training Accuracy: 24.6436%, Training Loss: nan%
Epoch [68/300], Step [58/225], Training Accuracy: 24.6767%, Training Loss: nan%
Epoch [68/300], Step [59/225], Training Accuracy: 24.9206%, Training Loss: nan%
Epoch [68/300], Step [60/225], Training Accuracy: 24.9219%, Training Loss: nan%
Epoch [68/300], Step [61/225], Training Accuracy: 24.9232%, Training Loss: nan%
Epoch [68/300], Step [62/225], Training Accuracy: 25.0756%, Training Loss: nan%
Epoch [68/300], Step [63/225], Training Accuracy: 25.1984%, Training Loss: nan%
Epoch [68/300], Step [64/225], Training Accuracy: 25.0732%, Training Loss: nan%
Epoch [68/300], Step [65/225], Training Accuracy: 25.1202%, Training Loss: nan%
Epoch [68/300], Step [66/225], Training 

Epoch [68/300], Step [165/225], Training Accuracy: 25.7197%, Training Loss: nan%
Epoch [68/300], Step [166/225], Training Accuracy: 25.7154%, Training Loss: nan%
Epoch [68/300], Step [167/225], Training Accuracy: 25.7391%, Training Loss: nan%
Epoch [68/300], Step [168/225], Training Accuracy: 25.7254%, Training Loss: nan%
Epoch [68/300], Step [169/225], Training Accuracy: 25.6379%, Training Loss: nan%
Epoch [68/300], Step [170/225], Training Accuracy: 25.6250%, Training Loss: nan%
Epoch [68/300], Step [171/225], Training Accuracy: 25.6488%, Training Loss: nan%
Epoch [68/300], Step [172/225], Training Accuracy: 25.6541%, Training Loss: nan%
Epoch [68/300], Step [173/225], Training Accuracy: 25.6774%, Training Loss: nan%
Epoch [68/300], Step [174/225], Training Accuracy: 25.7004%, Training Loss: nan%
Epoch [68/300], Step [175/225], Training Accuracy: 25.7321%, Training Loss: nan%
Epoch [68/300], Step [176/225], Training Accuracy: 25.7369%, Training Loss: nan%
Epoch [68/300], Step [177/22

Epoch [69/300], Step [52/225], Training Accuracy: 24.6995%, Training Loss: nan%
Epoch [69/300], Step [53/225], Training Accuracy: 24.6462%, Training Loss: nan%
Epoch [69/300], Step [54/225], Training Accuracy: 24.5370%, Training Loss: nan%
Epoch [69/300], Step [55/225], Training Accuracy: 24.6307%, Training Loss: nan%
Epoch [69/300], Step [56/225], Training Accuracy: 24.8047%, Training Loss: nan%
Epoch [69/300], Step [57/225], Training Accuracy: 24.6436%, Training Loss: nan%
Epoch [69/300], Step [58/225], Training Accuracy: 24.6767%, Training Loss: nan%
Epoch [69/300], Step [59/225], Training Accuracy: 24.9206%, Training Loss: nan%
Epoch [69/300], Step [60/225], Training Accuracy: 24.9219%, Training Loss: nan%
Epoch [69/300], Step [61/225], Training Accuracy: 24.9232%, Training Loss: nan%
Epoch [69/300], Step [62/225], Training Accuracy: 25.0756%, Training Loss: nan%
Epoch [69/300], Step [63/225], Training Accuracy: 25.1984%, Training Loss: nan%
Epoch [69/300], Step [64/225], Training 

Epoch [69/300], Step [162/225], Training Accuracy: 25.7427%, Training Loss: nan%
Epoch [69/300], Step [163/225], Training Accuracy: 25.8148%, Training Loss: nan%
Epoch [69/300], Step [164/225], Training Accuracy: 25.7527%, Training Loss: nan%
Epoch [69/300], Step [165/225], Training Accuracy: 25.7197%, Training Loss: nan%
Epoch [69/300], Step [166/225], Training Accuracy: 25.7154%, Training Loss: nan%
Epoch [69/300], Step [167/225], Training Accuracy: 25.7391%, Training Loss: nan%
Epoch [69/300], Step [168/225], Training Accuracy: 25.7254%, Training Loss: nan%
Epoch [69/300], Step [169/225], Training Accuracy: 25.6379%, Training Loss: nan%
Epoch [69/300], Step [170/225], Training Accuracy: 25.6250%, Training Loss: nan%
Epoch [69/300], Step [171/225], Training Accuracy: 25.6488%, Training Loss: nan%
Epoch [69/300], Step [172/225], Training Accuracy: 25.6541%, Training Loss: nan%
Epoch [69/300], Step [173/225], Training Accuracy: 25.6774%, Training Loss: nan%
Epoch [69/300], Step [174/22

Epoch [70/300], Step [54/225], Training Accuracy: 24.5370%, Training Loss: nan%
Epoch [70/300], Step [55/225], Training Accuracy: 24.6307%, Training Loss: nan%
Epoch [70/300], Step [56/225], Training Accuracy: 24.8047%, Training Loss: nan%
Epoch [70/300], Step [57/225], Training Accuracy: 24.6436%, Training Loss: nan%
Epoch [70/300], Step [58/225], Training Accuracy: 24.6767%, Training Loss: nan%
Epoch [70/300], Step [59/225], Training Accuracy: 24.9206%, Training Loss: nan%
Epoch [70/300], Step [60/225], Training Accuracy: 24.9219%, Training Loss: nan%
Epoch [70/300], Step [61/225], Training Accuracy: 24.9232%, Training Loss: nan%
Epoch [70/300], Step [62/225], Training Accuracy: 25.0756%, Training Loss: nan%
Epoch [70/300], Step [63/225], Training Accuracy: 25.1984%, Training Loss: nan%
Epoch [70/300], Step [64/225], Training Accuracy: 25.0732%, Training Loss: nan%
Epoch [70/300], Step [65/225], Training Accuracy: 25.1202%, Training Loss: nan%
Epoch [70/300], Step [66/225], Training 

Epoch [70/300], Step [167/225], Training Accuracy: 25.7391%, Training Loss: nan%
Epoch [70/300], Step [168/225], Training Accuracy: 25.7254%, Training Loss: nan%
Epoch [70/300], Step [169/225], Training Accuracy: 25.6379%, Training Loss: nan%
Epoch [70/300], Step [170/225], Training Accuracy: 25.6250%, Training Loss: nan%
Epoch [70/300], Step [171/225], Training Accuracy: 25.6488%, Training Loss: nan%
Epoch [70/300], Step [172/225], Training Accuracy: 25.6541%, Training Loss: nan%
Epoch [70/300], Step [173/225], Training Accuracy: 25.6774%, Training Loss: nan%
Epoch [70/300], Step [174/225], Training Accuracy: 25.7004%, Training Loss: nan%
Epoch [70/300], Step [175/225], Training Accuracy: 25.7321%, Training Loss: nan%
Epoch [70/300], Step [176/225], Training Accuracy: 25.7369%, Training Loss: nan%
Epoch [70/300], Step [177/225], Training Accuracy: 25.7504%, Training Loss: nan%
Epoch [70/300], Step [178/225], Training Accuracy: 25.7549%, Training Loss: nan%
Epoch [70/300], Step [179/22

Epoch [71/300], Step [57/225], Training Accuracy: 24.6436%, Training Loss: nan%
Epoch [71/300], Step [58/225], Training Accuracy: 24.6767%, Training Loss: nan%
Epoch [71/300], Step [59/225], Training Accuracy: 24.9206%, Training Loss: nan%
Epoch [71/300], Step [60/225], Training Accuracy: 24.9219%, Training Loss: nan%
Epoch [71/300], Step [61/225], Training Accuracy: 24.9232%, Training Loss: nan%
Epoch [71/300], Step [62/225], Training Accuracy: 25.0756%, Training Loss: nan%
Epoch [71/300], Step [63/225], Training Accuracy: 25.1984%, Training Loss: nan%
Epoch [71/300], Step [64/225], Training Accuracy: 25.0732%, Training Loss: nan%
Epoch [71/300], Step [65/225], Training Accuracy: 25.1202%, Training Loss: nan%
Epoch [71/300], Step [66/225], Training Accuracy: 25.0947%, Training Loss: nan%
Epoch [71/300], Step [67/225], Training Accuracy: 25.1632%, Training Loss: nan%
Epoch [71/300], Step [68/225], Training Accuracy: 25.2528%, Training Loss: nan%
Epoch [71/300], Step [69/225], Training 

Epoch [71/300], Step [168/225], Training Accuracy: 25.7254%, Training Loss: nan%
Epoch [71/300], Step [169/225], Training Accuracy: 25.6379%, Training Loss: nan%
Epoch [71/300], Step [170/225], Training Accuracy: 25.6250%, Training Loss: nan%
Epoch [71/300], Step [171/225], Training Accuracy: 25.6488%, Training Loss: nan%
Epoch [71/300], Step [172/225], Training Accuracy: 25.6541%, Training Loss: nan%
Epoch [71/300], Step [173/225], Training Accuracy: 25.6774%, Training Loss: nan%
Epoch [71/300], Step [174/225], Training Accuracy: 25.7004%, Training Loss: nan%
Epoch [71/300], Step [175/225], Training Accuracy: 25.7321%, Training Loss: nan%
Epoch [71/300], Step [176/225], Training Accuracy: 25.7369%, Training Loss: nan%
Epoch [71/300], Step [177/225], Training Accuracy: 25.7504%, Training Loss: nan%
Epoch [71/300], Step [178/225], Training Accuracy: 25.7549%, Training Loss: nan%
Epoch [71/300], Step [179/225], Training Accuracy: 25.7332%, Training Loss: nan%
Epoch [71/300], Step [180/22

Epoch [72/300], Step [53/225], Training Accuracy: 24.6462%, Training Loss: nan%
Epoch [72/300], Step [54/225], Training Accuracy: 24.5370%, Training Loss: nan%
Epoch [72/300], Step [55/225], Training Accuracy: 24.6307%, Training Loss: nan%
Epoch [72/300], Step [56/225], Training Accuracy: 24.8047%, Training Loss: nan%
Epoch [72/300], Step [57/225], Training Accuracy: 24.6436%, Training Loss: nan%
Epoch [72/300], Step [58/225], Training Accuracy: 24.6767%, Training Loss: nan%
Epoch [72/300], Step [59/225], Training Accuracy: 24.9206%, Training Loss: nan%
Epoch [72/300], Step [60/225], Training Accuracy: 24.9219%, Training Loss: nan%
Epoch [72/300], Step [61/225], Training Accuracy: 24.9232%, Training Loss: nan%
Epoch [72/300], Step [62/225], Training Accuracy: 25.0756%, Training Loss: nan%
Epoch [72/300], Step [63/225], Training Accuracy: 25.1984%, Training Loss: nan%
Epoch [72/300], Step [64/225], Training Accuracy: 25.0732%, Training Loss: nan%
Epoch [72/300], Step [65/225], Training 

Epoch [72/300], Step [170/225], Training Accuracy: 25.6250%, Training Loss: nan%
Epoch [72/300], Step [171/225], Training Accuracy: 25.6488%, Training Loss: nan%
Epoch [72/300], Step [172/225], Training Accuracy: 25.6541%, Training Loss: nan%
Epoch [72/300], Step [173/225], Training Accuracy: 25.6774%, Training Loss: nan%
Epoch [72/300], Step [174/225], Training Accuracy: 25.7004%, Training Loss: nan%
Epoch [72/300], Step [175/225], Training Accuracy: 25.7321%, Training Loss: nan%
Epoch [72/300], Step [176/225], Training Accuracy: 25.7369%, Training Loss: nan%
Epoch [72/300], Step [177/225], Training Accuracy: 25.7504%, Training Loss: nan%
Epoch [72/300], Step [178/225], Training Accuracy: 25.7549%, Training Loss: nan%
Epoch [72/300], Step [179/225], Training Accuracy: 25.7332%, Training Loss: nan%
Epoch [72/300], Step [180/225], Training Accuracy: 25.6944%, Training Loss: nan%
Epoch [72/300], Step [181/225], Training Accuracy: 25.6733%, Training Loss: nan%
Epoch [72/300], Step [182/22

Epoch [73/300], Step [62/225], Training Accuracy: 25.0756%, Training Loss: nan%
Epoch [73/300], Step [63/225], Training Accuracy: 25.1984%, Training Loss: nan%
Epoch [73/300], Step [64/225], Training Accuracy: 25.0732%, Training Loss: nan%
Epoch [73/300], Step [65/225], Training Accuracy: 25.1202%, Training Loss: nan%
Epoch [73/300], Step [66/225], Training Accuracy: 25.0947%, Training Loss: nan%
Epoch [73/300], Step [67/225], Training Accuracy: 25.1632%, Training Loss: nan%
Epoch [73/300], Step [68/225], Training Accuracy: 25.2528%, Training Loss: nan%
Epoch [73/300], Step [69/225], Training Accuracy: 25.1812%, Training Loss: nan%
Epoch [73/300], Step [70/225], Training Accuracy: 25.2009%, Training Loss: nan%
Epoch [73/300], Step [71/225], Training Accuracy: 25.1981%, Training Loss: nan%
Epoch [73/300], Step [72/225], Training Accuracy: 25.1519%, Training Loss: nan%
Epoch [73/300], Step [73/225], Training Accuracy: 25.0856%, Training Loss: nan%
Epoch [73/300], Step [74/225], Training 

Epoch [73/300], Step [175/225], Training Accuracy: 25.7321%, Training Loss: nan%
Epoch [73/300], Step [176/225], Training Accuracy: 25.7369%, Training Loss: nan%
Epoch [73/300], Step [177/225], Training Accuracy: 25.7504%, Training Loss: nan%
Epoch [73/300], Step [178/225], Training Accuracy: 25.7549%, Training Loss: nan%
Epoch [73/300], Step [179/225], Training Accuracy: 25.7332%, Training Loss: nan%
Epoch [73/300], Step [180/225], Training Accuracy: 25.6944%, Training Loss: nan%
Epoch [73/300], Step [181/225], Training Accuracy: 25.6733%, Training Loss: nan%
Epoch [73/300], Step [182/225], Training Accuracy: 25.6439%, Training Loss: nan%
Epoch [73/300], Step [183/225], Training Accuracy: 25.6660%, Training Loss: nan%
Epoch [73/300], Step [184/225], Training Accuracy: 25.6284%, Training Loss: nan%
Epoch [73/300], Step [185/225], Training Accuracy: 25.6081%, Training Loss: nan%
Epoch [73/300], Step [186/225], Training Accuracy: 25.6048%, Training Loss: nan%
Epoch [73/300], Step [187/22

Epoch [74/300], Step [60/225], Training Accuracy: 24.9219%, Training Loss: nan%
Epoch [74/300], Step [61/225], Training Accuracy: 24.9232%, Training Loss: nan%
Epoch [74/300], Step [62/225], Training Accuracy: 25.0756%, Training Loss: nan%
Epoch [74/300], Step [63/225], Training Accuracy: 25.1984%, Training Loss: nan%
Epoch [74/300], Step [64/225], Training Accuracy: 25.0732%, Training Loss: nan%
Epoch [74/300], Step [65/225], Training Accuracy: 25.1202%, Training Loss: nan%
Epoch [74/300], Step [66/225], Training Accuracy: 25.0947%, Training Loss: nan%
Epoch [74/300], Step [67/225], Training Accuracy: 25.1632%, Training Loss: nan%
Epoch [74/300], Step [68/225], Training Accuracy: 25.2528%, Training Loss: nan%
Epoch [74/300], Step [69/225], Training Accuracy: 25.1812%, Training Loss: nan%
Epoch [74/300], Step [70/225], Training Accuracy: 25.2009%, Training Loss: nan%
Epoch [74/300], Step [71/225], Training Accuracy: 25.1981%, Training Loss: nan%
Epoch [74/300], Step [72/225], Training 

Epoch [74/300], Step [164/225], Training Accuracy: 25.7527%, Training Loss: nan%
Epoch [74/300], Step [165/225], Training Accuracy: 25.7197%, Training Loss: nan%
Epoch [74/300], Step [166/225], Training Accuracy: 25.7154%, Training Loss: nan%
Epoch [74/300], Step [167/225], Training Accuracy: 25.7391%, Training Loss: nan%
Epoch [74/300], Step [168/225], Training Accuracy: 25.7254%, Training Loss: nan%
Epoch [74/300], Step [169/225], Training Accuracy: 25.6379%, Training Loss: nan%
Epoch [74/300], Step [170/225], Training Accuracy: 25.6250%, Training Loss: nan%
Epoch [74/300], Step [171/225], Training Accuracy: 25.6488%, Training Loss: nan%
Epoch [74/300], Step [172/225], Training Accuracy: 25.6541%, Training Loss: nan%
Epoch [74/300], Step [173/225], Training Accuracy: 25.6774%, Training Loss: nan%
Epoch [74/300], Step [174/225], Training Accuracy: 25.7004%, Training Loss: nan%
Epoch [74/300], Step [175/225], Training Accuracy: 25.7321%, Training Loss: nan%
Epoch [74/300], Step [176/22

Epoch [75/300], Step [56/225], Training Accuracy: 24.8047%, Training Loss: nan%
Epoch [75/300], Step [57/225], Training Accuracy: 24.6436%, Training Loss: nan%
Epoch [75/300], Step [58/225], Training Accuracy: 24.6767%, Training Loss: nan%
Epoch [75/300], Step [59/225], Training Accuracy: 24.9206%, Training Loss: nan%
Epoch [75/300], Step [60/225], Training Accuracy: 24.9219%, Training Loss: nan%
Epoch [75/300], Step [61/225], Training Accuracy: 24.9232%, Training Loss: nan%
Epoch [75/300], Step [62/225], Training Accuracy: 25.0756%, Training Loss: nan%
Epoch [75/300], Step [63/225], Training Accuracy: 25.1984%, Training Loss: nan%
Epoch [75/300], Step [64/225], Training Accuracy: 25.0732%, Training Loss: nan%
Epoch [75/300], Step [65/225], Training Accuracy: 25.1202%, Training Loss: nan%
Epoch [75/300], Step [66/225], Training Accuracy: 25.0947%, Training Loss: nan%
Epoch [75/300], Step [67/225], Training Accuracy: 25.1632%, Training Loss: nan%
Epoch [75/300], Step [68/225], Training 

Epoch [75/300], Step [168/225], Training Accuracy: 25.7254%, Training Loss: nan%
Epoch [75/300], Step [169/225], Training Accuracy: 25.6379%, Training Loss: nan%
Epoch [75/300], Step [170/225], Training Accuracy: 25.6250%, Training Loss: nan%
Epoch [75/300], Step [171/225], Training Accuracy: 25.6488%, Training Loss: nan%
Epoch [75/300], Step [172/225], Training Accuracy: 25.6541%, Training Loss: nan%
Epoch [75/300], Step [173/225], Training Accuracy: 25.6774%, Training Loss: nan%
Epoch [75/300], Step [174/225], Training Accuracy: 25.7004%, Training Loss: nan%
Epoch [75/300], Step [175/225], Training Accuracy: 25.7321%, Training Loss: nan%
Epoch [75/300], Step [176/225], Training Accuracy: 25.7369%, Training Loss: nan%
Epoch [75/300], Step [177/225], Training Accuracy: 25.7504%, Training Loss: nan%
Epoch [75/300], Step [178/225], Training Accuracy: 25.7549%, Training Loss: nan%
Epoch [75/300], Step [179/225], Training Accuracy: 25.7332%, Training Loss: nan%
Epoch [75/300], Step [180/22

Epoch [76/300], Step [45/225], Training Accuracy: 24.8958%, Training Loss: nan%
Epoch [76/300], Step [46/225], Training Accuracy: 24.7962%, Training Loss: nan%
Epoch [76/300], Step [47/225], Training Accuracy: 24.7340%, Training Loss: nan%
Epoch [76/300], Step [48/225], Training Accuracy: 24.8372%, Training Loss: nan%
Epoch [76/300], Step [49/225], Training Accuracy: 24.6811%, Training Loss: nan%
Epoch [76/300], Step [50/225], Training Accuracy: 24.7812%, Training Loss: nan%
Epoch [76/300], Step [51/225], Training Accuracy: 24.7243%, Training Loss: nan%
Epoch [76/300], Step [52/225], Training Accuracy: 24.6995%, Training Loss: nan%
Epoch [76/300], Step [53/225], Training Accuracy: 24.6462%, Training Loss: nan%
Epoch [76/300], Step [54/225], Training Accuracy: 24.5370%, Training Loss: nan%
Epoch [76/300], Step [55/225], Training Accuracy: 24.6307%, Training Loss: nan%
Epoch [76/300], Step [56/225], Training Accuracy: 24.8047%, Training Loss: nan%
Epoch [76/300], Step [57/225], Training 

Epoch [76/300], Step [150/225], Training Accuracy: 25.6875%, Training Loss: nan%
Epoch [76/300], Step [151/225], Training Accuracy: 25.6933%, Training Loss: nan%
Epoch [76/300], Step [152/225], Training Accuracy: 25.6579%, Training Loss: nan%
Epoch [76/300], Step [153/225], Training Accuracy: 25.6230%, Training Loss: nan%
Epoch [76/300], Step [154/225], Training Accuracy: 25.6595%, Training Loss: nan%
Epoch [76/300], Step [155/225], Training Accuracy: 25.6855%, Training Loss: nan%
Epoch [76/300], Step [156/225], Training Accuracy: 25.7212%, Training Loss: nan%
Epoch [76/300], Step [157/225], Training Accuracy: 25.6568%, Training Loss: nan%
Epoch [76/300], Step [158/225], Training Accuracy: 25.6824%, Training Loss: nan%
Epoch [76/300], Step [159/225], Training Accuracy: 25.7862%, Training Loss: nan%
Epoch [76/300], Step [160/225], Training Accuracy: 25.7910%, Training Loss: nan%
Epoch [76/300], Step [161/225], Training Accuracy: 25.7861%, Training Loss: nan%
Epoch [76/300], Step [162/22

Epoch [77/300], Step [39/225], Training Accuracy: 24.3590%, Training Loss: nan%
Epoch [77/300], Step [40/225], Training Accuracy: 24.5703%, Training Loss: nan%
Epoch [77/300], Step [41/225], Training Accuracy: 24.7332%, Training Loss: nan%
Epoch [77/300], Step [42/225], Training Accuracy: 24.7396%, Training Loss: nan%
Epoch [77/300], Step [43/225], Training Accuracy: 24.9273%, Training Loss: nan%
Epoch [77/300], Step [44/225], Training Accuracy: 24.9290%, Training Loss: nan%
Epoch [77/300], Step [45/225], Training Accuracy: 24.8958%, Training Loss: nan%
Epoch [77/300], Step [46/225], Training Accuracy: 24.7962%, Training Loss: nan%
Epoch [77/300], Step [47/225], Training Accuracy: 24.7340%, Training Loss: nan%
Epoch [77/300], Step [48/225], Training Accuracy: 24.8372%, Training Loss: nan%
Epoch [77/300], Step [49/225], Training Accuracy: 24.6811%, Training Loss: nan%
Epoch [77/300], Step [50/225], Training Accuracy: 24.7812%, Training Loss: nan%
Epoch [77/300], Step [51/225], Training 

Epoch [77/300], Step [148/225], Training Accuracy: 25.6440%, Training Loss: nan%
Epoch [77/300], Step [149/225], Training Accuracy: 25.6816%, Training Loss: nan%
Epoch [77/300], Step [150/225], Training Accuracy: 25.6875%, Training Loss: nan%
Epoch [77/300], Step [151/225], Training Accuracy: 25.6933%, Training Loss: nan%
Epoch [77/300], Step [152/225], Training Accuracy: 25.6579%, Training Loss: nan%
Epoch [77/300], Step [153/225], Training Accuracy: 25.6230%, Training Loss: nan%
Epoch [77/300], Step [154/225], Training Accuracy: 25.6595%, Training Loss: nan%
Epoch [77/300], Step [155/225], Training Accuracy: 25.6855%, Training Loss: nan%
Epoch [77/300], Step [156/225], Training Accuracy: 25.7212%, Training Loss: nan%
Epoch [77/300], Step [157/225], Training Accuracy: 25.6568%, Training Loss: nan%
Epoch [77/300], Step [158/225], Training Accuracy: 25.6824%, Training Loss: nan%
Epoch [77/300], Step [159/225], Training Accuracy: 25.7862%, Training Loss: nan%
Epoch [77/300], Step [160/22

Epoch [78/300], Step [32/225], Training Accuracy: 24.7559%, Training Loss: nan%
Epoch [78/300], Step [33/225], Training Accuracy: 24.7159%, Training Loss: nan%
Epoch [78/300], Step [34/225], Training Accuracy: 24.5864%, Training Loss: nan%
Epoch [78/300], Step [35/225], Training Accuracy: 24.5982%, Training Loss: nan%
Epoch [78/300], Step [36/225], Training Accuracy: 24.6528%, Training Loss: nan%
Epoch [78/300], Step [37/225], Training Accuracy: 24.6622%, Training Loss: nan%
Epoch [78/300], Step [38/225], Training Accuracy: 24.5477%, Training Loss: nan%
Epoch [78/300], Step [39/225], Training Accuracy: 24.3590%, Training Loss: nan%
Epoch [78/300], Step [40/225], Training Accuracy: 24.5703%, Training Loss: nan%
Epoch [78/300], Step [41/225], Training Accuracy: 24.7332%, Training Loss: nan%
Epoch [78/300], Step [42/225], Training Accuracy: 24.7396%, Training Loss: nan%
Epoch [78/300], Step [43/225], Training Accuracy: 24.9273%, Training Loss: nan%
Epoch [78/300], Step [44/225], Training 

Epoch [78/300], Step [146/225], Training Accuracy: 25.6314%, Training Loss: nan%
Epoch [78/300], Step [147/225], Training Accuracy: 25.6590%, Training Loss: nan%
Epoch [78/300], Step [148/225], Training Accuracy: 25.6440%, Training Loss: nan%
Epoch [78/300], Step [149/225], Training Accuracy: 25.6816%, Training Loss: nan%
Epoch [78/300], Step [150/225], Training Accuracy: 25.6875%, Training Loss: nan%
Epoch [78/300], Step [151/225], Training Accuracy: 25.6933%, Training Loss: nan%
Epoch [78/300], Step [152/225], Training Accuracy: 25.6579%, Training Loss: nan%
Epoch [78/300], Step [153/225], Training Accuracy: 25.6230%, Training Loss: nan%
Epoch [78/300], Step [154/225], Training Accuracy: 25.6595%, Training Loss: nan%
Epoch [78/300], Step [155/225], Training Accuracy: 25.6855%, Training Loss: nan%
Epoch [78/300], Step [156/225], Training Accuracy: 25.7212%, Training Loss: nan%
Epoch [78/300], Step [157/225], Training Accuracy: 25.6568%, Training Loss: nan%
Epoch [78/300], Step [158/22

Epoch [79/300], Step [38/225], Training Accuracy: 24.5477%, Training Loss: nan%
Epoch [79/300], Step [39/225], Training Accuracy: 24.3590%, Training Loss: nan%
Epoch [79/300], Step [40/225], Training Accuracy: 24.5703%, Training Loss: nan%
Epoch [79/300], Step [41/225], Training Accuracy: 24.7332%, Training Loss: nan%
Epoch [79/300], Step [42/225], Training Accuracy: 24.7396%, Training Loss: nan%
Epoch [79/300], Step [43/225], Training Accuracy: 24.9273%, Training Loss: nan%
Epoch [79/300], Step [44/225], Training Accuracy: 24.9290%, Training Loss: nan%
Epoch [79/300], Step [45/225], Training Accuracy: 24.8958%, Training Loss: nan%
Epoch [79/300], Step [46/225], Training Accuracy: 24.7962%, Training Loss: nan%
Epoch [79/300], Step [47/225], Training Accuracy: 24.7340%, Training Loss: nan%
Epoch [79/300], Step [48/225], Training Accuracy: 24.8372%, Training Loss: nan%
Epoch [79/300], Step [49/225], Training Accuracy: 24.6811%, Training Loss: nan%
Epoch [79/300], Step [50/225], Training 

Epoch [79/300], Step [146/225], Training Accuracy: 25.6314%, Training Loss: nan%
Epoch [79/300], Step [147/225], Training Accuracy: 25.6590%, Training Loss: nan%
Epoch [79/300], Step [148/225], Training Accuracy: 25.6440%, Training Loss: nan%
Epoch [79/300], Step [149/225], Training Accuracy: 25.6816%, Training Loss: nan%
Epoch [79/300], Step [150/225], Training Accuracy: 25.6875%, Training Loss: nan%
Epoch [79/300], Step [151/225], Training Accuracy: 25.6933%, Training Loss: nan%
Epoch [79/300], Step [152/225], Training Accuracy: 25.6579%, Training Loss: nan%
Epoch [79/300], Step [153/225], Training Accuracy: 25.6230%, Training Loss: nan%
Epoch [79/300], Step [154/225], Training Accuracy: 25.6595%, Training Loss: nan%
Epoch [79/300], Step [155/225], Training Accuracy: 25.6855%, Training Loss: nan%
Epoch [79/300], Step [156/225], Training Accuracy: 25.7212%, Training Loss: nan%
Epoch [79/300], Step [157/225], Training Accuracy: 25.6568%, Training Loss: nan%
Epoch [79/300], Step [158/22

Epoch [80/300], Step [26/225], Training Accuracy: 24.9399%, Training Loss: nan%
Epoch [80/300], Step [27/225], Training Accuracy: 24.7106%, Training Loss: nan%
Epoch [80/300], Step [28/225], Training Accuracy: 24.4978%, Training Loss: nan%
Epoch [80/300], Step [29/225], Training Accuracy: 24.7306%, Training Loss: nan%
Epoch [80/300], Step [30/225], Training Accuracy: 24.8438%, Training Loss: nan%
Epoch [80/300], Step [31/225], Training Accuracy: 24.6976%, Training Loss: nan%
Epoch [80/300], Step [32/225], Training Accuracy: 24.7559%, Training Loss: nan%
Epoch [80/300], Step [33/225], Training Accuracy: 24.7159%, Training Loss: nan%
Epoch [80/300], Step [34/225], Training Accuracy: 24.5864%, Training Loss: nan%
Epoch [80/300], Step [35/225], Training Accuracy: 24.5982%, Training Loss: nan%
Epoch [80/300], Step [36/225], Training Accuracy: 24.6528%, Training Loss: nan%
Epoch [80/300], Step [37/225], Training Accuracy: 24.6622%, Training Loss: nan%
Epoch [80/300], Step [38/225], Training 

Epoch [80/300], Step [144/225], Training Accuracy: 25.5968%, Training Loss: nan%
Epoch [80/300], Step [145/225], Training Accuracy: 25.6142%, Training Loss: nan%
Epoch [80/300], Step [146/225], Training Accuracy: 25.6314%, Training Loss: nan%
Epoch [80/300], Step [147/225], Training Accuracy: 25.6590%, Training Loss: nan%
Epoch [80/300], Step [148/225], Training Accuracy: 25.6440%, Training Loss: nan%
Epoch [80/300], Step [149/225], Training Accuracy: 25.6816%, Training Loss: nan%
Epoch [80/300], Step [150/225], Training Accuracy: 25.6875%, Training Loss: nan%
Epoch [80/300], Step [151/225], Training Accuracy: 25.6933%, Training Loss: nan%
Epoch [80/300], Step [152/225], Training Accuracy: 25.6579%, Training Loss: nan%
Epoch [80/300], Step [153/225], Training Accuracy: 25.6230%, Training Loss: nan%
Epoch [80/300], Step [154/225], Training Accuracy: 25.6595%, Training Loss: nan%
Epoch [80/300], Step [155/225], Training Accuracy: 25.6855%, Training Loss: nan%
Epoch [80/300], Step [156/22

Epoch [81/300], Step [31/225], Training Accuracy: 24.6976%, Training Loss: nan%
Epoch [81/300], Step [32/225], Training Accuracy: 24.7559%, Training Loss: nan%
Epoch [81/300], Step [33/225], Training Accuracy: 24.7159%, Training Loss: nan%
Epoch [81/300], Step [34/225], Training Accuracy: 24.5864%, Training Loss: nan%
Epoch [81/300], Step [35/225], Training Accuracy: 24.5982%, Training Loss: nan%
Epoch [81/300], Step [36/225], Training Accuracy: 24.6528%, Training Loss: nan%
Epoch [81/300], Step [37/225], Training Accuracy: 24.6622%, Training Loss: nan%
Epoch [81/300], Step [38/225], Training Accuracy: 24.5477%, Training Loss: nan%
Epoch [81/300], Step [39/225], Training Accuracy: 24.3590%, Training Loss: nan%
Epoch [81/300], Step [40/225], Training Accuracy: 24.5703%, Training Loss: nan%
Epoch [81/300], Step [41/225], Training Accuracy: 24.7332%, Training Loss: nan%
Epoch [81/300], Step [42/225], Training Accuracy: 24.7396%, Training Loss: nan%
Epoch [81/300], Step [43/225], Training 

Epoch [81/300], Step [143/225], Training Accuracy: 25.6010%, Training Loss: nan%
Epoch [81/300], Step [144/225], Training Accuracy: 25.5968%, Training Loss: nan%
Epoch [81/300], Step [145/225], Training Accuracy: 25.6142%, Training Loss: nan%
Epoch [81/300], Step [146/225], Training Accuracy: 25.6314%, Training Loss: nan%
Epoch [81/300], Step [147/225], Training Accuracy: 25.6590%, Training Loss: nan%
Epoch [81/300], Step [148/225], Training Accuracy: 25.6440%, Training Loss: nan%
Epoch [81/300], Step [149/225], Training Accuracy: 25.6816%, Training Loss: nan%
Epoch [81/300], Step [150/225], Training Accuracy: 25.6875%, Training Loss: nan%
Epoch [81/300], Step [151/225], Training Accuracy: 25.6933%, Training Loss: nan%
Epoch [81/300], Step [152/225], Training Accuracy: 25.6579%, Training Loss: nan%
Epoch [81/300], Step [153/225], Training Accuracy: 25.6230%, Training Loss: nan%
Epoch [81/300], Step [154/225], Training Accuracy: 25.6595%, Training Loss: nan%
Epoch [81/300], Step [155/22

Epoch [82/300], Step [31/225], Training Accuracy: 24.6976%, Training Loss: nan%
Epoch [82/300], Step [32/225], Training Accuracy: 24.7559%, Training Loss: nan%
Epoch [82/300], Step [33/225], Training Accuracy: 24.7159%, Training Loss: nan%
Epoch [82/300], Step [34/225], Training Accuracy: 24.5864%, Training Loss: nan%
Epoch [82/300], Step [35/225], Training Accuracy: 24.5982%, Training Loss: nan%
Epoch [82/300], Step [36/225], Training Accuracy: 24.6528%, Training Loss: nan%
Epoch [82/300], Step [37/225], Training Accuracy: 24.6622%, Training Loss: nan%
Epoch [82/300], Step [38/225], Training Accuracy: 24.5477%, Training Loss: nan%
Epoch [82/300], Step [39/225], Training Accuracy: 24.3590%, Training Loss: nan%
Epoch [82/300], Step [40/225], Training Accuracy: 24.5703%, Training Loss: nan%
Epoch [82/300], Step [41/225], Training Accuracy: 24.7332%, Training Loss: nan%
Epoch [82/300], Step [42/225], Training Accuracy: 24.7396%, Training Loss: nan%
Epoch [82/300], Step [43/225], Training 

Epoch [82/300], Step [146/225], Training Accuracy: 25.6314%, Training Loss: nan%
Epoch [82/300], Step [147/225], Training Accuracy: 25.6590%, Training Loss: nan%
Epoch [82/300], Step [148/225], Training Accuracy: 25.6440%, Training Loss: nan%
Epoch [82/300], Step [149/225], Training Accuracy: 25.6816%, Training Loss: nan%
Epoch [82/300], Step [150/225], Training Accuracy: 25.6875%, Training Loss: nan%
Epoch [82/300], Step [151/225], Training Accuracy: 25.6933%, Training Loss: nan%
Epoch [82/300], Step [152/225], Training Accuracy: 25.6579%, Training Loss: nan%
Epoch [82/300], Step [153/225], Training Accuracy: 25.6230%, Training Loss: nan%
Epoch [82/300], Step [154/225], Training Accuracy: 25.6595%, Training Loss: nan%
Epoch [82/300], Step [155/225], Training Accuracy: 25.6855%, Training Loss: nan%
Epoch [82/300], Step [156/225], Training Accuracy: 25.7212%, Training Loss: nan%
Epoch [82/300], Step [157/225], Training Accuracy: 25.6568%, Training Loss: nan%
Epoch [82/300], Step [158/22

Epoch [83/300], Step [38/225], Training Accuracy: 24.5477%, Training Loss: nan%
Epoch [83/300], Step [39/225], Training Accuracy: 24.3590%, Training Loss: nan%
Epoch [83/300], Step [40/225], Training Accuracy: 24.5703%, Training Loss: nan%
Epoch [83/300], Step [41/225], Training Accuracy: 24.7332%, Training Loss: nan%
Epoch [83/300], Step [42/225], Training Accuracy: 24.7396%, Training Loss: nan%
Epoch [83/300], Step [43/225], Training Accuracy: 24.9273%, Training Loss: nan%
Epoch [83/300], Step [44/225], Training Accuracy: 24.9290%, Training Loss: nan%
Epoch [83/300], Step [45/225], Training Accuracy: 24.8958%, Training Loss: nan%
Epoch [83/300], Step [46/225], Training Accuracy: 24.7962%, Training Loss: nan%
Epoch [83/300], Step [47/225], Training Accuracy: 24.7340%, Training Loss: nan%
Epoch [83/300], Step [48/225], Training Accuracy: 24.8372%, Training Loss: nan%
Epoch [83/300], Step [49/225], Training Accuracy: 24.6811%, Training Loss: nan%
Epoch [83/300], Step [50/225], Training 

Epoch [83/300], Step [152/225], Training Accuracy: 25.6579%, Training Loss: nan%
Epoch [83/300], Step [153/225], Training Accuracy: 25.6230%, Training Loss: nan%
Epoch [83/300], Step [154/225], Training Accuracy: 25.6595%, Training Loss: nan%
Epoch [83/300], Step [155/225], Training Accuracy: 25.6855%, Training Loss: nan%
Epoch [83/300], Step [156/225], Training Accuracy: 25.7212%, Training Loss: nan%
Epoch [83/300], Step [157/225], Training Accuracy: 25.6568%, Training Loss: nan%
Epoch [83/300], Step [158/225], Training Accuracy: 25.6824%, Training Loss: nan%
Epoch [83/300], Step [159/225], Training Accuracy: 25.7862%, Training Loss: nan%
Epoch [83/300], Step [160/225], Training Accuracy: 25.7910%, Training Loss: nan%
Epoch [83/300], Step [161/225], Training Accuracy: 25.7861%, Training Loss: nan%
Epoch [83/300], Step [162/225], Training Accuracy: 25.7427%, Training Loss: nan%
Epoch [83/300], Step [163/225], Training Accuracy: 25.8148%, Training Loss: nan%
Epoch [83/300], Step [164/22

Epoch [84/300], Step [31/225], Training Accuracy: 24.6976%, Training Loss: nan%
Epoch [84/300], Step [32/225], Training Accuracy: 24.7559%, Training Loss: nan%
Epoch [84/300], Step [33/225], Training Accuracy: 24.7159%, Training Loss: nan%
Epoch [84/300], Step [34/225], Training Accuracy: 24.5864%, Training Loss: nan%
Epoch [84/300], Step [35/225], Training Accuracy: 24.5982%, Training Loss: nan%
Epoch [84/300], Step [36/225], Training Accuracy: 24.6528%, Training Loss: nan%
Epoch [84/300], Step [37/225], Training Accuracy: 24.6622%, Training Loss: nan%
Epoch [84/300], Step [38/225], Training Accuracy: 24.5477%, Training Loss: nan%
Epoch [84/300], Step [39/225], Training Accuracy: 24.3590%, Training Loss: nan%
Epoch [84/300], Step [40/225], Training Accuracy: 24.5703%, Training Loss: nan%
Epoch [84/300], Step [41/225], Training Accuracy: 24.7332%, Training Loss: nan%
Epoch [84/300], Step [42/225], Training Accuracy: 24.7396%, Training Loss: nan%
Epoch [84/300], Step [43/225], Training 

Epoch [84/300], Step [147/225], Training Accuracy: 25.6590%, Training Loss: nan%
Epoch [84/300], Step [148/225], Training Accuracy: 25.6440%, Training Loss: nan%
Epoch [84/300], Step [149/225], Training Accuracy: 25.6816%, Training Loss: nan%
Epoch [84/300], Step [150/225], Training Accuracy: 25.6875%, Training Loss: nan%
Epoch [84/300], Step [151/225], Training Accuracy: 25.6933%, Training Loss: nan%
Epoch [84/300], Step [152/225], Training Accuracy: 25.6579%, Training Loss: nan%
Epoch [84/300], Step [153/225], Training Accuracy: 25.6230%, Training Loss: nan%
Epoch [84/300], Step [154/225], Training Accuracy: 25.6595%, Training Loss: nan%
Epoch [84/300], Step [155/225], Training Accuracy: 25.6855%, Training Loss: nan%
Epoch [84/300], Step [156/225], Training Accuracy: 25.7212%, Training Loss: nan%
Epoch [84/300], Step [157/225], Training Accuracy: 25.6568%, Training Loss: nan%
Epoch [84/300], Step [158/225], Training Accuracy: 25.6824%, Training Loss: nan%
Epoch [84/300], Step [159/22

In [None]:

# Test the model
model.eval()  # eval mode (batchnorm uses moving mean/variance instead of mini-batch mean/variance)
with torch.no_grad():
    correct = 0
    total = 0
    for X, Y in test_loader:
        X = X.to(device)
        Y = Y.to(device)
        outputs = model(X)
        _, predicted = torch.max(outputs.data, 1)
        total += Y.size(0)
        correct += (predicted == Y).sum().item()

    print('Test Accuracy : {} %'.format(100 * correct / total))

# Save the model checkpoint
#torch.save(model.state_dict(), 'model.ckpt')