In [1]:
import sys
import torch
import torch.nn as nn
from torch import cuda
from torch.autograd import Variable
from torch.utils.data import DataLoader,Dataset

import torchvision
import torchvision.datasets as dset
import torchvision.transforms as transforms
import torchvision.utils
from PIL import Image

import torch.nn.functional as F

import matplotlib.pyplot as plt
import numpy as np
import random
import torch.optim as optim 

import nibabel as nib
import os
from skimage.transform import resize 
import random
import torch.utils.model_zoo as model_zoo
import torch.nn as nn
import math
import pandas as pd

In [2]:
class AD_2DSlicesData(Dataset):
    """labeled Faces in the Wild dataset."""
    
    def __init__(self, root_dir_1, root_dir_2, root_dir_3, data_file, transform=None, slice = slice):
        """
        Args:
            root_dir (string): Directory of all the images.
            data_file (string): File name of the train/test split file.
            transform (callable, optional): Optional transform to be applied on a sample.
            data_augmentation (boolean): Optional data augmentation.
        """
        self.root_dir_1 = root_dir_1
        self.root_dir_2 = root_dir_2
        self.root_dir_3 = root_dir_3
        self.data_file = data_file
        self.transform = transform
    
    def __len__(self):
        return sum(1 for line in open(self.data_file))
    
    def __getitem__(self, idx):
        df = open(self.data_file)
        lines = df.readlines()
        lst = lines[idx].split()
        num_images=len(lst)-1
        if num_images == 3:
            img_name_1 = lst[0]
            img_name_2 = lst[1]
            img_name_3 = lst[2]
            img_label = lst[3]
            image_path1 = os.path.join(self.root_dir_1, img_name_1)
            image_path2 = os.path.join(self.root_dir_2, img_name_2)
            image_path3 = os.path.join(self.root_dir_3, img_name_3)
            image1 = Image.open(image_path1)
            image2 = Image.open(image_path2)
            image3 = Image.open(image_path3)

           
        elif num_images == 2:
            img_name_1 = lst[0]
            img_name_2 = lst[1]
            img_label = lst[2]
            image_path1 = os.path.join(self.root_dir_1, img_name_1)
            image_path2 = os.path.join(self.root_dir_2, img_name_2)
            image1 = Image.open(image_path1)         
            image2 = Image.open(image_path2)
            image3 = Image.new("RGB", (224, 224), (255, 255, 255))

          
        elif num_images == 1:
            img_name = lst[0]
            img_label = lst[1]
            if img_name[0]=='r':
                image_path = os.path.join(self.root_dir_3, img_name)
                image1 = Image.new("RGB", (224, 224), (255, 255, 255))
                image2 = Image.new("RGB", (224, 224), (255, 255, 255))
                image3 = Image.open(image_path)         

            elif img_name[0]=='F':
                image_path = os.path.join(self.root_dir_1, img_name)
                image1 =  Image.open(image_path)       
                image2 = Image.new("RGB", (224, 224), (255, 255, 255))
                image3 =Image.new("RGB", (224, 224), (255, 255, 255))
            elif img_name[0]=='M':
                image_path = os.path.join(self.root_dir_2, img_name)
                image1 = Image.new("RGB", (224, 224), (255, 255, 255))    
                image2 = Image.open(image_path) 
                image3 = Image.new("RGB", (224, 224), (255, 255, 255))
                    
                
                
        if img_label == 'Normal':
            label = 0
        elif img_label == 'AD':
            label = 2
        elif img_label == 'MCI':
            label = 1
            #image = Image.fromarray(image.astype(np.uint8), 'RGB')
        if self.transform:
            image1 = self.transform(image1)
            image2 = self.transform(image2)
            image3 = self.transform(image3)

        
        sample = {'t1w': image3,'FA':image1, 'MD':image2, 'label': label}
        return sample
    

In [32]:
# Path configuration
TRAINING_PATH = '/home/aidana_massalimova/classifier/agnostic/train_fold1.txt'
TESTING_PATH = '/home/aidana_massalimova/classifier/MD_only/test_fold1_upd.txt'
IMG_PATH_1 = '/home/aidana_massalimova/classifier/agnostic/fold1/train/FA'
IMG_PATH_2 = '/home/aidana_massalimova/classifier/agnostic/fold1/train/MD'
IMG_PATH_3 = '/home/aidana_massalimova/classifier/agnostic/fold1/train/T1w'

IMG_PATH_4 = '/home/aidana_massalimova/classifier/agnostic/fold1/test/FA'
IMG_PATH_5 = '/home/aidana_massalimova/classifier/agnostic/fold1/test/MD'
IMG_PATH_6 = '/home/aidana_massalimova/classifier/agnostic/fold1/test/T1w'


batch_size=16
epochs=200
lr = 1e-3


transforms_train = transforms.Compose([
    transforms.Resize((224,224)),
    transforms.RandomHorizontalFlip(),
    transforms.RandomVerticalFlip(),
    transforms.ToTensor(),
])

transforms_test = transforms.Compose([
    transforms.Resize((224,224)),
    transforms.ToTensor(),
])
dset_train = AD_2DSlicesData(IMG_PATH_1, IMG_PATH_2,IMG_PATH_3,TRAINING_PATH, transforms_train)
dset_test = AD_2DSlicesData(IMG_PATH_4, IMG_PATH_5,IMG_PATH_6, TESTING_PATH, transforms_test)


# Use argument load to distinguish training and testing
train_loader = DataLoader(dset_train,
                          batch_size = batch_size,
                          shuffle = True,
                          num_workers = 4,
                          drop_last = True
                         )

test_loader = DataLoader(dset_test,
                         batch_size = batch_size,
                         shuffle = False,
                         num_workers = 4,
                         drop_last=True
                         )



In [4]:
class ResNet18(nn.Module):

    def __init__(self, out_size):
        super(ResNet18, self).__init__()
        self.resnet18 = torchvision.models.resnet18(pretrained=True)
        num_ftrs = self.resnet18.fc.in_features
        self.resnet18.fc = nn.Sequential(
            nn.Linear(num_ftrs, out_size)
        )

    def forward(self, x):
        x = self.resnet18(x)
        return x
    
class MyEnsemble(nn.Module):
    def __init__(self, modelA, modelB,modelC, nb_classes=3):
        super(MyEnsemble, self).__init__()
        self.modelA = modelA
        self.modelB = modelB
        self.modelC = modelC
        # Remove last linear layer
        self.modelA.module.resnet18.fc = nn.Identity()
        self.modelB.module.resnet18.fc = nn.Identity()
        self.modelC.module.resnet18.fc = nn.Identity()
        # Create new classifier
        self.classifier = nn.Linear(512+512+512, nb_classes)
        
    def forward(self, x1,x2,x3):
        x1 = self.modelA(x1) 
        x2 = self.modelB(x2)
        x3 = self.modelC(x3)
        x = torch.cat((x1, x2, x3), dim=1)   
        x = self.classifier(F.relu(x))
        return x

# Train your separate models
                                                

modelA = ResNet18(out_size=3)
modelB = ResNet18(out_size=3)
modelC = ResNet18(out_size=3)


optimizerA = eval("optim.Adam")(modelA.parameters(), 1e-4)      
optimizerB = eval("optim.Adam")(modelB.parameters(), 1e-4)
optimizerC = eval("optim.Adam")(modelC.parameters(), 1e-4)      

# Freeze these models
for param in modelA.parameters():
    param.requires_grad = False

for param in modelB.parameters():
    param.requires_grad = False

    
for param in modelC.parameters():
    param.requires_grad = False
    
gpu_ids=[11]
cuda='cuda:'+str(gpu_ids[0]) 
device=torch.device(cuda)
#cuda='cuda:0'
modelA = nn.DataParallel(modelA, device_ids=gpu_ids)
modelB = nn.DataParallel(modelB, device_ids=gpu_ids)
modelC = nn.DataParallel(modelC, device_ids=gpu_ids)


modelA.to(device)    
modelB.to(device)    
modelC.to(device)    

checkpointA = torch.load('/home/aidana_massalimova/classifier/t1w_only/model1_upd.pt')
modelA.load_state_dict(checkpointA['model_state_dict'])
optimizerA.load_state_dict(checkpointA['optimizer_state_dict'])

checkpointB = torch.load('/home/aidana_massalimova/classifier/FA_only/model1_upd.pt')
modelB.load_state_dict(checkpointB['model_state_dict'])
optimizerB.load_state_dict(checkpointB['optimizer_state_dict'])

checkpointC = torch.load('/home/aidana_massalimova/classifier/MD_only/model1_upd.pt')
modelC.load_state_dict(checkpointC['model_state_dict'])
optimizerC.load_state_dict(checkpointC['optimizer_state_dict'])
                
# Create ensemble model
model = MyEnsemble(modelA, modelB, modelC)
model = nn.DataParallel(model, device_ids=gpu_ids)
model.to(device)    
criterion = torch.nn.CrossEntropyLoss()
optimizer = eval("optim.Adam")(model.parameters(), lr)

In [5]:
# Training process

last_dev_avg_loss = float("inf")
best_accuracy = float("-inf")
# main training loop
best_accuracy=0
for epoch_i in range(epochs):
    print("At {0}-th epoch.".format(epoch_i))
    train_loss = 0.0
    correct_cnt = 0.0
    model.train()
    for it, train_data in enumerate(train_loader):
        t1w,FA,MD, labels = Variable(train_data['t1w']).to(device), Variable(train_data['FA']).to(device),Variable(train_data['MD']).to(device),Variable(train_data['label']).to(device) 
        integer_encoded = labels.data.cpu().numpy()
        ground_truth = Variable(torch.from_numpy(integer_encoded)).long().to(device)
        train_output = model(t1w,FA,MD)
        train_prob_predict = F.softmax(train_output, dim=1)
        _, predict = train_prob_predict.topk(1)
        loss = criterion(train_output, ground_truth)

        train_loss += loss
        correct_this_batch = (predict.squeeze(1) == ground_truth).sum()
        correct_cnt += correct_this_batch
        accuracy = float(correct_this_batch) / len(ground_truth)
        print("batch {0} training loss is : {1:.5f}".format(it, loss.data))
        print("batch {0} training accuracy is : {1:.5f}".format(it, accuracy))
        optimizer.zero_grad()
        loss.backward()
        optimizer.step()

    train_avg_loss = train_loss / (len(dset_train) / batch_size)
    train_avg_acu = float(correct_cnt) / len(dset_train)
    print("Average training loss is {0:.5f} at the end of epoch {1}".format(train_avg_loss.data, epoch_i))
    print("Average training accuracy is {0:.5f} at the end of epoch {1}".format(train_avg_acu, epoch_i))
    

    # validation -- this is a crude esitmation because there might be some paddings at the end
    dev_loss = 0.0
    correct_cnt = 0.0
    model.eval()
    for it, test_data in enumerate(test_loader):
        with torch.no_grad():
            t1w,FA,MD, labels = Variable(test_data['t1w']).to(device),Variable(test_data['FA']).to(device),Variable(test_data['MD']).to(device), Variable(test_data['label']).to(device) 
            integer_encoded = labels.data.cpu().numpy()
            ground_truth = Variable(torch.from_numpy(integer_encoded)).long().to(device)
    
        test_output = model( t1w,FA,MD)
        test_prob_predict = F.softmax(test_output, dim=1)
        _, predict = test_prob_predict.topk(1)
        loss = criterion(test_output, ground_truth)
        dev_loss += loss
        correct_this_batch = (predict.squeeze(1) == ground_truth).sum()
        correct_cnt += (predict.squeeze(1) == ground_truth).sum()
        accuracy = float(correct_this_batch) / len(ground_truth)
        print("batch {0} dev loss is : {1:.5f}".format(it, loss.data))
        print("batch {0} dev accuracy is : {1:.5f}".format(it, accuracy))

    dev_avg_loss = dev_loss / (len(dset_test) / batch_size)
    dev_avg_acu = float(correct_cnt) / len(dset_test)
    
    print("Average validation loss is {0:.5f} at the end of epoch {1}".format(dev_avg_loss.data, epoch_i))
    print("Average validation accuracy is {0:.5f} at the end of epoch {1}".format(dev_avg_acu, epoch_i))
    if dev_avg_acu>best_accuracy: 
        best_accuracy=dev_avg_acu
        torch.save({ 'epoch': epoch_i,
            'model_state_dict': model.state_dict(),
            'optimizer_state_dict': optimizer.state_dict(),
            'loss': loss}, '/home/aidana_massalimova/classifier/agnostic/model1_upd.pt') # official recommended

    last_dev_avg_loss = dev_avg_loss


At 0-th epoch.
batch 0 training loss is : 0.98042
batch 0 training accuracy is : 0.37500
batch 1 training loss is : 0.76296
batch 1 training accuracy is : 0.56250
batch 2 training loss is : 0.49623
batch 2 training accuracy is : 0.87500
batch 3 training loss is : 0.47038
batch 3 training accuracy is : 0.81250
batch 4 training loss is : 0.18334
batch 4 training accuracy is : 1.00000
batch 5 training loss is : 0.67062
batch 5 training accuracy is : 0.62500
batch 6 training loss is : 0.34389
batch 6 training accuracy is : 0.87500
batch 7 training loss is : 0.16025
batch 7 training accuracy is : 0.93750
batch 8 training loss is : 0.15005
batch 8 training accuracy is : 0.93750
batch 9 training loss is : 0.31900
batch 9 training accuracy is : 0.87500
batch 10 training loss is : 0.14230
batch 10 training accuracy is : 0.93750
batch 11 training loss is : 0.33573
batch 11 training accuracy is : 0.87500
batch 12 training loss is : 0.28799
batch 12 training accuracy is : 0.87500
batch 13 training

batch 111 training loss is : 0.00341
batch 111 training accuracy is : 1.00000
batch 112 training loss is : 0.22859
batch 112 training accuracy is : 0.93750
Average training loss is 0.19507 at the end of epoch 0
Average training accuracy is 0.90445 at the end of epoch 0
batch 0 dev loss is : 0.51851
batch 0 dev accuracy is : 0.68750
batch 1 dev loss is : 0.55285
batch 1 dev accuracy is : 0.75000
batch 2 dev loss is : 0.26949
batch 2 dev accuracy is : 0.81250
batch 3 dev loss is : 0.46090
batch 3 dev accuracy is : 0.81250
batch 4 dev loss is : 0.49499
batch 4 dev accuracy is : 0.75000
batch 5 dev loss is : 0.12836
batch 5 dev accuracy is : 1.00000
batch 6 dev loss is : 0.29792
batch 6 dev accuracy is : 0.87500
batch 7 dev loss is : 0.97116
batch 7 dev accuracy is : 0.68750
batch 8 dev loss is : 0.82065
batch 8 dev accuracy is : 0.62500
batch 9 dev loss is : 0.20819
batch 9 dev accuracy is : 0.93750
batch 10 dev loss is : 0.78288
batch 10 dev accuracy is : 0.75000
batch 11 dev loss is : 0

batch 82 training loss is : 0.00403
batch 82 training accuracy is : 1.00000
batch 83 training loss is : 0.02436
batch 83 training accuracy is : 1.00000
batch 84 training loss is : 0.05821
batch 84 training accuracy is : 1.00000
batch 85 training loss is : 0.58272
batch 85 training accuracy is : 0.87500
batch 86 training loss is : 0.20947
batch 86 training accuracy is : 0.87500
batch 87 training loss is : 0.25475
batch 87 training accuracy is : 0.81250
batch 88 training loss is : 0.10911
batch 88 training accuracy is : 0.93750
batch 89 training loss is : 0.22006
batch 89 training accuracy is : 0.87500
batch 90 training loss is : 0.11124
batch 90 training accuracy is : 0.93750
batch 91 training loss is : 0.12351
batch 91 training accuracy is : 0.93750
batch 92 training loss is : 0.08207
batch 92 training accuracy is : 1.00000
batch 93 training loss is : 0.13915
batch 93 training accuracy is : 0.93750
batch 94 training loss is : 0.10503
batch 94 training accuracy is : 1.00000
batch 95 tra

batch 50 training loss is : 0.12099
batch 50 training accuracy is : 0.93750
batch 51 training loss is : 0.11925
batch 51 training accuracy is : 0.87500
batch 52 training loss is : 0.21040
batch 52 training accuracy is : 0.93750
batch 53 training loss is : 0.30672
batch 53 training accuracy is : 0.87500
batch 54 training loss is : 0.28096
batch 54 training accuracy is : 0.87500
batch 55 training loss is : 0.26093
batch 55 training accuracy is : 0.87500
batch 56 training loss is : 0.31764
batch 56 training accuracy is : 0.87500
batch 57 training loss is : 0.02105
batch 57 training accuracy is : 1.00000
batch 58 training loss is : 0.12207
batch 58 training accuracy is : 0.87500
batch 59 training loss is : 0.31840
batch 59 training accuracy is : 0.87500
batch 60 training loss is : 0.03280
batch 60 training accuracy is : 1.00000
batch 61 training loss is : 0.07455
batch 61 training accuracy is : 0.93750
batch 62 training loss is : 0.03542
batch 62 training accuracy is : 1.00000
batch 63 tra

batch 23 training loss is : 0.11767
batch 23 training accuracy is : 0.93750
batch 24 training loss is : 0.17181
batch 24 training accuracy is : 0.87500
batch 25 training loss is : 0.06404
batch 25 training accuracy is : 0.93750
batch 26 training loss is : 0.00162
batch 26 training accuracy is : 1.00000
batch 27 training loss is : 0.15760
batch 27 training accuracy is : 0.93750
batch 28 training loss is : 0.13675
batch 28 training accuracy is : 0.93750
batch 29 training loss is : 0.04377
batch 29 training accuracy is : 1.00000
batch 30 training loss is : 0.26891
batch 30 training accuracy is : 0.81250
batch 31 training loss is : 0.10316
batch 31 training accuracy is : 0.93750
batch 32 training loss is : 0.07900
batch 32 training accuracy is : 1.00000
batch 33 training loss is : 0.15145
batch 33 training accuracy is : 0.93750
batch 34 training loss is : 0.10030
batch 34 training accuracy is : 0.93750
batch 35 training loss is : 0.19146
batch 35 training accuracy is : 0.93750
batch 36 tra

batch 19 dev loss is : 1.23436
batch 19 dev accuracy is : 0.75000
batch 20 dev loss is : 1.01056
batch 20 dev accuracy is : 0.81250
batch 21 dev loss is : 0.90134
batch 21 dev accuracy is : 0.68750
batch 22 dev loss is : 1.26845
batch 22 dev accuracy is : 0.68750
batch 23 dev loss is : 0.69666
batch 23 dev accuracy is : 0.75000
batch 24 dev loss is : 0.84296
batch 24 dev accuracy is : 0.75000
batch 25 dev loss is : 0.47298
batch 25 dev accuracy is : 0.87500
batch 26 dev loss is : 0.72182
batch 26 dev accuracy is : 0.75000
batch 27 dev loss is : 0.57205
batch 27 dev accuracy is : 0.81250
Average validation loss is 0.89519 at the end of epoch 3
Average validation accuracy is 0.72511 at the end of epoch 3
At 4-th epoch.
batch 0 training loss is : 0.09620
batch 0 training accuracy is : 0.93750
batch 1 training loss is : 0.04079
batch 1 training accuracy is : 1.00000
batch 2 training loss is : 0.28471
batch 2 training accuracy is : 0.87500
batch 3 training loss is : 0.33634
batch 3 training

batch 99 training loss is : 0.24196
batch 99 training accuracy is : 0.87500
batch 100 training loss is : 0.31976
batch 100 training accuracy is : 0.81250
batch 101 training loss is : 0.03339
batch 101 training accuracy is : 1.00000
batch 102 training loss is : 0.06115
batch 102 training accuracy is : 1.00000
batch 103 training loss is : 0.02492
batch 103 training accuracy is : 1.00000
batch 104 training loss is : 0.07047
batch 104 training accuracy is : 1.00000
batch 105 training loss is : 0.06926
batch 105 training accuracy is : 1.00000
batch 106 training loss is : 0.02621
batch 106 training accuracy is : 1.00000
batch 107 training loss is : 0.04490
batch 107 training accuracy is : 1.00000
batch 108 training loss is : 0.16470
batch 108 training accuracy is : 0.93750
batch 109 training loss is : 0.11219
batch 109 training accuracy is : 0.93750
batch 110 training loss is : 0.11123
batch 110 training accuracy is : 1.00000
batch 111 training loss is : 0.08460
batch 111 training accuracy i

batch 69 training loss is : 0.01926
batch 69 training accuracy is : 1.00000
batch 70 training loss is : 0.04976
batch 70 training accuracy is : 1.00000
batch 71 training loss is : 0.04544
batch 71 training accuracy is : 0.93750
batch 72 training loss is : 0.00699
batch 72 training accuracy is : 1.00000
batch 73 training loss is : 0.12328
batch 73 training accuracy is : 0.87500
batch 74 training loss is : 0.14097
batch 74 training accuracy is : 0.87500
batch 75 training loss is : 0.17588
batch 75 training accuracy is : 0.87500
batch 76 training loss is : 0.04415
batch 76 training accuracy is : 1.00000
batch 77 training loss is : 0.07511
batch 77 training accuracy is : 1.00000
batch 78 training loss is : 0.18730
batch 78 training accuracy is : 0.93750
batch 79 training loss is : 0.10816
batch 79 training accuracy is : 0.93750
batch 80 training loss is : 0.09870
batch 80 training accuracy is : 1.00000
batch 81 training loss is : 1.00403
batch 81 training accuracy is : 0.81250
batch 82 tra

batch 37 training loss is : 0.23307
batch 37 training accuracy is : 0.87500
batch 38 training loss is : 0.21392
batch 38 training accuracy is : 0.81250
batch 39 training loss is : 0.02517
batch 39 training accuracy is : 1.00000
batch 40 training loss is : 0.08028
batch 40 training accuracy is : 1.00000
batch 41 training loss is : 0.09738
batch 41 training accuracy is : 1.00000
batch 42 training loss is : 0.10589
batch 42 training accuracy is : 0.93750
batch 43 training loss is : 0.08284
batch 43 training accuracy is : 1.00000
batch 44 training loss is : 0.14130
batch 44 training accuracy is : 0.93750
batch 45 training loss is : 0.09060
batch 45 training accuracy is : 1.00000
batch 46 training loss is : 0.09357
batch 46 training accuracy is : 1.00000
batch 47 training loss is : 0.18153
batch 47 training accuracy is : 0.93750
batch 48 training loss is : 0.11512
batch 48 training accuracy is : 0.93750
batch 49 training loss is : 0.07698
batch 49 training accuracy is : 1.00000
batch 50 tra

batch 10 training loss is : 0.44312
batch 10 training accuracy is : 0.87500
batch 11 training loss is : 0.09447
batch 11 training accuracy is : 0.93750
batch 12 training loss is : 0.22886
batch 12 training accuracy is : 0.81250
batch 13 training loss is : 0.06554
batch 13 training accuracy is : 1.00000
batch 14 training loss is : 0.03860
batch 14 training accuracy is : 1.00000
batch 15 training loss is : 0.12727
batch 15 training accuracy is : 0.93750
batch 16 training loss is : 0.27734
batch 16 training accuracy is : 0.87500
batch 17 training loss is : 0.11836
batch 17 training accuracy is : 1.00000
batch 18 training loss is : 0.05537
batch 18 training accuracy is : 1.00000
batch 19 training loss is : 0.18583
batch 19 training accuracy is : 0.87500
batch 20 training loss is : 0.20704
batch 20 training accuracy is : 0.93750
batch 21 training loss is : 0.12966
batch 21 training accuracy is : 0.93750
batch 22 training loss is : 0.14455
batch 22 training accuracy is : 0.93750
batch 23 tra

batch 4 dev loss is : 0.71602
batch 4 dev accuracy is : 0.68750
batch 5 dev loss is : 0.36633
batch 5 dev accuracy is : 0.87500
batch 6 dev loss is : 0.34029
batch 6 dev accuracy is : 0.75000
batch 7 dev loss is : 1.30034
batch 7 dev accuracy is : 0.75000
batch 8 dev loss is : 0.59775
batch 8 dev accuracy is : 0.81250
batch 9 dev loss is : 0.54318
batch 9 dev accuracy is : 0.81250
batch 10 dev loss is : 1.05900
batch 10 dev accuracy is : 0.56250
batch 11 dev loss is : 1.10542
batch 11 dev accuracy is : 0.62500
batch 12 dev loss is : 0.79266
batch 12 dev accuracy is : 0.68750
batch 13 dev loss is : 1.31435
batch 13 dev accuracy is : 0.62500
batch 14 dev loss is : 1.26575
batch 14 dev accuracy is : 0.68750
batch 15 dev loss is : 0.61809
batch 15 dev accuracy is : 0.87500
batch 16 dev loss is : 0.81765
batch 16 dev accuracy is : 0.56250
batch 17 dev loss is : 1.68551
batch 17 dev accuracy is : 0.62500
batch 18 dev loss is : 1.14911
batch 18 dev accuracy is : 0.75000
batch 19 dev loss is :

batch 87 training loss is : 0.23251
batch 87 training accuracy is : 0.93750
batch 88 training loss is : 0.09993
batch 88 training accuracy is : 0.93750
batch 89 training loss is : 0.18455
batch 89 training accuracy is : 0.93750
batch 90 training loss is : 0.19654
batch 90 training accuracy is : 0.93750
batch 91 training loss is : 0.10963
batch 91 training accuracy is : 0.93750
batch 92 training loss is : 0.00010
batch 92 training accuracy is : 1.00000
batch 93 training loss is : 0.24448
batch 93 training accuracy is : 0.93750
batch 94 training loss is : 0.00155
batch 94 training accuracy is : 1.00000
batch 95 training loss is : 0.12212
batch 95 training accuracy is : 0.93750
batch 96 training loss is : 0.09639
batch 96 training accuracy is : 0.93750
batch 97 training loss is : 0.08248
batch 97 training accuracy is : 1.00000
batch 98 training loss is : 0.09820
batch 98 training accuracy is : 0.93750
batch 99 training loss is : 0.22926
batch 99 training accuracy is : 0.81250
batch 100 tr

batch 55 training loss is : 0.02529
batch 55 training accuracy is : 1.00000
batch 56 training loss is : 0.01816
batch 56 training accuracy is : 1.00000
batch 57 training loss is : 0.24051
batch 57 training accuracy is : 0.93750
batch 58 training loss is : 0.83697
batch 58 training accuracy is : 0.68750
batch 59 training loss is : 0.31802
batch 59 training accuracy is : 0.93750
batch 60 training loss is : 0.03831
batch 60 training accuracy is : 1.00000
batch 61 training loss is : 0.07639
batch 61 training accuracy is : 1.00000
batch 62 training loss is : 0.61458
batch 62 training accuracy is : 0.75000
batch 63 training loss is : 0.09252
batch 63 training accuracy is : 0.93750
batch 64 training loss is : 0.05713
batch 64 training accuracy is : 1.00000
batch 65 training loss is : 0.19385
batch 65 training accuracy is : 0.93750
batch 66 training loss is : 0.00009
batch 66 training accuracy is : 1.00000
batch 67 training loss is : 0.12786
batch 67 training accuracy is : 0.93750
batch 68 tra

batch 25 training loss is : 0.37919
batch 25 training accuracy is : 0.81250
batch 26 training loss is : 0.67236
batch 26 training accuracy is : 0.81250
batch 27 training loss is : 0.12959
batch 27 training accuracy is : 0.87500
batch 28 training loss is : 0.10869
batch 28 training accuracy is : 0.93750
batch 29 training loss is : 0.06904
batch 29 training accuracy is : 0.93750
batch 30 training loss is : 0.07050
batch 30 training accuracy is : 1.00000
batch 31 training loss is : 0.12128
batch 31 training accuracy is : 1.00000
batch 32 training loss is : 0.19170
batch 32 training accuracy is : 0.87500
batch 33 training loss is : 0.50061
batch 33 training accuracy is : 0.75000
batch 34 training loss is : 0.07531
batch 34 training accuracy is : 1.00000
batch 35 training loss is : 0.33578
batch 35 training accuracy is : 0.81250
batch 36 training loss is : 0.14037
batch 36 training accuracy is : 0.93750
batch 37 training loss is : 0.19612
batch 37 training accuracy is : 0.87500
batch 38 tra

batch 24 dev loss is : 0.21509
batch 24 dev accuracy is : 0.93750
batch 25 dev loss is : 1.49450
batch 25 dev accuracy is : 0.62500
batch 26 dev loss is : 1.65443
batch 26 dev accuracy is : 0.68750
batch 27 dev loss is : 1.28642
batch 27 dev accuracy is : 0.75000
Average validation loss is 1.06128 at the end of epoch 10
Average validation accuracy is 0.74026 at the end of epoch 10
At 11-th epoch.
batch 0 training loss is : 0.37928
batch 0 training accuracy is : 0.75000
batch 1 training loss is : 0.11398
batch 1 training accuracy is : 0.93750
batch 2 training loss is : 0.23203
batch 2 training accuracy is : 0.87500
batch 3 training loss is : 0.15933
batch 3 training accuracy is : 0.93750
batch 4 training loss is : 0.05182
batch 4 training accuracy is : 1.00000
batch 5 training loss is : 0.04451
batch 5 training accuracy is : 1.00000
batch 6 training loss is : 0.02313
batch 6 training accuracy is : 1.00000
batch 7 training loss is : 0.03092
batch 7 training accuracy is : 1.00000
batch 8 

batch 103 training loss is : 0.25622
batch 103 training accuracy is : 0.87500
batch 104 training loss is : 0.00230
batch 104 training accuracy is : 1.00000
batch 105 training loss is : 0.02307
batch 105 training accuracy is : 1.00000
batch 106 training loss is : 0.03981
batch 106 training accuracy is : 1.00000
batch 107 training loss is : 0.15451
batch 107 training accuracy is : 0.93750
batch 108 training loss is : 0.01531
batch 108 training accuracy is : 1.00000
batch 109 training loss is : 0.17456
batch 109 training accuracy is : 0.87500
batch 110 training loss is : 0.15599
batch 110 training accuracy is : 0.87500
batch 111 training loss is : 0.01887
batch 111 training accuracy is : 1.00000
batch 112 training loss is : 0.55458
batch 112 training accuracy is : 0.87500
Average training loss is 0.11713 at the end of epoch 11
Average training accuracy is 0.94069 at the end of epoch 11
batch 0 dev loss is : 0.64880
batch 0 dev accuracy is : 0.75000
batch 1 dev loss is : 0.37116
batch 1 de

batch 71 training loss is : 0.01302
batch 71 training accuracy is : 1.00000
batch 72 training loss is : 0.19709
batch 72 training accuracy is : 0.93750
batch 73 training loss is : 0.06541
batch 73 training accuracy is : 0.93750
batch 74 training loss is : 0.18044
batch 74 training accuracy is : 0.87500
batch 75 training loss is : 0.12984
batch 75 training accuracy is : 0.93750
batch 76 training loss is : 0.23150
batch 76 training accuracy is : 0.93750
batch 77 training loss is : 0.04418
batch 77 training accuracy is : 1.00000
batch 78 training loss is : 0.35369
batch 78 training accuracy is : 0.87500
batch 79 training loss is : 0.42737
batch 79 training accuracy is : 0.93750
batch 80 training loss is : 0.14868
batch 80 training accuracy is : 0.93750
batch 81 training loss is : 0.34985
batch 81 training accuracy is : 0.87500
batch 82 training loss is : 0.22115
batch 82 training accuracy is : 0.93750
batch 83 training loss is : 0.10412
batch 83 training accuracy is : 0.93750
batch 84 tra

batch 39 training loss is : 0.05449
batch 39 training accuracy is : 1.00000
batch 40 training loss is : 0.20699
batch 40 training accuracy is : 0.93750
batch 41 training loss is : 0.06177
batch 41 training accuracy is : 1.00000
batch 42 training loss is : 0.06505
batch 42 training accuracy is : 1.00000
batch 43 training loss is : 0.00033
batch 43 training accuracy is : 1.00000
batch 44 training loss is : 0.03472
batch 44 training accuracy is : 1.00000
batch 45 training loss is : 0.10643
batch 45 training accuracy is : 0.93750
batch 46 training loss is : 0.00022
batch 46 training accuracy is : 1.00000
batch 47 training loss is : 0.08922
batch 47 training accuracy is : 0.93750
batch 48 training loss is : 0.16232
batch 48 training accuracy is : 0.93750
batch 49 training loss is : 0.21974
batch 49 training accuracy is : 0.87500
batch 50 training loss is : 0.20206
batch 50 training accuracy is : 0.87500
batch 51 training loss is : 0.05180
batch 51 training accuracy is : 0.93750
batch 52 tra

batch 8 training loss is : 0.12422
batch 8 training accuracy is : 0.93750
batch 9 training loss is : 0.00269
batch 9 training accuracy is : 1.00000
batch 10 training loss is : 0.03446
batch 10 training accuracy is : 1.00000
batch 11 training loss is : 0.00522
batch 11 training accuracy is : 1.00000
batch 12 training loss is : 0.00385
batch 12 training accuracy is : 1.00000
batch 13 training loss is : 0.10626
batch 13 training accuracy is : 0.93750
batch 14 training loss is : 0.09917
batch 14 training accuracy is : 0.93750
batch 15 training loss is : 0.02928
batch 15 training accuracy is : 1.00000
batch 16 training loss is : 0.07044
batch 16 training accuracy is : 0.93750
batch 17 training loss is : 0.00075
batch 17 training accuracy is : 1.00000
batch 18 training loss is : 0.05652
batch 18 training accuracy is : 1.00000
batch 19 training loss is : 0.07087
batch 19 training accuracy is : 0.93750
batch 20 training loss is : 0.10414
batch 20 training accuracy is : 0.93750
batch 21 trainin

batch 3 dev loss is : 0.56208
batch 3 dev accuracy is : 0.87500
batch 4 dev loss is : 0.59841
batch 4 dev accuracy is : 0.68750
batch 5 dev loss is : 0.20083
batch 5 dev accuracy is : 0.87500
batch 6 dev loss is : 0.21338
batch 6 dev accuracy is : 0.87500
batch 7 dev loss is : 1.37057
batch 7 dev accuracy is : 0.81250
batch 8 dev loss is : 1.06862
batch 8 dev accuracy is : 0.68750
batch 9 dev loss is : 0.26949
batch 9 dev accuracy is : 0.93750
batch 10 dev loss is : 1.22935
batch 10 dev accuracy is : 0.62500
batch 11 dev loss is : 1.00915
batch 11 dev accuracy is : 0.62500
batch 12 dev loss is : 0.54352
batch 12 dev accuracy is : 0.75000
batch 13 dev loss is : 1.46590
batch 13 dev accuracy is : 0.68750
batch 14 dev loss is : 0.90272
batch 14 dev accuracy is : 0.75000
batch 15 dev loss is : 0.47650
batch 15 dev accuracy is : 0.87500
batch 16 dev loss is : 0.71816
batch 16 dev accuracy is : 0.75000
batch 17 dev loss is : 1.51826
batch 17 dev accuracy is : 0.62500
batch 18 dev loss is : 1

batch 86 training loss is : 0.07205
batch 86 training accuracy is : 0.93750
batch 87 training loss is : 0.16094
batch 87 training accuracy is : 0.93750
batch 88 training loss is : 0.17948
batch 88 training accuracy is : 0.87500
batch 89 training loss is : 0.27034
batch 89 training accuracy is : 0.81250
batch 90 training loss is : 0.00536
batch 90 training accuracy is : 1.00000
batch 91 training loss is : 0.16698
batch 91 training accuracy is : 0.93750
batch 92 training loss is : 0.05559
batch 92 training accuracy is : 1.00000
batch 93 training loss is : 0.43132
batch 93 training accuracy is : 0.87500
batch 94 training loss is : 0.02399
batch 94 training accuracy is : 1.00000
batch 95 training loss is : 0.08006
batch 95 training accuracy is : 1.00000
batch 96 training loss is : 0.50042
batch 96 training accuracy is : 0.81250
batch 97 training loss is : 0.04463
batch 97 training accuracy is : 1.00000
batch 98 training loss is : 0.00972
batch 98 training accuracy is : 1.00000
batch 99 tra

batch 55 training loss is : 0.15024
batch 55 training accuracy is : 0.87500
batch 56 training loss is : 0.25193
batch 56 training accuracy is : 0.93750
batch 57 training loss is : 0.14545
batch 57 training accuracy is : 0.93750
batch 58 training loss is : 0.33987
batch 58 training accuracy is : 0.81250
batch 59 training loss is : 0.91219
batch 59 training accuracy is : 0.75000
batch 60 training loss is : 0.06855
batch 60 training accuracy is : 0.93750
batch 61 training loss is : 0.00101
batch 61 training accuracy is : 1.00000
batch 62 training loss is : 0.16377
batch 62 training accuracy is : 0.93750
batch 63 training loss is : 0.06319
batch 63 training accuracy is : 0.93750
batch 64 training loss is : 0.11413
batch 64 training accuracy is : 0.93750
batch 65 training loss is : 0.01984
batch 65 training accuracy is : 1.00000
batch 66 training loss is : 0.03441
batch 66 training accuracy is : 1.00000
batch 67 training loss is : 0.03056
batch 67 training accuracy is : 1.00000
batch 68 tra

batch 24 training loss is : 0.12241
batch 24 training accuracy is : 0.93750
batch 25 training loss is : 0.07507
batch 25 training accuracy is : 1.00000
batch 26 training loss is : 0.75591
batch 26 training accuracy is : 0.81250
batch 27 training loss is : 0.10756
batch 27 training accuracy is : 1.00000
batch 28 training loss is : 0.11321
batch 28 training accuracy is : 0.93750
batch 29 training loss is : 0.22269
batch 29 training accuracy is : 0.93750
batch 30 training loss is : 0.07730
batch 30 training accuracy is : 1.00000
batch 31 training loss is : 0.02060
batch 31 training accuracy is : 1.00000
batch 32 training loss is : 0.01665
batch 32 training accuracy is : 1.00000
batch 33 training loss is : 0.15771
batch 33 training accuracy is : 0.93750
batch 34 training loss is : 0.05862
batch 34 training accuracy is : 0.93750
batch 35 training loss is : 0.12908
batch 35 training accuracy is : 0.93750
batch 36 training loss is : 0.00387
batch 36 training accuracy is : 1.00000
batch 37 tra

batch 22 dev loss is : 1.02255
batch 22 dev accuracy is : 0.87500
batch 23 dev loss is : 0.38513
batch 23 dev accuracy is : 0.87500
batch 24 dev loss is : 0.27827
batch 24 dev accuracy is : 0.93750
batch 25 dev loss is : 0.50715
batch 25 dev accuracy is : 0.75000
batch 26 dev loss is : 1.33413
batch 26 dev accuracy is : 0.68750
batch 27 dev loss is : 1.08437
batch 27 dev accuracy is : 0.75000
Average validation loss is 0.75054 at the end of epoch 17
Average validation accuracy is 0.77489 at the end of epoch 17
At 18-th epoch.
batch 0 training loss is : 0.14807
batch 0 training accuracy is : 0.93750
batch 1 training loss is : 0.11644
batch 1 training accuracy is : 0.93750
batch 2 training loss is : 0.07243
batch 2 training accuracy is : 1.00000
batch 3 training loss is : 0.15705
batch 3 training accuracy is : 0.93750
batch 4 training loss is : 0.14163
batch 4 training accuracy is : 0.93750
batch 5 training loss is : 0.50691
batch 5 training accuracy is : 0.75000
batch 6 training loss is

batch 103 training loss is : 0.03709
batch 103 training accuracy is : 1.00000
batch 104 training loss is : 0.02520
batch 104 training accuracy is : 1.00000
batch 105 training loss is : 0.03113
batch 105 training accuracy is : 1.00000
batch 106 training loss is : 0.09143
batch 106 training accuracy is : 1.00000
batch 107 training loss is : 0.04631
batch 107 training accuracy is : 1.00000
batch 108 training loss is : 0.00100
batch 108 training accuracy is : 1.00000
batch 109 training loss is : 0.20760
batch 109 training accuracy is : 0.93750
batch 110 training loss is : 0.10867
batch 110 training accuracy is : 0.93750
batch 111 training loss is : 0.00559
batch 111 training accuracy is : 1.00000
batch 112 training loss is : 0.06571
batch 112 training accuracy is : 0.93750
Average training loss is 0.09389 at the end of epoch 18
Average training accuracy is 0.95717 at the end of epoch 18
batch 0 dev loss is : 0.51470
batch 0 dev accuracy is : 0.75000
batch 1 dev loss is : 0.15321
batch 1 de

batch 73 training loss is : 0.30593
batch 73 training accuracy is : 0.75000
batch 74 training loss is : 0.63021
batch 74 training accuracy is : 0.87500
batch 75 training loss is : 0.12477
batch 75 training accuracy is : 0.93750
batch 76 training loss is : 0.22782
batch 76 training accuracy is : 0.93750
batch 77 training loss is : 0.05539
batch 77 training accuracy is : 1.00000
batch 78 training loss is : 0.00739
batch 78 training accuracy is : 1.00000
batch 79 training loss is : 0.13765
batch 79 training accuracy is : 0.93750
batch 80 training loss is : 0.06591
batch 80 training accuracy is : 0.93750
batch 81 training loss is : 0.23930
batch 81 training accuracy is : 0.87500
batch 82 training loss is : 0.10249
batch 82 training accuracy is : 0.93750
batch 83 training loss is : 0.07105
batch 83 training accuracy is : 0.93750
batch 84 training loss is : 0.12927
batch 84 training accuracy is : 0.93750
batch 85 training loss is : 0.13475
batch 85 training accuracy is : 0.93750
batch 86 tra

batch 42 training loss is : 0.01205
batch 42 training accuracy is : 1.00000
batch 43 training loss is : 0.02775
batch 43 training accuracy is : 1.00000
batch 44 training loss is : 0.10129
batch 44 training accuracy is : 1.00000
batch 45 training loss is : 0.15631
batch 45 training accuracy is : 0.93750
batch 46 training loss is : 0.04929
batch 46 training accuracy is : 1.00000
batch 47 training loss is : 0.00410
batch 47 training accuracy is : 1.00000
batch 48 training loss is : 0.04179
batch 48 training accuracy is : 1.00000
batch 49 training loss is : 0.16686
batch 49 training accuracy is : 0.93750
batch 50 training loss is : 0.04993
batch 50 training accuracy is : 1.00000
batch 51 training loss is : 0.23207
batch 51 training accuracy is : 0.87500
batch 52 training loss is : 0.26965
batch 52 training accuracy is : 0.87500
batch 53 training loss is : 0.22852
batch 53 training accuracy is : 0.87500
batch 54 training loss is : 0.28607
batch 54 training accuracy is : 0.87500
batch 55 tra

batch 12 training loss is : 0.37840
batch 12 training accuracy is : 0.93750
batch 13 training loss is : 0.00045
batch 13 training accuracy is : 1.00000
batch 14 training loss is : 0.23160
batch 14 training accuracy is : 0.93750
batch 15 training loss is : 0.14584
batch 15 training accuracy is : 1.00000
batch 16 training loss is : 0.06825
batch 16 training accuracy is : 1.00000
batch 17 training loss is : 0.16552
batch 17 training accuracy is : 0.93750
batch 18 training loss is : 0.00797
batch 18 training accuracy is : 1.00000
batch 19 training loss is : 0.24258
batch 19 training accuracy is : 0.87500
batch 20 training loss is : 0.13516
batch 20 training accuracy is : 0.87500
batch 21 training loss is : 0.08348
batch 21 training accuracy is : 1.00000
batch 22 training loss is : 0.10637
batch 22 training accuracy is : 0.93750
batch 23 training loss is : 0.22138
batch 23 training accuracy is : 0.87500
batch 24 training loss is : 0.02881
batch 24 training accuracy is : 1.00000
batch 25 tra

batch 6 dev loss is : 0.36405
batch 6 dev accuracy is : 0.75000
batch 7 dev loss is : 1.34101
batch 7 dev accuracy is : 0.75000
batch 8 dev loss is : 1.90010
batch 8 dev accuracy is : 0.62500
batch 9 dev loss is : 0.25688
batch 9 dev accuracy is : 0.87500
batch 10 dev loss is : 1.54092
batch 10 dev accuracy is : 0.56250
batch 11 dev loss is : 1.08881
batch 11 dev accuracy is : 0.62500
batch 12 dev loss is : 0.54677
batch 12 dev accuracy is : 0.81250
batch 13 dev loss is : 1.12240
batch 13 dev accuracy is : 0.75000
batch 14 dev loss is : 0.54398
batch 14 dev accuracy is : 0.87500
batch 15 dev loss is : 0.65019
batch 15 dev accuracy is : 0.87500
batch 16 dev loss is : 0.72983
batch 16 dev accuracy is : 0.87500
batch 17 dev loss is : 1.46124
batch 17 dev accuracy is : 0.62500
batch 18 dev loss is : 1.47198
batch 18 dev accuracy is : 0.62500
batch 19 dev loss is : 1.51726
batch 19 dev accuracy is : 0.81250
batch 20 dev loss is : 1.08312
batch 20 dev accuracy is : 0.87500
batch 21 dev loss 

batch 88 training loss is : 0.03485
batch 88 training accuracy is : 1.00000
batch 89 training loss is : 0.09791
batch 89 training accuracy is : 0.93750
batch 90 training loss is : 0.06759
batch 90 training accuracy is : 0.93750
batch 91 training loss is : 0.08641
batch 91 training accuracy is : 0.93750
batch 92 training loss is : 0.02358
batch 92 training accuracy is : 1.00000
batch 93 training loss is : 0.00592
batch 93 training accuracy is : 1.00000
batch 94 training loss is : 0.03523
batch 94 training accuracy is : 1.00000
batch 95 training loss is : 0.09008
batch 95 training accuracy is : 0.93750
batch 96 training loss is : 0.26163
batch 96 training accuracy is : 0.93750
batch 97 training loss is : 0.05574
batch 97 training accuracy is : 1.00000
batch 98 training loss is : 0.00788
batch 98 training accuracy is : 1.00000
batch 99 training loss is : 0.09151
batch 99 training accuracy is : 0.93750
batch 100 training loss is : 0.05552
batch 100 training accuracy is : 1.00000
batch 101 

batch 58 training loss is : 0.13529
batch 58 training accuracy is : 0.87500
batch 59 training loss is : 0.10603
batch 59 training accuracy is : 1.00000
batch 60 training loss is : 0.05797
batch 60 training accuracy is : 1.00000
batch 61 training loss is : 0.09661
batch 61 training accuracy is : 0.93750
batch 62 training loss is : 0.00748
batch 62 training accuracy is : 1.00000
batch 63 training loss is : 0.06257
batch 63 training accuracy is : 1.00000
batch 64 training loss is : 0.10745
batch 64 training accuracy is : 0.93750
batch 65 training loss is : 0.06347
batch 65 training accuracy is : 1.00000
batch 66 training loss is : 0.17975
batch 66 training accuracy is : 0.93750
batch 67 training loss is : 0.16140
batch 67 training accuracy is : 0.93750
batch 68 training loss is : 0.19632
batch 68 training accuracy is : 0.93750
batch 69 training loss is : 0.03773
batch 69 training accuracy is : 1.00000
batch 70 training loss is : 0.02993
batch 70 training accuracy is : 1.00000
batch 71 tra

batch 27 training loss is : 0.02705
batch 27 training accuracy is : 1.00000
batch 28 training loss is : 0.07668
batch 28 training accuracy is : 0.93750
batch 29 training loss is : 0.00053
batch 29 training accuracy is : 1.00000
batch 30 training loss is : 0.01004
batch 30 training accuracy is : 1.00000
batch 31 training loss is : 0.01231
batch 31 training accuracy is : 1.00000
batch 32 training loss is : 0.27514
batch 32 training accuracy is : 0.87500
batch 33 training loss is : 0.12951
batch 33 training accuracy is : 0.87500
batch 34 training loss is : 0.24490
batch 34 training accuracy is : 0.93750
batch 35 training loss is : 0.03705
batch 35 training accuracy is : 1.00000
batch 36 training loss is : 0.04060
batch 36 training accuracy is : 1.00000
batch 37 training loss is : 0.05895
batch 37 training accuracy is : 1.00000
batch 38 training loss is : 0.09339
batch 38 training accuracy is : 1.00000
batch 39 training loss is : 0.04078
batch 39 training accuracy is : 1.00000
batch 40 tra

batch 26 dev loss is : 1.13215
batch 26 dev accuracy is : 0.68750
batch 27 dev loss is : 0.97647
batch 27 dev accuracy is : 0.81250
Average validation loss is 0.74963 at the end of epoch 24
Average validation accuracy is 0.79654 at the end of epoch 24
At 25-th epoch.
batch 0 training loss is : 0.14741
batch 0 training accuracy is : 0.93750
batch 1 training loss is : 0.01926
batch 1 training accuracy is : 1.00000
batch 2 training loss is : 0.02297
batch 2 training accuracy is : 1.00000
batch 3 training loss is : 0.05910
batch 3 training accuracy is : 0.93750
batch 4 training loss is : 0.04544
batch 4 training accuracy is : 1.00000
batch 5 training loss is : 0.02211
batch 5 training accuracy is : 1.00000
batch 6 training loss is : 0.08979
batch 6 training accuracy is : 0.93750
batch 7 training loss is : 0.25385
batch 7 training accuracy is : 0.87500
batch 8 training loss is : 0.02867
batch 8 training accuracy is : 1.00000
batch 9 training loss is : 0.19853
batch 9 training accuracy is : 

batch 106 training loss is : 0.00076
batch 106 training accuracy is : 1.00000
batch 107 training loss is : 0.03995
batch 107 training accuracy is : 1.00000
batch 108 training loss is : 0.00026
batch 108 training accuracy is : 1.00000
batch 109 training loss is : 0.08421
batch 109 training accuracy is : 0.93750
batch 110 training loss is : 0.07081
batch 110 training accuracy is : 0.93750
batch 111 training loss is : 0.11391
batch 111 training accuracy is : 0.93750
batch 112 training loss is : 0.05188
batch 112 training accuracy is : 1.00000
Average training loss is 0.11470 at the end of epoch 25
Average training accuracy is 0.95277 at the end of epoch 25
batch 0 dev loss is : 0.32679
batch 0 dev accuracy is : 0.81250
batch 1 dev loss is : 0.33559
batch 1 dev accuracy is : 0.87500
batch 2 dev loss is : 0.41395
batch 2 dev accuracy is : 0.87500
batch 3 dev loss is : 0.45020
batch 3 dev accuracy is : 0.75000
batch 4 dev loss is : 0.79404
batch 4 dev accuracy is : 0.81250
batch 5 dev loss i

batch 74 training loss is : 0.09712
batch 74 training accuracy is : 0.93750
batch 75 training loss is : 0.01358
batch 75 training accuracy is : 1.00000
batch 76 training loss is : 0.15619
batch 76 training accuracy is : 0.93750
batch 77 training loss is : 0.02849
batch 77 training accuracy is : 1.00000
batch 78 training loss is : 0.13731
batch 78 training accuracy is : 0.93750
batch 79 training loss is : 0.02506
batch 79 training accuracy is : 1.00000
batch 80 training loss is : 0.00151
batch 80 training accuracy is : 1.00000
batch 81 training loss is : 0.17938
batch 81 training accuracy is : 0.93750
batch 82 training loss is : 0.09621
batch 82 training accuracy is : 0.93750
batch 83 training loss is : 0.05205
batch 83 training accuracy is : 1.00000
batch 84 training loss is : 0.13818
batch 84 training accuracy is : 0.93750
batch 85 training loss is : 0.07864
batch 85 training accuracy is : 1.00000
batch 86 training loss is : 0.02333
batch 86 training accuracy is : 1.00000
batch 87 tra

batch 44 training loss is : 0.09456
batch 44 training accuracy is : 1.00000
batch 45 training loss is : 0.03324
batch 45 training accuracy is : 1.00000
batch 46 training loss is : 0.05200
batch 46 training accuracy is : 0.93750
batch 47 training loss is : 0.14685
batch 47 training accuracy is : 0.81250
batch 48 training loss is : 0.05398
batch 48 training accuracy is : 0.93750
batch 49 training loss is : 0.05849
batch 49 training accuracy is : 1.00000
batch 50 training loss is : 0.11724
batch 50 training accuracy is : 0.93750
batch 51 training loss is : 0.00714
batch 51 training accuracy is : 1.00000
batch 52 training loss is : 0.34223
batch 52 training accuracy is : 0.87500
batch 53 training loss is : 0.04451
batch 53 training accuracy is : 1.00000
batch 54 training loss is : 0.12087
batch 54 training accuracy is : 0.93750
batch 55 training loss is : 0.04670
batch 55 training accuracy is : 1.00000
batch 56 training loss is : 0.08295
batch 56 training accuracy is : 0.93750
batch 57 tra

batch 12 training loss is : 0.02999
batch 12 training accuracy is : 1.00000
batch 13 training loss is : 0.02641
batch 13 training accuracy is : 1.00000
batch 14 training loss is : 0.07499
batch 14 training accuracy is : 0.93750
batch 15 training loss is : 0.45846
batch 15 training accuracy is : 0.87500
batch 16 training loss is : 0.01521
batch 16 training accuracy is : 1.00000
batch 17 training loss is : 0.08426
batch 17 training accuracy is : 0.93750
batch 18 training loss is : 0.11757
batch 18 training accuracy is : 0.93750
batch 19 training loss is : 0.01330
batch 19 training accuracy is : 1.00000
batch 20 training loss is : 0.08870
batch 20 training accuracy is : 0.93750
batch 21 training loss is : 0.15374
batch 21 training accuracy is : 0.93750
batch 22 training loss is : 0.10202
batch 22 training accuracy is : 0.93750
batch 23 training loss is : 0.01118
batch 23 training accuracy is : 1.00000
batch 24 training loss is : 0.22283
batch 24 training accuracy is : 0.93750
batch 25 tra

batch 8 dev loss is : 1.63237
batch 8 dev accuracy is : 0.62500
batch 9 dev loss is : 0.29133
batch 9 dev accuracy is : 0.81250
batch 10 dev loss is : 1.38856
batch 10 dev accuracy is : 0.56250
batch 11 dev loss is : 0.74059
batch 11 dev accuracy is : 0.62500
batch 12 dev loss is : 0.46852
batch 12 dev accuracy is : 0.81250
batch 13 dev loss is : 1.21282
batch 13 dev accuracy is : 0.68750
batch 14 dev loss is : 0.45425
batch 14 dev accuracy is : 0.87500
batch 15 dev loss is : 0.49746
batch 15 dev accuracy is : 0.87500
batch 16 dev loss is : 0.66129
batch 16 dev accuracy is : 0.75000
batch 17 dev loss is : 1.27013
batch 17 dev accuracy is : 0.75000
batch 18 dev loss is : 1.33668
batch 18 dev accuracy is : 0.62500
batch 19 dev loss is : 1.52460
batch 19 dev accuracy is : 0.81250
batch 20 dev loss is : 1.01241
batch 20 dev accuracy is : 0.81250
batch 21 dev loss is : 1.11032
batch 21 dev accuracy is : 0.81250
batch 22 dev loss is : 0.99672
batch 22 dev accuracy is : 0.81250
batch 23 dev l

batch 94 training loss is : 0.04135
batch 94 training accuracy is : 1.00000
batch 95 training loss is : 0.03991
batch 95 training accuracy is : 1.00000
batch 96 training loss is : 0.02168
batch 96 training accuracy is : 1.00000
batch 97 training loss is : 0.20552
batch 97 training accuracy is : 0.87500
batch 98 training loss is : 0.00024
batch 98 training accuracy is : 1.00000
batch 99 training loss is : 0.13633
batch 99 training accuracy is : 0.87500
batch 100 training loss is : 0.10333
batch 100 training accuracy is : 0.93750
batch 101 training loss is : 0.01473
batch 101 training accuracy is : 1.00000
batch 102 training loss is : 0.13953
batch 102 training accuracy is : 0.93750
batch 103 training loss is : 0.05908
batch 103 training accuracy is : 1.00000
batch 104 training loss is : 0.03218
batch 104 training accuracy is : 1.00000
batch 105 training loss is : 0.23216
batch 105 training accuracy is : 0.87500
batch 106 training loss is : 0.09332
batch 106 training accuracy is : 0.9375

batch 65 training loss is : 0.40406
batch 65 training accuracy is : 0.87500
batch 66 training loss is : 0.05097
batch 66 training accuracy is : 0.93750
batch 67 training loss is : 0.01878
batch 67 training accuracy is : 1.00000
batch 68 training loss is : 0.00725
batch 68 training accuracy is : 1.00000
batch 69 training loss is : 0.02300
batch 69 training accuracy is : 1.00000
batch 70 training loss is : 0.13460
batch 70 training accuracy is : 0.87500
batch 71 training loss is : 0.12637
batch 71 training accuracy is : 0.93750
batch 72 training loss is : 0.28119
batch 72 training accuracy is : 0.87500
batch 73 training loss is : 0.43492
batch 73 training accuracy is : 0.87500
batch 74 training loss is : 0.01514
batch 74 training accuracy is : 1.00000
batch 75 training loss is : 0.00964
batch 75 training accuracy is : 1.00000
batch 76 training loss is : 0.61655
batch 76 training accuracy is : 0.75000
batch 77 training loss is : 0.02744
batch 77 training accuracy is : 1.00000
batch 78 tra

batch 34 training loss is : 0.00225
batch 34 training accuracy is : 1.00000
batch 35 training loss is : 0.01425
batch 35 training accuracy is : 1.00000
batch 36 training loss is : 0.44351
batch 36 training accuracy is : 0.93750
batch 37 training loss is : 0.09376
batch 37 training accuracy is : 0.93750
batch 38 training loss is : 0.12370
batch 38 training accuracy is : 0.93750
batch 39 training loss is : 0.18104
batch 39 training accuracy is : 0.93750
batch 40 training loss is : 0.47920
batch 40 training accuracy is : 0.81250
batch 41 training loss is : 0.10756
batch 41 training accuracy is : 1.00000
batch 42 training loss is : 0.13031
batch 42 training accuracy is : 0.93750
batch 43 training loss is : 0.10629
batch 43 training accuracy is : 0.93750
batch 44 training loss is : 0.00014
batch 44 training accuracy is : 1.00000
batch 45 training loss is : 0.02748
batch 45 training accuracy is : 1.00000
batch 46 training loss is : 0.00595
batch 46 training accuracy is : 1.00000
batch 47 tra

batch 4 training loss is : 0.03155
batch 4 training accuracy is : 1.00000
batch 5 training loss is : 0.08919
batch 5 training accuracy is : 1.00000
batch 6 training loss is : 0.02429
batch 6 training accuracy is : 1.00000
batch 7 training loss is : 0.00084
batch 7 training accuracy is : 1.00000
batch 8 training loss is : 0.05029
batch 8 training accuracy is : 1.00000
batch 9 training loss is : 0.15382
batch 9 training accuracy is : 0.93750
batch 10 training loss is : 0.02368
batch 10 training accuracy is : 1.00000
batch 11 training loss is : 0.01175
batch 11 training accuracy is : 1.00000
batch 12 training loss is : 0.00035
batch 12 training accuracy is : 1.00000
batch 13 training loss is : 0.13900
batch 13 training accuracy is : 0.93750
batch 14 training loss is : 0.06099
batch 14 training accuracy is : 1.00000
batch 15 training loss is : 0.12180
batch 15 training accuracy is : 0.93750
batch 16 training loss is : 0.03277
batch 16 training accuracy is : 1.00000
batch 17 training loss i

Average training loss is 0.09432 at the end of epoch 32
Average training accuracy is 0.95387 at the end of epoch 32
batch 0 dev loss is : 0.78287
batch 0 dev accuracy is : 0.81250
batch 1 dev loss is : 0.47093
batch 1 dev accuracy is : 0.87500
batch 2 dev loss is : 0.75176
batch 2 dev accuracy is : 0.75000
batch 3 dev loss is : 0.93243
batch 3 dev accuracy is : 0.87500
batch 4 dev loss is : 0.66417
batch 4 dev accuracy is : 0.68750
batch 5 dev loss is : 0.40973
batch 5 dev accuracy is : 0.87500
batch 6 dev loss is : 0.81949
batch 6 dev accuracy is : 0.75000
batch 7 dev loss is : 1.38544
batch 7 dev accuracy is : 0.81250
batch 8 dev loss is : 1.73571
batch 8 dev accuracy is : 0.62500
batch 9 dev loss is : 0.55111
batch 9 dev accuracy is : 0.75000
batch 10 dev loss is : 1.93753
batch 10 dev accuracy is : 0.56250
batch 11 dev loss is : 0.84010
batch 11 dev accuracy is : 0.68750
batch 12 dev loss is : 0.55809
batch 12 dev accuracy is : 0.81250
batch 13 dev loss is : 1.39138
batch 13 dev ac

batch 81 training loss is : 0.05869
batch 81 training accuracy is : 1.00000
batch 82 training loss is : 0.03495
batch 82 training accuracy is : 1.00000
batch 83 training loss is : 0.14577
batch 83 training accuracy is : 0.93750
batch 84 training loss is : 0.08338
batch 84 training accuracy is : 1.00000
batch 85 training loss is : 0.05105
batch 85 training accuracy is : 1.00000
batch 86 training loss is : 0.21109
batch 86 training accuracy is : 0.93750
batch 87 training loss is : 0.01699
batch 87 training accuracy is : 1.00000
batch 88 training loss is : 0.11044
batch 88 training accuracy is : 0.93750
batch 89 training loss is : 0.17036
batch 89 training accuracy is : 0.87500
batch 90 training loss is : 0.00332
batch 90 training accuracy is : 1.00000
batch 91 training loss is : 0.22297
batch 91 training accuracy is : 0.93750
batch 92 training loss is : 0.01668
batch 92 training accuracy is : 1.00000
batch 93 training loss is : 0.01054
batch 93 training accuracy is : 1.00000
batch 94 tra

batch 49 training loss is : 0.10339
batch 49 training accuracy is : 1.00000
batch 50 training loss is : 0.00872
batch 50 training accuracy is : 1.00000
batch 51 training loss is : 0.19123
batch 51 training accuracy is : 0.87500
batch 52 training loss is : 0.01107
batch 52 training accuracy is : 1.00000
batch 53 training loss is : 0.03889
batch 53 training accuracy is : 1.00000
batch 54 training loss is : 0.18450
batch 54 training accuracy is : 0.87500
batch 55 training loss is : 0.08212
batch 55 training accuracy is : 1.00000
batch 56 training loss is : 0.01807
batch 56 training accuracy is : 1.00000
batch 57 training loss is : 0.00781
batch 57 training accuracy is : 1.00000
batch 58 training loss is : 0.28590
batch 58 training accuracy is : 0.93750
batch 59 training loss is : 0.05998
batch 59 training accuracy is : 1.00000
batch 60 training loss is : 0.12780
batch 60 training accuracy is : 0.93750
batch 61 training loss is : 0.01405
batch 61 training accuracy is : 1.00000
batch 62 tra

batch 19 training loss is : 0.13813
batch 19 training accuracy is : 0.93750
batch 20 training loss is : 0.01385
batch 20 training accuracy is : 1.00000
batch 21 training loss is : 0.08411
batch 21 training accuracy is : 0.93750
batch 22 training loss is : 0.04471
batch 22 training accuracy is : 1.00000
batch 23 training loss is : 0.01711
batch 23 training accuracy is : 1.00000
batch 24 training loss is : 0.08516
batch 24 training accuracy is : 0.93750
batch 25 training loss is : 0.04737
batch 25 training accuracy is : 1.00000
batch 26 training loss is : 0.05774
batch 26 training accuracy is : 1.00000
batch 27 training loss is : 0.04430
batch 27 training accuracy is : 1.00000
batch 28 training loss is : 0.05431
batch 28 training accuracy is : 1.00000
batch 29 training loss is : 0.35789
batch 29 training accuracy is : 0.81250
batch 30 training loss is : 0.13881
batch 30 training accuracy is : 0.93750
batch 31 training loss is : 0.06233
batch 31 training accuracy is : 0.93750
batch 32 tra

batch 15 dev loss is : 0.71186
batch 15 dev accuracy is : 0.81250
batch 16 dev loss is : 0.93241
batch 16 dev accuracy is : 0.81250
batch 17 dev loss is : 2.01921
batch 17 dev accuracy is : 0.62500
batch 18 dev loss is : 1.94969
batch 18 dev accuracy is : 0.68750
batch 19 dev loss is : 1.67816
batch 19 dev accuracy is : 0.75000
batch 20 dev loss is : 1.29921
batch 20 dev accuracy is : 0.75000
batch 21 dev loss is : 1.16564
batch 21 dev accuracy is : 0.75000
batch 22 dev loss is : 0.99514
batch 22 dev accuracy is : 0.81250
batch 23 dev loss is : 0.64315
batch 23 dev accuracy is : 0.81250
batch 24 dev loss is : 0.60382
batch 24 dev accuracy is : 0.87500
batch 25 dev loss is : 0.99188
batch 25 dev accuracy is : 0.68750
batch 26 dev loss is : 1.21729
batch 26 dev accuracy is : 0.68750
batch 27 dev loss is : 0.58299
batch 27 dev accuracy is : 0.81250
Average validation loss is 1.00406 at the end of epoch 35
Average validation accuracy is 0.72727 at the end of epoch 35
At 36-th epoch.
batch 

batch 96 training loss is : 0.23669
batch 96 training accuracy is : 0.87500
batch 97 training loss is : 0.70044
batch 97 training accuracy is : 0.62500
batch 98 training loss is : 0.14692
batch 98 training accuracy is : 0.93750
batch 99 training loss is : 0.07800
batch 99 training accuracy is : 0.93750
batch 100 training loss is : 0.15165
batch 100 training accuracy is : 0.87500
batch 101 training loss is : 0.00728
batch 101 training accuracy is : 1.00000
batch 102 training loss is : 0.06481
batch 102 training accuracy is : 0.93750
batch 103 training loss is : 0.18878
batch 103 training accuracy is : 0.87500
batch 104 training loss is : 0.00583
batch 104 training accuracy is : 1.00000
batch 105 training loss is : 0.18156
batch 105 training accuracy is : 0.93750
batch 106 training loss is : 0.10616
batch 106 training accuracy is : 0.93750
batch 107 training loss is : 0.19093
batch 107 training accuracy is : 0.87500
batch 108 training loss is : 0.12299
batch 108 training accuracy is : 0.

batch 66 training loss is : 0.02340
batch 66 training accuracy is : 1.00000
batch 67 training loss is : 0.08607
batch 67 training accuracy is : 0.93750
batch 68 training loss is : 0.12687
batch 68 training accuracy is : 0.93750
batch 69 training loss is : 0.03697
batch 69 training accuracy is : 1.00000
batch 70 training loss is : 0.01400
batch 70 training accuracy is : 1.00000
batch 71 training loss is : 0.01276
batch 71 training accuracy is : 1.00000
batch 72 training loss is : 0.00046
batch 72 training accuracy is : 1.00000
batch 73 training loss is : 0.13301
batch 73 training accuracy is : 0.93750
batch 74 training loss is : 0.01198
batch 74 training accuracy is : 1.00000
batch 75 training loss is : 0.01445
batch 75 training accuracy is : 1.00000
batch 76 training loss is : 0.01273
batch 76 training accuracy is : 1.00000
batch 77 training loss is : 0.05837
batch 77 training accuracy is : 0.93750
batch 78 training loss is : 0.23157
batch 78 training accuracy is : 0.87500
batch 79 tra

batch 36 training loss is : 0.03831
batch 36 training accuracy is : 1.00000
batch 37 training loss is : 0.03839
batch 37 training accuracy is : 1.00000
batch 38 training loss is : 0.15465
batch 38 training accuracy is : 0.93750
batch 39 training loss is : 0.05028
batch 39 training accuracy is : 1.00000
batch 40 training loss is : 0.03931
batch 40 training accuracy is : 1.00000
batch 41 training loss is : 0.05922
batch 41 training accuracy is : 1.00000
batch 42 training loss is : 0.17789
batch 42 training accuracy is : 0.93750
batch 43 training loss is : 0.33436
batch 43 training accuracy is : 0.93750
batch 44 training loss is : 0.00147
batch 44 training accuracy is : 1.00000
batch 45 training loss is : 0.03685
batch 45 training accuracy is : 1.00000
batch 46 training loss is : 0.06701
batch 46 training accuracy is : 1.00000
batch 47 training loss is : 0.19193
batch 47 training accuracy is : 0.93750
batch 48 training loss is : 0.01443
batch 48 training accuracy is : 1.00000
batch 49 tra

batch 6 training loss is : 0.08993
batch 6 training accuracy is : 0.93750
batch 7 training loss is : 0.08198
batch 7 training accuracy is : 0.93750
batch 8 training loss is : 0.09328
batch 8 training accuracy is : 1.00000
batch 9 training loss is : 0.00800
batch 9 training accuracy is : 1.00000
batch 10 training loss is : 0.11474
batch 10 training accuracy is : 0.93750
batch 11 training loss is : 0.02007
batch 11 training accuracy is : 1.00000
batch 12 training loss is : 0.06939
batch 12 training accuracy is : 1.00000
batch 13 training loss is : 0.02941
batch 13 training accuracy is : 1.00000
batch 14 training loss is : 0.00577
batch 14 training accuracy is : 1.00000
batch 15 training loss is : 0.21532
batch 15 training accuracy is : 0.87500
batch 16 training loss is : 0.01357
batch 16 training accuracy is : 1.00000
batch 17 training loss is : 0.17091
batch 17 training accuracy is : 0.93750
batch 18 training loss is : 0.10142
batch 18 training accuracy is : 0.93750
batch 19 training lo

batch 0 dev loss is : 0.42641
batch 0 dev accuracy is : 0.81250
batch 1 dev loss is : 0.15247
batch 1 dev accuracy is : 0.93750
batch 2 dev loss is : 0.53767
batch 2 dev accuracy is : 0.87500
batch 3 dev loss is : 0.51975
batch 3 dev accuracy is : 0.81250
batch 4 dev loss is : 0.71960
batch 4 dev accuracy is : 0.81250
batch 5 dev loss is : 0.25240
batch 5 dev accuracy is : 0.87500
batch 6 dev loss is : 0.30067
batch 6 dev accuracy is : 0.87500
batch 7 dev loss is : 1.40709
batch 7 dev accuracy is : 0.81250
batch 8 dev loss is : 1.29242
batch 8 dev accuracy is : 0.68750
batch 9 dev loss is : 0.37380
batch 9 dev accuracy is : 0.93750
batch 10 dev loss is : 1.13307
batch 10 dev accuracy is : 0.62500
batch 11 dev loss is : 0.89338
batch 11 dev accuracy is : 0.68750
batch 12 dev loss is : 0.97823
batch 12 dev accuracy is : 0.75000
batch 13 dev loss is : 1.54081
batch 13 dev accuracy is : 0.75000
batch 14 dev loss is : 0.50343
batch 14 dev accuracy is : 0.87500
batch 15 dev loss is : 0.39938

batch 84 training loss is : 0.03252
batch 84 training accuracy is : 1.00000
batch 85 training loss is : 0.09144
batch 85 training accuracy is : 1.00000
batch 86 training loss is : 0.09724
batch 86 training accuracy is : 0.93750
batch 87 training loss is : 0.09259
batch 87 training accuracy is : 0.93750
batch 88 training loss is : 0.03053
batch 88 training accuracy is : 1.00000
batch 89 training loss is : 0.01473
batch 89 training accuracy is : 1.00000
batch 90 training loss is : 0.01901
batch 90 training accuracy is : 1.00000
batch 91 training loss is : 0.41613
batch 91 training accuracy is : 0.87500
batch 92 training loss is : 0.44117
batch 92 training accuracy is : 0.81250
batch 93 training loss is : 0.03621
batch 93 training accuracy is : 1.00000
batch 94 training loss is : 0.02828
batch 94 training accuracy is : 1.00000
batch 95 training loss is : 0.00045
batch 95 training accuracy is : 1.00000
batch 96 training loss is : 0.01006
batch 96 training accuracy is : 1.00000
batch 97 tra

batch 56 training loss is : 0.13584
batch 56 training accuracy is : 0.93750
batch 57 training loss is : 0.04819
batch 57 training accuracy is : 0.93750
batch 58 training loss is : 0.16838
batch 58 training accuracy is : 0.93750
batch 59 training loss is : 0.11585
batch 59 training accuracy is : 0.93750
batch 60 training loss is : 0.18923
batch 60 training accuracy is : 0.93750
batch 61 training loss is : 0.06748
batch 61 training accuracy is : 1.00000
batch 62 training loss is : 0.21589
batch 62 training accuracy is : 0.93750
batch 63 training loss is : 0.21361
batch 63 training accuracy is : 0.93750
batch 64 training loss is : 0.06826
batch 64 training accuracy is : 0.93750
batch 65 training loss is : 0.04203
batch 65 training accuracy is : 1.00000
batch 66 training loss is : 0.07711
batch 66 training accuracy is : 0.93750
batch 67 training loss is : 0.08841
batch 67 training accuracy is : 0.93750
batch 68 training loss is : 0.09369
batch 68 training accuracy is : 0.93750
batch 69 tra

batch 27 training loss is : 0.02024
batch 27 training accuracy is : 1.00000
batch 28 training loss is : 0.15768
batch 28 training accuracy is : 0.87500
batch 29 training loss is : 0.00496
batch 29 training accuracy is : 1.00000
batch 30 training loss is : 0.06383
batch 30 training accuracy is : 0.93750
batch 31 training loss is : 0.03948
batch 31 training accuracy is : 1.00000
batch 32 training loss is : 0.09749
batch 32 training accuracy is : 0.93750
batch 33 training loss is : 0.00878
batch 33 training accuracy is : 1.00000
batch 34 training loss is : 0.00011
batch 34 training accuracy is : 1.00000
batch 35 training loss is : 0.29248
batch 35 training accuracy is : 0.81250
batch 36 training loss is : 0.34707
batch 36 training accuracy is : 0.93750
batch 37 training loss is : 0.12249
batch 37 training accuracy is : 0.93750
batch 38 training loss is : 0.09141
batch 38 training accuracy is : 0.93750
batch 39 training loss is : 0.08444
batch 39 training accuracy is : 0.93750
batch 40 tra

batch 27 dev loss is : 1.27737
batch 27 dev accuracy is : 0.68750
Average validation loss is 0.91100 at the end of epoch 42
Average validation accuracy is 0.75108 at the end of epoch 42
At 43-th epoch.
batch 0 training loss is : 0.03075
batch 0 training accuracy is : 1.00000
batch 1 training loss is : 0.06194
batch 1 training accuracy is : 1.00000
batch 2 training loss is : 0.16292
batch 2 training accuracy is : 0.87500
batch 3 training loss is : 0.01121
batch 3 training accuracy is : 1.00000
batch 4 training loss is : 0.17391
batch 4 training accuracy is : 0.87500
batch 5 training loss is : 0.01705
batch 5 training accuracy is : 1.00000
batch 6 training loss is : 0.13796
batch 6 training accuracy is : 0.87500
batch 7 training loss is : 0.07681
batch 7 training accuracy is : 0.93750
batch 8 training loss is : 0.07812
batch 8 training accuracy is : 0.93750
batch 9 training loss is : 0.10014
batch 9 training accuracy is : 1.00000
batch 10 training loss is : 0.05014
batch 10 training accu

batch 108 training loss is : 0.03241
batch 108 training accuracy is : 1.00000
batch 109 training loss is : 0.22644
batch 109 training accuracy is : 0.87500
batch 110 training loss is : 0.22646
batch 110 training accuracy is : 0.93750
batch 111 training loss is : 0.13306
batch 111 training accuracy is : 0.93750
batch 112 training loss is : 0.09969
batch 112 training accuracy is : 1.00000
Average training loss is 0.08132 at the end of epoch 43
Average training accuracy is 0.95826 at the end of epoch 43
batch 0 dev loss is : 0.83292
batch 0 dev accuracy is : 0.75000
batch 1 dev loss is : 0.21021
batch 1 dev accuracy is : 0.87500
batch 2 dev loss is : 0.34711
batch 2 dev accuracy is : 0.87500
batch 3 dev loss is : 0.75045
batch 3 dev accuracy is : 0.87500
batch 4 dev loss is : 0.52264
batch 4 dev accuracy is : 0.81250
batch 5 dev loss is : 0.23174
batch 5 dev accuracy is : 0.87500
batch 6 dev loss is : 0.35242
batch 6 dev accuracy is : 0.81250
batch 7 dev loss is : 1.51442
batch 7 dev accu

batch 77 training loss is : 0.03841
batch 77 training accuracy is : 1.00000
batch 78 training loss is : 0.06712
batch 78 training accuracy is : 1.00000
batch 79 training loss is : 0.15083
batch 79 training accuracy is : 0.93750
batch 80 training loss is : 0.09079
batch 80 training accuracy is : 0.93750
batch 81 training loss is : 0.15831
batch 81 training accuracy is : 0.93750
batch 82 training loss is : 0.06259
batch 82 training accuracy is : 0.93750
batch 83 training loss is : 0.02422
batch 83 training accuracy is : 1.00000
batch 84 training loss is : 0.07684
batch 84 training accuracy is : 0.93750
batch 85 training loss is : 0.18348
batch 85 training accuracy is : 0.87500
batch 86 training loss is : 0.08109
batch 86 training accuracy is : 0.93750
batch 87 training loss is : 0.01279
batch 87 training accuracy is : 1.00000
batch 88 training loss is : 0.09428
batch 88 training accuracy is : 0.93750
batch 89 training loss is : 0.18071
batch 89 training accuracy is : 0.87500
batch 90 tra

batch 45 training loss is : 0.14376
batch 45 training accuracy is : 0.93750
batch 46 training loss is : 0.01142
batch 46 training accuracy is : 1.00000
batch 47 training loss is : 0.09197
batch 47 training accuracy is : 0.93750
batch 48 training loss is : 0.00310
batch 48 training accuracy is : 1.00000
batch 49 training loss is : 0.17592
batch 49 training accuracy is : 0.93750
batch 50 training loss is : 0.05841
batch 50 training accuracy is : 1.00000
batch 51 training loss is : 0.10589
batch 51 training accuracy is : 0.93750
batch 52 training loss is : 0.01373
batch 52 training accuracy is : 1.00000
batch 53 training loss is : 0.02017
batch 53 training accuracy is : 1.00000
batch 54 training loss is : 0.14280
batch 54 training accuracy is : 0.93750
batch 55 training loss is : 0.15304
batch 55 training accuracy is : 0.93750
batch 56 training loss is : 0.20496
batch 56 training accuracy is : 0.93750
batch 57 training loss is : 0.05833
batch 57 training accuracy is : 1.00000
batch 58 tra

batch 15 training loss is : 0.01695
batch 15 training accuracy is : 1.00000
batch 16 training loss is : 0.09054
batch 16 training accuracy is : 1.00000
batch 17 training loss is : 0.11509
batch 17 training accuracy is : 0.93750
batch 18 training loss is : 0.02972
batch 18 training accuracy is : 1.00000
batch 19 training loss is : 0.01039
batch 19 training accuracy is : 1.00000
batch 20 training loss is : 0.06304
batch 20 training accuracy is : 1.00000
batch 21 training loss is : 0.02079
batch 21 training accuracy is : 1.00000
batch 22 training loss is : 0.03104
batch 22 training accuracy is : 1.00000
batch 23 training loss is : 0.12750
batch 23 training accuracy is : 0.93750
batch 24 training loss is : 0.04195
batch 24 training accuracy is : 1.00000
batch 25 training loss is : 0.21793
batch 25 training accuracy is : 0.93750
batch 26 training loss is : 0.09217
batch 26 training accuracy is : 0.93750
batch 27 training loss is : 0.12847
batch 27 training accuracy is : 0.87500
batch 28 tra

batch 10 dev loss is : 0.93375
batch 10 dev accuracy is : 0.75000
batch 11 dev loss is : 0.71169
batch 11 dev accuracy is : 0.56250
batch 12 dev loss is : 1.05203
batch 12 dev accuracy is : 0.68750
batch 13 dev loss is : 1.77276
batch 13 dev accuracy is : 0.75000
batch 14 dev loss is : 0.62101
batch 14 dev accuracy is : 0.81250
batch 15 dev loss is : 0.31123
batch 15 dev accuracy is : 0.93750
batch 16 dev loss is : 0.99372
batch 16 dev accuracy is : 0.75000
batch 17 dev loss is : 1.64296
batch 17 dev accuracy is : 0.56250
batch 18 dev loss is : 1.37449
batch 18 dev accuracy is : 0.68750
batch 19 dev loss is : 1.97612
batch 19 dev accuracy is : 0.87500
batch 20 dev loss is : 1.19504
batch 20 dev accuracy is : 0.81250
batch 21 dev loss is : 1.79974
batch 21 dev accuracy is : 0.68750
batch 22 dev loss is : 1.10926
batch 22 dev accuracy is : 0.81250
batch 23 dev loss is : 0.35107
batch 23 dev accuracy is : 0.93750
batch 24 dev loss is : 0.47172
batch 24 dev accuracy is : 0.87500
batch 25 d

batch 93 training loss is : 0.26186
batch 93 training accuracy is : 0.93750
batch 94 training loss is : 0.32804
batch 94 training accuracy is : 0.81250
batch 95 training loss is : 0.71837
batch 95 training accuracy is : 0.75000
batch 96 training loss is : 0.32245
batch 96 training accuracy is : 0.81250
batch 97 training loss is : 0.00489
batch 97 training accuracy is : 1.00000
batch 98 training loss is : 0.06744
batch 98 training accuracy is : 0.93750
batch 99 training loss is : 0.32765
batch 99 training accuracy is : 0.93750
batch 100 training loss is : 0.29044
batch 100 training accuracy is : 0.87500
batch 101 training loss is : 0.02881
batch 101 training accuracy is : 1.00000
batch 102 training loss is : 0.02353
batch 102 training accuracy is : 1.00000
batch 103 training loss is : 0.18110
batch 103 training accuracy is : 0.93750
batch 104 training loss is : 0.07027
batch 104 training accuracy is : 1.00000
batch 105 training loss is : 0.82770
batch 105 training accuracy is : 0.87500


batch 64 training loss is : 0.37123
batch 64 training accuracy is : 0.81250
batch 65 training loss is : 0.04201
batch 65 training accuracy is : 1.00000
batch 66 training loss is : 0.38066
batch 66 training accuracy is : 0.81250
batch 67 training loss is : 0.00811
batch 67 training accuracy is : 1.00000
batch 68 training loss is : 0.21220
batch 68 training accuracy is : 0.93750
batch 69 training loss is : 0.03354
batch 69 training accuracy is : 1.00000
batch 70 training loss is : 0.03491
batch 70 training accuracy is : 1.00000
batch 71 training loss is : 0.04341
batch 71 training accuracy is : 1.00000
batch 72 training loss is : 0.93506
batch 72 training accuracy is : 0.75000
batch 73 training loss is : 0.01287
batch 73 training accuracy is : 1.00000
batch 74 training loss is : 0.00849
batch 74 training accuracy is : 1.00000
batch 75 training loss is : 0.07131
batch 75 training accuracy is : 0.93750
batch 76 training loss is : 0.19553
batch 76 training accuracy is : 0.93750
batch 77 tra

batch 32 training loss is : 0.03943
batch 32 training accuracy is : 1.00000
batch 33 training loss is : 0.05528
batch 33 training accuracy is : 1.00000
batch 34 training loss is : 0.07449
batch 34 training accuracy is : 0.93750
batch 35 training loss is : 0.02210
batch 35 training accuracy is : 1.00000
batch 36 training loss is : 0.06958
batch 36 training accuracy is : 1.00000
batch 37 training loss is : 0.49128
batch 37 training accuracy is : 0.75000
batch 38 training loss is : 0.12335
batch 38 training accuracy is : 0.93750
batch 39 training loss is : 0.00139
batch 39 training accuracy is : 1.00000
batch 40 training loss is : 0.00115
batch 40 training accuracy is : 1.00000
batch 41 training loss is : 0.09756
batch 41 training accuracy is : 0.93750
batch 42 training loss is : 0.02136
batch 42 training accuracy is : 1.00000
batch 43 training loss is : 0.00744
batch 43 training accuracy is : 1.00000
batch 44 training loss is : 0.23311
batch 44 training accuracy is : 0.93750
batch 45 tra

batch 0 training loss is : 0.09549
batch 0 training accuracy is : 0.93750
batch 1 training loss is : 0.16615
batch 1 training accuracy is : 0.93750
batch 2 training loss is : 0.04855
batch 2 training accuracy is : 1.00000
batch 3 training loss is : 0.07660
batch 3 training accuracy is : 0.93750
batch 4 training loss is : 0.05084
batch 4 training accuracy is : 1.00000
batch 5 training loss is : 0.00004
batch 5 training accuracy is : 1.00000
batch 6 training loss is : 0.06897
batch 6 training accuracy is : 0.93750
batch 7 training loss is : 0.07081
batch 7 training accuracy is : 0.93750
batch 8 training loss is : 0.09898
batch 8 training accuracy is : 0.93750
batch 9 training loss is : 0.01080
batch 9 training accuracy is : 1.00000
batch 10 training loss is : 0.19231
batch 10 training accuracy is : 0.93750
batch 11 training loss is : 0.27538
batch 11 training accuracy is : 0.87500
batch 12 training loss is : 0.01308
batch 12 training accuracy is : 1.00000
batch 13 training loss is : 0.06

batch 110 training loss is : 0.14209
batch 110 training accuracy is : 0.93750
batch 111 training loss is : 0.22453
batch 111 training accuracy is : 0.93750
batch 112 training loss is : 0.01301
batch 112 training accuracy is : 1.00000
Average training loss is 0.08022 at the end of epoch 50
Average training accuracy is 0.95772 at the end of epoch 50
batch 0 dev loss is : 0.78023
batch 0 dev accuracy is : 0.75000
batch 1 dev loss is : 0.26922
batch 1 dev accuracy is : 0.93750
batch 2 dev loss is : 0.33563
batch 2 dev accuracy is : 0.87500
batch 3 dev loss is : 0.60641
batch 3 dev accuracy is : 0.87500
batch 4 dev loss is : 0.58288
batch 4 dev accuracy is : 0.81250
batch 5 dev loss is : 0.15633
batch 5 dev accuracy is : 0.93750
batch 6 dev loss is : 0.26901
batch 6 dev accuracy is : 0.87500
batch 7 dev loss is : 1.61404
batch 7 dev accuracy is : 0.87500
batch 8 dev loss is : 1.86080
batch 8 dev accuracy is : 0.68750
batch 9 dev loss is : 0.24296
batch 9 dev accuracy is : 0.93750
batch 10 d

batch 79 training loss is : 0.02305
batch 79 training accuracy is : 1.00000
batch 80 training loss is : 0.25344
batch 80 training accuracy is : 0.81250
batch 81 training loss is : 0.03948
batch 81 training accuracy is : 1.00000
batch 82 training loss is : 0.25167
batch 82 training accuracy is : 0.93750
batch 83 training loss is : 0.36698
batch 83 training accuracy is : 0.87500
batch 84 training loss is : 0.10252
batch 84 training accuracy is : 0.93750
batch 85 training loss is : 0.03704
batch 85 training accuracy is : 1.00000
batch 86 training loss is : 0.03715
batch 86 training accuracy is : 1.00000
batch 87 training loss is : 0.00754
batch 87 training accuracy is : 1.00000
batch 88 training loss is : 0.01125
batch 88 training accuracy is : 1.00000
batch 89 training loss is : 0.16334
batch 89 training accuracy is : 0.93750
batch 90 training loss is : 0.01821
batch 90 training accuracy is : 1.00000
batch 91 training loss is : 0.21942
batch 91 training accuracy is : 0.87500
batch 92 tra

batch 50 training loss is : 0.32162
batch 50 training accuracy is : 0.93750
batch 51 training loss is : 0.45918
batch 51 training accuracy is : 0.81250
batch 52 training loss is : 0.19574
batch 52 training accuracy is : 0.93750
batch 53 training loss is : 0.14767
batch 53 training accuracy is : 0.93750
batch 54 training loss is : 0.25513
batch 54 training accuracy is : 0.93750
batch 55 training loss is : 0.01112
batch 55 training accuracy is : 1.00000
batch 56 training loss is : 0.00000
batch 56 training accuracy is : 1.00000
batch 57 training loss is : 0.00782
batch 57 training accuracy is : 1.00000
batch 58 training loss is : 0.00703
batch 58 training accuracy is : 1.00000
batch 59 training loss is : 0.06762
batch 59 training accuracy is : 1.00000
batch 60 training loss is : 0.42689
batch 60 training accuracy is : 0.87500
batch 61 training loss is : 0.15888
batch 61 training accuracy is : 0.93750
batch 62 training loss is : 0.00228
batch 62 training accuracy is : 1.00000
batch 63 tra

batch 18 training loss is : 0.35527
batch 18 training accuracy is : 0.93750
batch 19 training loss is : 0.24833
batch 19 training accuracy is : 0.87500
batch 20 training loss is : 0.18872
batch 20 training accuracy is : 0.93750
batch 21 training loss is : 0.04789
batch 21 training accuracy is : 1.00000
batch 22 training loss is : 0.00250
batch 22 training accuracy is : 1.00000
batch 23 training loss is : 0.26025
batch 23 training accuracy is : 0.87500
batch 24 training loss is : 0.02865
batch 24 training accuracy is : 1.00000
batch 25 training loss is : 0.11984
batch 25 training accuracy is : 0.93750
batch 26 training loss is : 0.09878
batch 26 training accuracy is : 0.93750
batch 27 training loss is : 0.00161
batch 27 training accuracy is : 1.00000
batch 28 training loss is : 0.03389
batch 28 training accuracy is : 1.00000
batch 29 training loss is : 0.00704
batch 29 training accuracy is : 1.00000
batch 30 training loss is : 0.02051
batch 30 training accuracy is : 1.00000
batch 31 tra

batch 15 dev loss is : 0.54375
batch 15 dev accuracy is : 0.87500
batch 16 dev loss is : 0.75953
batch 16 dev accuracy is : 0.81250
batch 17 dev loss is : 1.40276
batch 17 dev accuracy is : 0.62500
batch 18 dev loss is : 1.43979
batch 18 dev accuracy is : 0.62500
batch 19 dev loss is : 1.60992
batch 19 dev accuracy is : 0.87500
batch 20 dev loss is : 1.08581
batch 20 dev accuracy is : 0.75000
batch 21 dev loss is : 1.34281
batch 21 dev accuracy is : 0.75000
batch 22 dev loss is : 1.04776
batch 22 dev accuracy is : 0.81250
batch 23 dev loss is : 0.33540
batch 23 dev accuracy is : 0.81250
batch 24 dev loss is : 0.40296
batch 24 dev accuracy is : 0.93750
batch 25 dev loss is : 0.50421
batch 25 dev accuracy is : 0.81250
batch 26 dev loss is : 1.11798
batch 26 dev accuracy is : 0.75000
batch 27 dev loss is : 0.95389
batch 27 dev accuracy is : 0.81250
Average validation loss is 0.84270 at the end of epoch 53
Average validation accuracy is 0.75541 at the end of epoch 53
At 54-th epoch.
batch 

batch 101 training loss is : 0.01272
batch 101 training accuracy is : 1.00000
batch 102 training loss is : 0.07275
batch 102 training accuracy is : 1.00000
batch 103 training loss is : 0.15318
batch 103 training accuracy is : 0.93750
batch 104 training loss is : 0.09225
batch 104 training accuracy is : 0.93750
batch 105 training loss is : 0.01398
batch 105 training accuracy is : 1.00000
batch 106 training loss is : 0.04839
batch 106 training accuracy is : 0.93750
batch 107 training loss is : 0.03616
batch 107 training accuracy is : 1.00000
batch 108 training loss is : 0.27787
batch 108 training accuracy is : 0.93750
batch 109 training loss is : 0.17710
batch 109 training accuracy is : 0.93750
batch 110 training loss is : 0.06470
batch 110 training accuracy is : 0.93750
batch 111 training loss is : 0.00068
batch 111 training accuracy is : 1.00000
batch 112 training loss is : 0.00549
batch 112 training accuracy is : 1.00000
Average training loss is 0.08584 at the end of epoch 54
Average 

batch 69 training loss is : 0.01127
batch 69 training accuracy is : 1.00000
batch 70 training loss is : 0.18292
batch 70 training accuracy is : 0.93750
batch 71 training loss is : 0.14978
batch 71 training accuracy is : 0.87500
batch 72 training loss is : 0.38095
batch 72 training accuracy is : 0.87500
batch 73 training loss is : 0.02262
batch 73 training accuracy is : 1.00000
batch 74 training loss is : 0.00004
batch 74 training accuracy is : 1.00000
batch 75 training loss is : 0.27296
batch 75 training accuracy is : 0.81250
batch 76 training loss is : 0.02319
batch 76 training accuracy is : 1.00000
batch 77 training loss is : 0.07473
batch 77 training accuracy is : 0.93750
batch 78 training loss is : 0.02292
batch 78 training accuracy is : 1.00000
batch 79 training loss is : 0.05567
batch 79 training accuracy is : 1.00000
batch 80 training loss is : 0.00032
batch 80 training accuracy is : 1.00000
batch 81 training loss is : 0.19695
batch 81 training accuracy is : 0.93750
batch 82 tra

batch 39 training loss is : 0.07088
batch 39 training accuracy is : 1.00000
batch 40 training loss is : 0.04068
batch 40 training accuracy is : 1.00000
batch 41 training loss is : 0.02141
batch 41 training accuracy is : 1.00000
batch 42 training loss is : 0.19357
batch 42 training accuracy is : 0.87500
batch 43 training loss is : 0.05264
batch 43 training accuracy is : 1.00000
batch 44 training loss is : 0.07990
batch 44 training accuracy is : 0.93750
batch 45 training loss is : 0.00833
batch 45 training accuracy is : 1.00000
batch 46 training loss is : 0.00233
batch 46 training accuracy is : 1.00000
batch 47 training loss is : 0.05850
batch 47 training accuracy is : 1.00000
batch 48 training loss is : 0.16100
batch 48 training accuracy is : 0.87500
batch 49 training loss is : 0.00595
batch 49 training accuracy is : 1.00000
batch 50 training loss is : 0.07463
batch 50 training accuracy is : 1.00000
batch 51 training loss is : 0.15048
batch 51 training accuracy is : 0.93750
batch 52 tra

batch 9 training loss is : 0.21401
batch 9 training accuracy is : 0.93750
batch 10 training loss is : 0.25376
batch 10 training accuracy is : 0.93750
batch 11 training loss is : 0.02239
batch 11 training accuracy is : 1.00000
batch 12 training loss is : 0.07046
batch 12 training accuracy is : 1.00000
batch 13 training loss is : 0.01454
batch 13 training accuracy is : 1.00000
batch 14 training loss is : 0.01531
batch 14 training accuracy is : 1.00000
batch 15 training loss is : 0.18080
batch 15 training accuracy is : 0.93750
batch 16 training loss is : 0.12581
batch 16 training accuracy is : 0.87500
batch 17 training loss is : 0.03877
batch 17 training accuracy is : 1.00000
batch 18 training loss is : 0.00003
batch 18 training accuracy is : 1.00000
batch 19 training loss is : 0.01263
batch 19 training accuracy is : 1.00000
batch 20 training loss is : 0.05646
batch 20 training accuracy is : 1.00000
batch 21 training loss is : 0.00772
batch 21 training accuracy is : 1.00000
batch 22 train

batch 3 dev loss is : 0.94935
batch 3 dev accuracy is : 0.87500
batch 4 dev loss is : 0.64311
batch 4 dev accuracy is : 0.75000
batch 5 dev loss is : 0.48202
batch 5 dev accuracy is : 0.87500
batch 6 dev loss is : 0.74169
batch 6 dev accuracy is : 0.75000
batch 7 dev loss is : 1.38880
batch 7 dev accuracy is : 0.87500
batch 8 dev loss is : 1.87285
batch 8 dev accuracy is : 0.62500
batch 9 dev loss is : 0.49224
batch 9 dev accuracy is : 0.81250
batch 10 dev loss is : 2.30417
batch 10 dev accuracy is : 0.56250
batch 11 dev loss is : 0.67079
batch 11 dev accuracy is : 0.87500
batch 12 dev loss is : 0.53931
batch 12 dev accuracy is : 0.81250
batch 13 dev loss is : 1.51567
batch 13 dev accuracy is : 0.62500
batch 14 dev loss is : 0.46286
batch 14 dev accuracy is : 0.87500
batch 15 dev loss is : 0.75036
batch 15 dev accuracy is : 0.81250
batch 16 dev loss is : 0.86510
batch 16 dev accuracy is : 0.81250
batch 17 dev loss is : 1.93527
batch 17 dev accuracy is : 0.68750
batch 18 dev loss is : 2

batch 87 training loss is : 0.12566
batch 87 training accuracy is : 0.93750
batch 88 training loss is : 0.00061
batch 88 training accuracy is : 1.00000
batch 89 training loss is : 0.00610
batch 89 training accuracy is : 1.00000
batch 90 training loss is : 0.01846
batch 90 training accuracy is : 1.00000
batch 91 training loss is : 0.00009
batch 91 training accuracy is : 1.00000
batch 92 training loss is : 0.14592
batch 92 training accuracy is : 0.87500
batch 93 training loss is : 0.13436
batch 93 training accuracy is : 0.93750
batch 94 training loss is : 0.41391
batch 94 training accuracy is : 0.93750
batch 95 training loss is : 0.22172
batch 95 training accuracy is : 0.93750
batch 96 training loss is : 0.16006
batch 96 training accuracy is : 0.93750
batch 97 training loss is : 0.04064
batch 97 training accuracy is : 1.00000
batch 98 training loss is : 0.00715
batch 98 training accuracy is : 1.00000
batch 99 training loss is : 0.03652
batch 99 training accuracy is : 1.00000
batch 100 tr

batch 56 training loss is : 0.12883
batch 56 training accuracy is : 0.93750
batch 57 training loss is : 0.50199
batch 57 training accuracy is : 0.87500
batch 58 training loss is : 0.38009
batch 58 training accuracy is : 0.81250
batch 59 training loss is : 0.04991
batch 59 training accuracy is : 1.00000
batch 60 training loss is : 0.12418
batch 60 training accuracy is : 0.93750
batch 61 training loss is : 0.00000
batch 61 training accuracy is : 1.00000
batch 62 training loss is : 0.00330
batch 62 training accuracy is : 1.00000
batch 63 training loss is : 0.00001
batch 63 training accuracy is : 1.00000
batch 64 training loss is : 0.65558
batch 64 training accuracy is : 0.87500
batch 65 training loss is : 0.17600
batch 65 training accuracy is : 0.93750
batch 66 training loss is : 0.24923
batch 66 training accuracy is : 0.93750
batch 67 training loss is : 0.03683
batch 67 training accuracy is : 1.00000
batch 68 training loss is : 0.04455
batch 68 training accuracy is : 1.00000
batch 69 tra

batch 25 training loss is : 0.11082
batch 25 training accuracy is : 0.93750
batch 26 training loss is : 0.06459
batch 26 training accuracy is : 1.00000
batch 27 training loss is : 0.01798
batch 27 training accuracy is : 1.00000
batch 28 training loss is : 0.04154
batch 28 training accuracy is : 1.00000
batch 29 training loss is : 0.11845
batch 29 training accuracy is : 0.93750
batch 30 training loss is : 0.01583
batch 30 training accuracy is : 1.00000
batch 31 training loss is : 0.24243
batch 31 training accuracy is : 0.93750
batch 32 training loss is : 0.13069
batch 32 training accuracy is : 0.93750
batch 33 training loss is : 0.01747
batch 33 training accuracy is : 1.00000
batch 34 training loss is : 0.09490
batch 34 training accuracy is : 0.93750
batch 35 training loss is : 0.31596
batch 35 training accuracy is : 0.87500
batch 36 training loss is : 0.12913
batch 36 training accuracy is : 0.93750
batch 37 training loss is : 0.02956
batch 37 training accuracy is : 1.00000
batch 38 tra

batch 25 dev loss is : 0.56417
batch 25 dev accuracy is : 0.81250
batch 26 dev loss is : 0.99695
batch 26 dev accuracy is : 0.75000
batch 27 dev loss is : 1.15050
batch 27 dev accuracy is : 0.81250
Average validation loss is 0.95425 at the end of epoch 60
Average validation accuracy is 0.76190 at the end of epoch 60
At 61-th epoch.
batch 0 training loss is : 0.03594
batch 0 training accuracy is : 1.00000
batch 1 training loss is : 0.05255
batch 1 training accuracy is : 1.00000
batch 2 training loss is : 0.04233
batch 2 training accuracy is : 1.00000
batch 3 training loss is : 0.03352
batch 3 training accuracy is : 1.00000
batch 4 training loss is : 0.05906
batch 4 training accuracy is : 0.93750
batch 5 training loss is : 0.00010
batch 5 training accuracy is : 1.00000
batch 6 training loss is : 0.01039
batch 6 training accuracy is : 1.00000
batch 7 training loss is : 0.01769
batch 7 training accuracy is : 1.00000
batch 8 training loss is : 0.05478
batch 8 training accuracy is : 0.93750


batch 106 training loss is : 0.24097
batch 106 training accuracy is : 0.93750
batch 107 training loss is : 0.00788
batch 107 training accuracy is : 1.00000
batch 108 training loss is : 0.03025
batch 108 training accuracy is : 1.00000
batch 109 training loss is : 0.18710
batch 109 training accuracy is : 0.87500
batch 110 training loss is : 0.07609
batch 110 training accuracy is : 0.93750
batch 111 training loss is : 0.09079
batch 111 training accuracy is : 0.93750
batch 112 training loss is : 0.11053
batch 112 training accuracy is : 0.93750
Average training loss is 0.08946 at the end of epoch 61
Average training accuracy is 0.95167 at the end of epoch 61
batch 0 dev loss is : 0.71363
batch 0 dev accuracy is : 0.75000
batch 1 dev loss is : 0.16928
batch 1 dev accuracy is : 0.93750
batch 2 dev loss is : 0.45008
batch 2 dev accuracy is : 0.81250
batch 3 dev loss is : 0.59611
batch 3 dev accuracy is : 0.87500
batch 4 dev loss is : 0.52487
batch 4 dev accuracy is : 0.81250
batch 5 dev loss i

batch 75 training loss is : 0.17034
batch 75 training accuracy is : 0.93750
batch 76 training loss is : 0.01301
batch 76 training accuracy is : 1.00000
batch 77 training loss is : 0.17985
batch 77 training accuracy is : 0.87500
batch 78 training loss is : 0.01212
batch 78 training accuracy is : 1.00000
batch 79 training loss is : 0.05241
batch 79 training accuracy is : 1.00000
batch 80 training loss is : 0.34559
batch 80 training accuracy is : 0.87500
batch 81 training loss is : 0.33774
batch 81 training accuracy is : 0.81250
batch 82 training loss is : 0.02920
batch 82 training accuracy is : 1.00000
batch 83 training loss is : 0.18877
batch 83 training accuracy is : 0.93750
batch 84 training loss is : 0.04210
batch 84 training accuracy is : 1.00000
batch 85 training loss is : 0.14464
batch 85 training accuracy is : 0.87500
batch 86 training loss is : 0.04526
batch 86 training accuracy is : 1.00000
batch 87 training loss is : 0.05472
batch 87 training accuracy is : 1.00000
batch 88 tra

batch 45 training loss is : 0.14569
batch 45 training accuracy is : 0.93750
batch 46 training loss is : 0.00031
batch 46 training accuracy is : 1.00000
batch 47 training loss is : 0.02662
batch 47 training accuracy is : 1.00000
batch 48 training loss is : 0.10045
batch 48 training accuracy is : 0.93750
batch 49 training loss is : 0.12242
batch 49 training accuracy is : 0.93750
batch 50 training loss is : 0.00063
batch 50 training accuracy is : 1.00000
batch 51 training loss is : 0.31177
batch 51 training accuracy is : 0.87500
batch 52 training loss is : 0.00042
batch 52 training accuracy is : 1.00000
batch 53 training loss is : 0.20579
batch 53 training accuracy is : 0.93750
batch 54 training loss is : 0.00630
batch 54 training accuracy is : 1.00000
batch 55 training loss is : 0.04108
batch 55 training accuracy is : 1.00000
batch 56 training loss is : 0.00996
batch 56 training accuracy is : 1.00000
batch 57 training loss is : 0.12402
batch 57 training accuracy is : 0.93750
batch 58 tra

batch 15 training loss is : 0.00093
batch 15 training accuracy is : 1.00000
batch 16 training loss is : 0.00430
batch 16 training accuracy is : 1.00000
batch 17 training loss is : 0.04750
batch 17 training accuracy is : 0.93750
batch 18 training loss is : 0.00528
batch 18 training accuracy is : 1.00000
batch 19 training loss is : 0.33816
batch 19 training accuracy is : 0.87500
batch 20 training loss is : 0.00246
batch 20 training accuracy is : 1.00000
batch 21 training loss is : 0.05823
batch 21 training accuracy is : 0.93750
batch 22 training loss is : 0.23499
batch 22 training accuracy is : 0.87500
batch 23 training loss is : 0.00393
batch 23 training accuracy is : 1.00000
batch 24 training loss is : 0.00814
batch 24 training accuracy is : 1.00000
batch 25 training loss is : 0.39989
batch 25 training accuracy is : 0.87500
batch 26 training loss is : 0.07781
batch 26 training accuracy is : 0.93750
batch 27 training loss is : 0.02829
batch 27 training accuracy is : 1.00000
batch 28 tra

batch 10 dev loss is : 1.13615
batch 10 dev accuracy is : 0.68750
batch 11 dev loss is : 1.81623
batch 11 dev accuracy is : 0.56250
batch 12 dev loss is : 1.19531
batch 12 dev accuracy is : 0.68750
batch 13 dev loss is : 1.92198
batch 13 dev accuracy is : 0.75000
batch 14 dev loss is : 1.23337
batch 14 dev accuracy is : 0.75000
batch 15 dev loss is : 0.60135
batch 15 dev accuracy is : 0.87500
batch 16 dev loss is : 0.96774
batch 16 dev accuracy is : 0.75000
batch 17 dev loss is : 2.01906
batch 17 dev accuracy is : 0.62500
batch 18 dev loss is : 1.50488
batch 18 dev accuracy is : 0.62500
batch 19 dev loss is : 2.32501
batch 19 dev accuracy is : 0.87500
batch 20 dev loss is : 1.51626
batch 20 dev accuracy is : 0.68750
batch 21 dev loss is : 2.08523
batch 21 dev accuracy is : 0.68750
batch 22 dev loss is : 0.88280
batch 22 dev accuracy is : 0.87500
batch 23 dev loss is : 0.34923
batch 23 dev accuracy is : 0.93750
batch 24 dev loss is : 0.40579
batch 24 dev accuracy is : 0.87500
batch 25 d

batch 92 training loss is : 0.01613
batch 92 training accuracy is : 1.00000
batch 93 training loss is : 0.21808
batch 93 training accuracy is : 0.93750
batch 94 training loss is : 0.01798
batch 94 training accuracy is : 1.00000
batch 95 training loss is : 0.07717
batch 95 training accuracy is : 0.93750
batch 96 training loss is : 0.00555
batch 96 training accuracy is : 1.00000
batch 97 training loss is : 0.02411
batch 97 training accuracy is : 1.00000
batch 98 training loss is : 0.06293
batch 98 training accuracy is : 1.00000
batch 99 training loss is : 0.24505
batch 99 training accuracy is : 0.93750
batch 100 training loss is : 0.13062
batch 100 training accuracy is : 0.93750
batch 101 training loss is : 0.31489
batch 101 training accuracy is : 0.93750
batch 102 training loss is : 0.39328
batch 102 training accuracy is : 0.93750
batch 103 training loss is : 0.02047
batch 103 training accuracy is : 1.00000
batch 104 training loss is : 0.03780
batch 104 training accuracy is : 1.00000
ba

batch 63 training loss is : 0.00051
batch 63 training accuracy is : 1.00000
batch 64 training loss is : 0.09742
batch 64 training accuracy is : 0.93750
batch 65 training loss is : 0.00465
batch 65 training accuracy is : 1.00000
batch 66 training loss is : 0.08626
batch 66 training accuracy is : 0.93750
batch 67 training loss is : 0.10113
batch 67 training accuracy is : 0.93750
batch 68 training loss is : 0.04668
batch 68 training accuracy is : 0.93750
batch 69 training loss is : 0.00474
batch 69 training accuracy is : 1.00000
batch 70 training loss is : 0.34612
batch 70 training accuracy is : 0.93750
batch 71 training loss is : 0.05399
batch 71 training accuracy is : 1.00000
batch 72 training loss is : 0.01224
batch 72 training accuracy is : 1.00000
batch 73 training loss is : 0.06028
batch 73 training accuracy is : 0.93750
batch 74 training loss is : 0.21540
batch 74 training accuracy is : 0.87500
batch 75 training loss is : 0.02214
batch 75 training accuracy is : 1.00000
batch 76 tra

batch 34 training loss is : 0.00129
batch 34 training accuracy is : 1.00000
batch 35 training loss is : 0.21828
batch 35 training accuracy is : 0.87500
batch 36 training loss is : 0.11490
batch 36 training accuracy is : 0.93750
batch 37 training loss is : 0.06408
batch 37 training accuracy is : 0.93750
batch 38 training loss is : 0.02849
batch 38 training accuracy is : 1.00000
batch 39 training loss is : 0.06822
batch 39 training accuracy is : 0.93750
batch 40 training loss is : 0.51110
batch 40 training accuracy is : 0.81250
batch 41 training loss is : 0.02556
batch 41 training accuracy is : 1.00000
batch 42 training loss is : 0.03746
batch 42 training accuracy is : 1.00000
batch 43 training loss is : 0.07080
batch 43 training accuracy is : 0.93750
batch 44 training loss is : 0.06735
batch 44 training accuracy is : 0.93750
batch 45 training loss is : 0.02072
batch 45 training accuracy is : 1.00000
batch 46 training loss is : 0.19001
batch 46 training accuracy is : 0.93750
batch 47 tra

batch 4 training loss is : 0.06781
batch 4 training accuracy is : 0.93750
batch 5 training loss is : 0.01028
batch 5 training accuracy is : 1.00000
batch 6 training loss is : 0.02367
batch 6 training accuracy is : 1.00000
batch 7 training loss is : 0.01507
batch 7 training accuracy is : 1.00000
batch 8 training loss is : 0.00980
batch 8 training accuracy is : 1.00000
batch 9 training loss is : 0.06259
batch 9 training accuracy is : 0.93750
batch 10 training loss is : 0.02211
batch 10 training accuracy is : 1.00000
batch 11 training loss is : 0.24546
batch 11 training accuracy is : 0.87500
batch 12 training loss is : 0.05118
batch 12 training accuracy is : 1.00000
batch 13 training loss is : 0.01063
batch 13 training accuracy is : 1.00000
batch 14 training loss is : 0.18964
batch 14 training accuracy is : 0.93750
batch 15 training loss is : 0.02011
batch 15 training accuracy is : 1.00000
batch 16 training loss is : 0.06282
batch 16 training accuracy is : 0.93750
batch 17 training loss i

Average training loss is 0.07220 at the end of epoch 68
Average training accuracy is 0.96431 at the end of epoch 68
batch 0 dev loss is : 0.76116
batch 0 dev accuracy is : 0.75000
batch 1 dev loss is : 0.37053
batch 1 dev accuracy is : 0.87500
batch 2 dev loss is : 0.63050
batch 2 dev accuracy is : 0.81250
batch 3 dev loss is : 0.93256
batch 3 dev accuracy is : 0.81250
batch 4 dev loss is : 0.84664
batch 4 dev accuracy is : 0.75000
batch 5 dev loss is : 0.48428
batch 5 dev accuracy is : 0.81250
batch 6 dev loss is : 0.59358
batch 6 dev accuracy is : 0.68750
batch 7 dev loss is : 1.52102
batch 7 dev accuracy is : 0.81250
batch 8 dev loss is : 1.72683
batch 8 dev accuracy is : 0.62500
batch 9 dev loss is : 0.58079
batch 9 dev accuracy is : 0.81250
batch 10 dev loss is : 1.71209
batch 10 dev accuracy is : 0.56250
batch 11 dev loss is : 0.93012
batch 11 dev accuracy is : 0.68750
batch 12 dev loss is : 0.75928
batch 12 dev accuracy is : 0.75000
batch 13 dev loss is : 1.73351
batch 13 dev ac

batch 81 training loss is : 0.18814
batch 81 training accuracy is : 0.93750
batch 82 training loss is : 0.00409
batch 82 training accuracy is : 1.00000
batch 83 training loss is : 0.14489
batch 83 training accuracy is : 0.93750
batch 84 training loss is : 0.09517
batch 84 training accuracy is : 0.93750
batch 85 training loss is : 0.00030
batch 85 training accuracy is : 1.00000
batch 86 training loss is : 0.07201
batch 86 training accuracy is : 0.93750
batch 87 training loss is : 0.09154
batch 87 training accuracy is : 0.93750
batch 88 training loss is : 0.09013
batch 88 training accuracy is : 1.00000
batch 89 training loss is : 0.13963
batch 89 training accuracy is : 0.93750
batch 90 training loss is : 0.24453
batch 90 training accuracy is : 0.75000
batch 91 training loss is : 0.03534
batch 91 training accuracy is : 1.00000
batch 92 training loss is : 0.02655
batch 92 training accuracy is : 1.00000
batch 93 training loss is : 0.00222
batch 93 training accuracy is : 1.00000
batch 94 tra

batch 50 training loss is : 0.12044
batch 50 training accuracy is : 0.93750
batch 51 training loss is : 0.03695
batch 51 training accuracy is : 1.00000
batch 52 training loss is : 0.11822
batch 52 training accuracy is : 0.93750
batch 53 training loss is : 0.00934
batch 53 training accuracy is : 1.00000
batch 54 training loss is : 0.00803
batch 54 training accuracy is : 1.00000
batch 55 training loss is : 0.01054
batch 55 training accuracy is : 1.00000
batch 56 training loss is : 0.00470
batch 56 training accuracy is : 1.00000
batch 57 training loss is : 0.06300
batch 57 training accuracy is : 1.00000
batch 58 training loss is : 0.02698
batch 58 training accuracy is : 1.00000
batch 59 training loss is : 0.04212
batch 59 training accuracy is : 1.00000
batch 60 training loss is : 0.10244
batch 60 training accuracy is : 0.93750
batch 61 training loss is : 0.05109
batch 61 training accuracy is : 1.00000
batch 62 training loss is : 0.01212
batch 62 training accuracy is : 1.00000
batch 63 tra

batch 20 training loss is : 0.08921
batch 20 training accuracy is : 0.93750
batch 21 training loss is : 0.09367
batch 21 training accuracy is : 0.93750
batch 22 training loss is : 0.07617
batch 22 training accuracy is : 1.00000
batch 23 training loss is : 0.16714
batch 23 training accuracy is : 0.93750
batch 24 training loss is : 0.04309
batch 24 training accuracy is : 1.00000
batch 25 training loss is : 0.13000
batch 25 training accuracy is : 0.93750
batch 26 training loss is : 0.25383
batch 26 training accuracy is : 0.87500
batch 27 training loss is : 0.58304
batch 27 training accuracy is : 0.81250
batch 28 training loss is : 0.00948
batch 28 training accuracy is : 1.00000
batch 29 training loss is : 0.07208
batch 29 training accuracy is : 0.93750
batch 30 training loss is : 0.00041
batch 30 training accuracy is : 1.00000
batch 31 training loss is : 0.03941
batch 31 training accuracy is : 1.00000
batch 32 training loss is : 0.08585
batch 32 training accuracy is : 1.00000
batch 33 tra

batch 18 dev loss is : 1.51497
batch 18 dev accuracy is : 0.62500
batch 19 dev loss is : 2.27108
batch 19 dev accuracy is : 0.87500
batch 20 dev loss is : 1.38691
batch 20 dev accuracy is : 0.75000
batch 21 dev loss is : 2.19039
batch 21 dev accuracy is : 0.75000
batch 22 dev loss is : 1.10647
batch 22 dev accuracy is : 0.87500
batch 23 dev loss is : 0.35212
batch 23 dev accuracy is : 0.87500
batch 24 dev loss is : 0.43311
batch 24 dev accuracy is : 0.81250
batch 25 dev loss is : 0.96241
batch 25 dev accuracy is : 0.68750
batch 26 dev loss is : 2.40587
batch 26 dev accuracy is : 0.68750
batch 27 dev loss is : 1.61321
batch 27 dev accuracy is : 0.68750
Average validation loss is 1.05749 at the end of epoch 71
Average validation accuracy is 0.75541 at the end of epoch 71
At 72-th epoch.
batch 0 training loss is : 0.05042
batch 0 training accuracy is : 0.93750
batch 1 training loss is : 0.02344
batch 1 training accuracy is : 1.00000
batch 2 training loss is : 0.03530
batch 2 training accu

batch 98 training loss is : 0.08139
batch 98 training accuracy is : 0.93750
batch 99 training loss is : 0.01546
batch 99 training accuracy is : 1.00000
batch 100 training loss is : 0.02181
batch 100 training accuracy is : 1.00000
batch 101 training loss is : 0.00627
batch 101 training accuracy is : 1.00000
batch 102 training loss is : 0.10510
batch 102 training accuracy is : 0.93750
batch 103 training loss is : 0.00342
batch 103 training accuracy is : 1.00000
batch 104 training loss is : 0.01986
batch 104 training accuracy is : 1.00000
batch 105 training loss is : 0.04091
batch 105 training accuracy is : 1.00000
batch 106 training loss is : 0.03497
batch 106 training accuracy is : 1.00000
batch 107 training loss is : 0.53705
batch 107 training accuracy is : 0.87500
batch 108 training loss is : 0.05771
batch 108 training accuracy is : 1.00000
batch 109 training loss is : 0.00997
batch 109 training accuracy is : 1.00000
batch 110 training loss is : 0.03552
batch 110 training accuracy is 

batch 68 training loss is : 0.18613
batch 68 training accuracy is : 0.87500
batch 69 training loss is : 0.01722
batch 69 training accuracy is : 1.00000
batch 70 training loss is : 0.12418
batch 70 training accuracy is : 0.93750
batch 71 training loss is : 0.01671
batch 71 training accuracy is : 1.00000
batch 72 training loss is : 0.21289
batch 72 training accuracy is : 0.87500
batch 73 training loss is : 0.02418
batch 73 training accuracy is : 1.00000
batch 74 training loss is : 0.00699
batch 74 training accuracy is : 1.00000
batch 75 training loss is : 0.07023
batch 75 training accuracy is : 0.93750
batch 76 training loss is : 0.05057
batch 76 training accuracy is : 1.00000
batch 77 training loss is : 0.04767
batch 77 training accuracy is : 1.00000
batch 78 training loss is : 0.00450
batch 78 training accuracy is : 1.00000
batch 79 training loss is : 0.05969
batch 79 training accuracy is : 1.00000
batch 80 training loss is : 0.11657
batch 80 training accuracy is : 0.93750
batch 81 tra

batch 36 training loss is : 0.17577
batch 36 training accuracy is : 0.93750
batch 37 training loss is : 0.03912
batch 37 training accuracy is : 1.00000
batch 38 training loss is : 0.21233
batch 38 training accuracy is : 0.93750
batch 39 training loss is : 0.30477
batch 39 training accuracy is : 0.87500
batch 40 training loss is : 0.02668
batch 40 training accuracy is : 1.00000
batch 41 training loss is : 0.00344
batch 41 training accuracy is : 1.00000
batch 42 training loss is : 0.03157
batch 42 training accuracy is : 1.00000
batch 43 training loss is : 0.00365
batch 43 training accuracy is : 1.00000
batch 44 training loss is : 0.00924
batch 44 training accuracy is : 1.00000
batch 45 training loss is : 0.04260
batch 45 training accuracy is : 1.00000
batch 46 training loss is : 0.03444
batch 46 training accuracy is : 1.00000
batch 47 training loss is : 0.13077
batch 47 training accuracy is : 0.93750
batch 48 training loss is : 0.02285
batch 48 training accuracy is : 1.00000
batch 49 tra

batch 4 training loss is : 0.08289
batch 4 training accuracy is : 0.93750
batch 5 training loss is : 0.00385
batch 5 training accuracy is : 1.00000
batch 6 training loss is : 0.00002
batch 6 training accuracy is : 1.00000
batch 7 training loss is : 0.04365
batch 7 training accuracy is : 1.00000
batch 8 training loss is : 0.02943
batch 8 training accuracy is : 1.00000
batch 9 training loss is : 0.11579
batch 9 training accuracy is : 0.93750
batch 10 training loss is : 0.15569
batch 10 training accuracy is : 0.87500
batch 11 training loss is : 0.24973
batch 11 training accuracy is : 0.93750
batch 12 training loss is : 0.03012
batch 12 training accuracy is : 1.00000
batch 13 training loss is : 0.03828
batch 13 training accuracy is : 1.00000
batch 14 training loss is : 0.06970
batch 14 training accuracy is : 0.93750
batch 15 training loss is : 0.00762
batch 15 training accuracy is : 1.00000
batch 16 training loss is : 0.05495
batch 16 training accuracy is : 1.00000
batch 17 training loss i

batch 112 training loss is : 0.03342
batch 112 training accuracy is : 1.00000
Average training loss is 0.08974 at the end of epoch 75
Average training accuracy is 0.95826 at the end of epoch 75
batch 0 dev loss is : 0.96162
batch 0 dev accuracy is : 0.81250
batch 1 dev loss is : 0.15962
batch 1 dev accuracy is : 0.87500
batch 2 dev loss is : 0.35560
batch 2 dev accuracy is : 0.81250
batch 3 dev loss is : 0.41631
batch 3 dev accuracy is : 0.87500
batch 4 dev loss is : 0.59470
batch 4 dev accuracy is : 0.75000
batch 5 dev loss is : 0.25497
batch 5 dev accuracy is : 0.87500
batch 6 dev loss is : 0.08783
batch 6 dev accuracy is : 1.00000
batch 7 dev loss is : 1.78909
batch 7 dev accuracy is : 0.87500
batch 8 dev loss is : 2.02410
batch 8 dev accuracy is : 0.62500
batch 9 dev loss is : 0.22755
batch 9 dev accuracy is : 0.87500
batch 10 dev loss is : 1.50186
batch 10 dev accuracy is : 0.68750
batch 11 dev loss is : 2.06642
batch 11 dev accuracy is : 0.50000
batch 12 dev loss is : 0.84883
bat

batch 82 training loss is : 0.25325
batch 82 training accuracy is : 0.93750
batch 83 training loss is : 0.09503
batch 83 training accuracy is : 0.93750
batch 84 training loss is : 0.36517
batch 84 training accuracy is : 0.87500
batch 85 training loss is : 0.09587
batch 85 training accuracy is : 0.93750
batch 86 training loss is : 0.02272
batch 86 training accuracy is : 1.00000
batch 87 training loss is : 0.19417
batch 87 training accuracy is : 0.93750
batch 88 training loss is : 0.00421
batch 88 training accuracy is : 1.00000
batch 89 training loss is : 0.04390
batch 89 training accuracy is : 1.00000
batch 90 training loss is : 0.01044
batch 90 training accuracy is : 1.00000
batch 91 training loss is : 0.04831
batch 91 training accuracy is : 1.00000
batch 92 training loss is : 0.08462
batch 92 training accuracy is : 0.93750
batch 93 training loss is : 0.04094
batch 93 training accuracy is : 1.00000
batch 94 training loss is : 0.01549
batch 94 training accuracy is : 1.00000
batch 95 tra

batch 51 training loss is : 0.03245
batch 51 training accuracy is : 1.00000
batch 52 training loss is : 0.13652
batch 52 training accuracy is : 0.93750
batch 53 training loss is : 0.03373
batch 53 training accuracy is : 1.00000
batch 54 training loss is : 0.19860
batch 54 training accuracy is : 0.93750
batch 55 training loss is : 0.30747
batch 55 training accuracy is : 0.87500
batch 56 training loss is : 0.05842
batch 56 training accuracy is : 1.00000
batch 57 training loss is : 0.08009
batch 57 training accuracy is : 1.00000
batch 58 training loss is : 0.12237
batch 58 training accuracy is : 0.93750
batch 59 training loss is : 0.05746
batch 59 training accuracy is : 1.00000
batch 60 training loss is : 0.02950
batch 60 training accuracy is : 1.00000
batch 61 training loss is : 0.12424
batch 61 training accuracy is : 0.93750
batch 62 training loss is : 0.03016
batch 62 training accuracy is : 1.00000
batch 63 training loss is : 0.25627
batch 63 training accuracy is : 0.87500
batch 64 tra

batch 21 training loss is : 0.00114
batch 21 training accuracy is : 1.00000
batch 22 training loss is : 0.41091
batch 22 training accuracy is : 0.87500
batch 23 training loss is : 0.06104
batch 23 training accuracy is : 1.00000
batch 24 training loss is : 0.24914
batch 24 training accuracy is : 0.87500
batch 25 training loss is : 0.01452
batch 25 training accuracy is : 1.00000
batch 26 training loss is : 0.00000
batch 26 training accuracy is : 1.00000
batch 27 training loss is : 0.00000
batch 27 training accuracy is : 1.00000
batch 28 training loss is : 0.13948
batch 28 training accuracy is : 0.93750
batch 29 training loss is : 0.00225
batch 29 training accuracy is : 1.00000
batch 30 training loss is : 0.01885
batch 30 training accuracy is : 1.00000
batch 31 training loss is : 0.08245
batch 31 training accuracy is : 0.93750
batch 32 training loss is : 0.23425
batch 32 training accuracy is : 0.87500
batch 33 training loss is : 0.20710
batch 33 training accuracy is : 0.87500
batch 34 tra

batch 17 dev loss is : 1.66178
batch 17 dev accuracy is : 0.62500
batch 18 dev loss is : 1.49684
batch 18 dev accuracy is : 0.68750
batch 19 dev loss is : 2.25832
batch 19 dev accuracy is : 0.87500
batch 20 dev loss is : 1.21063
batch 20 dev accuracy is : 0.87500
batch 21 dev loss is : 1.74848
batch 21 dev accuracy is : 0.81250
batch 22 dev loss is : 1.13633
batch 22 dev accuracy is : 0.81250
batch 23 dev loss is : 0.41144
batch 23 dev accuracy is : 0.93750
batch 24 dev loss is : 0.30951
batch 24 dev accuracy is : 0.93750
batch 25 dev loss is : 0.52021
batch 25 dev accuracy is : 0.75000
batch 26 dev loss is : 1.67798
batch 26 dev accuracy is : 0.68750
batch 27 dev loss is : 1.31066
batch 27 dev accuracy is : 0.75000
Average validation loss is 0.95541 at the end of epoch 78
Average validation accuracy is 0.78139 at the end of epoch 78
At 79-th epoch.
batch 0 training loss is : 0.26818
batch 0 training accuracy is : 0.75000
batch 1 training loss is : 0.05209
batch 1 training accuracy is 

batch 97 training loss is : 0.01974
batch 97 training accuracy is : 1.00000
batch 98 training loss is : 0.01968
batch 98 training accuracy is : 1.00000
batch 99 training loss is : 0.04790
batch 99 training accuracy is : 0.93750
batch 100 training loss is : 0.00167
batch 100 training accuracy is : 1.00000
batch 101 training loss is : 0.00335
batch 101 training accuracy is : 1.00000
batch 102 training loss is : 0.06165
batch 102 training accuracy is : 0.93750
batch 103 training loss is : 0.03646
batch 103 training accuracy is : 1.00000
batch 104 training loss is : 0.00836
batch 104 training accuracy is : 1.00000
batch 105 training loss is : 0.00538
batch 105 training accuracy is : 1.00000
batch 106 training loss is : 0.04534
batch 106 training accuracy is : 1.00000
batch 107 training loss is : 0.04241
batch 107 training accuracy is : 1.00000
batch 108 training loss is : 0.00571
batch 108 training accuracy is : 1.00000
batch 109 training loss is : 0.03192
batch 109 training accuracy is : 

batch 68 training loss is : 0.02147
batch 68 training accuracy is : 1.00000
batch 69 training loss is : 0.16419
batch 69 training accuracy is : 0.87500
batch 70 training loss is : 0.41268
batch 70 training accuracy is : 0.87500
batch 71 training loss is : 0.01888
batch 71 training accuracy is : 1.00000
batch 72 training loss is : 0.02369
batch 72 training accuracy is : 1.00000
batch 73 training loss is : 0.00035
batch 73 training accuracy is : 1.00000
batch 74 training loss is : 0.00329
batch 74 training accuracy is : 1.00000
batch 75 training loss is : 0.05923
batch 75 training accuracy is : 0.93750
batch 76 training loss is : 0.13712
batch 76 training accuracy is : 0.93750
batch 77 training loss is : 0.00199
batch 77 training accuracy is : 1.00000
batch 78 training loss is : 0.26650
batch 78 training accuracy is : 0.93750
batch 79 training loss is : 0.00128
batch 79 training accuracy is : 1.00000
batch 80 training loss is : 0.50649
batch 80 training accuracy is : 0.87500
batch 81 tra

batch 38 training loss is : 0.05167
batch 38 training accuracy is : 1.00000
batch 39 training loss is : 0.22294
batch 39 training accuracy is : 0.87500
batch 40 training loss is : 0.12234
batch 40 training accuracy is : 0.93750
batch 41 training loss is : 0.05824
batch 41 training accuracy is : 1.00000
batch 42 training loss is : 0.13673
batch 42 training accuracy is : 0.93750
batch 43 training loss is : 0.02121
batch 43 training accuracy is : 1.00000
batch 44 training loss is : 0.15211
batch 44 training accuracy is : 0.93750
batch 45 training loss is : 0.13055
batch 45 training accuracy is : 0.93750
batch 46 training loss is : 0.02139
batch 46 training accuracy is : 1.00000
batch 47 training loss is : 0.04485
batch 47 training accuracy is : 1.00000
batch 48 training loss is : 0.11579
batch 48 training accuracy is : 0.93750
batch 49 training loss is : 0.29578
batch 49 training accuracy is : 0.93750
batch 50 training loss is : 0.16259
batch 50 training accuracy is : 0.87500
batch 51 tra

batch 9 training loss is : 0.04440
batch 9 training accuracy is : 1.00000
batch 10 training loss is : 0.02592
batch 10 training accuracy is : 1.00000
batch 11 training loss is : 0.00021
batch 11 training accuracy is : 1.00000
batch 12 training loss is : 0.01438
batch 12 training accuracy is : 1.00000
batch 13 training loss is : 0.06776
batch 13 training accuracy is : 0.93750
batch 14 training loss is : 0.08718
batch 14 training accuracy is : 1.00000
batch 15 training loss is : 0.12092
batch 15 training accuracy is : 0.93750
batch 16 training loss is : 0.04078
batch 16 training accuracy is : 1.00000
batch 17 training loss is : 0.00343
batch 17 training accuracy is : 1.00000
batch 18 training loss is : 0.11304
batch 18 training accuracy is : 0.93750
batch 19 training loss is : 0.18918
batch 19 training accuracy is : 0.93750
batch 20 training loss is : 0.01627
batch 20 training accuracy is : 1.00000
batch 21 training loss is : 0.32151
batch 21 training accuracy is : 0.87500
batch 22 train

batch 4 dev loss is : 0.64999
batch 4 dev accuracy is : 0.81250
batch 5 dev loss is : 0.20648
batch 5 dev accuracy is : 0.87500
batch 6 dev loss is : 0.68678
batch 6 dev accuracy is : 0.75000
batch 7 dev loss is : 1.37351
batch 7 dev accuracy is : 0.75000
batch 8 dev loss is : 1.82161
batch 8 dev accuracy is : 0.62500
batch 9 dev loss is : 0.43396
batch 9 dev accuracy is : 0.81250
batch 10 dev loss is : 1.19394
batch 10 dev accuracy is : 0.62500
batch 11 dev loss is : 1.77746
batch 11 dev accuracy is : 0.62500
batch 12 dev loss is : 0.95480
batch 12 dev accuracy is : 0.81250
batch 13 dev loss is : 1.34945
batch 13 dev accuracy is : 0.68750
batch 14 dev loss is : 0.75675
batch 14 dev accuracy is : 0.81250
batch 15 dev loss is : 0.58769
batch 15 dev accuracy is : 0.81250
batch 16 dev loss is : 0.83051
batch 16 dev accuracy is : 0.81250
batch 17 dev loss is : 1.92076
batch 17 dev accuracy is : 0.62500
batch 18 dev loss is : 1.97252
batch 18 dev accuracy is : 0.68750
batch 19 dev loss is :

batch 87 training loss is : 0.14616
batch 87 training accuracy is : 0.93750
batch 88 training loss is : 0.12744
batch 88 training accuracy is : 0.93750
batch 89 training loss is : 0.00008
batch 89 training accuracy is : 1.00000
batch 90 training loss is : 0.02303
batch 90 training accuracy is : 1.00000
batch 91 training loss is : 0.00173
batch 91 training accuracy is : 1.00000
batch 92 training loss is : 0.01962
batch 92 training accuracy is : 1.00000
batch 93 training loss is : 0.12065
batch 93 training accuracy is : 0.93750
batch 94 training loss is : 0.06374
batch 94 training accuracy is : 0.93750
batch 95 training loss is : 0.63815
batch 95 training accuracy is : 0.87500
batch 96 training loss is : 0.00443
batch 96 training accuracy is : 1.00000
batch 97 training loss is : 0.03681
batch 97 training accuracy is : 1.00000
batch 98 training loss is : 0.07676
batch 98 training accuracy is : 0.93750
batch 99 training loss is : 0.08581
batch 99 training accuracy is : 1.00000
batch 100 tr

batch 56 training loss is : 0.09486
batch 56 training accuracy is : 0.93750
batch 57 training loss is : 0.00418
batch 57 training accuracy is : 1.00000
batch 58 training loss is : 0.47823
batch 58 training accuracy is : 0.93750
batch 59 training loss is : 0.04852
batch 59 training accuracy is : 1.00000
batch 60 training loss is : 0.12701
batch 60 training accuracy is : 0.87500
batch 61 training loss is : 0.04708
batch 61 training accuracy is : 1.00000
batch 62 training loss is : 0.26182
batch 62 training accuracy is : 0.87500
batch 63 training loss is : 0.02299
batch 63 training accuracy is : 1.00000
batch 64 training loss is : 0.00714
batch 64 training accuracy is : 1.00000
batch 65 training loss is : 0.19177
batch 65 training accuracy is : 0.93750
batch 66 training loss is : 0.25274
batch 66 training accuracy is : 0.93750
batch 67 training loss is : 0.13478
batch 67 training accuracy is : 0.93750
batch 68 training loss is : 0.19272
batch 68 training accuracy is : 0.93750
batch 69 tra

batch 24 training loss is : 0.23111
batch 24 training accuracy is : 0.93750
batch 25 training loss is : 0.20837
batch 25 training accuracy is : 0.93750
batch 26 training loss is : 0.01057
batch 26 training accuracy is : 1.00000
batch 27 training loss is : 0.06480
batch 27 training accuracy is : 0.93750
batch 28 training loss is : 0.00556
batch 28 training accuracy is : 1.00000
batch 29 training loss is : 0.00006
batch 29 training accuracy is : 1.00000
batch 30 training loss is : 0.00067
batch 30 training accuracy is : 1.00000
batch 31 training loss is : 0.02197
batch 31 training accuracy is : 1.00000
batch 32 training loss is : 0.00885
batch 32 training accuracy is : 1.00000
batch 33 training loss is : 0.22135
batch 33 training accuracy is : 0.93750
batch 34 training loss is : 0.01356
batch 34 training accuracy is : 1.00000
batch 35 training loss is : 0.24299
batch 35 training accuracy is : 0.87500
batch 36 training loss is : 0.06665
batch 36 training accuracy is : 0.93750
batch 37 tra

batch 20 dev loss is : 1.57904
batch 20 dev accuracy is : 0.81250
batch 21 dev loss is : 1.64373
batch 21 dev accuracy is : 0.68750
batch 22 dev loss is : 0.93050
batch 22 dev accuracy is : 0.81250
batch 23 dev loss is : 0.73429
batch 23 dev accuracy is : 0.75000
batch 24 dev loss is : 0.77000
batch 24 dev accuracy is : 0.81250
batch 25 dev loss is : 1.39733
batch 25 dev accuracy is : 0.75000
batch 26 dev loss is : 1.31893
batch 26 dev accuracy is : 0.75000
batch 27 dev loss is : 0.96700
batch 27 dev accuracy is : 0.75000
Average validation loss is 1.24749 at the end of epoch 85
Average validation accuracy is 0.72294 at the end of epoch 85
At 86-th epoch.
batch 0 training loss is : 0.03849
batch 0 training accuracy is : 1.00000
batch 1 training loss is : 0.10840
batch 1 training accuracy is : 0.93750
batch 2 training loss is : 0.13287
batch 2 training accuracy is : 0.93750
batch 3 training loss is : 0.02540
batch 3 training accuracy is : 1.00000
batch 4 training loss is : 0.05244
batch

batch 102 training loss is : 0.09692
batch 102 training accuracy is : 0.93750
batch 103 training loss is : 0.07433
batch 103 training accuracy is : 0.93750
batch 104 training loss is : 0.06878
batch 104 training accuracy is : 1.00000
batch 105 training loss is : 0.14797
batch 105 training accuracy is : 0.93750
batch 106 training loss is : 0.11752
batch 106 training accuracy is : 0.93750
batch 107 training loss is : 0.02430
batch 107 training accuracy is : 1.00000
batch 108 training loss is : 0.08676
batch 108 training accuracy is : 0.93750
batch 109 training loss is : 0.19956
batch 109 training accuracy is : 0.93750
batch 110 training loss is : 0.03649
batch 110 training accuracy is : 1.00000
batch 111 training loss is : 0.03561
batch 111 training accuracy is : 1.00000
batch 112 training loss is : 0.23527
batch 112 training accuracy is : 0.93750
Average training loss is 0.07796 at the end of epoch 86
Average training accuracy is 0.96266 at the end of epoch 86
batch 0 dev loss is : 0.67

batch 70 training loss is : 0.63839
batch 70 training accuracy is : 0.75000
batch 71 training loss is : 0.19672
batch 71 training accuracy is : 0.93750
batch 72 training loss is : 0.24157
batch 72 training accuracy is : 0.93750
batch 73 training loss is : 0.23377
batch 73 training accuracy is : 0.93750
batch 74 training loss is : 0.07312
batch 74 training accuracy is : 1.00000
batch 75 training loss is : 0.43346
batch 75 training accuracy is : 0.87500
batch 76 training loss is : 0.01830
batch 76 training accuracy is : 1.00000
batch 77 training loss is : 0.01466
batch 77 training accuracy is : 1.00000
batch 78 training loss is : 0.03540
batch 78 training accuracy is : 1.00000
batch 79 training loss is : 0.27860
batch 79 training accuracy is : 0.87500
batch 80 training loss is : 0.00001
batch 80 training accuracy is : 1.00000
batch 81 training loss is : 0.19771
batch 81 training accuracy is : 0.93750
batch 82 training loss is : 0.00768
batch 82 training accuracy is : 1.00000
batch 83 tra

batch 39 training loss is : 0.10928
batch 39 training accuracy is : 1.00000
batch 40 training loss is : 0.05117
batch 40 training accuracy is : 1.00000
batch 41 training loss is : 0.01042
batch 41 training accuracy is : 1.00000
batch 42 training loss is : 0.18928
batch 42 training accuracy is : 0.93750
batch 43 training loss is : 0.03046
batch 43 training accuracy is : 1.00000
batch 44 training loss is : 0.00533
batch 44 training accuracy is : 1.00000
batch 45 training loss is : 0.12635
batch 45 training accuracy is : 0.93750
batch 46 training loss is : 0.00494
batch 46 training accuracy is : 1.00000
batch 47 training loss is : 0.14808
batch 47 training accuracy is : 0.93750
batch 48 training loss is : 0.22495
batch 48 training accuracy is : 0.93750
batch 49 training loss is : 0.26062
batch 49 training accuracy is : 0.87500
batch 50 training loss is : 0.07534
batch 50 training accuracy is : 0.93750
batch 51 training loss is : 0.00623
batch 51 training accuracy is : 1.00000
batch 52 tra

batch 9 training loss is : 0.19446
batch 9 training accuracy is : 0.93750
batch 10 training loss is : 0.00918
batch 10 training accuracy is : 1.00000
batch 11 training loss is : 0.04423
batch 11 training accuracy is : 1.00000
batch 12 training loss is : 0.00003
batch 12 training accuracy is : 1.00000
batch 13 training loss is : 0.12457
batch 13 training accuracy is : 0.87500
batch 14 training loss is : 0.02175
batch 14 training accuracy is : 1.00000
batch 15 training loss is : 0.29504
batch 15 training accuracy is : 0.87500
batch 16 training loss is : 0.05336
batch 16 training accuracy is : 1.00000
batch 17 training loss is : 0.01988
batch 17 training accuracy is : 1.00000
batch 18 training loss is : 0.11376
batch 18 training accuracy is : 0.93750
batch 19 training loss is : 0.02444
batch 19 training accuracy is : 1.00000
batch 20 training loss is : 0.13700
batch 20 training accuracy is : 0.93750
batch 21 training loss is : 0.43416
batch 21 training accuracy is : 0.93750
batch 22 train

batch 3 dev loss is : 0.58100
batch 3 dev accuracy is : 0.81250
batch 4 dev loss is : 0.70708
batch 4 dev accuracy is : 0.81250
batch 5 dev loss is : 0.20364
batch 5 dev accuracy is : 0.87500
batch 6 dev loss is : 0.19007
batch 6 dev accuracy is : 0.93750
batch 7 dev loss is : 1.59679
batch 7 dev accuracy is : 0.81250
batch 8 dev loss is : 1.80820
batch 8 dev accuracy is : 0.68750
batch 9 dev loss is : 0.36849
batch 9 dev accuracy is : 0.87500
batch 10 dev loss is : 1.36859
batch 10 dev accuracy is : 0.68750
batch 11 dev loss is : 0.99952
batch 11 dev accuracy is : 0.75000
batch 12 dev loss is : 1.09260
batch 12 dev accuracy is : 0.75000
batch 13 dev loss is : 1.61980
batch 13 dev accuracy is : 0.68750
batch 14 dev loss is : 0.36802
batch 14 dev accuracy is : 0.87500
batch 15 dev loss is : 0.39011
batch 15 dev accuracy is : 0.93750
batch 16 dev loss is : 0.93370
batch 16 dev accuracy is : 0.81250
batch 17 dev loss is : 1.58893
batch 17 dev accuracy is : 0.62500
batch 18 dev loss is : 1

batch 87 training loss is : 0.00326
batch 87 training accuracy is : 1.00000
batch 88 training loss is : 0.06893
batch 88 training accuracy is : 1.00000
batch 89 training loss is : 0.13213
batch 89 training accuracy is : 0.93750
batch 90 training loss is : 0.07130
batch 90 training accuracy is : 0.93750
batch 91 training loss is : 0.09132
batch 91 training accuracy is : 0.93750
batch 92 training loss is : 0.15734
batch 92 training accuracy is : 0.87500
batch 93 training loss is : 0.13950
batch 93 training accuracy is : 0.93750
batch 94 training loss is : 0.11597
batch 94 training accuracy is : 0.93750
batch 95 training loss is : 0.05359
batch 95 training accuracy is : 1.00000
batch 96 training loss is : 0.06343
batch 96 training accuracy is : 1.00000
batch 97 training loss is : 0.00044
batch 97 training accuracy is : 1.00000
batch 98 training loss is : 0.09943
batch 98 training accuracy is : 0.93750
batch 99 training loss is : 0.00098
batch 99 training accuracy is : 1.00000
batch 100 tr

batch 59 training loss is : 0.00203
batch 59 training accuracy is : 1.00000
batch 60 training loss is : 0.01035
batch 60 training accuracy is : 1.00000
batch 61 training loss is : 0.10392
batch 61 training accuracy is : 0.93750
batch 62 training loss is : 0.09568
batch 62 training accuracy is : 0.93750
batch 63 training loss is : 0.05566
batch 63 training accuracy is : 1.00000
batch 64 training loss is : 0.08424
batch 64 training accuracy is : 0.93750
batch 65 training loss is : 0.03999
batch 65 training accuracy is : 1.00000
batch 66 training loss is : 0.00073
batch 66 training accuracy is : 1.00000
batch 67 training loss is : 0.15584
batch 67 training accuracy is : 0.87500
batch 68 training loss is : 0.19554
batch 68 training accuracy is : 0.93750
batch 69 training loss is : 0.05650
batch 69 training accuracy is : 1.00000
batch 70 training loss is : 0.13197
batch 70 training accuracy is : 0.93750
batch 71 training loss is : 0.03056
batch 71 training accuracy is : 1.00000
batch 72 tra

batch 29 training loss is : 0.40546
batch 29 training accuracy is : 0.81250
batch 30 training loss is : 0.00183
batch 30 training accuracy is : 1.00000
batch 31 training loss is : 0.26266
batch 31 training accuracy is : 0.93750
batch 32 training loss is : 0.00288
batch 32 training accuracy is : 1.00000
batch 33 training loss is : 0.03855
batch 33 training accuracy is : 1.00000
batch 34 training loss is : 0.00099
batch 34 training accuracy is : 1.00000
batch 35 training loss is : 0.04478
batch 35 training accuracy is : 1.00000
batch 36 training loss is : 0.01208
batch 36 training accuracy is : 1.00000
batch 37 training loss is : 0.04388
batch 37 training accuracy is : 1.00000
batch 38 training loss is : 0.00282
batch 38 training accuracy is : 1.00000
batch 39 training loss is : 0.08842
batch 39 training accuracy is : 0.93750
batch 40 training loss is : 0.13444
batch 40 training accuracy is : 0.93750
batch 41 training loss is : 0.68727
batch 41 training accuracy is : 0.87500
batch 42 tra

batch 26 dev loss is : 1.37226
batch 26 dev accuracy is : 0.75000
batch 27 dev loss is : 1.54853
batch 27 dev accuracy is : 0.75000
Average validation loss is 1.01723 at the end of epoch 92
Average validation accuracy is 0.78139 at the end of epoch 92
At 93-th epoch.
batch 0 training loss is : 0.00397
batch 0 training accuracy is : 1.00000
batch 1 training loss is : 0.07123
batch 1 training accuracy is : 1.00000
batch 2 training loss is : 0.38271
batch 2 training accuracy is : 0.81250
batch 3 training loss is : 0.07497
batch 3 training accuracy is : 0.93750
batch 4 training loss is : 0.30215
batch 4 training accuracy is : 0.87500
batch 5 training loss is : 0.04216
batch 5 training accuracy is : 1.00000
batch 6 training loss is : 0.02152
batch 6 training accuracy is : 1.00000
batch 7 training loss is : 0.37180
batch 7 training accuracy is : 0.81250
batch 8 training loss is : 0.04849
batch 8 training accuracy is : 1.00000
batch 9 training loss is : 0.20655
batch 9 training accuracy is : 

batch 107 training loss is : 0.21043
batch 107 training accuracy is : 0.87500
batch 108 training loss is : 0.03699
batch 108 training accuracy is : 1.00000
batch 109 training loss is : 0.51406
batch 109 training accuracy is : 0.75000
batch 110 training loss is : 0.23664
batch 110 training accuracy is : 0.93750
batch 111 training loss is : 0.21231
batch 111 training accuracy is : 0.93750
batch 112 training loss is : 0.02136
batch 112 training accuracy is : 1.00000
Average training loss is 0.09222 at the end of epoch 93
Average training accuracy is 0.95717 at the end of epoch 93
batch 0 dev loss is : 0.74017
batch 0 dev accuracy is : 0.75000
batch 1 dev loss is : 0.38476
batch 1 dev accuracy is : 0.87500
batch 2 dev loss is : 0.49002
batch 2 dev accuracy is : 0.87500
batch 3 dev loss is : 0.73671
batch 3 dev accuracy is : 0.81250
batch 4 dev loss is : 0.80026
batch 4 dev accuracy is : 0.75000
batch 5 dev loss is : 0.48583
batch 5 dev accuracy is : 0.87500
batch 6 dev loss is : 0.37250
ba

batch 76 training loss is : 0.11762
batch 76 training accuracy is : 0.93750
batch 77 training loss is : 0.12389
batch 77 training accuracy is : 0.93750
batch 78 training loss is : 0.01498
batch 78 training accuracy is : 1.00000
batch 79 training loss is : 0.54350
batch 79 training accuracy is : 0.81250
batch 80 training loss is : 0.00374
batch 80 training accuracy is : 1.00000
batch 81 training loss is : 0.03573
batch 81 training accuracy is : 1.00000
batch 82 training loss is : 0.00057
batch 82 training accuracy is : 1.00000
batch 83 training loss is : 0.00030
batch 83 training accuracy is : 1.00000
batch 84 training loss is : 0.02942
batch 84 training accuracy is : 1.00000
batch 85 training loss is : 0.00145
batch 85 training accuracy is : 1.00000
batch 86 training loss is : 0.00007
batch 86 training accuracy is : 1.00000
batch 87 training loss is : 0.20301
batch 87 training accuracy is : 0.93750
batch 88 training loss is : 0.00027
batch 88 training accuracy is : 1.00000
batch 89 tra

batch 44 training loss is : 0.05267
batch 44 training accuracy is : 1.00000
batch 45 training loss is : 0.04649
batch 45 training accuracy is : 1.00000
batch 46 training loss is : 0.13838
batch 46 training accuracy is : 0.87500
batch 47 training loss is : 0.42576
batch 47 training accuracy is : 0.87500
batch 48 training loss is : 0.03358
batch 48 training accuracy is : 1.00000
batch 49 training loss is : 0.02176
batch 49 training accuracy is : 1.00000
batch 50 training loss is : 0.04479
batch 50 training accuracy is : 1.00000
batch 51 training loss is : 0.00528
batch 51 training accuracy is : 1.00000
batch 52 training loss is : 0.06224
batch 52 training accuracy is : 1.00000
batch 53 training loss is : 0.00422
batch 53 training accuracy is : 1.00000
batch 54 training loss is : 0.23405
batch 54 training accuracy is : 0.93750
batch 55 training loss is : 0.04064
batch 55 training accuracy is : 1.00000
batch 56 training loss is : 0.04950
batch 56 training accuracy is : 1.00000
batch 57 tra

batch 15 training loss is : 0.13221
batch 15 training accuracy is : 0.93750
batch 16 training loss is : 0.13045
batch 16 training accuracy is : 0.93750
batch 17 training loss is : 0.09545
batch 17 training accuracy is : 0.93750
batch 18 training loss is : 0.11398
batch 18 training accuracy is : 0.93750
batch 19 training loss is : 0.01846
batch 19 training accuracy is : 1.00000
batch 20 training loss is : 0.00214
batch 20 training accuracy is : 1.00000
batch 21 training loss is : 0.02796
batch 21 training accuracy is : 1.00000
batch 22 training loss is : 0.00018
batch 22 training accuracy is : 1.00000
batch 23 training loss is : 0.20055
batch 23 training accuracy is : 0.87500
batch 24 training loss is : 0.11404
batch 24 training accuracy is : 0.93750
batch 25 training loss is : 0.00574
batch 25 training accuracy is : 1.00000
batch 26 training loss is : 0.01051
batch 26 training accuracy is : 1.00000
batch 27 training loss is : 0.17913
batch 27 training accuracy is : 0.93750
batch 28 tra

batch 12 dev loss is : 1.22380
batch 12 dev accuracy is : 0.75000
batch 13 dev loss is : 2.15388
batch 13 dev accuracy is : 0.68750
batch 14 dev loss is : 0.66172
batch 14 dev accuracy is : 0.81250
batch 15 dev loss is : 0.73052
batch 15 dev accuracy is : 0.87500
batch 16 dev loss is : 1.06137
batch 16 dev accuracy is : 0.81250
batch 17 dev loss is : 2.48905
batch 17 dev accuracy is : 0.68750
batch 18 dev loss is : 2.51116
batch 18 dev accuracy is : 0.68750
batch 19 dev loss is : 2.20479
batch 19 dev accuracy is : 0.75000
batch 20 dev loss is : 1.51844
batch 20 dev accuracy is : 0.75000
batch 21 dev loss is : 2.00007
batch 21 dev accuracy is : 0.75000
batch 22 dev loss is : 1.51079
batch 22 dev accuracy is : 0.81250
batch 23 dev loss is : 0.56410
batch 23 dev accuracy is : 0.81250
batch 24 dev loss is : 0.57653
batch 24 dev accuracy is : 0.81250
batch 25 dev loss is : 1.11105
batch 25 dev accuracy is : 0.75000
batch 26 dev loss is : 1.53526
batch 26 dev accuracy is : 0.68750
batch 27 d

batch 95 training loss is : 0.03665
batch 95 training accuracy is : 1.00000
batch 96 training loss is : 0.01382
batch 96 training accuracy is : 1.00000
batch 97 training loss is : 0.09342
batch 97 training accuracy is : 0.93750
batch 98 training loss is : 0.06144
batch 98 training accuracy is : 1.00000
batch 99 training loss is : 0.25018
batch 99 training accuracy is : 0.93750
batch 100 training loss is : 0.08721
batch 100 training accuracy is : 1.00000
batch 101 training loss is : 0.01045
batch 101 training accuracy is : 1.00000
batch 102 training loss is : 0.17693
batch 102 training accuracy is : 0.93750
batch 103 training loss is : 0.57840
batch 103 training accuracy is : 0.81250
batch 104 training loss is : 0.00706
batch 104 training accuracy is : 1.00000
batch 105 training loss is : 0.06925
batch 105 training accuracy is : 0.93750
batch 106 training loss is : 0.41863
batch 106 training accuracy is : 0.75000
batch 107 training loss is : 0.04192
batch 107 training accuracy is : 1.00

batch 63 training loss is : 0.07134
batch 63 training accuracy is : 1.00000
batch 64 training loss is : 0.04143
batch 64 training accuracy is : 1.00000
batch 65 training loss is : 0.12727
batch 65 training accuracy is : 0.93750
batch 66 training loss is : 0.00001
batch 66 training accuracy is : 1.00000
batch 67 training loss is : 0.00003
batch 67 training accuracy is : 1.00000
batch 68 training loss is : 0.18764
batch 68 training accuracy is : 0.93750
batch 69 training loss is : 0.08621
batch 69 training accuracy is : 1.00000
batch 70 training loss is : 0.02299
batch 70 training accuracy is : 1.00000
batch 71 training loss is : 0.00207
batch 71 training accuracy is : 1.00000
batch 72 training loss is : 0.10680
batch 72 training accuracy is : 0.93750
batch 73 training loss is : 0.01700
batch 73 training accuracy is : 1.00000
batch 74 training loss is : 0.00999
batch 74 training accuracy is : 1.00000
batch 75 training loss is : 0.00510
batch 75 training accuracy is : 1.00000
batch 76 tra

batch 33 training loss is : 0.00000
batch 33 training accuracy is : 1.00000
batch 34 training loss is : 0.01957
batch 34 training accuracy is : 1.00000
batch 35 training loss is : 0.01995
batch 35 training accuracy is : 1.00000
batch 36 training loss is : 0.20489
batch 36 training accuracy is : 0.93750
batch 37 training loss is : 0.04410
batch 37 training accuracy is : 1.00000
batch 38 training loss is : 0.02736
batch 38 training accuracy is : 1.00000
batch 39 training loss is : 0.00251
batch 39 training accuracy is : 1.00000
batch 40 training loss is : 0.07028
batch 40 training accuracy is : 1.00000
batch 41 training loss is : 0.06865
batch 41 training accuracy is : 0.93750
batch 42 training loss is : 0.10906
batch 42 training accuracy is : 0.93750
batch 43 training loss is : 0.50292
batch 43 training accuracy is : 0.75000
batch 44 training loss is : 0.01195
batch 44 training accuracy is : 1.00000
batch 45 training loss is : 0.05300
batch 45 training accuracy is : 1.00000
batch 46 tra

batch 3 training loss is : 0.32958
batch 3 training accuracy is : 0.81250
batch 4 training loss is : 0.02229
batch 4 training accuracy is : 1.00000
batch 5 training loss is : 0.00395
batch 5 training accuracy is : 1.00000
batch 6 training loss is : 0.03067
batch 6 training accuracy is : 1.00000
batch 7 training loss is : 0.05212
batch 7 training accuracy is : 1.00000
batch 8 training loss is : 0.00089
batch 8 training accuracy is : 1.00000
batch 9 training loss is : 0.00026
batch 9 training accuracy is : 1.00000
batch 10 training loss is : 0.11436
batch 10 training accuracy is : 0.93750
batch 11 training loss is : 0.01096
batch 11 training accuracy is : 1.00000
batch 12 training loss is : 0.05230
batch 12 training accuracy is : 0.93750
batch 13 training loss is : 0.05328
batch 13 training accuracy is : 0.93750
batch 14 training loss is : 0.21536
batch 14 training accuracy is : 0.81250
batch 15 training loss is : 0.27223
batch 15 training accuracy is : 0.87500
batch 16 training loss is 

batch 111 training loss is : 0.18323
batch 111 training accuracy is : 0.93750
batch 112 training loss is : 0.00448
batch 112 training accuracy is : 1.00000
Average training loss is 0.09951 at the end of epoch 100
Average training accuracy is 0.95277 at the end of epoch 100
batch 0 dev loss is : 0.71209
batch 0 dev accuracy is : 0.81250
batch 1 dev loss is : 0.48157
batch 1 dev accuracy is : 0.87500
batch 2 dev loss is : 0.72269
batch 2 dev accuracy is : 0.87500
batch 3 dev loss is : 0.51894
batch 3 dev accuracy is : 0.87500
batch 4 dev loss is : 0.55905
batch 4 dev accuracy is : 0.75000
batch 5 dev loss is : 0.11225
batch 5 dev accuracy is : 0.87500
batch 6 dev loss is : 0.31074
batch 6 dev accuracy is : 0.81250
batch 7 dev loss is : 1.66161
batch 7 dev accuracy is : 0.81250
batch 8 dev loss is : 1.99506
batch 8 dev accuracy is : 0.62500
batch 9 dev loss is : 0.31523
batch 9 dev accuracy is : 0.87500
batch 10 dev loss is : 1.47804
batch 10 dev accuracy is : 0.62500
batch 11 dev loss is

batch 82 training loss is : 0.22171
batch 82 training accuracy is : 0.93750
batch 83 training loss is : 0.21680
batch 83 training accuracy is : 0.87500
batch 84 training loss is : 0.02794
batch 84 training accuracy is : 1.00000
batch 85 training loss is : 0.00788
batch 85 training accuracy is : 1.00000
batch 86 training loss is : 0.05633
batch 86 training accuracy is : 1.00000
batch 87 training loss is : 0.00010
batch 87 training accuracy is : 1.00000
batch 88 training loss is : 0.14620
batch 88 training accuracy is : 0.87500
batch 89 training loss is : 0.00091
batch 89 training accuracy is : 1.00000
batch 90 training loss is : 0.08528
batch 90 training accuracy is : 1.00000
batch 91 training loss is : 0.12126
batch 91 training accuracy is : 0.93750
batch 92 training loss is : 0.19941
batch 92 training accuracy is : 0.87500
batch 93 training loss is : 0.07557
batch 93 training accuracy is : 1.00000
batch 94 training loss is : 0.00005
batch 94 training accuracy is : 1.00000
batch 95 tra

batch 50 training loss is : 0.02692
batch 50 training accuracy is : 1.00000
batch 51 training loss is : 0.07061
batch 51 training accuracy is : 0.93750
batch 52 training loss is : 0.01291
batch 52 training accuracy is : 1.00000
batch 53 training loss is : 0.01607
batch 53 training accuracy is : 1.00000
batch 54 training loss is : 0.17037
batch 54 training accuracy is : 0.87500
batch 55 training loss is : 0.01137
batch 55 training accuracy is : 1.00000
batch 56 training loss is : 0.05110
batch 56 training accuracy is : 0.93750
batch 57 training loss is : 0.03194
batch 57 training accuracy is : 1.00000
batch 58 training loss is : 0.41989
batch 58 training accuracy is : 0.87500
batch 59 training loss is : 0.16698
batch 59 training accuracy is : 0.87500
batch 60 training loss is : 0.06849
batch 60 training accuracy is : 0.93750
batch 61 training loss is : 0.01577
batch 61 training accuracy is : 1.00000
batch 62 training loss is : 0.00985
batch 62 training accuracy is : 1.00000
batch 63 tra

batch 19 training loss is : 0.06677
batch 19 training accuracy is : 1.00000
batch 20 training loss is : 0.41628
batch 20 training accuracy is : 0.81250
batch 21 training loss is : 0.30001
batch 21 training accuracy is : 0.93750
batch 22 training loss is : 0.00008
batch 22 training accuracy is : 1.00000
batch 23 training loss is : 0.00075
batch 23 training accuracy is : 1.00000
batch 24 training loss is : 0.05098
batch 24 training accuracy is : 0.93750
batch 25 training loss is : 0.07117
batch 25 training accuracy is : 0.93750
batch 26 training loss is : 0.13706
batch 26 training accuracy is : 0.87500
batch 27 training loss is : 0.02065
batch 27 training accuracy is : 1.00000
batch 28 training loss is : 0.00129
batch 28 training accuracy is : 1.00000
batch 29 training loss is : 0.01431
batch 29 training accuracy is : 1.00000
batch 30 training loss is : 0.24138
batch 30 training accuracy is : 0.87500
batch 31 training loss is : 0.17958
batch 31 training accuracy is : 0.87500
batch 32 tra

batch 15 dev loss is : 0.70016
batch 15 dev accuracy is : 0.87500
batch 16 dev loss is : 0.93441
batch 16 dev accuracy is : 0.81250
batch 17 dev loss is : 2.47936
batch 17 dev accuracy is : 0.56250
batch 18 dev loss is : 1.98442
batch 18 dev accuracy is : 0.75000
batch 19 dev loss is : 2.05297
batch 19 dev accuracy is : 0.81250
batch 20 dev loss is : 1.48788
batch 20 dev accuracy is : 0.75000
batch 21 dev loss is : 2.00640
batch 21 dev accuracy is : 0.81250
batch 22 dev loss is : 1.35424
batch 22 dev accuracy is : 0.81250
batch 23 dev loss is : 0.37910
batch 23 dev accuracy is : 0.81250
batch 24 dev loss is : 0.44702
batch 24 dev accuracy is : 0.87500
batch 25 dev loss is : 1.06576
batch 25 dev accuracy is : 0.68750
batch 26 dev loss is : 1.60093
batch 26 dev accuracy is : 0.68750
batch 27 dev loss is : 1.32474
batch 27 dev accuracy is : 0.75000
Average validation loss is 1.16620 at the end of epoch 103
Average validation accuracy is 0.73810 at the end of epoch 103
At 104-th epoch.
bat

batch 95 training loss is : 0.18648
batch 95 training accuracy is : 0.93750
batch 96 training loss is : 0.03494
batch 96 training accuracy is : 1.00000
batch 97 training loss is : 0.02371
batch 97 training accuracy is : 1.00000
batch 98 training loss is : 0.00395
batch 98 training accuracy is : 1.00000
batch 99 training loss is : 0.00862
batch 99 training accuracy is : 1.00000
batch 100 training loss is : 0.07343
batch 100 training accuracy is : 0.93750
batch 101 training loss is : 0.03274
batch 101 training accuracy is : 1.00000
batch 102 training loss is : 0.00391
batch 102 training accuracy is : 1.00000
batch 103 training loss is : 0.01369
batch 103 training accuracy is : 1.00000
batch 104 training loss is : 0.04513
batch 104 training accuracy is : 1.00000
batch 105 training loss is : 0.02763
batch 105 training accuracy is : 1.00000
batch 106 training loss is : 0.07289
batch 106 training accuracy is : 1.00000
batch 107 training loss is : 0.05300
batch 107 training accuracy is : 0.93

batch 64 training loss is : 0.03157
batch 64 training accuracy is : 1.00000
batch 65 training loss is : 0.19668
batch 65 training accuracy is : 0.87500
batch 66 training loss is : 0.20575
batch 66 training accuracy is : 0.87500
batch 67 training loss is : 0.02458
batch 67 training accuracy is : 1.00000
batch 68 training loss is : 0.91117
batch 68 training accuracy is : 0.93750
batch 69 training loss is : 0.02616
batch 69 training accuracy is : 1.00000
batch 70 training loss is : 0.05859
batch 70 training accuracy is : 0.93750
batch 71 training loss is : 0.00001
batch 71 training accuracy is : 1.00000
batch 72 training loss is : 0.00018
batch 72 training accuracy is : 1.00000
batch 73 training loss is : 0.15019
batch 73 training accuracy is : 0.93750
batch 74 training loss is : 0.00009
batch 74 training accuracy is : 1.00000
batch 75 training loss is : 0.15762
batch 75 training accuracy is : 0.93750
batch 76 training loss is : 0.00002
batch 76 training accuracy is : 1.00000
batch 77 tra

batch 34 training loss is : 0.02610
batch 34 training accuracy is : 1.00000
batch 35 training loss is : 0.01248
batch 35 training accuracy is : 1.00000
batch 36 training loss is : 0.06302
batch 36 training accuracy is : 0.93750
batch 37 training loss is : 0.01656
batch 37 training accuracy is : 1.00000
batch 38 training loss is : 0.09753
batch 38 training accuracy is : 0.93750
batch 39 training loss is : 0.00280
batch 39 training accuracy is : 1.00000
batch 40 training loss is : 0.00731
batch 40 training accuracy is : 1.00000
batch 41 training loss is : 0.03496
batch 41 training accuracy is : 1.00000
batch 42 training loss is : 0.00056
batch 42 training accuracy is : 1.00000
batch 43 training loss is : 0.00515
batch 43 training accuracy is : 1.00000
batch 44 training loss is : 0.37695
batch 44 training accuracy is : 0.93750
batch 45 training loss is : 0.18794
batch 45 training accuracy is : 0.93750
batch 46 training loss is : 0.07091
batch 46 training accuracy is : 0.93750
batch 47 tra

batch 5 training loss is : 0.30075
batch 5 training accuracy is : 0.81250
batch 6 training loss is : 0.03700
batch 6 training accuracy is : 1.00000
batch 7 training loss is : 0.08216
batch 7 training accuracy is : 0.93750
batch 8 training loss is : 0.10592
batch 8 training accuracy is : 0.93750
batch 9 training loss is : 0.02669
batch 9 training accuracy is : 1.00000
batch 10 training loss is : 0.04954
batch 10 training accuracy is : 1.00000
batch 11 training loss is : 0.01692
batch 11 training accuracy is : 1.00000
batch 12 training loss is : 0.35238
batch 12 training accuracy is : 0.87500
batch 13 training loss is : 0.09859
batch 13 training accuracy is : 0.93750
batch 14 training loss is : 0.00024
batch 14 training accuracy is : 1.00000
batch 15 training loss is : 0.11909
batch 15 training accuracy is : 0.93750
batch 16 training loss is : 0.24475
batch 16 training accuracy is : 0.81250
batch 17 training loss is : 0.17058
batch 17 training accuracy is : 0.87500
batch 18 training loss

Average training loss is 0.07948 at the end of epoch 107
Average training accuracy is 0.95991 at the end of epoch 107
batch 0 dev loss is : 0.81330
batch 0 dev accuracy is : 0.75000
batch 1 dev loss is : 0.45540
batch 1 dev accuracy is : 0.87500
batch 2 dev loss is : 0.64912
batch 2 dev accuracy is : 0.87500
batch 3 dev loss is : 0.81740
batch 3 dev accuracy is : 0.81250
batch 4 dev loss is : 0.73776
batch 4 dev accuracy is : 0.81250
batch 5 dev loss is : 0.35100
batch 5 dev accuracy is : 0.87500
batch 6 dev loss is : 0.52856
batch 6 dev accuracy is : 0.68750
batch 7 dev loss is : 1.88305
batch 7 dev accuracy is : 0.81250
batch 8 dev loss is : 1.74285
batch 8 dev accuracy is : 0.68750
batch 9 dev loss is : 0.47690
batch 9 dev accuracy is : 0.81250
batch 10 dev loss is : 1.63206
batch 10 dev accuracy is : 0.56250
batch 11 dev loss is : 1.08786
batch 11 dev accuracy is : 0.62500
batch 12 dev loss is : 1.10984
batch 12 dev accuracy is : 0.75000
batch 13 dev loss is : 1.80021
batch 13 dev 

batch 81 training loss is : 0.06453
batch 81 training accuracy is : 0.93750
batch 82 training loss is : 0.03129
batch 82 training accuracy is : 1.00000
batch 83 training loss is : 0.00754
batch 83 training accuracy is : 1.00000
batch 84 training loss is : 0.16318
batch 84 training accuracy is : 0.87500
batch 85 training loss is : 0.20754
batch 85 training accuracy is : 0.87500
batch 86 training loss is : 0.16396
batch 86 training accuracy is : 0.93750
batch 87 training loss is : 0.14300
batch 87 training accuracy is : 0.93750
batch 88 training loss is : 0.00629
batch 88 training accuracy is : 1.00000
batch 89 training loss is : 0.28108
batch 89 training accuracy is : 0.87500
batch 90 training loss is : 0.01830
batch 90 training accuracy is : 1.00000
batch 91 training loss is : 0.00038
batch 91 training accuracy is : 1.00000
batch 92 training loss is : 0.04904
batch 92 training accuracy is : 1.00000
batch 93 training loss is : 0.37569
batch 93 training accuracy is : 0.87500
batch 94 tra

batch 52 training loss is : 0.08052
batch 52 training accuracy is : 0.93750
batch 53 training loss is : 0.00142
batch 53 training accuracy is : 1.00000
batch 54 training loss is : 0.22424
batch 54 training accuracy is : 0.87500
batch 55 training loss is : 0.08947
batch 55 training accuracy is : 0.93750
batch 56 training loss is : 0.08791
batch 56 training accuracy is : 0.93750
batch 57 training loss is : 0.31887
batch 57 training accuracy is : 0.93750
batch 58 training loss is : 0.06102
batch 58 training accuracy is : 0.93750
batch 59 training loss is : 0.06186
batch 59 training accuracy is : 1.00000
batch 60 training loss is : 0.10665
batch 60 training accuracy is : 0.93750
batch 61 training loss is : 0.16822
batch 61 training accuracy is : 0.93750
batch 62 training loss is : 0.01916
batch 62 training accuracy is : 1.00000
batch 63 training loss is : 0.06639
batch 63 training accuracy is : 0.93750
batch 64 training loss is : 0.00001
batch 64 training accuracy is : 1.00000
batch 65 tra

batch 21 training loss is : 0.15452
batch 21 training accuracy is : 0.93750
batch 22 training loss is : 0.04899
batch 22 training accuracy is : 1.00000
batch 23 training loss is : 0.04439
batch 23 training accuracy is : 1.00000
batch 24 training loss is : 0.00287
batch 24 training accuracy is : 1.00000
batch 25 training loss is : 0.00007
batch 25 training accuracy is : 1.00000
batch 26 training loss is : 0.01126
batch 26 training accuracy is : 1.00000
batch 27 training loss is : 0.00107
batch 27 training accuracy is : 1.00000
batch 28 training loss is : 0.01535
batch 28 training accuracy is : 1.00000
batch 29 training loss is : 0.01228
batch 29 training accuracy is : 1.00000
batch 30 training loss is : 0.00565
batch 30 training accuracy is : 1.00000
batch 31 training loss is : 0.06844
batch 31 training accuracy is : 0.93750
batch 32 training loss is : 0.01074
batch 32 training accuracy is : 1.00000
batch 33 training loss is : 0.04284
batch 33 training accuracy is : 1.00000
batch 34 tra

batch 19 dev loss is : 2.46372
batch 19 dev accuracy is : 0.75000
batch 20 dev loss is : 1.67093
batch 20 dev accuracy is : 0.75000
batch 21 dev loss is : 1.79670
batch 21 dev accuracy is : 0.81250
batch 22 dev loss is : 1.50871
batch 22 dev accuracy is : 0.81250
batch 23 dev loss is : 0.46169
batch 23 dev accuracy is : 0.81250
batch 24 dev loss is : 0.59854
batch 24 dev accuracy is : 0.87500
batch 25 dev loss is : 0.88949
batch 25 dev accuracy is : 0.75000
batch 26 dev loss is : 1.14567
batch 26 dev accuracy is : 0.75000
batch 27 dev loss is : 1.36449
batch 27 dev accuracy is : 0.81250
Average validation loss is 1.20843 at the end of epoch 110
Average validation accuracy is 0.73593 at the end of epoch 110
At 111-th epoch.
batch 0 training loss is : 0.00259
batch 0 training accuracy is : 1.00000
batch 1 training loss is : 0.02426
batch 1 training accuracy is : 1.00000
batch 2 training loss is : 0.07832
batch 2 training accuracy is : 0.93750
batch 3 training loss is : 0.09577
batch 3 tr

batch 99 training loss is : 0.18470
batch 99 training accuracy is : 0.87500
batch 100 training loss is : 0.00097
batch 100 training accuracy is : 1.00000
batch 101 training loss is : 0.00325
batch 101 training accuracy is : 1.00000
batch 102 training loss is : 0.10232
batch 102 training accuracy is : 0.93750
batch 103 training loss is : 0.04611
batch 103 training accuracy is : 1.00000
batch 104 training loss is : 0.32915
batch 104 training accuracy is : 0.87500
batch 105 training loss is : 0.32010
batch 105 training accuracy is : 0.93750
batch 106 training loss is : 0.00193
batch 106 training accuracy is : 1.00000
batch 107 training loss is : 0.02283
batch 107 training accuracy is : 1.00000
batch 108 training loss is : 0.03969
batch 108 training accuracy is : 1.00000
batch 109 training loss is : 0.00049
batch 109 training accuracy is : 1.00000
batch 110 training loss is : 0.04512
batch 110 training accuracy is : 1.00000
batch 111 training loss is : 0.27712
batch 111 training accuracy i

batch 68 training loss is : 0.11532
batch 68 training accuracy is : 0.93750
batch 69 training loss is : 0.07178
batch 69 training accuracy is : 1.00000
batch 70 training loss is : 0.01774
batch 70 training accuracy is : 1.00000
batch 71 training loss is : 0.18108
batch 71 training accuracy is : 0.87500
batch 72 training loss is : 0.16598
batch 72 training accuracy is : 0.87500
batch 73 training loss is : 0.02228
batch 73 training accuracy is : 1.00000
batch 74 training loss is : 0.12766
batch 74 training accuracy is : 0.93750
batch 75 training loss is : 0.06786
batch 75 training accuracy is : 0.93750
batch 76 training loss is : 0.40991
batch 76 training accuracy is : 0.93750
batch 77 training loss is : 0.05127
batch 77 training accuracy is : 1.00000
batch 78 training loss is : 0.00145
batch 78 training accuracy is : 1.00000
batch 79 training loss is : 0.00974
batch 79 training accuracy is : 1.00000
batch 80 training loss is : 0.39263
batch 80 training accuracy is : 0.87500
batch 81 tra

batch 39 training loss is : 0.00001
batch 39 training accuracy is : 1.00000
batch 40 training loss is : 0.12705
batch 40 training accuracy is : 0.93750
batch 41 training loss is : 0.00512
batch 41 training accuracy is : 1.00000
batch 42 training loss is : 0.09112
batch 42 training accuracy is : 0.93750
batch 43 training loss is : 0.01377
batch 43 training accuracy is : 1.00000
batch 44 training loss is : 0.00141
batch 44 training accuracy is : 1.00000
batch 45 training loss is : 0.18149
batch 45 training accuracy is : 0.93750
batch 46 training loss is : 0.01363
batch 46 training accuracy is : 1.00000
batch 47 training loss is : 0.01819
batch 47 training accuracy is : 1.00000
batch 48 training loss is : 0.01143
batch 48 training accuracy is : 1.00000
batch 49 training loss is : 0.06226
batch 49 training accuracy is : 0.93750
batch 50 training loss is : 0.08283
batch 50 training accuracy is : 1.00000
batch 51 training loss is : 0.03633
batch 51 training accuracy is : 1.00000
batch 52 tra

batch 9 training loss is : 0.07029
batch 9 training accuracy is : 0.93750
batch 10 training loss is : 0.07600
batch 10 training accuracy is : 0.93750
batch 11 training loss is : 0.00565
batch 11 training accuracy is : 1.00000
batch 12 training loss is : 0.00160
batch 12 training accuracy is : 1.00000
batch 13 training loss is : 0.00361
batch 13 training accuracy is : 1.00000
batch 14 training loss is : 0.08489
batch 14 training accuracy is : 1.00000
batch 15 training loss is : 0.50569
batch 15 training accuracy is : 0.81250
batch 16 training loss is : 0.00013
batch 16 training accuracy is : 1.00000
batch 17 training loss is : 0.00080
batch 17 training accuracy is : 1.00000
batch 18 training loss is : 0.11445
batch 18 training accuracy is : 0.93750
batch 19 training loss is : 0.06955
batch 19 training accuracy is : 0.93750
batch 20 training loss is : 0.16263
batch 20 training accuracy is : 0.87500
batch 21 training loss is : 0.10306
batch 21 training accuracy is : 0.93750
batch 22 train

batch 4 dev loss is : 0.70894
batch 4 dev accuracy is : 0.81250
batch 5 dev loss is : 0.22147
batch 5 dev accuracy is : 0.87500
batch 6 dev loss is : 0.36631
batch 6 dev accuracy is : 0.81250
batch 7 dev loss is : 1.80067
batch 7 dev accuracy is : 0.81250
batch 8 dev loss is : 1.81556
batch 8 dev accuracy is : 0.68750
batch 9 dev loss is : 0.56233
batch 9 dev accuracy is : 0.81250
batch 10 dev loss is : 2.00877
batch 10 dev accuracy is : 0.68750
batch 11 dev loss is : 1.02574
batch 11 dev accuracy is : 0.81250
batch 12 dev loss is : 0.84203
batch 12 dev accuracy is : 0.81250
batch 13 dev loss is : 1.69309
batch 13 dev accuracy is : 0.68750
batch 14 dev loss is : 0.56794
batch 14 dev accuracy is : 0.81250
batch 15 dev loss is : 0.57125
batch 15 dev accuracy is : 0.93750
batch 16 dev loss is : 0.98420
batch 16 dev accuracy is : 0.75000
batch 17 dev loss is : 2.18455
batch 17 dev accuracy is : 0.56250
batch 18 dev loss is : 2.09443
batch 18 dev accuracy is : 0.62500
batch 19 dev loss is :

batch 86 training loss is : 0.29444
batch 86 training accuracy is : 0.81250
batch 87 training loss is : 0.00385
batch 87 training accuracy is : 1.00000
batch 88 training loss is : 0.26964
batch 88 training accuracy is : 0.87500
batch 89 training loss is : 0.11113
batch 89 training accuracy is : 0.93750
batch 90 training loss is : 0.00164
batch 90 training accuracy is : 1.00000
batch 91 training loss is : 0.11405
batch 91 training accuracy is : 0.93750
batch 92 training loss is : 0.16384
batch 92 training accuracy is : 0.93750
batch 93 training loss is : 0.12046
batch 93 training accuracy is : 0.93750
batch 94 training loss is : 0.08955
batch 94 training accuracy is : 1.00000
batch 95 training loss is : 0.00421
batch 95 training accuracy is : 1.00000
batch 96 training loss is : 0.20914
batch 96 training accuracy is : 0.93750
batch 97 training loss is : 0.01482
batch 97 training accuracy is : 1.00000
batch 98 training loss is : 0.00892
batch 98 training accuracy is : 1.00000
batch 99 tra

batch 54 training loss is : 0.00021
batch 54 training accuracy is : 1.00000
batch 55 training loss is : 0.00624
batch 55 training accuracy is : 1.00000
batch 56 training loss is : 0.01274
batch 56 training accuracy is : 1.00000
batch 57 training loss is : 0.10432
batch 57 training accuracy is : 0.93750
batch 58 training loss is : 0.00933
batch 58 training accuracy is : 1.00000
batch 59 training loss is : 0.00001
batch 59 training accuracy is : 1.00000
batch 60 training loss is : 0.00236
batch 60 training accuracy is : 1.00000
batch 61 training loss is : 0.00518
batch 61 training accuracy is : 1.00000
batch 62 training loss is : 0.01332
batch 62 training accuracy is : 1.00000
batch 63 training loss is : 0.03836
batch 63 training accuracy is : 1.00000
batch 64 training loss is : 0.00101
batch 64 training accuracy is : 1.00000
batch 65 training loss is : 0.03462
batch 65 training accuracy is : 1.00000
batch 66 training loss is : 0.03821
batch 66 training accuracy is : 1.00000
batch 67 tra

batch 24 training loss is : 0.01833
batch 24 training accuracy is : 1.00000
batch 25 training loss is : 0.06987
batch 25 training accuracy is : 0.93750
batch 26 training loss is : 0.01671
batch 26 training accuracy is : 1.00000
batch 27 training loss is : 0.00517
batch 27 training accuracy is : 1.00000
batch 28 training loss is : 0.10689
batch 28 training accuracy is : 0.93750
batch 29 training loss is : 0.02074
batch 29 training accuracy is : 1.00000
batch 30 training loss is : 0.00383
batch 30 training accuracy is : 1.00000
batch 31 training loss is : 0.04927
batch 31 training accuracy is : 1.00000
batch 32 training loss is : 0.08749
batch 32 training accuracy is : 0.93750
batch 33 training loss is : 0.17081
batch 33 training accuracy is : 0.93750
batch 34 training loss is : 0.11090
batch 34 training accuracy is : 0.93750
batch 35 training loss is : 0.00106
batch 35 training accuracy is : 1.00000
batch 36 training loss is : 0.01942
batch 36 training accuracy is : 1.00000
batch 37 tra

batch 21 dev loss is : 1.88871
batch 21 dev accuracy is : 0.81250
batch 22 dev loss is : 1.11427
batch 22 dev accuracy is : 0.81250
batch 23 dev loss is : 0.25523
batch 23 dev accuracy is : 0.93750
batch 24 dev loss is : 0.51611
batch 24 dev accuracy is : 0.81250
batch 25 dev loss is : 0.96571
batch 25 dev accuracy is : 0.68750
batch 26 dev loss is : 1.84169
batch 26 dev accuracy is : 0.68750
batch 27 dev loss is : 1.48229
batch 27 dev accuracy is : 0.68750
Average validation loss is 1.10081 at the end of epoch 117
Average validation accuracy is 0.77056 at the end of epoch 117
At 118-th epoch.
batch 0 training loss is : 0.07604
batch 0 training accuracy is : 1.00000
batch 1 training loss is : 0.04043
batch 1 training accuracy is : 1.00000
batch 2 training loss is : 0.02530
batch 2 training accuracy is : 1.00000
batch 3 training loss is : 0.00969
batch 3 training accuracy is : 1.00000
batch 4 training loss is : 0.05599
batch 4 training accuracy is : 1.00000
batch 5 training loss is : 0.

batch 101 training loss is : 0.02584
batch 101 training accuracy is : 1.00000
batch 102 training loss is : 0.00300
batch 102 training accuracy is : 1.00000
batch 103 training loss is : 0.02932
batch 103 training accuracy is : 1.00000
batch 104 training loss is : 0.21453
batch 104 training accuracy is : 0.87500
batch 105 training loss is : 0.02291
batch 105 training accuracy is : 1.00000
batch 106 training loss is : 0.07466
batch 106 training accuracy is : 0.93750
batch 107 training loss is : 0.00712
batch 107 training accuracy is : 1.00000
batch 108 training loss is : 0.03786
batch 108 training accuracy is : 1.00000
batch 109 training loss is : 0.00050
batch 109 training accuracy is : 1.00000
batch 110 training loss is : 0.01531
batch 110 training accuracy is : 1.00000
batch 111 training loss is : 0.03143
batch 111 training accuracy is : 1.00000
batch 112 training loss is : 0.02072
batch 112 training accuracy is : 1.00000
Average training loss is 0.05796 at the end of epoch 118
Average

batch 69 training loss is : 0.02826
batch 69 training accuracy is : 1.00000
batch 70 training loss is : 0.15581
batch 70 training accuracy is : 0.93750
batch 71 training loss is : 0.03869
batch 71 training accuracy is : 1.00000
batch 72 training loss is : 0.05923
batch 72 training accuracy is : 0.93750
batch 73 training loss is : 0.01934
batch 73 training accuracy is : 1.00000
batch 74 training loss is : 0.09821
batch 74 training accuracy is : 0.93750
batch 75 training loss is : 0.01351
batch 75 training accuracy is : 1.00000
batch 76 training loss is : 0.08912
batch 76 training accuracy is : 0.93750
batch 77 training loss is : 0.08007
batch 77 training accuracy is : 0.93750
batch 78 training loss is : 0.01646
batch 78 training accuracy is : 1.00000
batch 79 training loss is : 0.12172
batch 79 training accuracy is : 0.93750
batch 80 training loss is : 0.06805
batch 80 training accuracy is : 0.93750
batch 81 training loss is : 0.01094
batch 81 training accuracy is : 1.00000
batch 82 tra

batch 39 training loss is : 0.00319
batch 39 training accuracy is : 1.00000
batch 40 training loss is : 0.34481
batch 40 training accuracy is : 0.93750
batch 41 training loss is : 0.00653
batch 41 training accuracy is : 1.00000
batch 42 training loss is : 0.31570
batch 42 training accuracy is : 0.87500
batch 43 training loss is : 0.09593
batch 43 training accuracy is : 1.00000
batch 44 training loss is : 0.22251
batch 44 training accuracy is : 0.93750
batch 45 training loss is : 0.61255
batch 45 training accuracy is : 0.87500
batch 46 training loss is : 0.00504
batch 46 training accuracy is : 1.00000
batch 47 training loss is : 0.04784
batch 47 training accuracy is : 1.00000
batch 48 training loss is : 0.01450
batch 48 training accuracy is : 1.00000
batch 49 training loss is : 0.12704
batch 49 training accuracy is : 0.93750
batch 50 training loss is : 0.00505
batch 50 training accuracy is : 1.00000
batch 51 training loss is : 0.02250
batch 51 training accuracy is : 1.00000
batch 52 tra

batch 7 training loss is : 0.08509
batch 7 training accuracy is : 0.93750
batch 8 training loss is : 0.05201
batch 8 training accuracy is : 0.93750
batch 9 training loss is : 0.11226
batch 9 training accuracy is : 0.93750
batch 10 training loss is : 0.01105
batch 10 training accuracy is : 1.00000
batch 11 training loss is : 0.13553
batch 11 training accuracy is : 0.93750
batch 12 training loss is : 0.02113
batch 12 training accuracy is : 1.00000
batch 13 training loss is : 0.02623
batch 13 training accuracy is : 1.00000
batch 14 training loss is : 0.29901
batch 14 training accuracy is : 0.87500
batch 15 training loss is : 0.01072
batch 15 training accuracy is : 1.00000
batch 16 training loss is : 0.02417
batch 16 training accuracy is : 1.00000
batch 17 training loss is : 0.04773
batch 17 training accuracy is : 1.00000
batch 18 training loss is : 0.00145
batch 18 training accuracy is : 1.00000
batch 19 training loss is : 0.02184
batch 19 training accuracy is : 1.00000
batch 20 training 

batch 0 dev loss is : 0.93853
batch 0 dev accuracy is : 0.81250
batch 1 dev loss is : 0.38669
batch 1 dev accuracy is : 0.93750
batch 2 dev loss is : 0.40002
batch 2 dev accuracy is : 0.93750
batch 3 dev loss is : 0.44539
batch 3 dev accuracy is : 0.87500
batch 4 dev loss is : 0.67583
batch 4 dev accuracy is : 0.81250
batch 5 dev loss is : 0.13535
batch 5 dev accuracy is : 0.93750
batch 6 dev loss is : 0.13927
batch 6 dev accuracy is : 0.93750
batch 7 dev loss is : 1.92655
batch 7 dev accuracy is : 0.81250
batch 8 dev loss is : 1.90197
batch 8 dev accuracy is : 0.68750
batch 9 dev loss is : 0.36615
batch 9 dev accuracy is : 0.87500
batch 10 dev loss is : 1.59739
batch 10 dev accuracy is : 0.75000
batch 11 dev loss is : 1.68904
batch 11 dev accuracy is : 0.68750
batch 12 dev loss is : 1.05555
batch 12 dev accuracy is : 0.75000
batch 13 dev loss is : 1.91984
batch 13 dev accuracy is : 0.75000
batch 14 dev loss is : 0.98963
batch 14 dev accuracy is : 0.81250
batch 15 dev loss is : 0.53618

batch 83 training loss is : 0.05400
batch 83 training accuracy is : 0.93750
batch 84 training loss is : 0.60606
batch 84 training accuracy is : 0.81250
batch 85 training loss is : 0.00252
batch 85 training accuracy is : 1.00000
batch 86 training loss is : 0.02081
batch 86 training accuracy is : 1.00000
batch 87 training loss is : 0.00452
batch 87 training accuracy is : 1.00000
batch 88 training loss is : 0.12807
batch 88 training accuracy is : 0.93750
batch 89 training loss is : 0.06256
batch 89 training accuracy is : 0.93750
batch 90 training loss is : 0.05507
batch 90 training accuracy is : 1.00000
batch 91 training loss is : 0.00169
batch 91 training accuracy is : 1.00000
batch 92 training loss is : 0.03897
batch 92 training accuracy is : 1.00000
batch 93 training loss is : 0.01569
batch 93 training accuracy is : 1.00000
batch 94 training loss is : 0.02944
batch 94 training accuracy is : 1.00000
batch 95 training loss is : 0.00776
batch 95 training accuracy is : 1.00000
batch 96 tra

batch 51 training loss is : 0.05327
batch 51 training accuracy is : 0.93750
batch 52 training loss is : 0.15598
batch 52 training accuracy is : 0.93750
batch 53 training loss is : 0.02991
batch 53 training accuracy is : 1.00000
batch 54 training loss is : 0.01201
batch 54 training accuracy is : 1.00000
batch 55 training loss is : 0.20979
batch 55 training accuracy is : 0.87500
batch 56 training loss is : 0.03442
batch 56 training accuracy is : 1.00000
batch 57 training loss is : 0.15888
batch 57 training accuracy is : 0.87500
batch 58 training loss is : 0.13097
batch 58 training accuracy is : 0.93750
batch 59 training loss is : 0.03050
batch 59 training accuracy is : 1.00000
batch 60 training loss is : 0.00703
batch 60 training accuracy is : 1.00000
batch 61 training loss is : 0.00042
batch 61 training accuracy is : 1.00000
batch 62 training loss is : 0.07708
batch 62 training accuracy is : 0.93750
batch 63 training loss is : 0.41981
batch 63 training accuracy is : 0.81250
batch 64 tra

batch 19 training loss is : 0.06931
batch 19 training accuracy is : 1.00000
batch 20 training loss is : 0.11042
batch 20 training accuracy is : 0.93750
batch 21 training loss is : 0.06816
batch 21 training accuracy is : 1.00000
batch 22 training loss is : 0.16630
batch 22 training accuracy is : 0.87500
batch 23 training loss is : 0.00320
batch 23 training accuracy is : 1.00000
batch 24 training loss is : 0.02801
batch 24 training accuracy is : 1.00000
batch 25 training loss is : 0.06042
batch 25 training accuracy is : 1.00000
batch 26 training loss is : 0.06329
batch 26 training accuracy is : 1.00000
batch 27 training loss is : 0.01078
batch 27 training accuracy is : 1.00000
batch 28 training loss is : 0.11324
batch 28 training accuracy is : 0.93750
batch 29 training loss is : 0.03735
batch 29 training accuracy is : 1.00000
batch 30 training loss is : 0.05811
batch 30 training accuracy is : 0.93750
batch 31 training loss is : 0.09421
batch 31 training accuracy is : 0.93750
batch 32 tra

batch 15 dev loss is : 0.71547
batch 15 dev accuracy is : 0.87500
batch 16 dev loss is : 1.09361
batch 16 dev accuracy is : 0.75000
batch 17 dev loss is : 2.43241
batch 17 dev accuracy is : 0.62500
batch 18 dev loss is : 1.75384
batch 18 dev accuracy is : 0.68750
batch 19 dev loss is : 2.91811
batch 19 dev accuracy is : 0.87500
batch 20 dev loss is : 2.01405
batch 20 dev accuracy is : 0.68750
batch 21 dev loss is : 2.72700
batch 21 dev accuracy is : 0.68750
batch 22 dev loss is : 1.18933
batch 22 dev accuracy is : 0.81250
batch 23 dev loss is : 0.43062
batch 23 dev accuracy is : 0.93750
batch 24 dev loss is : 0.49155
batch 24 dev accuracy is : 0.81250
batch 25 dev loss is : 1.96882
batch 25 dev accuracy is : 0.62500
batch 26 dev loss is : 2.41727
batch 26 dev accuracy is : 0.62500
batch 27 dev loss is : 2.02167
batch 27 dev accuracy is : 0.62500
Average validation loss is 1.37780 at the end of epoch 124
Average validation accuracy is 0.74892 at the end of epoch 124
At 125-th epoch.
bat

batch 97 training loss is : 0.10437
batch 97 training accuracy is : 0.93750
batch 98 training loss is : 0.46276
batch 98 training accuracy is : 0.93750
batch 99 training loss is : 0.00537
batch 99 training accuracy is : 1.00000
batch 100 training loss is : 0.03542
batch 100 training accuracy is : 1.00000
batch 101 training loss is : 0.04456
batch 101 training accuracy is : 1.00000
batch 102 training loss is : 0.00734
batch 102 training accuracy is : 1.00000
batch 103 training loss is : 0.17148
batch 103 training accuracy is : 0.93750
batch 104 training loss is : 0.01265
batch 104 training accuracy is : 1.00000
batch 105 training loss is : 0.23937
batch 105 training accuracy is : 0.93750
batch 106 training loss is : 0.00146
batch 106 training accuracy is : 1.00000
batch 107 training loss is : 0.13304
batch 107 training accuracy is : 0.93750
batch 108 training loss is : 0.06306
batch 108 training accuracy is : 0.93750
batch 109 training loss is : 0.02475
batch 109 training accuracy is : 

batch 66 training loss is : 0.01471
batch 66 training accuracy is : 1.00000
batch 67 training loss is : 0.03395
batch 67 training accuracy is : 1.00000
batch 68 training loss is : 0.02401
batch 68 training accuracy is : 1.00000
batch 69 training loss is : 0.02461
batch 69 training accuracy is : 1.00000
batch 70 training loss is : 0.20669
batch 70 training accuracy is : 0.93750
batch 71 training loss is : 0.29954
batch 71 training accuracy is : 0.93750
batch 72 training loss is : 0.05391
batch 72 training accuracy is : 1.00000
batch 73 training loss is : 0.32050
batch 73 training accuracy is : 0.87500
batch 74 training loss is : 0.00640
batch 74 training accuracy is : 1.00000
batch 75 training loss is : 0.07396
batch 75 training accuracy is : 1.00000
batch 76 training loss is : 0.07581
batch 76 training accuracy is : 0.93750
batch 77 training loss is : 0.16051
batch 77 training accuracy is : 0.93750
batch 78 training loss is : 0.04754
batch 78 training accuracy is : 1.00000
batch 79 tra

batch 37 training loss is : 0.00532
batch 37 training accuracy is : 1.00000
batch 38 training loss is : 0.39026
batch 38 training accuracy is : 0.87500
batch 39 training loss is : 0.01435
batch 39 training accuracy is : 1.00000
batch 40 training loss is : 0.00002
batch 40 training accuracy is : 1.00000
batch 41 training loss is : 0.05047
batch 41 training accuracy is : 0.93750
batch 42 training loss is : 0.24133
batch 42 training accuracy is : 0.93750
batch 43 training loss is : 0.04532
batch 43 training accuracy is : 1.00000
batch 44 training loss is : 0.01144
batch 44 training accuracy is : 1.00000
batch 45 training loss is : 0.02942
batch 45 training accuracy is : 1.00000
batch 46 training loss is : 0.08106
batch 46 training accuracy is : 1.00000
batch 47 training loss is : 0.17376
batch 47 training accuracy is : 0.93750
batch 48 training loss is : 0.23898
batch 48 training accuracy is : 0.93750
batch 49 training loss is : 0.17737
batch 49 training accuracy is : 0.87500
batch 50 tra

batch 6 training loss is : 0.01494
batch 6 training accuracy is : 1.00000
batch 7 training loss is : 0.00144
batch 7 training accuracy is : 1.00000
batch 8 training loss is : 0.11470
batch 8 training accuracy is : 0.93750
batch 9 training loss is : 0.00104
batch 9 training accuracy is : 1.00000
batch 10 training loss is : 0.00620
batch 10 training accuracy is : 1.00000
batch 11 training loss is : 0.00290
batch 11 training accuracy is : 1.00000
batch 12 training loss is : 0.03186
batch 12 training accuracy is : 1.00000
batch 13 training loss is : 0.25002
batch 13 training accuracy is : 0.93750
batch 14 training loss is : 0.00171
batch 14 training accuracy is : 1.00000
batch 15 training loss is : 0.02296
batch 15 training accuracy is : 1.00000
batch 16 training loss is : 0.02501
batch 16 training accuracy is : 1.00000
batch 17 training loss is : 0.00018
batch 17 training accuracy is : 1.00000
batch 18 training loss is : 0.00000
batch 18 training accuracy is : 1.00000
batch 19 training lo

batch 0 dev loss is : 0.74010
batch 0 dev accuracy is : 0.81250
batch 1 dev loss is : 0.32158
batch 1 dev accuracy is : 0.87500
batch 2 dev loss is : 0.68278
batch 2 dev accuracy is : 0.87500
batch 3 dev loss is : 0.56275
batch 3 dev accuracy is : 0.87500
batch 4 dev loss is : 0.58189
batch 4 dev accuracy is : 0.75000
batch 5 dev loss is : 0.12442
batch 5 dev accuracy is : 0.93750
batch 6 dev loss is : 0.19589
batch 6 dev accuracy is : 0.93750
batch 7 dev loss is : 2.13496
batch 7 dev accuracy is : 0.81250
batch 8 dev loss is : 2.22415
batch 8 dev accuracy is : 0.62500
batch 9 dev loss is : 0.29271
batch 9 dev accuracy is : 0.87500
batch 10 dev loss is : 2.38414
batch 10 dev accuracy is : 0.68750
batch 11 dev loss is : 1.76509
batch 11 dev accuracy is : 0.56250
batch 12 dev loss is : 1.23471
batch 12 dev accuracy is : 0.81250
batch 13 dev loss is : 2.09212
batch 13 dev accuracy is : 0.68750
batch 14 dev loss is : 0.84722
batch 14 dev accuracy is : 0.81250
batch 15 dev loss is : 0.50770

batch 83 training loss is : 0.11234
batch 83 training accuracy is : 0.93750
batch 84 training loss is : 0.02308
batch 84 training accuracy is : 1.00000
batch 85 training loss is : 0.00459
batch 85 training accuracy is : 1.00000
batch 86 training loss is : 0.04727
batch 86 training accuracy is : 1.00000
batch 87 training loss is : 0.00010
batch 87 training accuracy is : 1.00000
batch 88 training loss is : 0.01755
batch 88 training accuracy is : 1.00000
batch 89 training loss is : 0.00971
batch 89 training accuracy is : 1.00000
batch 90 training loss is : 0.47392
batch 90 training accuracy is : 0.81250
batch 91 training loss is : 0.22368
batch 91 training accuracy is : 0.81250
batch 92 training loss is : 0.00427
batch 92 training accuracy is : 1.00000
batch 93 training loss is : 0.20184
batch 93 training accuracy is : 0.93750
batch 94 training loss is : 0.33816
batch 94 training accuracy is : 0.87500
batch 95 training loss is : 0.02437
batch 95 training accuracy is : 1.00000
batch 96 tra

batch 52 training loss is : 0.06169
batch 52 training accuracy is : 0.93750
batch 53 training loss is : 0.00005
batch 53 training accuracy is : 1.00000
batch 54 training loss is : 0.04549
batch 54 training accuracy is : 1.00000
batch 55 training loss is : 0.00001
batch 55 training accuracy is : 1.00000
batch 56 training loss is : 0.14048
batch 56 training accuracy is : 0.93750
batch 57 training loss is : 0.23958
batch 57 training accuracy is : 0.93750
batch 58 training loss is : 0.35590
batch 58 training accuracy is : 0.87500
batch 59 training loss is : 0.16312
batch 59 training accuracy is : 0.93750
batch 60 training loss is : 0.00369
batch 60 training accuracy is : 1.00000
batch 61 training loss is : 0.04067
batch 61 training accuracy is : 1.00000
batch 62 training loss is : 0.09872
batch 62 training accuracy is : 0.93750
batch 63 training loss is : 0.00672
batch 63 training accuracy is : 1.00000
batch 64 training loss is : 0.12255
batch 64 training accuracy is : 0.93750
batch 65 tra

batch 21 training loss is : 0.14375
batch 21 training accuracy is : 0.93750
batch 22 training loss is : 0.00464
batch 22 training accuracy is : 1.00000
batch 23 training loss is : 0.37401
batch 23 training accuracy is : 0.87500
batch 24 training loss is : 0.00000
batch 24 training accuracy is : 1.00000
batch 25 training loss is : 0.02459
batch 25 training accuracy is : 1.00000
batch 26 training loss is : 0.01008
batch 26 training accuracy is : 1.00000
batch 27 training loss is : 0.12607
batch 27 training accuracy is : 0.93750
batch 28 training loss is : 0.09397
batch 28 training accuracy is : 0.93750
batch 29 training loss is : 0.03936
batch 29 training accuracy is : 1.00000
batch 30 training loss is : 0.00621
batch 30 training accuracy is : 1.00000
batch 31 training loss is : 0.18136
batch 31 training accuracy is : 0.93750
batch 32 training loss is : 0.11092
batch 32 training accuracy is : 0.93750
batch 33 training loss is : 0.00589
batch 33 training accuracy is : 1.00000
batch 34 tra

batch 18 dev loss is : 2.56304
batch 18 dev accuracy is : 0.68750
batch 19 dev loss is : 2.36503
batch 19 dev accuracy is : 0.81250
batch 20 dev loss is : 1.69787
batch 20 dev accuracy is : 0.75000
batch 21 dev loss is : 1.78232
batch 21 dev accuracy is : 0.75000
batch 22 dev loss is : 1.33634
batch 22 dev accuracy is : 0.81250
batch 23 dev loss is : 0.54479
batch 23 dev accuracy is : 0.81250
batch 24 dev loss is : 0.86567
batch 24 dev accuracy is : 0.87500
batch 25 dev loss is : 0.98301
batch 25 dev accuracy is : 0.75000
batch 26 dev loss is : 1.46020
batch 26 dev accuracy is : 0.68750
batch 27 dev loss is : 1.08546
batch 27 dev accuracy is : 0.81250
Average validation loss is 1.27449 at the end of epoch 131
Average validation accuracy is 0.74242 at the end of epoch 131
At 132-th epoch.
batch 0 training loss is : 0.02806
batch 0 training accuracy is : 1.00000
batch 1 training loss is : 0.02746
batch 1 training accuracy is : 1.00000
batch 2 training loss is : 0.14127
batch 2 training a

batch 99 training loss is : 0.00071
batch 99 training accuracy is : 1.00000
batch 100 training loss is : 0.00229
batch 100 training accuracy is : 1.00000
batch 101 training loss is : 0.01645
batch 101 training accuracy is : 1.00000
batch 102 training loss is : 0.02315
batch 102 training accuracy is : 1.00000
batch 103 training loss is : 0.05534
batch 103 training accuracy is : 0.93750
batch 104 training loss is : 0.07809
batch 104 training accuracy is : 0.93750
batch 105 training loss is : 0.00039
batch 105 training accuracy is : 1.00000
batch 106 training loss is : 0.28677
batch 106 training accuracy is : 0.87500
batch 107 training loss is : 0.20039
batch 107 training accuracy is : 0.87500
batch 108 training loss is : 0.01756
batch 108 training accuracy is : 1.00000
batch 109 training loss is : 0.26578
batch 109 training accuracy is : 0.93750
batch 110 training loss is : 0.07230
batch 110 training accuracy is : 0.93750
batch 111 training loss is : 0.22060
batch 111 training accuracy i

batch 69 training loss is : 0.01894
batch 69 training accuracy is : 1.00000
batch 70 training loss is : 0.00166
batch 70 training accuracy is : 1.00000
batch 71 training loss is : 0.02318
batch 71 training accuracy is : 1.00000
batch 72 training loss is : 0.05337
batch 72 training accuracy is : 0.93750
batch 73 training loss is : 0.07255
batch 73 training accuracy is : 0.93750
batch 74 training loss is : 0.00059
batch 74 training accuracy is : 1.00000
batch 75 training loss is : 0.00989
batch 75 training accuracy is : 1.00000
batch 76 training loss is : 0.00000
batch 76 training accuracy is : 1.00000
batch 77 training loss is : 0.04695
batch 77 training accuracy is : 1.00000
batch 78 training loss is : 0.00000
batch 78 training accuracy is : 1.00000
batch 79 training loss is : 0.30782
batch 79 training accuracy is : 0.87500
batch 80 training loss is : 0.10177
batch 80 training accuracy is : 0.93750
batch 81 training loss is : 0.01214
batch 81 training accuracy is : 1.00000
batch 82 tra

batch 38 training loss is : 0.05757
batch 38 training accuracy is : 1.00000
batch 39 training loss is : 0.03734
batch 39 training accuracy is : 1.00000
batch 40 training loss is : 0.00337
batch 40 training accuracy is : 1.00000
batch 41 training loss is : 0.17399
batch 41 training accuracy is : 0.93750
batch 42 training loss is : 0.01275
batch 42 training accuracy is : 1.00000
batch 43 training loss is : 0.05072
batch 43 training accuracy is : 0.93750
batch 44 training loss is : 0.06640
batch 44 training accuracy is : 1.00000
batch 45 training loss is : 0.16149
batch 45 training accuracy is : 0.93750
batch 46 training loss is : 0.38492
batch 46 training accuracy is : 0.87500
batch 47 training loss is : 0.22581
batch 47 training accuracy is : 0.93750
batch 48 training loss is : 0.06914
batch 48 training accuracy is : 0.93750
batch 49 training loss is : 0.02227
batch 49 training accuracy is : 1.00000
batch 50 training loss is : 0.00199
batch 50 training accuracy is : 1.00000
batch 51 tra

batch 6 training loss is : 0.01023
batch 6 training accuracy is : 1.00000
batch 7 training loss is : 0.00513
batch 7 training accuracy is : 1.00000
batch 8 training loss is : 0.00040
batch 8 training accuracy is : 1.00000
batch 9 training loss is : 0.06526
batch 9 training accuracy is : 0.93750
batch 10 training loss is : 0.10009
batch 10 training accuracy is : 0.93750
batch 11 training loss is : 0.00094
batch 11 training accuracy is : 1.00000
batch 12 training loss is : 0.06881
batch 12 training accuracy is : 0.93750
batch 13 training loss is : 0.07263
batch 13 training accuracy is : 1.00000
batch 14 training loss is : 0.03850
batch 14 training accuracy is : 1.00000
batch 15 training loss is : 0.00082
batch 15 training accuracy is : 1.00000
batch 16 training loss is : 0.12627
batch 16 training accuracy is : 0.93750
batch 17 training loss is : 0.05999
batch 17 training accuracy is : 1.00000
batch 18 training loss is : 0.07249
batch 18 training accuracy is : 0.93750
batch 19 training lo

batch 0 dev loss is : 1.11455
batch 0 dev accuracy is : 0.81250
batch 1 dev loss is : 0.43838
batch 1 dev accuracy is : 0.87500
batch 2 dev loss is : 0.49724
batch 2 dev accuracy is : 0.87500
batch 3 dev loss is : 0.84966
batch 3 dev accuracy is : 0.87500
batch 4 dev loss is : 0.56914
batch 4 dev accuracy is : 0.81250
batch 5 dev loss is : 0.27909
batch 5 dev accuracy is : 0.87500
batch 6 dev loss is : 0.94893
batch 6 dev accuracy is : 0.75000
batch 7 dev loss is : 1.76502
batch 7 dev accuracy is : 0.81250
batch 8 dev loss is : 2.21192
batch 8 dev accuracy is : 0.62500
batch 9 dev loss is : 0.63188
batch 9 dev accuracy is : 0.81250
batch 10 dev loss is : 1.74254
batch 10 dev accuracy is : 0.56250
batch 11 dev loss is : 2.22138
batch 11 dev accuracy is : 0.62500
batch 12 dev loss is : 1.34715
batch 12 dev accuracy is : 0.81250
batch 13 dev loss is : 1.74815
batch 13 dev accuracy is : 0.62500
batch 14 dev loss is : 0.85583
batch 14 dev accuracy is : 0.81250
batch 15 dev loss is : 0.74126

batch 85 training loss is : 0.25979
batch 85 training accuracy is : 0.93750
batch 86 training loss is : 0.00656
batch 86 training accuracy is : 1.00000
batch 87 training loss is : 0.00140
batch 87 training accuracy is : 1.00000
batch 88 training loss is : 0.05534
batch 88 training accuracy is : 0.93750
batch 89 training loss is : 0.10220
batch 89 training accuracy is : 0.87500
batch 90 training loss is : 0.19710
batch 90 training accuracy is : 0.93750
batch 91 training loss is : 0.00152
batch 91 training accuracy is : 1.00000
batch 92 training loss is : 0.00122
batch 92 training accuracy is : 1.00000
batch 93 training loss is : 0.00513
batch 93 training accuracy is : 1.00000
batch 94 training loss is : 0.08110
batch 94 training accuracy is : 1.00000
batch 95 training loss is : 0.07680
batch 95 training accuracy is : 0.93750
batch 96 training loss is : 0.02476
batch 96 training accuracy is : 1.00000
batch 97 training loss is : 0.01972
batch 97 training accuracy is : 1.00000
batch 98 tra

batch 55 training loss is : 0.17202
batch 55 training accuracy is : 0.93750
batch 56 training loss is : 0.02947
batch 56 training accuracy is : 1.00000
batch 57 training loss is : 0.02594
batch 57 training accuracy is : 1.00000
batch 58 training loss is : 0.01945
batch 58 training accuracy is : 1.00000
batch 59 training loss is : 0.40574
batch 59 training accuracy is : 0.75000
batch 60 training loss is : 0.01860
batch 60 training accuracy is : 1.00000
batch 61 training loss is : 0.58102
batch 61 training accuracy is : 0.75000
batch 62 training loss is : 0.02010
batch 62 training accuracy is : 1.00000
batch 63 training loss is : 0.00638
batch 63 training accuracy is : 1.00000
batch 64 training loss is : 0.01000
batch 64 training accuracy is : 1.00000
batch 65 training loss is : 0.11033
batch 65 training accuracy is : 0.93750
batch 66 training loss is : 0.00025
batch 66 training accuracy is : 1.00000
batch 67 training loss is : 0.09318
batch 67 training accuracy is : 0.93750
batch 68 tra

batch 25 training loss is : 0.01710
batch 25 training accuracy is : 1.00000
batch 26 training loss is : 0.06776
batch 26 training accuracy is : 0.93750
batch 27 training loss is : 0.27937
batch 27 training accuracy is : 0.87500
batch 28 training loss is : 0.17053
batch 28 training accuracy is : 0.87500
batch 29 training loss is : 0.03784
batch 29 training accuracy is : 1.00000
batch 30 training loss is : 0.01221
batch 30 training accuracy is : 1.00000
batch 31 training loss is : 0.11692
batch 31 training accuracy is : 0.93750
batch 32 training loss is : 0.19881
batch 32 training accuracy is : 0.93750
batch 33 training loss is : 0.05956
batch 33 training accuracy is : 0.93750
batch 34 training loss is : 0.01133
batch 34 training accuracy is : 1.00000
batch 35 training loss is : 0.09874
batch 35 training accuracy is : 0.93750
batch 36 training loss is : 0.08966
batch 36 training accuracy is : 0.93750
batch 37 training loss is : 0.00872
batch 37 training accuracy is : 1.00000
batch 38 tra

batch 25 dev loss is : 0.61961
batch 25 dev accuracy is : 0.87500
batch 26 dev loss is : 1.90434
batch 26 dev accuracy is : 0.68750
batch 27 dev loss is : 1.16149
batch 27 dev accuracy is : 0.81250
Average validation loss is 1.15589 at the end of epoch 138
Average validation accuracy is 0.76623 at the end of epoch 138
At 139-th epoch.
batch 0 training loss is : 0.03743
batch 0 training accuracy is : 1.00000
batch 1 training loss is : 0.18843
batch 1 training accuracy is : 0.87500
batch 2 training loss is : 0.00136
batch 2 training accuracy is : 1.00000
batch 3 training loss is : 0.19271
batch 3 training accuracy is : 0.93750
batch 4 training loss is : 0.01183
batch 4 training accuracy is : 1.00000
batch 5 training loss is : 0.00052
batch 5 training accuracy is : 1.00000
batch 6 training loss is : 0.00597
batch 6 training accuracy is : 1.00000
batch 7 training loss is : 0.01746
batch 7 training accuracy is : 1.00000
batch 8 training loss is : 0.00594
batch 8 training accuracy is : 1.000

batch 106 training loss is : 0.00532
batch 106 training accuracy is : 1.00000
batch 107 training loss is : 0.05853
batch 107 training accuracy is : 1.00000
batch 108 training loss is : 0.00112
batch 108 training accuracy is : 1.00000
batch 109 training loss is : 0.25114
batch 109 training accuracy is : 0.93750
batch 110 training loss is : 0.10942
batch 110 training accuracy is : 0.87500
batch 111 training loss is : 0.02721
batch 111 training accuracy is : 1.00000
batch 112 training loss is : 0.01428
batch 112 training accuracy is : 1.00000
Average training loss is 0.07512 at the end of epoch 139
Average training accuracy is 0.96321 at the end of epoch 139
batch 0 dev loss is : 0.92567
batch 0 dev accuracy is : 0.81250
batch 1 dev loss is : 0.22542
batch 1 dev accuracy is : 0.93750
batch 2 dev loss is : 0.48554
batch 2 dev accuracy is : 0.93750
batch 3 dev loss is : 0.86780
batch 3 dev accuracy is : 0.81250
batch 4 dev loss is : 0.91926
batch 4 dev accuracy is : 0.87500
batch 5 dev loss

batch 76 training loss is : 0.31758
batch 76 training accuracy is : 0.87500
batch 77 training loss is : 0.39675
batch 77 training accuracy is : 0.93750
batch 78 training loss is : 0.01929
batch 78 training accuracy is : 1.00000
batch 79 training loss is : 0.06788
batch 79 training accuracy is : 0.93750
batch 80 training loss is : 0.06468
batch 80 training accuracy is : 0.93750
batch 81 training loss is : 0.32060
batch 81 training accuracy is : 0.81250
batch 82 training loss is : 0.04717
batch 82 training accuracy is : 1.00000
batch 83 training loss is : 0.21522
batch 83 training accuracy is : 0.87500
batch 84 training loss is : 0.00517
batch 84 training accuracy is : 1.00000
batch 85 training loss is : 0.00701
batch 85 training accuracy is : 1.00000
batch 86 training loss is : 0.02479
batch 86 training accuracy is : 1.00000
batch 87 training loss is : 0.03895
batch 87 training accuracy is : 1.00000
batch 88 training loss is : 0.01407
batch 88 training accuracy is : 1.00000
batch 89 tra

batch 45 training loss is : 0.07321
batch 45 training accuracy is : 0.93750
batch 46 training loss is : 0.01030
batch 46 training accuracy is : 1.00000
batch 47 training loss is : 0.14289
batch 47 training accuracy is : 0.93750
batch 48 training loss is : 0.01838
batch 48 training accuracy is : 1.00000
batch 49 training loss is : 0.00144
batch 49 training accuracy is : 1.00000
batch 50 training loss is : 0.19976
batch 50 training accuracy is : 0.93750
batch 51 training loss is : 0.02849
batch 51 training accuracy is : 1.00000
batch 52 training loss is : 0.00098
batch 52 training accuracy is : 1.00000
batch 53 training loss is : 0.01256
batch 53 training accuracy is : 1.00000
batch 54 training loss is : 0.00145
batch 54 training accuracy is : 1.00000
batch 55 training loss is : 0.00026
batch 55 training accuracy is : 1.00000
batch 56 training loss is : 0.15377
batch 56 training accuracy is : 0.93750
batch 57 training loss is : 0.01014
batch 57 training accuracy is : 1.00000
batch 58 tra

batch 15 training loss is : 0.04925
batch 15 training accuracy is : 1.00000
batch 16 training loss is : 0.05564
batch 16 training accuracy is : 0.93750
batch 17 training loss is : 0.01780
batch 17 training accuracy is : 1.00000
batch 18 training loss is : 0.00231
batch 18 training accuracy is : 1.00000
batch 19 training loss is : 0.18071
batch 19 training accuracy is : 0.93750
batch 20 training loss is : 0.00445
batch 20 training accuracy is : 1.00000
batch 21 training loss is : 0.02111
batch 21 training accuracy is : 1.00000
batch 22 training loss is : 0.00328
batch 22 training accuracy is : 1.00000
batch 23 training loss is : 0.10626
batch 23 training accuracy is : 0.93750
batch 24 training loss is : 0.00631
batch 24 training accuracy is : 1.00000
batch 25 training loss is : 0.05186
batch 25 training accuracy is : 1.00000
batch 26 training loss is : 0.02473
batch 26 training accuracy is : 1.00000
batch 27 training loss is : 0.00309
batch 27 training accuracy is : 1.00000
batch 28 tra

batch 12 dev loss is : 1.48356
batch 12 dev accuracy is : 0.75000
batch 13 dev loss is : 1.99233
batch 13 dev accuracy is : 0.75000
batch 14 dev loss is : 0.94249
batch 14 dev accuracy is : 0.81250
batch 15 dev loss is : 0.46332
batch 15 dev accuracy is : 0.87500
batch 16 dev loss is : 1.10270
batch 16 dev accuracy is : 0.81250
batch 17 dev loss is : 2.12280
batch 17 dev accuracy is : 0.62500
batch 18 dev loss is : 1.67723
batch 18 dev accuracy is : 0.62500
batch 19 dev loss is : 2.46246
batch 19 dev accuracy is : 0.81250
batch 20 dev loss is : 1.34308
batch 20 dev accuracy is : 0.87500
batch 21 dev loss is : 2.38087
batch 21 dev accuracy is : 0.81250
batch 22 dev loss is : 1.08285
batch 22 dev accuracy is : 0.75000
batch 23 dev loss is : 0.34126
batch 23 dev accuracy is : 0.93750
batch 24 dev loss is : 0.36351
batch 24 dev accuracy is : 0.87500
batch 25 dev loss is : 1.05852
batch 25 dev accuracy is : 0.68750
batch 26 dev loss is : 2.15464
batch 26 dev accuracy is : 0.68750
batch 27 d

batch 98 training loss is : 0.00631
batch 98 training accuracy is : 1.00000
batch 99 training loss is : 0.02256
batch 99 training accuracy is : 1.00000
batch 100 training loss is : 0.01094
batch 100 training accuracy is : 1.00000
batch 101 training loss is : 0.04868
batch 101 training accuracy is : 0.93750
batch 102 training loss is : 0.11035
batch 102 training accuracy is : 0.87500
batch 103 training loss is : 0.00219
batch 103 training accuracy is : 1.00000
batch 104 training loss is : 0.00001
batch 104 training accuracy is : 1.00000
batch 105 training loss is : 0.33452
batch 105 training accuracy is : 0.87500
batch 106 training loss is : 0.00239
batch 106 training accuracy is : 1.00000
batch 107 training loss is : 0.07302
batch 107 training accuracy is : 0.93750
batch 108 training loss is : 0.09287
batch 108 training accuracy is : 0.93750
batch 109 training loss is : 0.03558
batch 109 training accuracy is : 1.00000
batch 110 training loss is : 0.01740
batch 110 training accuracy is 

batch 66 training loss is : 0.06449
batch 66 training accuracy is : 0.93750
batch 67 training loss is : 0.05791
batch 67 training accuracy is : 0.93750
batch 68 training loss is : 0.00503
batch 68 training accuracy is : 1.00000
batch 69 training loss is : 0.00870
batch 69 training accuracy is : 1.00000
batch 70 training loss is : 0.01194
batch 70 training accuracy is : 1.00000
batch 71 training loss is : 0.02461
batch 71 training accuracy is : 1.00000
batch 72 training loss is : 0.01040
batch 72 training accuracy is : 1.00000
batch 73 training loss is : 0.08239
batch 73 training accuracy is : 0.93750
batch 74 training loss is : 0.04848
batch 74 training accuracy is : 1.00000
batch 75 training loss is : 0.01116
batch 75 training accuracy is : 1.00000
batch 76 training loss is : 0.04210
batch 76 training accuracy is : 1.00000
batch 77 training loss is : 0.01840
batch 77 training accuracy is : 1.00000
batch 78 training loss is : 0.03083
batch 78 training accuracy is : 1.00000
batch 79 tra

batch 36 training loss is : 0.00372
batch 36 training accuracy is : 1.00000
batch 37 training loss is : 0.32859
batch 37 training accuracy is : 0.87500
batch 38 training loss is : 0.46566
batch 38 training accuracy is : 0.81250
batch 39 training loss is : 0.00120
batch 39 training accuracy is : 1.00000
batch 40 training loss is : 0.07174
batch 40 training accuracy is : 0.93750
batch 41 training loss is : 0.42909
batch 41 training accuracy is : 0.81250
batch 42 training loss is : 0.00409
batch 42 training accuracy is : 1.00000
batch 43 training loss is : 0.04191
batch 43 training accuracy is : 1.00000
batch 44 training loss is : 0.09696
batch 44 training accuracy is : 0.93750
batch 45 training loss is : 0.21059
batch 45 training accuracy is : 0.93750
batch 46 training loss is : 0.00002
batch 46 training accuracy is : 1.00000
batch 47 training loss is : 0.04401
batch 47 training accuracy is : 1.00000
batch 48 training loss is : 0.04443
batch 48 training accuracy is : 1.00000
batch 49 tra

batch 6 training loss is : 0.08893
batch 6 training accuracy is : 0.93750
batch 7 training loss is : 0.02118
batch 7 training accuracy is : 1.00000
batch 8 training loss is : 0.30102
batch 8 training accuracy is : 0.87500
batch 9 training loss is : 0.01315
batch 9 training accuracy is : 1.00000
batch 10 training loss is : 0.04165
batch 10 training accuracy is : 1.00000
batch 11 training loss is : 0.03412
batch 11 training accuracy is : 1.00000
batch 12 training loss is : 0.00588
batch 12 training accuracy is : 1.00000
batch 13 training loss is : 0.01144
batch 13 training accuracy is : 1.00000
batch 14 training loss is : 0.06683
batch 14 training accuracy is : 0.93750
batch 15 training loss is : 0.00142
batch 15 training accuracy is : 1.00000
batch 16 training loss is : 0.00158
batch 16 training accuracy is : 1.00000
batch 17 training loss is : 0.00371
batch 17 training accuracy is : 1.00000
batch 18 training loss is : 0.01363
batch 18 training accuracy is : 1.00000
batch 19 training lo

batch 0 dev loss is : 0.89787
batch 0 dev accuracy is : 0.81250
batch 1 dev loss is : 0.91409
batch 1 dev accuracy is : 0.87500
batch 2 dev loss is : 1.24898
batch 2 dev accuracy is : 0.81250
batch 3 dev loss is : 1.49249
batch 3 dev accuracy is : 0.81250
batch 4 dev loss is : 1.13771
batch 4 dev accuracy is : 0.62500
batch 5 dev loss is : 0.77643
batch 5 dev accuracy is : 0.87500
batch 6 dev loss is : 1.47596
batch 6 dev accuracy is : 0.68750
batch 7 dev loss is : 1.88843
batch 7 dev accuracy is : 0.75000
batch 8 dev loss is : 1.83774
batch 8 dev accuracy is : 0.68750
batch 9 dev loss is : 1.20858
batch 9 dev accuracy is : 0.68750
batch 10 dev loss is : 2.51262
batch 10 dev accuracy is : 0.56250
batch 11 dev loss is : 1.46223
batch 11 dev accuracy is : 0.75000
batch 12 dev loss is : 1.52872
batch 12 dev accuracy is : 0.68750
batch 13 dev loss is : 2.18805
batch 13 dev accuracy is : 0.56250
batch 14 dev loss is : 0.60258
batch 14 dev accuracy is : 0.93750
batch 15 dev loss is : 0.80022

batch 85 training loss is : 0.01490
batch 85 training accuracy is : 1.00000
batch 86 training loss is : 0.03578
batch 86 training accuracy is : 1.00000
batch 87 training loss is : 0.20193
batch 87 training accuracy is : 0.87500
batch 88 training loss is : 0.04193
batch 88 training accuracy is : 1.00000
batch 89 training loss is : 0.00475
batch 89 training accuracy is : 1.00000
batch 90 training loss is : 0.00146
batch 90 training accuracy is : 1.00000
batch 91 training loss is : 0.25207
batch 91 training accuracy is : 0.93750
batch 92 training loss is : 0.07536
batch 92 training accuracy is : 1.00000
batch 93 training loss is : 0.00338
batch 93 training accuracy is : 1.00000
batch 94 training loss is : 0.01445
batch 94 training accuracy is : 1.00000
batch 95 training loss is : 0.00136
batch 95 training accuracy is : 1.00000
batch 96 training loss is : 0.05304
batch 96 training accuracy is : 0.93750
batch 97 training loss is : 0.02248
batch 97 training accuracy is : 1.00000
batch 98 tra

batch 56 training loss is : 0.04749
batch 56 training accuracy is : 0.93750
batch 57 training loss is : 0.00374
batch 57 training accuracy is : 1.00000
batch 58 training loss is : 0.06908
batch 58 training accuracy is : 0.93750
batch 59 training loss is : 0.01268
batch 59 training accuracy is : 1.00000
batch 60 training loss is : 0.06010
batch 60 training accuracy is : 1.00000
batch 61 training loss is : 0.16741
batch 61 training accuracy is : 0.93750
batch 62 training loss is : 0.03283
batch 62 training accuracy is : 1.00000
batch 63 training loss is : 0.00809
batch 63 training accuracy is : 1.00000
batch 64 training loss is : 0.05490
batch 64 training accuracy is : 1.00000
batch 65 training loss is : 0.09072
batch 65 training accuracy is : 0.93750
batch 66 training loss is : 0.21471
batch 66 training accuracy is : 0.93750
batch 67 training loss is : 0.01544
batch 67 training accuracy is : 1.00000
batch 68 training loss is : 0.01938
batch 68 training accuracy is : 1.00000
batch 69 tra

batch 27 training loss is : 0.04302
batch 27 training accuracy is : 1.00000
batch 28 training loss is : 0.08263
batch 28 training accuracy is : 1.00000
batch 29 training loss is : 0.11082
batch 29 training accuracy is : 0.93750
batch 30 training loss is : 0.04530
batch 30 training accuracy is : 1.00000
batch 31 training loss is : 0.09564
batch 31 training accuracy is : 1.00000
batch 32 training loss is : 0.02242
batch 32 training accuracy is : 1.00000
batch 33 training loss is : 0.04197
batch 33 training accuracy is : 1.00000
batch 34 training loss is : 0.00000
batch 34 training accuracy is : 1.00000
batch 35 training loss is : 0.05696
batch 35 training accuracy is : 1.00000
batch 36 training loss is : 0.01990
batch 36 training accuracy is : 1.00000
batch 37 training loss is : 0.15814
batch 37 training accuracy is : 0.93750
batch 38 training loss is : 0.04951
batch 38 training accuracy is : 1.00000
batch 39 training loss is : 0.07617
batch 39 training accuracy is : 1.00000
batch 40 tra

Average validation loss is 1.42578 at the end of epoch 149
Average validation accuracy is 0.72511 at the end of epoch 149
At 150-th epoch.
batch 0 training loss is : 0.11188
batch 0 training accuracy is : 0.93750
batch 1 training loss is : 0.40040
batch 1 training accuracy is : 0.93750
batch 2 training loss is : 0.01060
batch 2 training accuracy is : 1.00000
batch 3 training loss is : 0.02392
batch 3 training accuracy is : 1.00000
batch 4 training loss is : 0.01453
batch 4 training accuracy is : 1.00000
batch 5 training loss is : 0.02280
batch 5 training accuracy is : 1.00000
batch 6 training loss is : 0.04663
batch 6 training accuracy is : 1.00000
batch 7 training loss is : 0.07532
batch 7 training accuracy is : 0.93750
batch 8 training loss is : 0.24353
batch 8 training accuracy is : 0.87500
batch 9 training loss is : 0.00028
batch 9 training accuracy is : 1.00000
batch 10 training loss is : 0.01321
batch 10 training accuracy is : 1.00000
batch 11 training loss is : 0.15269
batch 11 

batch 109 training loss is : 0.00096
batch 109 training accuracy is : 1.00000
batch 110 training loss is : 0.15665
batch 110 training accuracy is : 0.93750
batch 111 training loss is : 0.00000
batch 111 training accuracy is : 1.00000
batch 112 training loss is : 0.05919
batch 112 training accuracy is : 1.00000
Average training loss is 0.07933 at the end of epoch 150
Average training accuracy is 0.96156 at the end of epoch 150
batch 0 dev loss is : 0.74133
batch 0 dev accuracy is : 0.81250
batch 1 dev loss is : 0.75349
batch 1 dev accuracy is : 0.87500
batch 2 dev loss is : 0.87112
batch 2 dev accuracy is : 0.87500
batch 3 dev loss is : 0.90310
batch 3 dev accuracy is : 0.81250
batch 4 dev loss is : 0.75840
batch 4 dev accuracy is : 0.81250
batch 5 dev loss is : 0.49026
batch 5 dev accuracy is : 0.87500
batch 6 dev loss is : 0.43066
batch 6 dev accuracy is : 0.81250
batch 7 dev loss is : 2.06074
batch 7 dev accuracy is : 0.81250
batch 8 dev loss is : 1.94640
batch 8 dev accuracy is : 0.

batch 79 training loss is : 0.00093
batch 79 training accuracy is : 1.00000
batch 80 training loss is : 0.20066
batch 80 training accuracy is : 0.87500
batch 81 training loss is : 0.02544
batch 81 training accuracy is : 1.00000
batch 82 training loss is : 0.00719
batch 82 training accuracy is : 1.00000
batch 83 training loss is : 0.05274
batch 83 training accuracy is : 0.93750
batch 84 training loss is : 0.00160
batch 84 training accuracy is : 1.00000
batch 85 training loss is : 0.04693
batch 85 training accuracy is : 0.93750
batch 86 training loss is : 0.33308
batch 86 training accuracy is : 0.93750
batch 87 training loss is : 0.20750
batch 87 training accuracy is : 0.87500
batch 88 training loss is : 0.04952
batch 88 training accuracy is : 0.93750
batch 89 training loss is : 0.15816
batch 89 training accuracy is : 0.87500
batch 90 training loss is : 0.18636
batch 90 training accuracy is : 0.93750
batch 91 training loss is : 0.04244
batch 91 training accuracy is : 1.00000
batch 92 tra

batch 48 training loss is : 0.01177
batch 48 training accuracy is : 1.00000
batch 49 training loss is : 0.00023
batch 49 training accuracy is : 1.00000
batch 50 training loss is : 0.00509
batch 50 training accuracy is : 1.00000
batch 51 training loss is : 0.00022
batch 51 training accuracy is : 1.00000
batch 52 training loss is : 0.06115
batch 52 training accuracy is : 0.93750
batch 53 training loss is : 0.00125
batch 53 training accuracy is : 1.00000
batch 54 training loss is : 0.02728
batch 54 training accuracy is : 1.00000
batch 55 training loss is : 0.01861
batch 55 training accuracy is : 1.00000
batch 56 training loss is : 0.01939
batch 56 training accuracy is : 1.00000
batch 57 training loss is : 0.00940
batch 57 training accuracy is : 1.00000
batch 58 training loss is : 0.36573
batch 58 training accuracy is : 0.87500
batch 59 training loss is : 0.21834
batch 59 training accuracy is : 0.93750
batch 60 training loss is : 0.03443
batch 60 training accuracy is : 1.00000
batch 61 tra

batch 18 training loss is : 0.02545
batch 18 training accuracy is : 1.00000
batch 19 training loss is : 0.03463
batch 19 training accuracy is : 1.00000
batch 20 training loss is : 0.06109
batch 20 training accuracy is : 1.00000
batch 21 training loss is : 0.06137
batch 21 training accuracy is : 0.93750
batch 22 training loss is : 0.00001
batch 22 training accuracy is : 1.00000
batch 23 training loss is : 0.08784
batch 23 training accuracy is : 0.93750
batch 24 training loss is : 0.13045
batch 24 training accuracy is : 0.93750
batch 25 training loss is : 0.00020
batch 25 training accuracy is : 1.00000
batch 26 training loss is : 0.00587
batch 26 training accuracy is : 1.00000
batch 27 training loss is : 0.00806
batch 27 training accuracy is : 1.00000
batch 28 training loss is : 0.13184
batch 28 training accuracy is : 0.93750
batch 29 training loss is : 0.13209
batch 29 training accuracy is : 0.93750
batch 30 training loss is : 0.05161
batch 30 training accuracy is : 0.93750
batch 31 tra

batch 15 dev loss is : 0.58853
batch 15 dev accuracy is : 0.87500
batch 16 dev loss is : 1.05459
batch 16 dev accuracy is : 0.81250
batch 17 dev loss is : 2.12730
batch 17 dev accuracy is : 0.56250
batch 18 dev loss is : 1.80710
batch 18 dev accuracy is : 0.62500
batch 19 dev loss is : 2.55276
batch 19 dev accuracy is : 0.81250
batch 20 dev loss is : 1.49841
batch 20 dev accuracy is : 0.87500
batch 21 dev loss is : 2.26953
batch 21 dev accuracy is : 0.81250
batch 22 dev loss is : 1.45745
batch 22 dev accuracy is : 0.68750
batch 23 dev loss is : 0.27709
batch 23 dev accuracy is : 0.93750
batch 24 dev loss is : 0.49476
batch 24 dev accuracy is : 0.87500
batch 25 dev loss is : 0.84207
batch 25 dev accuracy is : 0.75000
batch 26 dev loss is : 2.61720
batch 26 dev accuracy is : 0.68750
batch 27 dev loss is : 1.54787
batch 27 dev accuracy is : 0.68750
Average validation loss is 1.19081 at the end of epoch 153
Average validation accuracy is 0.76407 at the end of epoch 153
At 154-th epoch.
bat

batch 99 training accuracy is : 1.00000
batch 100 training loss is : 0.10613
batch 100 training accuracy is : 0.93750
batch 101 training loss is : 0.10730
batch 101 training accuracy is : 0.93750
batch 102 training loss is : 0.00816
batch 102 training accuracy is : 1.00000
batch 103 training loss is : 0.00280
batch 103 training accuracy is : 1.00000
batch 104 training loss is : 0.26767
batch 104 training accuracy is : 0.93750
batch 105 training loss is : 0.05096
batch 105 training accuracy is : 0.93750
batch 106 training loss is : 0.04234
batch 106 training accuracy is : 1.00000
batch 107 training loss is : 0.00853
batch 107 training accuracy is : 1.00000
batch 108 training loss is : 0.05832
batch 108 training accuracy is : 1.00000
batch 109 training loss is : 0.01032
batch 109 training accuracy is : 1.00000
batch 110 training loss is : 0.13247
batch 110 training accuracy is : 0.93750
batch 111 training loss is : 0.02972
batch 111 training accuracy is : 1.00000
batch 112 training loss 

batch 68 training loss is : 0.21077
batch 68 training accuracy is : 0.93750
batch 69 training loss is : 0.07906
batch 69 training accuracy is : 0.93750
batch 70 training loss is : 0.01471
batch 70 training accuracy is : 1.00000
batch 71 training loss is : 0.00000
batch 71 training accuracy is : 1.00000
batch 72 training loss is : 0.03500
batch 72 training accuracy is : 1.00000
batch 73 training loss is : 0.30180
batch 73 training accuracy is : 0.93750
batch 74 training loss is : 0.00297
batch 74 training accuracy is : 1.00000
batch 75 training loss is : 0.04483
batch 75 training accuracy is : 1.00000
batch 76 training loss is : 0.08422
batch 76 training accuracy is : 0.93750
batch 77 training loss is : 0.00008
batch 77 training accuracy is : 1.00000
batch 78 training loss is : 0.01693
batch 78 training accuracy is : 1.00000
batch 79 training loss is : 0.00492
batch 79 training accuracy is : 1.00000
batch 80 training loss is : 0.03001
batch 80 training accuracy is : 1.00000
batch 81 tra

batch 37 training loss is : 0.11003
batch 37 training accuracy is : 0.93750
batch 38 training loss is : 0.13113
batch 38 training accuracy is : 0.93750
batch 39 training loss is : 0.03621
batch 39 training accuracy is : 1.00000
batch 40 training loss is : 0.00272
batch 40 training accuracy is : 1.00000
batch 41 training loss is : 0.00042
batch 41 training accuracy is : 1.00000
batch 42 training loss is : 0.01824
batch 42 training accuracy is : 1.00000
batch 43 training loss is : 0.02809
batch 43 training accuracy is : 1.00000
batch 44 training loss is : 0.13406
batch 44 training accuracy is : 0.87500
batch 45 training loss is : 0.03849
batch 45 training accuracy is : 1.00000
batch 46 training loss is : 0.60224
batch 46 training accuracy is : 0.75000
batch 47 training loss is : 0.09951
batch 47 training accuracy is : 0.93750
batch 48 training loss is : 0.02967
batch 48 training accuracy is : 1.00000
batch 49 training loss is : 0.05161
batch 49 training accuracy is : 1.00000
batch 50 tra

batch 5 training loss is : 0.00342
batch 5 training accuracy is : 1.00000
batch 6 training loss is : 0.01465
batch 6 training accuracy is : 1.00000
batch 7 training loss is : 0.04971
batch 7 training accuracy is : 1.00000
batch 8 training loss is : 0.04655
batch 8 training accuracy is : 1.00000
batch 9 training loss is : 0.01009
batch 9 training accuracy is : 1.00000
batch 10 training loss is : 0.05623
batch 10 training accuracy is : 1.00000
batch 11 training loss is : 0.00343
batch 11 training accuracy is : 1.00000
batch 12 training loss is : 0.01299
batch 12 training accuracy is : 1.00000
batch 13 training loss is : 0.10993
batch 13 training accuracy is : 0.93750
batch 14 training loss is : 0.06153
batch 14 training accuracy is : 0.93750
batch 15 training loss is : 0.19078
batch 15 training accuracy is : 0.93750
batch 16 training loss is : 0.01031
batch 16 training accuracy is : 1.00000
batch 17 training loss is : 0.12793
batch 17 training accuracy is : 1.00000
batch 18 training loss

Average training loss is 0.07465 at the end of epoch 157
Average training accuracy is 0.96156 at the end of epoch 157
batch 0 dev loss is : 0.91546
batch 0 dev accuracy is : 0.81250
batch 1 dev loss is : 0.14527
batch 1 dev accuracy is : 0.93750
batch 2 dev loss is : 0.58564
batch 2 dev accuracy is : 0.81250
batch 3 dev loss is : 0.69284
batch 3 dev accuracy is : 0.81250
batch 4 dev loss is : 0.81739
batch 4 dev accuracy is : 0.81250
batch 5 dev loss is : 0.76050
batch 5 dev accuracy is : 0.75000
batch 6 dev loss is : 0.36017
batch 6 dev accuracy is : 0.93750
batch 7 dev loss is : 2.12898
batch 7 dev accuracy is : 0.81250
batch 8 dev loss is : 1.65746
batch 8 dev accuracy is : 0.62500
batch 9 dev loss is : 0.59376
batch 9 dev accuracy is : 0.87500
batch 10 dev loss is : 2.32636
batch 10 dev accuracy is : 0.62500
batch 11 dev loss is : 2.47121
batch 11 dev accuracy is : 0.62500
batch 12 dev loss is : 1.49291
batch 12 dev accuracy is : 0.81250
batch 13 dev loss is : 2.33499
batch 13 dev 

batch 82 training loss is : 0.10266
batch 82 training accuracy is : 1.00000
batch 83 training loss is : 0.00380
batch 83 training accuracy is : 1.00000
batch 84 training loss is : 0.00493
batch 84 training accuracy is : 1.00000
batch 85 training loss is : 0.19166
batch 85 training accuracy is : 0.93750
batch 86 training loss is : 0.11251
batch 86 training accuracy is : 0.93750
batch 87 training loss is : 0.07123
batch 87 training accuracy is : 0.93750
batch 88 training loss is : 0.01550
batch 88 training accuracy is : 1.00000
batch 89 training loss is : 0.13658
batch 89 training accuracy is : 0.93750
batch 90 training loss is : 0.02102
batch 90 training accuracy is : 1.00000
batch 91 training loss is : 0.09462
batch 91 training accuracy is : 0.93750
batch 92 training loss is : 0.00540
batch 92 training accuracy is : 1.00000
batch 93 training loss is : 0.00276
batch 93 training accuracy is : 1.00000
batch 94 training loss is : 0.12426
batch 94 training accuracy is : 0.93750
batch 95 tra

batch 50 training loss is : 0.03474
batch 50 training accuracy is : 1.00000
batch 51 training loss is : 0.29740
batch 51 training accuracy is : 0.93750
batch 52 training loss is : 0.07517
batch 52 training accuracy is : 0.93750
batch 53 training loss is : 0.00183
batch 53 training accuracy is : 1.00000
batch 54 training loss is : 0.63747
batch 54 training accuracy is : 0.75000
batch 55 training loss is : 0.13996
batch 55 training accuracy is : 0.93750
batch 56 training loss is : 0.02437
batch 56 training accuracy is : 1.00000
batch 57 training loss is : 0.10960
batch 57 training accuracy is : 0.93750
batch 58 training loss is : 0.02242
batch 58 training accuracy is : 1.00000
batch 59 training loss is : 0.08738
batch 59 training accuracy is : 0.93750
batch 60 training loss is : 0.09452
batch 60 training accuracy is : 0.93750
batch 61 training loss is : 0.04113
batch 61 training accuracy is : 1.00000
batch 62 training loss is : 0.02851
batch 62 training accuracy is : 1.00000
batch 63 tra

batch 20 training loss is : 0.00000
batch 20 training accuracy is : 1.00000
batch 21 training loss is : 0.12073
batch 21 training accuracy is : 0.93750
batch 22 training loss is : 0.05146
batch 22 training accuracy is : 0.93750
batch 23 training loss is : 0.13329
batch 23 training accuracy is : 0.93750
batch 24 training loss is : 0.12761
batch 24 training accuracy is : 0.87500
batch 25 training loss is : 0.02076
batch 25 training accuracy is : 1.00000
batch 26 training loss is : 0.01715
batch 26 training accuracy is : 1.00000
batch 27 training loss is : 0.00109
batch 27 training accuracy is : 1.00000
batch 28 training loss is : 0.05678
batch 28 training accuracy is : 0.93750
batch 29 training loss is : 0.01695
batch 29 training accuracy is : 1.00000
batch 30 training loss is : 0.04513
batch 30 training accuracy is : 1.00000
batch 31 training loss is : 0.02102
batch 31 training accuracy is : 1.00000
batch 32 training loss is : 0.13110
batch 32 training accuracy is : 0.93750
batch 33 tra

batch 18 dev loss is : 3.12298
batch 18 dev accuracy is : 0.62500
batch 19 dev loss is : 2.64651
batch 19 dev accuracy is : 0.75000
batch 20 dev loss is : 2.18118
batch 20 dev accuracy is : 0.68750
batch 21 dev loss is : 2.28616
batch 21 dev accuracy is : 0.68750
batch 22 dev loss is : 1.49745
batch 22 dev accuracy is : 0.81250
batch 23 dev loss is : 0.96976
batch 23 dev accuracy is : 0.81250
batch 24 dev loss is : 1.10441
batch 24 dev accuracy is : 0.81250
batch 25 dev loss is : 2.12507
batch 25 dev accuracy is : 0.62500
batch 26 dev loss is : 2.38532
batch 26 dev accuracy is : 0.81250
batch 27 dev loss is : 1.02675
batch 27 dev accuracy is : 0.68750
Average validation loss is 1.74472 at the end of epoch 160
Average validation accuracy is 0.70779 at the end of epoch 160
At 161-th epoch.
batch 0 training loss is : 0.00519
batch 0 training accuracy is : 1.00000
batch 1 training loss is : 0.11002
batch 1 training accuracy is : 0.93750
batch 2 training loss is : 0.01687
batch 2 training a

batch 99 training loss is : 0.11853
batch 99 training accuracy is : 0.93750
batch 100 training loss is : 0.20442
batch 100 training accuracy is : 0.93750
batch 101 training loss is : 0.03585
batch 101 training accuracy is : 1.00000
batch 102 training loss is : 0.00168
batch 102 training accuracy is : 1.00000
batch 103 training loss is : 0.01604
batch 103 training accuracy is : 1.00000
batch 104 training loss is : 0.18456
batch 104 training accuracy is : 0.93750
batch 105 training loss is : 0.04822
batch 105 training accuracy is : 1.00000
batch 106 training loss is : 0.01588
batch 106 training accuracy is : 1.00000
batch 107 training loss is : 0.00194
batch 107 training accuracy is : 1.00000
batch 108 training loss is : 0.11071
batch 108 training accuracy is : 0.93750
batch 109 training loss is : 0.02067
batch 109 training accuracy is : 1.00000
batch 110 training loss is : 0.03286
batch 110 training accuracy is : 1.00000
batch 111 training loss is : 0.00118
batch 111 training accuracy i

batch 70 training loss is : 0.00436
batch 70 training accuracy is : 1.00000
batch 71 training loss is : 0.01631
batch 71 training accuracy is : 1.00000
batch 72 training loss is : 0.11596
batch 72 training accuracy is : 0.93750
batch 73 training loss is : 0.30242
batch 73 training accuracy is : 0.93750
batch 74 training loss is : 0.00001
batch 74 training accuracy is : 1.00000
batch 75 training loss is : 0.07622
batch 75 training accuracy is : 0.93750
batch 76 training loss is : 0.20119
batch 76 training accuracy is : 0.93750
batch 77 training loss is : 0.21852
batch 77 training accuracy is : 0.93750
batch 78 training loss is : 0.19206
batch 78 training accuracy is : 0.93750
batch 79 training loss is : 0.13012
batch 79 training accuracy is : 0.93750
batch 80 training loss is : 0.00615
batch 80 training accuracy is : 1.00000
batch 81 training loss is : 0.21008
batch 81 training accuracy is : 0.93750
batch 82 training loss is : 0.11470
batch 82 training accuracy is : 0.93750
batch 83 tra

batch 38 training loss is : 0.03240
batch 38 training accuracy is : 1.00000
batch 39 training loss is : 0.00405
batch 39 training accuracy is : 1.00000
batch 40 training loss is : 0.00939
batch 40 training accuracy is : 1.00000
batch 41 training loss is : 0.46372
batch 41 training accuracy is : 0.87500
batch 42 training loss is : 0.00050
batch 42 training accuracy is : 1.00000
batch 43 training loss is : 0.02411
batch 43 training accuracy is : 1.00000
batch 44 training loss is : 0.08877
batch 44 training accuracy is : 0.93750
batch 45 training loss is : 0.29463
batch 45 training accuracy is : 0.81250
batch 46 training loss is : 0.12741
batch 46 training accuracy is : 0.93750
batch 47 training loss is : 0.01566
batch 47 training accuracy is : 1.00000
batch 48 training loss is : 0.04587
batch 48 training accuracy is : 1.00000
batch 49 training loss is : 0.12782
batch 49 training accuracy is : 0.93750
batch 50 training loss is : 0.03058
batch 50 training accuracy is : 1.00000
batch 51 tra

batch 9 training loss is : 0.03327
batch 9 training accuracy is : 1.00000
batch 10 training loss is : 0.00446
batch 10 training accuracy is : 1.00000
batch 11 training loss is : 0.04357
batch 11 training accuracy is : 1.00000
batch 12 training loss is : 0.03362
batch 12 training accuracy is : 1.00000
batch 13 training loss is : 0.19740
batch 13 training accuracy is : 0.93750
batch 14 training loss is : 0.06816
batch 14 training accuracy is : 0.93750
batch 15 training loss is : 0.03297
batch 15 training accuracy is : 1.00000
batch 16 training loss is : 0.17923
batch 16 training accuracy is : 0.93750
batch 17 training loss is : 0.01660
batch 17 training accuracy is : 1.00000
batch 18 training loss is : 0.00307
batch 18 training accuracy is : 1.00000
batch 19 training loss is : 0.00043
batch 19 training accuracy is : 1.00000
batch 20 training loss is : 0.03105
batch 20 training accuracy is : 1.00000
batch 21 training loss is : 0.02321
batch 21 training accuracy is : 1.00000
batch 22 train

batch 3 dev loss is : 0.55127
batch 3 dev accuracy is : 0.81250
batch 4 dev loss is : 0.88285
batch 4 dev accuracy is : 0.81250
batch 5 dev loss is : 0.28615
batch 5 dev accuracy is : 0.87500
batch 6 dev loss is : 0.29928
batch 6 dev accuracy is : 0.93750
batch 7 dev loss is : 1.95879
batch 7 dev accuracy is : 0.81250
batch 8 dev loss is : 1.69948
batch 8 dev accuracy is : 0.68750
batch 9 dev loss is : 0.51815
batch 9 dev accuracy is : 0.93750
batch 10 dev loss is : 1.58285
batch 10 dev accuracy is : 0.81250
batch 11 dev loss is : 1.57769
batch 11 dev accuracy is : 0.62500
batch 12 dev loss is : 1.60230
batch 12 dev accuracy is : 0.75000
batch 13 dev loss is : 1.94126
batch 13 dev accuracy is : 0.75000
batch 14 dev loss is : 0.85264
batch 14 dev accuracy is : 0.81250
batch 15 dev loss is : 0.45806
batch 15 dev accuracy is : 0.87500
batch 16 dev loss is : 1.04696
batch 16 dev accuracy is : 0.75000
batch 17 dev loss is : 2.07168
batch 17 dev accuracy is : 0.62500
batch 18 dev loss is : 1

batch 85 training loss is : 0.00001
batch 85 training accuracy is : 1.00000
batch 86 training loss is : 0.02155
batch 86 training accuracy is : 1.00000
batch 87 training loss is : 0.04095
batch 87 training accuracy is : 1.00000
batch 88 training loss is : 0.11362
batch 88 training accuracy is : 0.93750
batch 89 training loss is : 0.02565
batch 89 training accuracy is : 1.00000
batch 90 training loss is : 0.00717
batch 90 training accuracy is : 1.00000
batch 91 training loss is : 0.11469
batch 91 training accuracy is : 0.93750
batch 92 training loss is : 0.00000
batch 92 training accuracy is : 1.00000
batch 93 training loss is : 0.01396
batch 93 training accuracy is : 1.00000
batch 94 training loss is : 0.00560
batch 94 training accuracy is : 1.00000
batch 95 training loss is : 0.00663
batch 95 training accuracy is : 1.00000
batch 96 training loss is : 0.13333
batch 96 training accuracy is : 0.93750
batch 97 training loss is : 0.02546
batch 97 training accuracy is : 1.00000
batch 98 tra

batch 56 training loss is : 0.03390
batch 56 training accuracy is : 1.00000
batch 57 training loss is : 0.10848
batch 57 training accuracy is : 0.93750
batch 58 training loss is : 0.25214
batch 58 training accuracy is : 0.93750
batch 59 training loss is : 0.01960
batch 59 training accuracy is : 1.00000
batch 60 training loss is : 0.00129
batch 60 training accuracy is : 1.00000
batch 61 training loss is : 0.03954
batch 61 training accuracy is : 1.00000
batch 62 training loss is : 0.23747
batch 62 training accuracy is : 0.93750
batch 63 training loss is : 0.21087
batch 63 training accuracy is : 0.93750
batch 64 training loss is : 0.03232
batch 64 training accuracy is : 1.00000
batch 65 training loss is : 0.09444
batch 65 training accuracy is : 0.93750
batch 66 training loss is : 0.17700
batch 66 training accuracy is : 0.93750
batch 67 training loss is : 0.01360
batch 67 training accuracy is : 1.00000
batch 68 training loss is : 0.03569
batch 68 training accuracy is : 1.00000
batch 69 tra

batch 26 training loss is : 0.04068
batch 26 training accuracy is : 1.00000
batch 27 training loss is : 0.00080
batch 27 training accuracy is : 1.00000
batch 28 training loss is : 0.00230
batch 28 training accuracy is : 1.00000
batch 29 training loss is : 0.03185
batch 29 training accuracy is : 1.00000
batch 30 training loss is : 0.15045
batch 30 training accuracy is : 0.93750
batch 31 training loss is : 0.02837
batch 31 training accuracy is : 1.00000
batch 32 training loss is : 0.08350
batch 32 training accuracy is : 0.93750
batch 33 training loss is : 0.06121
batch 33 training accuracy is : 0.93750
batch 34 training loss is : 0.00950
batch 34 training accuracy is : 1.00000
batch 35 training loss is : 0.10992
batch 35 training accuracy is : 0.93750
batch 36 training loss is : 0.25583
batch 36 training accuracy is : 0.87500
batch 37 training loss is : 0.11218
batch 37 training accuracy is : 0.93750
batch 38 training loss is : 0.04145
batch 38 training accuracy is : 1.00000
batch 39 tra

batch 27 dev loss is : 1.03278
batch 27 dev accuracy is : 0.81250
Average validation loss is 1.57339 at the end of epoch 167
Average validation accuracy is 0.72511 at the end of epoch 167
At 168-th epoch.
batch 0 training loss is : 0.10066
batch 0 training accuracy is : 0.93750
batch 1 training loss is : 0.01396
batch 1 training accuracy is : 1.00000
batch 2 training loss is : 0.07975
batch 2 training accuracy is : 0.93750
batch 3 training loss is : 0.02961
batch 3 training accuracy is : 1.00000
batch 4 training loss is : 0.32445
batch 4 training accuracy is : 0.87500
batch 5 training loss is : 0.03733
batch 5 training accuracy is : 1.00000
batch 6 training loss is : 0.06215
batch 6 training accuracy is : 0.93750
batch 7 training loss is : 0.03940
batch 7 training accuracy is : 1.00000
batch 8 training loss is : 0.09804
batch 8 training accuracy is : 0.93750
batch 9 training loss is : 0.00010
batch 9 training accuracy is : 1.00000
batch 10 training loss is : 0.00508
batch 10 training a

batch 110 training loss is : 0.00426
batch 110 training accuracy is : 1.00000
batch 111 training loss is : 0.03447
batch 111 training accuracy is : 1.00000
batch 112 training loss is : 0.03498
batch 112 training accuracy is : 1.00000
Average training loss is 0.07591 at the end of epoch 168
Average training accuracy is 0.96595 at the end of epoch 168
batch 0 dev loss is : 0.76553
batch 0 dev accuracy is : 0.75000
batch 1 dev loss is : 0.28516
batch 1 dev accuracy is : 0.87500
batch 2 dev loss is : 0.51934
batch 2 dev accuracy is : 0.87500
batch 3 dev loss is : 0.93202
batch 3 dev accuracy is : 0.81250
batch 4 dev loss is : 0.75632
batch 4 dev accuracy is : 0.81250
batch 5 dev loss is : 0.39121
batch 5 dev accuracy is : 0.87500
batch 6 dev loss is : 0.76851
batch 6 dev accuracy is : 0.75000
batch 7 dev loss is : 1.65748
batch 7 dev accuracy is : 0.75000
batch 8 dev loss is : 2.13760
batch 8 dev accuracy is : 0.62500
batch 9 dev loss is : 0.62064
batch 9 dev accuracy is : 0.81250
batch 10

batch 81 training loss is : 0.08731
batch 81 training accuracy is : 0.93750
batch 82 training loss is : 0.01854
batch 82 training accuracy is : 1.00000
batch 83 training loss is : 0.21220
batch 83 training accuracy is : 0.87500
batch 84 training loss is : 0.00248
batch 84 training accuracy is : 1.00000
batch 85 training loss is : 0.01235
batch 85 training accuracy is : 1.00000
batch 86 training loss is : 0.01686
batch 86 training accuracy is : 1.00000
batch 87 training loss is : 0.00004
batch 87 training accuracy is : 1.00000
batch 88 training loss is : 0.01715
batch 88 training accuracy is : 1.00000
batch 89 training loss is : 0.41255
batch 89 training accuracy is : 0.93750
batch 90 training loss is : 0.00192
batch 90 training accuracy is : 1.00000
batch 91 training loss is : 0.01106
batch 91 training accuracy is : 1.00000
batch 92 training loss is : 0.12740
batch 92 training accuracy is : 0.93750
batch 93 training loss is : 0.00900
batch 93 training accuracy is : 1.00000
batch 94 tra

batch 50 training loss is : 0.22073
batch 50 training accuracy is : 0.87500
batch 51 training loss is : 0.02814
batch 51 training accuracy is : 1.00000
batch 52 training loss is : 0.00758
batch 52 training accuracy is : 1.00000
batch 53 training loss is : 0.23596
batch 53 training accuracy is : 0.93750
batch 54 training loss is : 0.21000
batch 54 training accuracy is : 0.87500
batch 55 training loss is : 0.01163
batch 55 training accuracy is : 1.00000
batch 56 training loss is : 0.00662
batch 56 training accuracy is : 1.00000
batch 57 training loss is : 0.01820
batch 57 training accuracy is : 1.00000
batch 58 training loss is : 0.06088
batch 58 training accuracy is : 0.93750
batch 59 training loss is : 0.00811
batch 59 training accuracy is : 1.00000
batch 60 training loss is : 0.01375
batch 60 training accuracy is : 1.00000
batch 61 training loss is : 0.01109
batch 61 training accuracy is : 1.00000
batch 62 training loss is : 0.09373
batch 62 training accuracy is : 0.93750
batch 63 tra

batch 19 training loss is : 0.31754
batch 19 training accuracy is : 0.93750
batch 20 training loss is : 0.00848
batch 20 training accuracy is : 1.00000
batch 21 training loss is : 0.02603
batch 21 training accuracy is : 1.00000
batch 22 training loss is : 0.00394
batch 22 training accuracy is : 1.00000
batch 23 training loss is : 0.07617
batch 23 training accuracy is : 0.93750
batch 24 training loss is : 0.00008
batch 24 training accuracy is : 1.00000
batch 25 training loss is : 0.05043
batch 25 training accuracy is : 1.00000
batch 26 training loss is : 0.02326
batch 26 training accuracy is : 1.00000
batch 27 training loss is : 0.02253
batch 27 training accuracy is : 1.00000
batch 28 training loss is : 0.00121
batch 28 training accuracy is : 1.00000
batch 29 training loss is : 0.00036
batch 29 training accuracy is : 1.00000
batch 30 training loss is : 0.00808
batch 30 training accuracy is : 1.00000
batch 31 training loss is : 0.15833
batch 31 training accuracy is : 0.93750
batch 32 tra

batch 17 dev loss is : 1.74404
batch 17 dev accuracy is : 0.62500
batch 18 dev loss is : 1.90571
batch 18 dev accuracy is : 0.62500
batch 19 dev loss is : 2.36598
batch 19 dev accuracy is : 0.87500
batch 20 dev loss is : 1.23984
batch 20 dev accuracy is : 0.81250
batch 21 dev loss is : 2.26951
batch 21 dev accuracy is : 0.81250
batch 22 dev loss is : 1.15969
batch 22 dev accuracy is : 0.81250
batch 23 dev loss is : 0.32308
batch 23 dev accuracy is : 0.87500
batch 24 dev loss is : 0.36523
batch 24 dev accuracy is : 0.93750
batch 25 dev loss is : 0.46254
batch 25 dev accuracy is : 0.81250
batch 26 dev loss is : 2.23046
batch 26 dev accuracy is : 0.68750
batch 27 dev loss is : 1.37738
batch 27 dev accuracy is : 0.75000
Average validation loss is 1.12346 at the end of epoch 171
Average validation accuracy is 0.77056 at the end of epoch 171
At 172-th epoch.
batch 0 training loss is : 0.38390
batch 0 training accuracy is : 0.87500
batch 1 training loss is : 0.14540
batch 1 training accuracy 

batch 98 training loss is : 0.15017
batch 98 training accuracy is : 0.93750
batch 99 training loss is : 0.43704
batch 99 training accuracy is : 0.87500
batch 100 training loss is : 0.00842
batch 100 training accuracy is : 1.00000
batch 101 training loss is : 0.09795
batch 101 training accuracy is : 0.93750
batch 102 training loss is : 0.06152
batch 102 training accuracy is : 0.93750
batch 103 training loss is : 0.03946
batch 103 training accuracy is : 1.00000
batch 104 training loss is : 0.00857
batch 104 training accuracy is : 1.00000
batch 105 training loss is : 0.00332
batch 105 training accuracy is : 1.00000
batch 106 training loss is : 0.08086
batch 106 training accuracy is : 0.93750
batch 107 training loss is : 0.00382
batch 107 training accuracy is : 1.00000
batch 108 training loss is : 0.04501
batch 108 training accuracy is : 1.00000
batch 109 training loss is : 0.33585
batch 109 training accuracy is : 0.87500
batch 110 training loss is : 0.00633
batch 110 training accuracy is 

batch 66 training loss is : 0.00685
batch 66 training accuracy is : 1.00000
batch 67 training loss is : 0.00767
batch 67 training accuracy is : 1.00000
batch 68 training loss is : 0.01169
batch 68 training accuracy is : 1.00000
batch 69 training loss is : 0.04099
batch 69 training accuracy is : 1.00000
batch 70 training loss is : 0.02400
batch 70 training accuracy is : 1.00000
batch 71 training loss is : 0.03122
batch 71 training accuracy is : 1.00000
batch 72 training loss is : 0.02496
batch 72 training accuracy is : 1.00000
batch 73 training loss is : 0.01376
batch 73 training accuracy is : 1.00000
batch 74 training loss is : 0.09383
batch 74 training accuracy is : 0.93750
batch 75 training loss is : 0.13542
batch 75 training accuracy is : 0.93750
batch 76 training loss is : 0.01895
batch 76 training accuracy is : 1.00000
batch 77 training loss is : 0.18469
batch 77 training accuracy is : 0.87500
batch 78 training loss is : 0.22476
batch 78 training accuracy is : 0.93750
batch 79 tra

batch 36 training loss is : 0.00073
batch 36 training accuracy is : 1.00000
batch 37 training loss is : 0.10800
batch 37 training accuracy is : 0.93750
batch 38 training loss is : 0.12384
batch 38 training accuracy is : 1.00000
batch 39 training loss is : 0.00466
batch 39 training accuracy is : 1.00000
batch 40 training loss is : 0.00002
batch 40 training accuracy is : 1.00000
batch 41 training loss is : 0.04373
batch 41 training accuracy is : 1.00000
batch 42 training loss is : 0.00266
batch 42 training accuracy is : 1.00000
batch 43 training loss is : 0.02271
batch 43 training accuracy is : 1.00000
batch 44 training loss is : 0.05597
batch 44 training accuracy is : 1.00000
batch 45 training loss is : 0.00000
batch 45 training accuracy is : 1.00000
batch 46 training loss is : 0.08365
batch 46 training accuracy is : 0.93750
batch 47 training loss is : 0.03435
batch 47 training accuracy is : 1.00000
batch 48 training loss is : 0.04211
batch 48 training accuracy is : 1.00000
batch 49 tra

batch 4 training loss is : 0.01939
batch 4 training accuracy is : 1.00000
batch 5 training loss is : 0.00165
batch 5 training accuracy is : 1.00000
batch 6 training loss is : 0.20501
batch 6 training accuracy is : 0.93750
batch 7 training loss is : 0.15744
batch 7 training accuracy is : 0.93750
batch 8 training loss is : 0.00769
batch 8 training accuracy is : 1.00000
batch 9 training loss is : 0.13575
batch 9 training accuracy is : 0.93750
batch 10 training loss is : 0.03062
batch 10 training accuracy is : 1.00000
batch 11 training loss is : 0.25823
batch 11 training accuracy is : 0.93750
batch 12 training loss is : 0.20526
batch 12 training accuracy is : 0.93750
batch 13 training loss is : 0.06347
batch 13 training accuracy is : 0.93750
batch 14 training loss is : 0.00196
batch 14 training accuracy is : 1.00000
batch 15 training loss is : 0.12095
batch 15 training accuracy is : 0.93750
batch 16 training loss is : 0.09243
batch 16 training accuracy is : 0.93750
batch 17 training loss i

Average training loss is 0.05995 at the end of epoch 175
Average training accuracy is 0.96980 at the end of epoch 175
batch 0 dev loss is : 0.85951
batch 0 dev accuracy is : 0.81250
batch 1 dev loss is : 0.14835
batch 1 dev accuracy is : 0.87500
batch 2 dev loss is : 0.60648
batch 2 dev accuracy is : 0.87500
batch 3 dev loss is : 0.65419
batch 3 dev accuracy is : 0.81250
batch 4 dev loss is : 0.69378
batch 4 dev accuracy is : 0.81250
batch 5 dev loss is : 0.37988
batch 5 dev accuracy is : 0.87500
batch 6 dev loss is : 0.66750
batch 6 dev accuracy is : 0.81250
batch 7 dev loss is : 1.74167
batch 7 dev accuracy is : 0.81250
batch 8 dev loss is : 2.20773
batch 8 dev accuracy is : 0.62500
batch 9 dev loss is : 0.61841
batch 9 dev accuracy is : 0.87500
batch 10 dev loss is : 1.60141
batch 10 dev accuracy is : 0.62500
batch 11 dev loss is : 2.37453
batch 11 dev accuracy is : 0.62500
batch 12 dev loss is : 1.64453
batch 12 dev accuracy is : 0.81250
batch 13 dev loss is : 1.97303
batch 13 dev 

batch 84 training loss is : 0.01224
batch 84 training accuracy is : 1.00000
batch 85 training loss is : 0.01984
batch 85 training accuracy is : 1.00000
batch 86 training loss is : 0.12985
batch 86 training accuracy is : 0.93750
batch 87 training loss is : 0.02082
batch 87 training accuracy is : 1.00000
batch 88 training loss is : 0.00119
batch 88 training accuracy is : 1.00000
batch 89 training loss is : 0.00546
batch 89 training accuracy is : 1.00000
batch 90 training loss is : 0.13991
batch 90 training accuracy is : 0.93750
batch 91 training loss is : 0.00629
batch 91 training accuracy is : 1.00000
batch 92 training loss is : 0.07890
batch 92 training accuracy is : 0.93750
batch 93 training loss is : 0.20593
batch 93 training accuracy is : 0.93750
batch 94 training loss is : 0.04651
batch 94 training accuracy is : 0.93750
batch 95 training loss is : 0.00233
batch 95 training accuracy is : 1.00000
batch 96 training loss is : 0.00233
batch 96 training accuracy is : 1.00000
batch 97 tra

batch 51 training accuracy is : 1.00000
batch 52 training loss is : 0.00829
batch 52 training accuracy is : 1.00000
batch 53 training loss is : 0.00062
batch 53 training accuracy is : 1.00000
batch 54 training loss is : 0.03396
batch 54 training accuracy is : 1.00000
batch 55 training loss is : 0.08572
batch 55 training accuracy is : 0.93750
batch 56 training loss is : 0.15284
batch 56 training accuracy is : 0.93750
batch 57 training loss is : 0.02091
batch 57 training accuracy is : 1.00000
batch 58 training loss is : 0.05660
batch 58 training accuracy is : 0.93750
batch 59 training loss is : 0.00174
batch 59 training accuracy is : 1.00000
batch 60 training loss is : 0.01675
batch 60 training accuracy is : 1.00000
batch 61 training loss is : 0.00134
batch 61 training accuracy is : 1.00000
batch 62 training loss is : 0.10284
batch 62 training accuracy is : 0.93750
batch 63 training loss is : 0.08975
batch 63 training accuracy is : 0.93750
batch 64 training loss is : 0.09657
batch 64 tra

batch 22 training loss is : 0.08616
batch 22 training accuracy is : 0.93750
batch 23 training loss is : 0.00078
batch 23 training accuracy is : 1.00000
batch 24 training loss is : 0.10090
batch 24 training accuracy is : 0.87500
batch 25 training loss is : 0.02466
batch 25 training accuracy is : 1.00000
batch 26 training loss is : 0.13138
batch 26 training accuracy is : 0.93750
batch 27 training loss is : 0.01075
batch 27 training accuracy is : 1.00000
batch 28 training loss is : 0.00863
batch 28 training accuracy is : 1.00000
batch 29 training loss is : 0.03648
batch 29 training accuracy is : 1.00000
batch 30 training loss is : 0.00021
batch 30 training accuracy is : 1.00000
batch 31 training loss is : 0.28639
batch 31 training accuracy is : 0.93750
batch 32 training loss is : 0.00942
batch 32 training accuracy is : 1.00000
batch 33 training loss is : 0.02550
batch 33 training accuracy is : 1.00000
batch 34 training loss is : 0.13896
batch 34 training accuracy is : 0.93750
batch 35 tra

batch 19 dev loss is : 2.52788
batch 19 dev accuracy is : 0.81250
batch 20 dev loss is : 1.43458
batch 20 dev accuracy is : 0.75000
batch 21 dev loss is : 2.32582
batch 21 dev accuracy is : 0.75000
batch 22 dev loss is : 1.06001
batch 22 dev accuracy is : 0.81250
batch 23 dev loss is : 0.36867
batch 23 dev accuracy is : 0.81250
batch 24 dev loss is : 0.57420
batch 24 dev accuracy is : 0.87500
batch 25 dev loss is : 1.25807
batch 25 dev accuracy is : 0.75000
batch 26 dev loss is : 1.90443
batch 26 dev accuracy is : 0.68750
batch 27 dev loss is : 1.38645
batch 27 dev accuracy is : 0.68750
Average validation loss is 1.26918 at the end of epoch 178
Average validation accuracy is 0.74459 at the end of epoch 178
At 179-th epoch.
batch 0 training loss is : 0.00532
batch 0 training accuracy is : 1.00000
batch 1 training loss is : 0.03006
batch 1 training accuracy is : 1.00000
batch 2 training loss is : 0.03682
batch 2 training accuracy is : 1.00000
batch 3 training loss is : 0.00000
batch 3 tr

batch 99 training loss is : 0.00038
batch 99 training accuracy is : 1.00000
batch 100 training loss is : 0.26685
batch 100 training accuracy is : 0.87500
batch 101 training loss is : 0.11130
batch 101 training accuracy is : 0.93750
batch 102 training loss is : 0.04069
batch 102 training accuracy is : 1.00000
batch 103 training loss is : 0.37476
batch 103 training accuracy is : 0.87500
batch 104 training loss is : 0.21158
batch 104 training accuracy is : 0.93750
batch 105 training loss is : 0.01144
batch 105 training accuracy is : 1.00000
batch 106 training loss is : 0.00598
batch 106 training accuracy is : 1.00000
batch 107 training loss is : 0.01174
batch 107 training accuracy is : 1.00000
batch 108 training loss is : 0.02309
batch 108 training accuracy is : 1.00000
batch 109 training loss is : 0.05392
batch 109 training accuracy is : 1.00000
batch 110 training loss is : 0.19791
batch 110 training accuracy is : 0.87500
batch 111 training loss is : 0.01486
batch 111 training accuracy i

batch 70 training loss is : 0.02375
batch 70 training accuracy is : 1.00000
batch 71 training loss is : 0.15403
batch 71 training accuracy is : 0.93750
batch 72 training loss is : 0.00216
batch 72 training accuracy is : 1.00000
batch 73 training loss is : 0.01899
batch 73 training accuracy is : 1.00000
batch 74 training loss is : 0.00067
batch 74 training accuracy is : 1.00000
batch 75 training loss is : 0.13778
batch 75 training accuracy is : 0.93750
batch 76 training loss is : 0.03314
batch 76 training accuracy is : 1.00000
batch 77 training loss is : 0.11440
batch 77 training accuracy is : 0.93750
batch 78 training loss is : 0.02324
batch 78 training accuracy is : 1.00000
batch 79 training loss is : 0.11199
batch 79 training accuracy is : 0.93750
batch 80 training loss is : 0.01322
batch 80 training accuracy is : 1.00000
batch 81 training loss is : 0.03264
batch 81 training accuracy is : 1.00000
batch 82 training loss is : 0.07653
batch 82 training accuracy is : 0.93750
batch 83 tra

batch 40 training loss is : 0.13751
batch 40 training accuracy is : 0.93750
batch 41 training loss is : 0.00095
batch 41 training accuracy is : 1.00000
batch 42 training loss is : 0.21175
batch 42 training accuracy is : 0.93750
batch 43 training loss is : 0.06204
batch 43 training accuracy is : 0.93750
batch 44 training loss is : 0.17682
batch 44 training accuracy is : 0.93750
batch 45 training loss is : 0.12512
batch 45 training accuracy is : 0.93750
batch 46 training loss is : 0.01981
batch 46 training accuracy is : 1.00000
batch 47 training loss is : 0.00522
batch 47 training accuracy is : 1.00000
batch 48 training loss is : 0.06238
batch 48 training accuracy is : 0.93750
batch 49 training loss is : 0.02394
batch 49 training accuracy is : 1.00000
batch 50 training loss is : 0.00734
batch 50 training accuracy is : 1.00000
batch 51 training loss is : 0.00863
batch 51 training accuracy is : 1.00000
batch 52 training loss is : 0.09124
batch 52 training accuracy is : 0.93750
batch 53 tra

batch 10 training loss is : 0.01384
batch 10 training accuracy is : 1.00000
batch 11 training loss is : 0.13418
batch 11 training accuracy is : 0.87500
batch 12 training loss is : 0.38623
batch 12 training accuracy is : 0.87500
batch 13 training loss is : 0.00416
batch 13 training accuracy is : 1.00000
batch 14 training loss is : 0.00190
batch 14 training accuracy is : 1.00000
batch 15 training loss is : 0.00545
batch 15 training accuracy is : 1.00000
batch 16 training loss is : 0.22454
batch 16 training accuracy is : 0.93750
batch 17 training loss is : 0.02379
batch 17 training accuracy is : 1.00000
batch 18 training loss is : 0.00349
batch 18 training accuracy is : 1.00000
batch 19 training loss is : 0.00396
batch 19 training accuracy is : 1.00000
batch 20 training loss is : 0.07301
batch 20 training accuracy is : 0.93750
batch 21 training loss is : 0.03875
batch 21 training accuracy is : 1.00000
batch 22 training loss is : 0.04505
batch 22 training accuracy is : 0.93750
batch 23 tra

batch 4 dev loss is : 0.83750
batch 4 dev accuracy is : 0.81250
batch 5 dev loss is : 0.44157
batch 5 dev accuracy is : 0.87500
batch 6 dev loss is : 0.63855
batch 6 dev accuracy is : 0.81250
batch 7 dev loss is : 1.87208
batch 7 dev accuracy is : 0.81250
batch 8 dev loss is : 2.12680
batch 8 dev accuracy is : 0.62500
batch 9 dev loss is : 0.67462
batch 9 dev accuracy is : 0.81250
batch 10 dev loss is : 1.79338
batch 10 dev accuracy is : 0.50000
batch 11 dev loss is : 2.43100
batch 11 dev accuracy is : 0.62500
batch 12 dev loss is : 1.51093
batch 12 dev accuracy is : 0.75000
batch 13 dev loss is : 2.20370
batch 13 dev accuracy is : 0.68750
batch 14 dev loss is : 0.86666
batch 14 dev accuracy is : 0.75000
batch 15 dev loss is : 0.81793
batch 15 dev accuracy is : 0.87500
batch 16 dev loss is : 1.05316
batch 16 dev accuracy is : 0.81250
batch 17 dev loss is : 2.77517
batch 17 dev accuracy is : 0.62500
batch 18 dev loss is : 2.21069
batch 18 dev accuracy is : 0.75000
batch 19 dev loss is :

batch 88 training loss is : 0.02776
batch 88 training accuracy is : 1.00000
batch 89 training loss is : 0.05557
batch 89 training accuracy is : 0.93750
batch 90 training loss is : 0.02229
batch 90 training accuracy is : 1.00000
batch 91 training loss is : 0.00000
batch 91 training accuracy is : 1.00000
batch 92 training loss is : 0.01695
batch 92 training accuracy is : 1.00000
batch 93 training loss is : 0.00107
batch 93 training accuracy is : 1.00000
batch 94 training loss is : 0.00345
batch 94 training accuracy is : 1.00000
batch 95 training loss is : 0.00359
batch 95 training accuracy is : 1.00000
batch 96 training loss is : 0.03802
batch 96 training accuracy is : 1.00000
batch 97 training loss is : 0.03426
batch 97 training accuracy is : 1.00000
batch 98 training loss is : 0.02055
batch 98 training accuracy is : 1.00000
batch 99 training loss is : 0.28494
batch 99 training accuracy is : 0.93750
batch 100 training loss is : 0.03309
batch 100 training accuracy is : 1.00000
batch 101 

batch 58 training loss is : 0.02392
batch 58 training accuracy is : 1.00000
batch 59 training loss is : 0.09637
batch 59 training accuracy is : 0.93750
batch 60 training loss is : 0.09574
batch 60 training accuracy is : 0.93750
batch 61 training loss is : 0.00061
batch 61 training accuracy is : 1.00000
batch 62 training loss is : 0.01833
batch 62 training accuracy is : 1.00000
batch 63 training loss is : 0.02181
batch 63 training accuracy is : 1.00000
batch 64 training loss is : 0.00015
batch 64 training accuracy is : 1.00000
batch 65 training loss is : 0.02093
batch 65 training accuracy is : 1.00000
batch 66 training loss is : 0.16400
batch 66 training accuracy is : 0.87500
batch 67 training loss is : 0.05394
batch 67 training accuracy is : 1.00000
batch 68 training loss is : 0.10731
batch 68 training accuracy is : 0.93750
batch 69 training loss is : 0.27831
batch 69 training accuracy is : 0.93750
batch 70 training loss is : 0.00171
batch 70 training accuracy is : 1.00000
batch 71 tra

batch 29 training loss is : 0.06037
batch 29 training accuracy is : 1.00000
batch 30 training loss is : 0.02536
batch 30 training accuracy is : 1.00000
batch 31 training loss is : 0.00010
batch 31 training accuracy is : 1.00000
batch 32 training loss is : 0.00000
batch 32 training accuracy is : 1.00000
batch 33 training loss is : 0.00533
batch 33 training accuracy is : 1.00000
batch 34 training loss is : 0.00255
batch 34 training accuracy is : 1.00000
batch 35 training loss is : 0.03943
batch 35 training accuracy is : 1.00000
batch 36 training loss is : 0.01558
batch 36 training accuracy is : 1.00000
batch 37 training loss is : 0.00073
batch 37 training accuracy is : 1.00000
batch 38 training loss is : 0.04435
batch 38 training accuracy is : 1.00000
batch 39 training loss is : 0.08927
batch 39 training accuracy is : 0.93750
batch 40 training loss is : 0.01203
batch 40 training accuracy is : 1.00000
batch 41 training loss is : 0.00130
batch 41 training accuracy is : 1.00000
batch 42 tra

Average validation loss is 1.22972 at the end of epoch 185
Average validation accuracy is 0.75108 at the end of epoch 185
At 186-th epoch.
batch 0 training loss is : 0.33743
batch 0 training accuracy is : 0.93750
batch 1 training loss is : 0.00178
batch 1 training accuracy is : 1.00000
batch 2 training loss is : 0.08727
batch 2 training accuracy is : 0.93750
batch 3 training loss is : 0.12290
batch 3 training accuracy is : 0.93750
batch 4 training loss is : 0.00456
batch 4 training accuracy is : 1.00000
batch 5 training loss is : 0.16494
batch 5 training accuracy is : 0.93750
batch 6 training loss is : 0.19537
batch 6 training accuracy is : 0.93750
batch 7 training loss is : 0.02203
batch 7 training accuracy is : 1.00000
batch 8 training loss is : 0.01045
batch 8 training accuracy is : 1.00000
batch 9 training loss is : 0.00000
batch 9 training accuracy is : 1.00000
batch 10 training loss is : 0.02916
batch 10 training accuracy is : 1.00000
batch 11 training loss is : 0.03381
batch 11 

batch 107 training loss is : 0.05840
batch 107 training accuracy is : 1.00000
batch 108 training loss is : 0.06146
batch 108 training accuracy is : 1.00000
batch 109 training loss is : 0.00472
batch 109 training accuracy is : 1.00000
batch 110 training loss is : 0.00186
batch 110 training accuracy is : 1.00000
batch 111 training loss is : 0.02380
batch 111 training accuracy is : 1.00000
batch 112 training loss is : 0.05943
batch 112 training accuracy is : 1.00000
Average training loss is 0.07872 at the end of epoch 186
Average training accuracy is 0.96540 at the end of epoch 186
batch 0 dev loss is : 1.32659
batch 0 dev accuracy is : 0.75000
batch 1 dev loss is : 0.13164
batch 1 dev accuracy is : 0.87500
batch 2 dev loss is : 0.61766
batch 2 dev accuracy is : 0.81250
batch 3 dev loss is : 0.92416
batch 3 dev accuracy is : 0.81250
batch 4 dev loss is : 0.77223
batch 4 dev accuracy is : 0.75000
batch 5 dev loss is : 0.73230
batch 5 dev accuracy is : 0.75000
batch 6 dev loss is : 0.71587


batch 79 training loss is : 0.00328
batch 79 training accuracy is : 1.00000
batch 80 training loss is : 0.02513
batch 80 training accuracy is : 1.00000
batch 81 training loss is : 0.00007
batch 81 training accuracy is : 1.00000
batch 82 training loss is : 0.00548
batch 82 training accuracy is : 1.00000
batch 83 training loss is : 0.01465
batch 83 training accuracy is : 1.00000
batch 84 training loss is : 0.21425
batch 84 training accuracy is : 0.87500
batch 85 training loss is : 0.00481
batch 85 training accuracy is : 1.00000
batch 86 training loss is : 0.03272
batch 86 training accuracy is : 1.00000
batch 87 training loss is : 0.01158
batch 87 training accuracy is : 1.00000
batch 88 training loss is : 0.02701
batch 88 training accuracy is : 1.00000
batch 89 training loss is : 0.02517
batch 89 training accuracy is : 1.00000
batch 90 training loss is : 0.01430
batch 90 training accuracy is : 1.00000
batch 91 training loss is : 0.02398
batch 91 training accuracy is : 1.00000
batch 92 tra

batch 47 training loss is : 0.09290
batch 47 training accuracy is : 0.93750
batch 48 training loss is : 0.00472
batch 48 training accuracy is : 1.00000
batch 49 training loss is : 0.13958
batch 49 training accuracy is : 0.93750
batch 50 training loss is : 0.01110
batch 50 training accuracy is : 1.00000
batch 51 training loss is : 0.09519
batch 51 training accuracy is : 0.93750
batch 52 training loss is : 0.15166
batch 52 training accuracy is : 0.93750
batch 53 training loss is : 0.08773
batch 53 training accuracy is : 0.93750
batch 54 training loss is : 0.24628
batch 54 training accuracy is : 0.87500
batch 55 training loss is : 0.12779
batch 55 training accuracy is : 0.87500
batch 56 training loss is : 0.00000
batch 56 training accuracy is : 1.00000
batch 57 training loss is : 0.02634
batch 57 training accuracy is : 1.00000
batch 58 training loss is : 0.23770
batch 58 training accuracy is : 0.93750
batch 59 training loss is : 0.03118
batch 59 training accuracy is : 1.00000
batch 60 tra

batch 17 training loss is : 0.13545
batch 17 training accuracy is : 0.93750
batch 18 training loss is : 0.03330
batch 18 training accuracy is : 1.00000
batch 19 training loss is : 0.00039
batch 19 training accuracy is : 1.00000
batch 20 training loss is : 0.09896
batch 20 training accuracy is : 0.93750
batch 21 training loss is : 0.29322
batch 21 training accuracy is : 0.87500
batch 22 training loss is : 0.01838
batch 22 training accuracy is : 1.00000
batch 23 training loss is : 0.01483
batch 23 training accuracy is : 1.00000
batch 24 training loss is : 0.00004
batch 24 training accuracy is : 1.00000
batch 25 training loss is : 0.00392
batch 25 training accuracy is : 1.00000
batch 26 training loss is : 0.03576
batch 26 training accuracy is : 1.00000
batch 27 training loss is : 0.00625
batch 27 training accuracy is : 1.00000
batch 28 training loss is : 0.01137
batch 28 training accuracy is : 1.00000
batch 29 training loss is : 0.00045
batch 29 training accuracy is : 1.00000
batch 30 tra

batch 12 dev loss is : 1.48550
batch 12 dev accuracy is : 0.75000
batch 13 dev loss is : 2.48211
batch 13 dev accuracy is : 0.68750
batch 14 dev loss is : 1.19765
batch 14 dev accuracy is : 0.75000
batch 15 dev loss is : 1.06662
batch 15 dev accuracy is : 0.87500
batch 16 dev loss is : 1.22512
batch 16 dev accuracy is : 0.68750
batch 17 dev loss is : 3.17831
batch 17 dev accuracy is : 0.68750
batch 18 dev loss is : 2.81725
batch 18 dev accuracy is : 0.68750
batch 19 dev loss is : 2.67321
batch 19 dev accuracy is : 0.81250
batch 20 dev loss is : 1.90708
batch 20 dev accuracy is : 0.62500
batch 21 dev loss is : 2.50354
batch 21 dev accuracy is : 0.75000
batch 22 dev loss is : 1.65810
batch 22 dev accuracy is : 0.81250
batch 23 dev loss is : 0.53310
batch 23 dev accuracy is : 0.81250
batch 24 dev loss is : 0.71109
batch 24 dev accuracy is : 0.81250
batch 25 dev loss is : 1.82560
batch 25 dev accuracy is : 0.68750
batch 26 dev loss is : 2.01195
batch 26 dev accuracy is : 0.68750
batch 27 d

batch 94 training loss is : 0.10003
batch 94 training accuracy is : 0.93750
batch 95 training loss is : 0.16812
batch 95 training accuracy is : 0.93750
batch 96 training loss is : 0.04748
batch 96 training accuracy is : 1.00000
batch 97 training loss is : 0.29175
batch 97 training accuracy is : 0.93750
batch 98 training loss is : 0.04164
batch 98 training accuracy is : 1.00000
batch 99 training loss is : 0.00846
batch 99 training accuracy is : 1.00000
batch 100 training loss is : 0.19208
batch 100 training accuracy is : 0.87500
batch 101 training loss is : 0.09325
batch 101 training accuracy is : 0.93750
batch 102 training loss is : 0.01438
batch 102 training accuracy is : 1.00000
batch 103 training loss is : 0.08477
batch 103 training accuracy is : 0.93750
batch 104 training loss is : 0.00240
batch 104 training accuracy is : 1.00000
batch 105 training loss is : 0.00131
batch 105 training accuracy is : 1.00000
batch 106 training loss is : 0.00100
batch 106 training accuracy is : 1.0000

batch 62 training loss is : 0.09630
batch 62 training accuracy is : 0.93750
batch 63 training loss is : 0.00246
batch 63 training accuracy is : 1.00000
batch 64 training loss is : 0.00044
batch 64 training accuracy is : 1.00000
batch 65 training loss is : 0.19864
batch 65 training accuracy is : 0.93750
batch 66 training loss is : 0.13367
batch 66 training accuracy is : 0.93750
batch 67 training loss is : 0.10019
batch 67 training accuracy is : 0.93750
batch 68 training loss is : 0.04484
batch 68 training accuracy is : 1.00000
batch 69 training loss is : 0.01364
batch 69 training accuracy is : 1.00000
batch 70 training loss is : 0.08920
batch 70 training accuracy is : 0.93750
batch 71 training loss is : 0.03080
batch 71 training accuracy is : 1.00000
batch 72 training loss is : 0.00793
batch 72 training accuracy is : 1.00000
batch 73 training loss is : 0.01962
batch 73 training accuracy is : 1.00000
batch 74 training loss is : 0.01713
batch 74 training accuracy is : 1.00000
batch 75 tra

batch 36 training loss is : 0.03357
batch 36 training accuracy is : 1.00000
batch 37 training loss is : 0.04648
batch 37 training accuracy is : 1.00000
batch 38 training loss is : 0.00037
batch 38 training accuracy is : 1.00000
batch 39 training loss is : 0.02046
batch 39 training accuracy is : 1.00000
batch 40 training loss is : 0.11648
batch 40 training accuracy is : 0.93750
batch 41 training loss is : 0.00194
batch 41 training accuracy is : 1.00000
batch 42 training loss is : 0.10754
batch 42 training accuracy is : 0.93750
batch 43 training loss is : 0.02792
batch 43 training accuracy is : 1.00000
batch 44 training loss is : 0.06342
batch 44 training accuracy is : 1.00000
batch 45 training loss is : 0.01102
batch 45 training accuracy is : 1.00000
batch 46 training loss is : 0.41943
batch 46 training accuracy is : 0.81250
batch 47 training loss is : 0.01079
batch 47 training accuracy is : 1.00000
batch 48 training loss is : 0.00084
batch 48 training accuracy is : 1.00000
batch 49 tra

batch 5 training loss is : 0.06075
batch 5 training accuracy is : 1.00000
batch 6 training loss is : 0.00000
batch 6 training accuracy is : 1.00000
batch 7 training loss is : 0.16112
batch 7 training accuracy is : 0.93750
batch 8 training loss is : 0.12901
batch 8 training accuracy is : 0.93750
batch 9 training loss is : 0.00000
batch 9 training accuracy is : 1.00000
batch 10 training loss is : 0.20687
batch 10 training accuracy is : 0.87500
batch 11 training loss is : 0.15971
batch 11 training accuracy is : 0.87500
batch 12 training loss is : 0.09252
batch 12 training accuracy is : 0.93750
batch 13 training loss is : 0.29808
batch 13 training accuracy is : 0.87500
batch 14 training loss is : 0.06656
batch 14 training accuracy is : 0.93750
batch 15 training loss is : 0.02140
batch 15 training accuracy is : 1.00000
batch 16 training loss is : 0.04423
batch 16 training accuracy is : 1.00000
batch 17 training loss is : 0.00221
batch 17 training accuracy is : 1.00000
batch 18 training loss

Average training loss is 0.10227 at the end of epoch 193
Average training accuracy is 0.95387 at the end of epoch 193
batch 0 dev loss is : 0.86090
batch 0 dev accuracy is : 0.81250
batch 1 dev loss is : 0.69949
batch 1 dev accuracy is : 0.87500
batch 2 dev loss is : 0.74745
batch 2 dev accuracy is : 0.87500
batch 3 dev loss is : 0.61057
batch 3 dev accuracy is : 0.87500
batch 4 dev loss is : 0.65064
batch 4 dev accuracy is : 0.75000
batch 5 dev loss is : 0.18066
batch 5 dev accuracy is : 0.87500
batch 6 dev loss is : 0.12527
batch 6 dev accuracy is : 1.00000
batch 7 dev loss is : 2.11615
batch 7 dev accuracy is : 0.81250
batch 8 dev loss is : 2.26697
batch 8 dev accuracy is : 0.62500
batch 9 dev loss is : 0.40105
batch 9 dev accuracy is : 0.87500
batch 10 dev loss is : 2.11607
batch 10 dev accuracy is : 0.68750
batch 11 dev loss is : 1.38544
batch 11 dev accuracy is : 0.68750
batch 12 dev loss is : 1.25627
batch 12 dev accuracy is : 0.75000
batch 13 dev loss is : 2.03498
batch 13 dev 

batch 83 training loss is : 0.00210
batch 83 training accuracy is : 1.00000
batch 84 training loss is : 0.20806
batch 84 training accuracy is : 0.93750
batch 85 training loss is : 0.06375
batch 85 training accuracy is : 0.93750
batch 86 training loss is : 0.01506
batch 86 training accuracy is : 1.00000
batch 87 training loss is : 0.28212
batch 87 training accuracy is : 0.93750
batch 88 training loss is : 0.00012
batch 88 training accuracy is : 1.00000
batch 89 training loss is : 0.02269
batch 89 training accuracy is : 1.00000
batch 90 training loss is : 0.00303
batch 90 training accuracy is : 1.00000
batch 91 training loss is : 0.16506
batch 91 training accuracy is : 0.93750
batch 92 training loss is : 0.01736
batch 92 training accuracy is : 1.00000
batch 93 training loss is : 0.00033
batch 93 training accuracy is : 1.00000
batch 94 training loss is : 0.01044
batch 94 training accuracy is : 1.00000
batch 95 training loss is : 0.01692
batch 95 training accuracy is : 1.00000
batch 96 tra

batch 57 training loss is : 0.01794
batch 57 training accuracy is : 1.00000
batch 58 training loss is : 0.12348
batch 58 training accuracy is : 0.93750
batch 59 training loss is : 0.15319
batch 59 training accuracy is : 0.93750
batch 60 training loss is : 0.14268
batch 60 training accuracy is : 0.93750
batch 61 training loss is : 0.12455
batch 61 training accuracy is : 0.93750
batch 62 training loss is : 0.00096
batch 62 training accuracy is : 1.00000
batch 63 training loss is : 0.07900
batch 63 training accuracy is : 1.00000
batch 64 training loss is : 0.00152
batch 64 training accuracy is : 1.00000
batch 65 training loss is : 0.00586
batch 65 training accuracy is : 1.00000
batch 66 training loss is : 0.02915
batch 66 training accuracy is : 1.00000
batch 67 training loss is : 0.37474
batch 67 training accuracy is : 0.87500
batch 68 training loss is : 0.14719
batch 68 training accuracy is : 0.93750
batch 69 training loss is : 0.02186
batch 69 training accuracy is : 1.00000
batch 70 tra

batch 27 training loss is : 0.10794
batch 27 training accuracy is : 0.93750
batch 28 training loss is : 0.01212
batch 28 training accuracy is : 1.00000
batch 29 training loss is : 0.01224
batch 29 training accuracy is : 1.00000
batch 30 training loss is : 0.16127
batch 30 training accuracy is : 0.87500
batch 31 training loss is : 0.04432
batch 31 training accuracy is : 1.00000
batch 32 training loss is : 0.02196
batch 32 training accuracy is : 1.00000
batch 33 training loss is : 0.00583
batch 33 training accuracy is : 1.00000
batch 34 training loss is : 0.00000
batch 34 training accuracy is : 1.00000
batch 35 training loss is : 0.04421
batch 35 training accuracy is : 1.00000
batch 36 training loss is : 0.01859
batch 36 training accuracy is : 1.00000
batch 37 training loss is : 0.06549
batch 37 training accuracy is : 1.00000
batch 38 training loss is : 0.01516
batch 38 training accuracy is : 1.00000
batch 39 training loss is : 0.10768
batch 39 training accuracy is : 0.93750
batch 40 tra

Average validation loss is 1.45326 at the end of epoch 196
Average validation accuracy is 0.73810 at the end of epoch 196
At 197-th epoch.
batch 0 training loss is : 0.02146
batch 0 training accuracy is : 1.00000
batch 1 training loss is : 0.00810
batch 1 training accuracy is : 1.00000
batch 2 training loss is : 0.25221
batch 2 training accuracy is : 0.87500
batch 3 training loss is : 0.10409
batch 3 training accuracy is : 0.93750
batch 4 training loss is : 0.02267
batch 4 training accuracy is : 1.00000
batch 5 training loss is : 0.05874
batch 5 training accuracy is : 0.93750
batch 6 training loss is : 0.02774
batch 6 training accuracy is : 1.00000
batch 7 training loss is : 0.05616
batch 7 training accuracy is : 0.93750
batch 8 training loss is : 0.06740
batch 8 training accuracy is : 0.93750
batch 9 training loss is : 0.00498
batch 9 training accuracy is : 1.00000
batch 10 training loss is : 0.04723
batch 10 training accuracy is : 1.00000
batch 11 training loss is : 0.01057
batch 11 

batch 108 training loss is : 0.00001
batch 108 training accuracy is : 1.00000
batch 109 training loss is : 0.01962
batch 109 training accuracy is : 1.00000
batch 110 training loss is : 0.18035
batch 110 training accuracy is : 0.93750
batch 111 training loss is : 0.00150
batch 111 training accuracy is : 1.00000
batch 112 training loss is : 0.14750
batch 112 training accuracy is : 0.93750
Average training loss is 0.05877 at the end of epoch 197
Average training accuracy is 0.96705 at the end of epoch 197
batch 0 dev loss is : 0.88890
batch 0 dev accuracy is : 0.81250
batch 1 dev loss is : 0.35379
batch 1 dev accuracy is : 0.87500
batch 2 dev loss is : 0.53313
batch 2 dev accuracy is : 0.93750
batch 3 dev loss is : 0.81651
batch 3 dev accuracy is : 0.81250
batch 4 dev loss is : 0.86013
batch 4 dev accuracy is : 0.81250
batch 5 dev loss is : 0.55639
batch 5 dev accuracy is : 0.81250
batch 6 dev loss is : 0.36597
batch 6 dev accuracy is : 0.93750
batch 7 dev loss is : 2.34714
batch 7 dev ac

batch 82 training loss is : 0.00168
batch 82 training accuracy is : 1.00000
batch 83 training loss is : 0.00058
batch 83 training accuracy is : 1.00000
batch 84 training loss is : 0.11157
batch 84 training accuracy is : 0.93750
batch 85 training loss is : 0.00425
batch 85 training accuracy is : 1.00000
batch 86 training loss is : 0.21343
batch 86 training accuracy is : 0.93750
batch 87 training loss is : 0.05145
batch 87 training accuracy is : 1.00000
batch 88 training loss is : 0.00121
batch 88 training accuracy is : 1.00000
batch 89 training loss is : 0.00986
batch 89 training accuracy is : 1.00000
batch 90 training loss is : 0.00000
batch 90 training accuracy is : 1.00000
batch 91 training loss is : 0.00643
batch 91 training accuracy is : 1.00000
batch 92 training loss is : 0.11272
batch 92 training accuracy is : 0.93750
batch 93 training loss is : 0.22812
batch 93 training accuracy is : 0.93750
batch 94 training loss is : 0.02002
batch 94 training accuracy is : 1.00000
batch 95 tra

batch 50 training loss is : 0.00185
batch 50 training accuracy is : 1.00000
batch 51 training loss is : 0.00103
batch 51 training accuracy is : 1.00000
batch 52 training loss is : 0.00067
batch 52 training accuracy is : 1.00000
batch 53 training loss is : 0.00489
batch 53 training accuracy is : 1.00000
batch 54 training loss is : 0.54378
batch 54 training accuracy is : 0.75000
batch 55 training loss is : 0.04766
batch 55 training accuracy is : 0.93750
batch 56 training loss is : 0.06960
batch 56 training accuracy is : 1.00000
batch 57 training loss is : 0.00245
batch 57 training accuracy is : 1.00000
batch 58 training loss is : 0.00737
batch 58 training accuracy is : 1.00000
batch 59 training loss is : 0.08068
batch 59 training accuracy is : 0.93750
batch 60 training loss is : 0.00430
batch 60 training accuracy is : 1.00000
batch 61 training loss is : 0.02105
batch 61 training accuracy is : 1.00000
batch 62 training loss is : 0.06194
batch 62 training accuracy is : 1.00000
batch 63 tra

In [5]:
model = MyEnsemble(modelA, modelB, modelC)
model = nn.DataParallel(model, device_ids=gpu_ids)
model.to(device)
checkpoint = torch.load('/home/aidana_massalimova/classifier/agnostic/model1_upd.pt')
model.load_state_dict(checkpoint['model_state_dict'])
optimizer.load_state_dict(checkpoint['optimizer_state_dict'])
model.eval()

DataParallel(
  (module): MyEnsemble(
    (modelA): DataParallel(
      (module): ResNet18(
        (resnet18): ResNet(
          (conv1): Conv2d(3, 64, kernel_size=(7, 7), stride=(2, 2), padding=(3, 3), bias=False)
          (bn1): BatchNorm2d(64, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
          (relu): ReLU(inplace=True)
          (maxpool): MaxPool2d(kernel_size=3, stride=2, padding=1, dilation=1, ceil_mode=False)
          (layer1): Sequential(
            (0): BasicBlock(
              (conv1): Conv2d(64, 64, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1), bias=False)
              (bn1): BatchNorm2d(64, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
              (relu): ReLU(inplace=True)
              (conv2): Conv2d(64, 64, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1), bias=False)
              (bn2): BatchNorm2d(64, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
            )
            (1): BasicBlock(
     

In [33]:
ground_truths=[]
predictions=[]
for it, test_data in enumerate(test_loader):
    with torch.no_grad():
        t1w,FA, MD, labels = Variable(test_data['t1w']).to(device),Variable(test_data['FA']).to(device),Variable(test_data['MD']).to(device), Variable(test_data['label']).to(device) 
        integer_encoded = labels.data.cpu().numpy()
        ground_truth = Variable(torch.from_numpy(integer_encoded)).long()
        for el in ground_truth.numpy():
            ground_truths.append(el)

    test_output = model(t1w,FA,MD)
    test_prob_predict = F.softmax(test_output, dim=1)
    _, predict = test_prob_predict.topk(1)
    predict=torch.transpose(predict, 0,1)
    predict2=predict.cpu().numpy()
    for el2 in predict2:
        for el3 in el2:
            predictions.append(el3)


In [27]:
from sklearn.metrics import confusion_matrix,plot_confusion_matrix
print(confusion_matrix(ground_truths, predictions))

[[97  0  3]
 [ 1 82 20]
 [ 9  8 84]]


In [34]:
from sklearn.metrics import classification_report, confusion_matrix
print(classification_report(ground_truths, predictions))

              precision    recall  f1-score   support

           0       0.60      0.78      0.68       122
           1       0.96      0.87      0.91       122
           2       0.72      0.57      0.64       124

    accuracy                           0.74       368
   macro avg       0.76      0.74      0.74       368
weighted avg       0.76      0.74      0.74       368



In [10]:
checkpoint['epoch']

24