In [1]:
# Colab-only: mount Google Drive at /content/drive so the project files stored
# there can be reached through the regular filesystem.
from google.colab import drive
drive.mount('/content/drive')

Mounted at /content/drive


In [2]:
import sys

# Make the project directory on the mounted Drive importable (it provides the
# `dataset`, `utils` and `models` modules imported further down).
project_root = '/content/drive/MyDrive/stat940project'

# Only append when missing so that re-running this cell does not keep growing
# sys.path with duplicate entries.
if project_root not in sys.path:
    sys.path.append(project_root)

In [3]:
# Load IPython's autoreload extension and switch it to mode 2, so edits to the
# project's .py modules are picked up without restarting the kernel.
%load_ext autoreload
%autoreload 2

In [4]:
# NOTE(review): the autoreload extension is already loaded by the preceding cell;
# this reload looks redundant on a fresh Restart & Run All — confirm before removing.
%reload_ext autoreload

In [5]:
import torch
import torch.nn as nn
import torch.nn.functional as F
from torchvision import transforms
from torch.utils.data import DataLoader, Dataset
import os
import numpy as np
import random
import math
import torch.optim as optim
from tqdm.auto import tqdm, trange

In [6]:
from dataset import load_data, ModelNet40Dataset
from utils.augmentations import *
from utils.utils import run, set_seed
from models import Pointnet, DGCNN

In [7]:
# Seed the run through the project's utils.utils.set_seed helper, presumably for reproducibility.
# NOTE(review): which RNGs (random / numpy / torch / CUDA) it covers is not visible here — confirm.
set_seed(1)

In [8]:
# Project root on the mounted Google Drive; checkpoint and data paths are built from it.
parent_dir = '/content/drive/MyDrive/stat940project'
checkpoint_path = os.path.join(parent_dir, 'checkpoints/dgcnn')

# makedirs creates the intermediate 'checkpoints' directory as well and, with
# exist_ok=True, does nothing when the target already exists. The previous
# exists()/mkdir() pair raised FileNotFoundError when 'checkpoints' was missing.
os.makedirs(checkpoint_path, exist_ok=True)

# Directory handed to load_data for the ModelNet40 data.
data_path = os.path.join(parent_dir, 'data/ModelNet40')

In [9]:
# Read the ModelNet40 inputs and labels from data_path. The first call relies on
# load_data's default mode (presumably the training split — confirm in dataset.py);
# the second explicitly requests the test split.
train_X, train_y = load_data(data_path)
test_X, test_y = load_data(data_path, mode='test')

In [10]:
# Pipeline without augmentation: samples are only passed through ToTensor.
default_transforms = transforms.Compose([ToTensor()])

# Training pipeline: Translate, then Shuffle, then ToTensor, applied in that order.
train_transforms = transforms.Compose([Translate(), Shuffle(), ToTensor()])

In [11]:
# Wrap the loaded arrays in datasets: the training set gets the augmenting
# pipeline, the test set only the default (non-augmenting) one.
trainset = ModelNet40Dataset(train_X, train_y, transforms=train_transforms)
testset = ModelNet40Dataset(test_X, test_y, transforms=default_transforms)

# Single source of truth for the mini-batch size used by both loaders.
BATCH_SIZE = 32

# Training batches are reshuffled every epoch.
trainloader = DataLoader(trainset, batch_size=BATCH_SIZE, shuffle=True)

# Evaluation gains nothing from a random order: shuffling the test loader only
# consumes global RNG state and makes the evaluation batch order differ between
# epochs, so it is kept in a fixed order here.
# NOTE(review): because the test loader no longer draws from the RNG, a re-run will
# not reproduce previously recorded per-batch training losses bit-for-bit.
testloader = DataLoader(testset, batch_size=BATCH_SIZE, shuffle=False)

In [12]:
# Use the first CUDA device when one is available, otherwise fall back to the CPU,
# and report which of the two was picked.
device = torch.device('cuda:0' if torch.cuda.is_available() else 'cpu')
print('running on GPU' if device.type == 'cuda' else 'running on CPU')

running on GPU


In [13]:
# Number of epochs passed to run().
# NOTE(review): the recorded "Epochs" progress bar shows 0/201 for this value, so
# run() seemingly iterates n_epochs + 1 times — confirm in utils.utils.
n_epochs = 200

# Build the DGCNN classifier and move it to the selected device.
# NOTE(review): the meaning of the positional arguments 1024 and 20 is not visible
# here (presumably embedding size and number of neighbours — confirm in models);
# output_channels=40 presumably corresponds to the 40 ModelNet40 classes.
model = DGCNN(1024, 20, output_channels=40).to(device)

# Train and evaluate the model; run() returns the train and test histories.
# Checkpoints are presumably written under checkpoint_path — confirm in utils.utils.
train_hist, test_hist = run(
    model,
    n_epochs,
    device,
    trainloader,
    testloader,
    model_name="dgcnn",
    checkpoint_path=checkpoint_path,
)

Epochs:   0%|          | 0/201 [00:00<?, ?it/s]


Epoch 0:


Batches:   0%|          | 0/308 [00:00<?, ?it/s]

    Train [608/9843]	 | 	Loss: 2.91496
    Train [1248/9843]	 | 	Loss: 2.59546
    Train [1888/9843]	 | 	Loss: 2.13159
    Train [2528/9843]	 | 	Loss: 1.70473
    Train [3168/9843]	 | 	Loss: 2.02211
    Train [3808/9843]	 | 	Loss: 1.52020
    Train [4448/9843]	 | 	Loss: 1.33371
    Train [5088/9843]	 | 	Loss: 1.65207
    Train [5728/9843]	 | 	Loss: 1.71719
    Train [6368/9843]	 | 	Loss: 1.58474
    Train [7008/9843]	 | 	Loss: 1.42403
    Train [7648/9843]	 | 	Loss: 1.49823
    Train [8288/9843]	 | 	Loss: 1.11996
    Train [8928/9843]	 | 	Loss: 1.15940
    Train [9568/9843]	 | 	Loss: 1.11819
==> Train | Average loss: 1.7260
==> Test  | Average loss: 0.9540
==> Test  | Accuracy: 75.8104
Best epoch: 0
Best accuracy: 75.81037277147487

Epoch 1:


Batches:   0%|          | 0/308 [00:00<?, ?it/s]

    Train [608/9843]	 | 	Loss: 1.19883
    Train [1248/9843]	 | 	Loss: 1.04100
    Train [1888/9843]	 | 	Loss: 0.79162
    Train [2528/9843]	 | 	Loss: 1.13984
    Train [3168/9843]	 | 	Loss: 1.21258
    Train [3808/9843]	 | 	Loss: 0.63364
    Train [4448/9843]	 | 	Loss: 0.95759
    Train [5088/9843]	 | 	Loss: 1.05743
    Train [5728/9843]	 | 	Loss: 0.92616
    Train [6368/9843]	 | 	Loss: 0.52429
    Train [7008/9843]	 | 	Loss: 0.73052
    Train [7648/9843]	 | 	Loss: 0.78181
    Train [8288/9843]	 | 	Loss: 0.88372
    Train [8928/9843]	 | 	Loss: 0.96252
    Train [9568/9843]	 | 	Loss: 0.75734
==> Train | Average loss: 0.9426
==> Test  | Average loss: 0.6514
==> Test  | Accuracy: 82.4149
Best epoch: 1
Best accuracy: 82.41491085899514

Epoch 2:


Batches:   0%|          | 0/308 [00:00<?, ?it/s]

    Train [608/9843]	 | 	Loss: 1.00159
    Train [1248/9843]	 | 	Loss: 0.75541
    Train [1888/9843]	 | 	Loss: 0.76882
    Train [2528/9843]	 | 	Loss: 0.50193
    Train [3168/9843]	 | 	Loss: 0.81955
    Train [3808/9843]	 | 	Loss: 0.53895
    Train [4448/9843]	 | 	Loss: 0.94870
    Train [5088/9843]	 | 	Loss: 1.05764
    Train [5728/9843]	 | 	Loss: 0.90639
    Train [6368/9843]	 | 	Loss: 0.67758
    Train [7008/9843]	 | 	Loss: 1.18614
    Train [7648/9843]	 | 	Loss: 0.99027
    Train [8288/9843]	 | 	Loss: 0.35161
    Train [8928/9843]	 | 	Loss: 0.66980
    Train [9568/9843]	 | 	Loss: 0.57435
==> Train | Average loss: 0.7445
==> Test  | Average loss: 0.5685
==> Test  | Accuracy: 82.6580
Best epoch: 2
Best accuracy: 82.6580226904376

Epoch 3:


Batches:   0%|          | 0/308 [00:00<?, ?it/s]

    Train [608/9843]	 | 	Loss: 0.59390
    Train [1248/9843]	 | 	Loss: 0.97699
    Train [1888/9843]	 | 	Loss: 0.61028
    Train [2528/9843]	 | 	Loss: 0.45688
    Train [3168/9843]	 | 	Loss: 0.47971
    Train [3808/9843]	 | 	Loss: 0.67421
    Train [4448/9843]	 | 	Loss: 0.74062
    Train [5088/9843]	 | 	Loss: 0.46219
    Train [5728/9843]	 | 	Loss: 0.69874
    Train [6368/9843]	 | 	Loss: 0.57270
    Train [7008/9843]	 | 	Loss: 0.70925
    Train [7648/9843]	 | 	Loss: 0.88555
    Train [8288/9843]	 | 	Loss: 0.65956
    Train [8928/9843]	 | 	Loss: 0.41441
    Train [9568/9843]	 | 	Loss: 0.44820
==> Train | Average loss: 0.6514
==> Test  | Average loss: 0.5147
==> Test  | Accuracy: 84.1977
Best epoch: 3
Best accuracy: 84.19773095623987

Epoch 4:


Batches:   0%|          | 0/308 [00:00<?, ?it/s]

    Train [608/9843]	 | 	Loss: 0.61949
    Train [1248/9843]	 | 	Loss: 0.52915
    Train [1888/9843]	 | 	Loss: 0.57716
    Train [2528/9843]	 | 	Loss: 1.28120
    Train [3168/9843]	 | 	Loss: 0.60205
    Train [3808/9843]	 | 	Loss: 0.54745
    Train [4448/9843]	 | 	Loss: 0.34923
    Train [5088/9843]	 | 	Loss: 0.57548
    Train [5728/9843]	 | 	Loss: 0.72646
    Train [6368/9843]	 | 	Loss: 0.81856
    Train [7008/9843]	 | 	Loss: 0.41048
    Train [7648/9843]	 | 	Loss: 0.78840
    Train [8288/9843]	 | 	Loss: 0.37199
    Train [8928/9843]	 | 	Loss: 0.63472
    Train [9568/9843]	 | 	Loss: 0.46068
==> Train | Average loss: 0.5982
==> Test  | Average loss: 0.4901
==> Test  | Accuracy: 84.6029
Best epoch: 4
Best accuracy: 84.60291734197732

Epoch 5:


Batches:   0%|          | 0/308 [00:00<?, ?it/s]

    Train [608/9843]	 | 	Loss: 0.36966
    Train [1248/9843]	 | 	Loss: 0.56964
    Train [1888/9843]	 | 	Loss: 0.23198
    Train [2528/9843]	 | 	Loss: 0.61833
    Train [3168/9843]	 | 	Loss: 0.40599
    Train [3808/9843]	 | 	Loss: 0.31801
    Train [4448/9843]	 | 	Loss: 0.54202
    Train [5088/9843]	 | 	Loss: 0.81952
    Train [5728/9843]	 | 	Loss: 0.40597
    Train [6368/9843]	 | 	Loss: 0.58077
    Train [7008/9843]	 | 	Loss: 0.14823
    Train [7648/9843]	 | 	Loss: 0.43797
    Train [8288/9843]	 | 	Loss: 0.53335
    Train [8928/9843]	 | 	Loss: 0.39621
    Train [9568/9843]	 | 	Loss: 0.95497
==> Train | Average loss: 0.5557
==> Test  | Average loss: 0.4143
==> Test  | Accuracy: 86.7909
Best epoch: 5
Best accuracy: 86.79092382495948

Epoch 6:


Batches:   0%|          | 0/308 [00:00<?, ?it/s]

    Train [608/9843]	 | 	Loss: 0.31550
    Train [1248/9843]	 | 	Loss: 0.40352
    Train [1888/9843]	 | 	Loss: 0.34638
    Train [2528/9843]	 | 	Loss: 0.23082
    Train [3168/9843]	 | 	Loss: 0.40604
    Train [3808/9843]	 | 	Loss: 0.34746
    Train [4448/9843]	 | 	Loss: 0.67831
    Train [5088/9843]	 | 	Loss: 0.43509
    Train [5728/9843]	 | 	Loss: 0.51957
    Train [6368/9843]	 | 	Loss: 0.74900
    Train [7008/9843]	 | 	Loss: 0.45986
    Train [7648/9843]	 | 	Loss: 0.48778
    Train [8288/9843]	 | 	Loss: 0.55719
    Train [8928/9843]	 | 	Loss: 0.45358
    Train [9568/9843]	 | 	Loss: 0.18643
==> Train | Average loss: 0.5170
==> Test  | Average loss: 0.4021
==> Test  | Accuracy: 87.6418
Best epoch: 6
Best accuracy: 87.6418152350081

Epoch 7:


Batches:   0%|          | 0/308 [00:00<?, ?it/s]

    Train [608/9843]	 | 	Loss: 0.60312
    Train [1248/9843]	 | 	Loss: 0.68863
    Train [1888/9843]	 | 	Loss: 0.69570
    Train [2528/9843]	 | 	Loss: 0.34959
    Train [3168/9843]	 | 	Loss: 0.60353
    Train [3808/9843]	 | 	Loss: 0.35849
    Train [4448/9843]	 | 	Loss: 0.40517
    Train [5088/9843]	 | 	Loss: 0.50637
    Train [5728/9843]	 | 	Loss: 0.33574
    Train [6368/9843]	 | 	Loss: 0.66443
    Train [7008/9843]	 | 	Loss: 0.57303
    Train [7648/9843]	 | 	Loss: 0.67041
    Train [8288/9843]	 | 	Loss: 0.34421
    Train [8928/9843]	 | 	Loss: 0.65384
    Train [9568/9843]	 | 	Loss: 0.27477
==> Train | Average loss: 0.5089
==> Test  | Average loss: 0.3977
==> Test  | Accuracy: 87.0746
Best epoch: 6
Best accuracy: 87.6418152350081

Epoch 8:


Batches:   0%|          | 0/308 [00:00<?, ?it/s]

    Train [608/9843]	 | 	Loss: 0.33548
    Train [1248/9843]	 | 	Loss: 0.67849
    Train [1888/9843]	 | 	Loss: 0.39334
    Train [2528/9843]	 | 	Loss: 0.60380
    Train [3168/9843]	 | 	Loss: 0.42169
    Train [3808/9843]	 | 	Loss: 0.57077
    Train [4448/9843]	 | 	Loss: 0.32219
    Train [5088/9843]	 | 	Loss: 0.68933
    Train [5728/9843]	 | 	Loss: 0.41479
    Train [6368/9843]	 | 	Loss: 0.53774
    Train [7008/9843]	 | 	Loss: 0.19363
    Train [7648/9843]	 | 	Loss: 0.69435
    Train [8288/9843]	 | 	Loss: 0.47857
    Train [8928/9843]	 | 	Loss: 0.59258
    Train [9568/9843]	 | 	Loss: 0.45332
==> Train | Average loss: 0.4454
==> Test  | Average loss: 0.4145
==> Test  | Accuracy: 86.8314
Best epoch: 6
Best accuracy: 87.6418152350081

Epoch 9:


Batches:   0%|          | 0/308 [00:00<?, ?it/s]

    Train [608/9843]	 | 	Loss: 0.34627
    Train [1248/9843]	 | 	Loss: 0.38705
    Train [1888/9843]	 | 	Loss: 0.37323
    Train [2528/9843]	 | 	Loss: 0.20467
    Train [3168/9843]	 | 	Loss: 0.27448
    Train [3808/9843]	 | 	Loss: 0.31005
    Train [4448/9843]	 | 	Loss: 0.42347
    Train [5088/9843]	 | 	Loss: 0.31292
    Train [5728/9843]	 | 	Loss: 0.51613
    Train [6368/9843]	 | 	Loss: 0.68135
    Train [7008/9843]	 | 	Loss: 0.33205
    Train [7648/9843]	 | 	Loss: 0.26074
    Train [8288/9843]	 | 	Loss: 0.56702
    Train [8928/9843]	 | 	Loss: 0.76686
    Train [9568/9843]	 | 	Loss: 0.47183
==> Train | Average loss: 0.4413
==> Test  | Average loss: 0.4284
==> Test  | Accuracy: 86.1426
Best epoch: 6
Best accuracy: 87.6418152350081

Epoch 10:


Batches:   0%|          | 0/308 [00:00<?, ?it/s]

    Train [608/9843]	 | 	Loss: 0.32221
    Train [1248/9843]	 | 	Loss: 0.30846
    Train [1888/9843]	 | 	Loss: 0.47222
    Train [2528/9843]	 | 	Loss: 0.32676
    Train [3168/9843]	 | 	Loss: 0.68221
    Train [3808/9843]	 | 	Loss: 0.35939
    Train [4448/9843]	 | 	Loss: 0.22449
    Train [5088/9843]	 | 	Loss: 0.33953
    Train [5728/9843]	 | 	Loss: 0.41935
    Train [6368/9843]	 | 	Loss: 0.60663
    Train [7008/9843]	 | 	Loss: 0.53955
    Train [7648/9843]	 | 	Loss: 0.29464
    Train [8288/9843]	 | 	Loss: 0.45375
    Train [8928/9843]	 | 	Loss: 0.55860
    Train [9568/9843]	 | 	Loss: 0.42277
==> Train | Average loss: 0.4155
==> Test  | Average loss: 0.4415
==> Test  | Accuracy: 86.2642
Best epoch: 6
Best accuracy: 87.6418152350081

Epoch 11:


Batches:   0%|          | 0/308 [00:00<?, ?it/s]

    Train [608/9843]	 | 	Loss: 0.25683
    Train [1248/9843]	 | 	Loss: 0.18239
    Train [1888/9843]	 | 	Loss: 0.33299
    Train [2528/9843]	 | 	Loss: 0.32632
    Train [3168/9843]	 | 	Loss: 0.52479
    Train [3808/9843]	 | 	Loss: 0.14646
    Train [4448/9843]	 | 	Loss: 0.63451
    Train [5088/9843]	 | 	Loss: 0.13561
    Train [5728/9843]	 | 	Loss: 0.63203
    Train [6368/9843]	 | 	Loss: 0.65477
    Train [7008/9843]	 | 	Loss: 0.55139
    Train [7648/9843]	 | 	Loss: 0.76958
    Train [8288/9843]	 | 	Loss: 0.63875
    Train [8928/9843]	 | 	Loss: 0.41122
    Train [9568/9843]	 | 	Loss: 0.34584
==> Train | Average loss: 0.4133
==> Test  | Average loss: 0.3768
==> Test  | Accuracy: 87.7229
Best epoch: 11
Best accuracy: 87.7228525121556

Epoch 12:


Batches:   0%|          | 0/308 [00:00<?, ?it/s]

    Train [608/9843]	 | 	Loss: 0.49997
    Train [1248/9843]	 | 	Loss: 0.27880
    Train [1888/9843]	 | 	Loss: 0.41829
    Train [2528/9843]	 | 	Loss: 0.36942
    Train [3168/9843]	 | 	Loss: 0.42814
    Train [3808/9843]	 | 	Loss: 0.47684
    Train [4448/9843]	 | 	Loss: 0.33079
    Train [5088/9843]	 | 	Loss: 0.50408
    Train [5728/9843]	 | 	Loss: 0.42291
    Train [6368/9843]	 | 	Loss: 0.42997
    Train [7008/9843]	 | 	Loss: 0.44108
    Train [7648/9843]	 | 	Loss: 0.36687
    Train [8288/9843]	 | 	Loss: 0.35981
    Train [8928/9843]	 | 	Loss: 0.16140
    Train [9568/9843]	 | 	Loss: 0.33527
==> Train | Average loss: 0.3982
==> Test  | Average loss: 0.3385
==> Test  | Accuracy: 90.1135
Best epoch: 12
Best accuracy: 90.11345218800648

Epoch 13:


Batches:   0%|          | 0/308 [00:00<?, ?it/s]

    Train [608/9843]	 | 	Loss: 0.37222
    Train [1248/9843]	 | 	Loss: 0.27784
    Train [1888/9843]	 | 	Loss: 0.93665
    Train [2528/9843]	 | 	Loss: 0.42940
    Train [3168/9843]	 | 	Loss: 0.55453
    Train [3808/9843]	 | 	Loss: 0.49775
    Train [4448/9843]	 | 	Loss: 0.29971
    Train [5088/9843]	 | 	Loss: 0.19131
    Train [5728/9843]	 | 	Loss: 0.25654
    Train [6368/9843]	 | 	Loss: 0.68469
    Train [7008/9843]	 | 	Loss: 0.27344
    Train [7648/9843]	 | 	Loss: 0.36992
    Train [8288/9843]	 | 	Loss: 0.32264
    Train [8928/9843]	 | 	Loss: 0.45706
    Train [9568/9843]	 | 	Loss: 0.41002
==> Train | Average loss: 0.3808
==> Test  | Average loss: 0.3678
==> Test  | Accuracy: 88.4522
Best epoch: 12
Best accuracy: 90.11345218800648

Epoch 14:


Batches:   0%|          | 0/308 [00:00<?, ?it/s]

    Train [608/9843]	 | 	Loss: 0.23116
    Train [1248/9843]	 | 	Loss: 0.36613
    Train [1888/9843]	 | 	Loss: 0.22762
    Train [2528/9843]	 | 	Loss: 0.35267
    Train [3168/9843]	 | 	Loss: 0.25362
    Train [3808/9843]	 | 	Loss: 0.38503
    Train [4448/9843]	 | 	Loss: 0.71450
    Train [5088/9843]	 | 	Loss: 0.82579
    Train [5728/9843]	 | 	Loss: 0.69541
    Train [6368/9843]	 | 	Loss: 0.38074
    Train [7008/9843]	 | 	Loss: 0.34111
    Train [7648/9843]	 | 	Loss: 0.46198
    Train [8288/9843]	 | 	Loss: 0.37193
    Train [8928/9843]	 | 	Loss: 0.54752
    Train [9568/9843]	 | 	Loss: 0.31907
==> Train | Average loss: 0.3854
==> Test  | Average loss: 0.3033
==> Test  | Accuracy: 90.3160
Best epoch: 14
Best accuracy: 90.3160453808752

Epoch 15:


Batches:   0%|          | 0/308 [00:00<?, ?it/s]

    Train [608/9843]	 | 	Loss: 0.41320
    Train [1248/9843]	 | 	Loss: 0.24005
    Train [1888/9843]	 | 	Loss: 0.46335
    Train [2528/9843]	 | 	Loss: 0.68586
    Train [3168/9843]	 | 	Loss: 0.33251
    Train [3808/9843]	 | 	Loss: 0.34840
    Train [4448/9843]	 | 	Loss: 0.22435
    Train [5088/9843]	 | 	Loss: 0.17417
    Train [5728/9843]	 | 	Loss: 0.18864
    Train [6368/9843]	 | 	Loss: 0.35413
    Train [7008/9843]	 | 	Loss: 0.27934
    Train [7648/9843]	 | 	Loss: 0.64545
    Train [8288/9843]	 | 	Loss: 0.41027
    Train [8928/9843]	 | 	Loss: 0.41352
    Train [9568/9843]	 | 	Loss: 0.22896
==> Train | Average loss: 0.3754
==> Test  | Average loss: 0.3699
==> Test  | Accuracy: 88.2901
Best epoch: 14
Best accuracy: 90.3160453808752

Epoch 16:


Batches:   0%|          | 0/308 [00:00<?, ?it/s]

    Train [608/9843]	 | 	Loss: 0.30038
    Train [1248/9843]	 | 	Loss: 0.33281
    Train [1888/9843]	 | 	Loss: 0.31790
    Train [2528/9843]	 | 	Loss: 0.33910
    Train [3168/9843]	 | 	Loss: 0.17212
    Train [3808/9843]	 | 	Loss: 0.22452
    Train [4448/9843]	 | 	Loss: 0.32054
    Train [5088/9843]	 | 	Loss: 0.27786
    Train [5728/9843]	 | 	Loss: 0.53782
    Train [6368/9843]	 | 	Loss: 0.39570
    Train [7008/9843]	 | 	Loss: 0.32610
    Train [7648/9843]	 | 	Loss: 0.28707
    Train [8288/9843]	 | 	Loss: 0.38008
    Train [8928/9843]	 | 	Loss: 0.37839
    Train [9568/9843]	 | 	Loss: 0.54216
==> Train | Average loss: 0.3607
==> Test  | Average loss: 0.3504
==> Test  | Accuracy: 89.0194
Best epoch: 14
Best accuracy: 90.3160453808752

Epoch 17:


Batches:   0%|          | 0/308 [00:00<?, ?it/s]

    Train [608/9843]	 | 	Loss: 0.20620
    Train [1248/9843]	 | 	Loss: 0.34846
    Train [1888/9843]	 | 	Loss: 0.32272
    Train [2528/9843]	 | 	Loss: 0.25965
    Train [3168/9843]	 | 	Loss: 0.38298
    Train [3808/9843]	 | 	Loss: 0.17766
    Train [4448/9843]	 | 	Loss: 0.37863
    Train [5088/9843]	 | 	Loss: 0.35117
    Train [5728/9843]	 | 	Loss: 0.41761
    Train [6368/9843]	 | 	Loss: 0.18071
    Train [7008/9843]	 | 	Loss: 0.61935
    Train [7648/9843]	 | 	Loss: 0.23004
    Train [8288/9843]	 | 	Loss: 0.33450
    Train [8928/9843]	 | 	Loss: 0.42137
    Train [9568/9843]	 | 	Loss: 0.32015
==> Train | Average loss: 0.3422
==> Test  | Average loss: 0.3790
==> Test  | Accuracy: 87.4797
Best epoch: 14
Best accuracy: 90.3160453808752

Epoch 18:


Batches:   0%|          | 0/308 [00:00<?, ?it/s]

    Train [608/9843]	 | 	Loss: 0.31328
    Train [1248/9843]	 | 	Loss: 0.23362
    Train [1888/9843]	 | 	Loss: 0.34371
    Train [2528/9843]	 | 	Loss: 0.13676
    Train [3168/9843]	 | 	Loss: 0.24341
    Train [3808/9843]	 | 	Loss: 0.31312
    Train [4448/9843]	 | 	Loss: 0.22518
    Train [5088/9843]	 | 	Loss: 0.16947
    Train [5728/9843]	 | 	Loss: 0.75448
    Train [6368/9843]	 | 	Loss: 0.32589
    Train [7008/9843]	 | 	Loss: 0.42123
    Train [7648/9843]	 | 	Loss: 0.37350
    Train [8288/9843]	 | 	Loss: 0.30230
    Train [8928/9843]	 | 	Loss: 0.42874
    Train [9568/9843]	 | 	Loss: 0.52425
==> Train | Average loss: 0.3512
==> Test  | Average loss: 0.3590
==> Test  | Accuracy: 88.9789
Best epoch: 14
Best accuracy: 90.3160453808752

Epoch 19:


Batches:   0%|          | 0/308 [00:00<?, ?it/s]

    Train [608/9843]	 | 	Loss: 0.17710
    Train [1248/9843]	 | 	Loss: 0.21430
    Train [1888/9843]	 | 	Loss: 0.12236
    Train [2528/9843]	 | 	Loss: 0.32087
    Train [3168/9843]	 | 	Loss: 0.12518
    Train [3808/9843]	 | 	Loss: 0.24470
    Train [4448/9843]	 | 	Loss: 0.34375
    Train [5088/9843]	 | 	Loss: 0.04418
    Train [5728/9843]	 | 	Loss: 0.14747
    Train [6368/9843]	 | 	Loss: 0.17843
    Train [7008/9843]	 | 	Loss: 0.14606
    Train [7648/9843]	 | 	Loss: 0.09234
    Train [8288/9843]	 | 	Loss: 0.33537
    Train [8928/9843]	 | 	Loss: 0.19260
    Train [9568/9843]	 | 	Loss: 0.16752
==> Train | Average loss: 0.2896
==> Test  | Average loss: 0.2917
==> Test  | Accuracy: 90.2350
Best epoch: 14
Best accuracy: 90.3160453808752

Epoch 20:


Batches:   0%|          | 0/308 [00:00<?, ?it/s]

    Train [608/9843]	 | 	Loss: 0.28913
    Train [1248/9843]	 | 	Loss: 0.31282
    Train [1888/9843]	 | 	Loss: 0.11892
    Train [2528/9843]	 | 	Loss: 0.08936
    Train [3168/9843]	 | 	Loss: 0.10976
    Train [3808/9843]	 | 	Loss: 0.26121
    Train [4448/9843]	 | 	Loss: 0.24383
    Train [5088/9843]	 | 	Loss: 0.20928
    Train [5728/9843]	 | 	Loss: 0.38320
    Train [6368/9843]	 | 	Loss: 0.19758
    Train [7008/9843]	 | 	Loss: 0.15297
    Train [7648/9843]	 | 	Loss: 0.06521
    Train [8288/9843]	 | 	Loss: 0.45183
    Train [8928/9843]	 | 	Loss: 0.21340
    Train [9568/9843]	 | 	Loss: 0.32983
==> Train | Average loss: 0.2604
==> Test  | Average loss: 0.3029
==> Test  | Accuracy: 90.0729
Best epoch: 14
Best accuracy: 90.3160453808752

Epoch 21:


Batches:   0%|          | 0/308 [00:00<?, ?it/s]

    Train [608/9843]	 | 	Loss: 0.26346
    Train [1248/9843]	 | 	Loss: 0.15034
    Train [1888/9843]	 | 	Loss: 0.44266
    Train [2528/9843]	 | 	Loss: 0.15448
    Train [3168/9843]	 | 	Loss: 0.32173
    Train [3808/9843]	 | 	Loss: 0.13193
    Train [4448/9843]	 | 	Loss: 0.22919
    Train [5088/9843]	 | 	Loss: 0.09518
    Train [5728/9843]	 | 	Loss: 0.64671
    Train [6368/9843]	 | 	Loss: 0.15878
    Train [7008/9843]	 | 	Loss: 0.41900
    Train [7648/9843]	 | 	Loss: 0.10453
    Train [8288/9843]	 | 	Loss: 0.15273
    Train [8928/9843]	 | 	Loss: 0.25847
    Train [9568/9843]	 | 	Loss: 0.35458
==> Train | Average loss: 0.2534
==> Test  | Average loss: 0.3042
==> Test  | Accuracy: 90.1135
Best epoch: 14
Best accuracy: 90.3160453808752

Epoch 22:


Batches:   0%|          | 0/308 [00:00<?, ?it/s]

    Train [608/9843]	 | 	Loss: 0.22740
    Train [1248/9843]	 | 	Loss: 0.15035
    Train [1888/9843]	 | 	Loss: 0.37514
    Train [2528/9843]	 | 	Loss: 0.19225
    Train [3168/9843]	 | 	Loss: 0.07554
    Train [3808/9843]	 | 	Loss: 0.12690
    Train [4448/9843]	 | 	Loss: 0.37685
    Train [5088/9843]	 | 	Loss: 0.32409
    Train [5728/9843]	 | 	Loss: 0.11536
    Train [6368/9843]	 | 	Loss: 0.03009
    Train [7008/9843]	 | 	Loss: 0.46857
    Train [7648/9843]	 | 	Loss: 0.50416
    Train [8288/9843]	 | 	Loss: 0.19825
    Train [8928/9843]	 | 	Loss: 0.35051
    Train [9568/9843]	 | 	Loss: 0.34241
==> Train | Average loss: 0.2420
==> Test  | Average loss: 0.3006
==> Test  | Accuracy: 90.5592
Best epoch: 22
Best accuracy: 90.55915721231767

Epoch 23:


Batches:   0%|          | 0/308 [00:00<?, ?it/s]

    Train [608/9843]	 | 	Loss: 0.29342
    Train [1248/9843]	 | 	Loss: 0.24236
    Train [1888/9843]	 | 	Loss: 0.21847
    Train [2528/9843]	 | 	Loss: 0.13718
    Train [3168/9843]	 | 	Loss: 0.27018
    Train [3808/9843]	 | 	Loss: 0.19498
    Train [4448/9843]	 | 	Loss: 0.18727
    Train [5088/9843]	 | 	Loss: 0.19295
    Train [5728/9843]	 | 	Loss: 0.13705
    Train [6368/9843]	 | 	Loss: 0.40568
    Train [7008/9843]	 | 	Loss: 0.25592
    Train [7648/9843]	 | 	Loss: 0.18922
    Train [8288/9843]	 | 	Loss: 0.13419
    Train [8928/9843]	 | 	Loss: 0.21231
    Train [9568/9843]	 | 	Loss: 0.16216
==> Train | Average loss: 0.2430
==> Test  | Average loss: 0.2913
==> Test  | Accuracy: 90.2755
Best epoch: 22
Best accuracy: 90.55915721231767

Epoch 24:


Batches:   0%|          | 0/308 [00:00<?, ?it/s]

    Train [608/9843]	 | 	Loss: 0.15145
    Train [1248/9843]	 | 	Loss: 0.42539
    Train [1888/9843]	 | 	Loss: 0.22488
    Train [2528/9843]	 | 	Loss: 0.25386
    Train [3168/9843]	 | 	Loss: 0.36728
    Train [3808/9843]	 | 	Loss: 0.33209
    Train [4448/9843]	 | 	Loss: 0.42291
    Train [5088/9843]	 | 	Loss: 0.21680
    Train [5728/9843]	 | 	Loss: 0.37306
    Train [6368/9843]	 | 	Loss: 0.14349
    Train [7008/9843]	 | 	Loss: 0.13516
    Train [7648/9843]	 | 	Loss: 0.36502
    Train [8288/9843]	 | 	Loss: 0.36586
    Train [8928/9843]	 | 	Loss: 0.27230
    Train [9568/9843]	 | 	Loss: 0.13260
==> Train | Average loss: 0.2389
==> Test  | Average loss: 0.2985
==> Test  | Accuracy: 90.2755
Best epoch: 22
Best accuracy: 90.55915721231767

Epoch 25:


Batches:   0%|          | 0/308 [00:00<?, ?it/s]

    Train [608/9843]	 | 	Loss: 0.08760
    Train [1248/9843]	 | 	Loss: 0.21055
    Train [1888/9843]	 | 	Loss: 0.08773
    Train [2528/9843]	 | 	Loss: 0.14784
    Train [3168/9843]	 | 	Loss: 0.20232
    Train [3808/9843]	 | 	Loss: 0.17438
    Train [4448/9843]	 | 	Loss: 0.29610
    Train [5088/9843]	 | 	Loss: 0.10284
    Train [5728/9843]	 | 	Loss: 0.16653
    Train [6368/9843]	 | 	Loss: 0.29806
    Train [7008/9843]	 | 	Loss: 0.37864
    Train [7648/9843]	 | 	Loss: 0.29637
    Train [8288/9843]	 | 	Loss: 0.10191
    Train [8928/9843]	 | 	Loss: 0.36650
    Train [9568/9843]	 | 	Loss: 0.12912
==> Train | Average loss: 0.2248
==> Test  | Average loss: 0.3451
==> Test  | Accuracy: 89.3436
Best epoch: 22
Best accuracy: 90.55915721231767

Epoch 26:


Batches:   0%|          | 0/308 [00:00<?, ?it/s]

    Train [608/9843]	 | 	Loss: 0.05794
    Train [1248/9843]	 | 	Loss: 0.15201
    Train [1888/9843]	 | 	Loss: 0.15298
    Train [2528/9843]	 | 	Loss: 0.17130
    Train [3168/9843]	 | 	Loss: 0.23552
    Train [3808/9843]	 | 	Loss: 0.19901
    Train [4448/9843]	 | 	Loss: 0.19990
    Train [5088/9843]	 | 	Loss: 0.06502
    Train [5728/9843]	 | 	Loss: 0.52309
    Train [6368/9843]	 | 	Loss: 0.13629
    Train [7008/9843]	 | 	Loss: 0.23440
    Train [7648/9843]	 | 	Loss: 0.21733
    Train [8288/9843]	 | 	Loss: 0.13565
    Train [8928/9843]	 | 	Loss: 0.29766
    Train [9568/9843]	 | 	Loss: 0.44839
==> Train | Average loss: 0.2297
==> Test  | Average loss: 0.2942
==> Test  | Accuracy: 90.7618
Best epoch: 26
Best accuracy: 90.76175040518638

Epoch 27:


Batches:   0%|          | 0/308 [00:00<?, ?it/s]

    Train [608/9843]	 | 	Loss: 0.09379
    Train [1248/9843]	 | 	Loss: 0.35729
    Train [1888/9843]	 | 	Loss: 0.19057
    Train [2528/9843]	 | 	Loss: 0.14203
    Train [3168/9843]	 | 	Loss: 0.21513
    Train [3808/9843]	 | 	Loss: 0.32218
    Train [4448/9843]	 | 	Loss: 0.12579
    Train [5088/9843]	 | 	Loss: 0.13526
    Train [5728/9843]	 | 	Loss: 0.33439
    Train [6368/9843]	 | 	Loss: 0.24942
    Train [7008/9843]	 | 	Loss: 0.31487
    Train [7648/9843]	 | 	Loss: 0.19853
    Train [8288/9843]	 | 	Loss: 0.31166
    Train [8928/9843]	 | 	Loss: 0.18576
    Train [9568/9843]	 | 	Loss: 0.19005
==> Train | Average loss: 0.2410
==> Test  | Average loss: 0.3398
==> Test  | Accuracy: 89.5462
Best epoch: 26
Best accuracy: 90.76175040518638

Epoch 28:


Batches:   0%|          | 0/308 [00:00<?, ?it/s]

    Train [608/9843]	 | 	Loss: 0.43815
    Train [1248/9843]	 | 	Loss: 0.16118
    Train [1888/9843]	 | 	Loss: 0.12382
    Train [2528/9843]	 | 	Loss: 0.18889
    Train [3168/9843]	 | 	Loss: 0.29916
    Train [3808/9843]	 | 	Loss: 0.21188
    Train [4448/9843]	 | 	Loss: 0.22461
    Train [5088/9843]	 | 	Loss: 0.10943
    Train [5728/9843]	 | 	Loss: 0.25468
    Train [6368/9843]	 | 	Loss: 0.30932
    Train [7008/9843]	 | 	Loss: 0.08693
    Train [7648/9843]	 | 	Loss: 0.28544
    Train [8288/9843]	 | 	Loss: 0.25973
    Train [8928/9843]	 | 	Loss: 0.19175
    Train [9568/9843]	 | 	Loss: 0.13096
==> Train | Average loss: 0.2148
==> Test  | Average loss: 0.3114
==> Test  | Accuracy: 89.7893
Best epoch: 26
Best accuracy: 90.76175040518638

Epoch 29:


Batches:   0%|          | 0/308 [00:00<?, ?it/s]

    Train [608/9843]	 | 	Loss: 0.47785
    Train [1248/9843]	 | 	Loss: 0.36922
    Train [1888/9843]	 | 	Loss: 0.31813
    Train [2528/9843]	 | 	Loss: 0.18260
    Train [3168/9843]	 | 	Loss: 0.28525
    Train [3808/9843]	 | 	Loss: 0.34739
    Train [4448/9843]	 | 	Loss: 0.23034
    Train [5088/9843]	 | 	Loss: 0.18579
    Train [5728/9843]	 | 	Loss: 0.19516
    Train [6368/9843]	 | 	Loss: 0.20635
    Train [7008/9843]	 | 	Loss: 0.36691
    Train [7648/9843]	 | 	Loss: 0.08694
    Train [8288/9843]	 | 	Loss: 0.14790
    Train [8928/9843]	 | 	Loss: 0.16966
    Train [9568/9843]	 | 	Loss: 0.36022
==> Train | Average loss: 0.2168
==> Test  | Average loss: 0.3182
==> Test  | Accuracy: 90.3566
Best epoch: 26
Best accuracy: 90.76175040518638

Epoch 30:


Batches:   0%|          | 0/308 [00:00<?, ?it/s]

    Train [608/9843]	 | 	Loss: 0.25778
    Train [1248/9843]	 | 	Loss: 0.11981
    Train [1888/9843]	 | 	Loss: 0.28209
    Train [2528/9843]	 | 	Loss: 0.06432
    Train [3168/9843]	 | 	Loss: 0.07591
    Train [3808/9843]	 | 	Loss: 0.13817
    Train [4448/9843]	 | 	Loss: 0.19570
    Train [5088/9843]	 | 	Loss: 0.07267
    Train [5728/9843]	 | 	Loss: 0.19075
    Train [6368/9843]	 | 	Loss: 0.15818
    Train [7008/9843]	 | 	Loss: 0.08524
    Train [7648/9843]	 | 	Loss: 0.07129
    Train [8288/9843]	 | 	Loss: 0.21101
    Train [8928/9843]	 | 	Loss: 0.28147
    Train [9568/9843]	 | 	Loss: 0.35733
==> Train | Average loss: 0.2127
==> Test  | Average loss: 0.3383
==> Test  | Accuracy: 89.8298
Best epoch: 26
Best accuracy: 90.76175040518638

Epoch 31:


Batches:   0%|          | 0/308 [00:00<?, ?it/s]

    Train [608/9843]	 | 	Loss: 0.02780
    Train [1248/9843]	 | 	Loss: 0.16580
    Train [1888/9843]	 | 	Loss: 0.18543
    Train [2528/9843]	 | 	Loss: 0.14619
    Train [3168/9843]	 | 	Loss: 0.24351
    Train [3808/9843]	 | 	Loss: 0.42487
    Train [4448/9843]	 | 	Loss: 0.20897
    Train [5088/9843]	 | 	Loss: 0.23414
    Train [5728/9843]	 | 	Loss: 0.18061
    Train [6368/9843]	 | 	Loss: 0.19025
    Train [7008/9843]	 | 	Loss: 0.23574
    Train [7648/9843]	 | 	Loss: 0.13779
    Train [8288/9843]	 | 	Loss: 0.16547
    Train [8928/9843]	 | 	Loss: 0.31058
    Train [9568/9843]	 | 	Loss: 0.57817
==> Train | Average loss: 0.2102
==> Test  | Average loss: 0.3041
==> Test  | Accuracy: 90.8023
Best epoch: 31
Best accuracy: 90.80226904376013

Epoch 32:


Batches:   0%|          | 0/308 [00:00<?, ?it/s]

    Train [608/9843]	 | 	Loss: 0.10307
    Train [1248/9843]	 | 	Loss: 0.19681
    Train [1888/9843]	 | 	Loss: 0.21684
    Train [2528/9843]	 | 	Loss: 0.08363
    Train [3168/9843]	 | 	Loss: 0.52665
    Train [3808/9843]	 | 	Loss: 0.44439
    Train [4448/9843]	 | 	Loss: 0.08346
    Train [5088/9843]	 | 	Loss: 0.08525
    Train [5728/9843]	 | 	Loss: 0.57634
    Train [6368/9843]	 | 	Loss: 0.06473
    Train [7008/9843]	 | 	Loss: 0.57785
    Train [7648/9843]	 | 	Loss: 0.16637
    Train [8288/9843]	 | 	Loss: 0.10757
    Train [8928/9843]	 | 	Loss: 0.17831
    Train [9568/9843]	 | 	Loss: 0.46590
==> Train | Average loss: 0.2042
==> Test  | Average loss: 0.3088
==> Test  | Accuracy: 90.4781
Best epoch: 31
Best accuracy: 90.80226904376013

Epoch 33:


Batches:   0%|          | 0/308 [00:00<?, ?it/s]

    Train [608/9843]	 | 	Loss: 0.12536
    Train [1248/9843]	 | 	Loss: 0.37575
    Train [1888/9843]	 | 	Loss: 0.18094
    Train [2528/9843]	 | 	Loss: 0.30518
    Train [3168/9843]	 | 	Loss: 0.08033
    Train [3808/9843]	 | 	Loss: 0.15499
    Train [4448/9843]	 | 	Loss: 0.40479
    Train [5088/9843]	 | 	Loss: 0.17188
    Train [5728/9843]	 | 	Loss: 0.20526
    Train [6368/9843]	 | 	Loss: 0.38711
    Train [7008/9843]	 | 	Loss: 0.33642
    Train [7648/9843]	 | 	Loss: 0.18843
    Train [8288/9843]	 | 	Loss: 0.08130
    Train [8928/9843]	 | 	Loss: 0.24060
    Train [9568/9843]	 | 	Loss: 0.22746
==> Train | Average loss: 0.2010
==> Test  | Average loss: 0.3317
==> Test  | Accuracy: 89.6677
Best epoch: 31
Best accuracy: 90.80226904376013

Epoch 34:


Batches:   0%|          | 0/308 [00:00<?, ?it/s]

    Train [608/9843]	 | 	Loss: 0.07824
    Train [1248/9843]	 | 	Loss: 0.16358
    Train [1888/9843]	 | 	Loss: 0.30895
    Train [2528/9843]	 | 	Loss: 0.20334
    Train [3168/9843]	 | 	Loss: 0.21165
    Train [3808/9843]	 | 	Loss: 0.13621
    Train [4448/9843]	 | 	Loss: 0.16027
    Train [5088/9843]	 | 	Loss: 0.06696
    Train [5728/9843]	 | 	Loss: 0.10166
    Train [6368/9843]	 | 	Loss: 0.30617
    Train [7008/9843]	 | 	Loss: 0.08580
    Train [7648/9843]	 | 	Loss: 0.13433
    Train [8288/9843]	 | 	Loss: 0.10592
    Train [8928/9843]	 | 	Loss: 0.05658
    Train [9568/9843]	 | 	Loss: 0.11067
==> Train | Average loss: 0.1869
==> Test  | Average loss: 0.3308
==> Test  | Accuracy: 89.8298
Best epoch: 31
Best accuracy: 90.80226904376013

Epoch 35:


Batches:   0%|          | 0/308 [00:00<?, ?it/s]

    Train [608/9843]	 | 	Loss: 0.10475
    Train [1248/9843]	 | 	Loss: 0.23348
    Train [1888/9843]	 | 	Loss: 0.37147
    Train [2528/9843]	 | 	Loss: 0.12970
    Train [3168/9843]	 | 	Loss: 0.02358
    Train [3808/9843]	 | 	Loss: 0.23483
    Train [4448/9843]	 | 	Loss: 0.50302
    Train [5088/9843]	 | 	Loss: 0.11294
    Train [5728/9843]	 | 	Loss: 0.32904
    Train [6368/9843]	 | 	Loss: 0.11715
    Train [7008/9843]	 | 	Loss: 0.20475
    Train [7648/9843]	 | 	Loss: 0.17030
    Train [8288/9843]	 | 	Loss: 0.04684
    Train [8928/9843]	 | 	Loss: 0.13288
    Train [9568/9843]	 | 	Loss: 0.26577
==> Train | Average loss: 0.1849
==> Test  | Average loss: 0.3166
==> Test  | Accuracy: 90.4376
Best epoch: 31
Best accuracy: 90.80226904376013

Epoch 36:


Batches:   0%|          | 0/308 [00:00<?, ?it/s]

    Train [608/9843]	 | 	Loss: 0.13019
    Train [1248/9843]	 | 	Loss: 0.10300
    Train [1888/9843]	 | 	Loss: 0.47439
    Train [2528/9843]	 | 	Loss: 0.10686
    Train [3168/9843]	 | 	Loss: 0.11813
    Train [3808/9843]	 | 	Loss: 0.14190
    Train [4448/9843]	 | 	Loss: 0.14007
    Train [5088/9843]	 | 	Loss: 0.19395
    Train [5728/9843]	 | 	Loss: 0.14992
    Train [6368/9843]	 | 	Loss: 0.23179
    Train [7008/9843]	 | 	Loss: 0.13821
    Train [7648/9843]	 | 	Loss: 0.12885
    Train [8288/9843]	 | 	Loss: 0.10162
    Train [8928/9843]	 | 	Loss: 0.20785
    Train [9568/9843]	 | 	Loss: 0.14759
==> Train | Average loss: 0.1853
==> Test  | Average loss: 0.3268
==> Test  | Accuracy: 90.2350
Best epoch: 31
Best accuracy: 90.80226904376013

Epoch 37:


Batches:   0%|          | 0/308 [00:00<?, ?it/s]

    Train [608/9843]	 | 	Loss: 0.12430
    Train [1248/9843]	 | 	Loss: 0.12346
    Train [1888/9843]	 | 	Loss: 0.20267
    Train [2528/9843]	 | 	Loss: 0.12281
    Train [3168/9843]	 | 	Loss: 0.05348
    Train [3808/9843]	 | 	Loss: 0.16242
    Train [4448/9843]	 | 	Loss: 0.38311
    Train [5088/9843]	 | 	Loss: 0.20356
    Train [5728/9843]	 | 	Loss: 0.10448
    Train [6368/9843]	 | 	Loss: 0.14639
    Train [7008/9843]	 | 	Loss: 0.15842
    Train [7648/9843]	 | 	Loss: 0.18435
    Train [8288/9843]	 | 	Loss: 0.16575
    Train [8928/9843]	 | 	Loss: 0.33596
    Train [9568/9843]	 | 	Loss: 0.38808
==> Train | Average loss: 0.1911
==> Test  | Average loss: 0.3607
==> Test  | Accuracy: 89.5057
Best epoch: 31
Best accuracy: 90.80226904376013

Epoch 38:


Batches:   0%|          | 0/308 [00:00<?, ?it/s]

    Train [608/9843]	 | 	Loss: 0.23826
    Train [1248/9843]	 | 	Loss: 0.03168
    Train [1888/9843]	 | 	Loss: 0.20944
    Train [2528/9843]	 | 	Loss: 0.33037
    Train [3168/9843]	 | 	Loss: 0.26393
    Train [3808/9843]	 | 	Loss: 0.06211
    Train [4448/9843]	 | 	Loss: 0.13713
    Train [5088/9843]	 | 	Loss: 0.25795
    Train [5728/9843]	 | 	Loss: 0.13065
    Train [6368/9843]	 | 	Loss: 0.08629
    Train [7008/9843]	 | 	Loss: 0.08051
    Train [7648/9843]	 | 	Loss: 0.19206
    Train [8288/9843]	 | 	Loss: 0.07423
    Train [8928/9843]	 | 	Loss: 0.22323
    Train [9568/9843]	 | 	Loss: 0.12871
==> Train | Average loss: 0.1855
==> Test  | Average loss: 0.3119
==> Test  | Accuracy: 90.4781
Best epoch: 31
Best accuracy: 90.80226904376013

Epoch 39:


Batches:   0%|          | 0/308 [00:00<?, ?it/s]

    Train [608/9843]	 | 	Loss: 0.08259
    Train [1248/9843]	 | 	Loss: 0.08865
    Train [1888/9843]	 | 	Loss: 0.07018
    Train [2528/9843]	 | 	Loss: 0.07888
    Train [3168/9843]	 | 	Loss: 0.06104
    Train [3808/9843]	 | 	Loss: 0.14657
    Train [4448/9843]	 | 	Loss: 0.16258
    Train [5088/9843]	 | 	Loss: 0.12998
    Train [5728/9843]	 | 	Loss: 0.22634
    Train [6368/9843]	 | 	Loss: 0.14603
    Train [7008/9843]	 | 	Loss: 0.07236
    Train [7648/9843]	 | 	Loss: 0.21217
    Train [8288/9843]	 | 	Loss: 0.05900
    Train [8928/9843]	 | 	Loss: 0.12191
    Train [9568/9843]	 | 	Loss: 0.05775
==> Train | Average loss: 0.1589
==> Test  | Average loss: 0.2983
==> Test  | Accuracy: 91.1264
Best epoch: 39
Best accuracy: 91.12641815235008

Epoch 40:


Batches:   0%|          | 0/308 [00:00<?, ?it/s]

    Train [608/9843]	 | 	Loss: 0.09292
    Train [1248/9843]	 | 	Loss: 0.10100
    Train [1888/9843]	 | 	Loss: 0.11531
    Train [2528/9843]	 | 	Loss: 0.28369
    Train [3168/9843]	 | 	Loss: 0.16862
    Train [3808/9843]	 | 	Loss: 0.03748
    Train [4448/9843]	 | 	Loss: 0.14773
    Train [5088/9843]	 | 	Loss: 0.03624
    Train [5728/9843]	 | 	Loss: 0.34471
    Train [6368/9843]	 | 	Loss: 0.11325
    Train [7008/9843]	 | 	Loss: 0.10707
    Train [7648/9843]	 | 	Loss: 0.14186
    Train [8288/9843]	 | 	Loss: 0.05505
    Train [8928/9843]	 | 	Loss: 0.21902
    Train [9568/9843]	 | 	Loss: 0.10529
==> Train | Average loss: 0.1513
==> Test  | Average loss: 0.2992
==> Test  | Accuracy: 90.9643
Best epoch: 39
Best accuracy: 91.12641815235008

Epoch 41:


Batches:   0%|          | 0/308 [00:00<?, ?it/s]

    Train [608/9843]	 | 	Loss: 0.10532
    Train [1248/9843]	 | 	Loss: 0.21109
    Train [1888/9843]	 | 	Loss: 0.03252
    Train [2528/9843]	 | 	Loss: 0.29943
    Train [3168/9843]	 | 	Loss: 0.09494
    Train [3808/9843]	 | 	Loss: 0.09296
    Train [4448/9843]	 | 	Loss: 0.12231
    Train [5088/9843]	 | 	Loss: 0.22437
    Train [5728/9843]	 | 	Loss: 0.28487
    Train [6368/9843]	 | 	Loss: 0.04586
    Train [7008/9843]	 | 	Loss: 0.22813
    Train [7648/9843]	 | 	Loss: 0.06995
    Train [8288/9843]	 | 	Loss: 0.03442
    Train [8928/9843]	 | 	Loss: 0.10715
    Train [9568/9843]	 | 	Loss: 0.18414
==> Train | Average loss: 0.1442
==> Test  | Average loss: 0.2994
==> Test  | Accuracy: 91.2075
Best epoch: 41
Best accuracy: 91.20745542949756

Epoch 42:


Batches:   0%|          | 0/308 [00:00<?, ?it/s]

    Train [608/9843]	 | 	Loss: 0.10031
    Train [1248/9843]	 | 	Loss: 0.07118
    Train [1888/9843]	 | 	Loss: 0.11666
    Train [2528/9843]	 | 	Loss: 0.04418
    Train [3168/9843]	 | 	Loss: 0.15550
    Train [3808/9843]	 | 	Loss: 0.16307
    Train [4448/9843]	 | 	Loss: 0.04749
    Train [5088/9843]	 | 	Loss: 0.05762
    Train [5728/9843]	 | 	Loss: 0.19652
    Train [6368/9843]	 | 	Loss: 0.20804
    Train [7008/9843]	 | 	Loss: 0.18262
    Train [7648/9843]	 | 	Loss: 0.04682
    Train [8288/9843]	 | 	Loss: 0.03413
    Train [8928/9843]	 | 	Loss: 0.05081
    Train [9568/9843]	 | 	Loss: 0.12365
==> Train | Average loss: 0.1462
==> Test  | Average loss: 0.2977
==> Test  | Accuracy: 91.3695
Best epoch: 42
Best accuracy: 91.36952998379255

Epoch 43:


Batches:   0%|          | 0/308 [00:00<?, ?it/s]

    Train [608/9843]	 | 	Loss: 0.10110
    Train [1248/9843]	 | 	Loss: 0.13201
    Train [1888/9843]	 | 	Loss: 0.10884
    Train [2528/9843]	 | 	Loss: 0.02795
    Train [3168/9843]	 | 	Loss: 0.10043
    Train [3808/9843]	 | 	Loss: 0.07243
    Train [4448/9843]	 | 	Loss: 0.14835
    Train [5088/9843]	 | 	Loss: 0.11563
    Train [5728/9843]	 | 	Loss: 0.07625
    Train [6368/9843]	 | 	Loss: 0.33806
    Train [7008/9843]	 | 	Loss: 0.12916
    Train [7648/9843]	 | 	Loss: 0.07745
    Train [8288/9843]	 | 	Loss: 0.09668
    Train [8928/9843]	 | 	Loss: 0.07501
    Train [9568/9843]	 | 	Loss: 0.16695
==> Train | Average loss: 0.1368
==> Test  | Average loss: 0.3026
==> Test  | Accuracy: 90.9643
Best epoch: 42
Best accuracy: 91.36952998379255

Epoch 44:


Batches:   0%|          | 0/308 [00:00<?, ?it/s]

    Train [608/9843]	 | 	Loss: 0.09372
    Train [1248/9843]	 | 	Loss: 0.02791
    Train [1888/9843]	 | 	Loss: 0.05182
    Train [2528/9843]	 | 	Loss: 0.27530
    Train [3168/9843]	 | 	Loss: 0.02545
    Train [3808/9843]	 | 	Loss: 0.16242
    Train [4448/9843]	 | 	Loss: 0.04268
    Train [5088/9843]	 | 	Loss: 0.13335
    Train [5728/9843]	 | 	Loss: 0.03493
    Train [6368/9843]	 | 	Loss: 0.09776
    Train [7008/9843]	 | 	Loss: 0.08516
    Train [7648/9843]	 | 	Loss: 0.03451
    Train [8288/9843]	 | 	Loss: 0.08485
    Train [8928/9843]	 | 	Loss: 0.08505
    Train [9568/9843]	 | 	Loss: 0.10300
==> Train | Average loss: 0.1297
==> Test  | Average loss: 0.2940
==> Test  | Accuracy: 91.1669
Best epoch: 42
Best accuracy: 91.36952998379255

Epoch 45:


Batches:   0%|          | 0/308 [00:00<?, ?it/s]

    Train [608/9843]	 | 	Loss: 0.15828
    Train [1248/9843]	 | 	Loss: 0.06428
    Train [1888/9843]	 | 	Loss: 0.08748
    Train [2528/9843]	 | 	Loss: 0.08626
    Train [3168/9843]	 | 	Loss: 0.31072
    Train [3808/9843]	 | 	Loss: 0.07791
    Train [4448/9843]	 | 	Loss: 0.07746
    Train [5088/9843]	 | 	Loss: 0.37719
    Train [5728/9843]	 | 	Loss: 0.07959
    Train [6368/9843]	 | 	Loss: 0.11743
    Train [7008/9843]	 | 	Loss: 0.13346
    Train [7648/9843]	 | 	Loss: 0.19334
    Train [8288/9843]	 | 	Loss: 0.09952
    Train [8928/9843]	 | 	Loss: 0.10000
    Train [9568/9843]	 | 	Loss: 0.09256
==> Train | Average loss: 0.1327
==> Test  | Average loss: 0.3155
==> Test  | Accuracy: 90.6807
Best epoch: 42
Best accuracy: 91.36952998379255

Epoch 46:


Batches:   0%|          | 0/308 [00:00<?, ?it/s]

    Train [608/9843]	 | 	Loss: 0.09301
    Train [1248/9843]	 | 	Loss: 0.05709
    Train [1888/9843]	 | 	Loss: 0.06135
    Train [2528/9843]	 | 	Loss: 0.03565
    Train [3168/9843]	 | 	Loss: 0.22228
    Train [3808/9843]	 | 	Loss: 0.13389
    Train [4448/9843]	 | 	Loss: 0.08086
    Train [5088/9843]	 | 	Loss: 0.19724
    Train [5728/9843]	 | 	Loss: 0.19749
    Train [6368/9843]	 | 	Loss: 0.28251
    Train [7008/9843]	 | 	Loss: 0.11975
    Train [7648/9843]	 | 	Loss: 0.08789
    Train [8288/9843]	 | 	Loss: 0.19780
    Train [8928/9843]	 | 	Loss: 0.32446
    Train [9568/9843]	 | 	Loss: 0.09562
==> Train | Average loss: 0.1365
==> Test  | Average loss: 0.3148
==> Test  | Accuracy: 90.3566
Best epoch: 42
Best accuracy: 91.36952998379255

Epoch 47:


Batches:   0%|          | 0/308 [00:00<?, ?it/s]

    Train [608/9843]	 | 	Loss: 0.07378
    Train [1248/9843]	 | 	Loss: 0.06857
    Train [1888/9843]	 | 	Loss: 0.18835
    Train [2528/9843]	 | 	Loss: 0.06727
    Train [3168/9843]	 | 	Loss: 0.08049
    Train [3808/9843]	 | 	Loss: 0.35286
    Train [4448/9843]	 | 	Loss: 0.20454
    Train [5088/9843]	 | 	Loss: 0.20868
    Train [5728/9843]	 | 	Loss: 0.10624
    Train [6368/9843]	 | 	Loss: 0.18791
    Train [7008/9843]	 | 	Loss: 0.23560
    Train [7648/9843]	 | 	Loss: 0.06275
    Train [8288/9843]	 | 	Loss: 0.25615
    Train [8928/9843]	 | 	Loss: 0.04962
    Train [9568/9843]	 | 	Loss: 0.03062
==> Train | Average loss: 0.1237
==> Test  | Average loss: 0.3298
==> Test  | Accuracy: 90.3566
Best epoch: 42
Best accuracy: 91.36952998379255

Epoch 48:


Batches:   0%|          | 0/308 [00:00<?, ?it/s]

    Train [608/9843]	 | 	Loss: 0.08856
    Train [1248/9843]	 | 	Loss: 0.20897
    Train [1888/9843]	 | 	Loss: 0.16084
    Train [2528/9843]	 | 	Loss: 0.11759
    Train [3168/9843]	 | 	Loss: 0.10673
    Train [3808/9843]	 | 	Loss: 0.05837
    Train [4448/9843]	 | 	Loss: 0.20054
    Train [5088/9843]	 | 	Loss: 0.04044
    Train [5728/9843]	 | 	Loss: 0.13078
    Train [6368/9843]	 | 	Loss: 0.08773
    Train [7008/9843]	 | 	Loss: 0.09188
    Train [7648/9843]	 | 	Loss: 0.16859
    Train [8288/9843]	 | 	Loss: 0.06897
    Train [8928/9843]	 | 	Loss: 0.11106
    Train [9568/9843]	 | 	Loss: 0.05682
==> Train | Average loss: 0.1314
==> Test  | Average loss: 0.3362
==> Test  | Accuracy: 90.3160
Best epoch: 42
Best accuracy: 91.36952998379255

Epoch 49:


Batches:   0%|          | 0/308 [00:00<?, ?it/s]

    Train [608/9843]	 | 	Loss: 0.05523
    Train [1248/9843]	 | 	Loss: 0.34809
    Train [1888/9843]	 | 	Loss: 0.12134
    Train [2528/9843]	 | 	Loss: 0.04798
    Train [3168/9843]	 | 	Loss: 0.11328
    Train [3808/9843]	 | 	Loss: 0.09210
    Train [4448/9843]	 | 	Loss: 0.18967
    Train [5088/9843]	 | 	Loss: 0.11691
    Train [5728/9843]	 | 	Loss: 0.10359
    Train [6368/9843]	 | 	Loss: 0.00740
    Train [7008/9843]	 | 	Loss: 0.11489
    Train [7648/9843]	 | 	Loss: 0.17460
    Train [8288/9843]	 | 	Loss: 0.03320
    Train [8928/9843]	 | 	Loss: 0.10921
    Train [9568/9843]	 | 	Loss: 0.06795
==> Train | Average loss: 0.1224
==> Test  | Average loss: 0.3398
==> Test  | Accuracy: 90.2755
Best epoch: 42
Best accuracy: 91.36952998379255

Epoch 50:


Batches:   0%|          | 0/308 [00:00<?, ?it/s]

    Train [608/9843]	 | 	Loss: 0.10652
    Train [1248/9843]	 | 	Loss: 0.12727
    Train [1888/9843]	 | 	Loss: 0.06972
    Train [2528/9843]	 | 	Loss: 0.21490
    Train [3168/9843]	 | 	Loss: 0.11220
    Train [3808/9843]	 | 	Loss: 0.05422
    Train [4448/9843]	 | 	Loss: 0.10847
    Train [5088/9843]	 | 	Loss: 0.14314
    Train [5728/9843]	 | 	Loss: 0.15955
    Train [6368/9843]	 | 	Loss: 0.15027
    Train [7008/9843]	 | 	Loss: 0.25619
    Train [7648/9843]	 | 	Loss: 0.17369
    Train [8288/9843]	 | 	Loss: 0.05384
    Train [8928/9843]	 | 	Loss: 0.09331
    Train [9568/9843]	 | 	Loss: 0.11310
==> Train | Average loss: 0.1187
==> Test  | Average loss: 0.3244
==> Test  | Accuracy: 90.1945
Best epoch: 42
Best accuracy: 91.36952998379255

Epoch 51:


Batches:   0%|          | 0/308 [00:00<?, ?it/s]

    Train [608/9843]	 | 	Loss: 0.02252
    Train [1248/9843]	 | 	Loss: 0.15056
    Train [1888/9843]	 | 	Loss: 0.06326
    Train [2528/9843]	 | 	Loss: 0.07241
    Train [3168/9843]	 | 	Loss: 0.15529
    Train [3808/9843]	 | 	Loss: 0.21875
    Train [4448/9843]	 | 	Loss: 0.28267
    Train [5088/9843]	 | 	Loss: 0.16621
    Train [5728/9843]	 | 	Loss: 0.05504
    Train [6368/9843]	 | 	Loss: 0.11900
    Train [7008/9843]	 | 	Loss: 0.12021
    Train [7648/9843]	 | 	Loss: 0.03797
    Train [8288/9843]	 | 	Loss: 0.08979
    Train [8928/9843]	 | 	Loss: 0.09987
    Train [9568/9843]	 | 	Loss: 0.02801
==> Train | Average loss: 0.1180
==> Test  | Average loss: 0.3073
==> Test  | Accuracy: 90.7212
Best epoch: 42
Best accuracy: 91.36952998379255

Epoch 52:


Batches:   0%|          | 0/308 [00:00<?, ?it/s]

    Train [608/9843]	 | 	Loss: 0.20065
    Train [1248/9843]	 | 	Loss: 0.25535
    Train [1888/9843]	 | 	Loss: 0.25451
    Train [2528/9843]	 | 	Loss: 0.05801
    Train [3168/9843]	 | 	Loss: 0.09952
    Train [3808/9843]	 | 	Loss: 0.08246
    Train [4448/9843]	 | 	Loss: 0.08506
    Train [5088/9843]	 | 	Loss: 0.04511
    Train [5728/9843]	 | 	Loss: 0.01625
    Train [6368/9843]	 | 	Loss: 0.13663
    Train [7008/9843]	 | 	Loss: 0.05387
    Train [7648/9843]	 | 	Loss: 0.04412
    Train [8288/9843]	 | 	Loss: 0.23705
    Train [8928/9843]	 | 	Loss: 0.11400
    Train [9568/9843]	 | 	Loss: 0.09271
==> Train | Average loss: 0.1236
==> Test  | Average loss: 0.3340
==> Test  | Accuracy: 90.3160
Best epoch: 42
Best accuracy: 91.36952998379255

Epoch 53:


Batches:   0%|          | 0/308 [00:00<?, ?it/s]

    Train [608/9843]	 | 	Loss: 0.07560
    Train [1248/9843]	 | 	Loss: 0.12282
    Train [1888/9843]	 | 	Loss: 0.03947
    Train [2528/9843]	 | 	Loss: 0.23221
    Train [3168/9843]	 | 	Loss: 0.17088
    Train [3808/9843]	 | 	Loss: 0.08784
    Train [4448/9843]	 | 	Loss: 0.24857
    Train [5088/9843]	 | 	Loss: 0.19155
    Train [5728/9843]	 | 	Loss: 0.13499
    Train [6368/9843]	 | 	Loss: 0.12035
    Train [7008/9843]	 | 	Loss: 0.15495
    Train [7648/9843]	 | 	Loss: 0.18572
    Train [8288/9843]	 | 	Loss: 0.05946
    Train [8928/9843]	 | 	Loss: 0.20800
    Train [9568/9843]	 | 	Loss: 0.16064
==> Train | Average loss: 0.1092
==> Test  | Average loss: 0.3290
==> Test  | Accuracy: 90.3971
Best epoch: 42
Best accuracy: 91.36952998379255

Epoch 54:


Batches:   0%|          | 0/308 [00:00<?, ?it/s]

    Train [608/9843]	 | 	Loss: 0.04769
    Train [1248/9843]	 | 	Loss: 0.12375
    Train [1888/9843]	 | 	Loss: 0.05363
    Train [2528/9843]	 | 	Loss: 0.06001
    Train [3168/9843]	 | 	Loss: 0.17387
    Train [3808/9843]	 | 	Loss: 0.05718
    Train [4448/9843]	 | 	Loss: 0.12812
    Train [5088/9843]	 | 	Loss: 0.14846
    Train [5728/9843]	 | 	Loss: 0.02465
    Train [6368/9843]	 | 	Loss: 0.02627
    Train [7008/9843]	 | 	Loss: 0.22169
    Train [7648/9843]	 | 	Loss: 0.01145
    Train [8288/9843]	 | 	Loss: 0.05557
    Train [8928/9843]	 | 	Loss: 0.23833
    Train [9568/9843]	 | 	Loss: 0.11870
==> Train | Average loss: 0.1129
==> Test  | Average loss: 0.3312
==> Test  | Accuracy: 90.5997
Best epoch: 42
Best accuracy: 91.36952998379255

Epoch 55:


Batches:   0%|          | 0/308 [00:00<?, ?it/s]

    Train [608/9843]	 | 	Loss: 0.08985
    Train [1248/9843]	 | 	Loss: 0.12887
    Train [1888/9843]	 | 	Loss: 0.16904
    Train [2528/9843]	 | 	Loss: 0.18673
    Train [3168/9843]	 | 	Loss: 0.05364
    Train [3808/9843]	 | 	Loss: 0.08538
    Train [4448/9843]	 | 	Loss: 0.24893
    Train [5088/9843]	 | 	Loss: 0.07901
    Train [5728/9843]	 | 	Loss: 0.10350
    Train [6368/9843]	 | 	Loss: 0.01247
    Train [7008/9843]	 | 	Loss: 0.04461
    Train [7648/9843]	 | 	Loss: 0.05127
    Train [8288/9843]	 | 	Loss: 0.06696
    Train [8928/9843]	 | 	Loss: 0.13166
    Train [9568/9843]	 | 	Loss: 0.05159
==> Train | Average loss: 0.1065
==> Test  | Average loss: 0.3511
==> Test  | Accuracy: 90.1135
Best epoch: 42
Best accuracy: 91.36952998379255

Epoch 56:


Batches:   0%|          | 0/308 [00:00<?, ?it/s]

    Train [608/9843]	 | 	Loss: 0.07336
    Train [1248/9843]	 | 	Loss: 0.18221
    Train [1888/9843]	 | 	Loss: 0.19688
    Train [2528/9843]	 | 	Loss: 0.16733
    Train [3168/9843]	 | 	Loss: 0.02183
    Train [3808/9843]	 | 	Loss: 0.04609
    Train [4448/9843]	 | 	Loss: 0.11879
    Train [5088/9843]	 | 	Loss: 0.11809
    Train [5728/9843]	 | 	Loss: 0.17419
    Train [6368/9843]	 | 	Loss: 0.10661
    Train [7008/9843]	 | 	Loss: 0.03747
    Train [7648/9843]	 | 	Loss: 0.09901
    Train [8288/9843]	 | 	Loss: 0.03216
    Train [8928/9843]	 | 	Loss: 0.18162
    Train [9568/9843]	 | 	Loss: 0.02566
==> Train | Average loss: 0.1048
==> Test  | Average loss: 0.3241
==> Test  | Accuracy: 91.2480
Best epoch: 42
Best accuracy: 91.36952998379255

Epoch 57:


Batches:   0%|          | 0/308 [00:00<?, ?it/s]

    Train [608/9843]	 | 	Loss: 0.23946
    Train [1248/9843]	 | 	Loss: 0.22654
    Train [1888/9843]	 | 	Loss: 0.10912
    Train [2528/9843]	 | 	Loss: 0.09650
    Train [3168/9843]	 | 	Loss: 0.15813
    Train [3808/9843]	 | 	Loss: 0.22735
    Train [4448/9843]	 | 	Loss: 0.07892
    Train [5088/9843]	 | 	Loss: 0.10148
    Train [5728/9843]	 | 	Loss: 0.26366
    Train [6368/9843]	 | 	Loss: 0.04185
    Train [7008/9843]	 | 	Loss: 0.14620
    Train [7648/9843]	 | 	Loss: 0.08600
    Train [8288/9843]	 | 	Loss: 0.10379
    Train [8928/9843]	 | 	Loss: 0.14996
    Train [9568/9843]	 | 	Loss: 0.16786
==> Train | Average loss: 0.1167
==> Test  | Average loss: 0.3204
==> Test  | Accuracy: 91.0454
Best epoch: 42
Best accuracy: 91.36952998379255

Epoch 58:


Batches:   0%|          | 0/308 [00:00<?, ?it/s]

    Train [608/9843]	 | 	Loss: 0.16933
    Train [1248/9843]	 | 	Loss: 0.10848
    Train [1888/9843]	 | 	Loss: 0.13612
    Train [2528/9843]	 | 	Loss: 0.10401
    Train [3168/9843]	 | 	Loss: 0.03586
    Train [3808/9843]	 | 	Loss: 0.08352
    Train [4448/9843]	 | 	Loss: 0.15605
    Train [5088/9843]	 | 	Loss: 0.02767
    Train [5728/9843]	 | 	Loss: 0.13333
    Train [6368/9843]	 | 	Loss: 0.04086
    Train [7008/9843]	 | 	Loss: 0.05314
    Train [7648/9843]	 | 	Loss: 0.10708
    Train [8288/9843]	 | 	Loss: 0.04785
    Train [8928/9843]	 | 	Loss: 0.05835
    Train [9568/9843]	 | 	Loss: 0.04838
==> Train | Average loss: 0.1073
==> Test  | Average loss: 0.3326
==> Test  | Accuracy: 89.9514
Best epoch: 42
Best accuracy: 91.36952998379255

Epoch 59:


Batches:   0%|          | 0/308 [00:00<?, ?it/s]

    Train [608/9843]	 | 	Loss: 0.13153
    Train [1248/9843]	 | 	Loss: 0.08371
    Train [1888/9843]	 | 	Loss: 0.12316
    Train [2528/9843]	 | 	Loss: 0.12729
    Train [3168/9843]	 | 	Loss: 0.00221
    Train [3808/9843]	 | 	Loss: 0.10735
    Train [4448/9843]	 | 	Loss: 0.05970
    Train [5088/9843]	 | 	Loss: 0.08265
    Train [5728/9843]	 | 	Loss: 0.09377
    Train [6368/9843]	 | 	Loss: 0.02614
    Train [7008/9843]	 | 	Loss: 0.06514
    Train [7648/9843]	 | 	Loss: 0.03749
    Train [8288/9843]	 | 	Loss: 0.06633
    Train [8928/9843]	 | 	Loss: 0.05730
    Train [9568/9843]	 | 	Loss: 0.06251
==> Train | Average loss: 0.0984
==> Test  | Average loss: 0.3346
==> Test  | Accuracy: 90.5592
Best epoch: 42
Best accuracy: 91.36952998379255

Epoch 60:


Batches:   0%|          | 0/308 [00:00<?, ?it/s]

    Train [608/9843]	 | 	Loss: 0.07066
    Train [1248/9843]	 | 	Loss: 0.07559
    Train [1888/9843]	 | 	Loss: 0.03197
    Train [2528/9843]	 | 	Loss: 0.06213
    Train [3168/9843]	 | 	Loss: 0.13094
    Train [3808/9843]	 | 	Loss: 0.06004
    Train [4448/9843]	 | 	Loss: 0.67675
    Train [5088/9843]	 | 	Loss: 0.05861
    Train [5728/9843]	 | 	Loss: 0.08896
    Train [6368/9843]	 | 	Loss: 0.03017
    Train [7008/9843]	 | 	Loss: 0.05090
    Train [7648/9843]	 | 	Loss: 0.08126
    Train [8288/9843]	 | 	Loss: 0.02490
    Train [8928/9843]	 | 	Loss: 0.04917
    Train [9568/9843]	 | 	Loss: 0.04262
==> Train | Average loss: 0.0982
==> Test  | Average loss: 0.3250
==> Test  | Accuracy: 90.8023
Best epoch: 42
Best accuracy: 91.36952998379255

Epoch 61:


Batches:   0%|          | 0/308 [00:00<?, ?it/s]

    Train [608/9843]	 | 	Loss: 0.12776
    Train [1248/9843]	 | 	Loss: 0.06301
    Train [1888/9843]	 | 	Loss: 0.04543
    Train [2528/9843]	 | 	Loss: 0.14797
    Train [3168/9843]	 | 	Loss: 0.10836
    Train [3808/9843]	 | 	Loss: 0.03423
    Train [4448/9843]	 | 	Loss: 0.10499
    Train [5088/9843]	 | 	Loss: 0.02739
    Train [5728/9843]	 | 	Loss: 0.05915
    Train [6368/9843]	 | 	Loss: 0.03621
    Train [7008/9843]	 | 	Loss: 0.06261
    Train [7648/9843]	 | 	Loss: 0.00832
    Train [8288/9843]	 | 	Loss: 0.04603
    Train [8928/9843]	 | 	Loss: 0.08291
    Train [9568/9843]	 | 	Loss: 0.03634
==> Train | Average loss: 0.0879
==> Test  | Average loss: 0.3356
==> Test  | Accuracy: 90.4781
Best epoch: 42
Best accuracy: 91.36952998379255

Epoch 62:


Batches:   0%|          | 0/308 [00:00<?, ?it/s]

    Train [608/9843]	 | 	Loss: 0.07891
    Train [1248/9843]	 | 	Loss: 0.04386
    Train [1888/9843]	 | 	Loss: 0.01745
    Train [2528/9843]	 | 	Loss: 0.10655
    Train [3168/9843]	 | 	Loss: 0.03819
    Train [3808/9843]	 | 	Loss: 0.04400
    Train [4448/9843]	 | 	Loss: 0.10844
    Train [5088/9843]	 | 	Loss: 0.02767
    Train [5728/9843]	 | 	Loss: 0.02962
    Train [6368/9843]	 | 	Loss: 0.08756
    Train [7008/9843]	 | 	Loss: 0.11487
    Train [7648/9843]	 | 	Loss: 0.04698
    Train [8288/9843]	 | 	Loss: 0.03924
    Train [8928/9843]	 | 	Loss: 0.02552
    Train [9568/9843]	 | 	Loss: 0.12062
==> Train | Average loss: 0.0885
==> Test  | Average loss: 0.3300
==> Test  | Accuracy: 90.7212
Best epoch: 42
Best accuracy: 91.36952998379255

Epoch 63:


Batches:   0%|          | 0/308 [00:00<?, ?it/s]

    Train [608/9843]	 | 	Loss: 0.02152
    Train [1248/9843]	 | 	Loss: 0.02341
    Train [1888/9843]	 | 	Loss: 0.08774
    Train [2528/9843]	 | 	Loss: 0.08518
    Train [3168/9843]	 | 	Loss: 0.02733
    Train [3808/9843]	 | 	Loss: 0.08163
    Train [4448/9843]	 | 	Loss: 0.15080
    Train [5088/9843]	 | 	Loss: 0.06647
    Train [5728/9843]	 | 	Loss: 0.11230
    Train [6368/9843]	 | 	Loss: 0.09451
    Train [7008/9843]	 | 	Loss: 0.04997
    Train [7648/9843]	 | 	Loss: 0.08640
    Train [8288/9843]	 | 	Loss: 0.04187
    Train [8928/9843]	 | 	Loss: 0.07307
    Train [9568/9843]	 | 	Loss: 0.12356
==> Train | Average loss: 0.0810
==> Test  | Average loss: 0.3345
==> Test  | Accuracy: 90.8023
Best epoch: 42
Best accuracy: 91.36952998379255

Epoch 64:


Batches:   0%|          | 0/308 [00:00<?, ?it/s]

    Train [608/9843]	 | 	Loss: 0.06857
    Train [1248/9843]	 | 	Loss: 0.22261
    Train [1888/9843]	 | 	Loss: 0.11374
    Train [2528/9843]	 | 	Loss: 0.13599
    Train [3168/9843]	 | 	Loss: 0.29181
    Train [3808/9843]	 | 	Loss: 0.20088
    Train [4448/9843]	 | 	Loss: 0.18374
    Train [5088/9843]	 | 	Loss: 0.09374
    Train [5728/9843]	 | 	Loss: 0.05090
    Train [6368/9843]	 | 	Loss: 0.09685
    Train [7008/9843]	 | 	Loss: 0.06422
    Train [7648/9843]	 | 	Loss: 0.17210
    Train [8288/9843]	 | 	Loss: 0.02575
    Train [8928/9843]	 | 	Loss: 0.01496
    Train [9568/9843]	 | 	Loss: 0.01359
==> Train | Average loss: 0.0913
==> Test  | Average loss: 0.3322
==> Test  | Accuracy: 90.8833
Best epoch: 42
Best accuracy: 91.36952998379255

Epoch 65:


Batches:   0%|          | 0/308 [00:00<?, ?it/s]

    Train [608/9843]	 | 	Loss: 0.04041
    Train [1248/9843]	 | 	Loss: 0.09407
    Train [1888/9843]	 | 	Loss: 0.19891
    Train [2528/9843]	 | 	Loss: 0.13451
    Train [3168/9843]	 | 	Loss: 0.06283
    Train [3808/9843]	 | 	Loss: 0.06842
    Train [4448/9843]	 | 	Loss: 0.13914
    Train [5088/9843]	 | 	Loss: 0.07859
    Train [5728/9843]	 | 	Loss: 0.02865
    Train [6368/9843]	 | 	Loss: 0.01839
    Train [7008/9843]	 | 	Loss: 0.08034
    Train [7648/9843]	 | 	Loss: 0.08518
    Train [8288/9843]	 | 	Loss: 0.16480
    Train [8928/9843]	 | 	Loss: 0.33922
    Train [9568/9843]	 | 	Loss: 0.02834
==> Train | Average loss: 0.0838
==> Test  | Average loss: 0.3315
==> Test  | Accuracy: 90.8833
Best epoch: 42
Best accuracy: 91.36952998379255

Epoch 66:


Batches:   0%|          | 0/308 [00:00<?, ?it/s]

    Train [608/9843]	 | 	Loss: 0.24743
    Train [1248/9843]	 | 	Loss: 0.07017
    Train [1888/9843]	 | 	Loss: 0.09791
    Train [2528/9843]	 | 	Loss: 0.03151
    Train [3168/9843]	 | 	Loss: 0.02726
    Train [3808/9843]	 | 	Loss: 0.12301
    Train [4448/9843]	 | 	Loss: 0.00865
    Train [5088/9843]	 | 	Loss: 0.12200
    Train [5728/9843]	 | 	Loss: 0.03776
    Train [6368/9843]	 | 	Loss: 0.00978
    Train [7008/9843]	 | 	Loss: 0.04752
    Train [7648/9843]	 | 	Loss: 0.08650
    Train [8288/9843]	 | 	Loss: 0.19805
    Train [8928/9843]	 | 	Loss: 0.09101
    Train [9568/9843]	 | 	Loss: 0.12856
==> Train | Average loss: 0.0862
==> Test  | Average loss: 0.3528
==> Test  | Accuracy: 90.5186
Best epoch: 42
Best accuracy: 91.36952998379255

Epoch 67:


Batches:   0%|          | 0/308 [00:00<?, ?it/s]

    Train [608/9843]	 | 	Loss: 0.05140
    Train [1248/9843]	 | 	Loss: 0.06977
    Train [1888/9843]	 | 	Loss: 0.08474
    Train [2528/9843]	 | 	Loss: 0.08459
    Train [3168/9843]	 | 	Loss: 0.05733
    Train [3808/9843]	 | 	Loss: 0.17591
    Train [4448/9843]	 | 	Loss: 0.18387
    Train [5088/9843]	 | 	Loss: 0.02012
    Train [5728/9843]	 | 	Loss: 0.08440
    Train [6368/9843]	 | 	Loss: 0.16160
    Train [7008/9843]	 | 	Loss: 0.00893
    Train [7648/9843]	 | 	Loss: 0.08164
    Train [8288/9843]	 | 	Loss: 0.00525
    Train [8928/9843]	 | 	Loss: 0.10197
    Train [9568/9843]	 | 	Loss: 0.06990
==> Train | Average loss: 0.0800
==> Test  | Average loss: 0.3290
==> Test  | Accuracy: 90.8428
Best epoch: 42
Best accuracy: 91.36952998379255

Epoch 68:


Batches:   0%|          | 0/308 [00:00<?, ?it/s]

    Train [608/9843]	 | 	Loss: 0.07076
    Train [1248/9843]	 | 	Loss: 0.01118
    Train [1888/9843]	 | 	Loss: 0.05426
    Train [2528/9843]	 | 	Loss: 0.08999
    Train [3168/9843]	 | 	Loss: 0.05098
    Train [3808/9843]	 | 	Loss: 0.03168
    Train [4448/9843]	 | 	Loss: 0.08934
    Train [5088/9843]	 | 	Loss: 0.17674
    Train [5728/9843]	 | 	Loss: 0.04686
    Train [6368/9843]	 | 	Loss: 0.02548
    Train [7008/9843]	 | 	Loss: 0.08609
    Train [7648/9843]	 | 	Loss: 0.04104
    Train [8288/9843]	 | 	Loss: 0.04425
    Train [8928/9843]	 | 	Loss: 0.17073
    Train [9568/9843]	 | 	Loss: 0.03978
==> Train | Average loss: 0.0819
==> Test  | Average loss: 0.3352
==> Test  | Accuracy: 90.6807
Best epoch: 42
Best accuracy: 91.36952998379255

Epoch 69:


Batches:   0%|          | 0/308 [00:00<?, ?it/s]

    Train [608/9843]	 | 	Loss: 0.06922
    Train [1248/9843]	 | 	Loss: 0.02419
    Train [1888/9843]	 | 	Loss: 0.10903
    Train [2528/9843]	 | 	Loss: 0.08484
    Train [3168/9843]	 | 	Loss: 0.18194
    Train [3808/9843]	 | 	Loss: 0.02227
    Train [4448/9843]	 | 	Loss: 0.01502
    Train [5088/9843]	 | 	Loss: 0.04963
    Train [5728/9843]	 | 	Loss: 0.09919
    Train [6368/9843]	 | 	Loss: 0.03460
    Train [7008/9843]	 | 	Loss: 0.04967
    Train [7648/9843]	 | 	Loss: 0.01110
    Train [8288/9843]	 | 	Loss: 0.08218
    Train [8928/9843]	 | 	Loss: 0.02162
    Train [9568/9843]	 | 	Loss: 0.16380
==> Train | Average loss: 0.0824
==> Test  | Average loss: 0.3489
==> Test  | Accuracy: 90.2755
Best epoch: 42
Best accuracy: 91.36952998379255

Epoch 70:


Batches:   0%|          | 0/308 [00:00<?, ?it/s]

    Train [608/9843]	 | 	Loss: 0.04288
    Train [1248/9843]	 | 	Loss: 0.06359
    Train [1888/9843]	 | 	Loss: 0.00780
    Train [2528/9843]	 | 	Loss: 0.08531
    Train [3168/9843]	 | 	Loss: 0.01023
    Train [3808/9843]	 | 	Loss: 0.04416
    Train [4448/9843]	 | 	Loss: 0.04913
    Train [5088/9843]	 | 	Loss: 0.00632
    Train [5728/9843]	 | 	Loss: 0.02328
    Train [6368/9843]	 | 	Loss: 0.26429
    Train [7008/9843]	 | 	Loss: 0.09601
    Train [7648/9843]	 | 	Loss: 0.07096
    Train [8288/9843]	 | 	Loss: 0.04080
    Train [8928/9843]	 | 	Loss: 0.07127
    Train [9568/9843]	 | 	Loss: 0.04245
==> Train | Average loss: 0.0788
==> Test  | Average loss: 0.3407
==> Test  | Accuracy: 90.7212
Best epoch: 42
Best accuracy: 91.36952998379255

Epoch 71:


Batches:   0%|          | 0/308 [00:00<?, ?it/s]

    Train [608/9843]	 | 	Loss: 0.02664
    Train [1248/9843]	 | 	Loss: 0.06354
    Train [1888/9843]	 | 	Loss: 0.44851
    Train [2528/9843]	 | 	Loss: 0.01253
    Train [3168/9843]	 | 	Loss: 0.19956
    Train [3808/9843]	 | 	Loss: 0.02676
    Train [4448/9843]	 | 	Loss: 0.05561
    Train [5088/9843]	 | 	Loss: 0.20500
    Train [5728/9843]	 | 	Loss: 0.15637
    Train [6368/9843]	 | 	Loss: 0.06279
    Train [7008/9843]	 | 	Loss: 0.01519
    Train [7648/9843]	 | 	Loss: 0.04566
    Train [8288/9843]	 | 	Loss: 0.00702
    Train [8928/9843]	 | 	Loss: 0.11601
    Train [9568/9843]	 | 	Loss: 0.23698
==> Train | Average loss: 0.0777
==> Test  | Average loss: 0.3391
==> Test  | Accuracy: 90.3160
Best epoch: 42
Best accuracy: 91.36952998379255

Epoch 72:


Batches:   0%|          | 0/308 [00:00<?, ?it/s]

    Train [608/9843]	 | 	Loss: 0.20662
    Train [1248/9843]	 | 	Loss: 0.02955
    Train [1888/9843]	 | 	Loss: 0.15429
    Train [2528/9843]	 | 	Loss: 0.01610
    Train [3168/9843]	 | 	Loss: 0.09129
    Train [3808/9843]	 | 	Loss: 0.01496
    Train [4448/9843]	 | 	Loss: 0.09014
    Train [5088/9843]	 | 	Loss: 0.10629
    Train [5728/9843]	 | 	Loss: 0.05398
    Train [6368/9843]	 | 	Loss: 0.01669
    Train [7008/9843]	 | 	Loss: 0.01302
    Train [7648/9843]	 | 	Loss: 0.34221
    Train [8288/9843]	 | 	Loss: 0.01587
    Train [8928/9843]	 | 	Loss: 0.05304
    Train [9568/9843]	 | 	Loss: 0.04510
==> Train | Average loss: 0.0784
==> Test  | Average loss: 0.3457
==> Test  | Accuracy: 90.8023
Best epoch: 42
Best accuracy: 91.36952998379255

Epoch 73:


Batches:   0%|          | 0/308 [00:00<?, ?it/s]

    Train [608/9843]	 | 	Loss: 0.37742
    Train [1248/9843]	 | 	Loss: 0.15832
    Train [1888/9843]	 | 	Loss: 0.04178
    Train [2528/9843]	 | 	Loss: 0.04788
    Train [3168/9843]	 | 	Loss: 0.01922
    Train [3808/9843]	 | 	Loss: 0.09152
    Train [4448/9843]	 | 	Loss: 0.08423
    Train [5088/9843]	 | 	Loss: 0.03916
    Train [5728/9843]	 | 	Loss: 0.02180
    Train [6368/9843]	 | 	Loss: 0.08048
    Train [7008/9843]	 | 	Loss: 0.05752
    Train [7648/9843]	 | 	Loss: 0.06398
    Train [8288/9843]	 | 	Loss: 0.25252
    Train [8928/9843]	 | 	Loss: 0.04482
    Train [9568/9843]	 | 	Loss: 0.11291
==> Train | Average loss: 0.0799
==> Test  | Average loss: 0.3475
==> Test  | Accuracy: 90.6402
Best epoch: 42
Best accuracy: 91.36952998379255

Epoch 74:


Batches:   0%|          | 0/308 [00:00<?, ?it/s]

    Train [608/9843]	 | 	Loss: 0.04064
    Train [1248/9843]	 | 	Loss: 0.04904
    Train [1888/9843]	 | 	Loss: 0.12905
    Train [2528/9843]	 | 	Loss: 0.01769
    Train [3168/9843]	 | 	Loss: 0.08201
    Train [3808/9843]	 | 	Loss: 0.01538
    Train [4448/9843]	 | 	Loss: 0.02356
    Train [5088/9843]	 | 	Loss: 0.11448
    Train [5728/9843]	 | 	Loss: 0.13993
    Train [6368/9843]	 | 	Loss: 0.03600
    Train [7008/9843]	 | 	Loss: 0.34971
    Train [7648/9843]	 | 	Loss: 0.02785
    Train [8288/9843]	 | 	Loss: 0.07017
    Train [8928/9843]	 | 	Loss: 0.05575
    Train [9568/9843]	 | 	Loss: 0.14650
==> Train | Average loss: 0.0784
==> Test  | Average loss: 0.3576
==> Test  | Accuracy: 90.5186
Best epoch: 42
Best accuracy: 91.36952998379255

Epoch 75:


Batches:   0%|          | 0/308 [00:00<?, ?it/s]

    Train [608/9843]	 | 	Loss: 0.03180
    Train [1248/9843]	 | 	Loss: 0.01701
    Train [1888/9843]	 | 	Loss: 0.02079
    Train [2528/9843]	 | 	Loss: 0.02935
    Train [3168/9843]	 | 	Loss: 0.04282
    Train [3808/9843]	 | 	Loss: 0.06709
    Train [4448/9843]	 | 	Loss: 0.08381
    Train [5088/9843]	 | 	Loss: 0.01583
    Train [5728/9843]	 | 	Loss: 0.00532
    Train [6368/9843]	 | 	Loss: 0.10570
    Train [7008/9843]	 | 	Loss: 0.03123
    Train [7648/9843]	 | 	Loss: 0.06840
    Train [8288/9843]	 | 	Loss: 0.13962
    Train [8928/9843]	 | 	Loss: 0.10465
    Train [9568/9843]	 | 	Loss: 0.00847
==> Train | Average loss: 0.0760
==> Test  | Average loss: 0.3429
==> Test  | Accuracy: 90.5592
Best epoch: 42
Best accuracy: 91.36952998379255

Epoch 76:


Batches:   0%|          | 0/308 [00:00<?, ?it/s]

    Train [608/9843]	 | 	Loss: 0.10390
    Train [1248/9843]	 | 	Loss: 0.07872
    Train [1888/9843]	 | 	Loss: 0.08334
    Train [2528/9843]	 | 	Loss: 0.06950
    Train [3168/9843]	 | 	Loss: 0.01681
    Train [3808/9843]	 | 	Loss: 0.05471
    Train [4448/9843]	 | 	Loss: 0.01032
    Train [5088/9843]	 | 	Loss: 0.03461
    Train [5728/9843]	 | 	Loss: 0.02841
    Train [6368/9843]	 | 	Loss: 0.07419
    Train [7008/9843]	 | 	Loss: 0.01893
    Train [7648/9843]	 | 	Loss: 0.01478
    Train [8288/9843]	 | 	Loss: 0.05627
    Train [8928/9843]	 | 	Loss: 0.08021
    Train [9568/9843]	 | 	Loss: 0.03303
==> Train | Average loss: 0.0706
==> Test  | Average loss: 0.3562
==> Test  | Accuracy: 90.7618
Best epoch: 42
Best accuracy: 91.36952998379255

Epoch 77:


Batches:   0%|          | 0/308 [00:00<?, ?it/s]

    Train [608/9843]	 | 	Loss: 0.04146
    Train [1248/9843]	 | 	Loss: 0.05207
    Train [1888/9843]	 | 	Loss: 0.08022
    Train [2528/9843]	 | 	Loss: 0.06852
    Train [3168/9843]	 | 	Loss: 0.05969
    Train [3808/9843]	 | 	Loss: 0.02980
    Train [4448/9843]	 | 	Loss: 0.02854
    Train [5088/9843]	 | 	Loss: 0.03633
    Train [5728/9843]	 | 	Loss: 0.10739
    Train [6368/9843]	 | 	Loss: 0.10638
    Train [7008/9843]	 | 	Loss: 0.03231
    Train [7648/9843]	 | 	Loss: 0.07112
    Train [8288/9843]	 | 	Loss: 0.08459
    Train [8928/9843]	 | 	Loss: 0.00510
    Train [9568/9843]	 | 	Loss: 0.04241
==> Train | Average loss: 0.0764
==> Test  | Average loss: 0.3529
==> Test  | Accuracy: 90.6807
Best epoch: 42
Best accuracy: 91.36952998379255

Epoch 78:


Batches:   0%|          | 0/308 [00:00<?, ?it/s]

    Train [608/9843]	 | 	Loss: 0.06951
    Train [1248/9843]	 | 	Loss: 0.11227
    Train [1888/9843]	 | 	Loss: 0.00894
    Train [2528/9843]	 | 	Loss: 0.15200
    Train [3168/9843]	 | 	Loss: 0.07079
    Train [3808/9843]	 | 	Loss: 0.13760
    Train [4448/9843]	 | 	Loss: 0.04806
    Train [5088/9843]	 | 	Loss: 0.10376
    Train [5728/9843]	 | 	Loss: 0.03825
    Train [6368/9843]	 | 	Loss: 0.00899
    Train [7008/9843]	 | 	Loss: 0.09345
    Train [7648/9843]	 | 	Loss: 0.01527
    Train [8288/9843]	 | 	Loss: 0.02790
    Train [8928/9843]	 | 	Loss: 0.20382
    Train [9568/9843]	 | 	Loss: 0.01742
==> Train | Average loss: 0.0781
==> Test  | Average loss: 0.3488
==> Test  | Accuracy: 90.5186
Best epoch: 42
Best accuracy: 91.36952998379255

Epoch 79:


Batches:   0%|          | 0/308 [00:00<?, ?it/s]

    Train [608/9843]	 | 	Loss: 0.01196
    Train [1248/9843]	 | 	Loss: 0.07928
    Train [1888/9843]	 | 	Loss: 0.05722
    Train [2528/9843]	 | 	Loss: 0.02474
    Train [3168/9843]	 | 	Loss: 0.09830
    Train [3808/9843]	 | 	Loss: 0.16216
    Train [4448/9843]	 | 	Loss: 0.01764
    Train [5088/9843]	 | 	Loss: 0.03695
    Train [5728/9843]	 | 	Loss: 0.09432
    Train [6368/9843]	 | 	Loss: 0.04193
    Train [7008/9843]	 | 	Loss: 0.00605
    Train [7648/9843]	 | 	Loss: 0.03618
    Train [8288/9843]	 | 	Loss: 0.03301
    Train [8928/9843]	 | 	Loss: 0.02358
    Train [9568/9843]	 | 	Loss: 0.01935
==> Train | Average loss: 0.0674
==> Test  | Average loss: 0.3424
==> Test  | Accuracy: 90.8833
Best epoch: 42
Best accuracy: 91.36952998379255

Epoch 80:


Batches:   0%|          | 0/308 [00:00<?, ?it/s]

    Train [608/9843]	 | 	Loss: 0.11713
    Train [1248/9843]	 | 	Loss: 0.00561
    Train [1888/9843]	 | 	Loss: 0.06239
    Train [2528/9843]	 | 	Loss: 0.04064
    Train [3168/9843]	 | 	Loss: 0.02802
    Train [3808/9843]	 | 	Loss: 0.01675
    Train [4448/9843]	 | 	Loss: 0.20365
    Train [5088/9843]	 | 	Loss: 0.00559
    Train [5728/9843]	 | 	Loss: 0.04238
    Train [6368/9843]	 | 	Loss: 0.20063
    Train [7008/9843]	 | 	Loss: 0.09653
    Train [7648/9843]	 | 	Loss: 0.09094
    Train [8288/9843]	 | 	Loss: 0.03230
    Train [8928/9843]	 | 	Loss: 0.01723
    Train [9568/9843]	 | 	Loss: 0.11828
==> Train | Average loss: 0.0698
==> Test  | Average loss: 0.3447
==> Test  | Accuracy: 91.2480
Best epoch: 42
Best accuracy: 91.36952998379255

Epoch 81:


Batches:   0%|          | 0/308 [00:00<?, ?it/s]

    Train [608/9843]	 | 	Loss: 0.11886
    Train [1248/9843]	 | 	Loss: 0.05125
    Train [1888/9843]	 | 	Loss: 0.02385
    Train [2528/9843]	 | 	Loss: 0.06973
    Train [3168/9843]	 | 	Loss: 0.05836
    Train [3808/9843]	 | 	Loss: 0.26547
    Train [4448/9843]	 | 	Loss: 0.07814
    Train [5088/9843]	 | 	Loss: 0.00671
    Train [5728/9843]	 | 	Loss: 0.01061
    Train [6368/9843]	 | 	Loss: 0.16065
    Train [7008/9843]	 | 	Loss: 0.06003
    Train [7648/9843]	 | 	Loss: 0.03039
    Train [8288/9843]	 | 	Loss: 0.00970
    Train [8928/9843]	 | 	Loss: 0.00477
    Train [9568/9843]	 | 	Loss: 0.01135
==> Train | Average loss: 0.0685
==> Test  | Average loss: 0.3513
==> Test  | Accuracy: 91.2885
Best epoch: 42
Best accuracy: 91.36952998379255

Epoch 82:


Batches:   0%|          | 0/308 [00:00<?, ?it/s]

    Train [608/9843]	 | 	Loss: 0.03015
    Train [1248/9843]	 | 	Loss: 0.19371
    Train [1888/9843]	 | 	Loss: 0.04565
    Train [2528/9843]	 | 	Loss: 0.04027
    Train [3168/9843]	 | 	Loss: 0.00926
    Train [3808/9843]	 | 	Loss: 0.02437
    Train [4448/9843]	 | 	Loss: 0.04175
    Train [5088/9843]	 | 	Loss: 0.08587
    Train [5728/9843]	 | 	Loss: 0.00877
    Train [6368/9843]	 | 	Loss: 0.08678
    Train [7008/9843]	 | 	Loss: 0.09715
    Train [7648/9843]	 | 	Loss: 0.02826
    Train [8288/9843]	 | 	Loss: 0.02394
    Train [8928/9843]	 | 	Loss: 0.02718
    Train [9568/9843]	 | 	Loss: 0.03629
==> Train | Average loss: 0.0615
==> Test  | Average loss: 0.3559
==> Test  | Accuracy: 90.6402
Best epoch: 42
Best accuracy: 91.36952998379255

Epoch 83:


Batches:   0%|          | 0/308 [00:00<?, ?it/s]

    Train [608/9843]	 | 	Loss: 0.00538
    Train [1248/9843]	 | 	Loss: 0.02829
    Train [1888/9843]	 | 	Loss: 0.05602
    Train [2528/9843]	 | 	Loss: 0.04149
    Train [3168/9843]	 | 	Loss: 0.08198
    Train [3808/9843]	 | 	Loss: 0.04656
    Train [4448/9843]	 | 	Loss: 0.03351
    Train [5088/9843]	 | 	Loss: 0.00720
    Train [5728/9843]	 | 	Loss: 0.09195
    Train [6368/9843]	 | 	Loss: 0.05119
    Train [7008/9843]	 | 	Loss: 0.06585
    Train [7648/9843]	 | 	Loss: 0.03728
    Train [8288/9843]	 | 	Loss: 0.08100
    Train [8928/9843]	 | 	Loss: 0.03079
    Train [9568/9843]	 | 	Loss: 0.05317
==> Train | Average loss: 0.0659
==> Test  | Average loss: 0.3506
==> Test  | Accuracy: 90.5186
Best epoch: 42
Best accuracy: 91.36952998379255

Epoch 84:


Batches:   0%|          | 0/308 [00:00<?, ?it/s]

    Train [608/9843]	 | 	Loss: 0.08936
    Train [1248/9843]	 | 	Loss: 0.06975
    Train [1888/9843]	 | 	Loss: 0.00587
    Train [2528/9843]	 | 	Loss: 0.03002
    Train [3168/9843]	 | 	Loss: 0.02915
    Train [3808/9843]	 | 	Loss: 0.01648
    Train [4448/9843]	 | 	Loss: 0.01544
    Train [5088/9843]	 | 	Loss: 0.04904
    Train [5728/9843]	 | 	Loss: 0.03164
    Train [6368/9843]	 | 	Loss: 0.00692
    Train [7008/9843]	 | 	Loss: 0.03958
    Train [7648/9843]	 | 	Loss: 0.03465
    Train [8288/9843]	 | 	Loss: 0.04520
    Train [8928/9843]	 | 	Loss: 0.05364
    Train [9568/9843]	 | 	Loss: 0.04939
==> Train | Average loss: 0.0624
==> Test  | Average loss: 0.3509
==> Test  | Accuracy: 90.8023
Best epoch: 42
Best accuracy: 91.36952998379255

Epoch 85:


Batches:   0%|          | 0/308 [00:00<?, ?it/s]

    Train [608/9843]	 | 	Loss: 0.01738
    Train [1248/9843]	 | 	Loss: 0.07016
    Train [1888/9843]	 | 	Loss: 0.04659
    Train [2528/9843]	 | 	Loss: 0.04975
    Train [3168/9843]	 | 	Loss: 0.19023
    Train [3808/9843]	 | 	Loss: 0.05957
    Train [4448/9843]	 | 	Loss: 0.05702
    Train [5088/9843]	 | 	Loss: 0.03884
    Train [5728/9843]	 | 	Loss: 0.05905
    Train [6368/9843]	 | 	Loss: 0.10401
    Train [7008/9843]	 | 	Loss: 0.10756
    Train [7648/9843]	 | 	Loss: 0.02947
    Train [8288/9843]	 | 	Loss: 0.02332
    Train [8928/9843]	 | 	Loss: 0.10619
    Train [9568/9843]	 | 	Loss: 0.03072
==> Train | Average loss: 0.0637
==> Test  | Average loss: 0.3594
==> Test  | Accuracy: 90.6807
Best epoch: 42
Best accuracy: 91.36952998379255

Epoch 86:


Batches:   0%|          | 0/308 [00:00<?, ?it/s]

    Train [608/9843]	 | 	Loss: 0.03482
    Train [1248/9843]	 | 	Loss: 0.06865
    Train [1888/9843]	 | 	Loss: 0.02881
    Train [2528/9843]	 | 	Loss: 0.14206
    Train [3168/9843]	 | 	Loss: 0.03621
    Train [3808/9843]	 | 	Loss: 0.00896
    Train [4448/9843]	 | 	Loss: 0.02842
    Train [5088/9843]	 | 	Loss: 0.21788
    Train [5728/9843]	 | 	Loss: 0.05983
    Train [6368/9843]	 | 	Loss: 0.08200
    Train [7008/9843]	 | 	Loss: 0.02313
    Train [7648/9843]	 | 	Loss: 0.04608
    Train [8288/9843]	 | 	Loss: 0.00961
    Train [8928/9843]	 | 	Loss: 0.00805
    Train [9568/9843]	 | 	Loss: 0.04398
==> Train | Average loss: 0.0647
==> Test  | Average loss: 0.3560
==> Test  | Accuracy: 90.5592
Best epoch: 42
Best accuracy: 91.36952998379255

Epoch 87:


Batches:   0%|          | 0/308 [00:00<?, ?it/s]

    Train [608/9843]	 | 	Loss: 0.03675
    Train [1248/9843]	 | 	Loss: 0.01905
    Train [1888/9843]	 | 	Loss: 0.03953
    Train [2528/9843]	 | 	Loss: 0.07099
    Train [3168/9843]	 | 	Loss: 0.02681
    Train [3808/9843]	 | 	Loss: 0.05568
    Train [4448/9843]	 | 	Loss: 0.02396
    Train [5088/9843]	 | 	Loss: 0.01905
    Train [5728/9843]	 | 	Loss: 0.10905
    Train [6368/9843]	 | 	Loss: 0.04175
    Train [7008/9843]	 | 	Loss: 0.00799
    Train [7648/9843]	 | 	Loss: 0.04228
    Train [8288/9843]	 | 	Loss: 0.07431
    Train [8928/9843]	 | 	Loss: 0.09064
    Train [9568/9843]	 | 	Loss: 0.23027
==> Train | Average loss: 0.0627
==> Test  | Average loss: 0.3820
==> Test  | Accuracy: 90.5997
Best epoch: 42
Best accuracy: 91.36952998379255

Epoch 88:


Batches:   0%|          | 0/308 [00:00<?, ?it/s]

    Train [608/9843]	 | 	Loss: 0.08267
    Train [1248/9843]	 | 	Loss: 0.03713
    Train [1888/9843]	 | 	Loss: 0.04830
    Train [2528/9843]	 | 	Loss: 0.00300
    Train [3168/9843]	 | 	Loss: 0.03089
    Train [3808/9843]	 | 	Loss: 0.15232
    Train [4448/9843]	 | 	Loss: 0.01412
    Train [5088/9843]	 | 	Loss: 0.01524
    Train [5728/9843]	 | 	Loss: 0.04786
    Train [6368/9843]	 | 	Loss: 0.04804
    Train [7008/9843]	 | 	Loss: 0.05680
    Train [7648/9843]	 | 	Loss: 0.01922
    Train [8288/9843]	 | 	Loss: 0.11871
    Train [8928/9843]	 | 	Loss: 0.10407
    Train [9568/9843]	 | 	Loss: 0.09353
==> Train | Average loss: 0.0617
==> Test  | Average loss: 0.3625
==> Test  | Accuracy: 90.5997
Best epoch: 42
Best accuracy: 91.36952998379255

Epoch 89:


Batches:   0%|          | 0/308 [00:00<?, ?it/s]

    Train [608/9843]	 | 	Loss: 0.02602
    Train [1248/9843]	 | 	Loss: 0.02954
    Train [1888/9843]	 | 	Loss: 0.01084
    Train [2528/9843]	 | 	Loss: 0.01081
    Train [3168/9843]	 | 	Loss: 0.03011
    Train [3808/9843]	 | 	Loss: 0.01544
    Train [4448/9843]	 | 	Loss: 0.03022
    Train [5088/9843]	 | 	Loss: 0.05280
    Train [5728/9843]	 | 	Loss: 0.00837
    Train [6368/9843]	 | 	Loss: 0.01368
    Train [7008/9843]	 | 	Loss: 0.04911
    Train [7648/9843]	 | 	Loss: 0.17789
    Train [8288/9843]	 | 	Loss: 0.10283
    Train [8928/9843]	 | 	Loss: 0.09095
    Train [9568/9843]	 | 	Loss: 0.04354
==> Train | Average loss: 0.0608
==> Test  | Average loss: 0.3645
==> Test  | Accuracy: 90.5592
Best epoch: 42
Best accuracy: 91.36952998379255

Epoch 90:


Batches:   0%|          | 0/308 [00:00<?, ?it/s]

    Train [608/9843]	 | 	Loss: 0.03867
    Train [1248/9843]	 | 	Loss: 0.18835
    Train [1888/9843]	 | 	Loss: 0.05781
    Train [2528/9843]	 | 	Loss: 0.20271
    Train [3168/9843]	 | 	Loss: 0.02138
    Train [3808/9843]	 | 	Loss: 0.36293
    Train [4448/9843]	 | 	Loss: 0.00905
    Train [5088/9843]	 | 	Loss: 0.16164
    Train [5728/9843]	 | 	Loss: 0.11789
    Train [6368/9843]	 | 	Loss: 0.02597
    Train [7008/9843]	 | 	Loss: 0.03384
    Train [7648/9843]	 | 	Loss: 0.02723
    Train [8288/9843]	 | 	Loss: 0.01298
    Train [8928/9843]	 | 	Loss: 0.02936
    Train [9568/9843]	 | 	Loss: 0.04293
==> Train | Average loss: 0.0643
==> Test  | Average loss: 0.3784
==> Test  | Accuracy: 90.8428
Best epoch: 42
Best accuracy: 91.36952998379255

Epoch 91:


Batches:   0%|          | 0/308 [00:00<?, ?it/s]

    Train [608/9843]	 | 	Loss: 0.00709
    Train [1248/9843]	 | 	Loss: 0.06611
    Train [1888/9843]	 | 	Loss: 0.03594
    Train [2528/9843]	 | 	Loss: 0.02804
    Train [3168/9843]	 | 	Loss: 0.02404
    Train [3808/9843]	 | 	Loss: 0.00730
    Train [4448/9843]	 | 	Loss: 0.16404
    Train [5088/9843]	 | 	Loss: 0.03523
    Train [5728/9843]	 | 	Loss: 0.03518
    Train [6368/9843]	 | 	Loss: 0.01887
    Train [7008/9843]	 | 	Loss: 0.05034
    Train [7648/9843]	 | 	Loss: 0.15162
    Train [8288/9843]	 | 	Loss: 0.09956
    Train [8928/9843]	 | 	Loss: 0.00686
    Train [9568/9843]	 | 	Loss: 0.01455
==> Train | Average loss: 0.0582
==> Test  | Average loss: 0.3652
==> Test  | Accuracy: 90.6402
Best epoch: 42
Best accuracy: 91.36952998379255

Epoch 92:


Batches:   0%|          | 0/308 [00:00<?, ?it/s]

    Train [608/9843]	 | 	Loss: 0.01105
    Train [1248/9843]	 | 	Loss: 0.07676
    Train [1888/9843]	 | 	Loss: 0.00768
    Train [2528/9843]	 | 	Loss: 0.00936
    Train [3168/9843]	 | 	Loss: 0.09137
    Train [3808/9843]	 | 	Loss: 0.19329
    Train [4448/9843]	 | 	Loss: 0.03806
    Train [5088/9843]	 | 	Loss: 0.05417
    Train [5728/9843]	 | 	Loss: 0.04224
    Train [6368/9843]	 | 	Loss: 0.03746
    Train [7008/9843]	 | 	Loss: 0.02140
    Train [7648/9843]	 | 	Loss: 0.07654
    Train [8288/9843]	 | 	Loss: 0.05017
    Train [8928/9843]	 | 	Loss: 0.36620
    Train [9568/9843]	 | 	Loss: 0.10376
==> Train | Average loss: 0.0617
==> Test  | Average loss: 0.3628
==> Test  | Accuracy: 90.8023
Best epoch: 42
Best accuracy: 91.36952998379255

Epoch 93:


Batches:   0%|          | 0/308 [00:00<?, ?it/s]

    Train [608/9843]	 | 	Loss: 0.04250
    Train [1248/9843]	 | 	Loss: 0.06911
    Train [1888/9843]	 | 	Loss: 0.15251
    Train [2528/9843]	 | 	Loss: 0.05162
    Train [3168/9843]	 | 	Loss: 0.06760
    Train [3808/9843]	 | 	Loss: 0.14364
    Train [4448/9843]	 | 	Loss: 0.03438
    Train [5088/9843]	 | 	Loss: 0.08623
    Train [5728/9843]	 | 	Loss: 0.02720
    Train [6368/9843]	 | 	Loss: 0.01040
    Train [7008/9843]	 | 	Loss: 0.08100
    Train [7648/9843]	 | 	Loss: 0.10727
    Train [8288/9843]	 | 	Loss: 0.00624
    Train [8928/9843]	 | 	Loss: 0.01629
    Train [9568/9843]	 | 	Loss: 0.02453
==> Train | Average loss: 0.0590
==> Test  | Average loss: 0.3569
==> Test  | Accuracy: 90.7212
Best epoch: 42
Best accuracy: 91.36952998379255

Epoch 94:


Batches:   0%|          | 0/308 [00:00<?, ?it/s]

    Train [608/9843]	 | 	Loss: 0.05889
    Train [1248/9843]	 | 	Loss: 0.01830
    Train [1888/9843]	 | 	Loss: 0.01308
    Train [2528/9843]	 | 	Loss: 0.01573
    Train [3168/9843]	 | 	Loss: 0.00826
    Train [3808/9843]	 | 	Loss: 0.12600
    Train [4448/9843]	 | 	Loss: 0.02351
    Train [5088/9843]	 | 	Loss: 0.06886
    Train [5728/9843]	 | 	Loss: 0.04567
    Train [6368/9843]	 | 	Loss: 0.01196
    Train [7008/9843]	 | 	Loss: 0.02302
    Train [7648/9843]	 | 	Loss: 0.05849
    Train [8288/9843]	 | 	Loss: 0.03369
    Train [8928/9843]	 | 	Loss: 0.01877
    Train [9568/9843]	 | 	Loss: 0.05308
==> Train | Average loss: 0.0639
==> Test  | Average loss: 0.3726
==> Test  | Accuracy: 90.6807
Best epoch: 42
Best accuracy: 91.36952998379255

Epoch 95:


Batches:   0%|          | 0/308 [00:00<?, ?it/s]

    Train [608/9843]	 | 	Loss: 0.02896
    Train [1248/9843]	 | 	Loss: 0.16826
    Train [1888/9843]	 | 	Loss: 0.11292
    Train [2528/9843]	 | 	Loss: 0.00343
    Train [3168/9843]	 | 	Loss: 0.03454
    Train [3808/9843]	 | 	Loss: 0.02350
    Train [4448/9843]	 | 	Loss: 0.15038
    Train [5088/9843]	 | 	Loss: 0.00599
    Train [5728/9843]	 | 	Loss: 0.07881
    Train [6368/9843]	 | 	Loss: 0.04843
    Train [7008/9843]	 | 	Loss: 0.11237
    Train [7648/9843]	 | 	Loss: 0.02079
    Train [8288/9843]	 | 	Loss: 0.02234
    Train [8928/9843]	 | 	Loss: 0.02146
    Train [9568/9843]	 | 	Loss: 0.06107
==> Train | Average loss: 0.0609
==> Test  | Average loss: 0.3607
==> Test  | Accuracy: 90.8023
Best epoch: 42
Best accuracy: 91.36952998379255

Epoch 96:


Batches:   0%|          | 0/308 [00:00<?, ?it/s]

    Train [608/9843]	 | 	Loss: 0.18295
    Train [1248/9843]	 | 	Loss: 0.09999
    Train [1888/9843]	 | 	Loss: 0.11797
    Train [2528/9843]	 | 	Loss: 0.07554
    Train [3168/9843]	 | 	Loss: 0.18048
    Train [3808/9843]	 | 	Loss: 0.01934
    Train [4448/9843]	 | 	Loss: 0.06336
    Train [5088/9843]	 | 	Loss: 0.07844
    Train [5728/9843]	 | 	Loss: 0.14180
    Train [6368/9843]	 | 	Loss: 0.06051
    Train [7008/9843]	 | 	Loss: 0.00906
    Train [7648/9843]	 | 	Loss: 0.16236
    Train [8288/9843]	 | 	Loss: 0.02216
    Train [8928/9843]	 | 	Loss: 0.06853
    Train [9568/9843]	 | 	Loss: 0.20338
==> Train | Average loss: 0.0604
==> Test  | Average loss: 0.3659
==> Test  | Accuracy: 90.9238
Best epoch: 42
Best accuracy: 91.36952998379255

Epoch 97:


Batches:   0%|          | 0/308 [00:00<?, ?it/s]

    Train [608/9843]	 | 	Loss: 0.01625
    Train [1248/9843]	 | 	Loss: 0.06990
    Train [1888/9843]	 | 	Loss: 0.11454
    Train [2528/9843]	 | 	Loss: 0.00623
    Train [3168/9843]	 | 	Loss: 0.02849
    Train [3808/9843]	 | 	Loss: 0.01984
    Train [4448/9843]	 | 	Loss: 0.04499
    Train [5088/9843]	 | 	Loss: 0.01770
    Train [5728/9843]	 | 	Loss: 0.04731
    Train [6368/9843]	 | 	Loss: 0.01197
    Train [7008/9843]	 | 	Loss: 0.06943
    Train [7648/9843]	 | 	Loss: 0.09640
    Train [8288/9843]	 | 	Loss: 0.14786
    Train [8928/9843]	 | 	Loss: 0.20673
    Train [9568/9843]	 | 	Loss: 0.07346
==> Train | Average loss: 0.0543
==> Test  | Average loss: 0.3572
==> Test  | Accuracy: 91.0049
Best epoch: 42
Best accuracy: 91.36952998379255

Epoch 98:


Batches:   0%|          | 0/308 [00:00<?, ?it/s]

    Train [608/9843]	 | 	Loss: 0.03055
    Train [1248/9843]	 | 	Loss: 0.01213
    Train [1888/9843]	 | 	Loss: 0.09225
    Train [2528/9843]	 | 	Loss: 0.00460
    Train [3168/9843]	 | 	Loss: 0.06523
    Train [3808/9843]	 | 	Loss: 0.05060
    Train [4448/9843]	 | 	Loss: 0.10118
    Train [5088/9843]	 | 	Loss: 0.01679
    Train [5728/9843]	 | 	Loss: 0.02774
    Train [6368/9843]	 | 	Loss: 0.01593
    Train [7008/9843]	 | 	Loss: 0.05786
    Train [7648/9843]	 | 	Loss: 0.04523
    Train [8288/9843]	 | 	Loss: 0.01229
    Train [8928/9843]	 | 	Loss: 0.01408
    Train [9568/9843]	 | 	Loss: 0.01488
==> Train | Average loss: 0.0580
==> Test  | Average loss: 0.3780
==> Test  | Accuracy: 90.8428
Best epoch: 42
Best accuracy: 91.36952998379255

Epoch 99:


Batches:   0%|          | 0/308 [00:00<?, ?it/s]

    Train [608/9843]	 | 	Loss: 0.01606
    Train [1248/9843]	 | 	Loss: 0.07994
    Train [1888/9843]	 | 	Loss: 0.09747
    Train [2528/9843]	 | 	Loss: 0.03654


KeyboardInterrupt: 