In [0]:
import pdb
import argparse
import numpy as np
from tqdm import tqdm
import math

import torch
import torch.nn as nn
import torch.nn.functional as F
from torch.autograd import Variable
import torch.backends.cudnn as cudnn
from torch.optim.lr_scheduler import MultiStepLR

import torchvision
import torchvision.transforms as transforms
from torchvision.utils import make_grid
from torchvision import datasets, transforms

In [2]:
# Mount the user's Google Drive inside the Colab VM at /content/gdrive.
# Running this cell prompts for an OAuth authorization code (see output below).
from google.colab import drive
drive.mount('/content/gdrive')

Go to this URL in a browser: https://accounts.google.com/o/oauth2/auth?client_id=947318989803-6bn6qk8qdgf4n4g3pfee6491hc0brc4i.apps.googleusercontent.com&redirect_uri=urn%3Aietf%3Awg%3Aoauth%3A2.0%3Aoob&scope=email%20https%3A%2F%2Fwww.googleapis.com%2Fauth%2Fdocs.test%20https%3A%2F%2Fwww.googleapis.com%2Fauth%2Fdrive%20https%3A%2F%2Fwww.googleapis.com%2Fauth%2Fdrive.photos.readonly%20https%3A%2F%2Fwww.googleapis.com%2Fauth%2Fpeopleapi.readonly&response_type=code

Enter your authorization code:
··········
Mounted at /content/gdrive


In [0]:
class Cutout(object):
    """Erase randomly positioned square regions of an image tensor.

    Args:
        n_holes (int): How many square regions are erased per image.
        length (int): Side length, in pixels, of each square before it is
            clipped at the image border.
    """
    def __init__(self, n_holes, length):
        self.n_holes = n_holes
        self.length = length

    def __call__(self, img):
        """
        Args:
            img (Tensor): Image tensor indexed as (C, H, W).
        Returns:
            Tensor: ``img`` multiplied by a 0/1 mask that is zero inside every
            sampled square; the same mask is applied to each channel.
        """
        height, width = img.size(1), img.size(2)
        keep = np.ones((height, width), np.float32)

        for _ in range(self.n_holes):
            # The centre row is drawn before the centre column so the sequence
            # of random numbers consumed per hole stays fixed.
            centre_y = np.random.randint(height)
            centre_x = np.random.randint(width)
            half = self.length // 2

            # Squares that overhang the border are truncated, not shifted.
            top, bottom = np.clip([centre_y - half, centre_y + half], 0, height)
            left, right = np.clip([centre_x - half, centre_x + half], 0, width)

            keep[top:bottom, left:right] = 0.

        return img * torch.from_numpy(keep).expand_as(img)


In [0]:
class BasicBlock(nn.Module):
    """Pre-activation residual unit: BN-ReLU-conv3x3, BN-ReLU-(dropout)-conv3x3, plus shortcut.

    Args:
        in_planes (int): Channels of the incoming feature map.
        out_planes (int): Channels produced by both 3x3 convolutions.
        stride (int): Stride of the first 3x3 convolution and of the 1x1
            shortcut convolution (when one is created).
        dropRate (float): Dropout probability applied between the two
            convolutions; dropout is skipped when it is not positive.
    """
    def __init__(self, in_planes, out_planes, stride, dropRate=0.0):
        super().__init__()
        # Submodules are created in this exact order so parameter registration
        # (and the random numbers consumed by default initialisation) is stable.
        self.bn1 = nn.BatchNorm2d(in_planes)
        self.relu1 = nn.ReLU(inplace=True)
        self.conv1 = nn.Conv2d(in_planes, out_planes, kernel_size=3,
                               stride=stride, padding=1, bias=False)
        self.bn2 = nn.BatchNorm2d(out_planes)
        self.relu2 = nn.ReLU(inplace=True)
        self.conv2 = nn.Conv2d(out_planes, out_planes, kernel_size=3,
                               stride=1, padding=1, bias=False)
        self.droprate = dropRate
        self.equalInOut = (in_planes == out_planes)
        if self.equalInOut:
            # Identity shortcut: no projection layer is needed.
            self.convShortcut = None
        else:
            # 1x1 projection so the shortcut matches the residual branch's channels.
            self.convShortcut = nn.Conv2d(in_planes, out_planes, kernel_size=1,
                                          stride=stride, padding=0, bias=False)

    def forward(self, x):
        """Return ``shortcut(x) + residual(x)``.

        With equal in/out channels the shortcut is the raw input ``x``;
        otherwise it is the 1x1 projection of the BN-ReLU activated input.
        """
        activated = self.relu1(self.bn1(x))

        residual = self.conv1(activated)
        residual = self.relu2(self.bn2(residual))
        if self.droprate > 0:
            residual = F.dropout(residual, p=self.droprate, training=self.training)
        residual = self.conv2(residual)

        if self.equalInOut:
            shortcut = x
        else:
            shortcut = self.convShortcut(activated)
        return torch.add(shortcut, residual)

class NetworkBlock(nn.Module):
    """A sequential stack of ``nb_layers`` residual units built by ``block``.

    Args:
        nb_layers (int or float): Number of units; truncated with ``int()``.
        in_planes (int): Input channels of the first unit.
        out_planes (int): Output channels of every unit.
        block (callable): Factory called positionally as
            ``block(in_planes, out_planes, stride, dropRate)``.
        stride (int): Stride of the first unit; later units use stride 1.
        dropRate (float): Forwarded unchanged to every unit.
    """
    def __init__(self, nb_layers, in_planes, out_planes, block, stride, dropRate=0.0):
        super().__init__()
        self.layer = self._make_layer(block, in_planes, out_planes, nb_layers, stride, dropRate)

    def _make_layer(self, block, in_planes, out_planes, nb_layers, stride, dropRate):
        """Instantiate the units and wrap them in an ``nn.Sequential``."""
        units = []
        for index in range(int(nb_layers)):
            if index == 0:
                # Only the first unit changes channel count / resolution.
                # A falsy in_planes or stride falls back to out_planes / 1.
                unit_in = in_planes or out_planes
                unit_stride = stride or 1
            else:
                unit_in = out_planes
                unit_stride = 1
            units.append(block(unit_in, out_planes, unit_stride, dropRate))
        return nn.Sequential(*units)

    def forward(self, x):
        """Apply every unit in order."""
        return self.layer(x)

class WideResNet(nn.Module):
    """Wide residual network: a 3x3 stem, three residual stages, BN-ReLU, global pooling, linear head.

    Args:
        depth (int): Total depth; must satisfy ``(depth - 4) % 6 == 0``. Each
            of the three stages gets ``(depth - 4) // 6`` ``BasicBlock`` units.
        num_classes (int): Size of the output logit vector.
        widen_factor (int): Multiplier applied to the 16/32/64 stage widths.
        dropRate (float): Dropout probability forwarded to every unit.

    Raises:
        AssertionError: If ``depth`` is not of the form ``6n + 4``.
    """
    def __init__(self, depth, num_classes, widen_factor=1, dropRate=0.0):
        super(WideResNet, self).__init__()
        nChannels = [16, 16*widen_factor, 32*widen_factor, 64*widen_factor]
        assert (depth - 4) % 6 == 0, 'depth must be of the form 6n + 4'
        # Integer division: this is a layer count, not a float.
        units_per_stage = (depth - 4) // 6
        block = BasicBlock
        # 1st conv before any network block
        self.conv1 = nn.Conv2d(3, nChannels[0], kernel_size=3, stride=1,
                               padding=1, bias=False)
        # Three stages; the 2nd and 3rd halve the spatial resolution (stride 2).
        self.block1 = NetworkBlock(units_per_stage, nChannels[0], nChannels[1], block, 1, dropRate)
        self.block2 = NetworkBlock(units_per_stage, nChannels[1], nChannels[2], block, 2, dropRate)
        self.block3 = NetworkBlock(units_per_stage, nChannels[2], nChannels[3], block, 2, dropRate)
        # global average pooling and classifier
        self.bn1 = nn.BatchNorm2d(nChannels[3])
        self.relu = nn.ReLU(inplace=True)
        self.fc = nn.Linear(nChannels[3], num_classes)
        self.nChannels = nChannels[3]

        # Weight initialisation: convolutions ~ N(0, sqrt(2 / fan_out)),
        # batch-norm scale 1 / shift 0, linear bias 0 (linear weight keeps
        # the framework default).
        for m in self.modules():
            if isinstance(m, nn.Conv2d):
                fan_out = m.kernel_size[0] * m.kernel_size[1] * m.out_channels
                nn.init.normal_(m.weight, 0, math.sqrt(2. / fan_out))
            elif isinstance(m, nn.BatchNorm2d):
                nn.init.constant_(m.weight, 1)
                nn.init.constant_(m.bias, 0)
            elif isinstance(m, nn.Linear):
                nn.init.constant_(m.bias, 0)

    def forward(self, x):
        """Map a batch of 3-channel images to ``(batch, num_classes)`` logits."""
        out = self.conv1(x)
        out = self.block1(out)
        out = self.block2(out)
        out = self.block3(out)
        out = self.relu(self.bn1(out))

        # Global average pooling over whatever spatial size is left. A fixed
        # 8x8 window only matched 32x32 inputs; for other sizes it either
        # failed or leaked spatial positions into the batch dimension.
        out = F.adaptive_avg_pool2d(out, 1)
        out = out.view(out.size(0), -1)
        out = self.fc(out)
        return out


In [0]:
# Per-channel normalisation; the statistics are written on a 0-255 scale and
# rescaled to the 0-1 range of the tensor it is applied to.
# NOTE(review): these values look like the commonly quoted CIFAR-10 statistics
# while the notebook trains on CIFAR-100 - confirm this is intended.
normalize = transforms.Normalize(
    mean=[channel / 255.0 for channel in (125.3, 123.0, 113.9)],
    std=[channel / 255.0 for channel in (63.0, 62.1, 66.7)],
)

In [0]:
# Training-time pipeline: padded random crop and horizontal flip on the PIL
# image, then tensor conversion, normalisation and a single 16-pixel Cutout.
train_transform = transforms.Compose([
    transforms.RandomCrop(32, padding=4),
    transforms.RandomHorizontalFlip(),
    transforms.ToTensor(),
    normalize,
    Cutout(n_holes=1, length=16),
])

In [0]:
# Evaluation pipeline: no augmentation, only tensor conversion + normalisation.
test_transform = transforms.Compose([transforms.ToTensor(), normalize])

In [8]:
# CIFAR-100 training split, downloaded to ./data on first use.
trainset = torchvision.datasets.CIFAR100(
    root='./data',
    train=True,
    download=True,
    transform=train_transform,
)

0it [00:00, ?it/s]

Downloading https://www.cs.toronto.edu/~kriz/cifar-100-python.tar.gz to ./data/cifar-100-python.tar.gz


169009152it [00:03, 42820359.36it/s]                               


In [0]:
# Shuffled training batches of 128 images, fetched by two worker processes.
trainLoader = torch.utils.data.DataLoader(
    trainset,
    batch_size=128,
    shuffle=True,
    num_workers=2,
    pin_memory=True,
)

In [10]:
# CIFAR-100 test split with the augmentation-free transform.
testset = torchvision.datasets.CIFAR100(
    root='./data',
    train=False,
    download=True,
    transform=test_transform,
)

Files already downloaded and verified


In [0]:
# Evaluation batches of 128 images in a fixed (unshuffled) order.
testLoader = torch.utils.data.DataLoader(
    testset,
    batch_size=128,
    shuffle=False,
    num_workers=2,
    pin_memory=True,
)

In [0]:
# Immutable copy of the dataset's class list (taken from the training split).
classes = tuple(trainset.classes)

In [0]:
# Depth-28 WideResNet with 100 outputs; widen_factor and dropRate keep their
# defaults (1 and 0.0).
cnn = WideResNet(depth=28, num_classes=100)

In [0]:
import torch.optim as optim

# Move the model (and the loss module) to the GPU, then build the optimizer
# over the GPU-resident parameters.
cnn = cnn.cuda()
criterion = nn.CrossEntropyLoss().cuda()

# SGD with Nesterov momentum and L2 weight decay.
cnn_optimizer = optim.SGD(
    cnn.parameters(),
    lr=0.1,
    momentum=0.9,
    nesterov=True,
    weight_decay=5e-4,
)

In [0]:
# Enable cuDNN's benchmark mode so it auto-tunes convolution algorithms for
# the (fixed) input shapes used in this notebook.
cudnn.benchmark = True

In [0]:
# Multiply the learning rate by 0.2 each time a milestone epoch is reached.
scheduler = MultiStepLR(
    cnn_optimizer,
    milestones=[60, 120, 160, 200, 240, 280, 320, 340, 360, 380],
    gamma=0.2,
)

In [0]:
def test(loader):
    cnn.eval()    # Change model to 'eval' mode (BN uses moving mean/var).
    correct = 0.
    total = 0.
    for images, labels in loader:
        images = images.cuda()
        labels = labels.cuda()

        with torch.no_grad():
            pred = cnn(images)

        pred = torch.max(pred.data, 1)[1]
        total += labels.size(0)
        correct += (pred == labels).sum().item()

    val_acc = correct / total
    cnn.train()
    return val_acc

In [0]:

def train(sepoch, eepoch, lr=0.1):
    """Train the notebook-level model for epochs ``sepoch`` .. ``eepoch - 1``.

    Operates on the module-level ``cnn``, ``criterion``, ``cnn_optimizer``,
    ``scheduler``, ``trainLoader`` and ``testLoader``. After every epoch the
    test accuracy is printed and the scheduler is stepped.

    Args:
        sepoch (int): First epoch index (inclusive).
        eepoch (int): Last epoch index (exclusive).
        lr (float): Unused; kept so existing calls remain valid. The learning
            rate actually applied comes from ``cnn_optimizer`` / ``scheduler``.
    """
    for epoch in range(sepoch, eepoch):
        # Select training mode explicitly rather than relying on test() having
        # left the model in that state.
        cnn.train()

        xentropy_loss_avg = 0.
        correct = 0.
        total = 0.

        progress_bar = tqdm(trainLoader)
        progress_bar.set_description('Epoch ' + str(epoch))
        for i, (images, labels) in enumerate(progress_bar):
            images = images.cuda()
            labels = labels.cuda()

            cnn.zero_grad()
            pred = cnn(images)

            xentropy_loss = criterion(pred, labels)
            xentropy_loss.backward()
            cnn_optimizer.step()

            xentropy_loss_avg += xentropy_loss.item()

            # Running accuracy over the batches seen so far in this epoch.
            pred = pred.detach().argmax(dim=1)
            total += labels.size(0)
            correct += (pred == labels).sum().item()
            accuracy = correct / total

            progress_bar.set_postfix(
                xentropy='%.3f' % (xentropy_loss_avg / (i + 1)),
                acc='%.3f' % accuracy)

        test_acc = test(testLoader)
        tqdm.write('test_acc: %.3f' % (test_acc))

        # The explicit epoch index keeps the schedule tied to `epoch` when
        # training is started from sepoch > 0.
        # NOTE(review): newer PyTorch releases deprecate passing the epoch to
        # step(); left as is because switching changes the LR schedule.
        scheduler.step(epoch)
    

In [21]:
# Full run: epochs 0 through 399.
train(sepoch=0, eepoch=400)

Epoch 0: 100%|██████████| 391/391 [00:36<00:00, 10.76it/s, acc=0.140, xentropy=3.550]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.186


Epoch 1: 100%|██████████| 391/391 [00:36<00:00, 12.11it/s, acc=0.207, xentropy=3.170]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.241


Epoch 2: 100%|██████████| 391/391 [00:36<00:00, 12.11it/s, acc=0.264, xentropy=2.868]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.251


Epoch 3: 100%|██████████| 391/391 [00:36<00:00, 10.82it/s, acc=0.306, xentropy=2.675]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.300


Epoch 4: 100%|██████████| 391/391 [00:35<00:00, 12.46it/s, acc=0.332, xentropy=2.550]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.294


Epoch 5: 100%|██████████| 391/391 [00:36<00:00, 10.79it/s, acc=0.356, xentropy=2.438]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.350


Epoch 6: 100%|██████████| 391/391 [00:35<00:00, 12.16it/s, acc=0.372, xentropy=2.354]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.368


Epoch 7: 100%|██████████| 391/391 [00:34<00:00, 11.20it/s, acc=0.388, xentropy=2.287]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.355


Epoch 8: 100%|██████████| 391/391 [00:34<00:00, 12.20it/s, acc=0.405, xentropy=2.230]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.348


Epoch 9: 100%|██████████| 391/391 [00:34<00:00, 12.48it/s, acc=0.411, xentropy=2.185]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.403


Epoch 10: 100%|██████████| 391/391 [00:34<00:00, 11.21it/s, acc=0.423, xentropy=2.145]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.336


Epoch 11: 100%|██████████| 391/391 [00:34<00:00, 12.38it/s, acc=0.432, xentropy=2.104]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.412


Epoch 12: 100%|██████████| 391/391 [00:34<00:00, 12.60it/s, acc=0.437, xentropy=2.081]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.381


Epoch 13: 100%|██████████| 391/391 [00:34<00:00, 11.29it/s, acc=0.445, xentropy=2.055]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.392


Epoch 14: 100%|██████████| 391/391 [00:34<00:00, 11.31it/s, acc=0.447, xentropy=2.032]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.307


Epoch 15: 100%|██████████| 391/391 [00:34<00:00, 11.28it/s, acc=0.454, xentropy=2.018]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.410


Epoch 16: 100%|██████████| 391/391 [00:34<00:00, 12.48it/s, acc=0.457, xentropy=1.992]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.388


Epoch 17: 100%|██████████| 391/391 [00:34<00:00, 11.19it/s, acc=0.458, xentropy=1.982]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.444


Epoch 18: 100%|██████████| 391/391 [00:34<00:00, 11.20it/s, acc=0.464, xentropy=1.975]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.378


Epoch 19: 100%|██████████| 391/391 [00:34<00:00, 12.53it/s, acc=0.466, xentropy=1.957]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.458


Epoch 20: 100%|██████████| 391/391 [00:34<00:00, 12.40it/s, acc=0.468, xentropy=1.950]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.446


Epoch 21: 100%|██████████| 391/391 [00:34<00:00, 11.19it/s, acc=0.468, xentropy=1.937]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.456


Epoch 22: 100%|██████████| 391/391 [00:35<00:00, 11.17it/s, acc=0.473, xentropy=1.931]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.440


Epoch 23: 100%|██████████| 391/391 [00:35<00:00, 11.10it/s, acc=0.476, xentropy=1.924]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.468


Epoch 24: 100%|██████████| 391/391 [00:36<00:00, 12.14it/s, acc=0.477, xentropy=1.915]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.407


Epoch 25: 100%|██████████| 391/391 [00:36<00:00, 10.86it/s, acc=0.479, xentropy=1.908]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.410


Epoch 26: 100%|██████████| 391/391 [00:35<00:00, 10.91it/s, acc=0.481, xentropy=1.894]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.430


Epoch 27: 100%|██████████| 391/391 [00:35<00:00, 10.89it/s, acc=0.480, xentropy=1.900]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.476


Epoch 28: 100%|██████████| 391/391 [00:35<00:00, 10.96it/s, acc=0.480, xentropy=1.892]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.479


Epoch 29: 100%|██████████| 391/391 [00:35<00:00, 10.94it/s, acc=0.482, xentropy=1.886]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.442


Epoch 30: 100%|██████████| 391/391 [00:35<00:00, 12.31it/s, acc=0.485, xentropy=1.880]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.472


Epoch 31: 100%|██████████| 391/391 [00:35<00:00, 10.89it/s, acc=0.486, xentropy=1.876]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.386


Epoch 32: 100%|██████████| 391/391 [00:34<00:00, 12.48it/s, acc=0.487, xentropy=1.870]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.450


Epoch 33: 100%|██████████| 391/391 [00:34<00:00, 12.30it/s, acc=0.490, xentropy=1.864]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.401


Epoch 34: 100%|██████████| 391/391 [00:34<00:00, 11.33it/s, acc=0.493, xentropy=1.858]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.456


Epoch 35: 100%|██████████| 391/391 [00:34<00:00, 11.34it/s, acc=0.488, xentropy=1.859]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.479


Epoch 36: 100%|██████████| 391/391 [00:34<00:00, 11.24it/s, acc=0.492, xentropy=1.851]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.453


Epoch 37: 100%|██████████| 391/391 [00:34<00:00, 11.24it/s, acc=0.488, xentropy=1.859]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.465


Epoch 38: 100%|██████████| 391/391 [00:35<00:00, 12.59it/s, acc=0.492, xentropy=1.842]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.423


Epoch 39: 100%|██████████| 391/391 [00:35<00:00, 11.17it/s, acc=0.494, xentropy=1.841]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.463


Epoch 40: 100%|██████████| 391/391 [00:34<00:00, 11.24it/s, acc=0.496, xentropy=1.839]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.460


Epoch 41: 100%|██████████| 391/391 [00:35<00:00, 11.15it/s, acc=0.498, xentropy=1.833]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.478


Epoch 42: 100%|██████████| 391/391 [00:34<00:00, 12.32it/s, acc=0.495, xentropy=1.835]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.434


Epoch 43: 100%|██████████| 391/391 [00:35<00:00, 11.15it/s, acc=0.501, xentropy=1.825]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.472


Epoch 44: 100%|██████████| 391/391 [00:34<00:00, 12.44it/s, acc=0.499, xentropy=1.830]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.487


Epoch 45: 100%|██████████| 391/391 [00:34<00:00, 11.29it/s, acc=0.498, xentropy=1.825]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.478


Epoch 46: 100%|██████████| 391/391 [00:34<00:00, 12.35it/s, acc=0.498, xentropy=1.818]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.466


Epoch 47: 100%|██████████| 391/391 [00:35<00:00, 12.42it/s, acc=0.495, xentropy=1.842]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.473


Epoch 48: 100%|██████████| 391/391 [00:34<00:00, 11.29it/s, acc=0.500, xentropy=1.822]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.434


Epoch 49: 100%|██████████| 391/391 [00:34<00:00, 11.22it/s, acc=0.501, xentropy=1.814]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.482


Epoch 50: 100%|██████████| 391/391 [00:35<00:00, 11.15it/s, acc=0.500, xentropy=1.816]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.495


Epoch 51: 100%|██████████| 391/391 [00:34<00:00, 12.48it/s, acc=0.503, xentropy=1.812]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.490


Epoch 52: 100%|██████████| 391/391 [00:34<00:00, 11.28it/s, acc=0.502, xentropy=1.812]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.481


Epoch 53: 100%|██████████| 391/391 [00:34<00:00, 12.46it/s, acc=0.504, xentropy=1.801]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.460


Epoch 54: 100%|██████████| 391/391 [00:35<00:00, 12.22it/s, acc=0.504, xentropy=1.810]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.487


Epoch 55: 100%|██████████| 391/391 [00:35<00:00, 10.98it/s, acc=0.502, xentropy=1.804]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.443


Epoch 56: 100%|██████████| 391/391 [00:35<00:00, 12.10it/s, acc=0.503, xentropy=1.805]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.438


Epoch 57: 100%|██████████| 391/391 [00:35<00:00, 10.86it/s, acc=0.507, xentropy=1.794]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.455


Epoch 58: 100%|██████████| 391/391 [00:35<00:00, 10.90it/s, acc=0.505, xentropy=1.797]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.434


Epoch 59: 100%|██████████| 391/391 [00:36<00:00, 11.94it/s, acc=0.504, xentropy=1.802]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.478


Epoch 60: 100%|██████████| 391/391 [00:35<00:00, 12.09it/s, acc=0.506, xentropy=1.801]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.484


Epoch 61: 100%|██████████| 391/391 [00:35<00:00, 10.88it/s, acc=0.591, xentropy=1.455]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.621


Epoch 62: 100%|██████████| 391/391 [00:35<00:00, 12.60it/s, acc=0.614, xentropy=1.364]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.619


Epoch 63: 100%|██████████| 391/391 [00:34<00:00, 12.44it/s, acc=0.622, xentropy=1.334]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.624


Epoch 64: 100%|██████████| 391/391 [00:34<00:00, 11.28it/s, acc=0.625, xentropy=1.316]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.622


Epoch 65: 100%|██████████| 391/391 [00:34<00:00, 12.78it/s, acc=0.627, xentropy=1.315]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.632


Epoch 66: 100%|██████████| 391/391 [00:34<00:00, 11.96it/s, acc=0.626, xentropy=1.306]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.622


Epoch 67: 100%|██████████| 391/391 [00:34<00:00, 11.23it/s, acc=0.626, xentropy=1.304]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.628


Epoch 68: 100%|██████████| 391/391 [00:34<00:00, 11.28it/s, acc=0.624, xentropy=1.304]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.621


Epoch 69: 100%|██████████| 391/391 [00:35<00:00, 11.10it/s, acc=0.628, xentropy=1.302]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.611


Epoch 70: 100%|██████████| 391/391 [00:35<00:00, 10.92it/s, acc=0.629, xentropy=1.300]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.615


Epoch 71: 100%|██████████| 391/391 [00:36<00:00, 10.86it/s, acc=0.628, xentropy=1.295]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.624


Epoch 72: 100%|██████████| 391/391 [00:35<00:00, 10.92it/s, acc=0.627, xentropy=1.303]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.602


Epoch 73: 100%|██████████| 391/391 [00:35<00:00, 11.91it/s, acc=0.628, xentropy=1.302]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.607


Epoch 74: 100%|██████████| 391/391 [00:36<00:00, 12.00it/s, acc=0.629, xentropy=1.300]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.607


Epoch 75: 100%|██████████| 391/391 [00:35<00:00, 12.39it/s, acc=0.626, xentropy=1.310]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.603


Epoch 76: 100%|██████████| 391/391 [00:36<00:00, 10.78it/s, acc=0.628, xentropy=1.301]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.593


Epoch 77: 100%|██████████| 391/391 [00:35<00:00, 12.46it/s, acc=0.628, xentropy=1.294]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.571


Epoch 78: 100%|██████████| 391/391 [00:34<00:00, 12.47it/s, acc=0.624, xentropy=1.310]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.623


Epoch 79: 100%|██████████| 391/391 [00:34<00:00, 11.22it/s, acc=0.628, xentropy=1.302]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.585


Epoch 80: 100%|██████████| 391/391 [00:34<00:00, 12.51it/s, acc=0.625, xentropy=1.308]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.622


Epoch 81: 100%|██████████| 391/391 [00:34<00:00, 12.27it/s, acc=0.630, xentropy=1.307]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.627


Epoch 82: 100%|██████████| 391/391 [00:34<00:00, 11.28it/s, acc=0.630, xentropy=1.297]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.590


Epoch 83: 100%|██████████| 391/391 [00:34<00:00, 11.33it/s, acc=0.628, xentropy=1.293]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.598


Epoch 84: 100%|██████████| 391/391 [00:34<00:00, 11.27it/s, acc=0.628, xentropy=1.299]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.600


Epoch 85: 100%|██████████| 391/391 [00:34<00:00, 11.37it/s, acc=0.630, xentropy=1.294]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.602


Epoch 86: 100%|██████████| 391/391 [00:34<00:00, 12.59it/s, acc=0.631, xentropy=1.300]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.609


Epoch 87: 100%|██████████| 391/391 [00:34<00:00, 11.22it/s, acc=0.630, xentropy=1.288]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.607


Epoch 88: 100%|██████████| 391/391 [00:34<00:00, 12.84it/s, acc=0.631, xentropy=1.291]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.599


Epoch 89: 100%|██████████| 391/391 [00:34<00:00, 11.34it/s, acc=0.631, xentropy=1.292]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.586


Epoch 90: 100%|██████████| 391/391 [00:34<00:00, 12.43it/s, acc=0.630, xentropy=1.291]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.592


Epoch 91: 100%|██████████| 391/391 [00:34<00:00, 12.63it/s, acc=0.629, xentropy=1.295]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.607


Epoch 92: 100%|██████████| 391/391 [00:34<00:00, 11.32it/s, acc=0.630, xentropy=1.286]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.609


Epoch 93: 100%|██████████| 391/391 [00:34<00:00, 11.42it/s, acc=0.632, xentropy=1.281]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.624


Epoch 94: 100%|██████████| 391/391 [00:34<00:00, 12.86it/s, acc=0.633, xentropy=1.285]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.577


Epoch 95: 100%|██████████| 391/391 [00:34<00:00, 12.76it/s, acc=0.634, xentropy=1.279]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.611


Epoch 96: 100%|██████████| 391/391 [00:34<00:00, 12.93it/s, acc=0.632, xentropy=1.283]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.610


Epoch 97: 100%|██████████| 391/391 [00:34<00:00, 12.58it/s, acc=0.635, xentropy=1.276]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.598


Epoch 98: 100%|██████████| 391/391 [00:34<00:00, 12.90it/s, acc=0.634, xentropy=1.276]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.606


Epoch 99: 100%|██████████| 391/391 [00:34<00:00, 11.48it/s, acc=0.636, xentropy=1.268]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.608


Epoch 100: 100%|██████████| 391/391 [00:34<00:00, 11.40it/s, acc=0.633, xentropy=1.280]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.594


Epoch 101: 100%|██████████| 391/391 [00:34<00:00, 12.82it/s, acc=0.638, xentropy=1.268]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.611


Epoch 102: 100%|██████████| 391/391 [00:34<00:00, 11.44it/s, acc=0.640, xentropy=1.260]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.608


Epoch 103: 100%|██████████| 391/391 [00:34<00:00, 11.47it/s, acc=0.637, xentropy=1.266]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.616


Epoch 104: 100%|██████████| 391/391 [00:34<00:00, 11.39it/s, acc=0.633, xentropy=1.287]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.625


Epoch 105: 100%|██████████| 391/391 [00:34<00:00, 12.27it/s, acc=0.637, xentropy=1.268]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.616


Epoch 106: 100%|██████████| 391/391 [00:34<00:00, 12.62it/s, acc=0.642, xentropy=1.258]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.606


Epoch 107: 100%|██████████| 391/391 [00:34<00:00, 12.86it/s, acc=0.636, xentropy=1.263]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.608


Epoch 108: 100%|██████████| 391/391 [00:34<00:00, 11.42it/s, acc=0.635, xentropy=1.265]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.613


Epoch 109: 100%|██████████| 391/391 [00:34<00:00, 11.46it/s, acc=0.640, xentropy=1.254]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.620


Epoch 110: 100%|██████████| 391/391 [00:34<00:00, 11.42it/s, acc=0.638, xentropy=1.263]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.594


Epoch 111: 100%|██████████| 391/391 [00:33<00:00, 12.47it/s, acc=0.640, xentropy=1.258]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.622


Epoch 112: 100%|██████████| 391/391 [00:33<00:00, 12.14it/s, acc=0.639, xentropy=1.258]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.567


Epoch 113: 100%|██████████| 391/391 [00:33<00:00, 11.50it/s, acc=0.641, xentropy=1.254]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.591


Epoch 114: 100%|██████████| 391/391 [00:34<00:00, 11.47it/s, acc=0.640, xentropy=1.262]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.605


Epoch 115: 100%|██████████| 391/391 [00:33<00:00, 11.53it/s, acc=0.638, xentropy=1.254]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.563


Epoch 116: 100%|██████████| 391/391 [00:34<00:00, 11.48it/s, acc=0.641, xentropy=1.250]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.602


Epoch 117: 100%|██████████| 391/391 [00:33<00:00, 12.69it/s, acc=0.639, xentropy=1.252]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.629


Epoch 118: 100%|██████████| 391/391 [00:33<00:00, 11.52it/s, acc=0.640, xentropy=1.252]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.618


Epoch 119: 100%|██████████| 391/391 [00:33<00:00, 11.57it/s, acc=0.642, xentropy=1.248]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.607


Epoch 120: 100%|██████████| 391/391 [00:34<00:00, 11.47it/s, acc=0.645, xentropy=1.240]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.604


Epoch 121: 100%|██████████| 391/391 [00:34<00:00, 11.45it/s, acc=0.696, xentropy=1.054]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.689


Epoch 122: 100%|██████████| 391/391 [00:33<00:00, 12.70it/s, acc=0.713, xentropy=0.987]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.692


Epoch 123: 100%|██████████| 391/391 [00:34<00:00, 12.33it/s, acc=0.715, xentropy=0.973]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.689


Epoch 124: 100%|██████████| 391/391 [00:33<00:00, 11.52it/s, acc=0.721, xentropy=0.960]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.683


Epoch 125: 100%|██████████| 391/391 [00:33<00:00, 12.44it/s, acc=0.722, xentropy=0.956]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.688


Epoch 126: 100%|██████████| 391/391 [00:34<00:00, 11.43it/s, acc=0.723, xentropy=0.947]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.700


Epoch 127: 100%|██████████| 391/391 [00:33<00:00, 11.54it/s, acc=0.726, xentropy=0.942]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.693


Epoch 128: 100%|██████████| 391/391 [00:33<00:00, 11.53it/s, acc=0.726, xentropy=0.938]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.693


Epoch 129: 100%|██████████| 391/391 [00:34<00:00, 11.48it/s, acc=0.728, xentropy=0.930]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.692


Epoch 130: 100%|██████████| 391/391 [00:34<00:00, 11.49it/s, acc=0.730, xentropy=0.925]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.696


Epoch 131: 100%|██████████| 391/391 [00:34<00:00, 11.47it/s, acc=0.731, xentropy=0.921]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.698


Epoch 132: 100%|██████████| 391/391 [00:33<00:00, 11.50it/s, acc=0.735, xentropy=0.915]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.694


Epoch 133: 100%|██████████| 391/391 [00:33<00:00, 11.54it/s, acc=0.731, xentropy=0.916]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.699


Epoch 134: 100%|██████████| 391/391 [00:33<00:00, 11.51it/s, acc=0.734, xentropy=0.907]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.688


Epoch 135: 100%|██████████| 391/391 [00:34<00:00, 11.46it/s, acc=0.733, xentropy=0.911]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.692


Epoch 136: 100%|██████████| 391/391 [00:33<00:00, 11.54it/s, acc=0.733, xentropy=0.910]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.691


Epoch 137: 100%|██████████| 391/391 [00:33<00:00, 11.51it/s, acc=0.737, xentropy=0.903]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.689


Epoch 138: 100%|██████████| 391/391 [00:33<00:00, 12.30it/s, acc=0.735, xentropy=0.906]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.685


Epoch 139: 100%|██████████| 391/391 [00:33<00:00, 12.59it/s, acc=0.734, xentropy=0.908]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.684


Epoch 140: 100%|██████████| 391/391 [00:33<00:00, 11.50it/s, acc=0.735, xentropy=0.903]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.687


Epoch 141: 100%|██████████| 391/391 [00:33<00:00, 12.58it/s, acc=0.735, xentropy=0.900]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.687


Epoch 142: 100%|██████████| 391/391 [00:34<00:00, 12.54it/s, acc=0.741, xentropy=0.893]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.680


Epoch 143: 100%|██████████| 391/391 [00:34<00:00, 12.41it/s, acc=0.735, xentropy=0.898]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.693


Epoch 144: 100%|██████████| 391/391 [00:34<00:00, 12.49it/s, acc=0.737, xentropy=0.897]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.682


Epoch 145: 100%|██████████| 391/391 [00:34<00:00, 11.49it/s, acc=0.734, xentropy=0.899]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.685


Epoch 146: 100%|██████████| 391/391 [00:34<00:00, 11.44it/s, acc=0.735, xentropy=0.900]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.692


Epoch 147: 100%|██████████| 391/391 [00:34<00:00, 12.93it/s, acc=0.742, xentropy=0.893]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.682


Epoch 148: 100%|██████████| 391/391 [00:33<00:00, 11.55it/s, acc=0.738, xentropy=0.896]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.682


Epoch 149: 100%|██████████| 391/391 [00:34<00:00, 12.43it/s, acc=0.736, xentropy=0.897]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.687


Epoch 150: 100%|██████████| 391/391 [00:34<00:00, 11.38it/s, acc=0.738, xentropy=0.887]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.685


Epoch 151: 100%|██████████| 391/391 [00:34<00:00, 11.46it/s, acc=0.741, xentropy=0.890]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.687


Epoch 152: 100%|██████████| 391/391 [00:34<00:00, 12.39it/s, acc=0.738, xentropy=0.891]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.689


Epoch 153: 100%|██████████| 391/391 [00:34<00:00, 11.42it/s, acc=0.740, xentropy=0.886]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.674


Epoch 154: 100%|██████████| 391/391 [00:34<00:00, 11.39it/s, acc=0.738, xentropy=0.891]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.691


Epoch 155: 100%|██████████| 391/391 [00:34<00:00, 11.48it/s, acc=0.737, xentropy=0.895]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.689


Epoch 156: 100%|██████████| 391/391 [00:33<00:00, 12.88it/s, acc=0.739, xentropy=0.892]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.686


Epoch 157: 100%|██████████| 391/391 [00:34<00:00, 12.40it/s, acc=0.738, xentropy=0.889]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.693


Epoch 158: 100%|██████████| 391/391 [00:33<00:00, 11.51it/s, acc=0.737, xentropy=0.893]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.687


Epoch 159: 100%|██████████| 391/391 [00:34<00:00, 11.48it/s, acc=0.738, xentropy=0.892]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.690


Epoch 160: 100%|██████████| 391/391 [00:34<00:00, 11.46it/s, acc=0.738, xentropy=0.889]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.684


Epoch 161: 100%|██████████| 391/391 [00:33<00:00, 11.51it/s, acc=0.762, xentropy=0.808]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.708


Epoch 162: 100%|██████████| 391/391 [00:34<00:00, 11.49it/s, acc=0.768, xentropy=0.789]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.710


Epoch 163: 100%|██████████| 391/391 [00:34<00:00, 12.71it/s, acc=0.770, xentropy=0.780]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.706


Epoch 164: 100%|██████████| 391/391 [00:34<00:00, 12.71it/s, acc=0.772, xentropy=0.773]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.709


Epoch 165: 100%|██████████| 391/391 [00:33<00:00, 11.56it/s, acc=0.774, xentropy=0.765]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.711


Epoch 166: 100%|██████████| 391/391 [00:34<00:00, 11.45it/s, acc=0.778, xentropy=0.760]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.713


Epoch 167: 100%|██████████| 391/391 [00:34<00:00, 11.39it/s, acc=0.776, xentropy=0.764]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.711


Epoch 168: 100%|██████████| 391/391 [00:34<00:00, 12.72it/s, acc=0.778, xentropy=0.760]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.712


Epoch 169: 100%|██████████| 391/391 [00:34<00:00, 11.46it/s, acc=0.775, xentropy=0.757]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.711


Epoch 170: 100%|██████████| 391/391 [00:33<00:00, 11.50it/s, acc=0.778, xentropy=0.753]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.713


Epoch 171: 100%|██████████| 391/391 [00:33<00:00, 13.10it/s, acc=0.776, xentropy=0.753]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.710


Epoch 172: 100%|██████████| 391/391 [00:33<00:00, 11.53it/s, acc=0.779, xentropy=0.751]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.711


Epoch 173: 100%|██████████| 391/391 [00:34<00:00, 12.66it/s, acc=0.778, xentropy=0.753]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.707


Epoch 174: 100%|██████████| 391/391 [00:34<00:00, 12.61it/s, acc=0.780, xentropy=0.751]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.711


Epoch 175: 100%|██████████| 391/391 [00:34<00:00, 11.50it/s, acc=0.781, xentropy=0.746]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.710


Epoch 176: 100%|██████████| 391/391 [00:34<00:00, 12.82it/s, acc=0.781, xentropy=0.747]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.711


Epoch 177: 100%|██████████| 391/391 [00:34<00:00, 11.33it/s, acc=0.782, xentropy=0.738]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.711


Epoch 178: 100%|██████████| 391/391 [00:34<00:00, 11.34it/s, acc=0.782, xentropy=0.740]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.710


Epoch 179: 100%|██████████| 391/391 [00:34<00:00, 11.39it/s, acc=0.780, xentropy=0.742]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.709


Epoch 180: 100%|██████████| 391/391 [00:34<00:00, 12.64it/s, acc=0.781, xentropy=0.742]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.710


Epoch 181: 100%|██████████| 391/391 [00:34<00:00, 11.31it/s, acc=0.782, xentropy=0.739]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.709


Epoch 182: 100%|██████████| 391/391 [00:34<00:00, 11.26it/s, acc=0.780, xentropy=0.743]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.710


Epoch 183: 100%|██████████| 391/391 [00:34<00:00, 11.45it/s, acc=0.783, xentropy=0.741]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.713


Epoch 184: 100%|██████████| 391/391 [00:34<00:00, 12.32it/s, acc=0.784, xentropy=0.738]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.709


Epoch 185: 100%|██████████| 391/391 [00:34<00:00, 11.33it/s, acc=0.786, xentropy=0.733]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.709


Epoch 186: 100%|██████████| 391/391 [00:34<00:00, 12.85it/s, acc=0.783, xentropy=0.732]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.712


Epoch 187: 100%|██████████| 391/391 [00:34<00:00, 11.33it/s, acc=0.788, xentropy=0.724]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.710


Epoch 188: 100%|██████████| 391/391 [00:34<00:00, 12.69it/s, acc=0.782, xentropy=0.735]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.712


Epoch 189: 100%|██████████| 391/391 [00:34<00:00, 11.29it/s, acc=0.787, xentropy=0.729]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.711


Epoch 190: 100%|██████████| 391/391 [00:34<00:00, 12.87it/s, acc=0.785, xentropy=0.729]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.712


Epoch 191: 100%|██████████| 391/391 [00:34<00:00, 11.29it/s, acc=0.783, xentropy=0.732]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.709


Epoch 192: 100%|██████████| 391/391 [00:34<00:00, 11.27it/s, acc=0.783, xentropy=0.731]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.708


Epoch 193: 100%|██████████| 391/391 [00:34<00:00, 12.55it/s, acc=0.787, xentropy=0.721]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.712


Epoch 194: 100%|██████████| 391/391 [00:34<00:00, 12.80it/s, acc=0.786, xentropy=0.728]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.711


Epoch 195: 100%|██████████| 391/391 [00:34<00:00, 11.35it/s, acc=0.787, xentropy=0.724]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.709


Epoch 196: 100%|██████████| 391/391 [00:34<00:00, 11.31it/s, acc=0.785, xentropy=0.730]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.706


Epoch 197: 100%|██████████| 391/391 [00:34<00:00, 12.49it/s, acc=0.785, xentropy=0.722]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.712


Epoch 198: 100%|██████████| 391/391 [00:34<00:00, 12.30it/s, acc=0.787, xentropy=0.726]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.704


Epoch 199: 100%|██████████| 391/391 [00:34<00:00, 12.46it/s, acc=0.786, xentropy=0.721]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.711


Epoch 200: 100%|██████████| 391/391 [00:34<00:00, 11.25it/s, acc=0.789, xentropy=0.722]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.711


Epoch 201: 100%|██████████| 391/391 [00:34<00:00, 11.27it/s, acc=0.794, xentropy=0.699]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.714


Epoch 202: 100%|██████████| 391/391 [00:34<00:00, 11.20it/s, acc=0.794, xentropy=0.699]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.715


Epoch 203: 100%|██████████| 391/391 [00:34<00:00, 12.31it/s, acc=0.795, xentropy=0.697]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.716


Epoch 204: 100%|██████████| 391/391 [00:34<00:00, 11.27it/s, acc=0.796, xentropy=0.691]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.714


Epoch 205: 100%|██████████| 391/391 [00:34<00:00, 12.35it/s, acc=0.796, xentropy=0.694]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.714


Epoch 206: 100%|██████████| 391/391 [00:34<00:00, 11.25it/s, acc=0.797, xentropy=0.689]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.713


Epoch 207: 100%|██████████| 391/391 [00:34<00:00, 12.36it/s, acc=0.797, xentropy=0.693]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.716


Epoch 208: 100%|██████████| 391/391 [00:34<00:00, 11.32it/s, acc=0.799, xentropy=0.683]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.716


Epoch 209: 100%|██████████| 391/391 [00:34<00:00, 11.27it/s, acc=0.798, xentropy=0.684]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.715


Epoch 210: 100%|██████████| 391/391 [00:34<00:00, 12.24it/s, acc=0.798, xentropy=0.684]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.717


Epoch 211: 100%|██████████| 391/391 [00:35<00:00, 11.17it/s, acc=0.797, xentropy=0.687]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.715


Epoch 212: 100%|██████████| 391/391 [00:34<00:00, 12.63it/s, acc=0.799, xentropy=0.685]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.715


Epoch 213: 100%|██████████| 391/391 [00:34<00:00, 11.20it/s, acc=0.796, xentropy=0.693]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.717


Epoch 214: 100%|██████████| 391/391 [00:34<00:00, 11.25it/s, acc=0.799, xentropy=0.686]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.717


Epoch 215: 100%|██████████| 391/391 [00:34<00:00, 11.26it/s, acc=0.800, xentropy=0.681]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.715


Epoch 216: 100%|██████████| 391/391 [00:34<00:00, 12.49it/s, acc=0.801, xentropy=0.682]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.716


Epoch 217: 100%|██████████| 391/391 [00:34<00:00, 11.34it/s, acc=0.798, xentropy=0.684]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.716


Epoch 218: 100%|██████████| 391/391 [00:34<00:00, 12.50it/s, acc=0.800, xentropy=0.683]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.714


Epoch 219: 100%|██████████| 391/391 [00:34<00:00, 12.68it/s, acc=0.798, xentropy=0.689]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.716


Epoch 220: 100%|██████████| 391/391 [00:34<00:00, 11.25it/s, acc=0.798, xentropy=0.682]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.715


Epoch 221: 100%|██████████| 391/391 [00:34<00:00, 11.20it/s, acc=0.801, xentropy=0.679]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.715


Epoch 222: 100%|██████████| 391/391 [00:34<00:00, 11.26it/s, acc=0.800, xentropy=0.683]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.715


Epoch 223: 100%|██████████| 391/391 [00:34<00:00, 11.28it/s, acc=0.802, xentropy=0.675]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.714


Epoch 224: 100%|██████████| 391/391 [00:34<00:00, 12.51it/s, acc=0.800, xentropy=0.684]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.714


Epoch 225: 100%|██████████| 391/391 [00:34<00:00, 11.27it/s, acc=0.800, xentropy=0.683]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.713


Epoch 226: 100%|██████████| 391/391 [00:34<00:00, 11.23it/s, acc=0.801, xentropy=0.681]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.714


Epoch 227: 100%|██████████| 391/391 [00:34<00:00, 11.21it/s, acc=0.801, xentropy=0.678]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.715


Epoch 228: 100%|██████████| 391/391 [00:34<00:00, 11.22it/s, acc=0.799, xentropy=0.686]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.713


Epoch 229: 100%|██████████| 391/391 [00:34<00:00, 11.30it/s, acc=0.799, xentropy=0.680]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.716


Epoch 230: 100%|██████████| 391/391 [00:34<00:00, 11.28it/s, acc=0.796, xentropy=0.685]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.715


Epoch 231: 100%|██████████| 391/391 [00:34<00:00, 11.32it/s, acc=0.802, xentropy=0.680]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.716


Epoch 232: 100%|██████████| 391/391 [00:34<00:00, 11.35it/s, acc=0.800, xentropy=0.678]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.716


Epoch 233: 100%|██████████| 391/391 [00:34<00:00, 12.37it/s, acc=0.800, xentropy=0.680]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.717


Epoch 234: 100%|██████████| 391/391 [00:34<00:00, 11.25it/s, acc=0.804, xentropy=0.675]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.715


Epoch 235: 100%|██████████| 391/391 [00:34<00:00, 11.23it/s, acc=0.800, xentropy=0.683]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.716


Epoch 236: 100%|██████████| 391/391 [00:34<00:00, 12.44it/s, acc=0.801, xentropy=0.677]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.713


Epoch 237: 100%|██████████| 391/391 [00:34<00:00, 12.45it/s, acc=0.802, xentropy=0.675]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.714


Epoch 238: 100%|██████████| 391/391 [00:34<00:00, 12.42it/s, acc=0.800, xentropy=0.683]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.714


Epoch 239: 100%|██████████| 391/391 [00:34<00:00, 11.37it/s, acc=0.800, xentropy=0.676]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.713


Epoch 240: 100%|██████████| 391/391 [00:34<00:00, 12.27it/s, acc=0.798, xentropy=0.683]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.713


Epoch 241: 100%|██████████| 391/391 [00:34<00:00, 12.89it/s, acc=0.802, xentropy=0.672]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.715


Epoch 242: 100%|██████████| 391/391 [00:34<00:00, 12.53it/s, acc=0.806, xentropy=0.664]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.715


Epoch 243: 100%|██████████| 391/391 [00:34<00:00, 11.20it/s, acc=0.802, xentropy=0.673]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.713


Epoch 244: 100%|██████████| 391/391 [00:34<00:00, 12.44it/s, acc=0.802, xentropy=0.675]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.714


Epoch 245: 100%|██████████| 391/391 [00:34<00:00, 11.30it/s, acc=0.803, xentropy=0.670]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.715


Epoch 246: 100%|██████████| 391/391 [00:34<00:00, 11.19it/s, acc=0.803, xentropy=0.670]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.715


Epoch 247: 100%|██████████| 391/391 [00:34<00:00, 11.25it/s, acc=0.801, xentropy=0.673]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.714


Epoch 248: 100%|██████████| 391/391 [00:34<00:00, 12.34it/s, acc=0.801, xentropy=0.669]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.714


Epoch 249: 100%|██████████| 391/391 [00:34<00:00, 12.54it/s, acc=0.802, xentropy=0.673]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.715


Epoch 250: 100%|██████████| 391/391 [00:34<00:00, 12.05it/s, acc=0.800, xentropy=0.678]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.715


Epoch 251: 100%|██████████| 391/391 [00:34<00:00, 11.33it/s, acc=0.805, xentropy=0.667]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.715


Epoch 252: 100%|██████████| 391/391 [00:34<00:00, 11.19it/s, acc=0.802, xentropy=0.669]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.713


Epoch 253: 100%|██████████| 391/391 [00:34<00:00, 12.16it/s, acc=0.803, xentropy=0.668]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.715


Epoch 254: 100%|██████████| 391/391 [00:34<00:00, 11.24it/s, acc=0.801, xentropy=0.670]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.715


Epoch 255: 100%|██████████| 391/391 [00:34<00:00, 12.52it/s, acc=0.804, xentropy=0.668]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.715


Epoch 256: 100%|██████████| 391/391 [00:34<00:00, 11.23it/s, acc=0.802, xentropy=0.675]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.711


Epoch 257: 100%|██████████| 391/391 [00:34<00:00, 12.78it/s, acc=0.803, xentropy=0.672]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.716


Epoch 258: 100%|██████████| 391/391 [00:34<00:00, 11.28it/s, acc=0.804, xentropy=0.666]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.713


Epoch 259: 100%|██████████| 391/391 [00:35<00:00, 11.16it/s, acc=0.802, xentropy=0.677]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.715


Epoch 260: 100%|██████████| 391/391 [00:35<00:00, 11.16it/s, acc=0.803, xentropy=0.671]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.714


Epoch 261: 100%|██████████| 391/391 [00:34<00:00, 12.36it/s, acc=0.804, xentropy=0.670]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.714


Epoch 262: 100%|██████████| 391/391 [00:34<00:00, 13.04it/s, acc=0.802, xentropy=0.671]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.714


Epoch 263: 100%|██████████| 391/391 [00:34<00:00, 12.55it/s, acc=0.802, xentropy=0.672]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.715


Epoch 264: 100%|██████████| 391/391 [00:34<00:00, 11.23it/s, acc=0.802, xentropy=0.672]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.716


Epoch 265: 100%|██████████| 391/391 [00:35<00:00, 11.17it/s, acc=0.804, xentropy=0.670]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.714


Epoch 266: 100%|██████████| 391/391 [00:35<00:00, 11.09it/s, acc=0.801, xentropy=0.674]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.715


Epoch 267: 100%|██████████| 391/391 [00:34<00:00, 11.27it/s, acc=0.803, xentropy=0.669]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.714


Epoch 268: 100%|██████████| 391/391 [00:34<00:00, 11.25it/s, acc=0.805, xentropy=0.666]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.714


Epoch 269: 100%|██████████| 391/391 [00:34<00:00, 12.52it/s, acc=0.803, xentropy=0.667]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.715


Epoch 270: 100%|██████████| 391/391 [00:34<00:00, 12.11it/s, acc=0.803, xentropy=0.668]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.714


Epoch 271: 100%|██████████| 391/391 [00:34<00:00, 11.20it/s, acc=0.799, xentropy=0.675]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.715


Epoch 272: 100%|██████████| 391/391 [00:34<00:00, 12.62it/s, acc=0.799, xentropy=0.677]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.712


Epoch 273: 100%|██████████| 391/391 [00:35<00:00, 11.15it/s, acc=0.804, xentropy=0.667]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.713


Epoch 274: 100%|██████████| 391/391 [00:35<00:00, 12.53it/s, acc=0.802, xentropy=0.669]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.716


Epoch 275: 100%|██████████| 391/391 [00:35<00:00, 12.43it/s, acc=0.803, xentropy=0.666]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.715


Epoch 276: 100%|██████████| 391/391 [00:34<00:00, 12.29it/s, acc=0.802, xentropy=0.671]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.714


Epoch 277: 100%|██████████| 391/391 [00:34<00:00, 11.18it/s, acc=0.805, xentropy=0.667]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.714


Epoch 278: 100%|██████████| 391/391 [00:34<00:00, 11.25it/s, acc=0.804, xentropy=0.675]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.715


Epoch 279: 100%|██████████| 391/391 [00:34<00:00, 11.29it/s, acc=0.803, xentropy=0.668]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.715


Epoch 280: 100%|██████████| 391/391 [00:34<00:00, 12.61it/s, acc=0.804, xentropy=0.668]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.714


Epoch 281: 100%|██████████| 391/391 [00:34<00:00, 12.44it/s, acc=0.804, xentropy=0.664]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.716


Epoch 282: 100%|██████████| 391/391 [00:34<00:00, 12.63it/s, acc=0.805, xentropy=0.668]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.715


Epoch 283: 100%|██████████| 391/391 [00:34<00:00, 11.30it/s, acc=0.804, xentropy=0.664]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.714


Epoch 284: 100%|██████████| 391/391 [00:34<00:00, 11.21it/s, acc=0.802, xentropy=0.674]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.714


Epoch 285: 100%|██████████| 391/391 [00:34<00:00, 12.41it/s, acc=0.801, xentropy=0.667]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.714


Epoch 286: 100%|██████████| 391/391 [00:34<00:00, 12.22it/s, acc=0.804, xentropy=0.668]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.714


Epoch 287: 100%|██████████| 391/391 [00:34<00:00, 11.26it/s, acc=0.804, xentropy=0.666]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.714


Epoch 288: 100%|██████████| 391/391 [00:34<00:00, 11.22it/s, acc=0.805, xentropy=0.667]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.716


Epoch 289: 100%|██████████| 391/391 [00:35<00:00, 12.44it/s, acc=0.801, xentropy=0.673]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.714


Epoch 290: 100%|██████████| 391/391 [00:34<00:00, 11.17it/s, acc=0.802, xentropy=0.666]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.715


Epoch 291: 100%|██████████| 391/391 [00:34<00:00, 12.66it/s, acc=0.804, xentropy=0.670]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.713


Epoch 292: 100%|██████████| 391/391 [00:35<00:00, 11.17it/s, acc=0.805, xentropy=0.667]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.716


Epoch 293: 100%|██████████| 391/391 [00:35<00:00, 11.17it/s, acc=0.803, xentropy=0.665]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.714


Epoch 294: 100%|██████████| 391/391 [00:34<00:00, 12.59it/s, acc=0.805, xentropy=0.666]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.715


Epoch 295: 100%|██████████| 391/391 [00:34<00:00, 11.20it/s, acc=0.802, xentropy=0.667]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.716


Epoch 296: 100%|██████████| 391/391 [00:34<00:00, 12.43it/s, acc=0.802, xentropy=0.675]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.714


Epoch 297: 100%|██████████| 391/391 [00:34<00:00, 11.27it/s, acc=0.804, xentropy=0.667]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.714


Epoch 298: 100%|██████████| 391/391 [00:34<00:00, 11.28it/s, acc=0.805, xentropy=0.667]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.715


Epoch 299: 100%|██████████| 391/391 [00:34<00:00, 12.72it/s, acc=0.805, xentropy=0.665]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.715


Epoch 300: 100%|██████████| 391/391 [00:34<00:00, 12.44it/s, acc=0.804, xentropy=0.668]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.713


Epoch 301: 100%|██████████| 391/391 [00:34<00:00, 11.19it/s, acc=0.803, xentropy=0.668]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.714


Epoch 302: 100%|██████████| 391/391 [00:34<00:00, 11.31it/s, acc=0.807, xentropy=0.662]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.715


Epoch 303: 100%|██████████| 391/391 [00:34<00:00, 11.26it/s, acc=0.804, xentropy=0.671]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.716


Epoch 304: 100%|██████████| 391/391 [00:34<00:00, 11.29it/s, acc=0.806, xentropy=0.663]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.714


Epoch 305: 100%|██████████| 391/391 [00:34<00:00, 12.24it/s, acc=0.805, xentropy=0.663]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.715


Epoch 306: 100%|██████████| 391/391 [00:34<00:00, 11.24it/s, acc=0.806, xentropy=0.666]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.714


Epoch 307: 100%|██████████| 391/391 [00:34<00:00, 11.26it/s, acc=0.802, xentropy=0.667]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.714


Epoch 308: 100%|██████████| 391/391 [00:34<00:00, 11.34it/s, acc=0.804, xentropy=0.666]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.716


Epoch 309: 100%|██████████| 391/391 [00:34<00:00, 12.39it/s, acc=0.804, xentropy=0.668]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.713


Epoch 310: 100%|██████████| 391/391 [00:34<00:00, 11.27it/s, acc=0.805, xentropy=0.668]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.715


Epoch 311: 100%|██████████| 391/391 [00:34<00:00, 12.79it/s, acc=0.801, xentropy=0.668]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.716


Epoch 312: 100%|██████████| 391/391 [00:34<00:00, 12.44it/s, acc=0.807, xentropy=0.663]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.715


Epoch 313: 100%|██████████| 391/391 [00:34<00:00, 11.28it/s, acc=0.802, xentropy=0.664]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.714


Epoch 314: 100%|██████████| 391/391 [00:34<00:00, 12.25it/s, acc=0.805, xentropy=0.663]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.716


Epoch 315: 100%|██████████| 391/391 [00:34<00:00, 11.25it/s, acc=0.804, xentropy=0.665]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.714


Epoch 316: 100%|██████████| 391/391 [00:34<00:00, 12.50it/s, acc=0.808, xentropy=0.663]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.716


Epoch 317: 100%|██████████| 391/391 [00:34<00:00, 12.55it/s, acc=0.802, xentropy=0.667]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.717


Epoch 318: 100%|██████████| 391/391 [00:34<00:00, 12.28it/s, acc=0.806, xentropy=0.666]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.716


Epoch 319: 100%|██████████| 391/391 [00:34<00:00, 11.25it/s, acc=0.805, xentropy=0.663]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.715


Epoch 320: 100%|██████████| 391/391 [00:34<00:00, 11.19it/s, acc=0.804, xentropy=0.667]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.716


Epoch 321: 100%|██████████| 391/391 [00:34<00:00, 11.22it/s, acc=0.804, xentropy=0.668]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.715


Epoch 322: 100%|██████████| 391/391 [00:34<00:00, 11.24it/s, acc=0.807, xentropy=0.655]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.715


Epoch 323: 100%|██████████| 391/391 [00:34<00:00, 11.23it/s, acc=0.802, xentropy=0.671]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.715


Epoch 324: 100%|██████████| 391/391 [00:34<00:00, 12.68it/s, acc=0.805, xentropy=0.665]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.715


Epoch 325: 100%|██████████| 391/391 [00:34<00:00, 12.70it/s, acc=0.805, xentropy=0.665]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.715


Epoch 326: 100%|██████████| 391/391 [00:34<00:00, 11.28it/s, acc=0.805, xentropy=0.665]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.716


Epoch 327: 100%|██████████| 391/391 [00:34<00:00, 12.73it/s, acc=0.805, xentropy=0.665]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.714


Epoch 328: 100%|██████████| 391/391 [00:34<00:00, 13.20it/s, acc=0.804, xentropy=0.664]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.715


Epoch 329: 100%|██████████| 391/391 [00:34<00:00, 11.29it/s, acc=0.802, xentropy=0.668]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.714


Epoch 330: 100%|██████████| 391/391 [00:35<00:00, 11.16it/s, acc=0.801, xentropy=0.673]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.714


Epoch 331: 100%|██████████| 391/391 [00:34<00:00, 11.31it/s, acc=0.804, xentropy=0.666]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.715


Epoch 332: 100%|██████████| 391/391 [00:34<00:00, 12.46it/s, acc=0.803, xentropy=0.668]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.717


Epoch 333: 100%|██████████| 391/391 [00:34<00:00, 12.18it/s, acc=0.804, xentropy=0.662]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.715


Epoch 334: 100%|██████████| 391/391 [00:34<00:00, 11.26it/s, acc=0.805, xentropy=0.666]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.714


Epoch 335: 100%|██████████| 391/391 [00:34<00:00, 11.25it/s, acc=0.804, xentropy=0.669]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.714


Epoch 336: 100%|██████████| 391/391 [00:34<00:00, 12.46it/s, acc=0.807, xentropy=0.659]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.714


Epoch 337: 100%|██████████| 391/391 [00:34<00:00, 12.43it/s, acc=0.804, xentropy=0.666]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.714


Epoch 338: 100%|██████████| 391/391 [00:34<00:00, 12.56it/s, acc=0.807, xentropy=0.663]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.717


Epoch 339: 100%|██████████| 391/391 [00:34<00:00, 11.27it/s, acc=0.804, xentropy=0.669]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.715


Epoch 340: 100%|██████████| 391/391 [00:34<00:00, 11.30it/s, acc=0.803, xentropy=0.668]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.715


Epoch 341: 100%|██████████| 391/391 [00:34<00:00, 11.34it/s, acc=0.803, xentropy=0.670]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.714


Epoch 342: 100%|██████████| 391/391 [00:34<00:00, 11.19it/s, acc=0.805, xentropy=0.668]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.715


Epoch 343: 100%|██████████| 391/391 [00:34<00:00, 11.22it/s, acc=0.806, xentropy=0.668]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.715


Epoch 344: 100%|██████████| 391/391 [00:34<00:00, 12.48it/s, acc=0.807, xentropy=0.657]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.714


Epoch 345: 100%|██████████| 391/391 [00:34<00:00, 11.21it/s, acc=0.804, xentropy=0.667]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.717


Epoch 346: 100%|██████████| 391/391 [00:34<00:00, 12.64it/s, acc=0.804, xentropy=0.669]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.715


Epoch 347: 100%|██████████| 391/391 [00:34<00:00, 12.46it/s, acc=0.802, xentropy=0.670]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.717


Epoch 348: 100%|██████████| 391/391 [00:34<00:00, 11.25it/s, acc=0.806, xentropy=0.669]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.714


Epoch 349: 100%|██████████| 391/391 [00:34<00:00, 12.48it/s, acc=0.805, xentropy=0.666]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.714


Epoch 350: 100%|██████████| 391/391 [00:34<00:00, 12.50it/s, acc=0.804, xentropy=0.666]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.715


Epoch 351: 100%|██████████| 391/391 [00:34<00:00, 11.20it/s, acc=0.804, xentropy=0.666]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.715


Epoch 352: 100%|██████████| 391/391 [00:34<00:00, 11.31it/s, acc=0.804, xentropy=0.664]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.715


Epoch 353: 100%|██████████| 391/391 [00:34<00:00, 11.24it/s, acc=0.805, xentropy=0.668]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.713


Epoch 354: 100%|██████████| 391/391 [00:34<00:00, 12.33it/s, acc=0.805, xentropy=0.666]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.715


Epoch 355: 100%|██████████| 391/391 [00:34<00:00, 12.13it/s, acc=0.804, xentropy=0.667]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.716


Epoch 356: 100%|██████████| 391/391 [00:34<00:00, 12.31it/s, acc=0.805, xentropy=0.665]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.713


Epoch 357: 100%|██████████| 391/391 [00:34<00:00, 11.29it/s, acc=0.803, xentropy=0.665]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.714


Epoch 358: 100%|██████████| 391/391 [00:34<00:00, 12.17it/s, acc=0.804, xentropy=0.669]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.716


Epoch 359: 100%|██████████| 391/391 [00:34<00:00, 12.65it/s, acc=0.804, xentropy=0.665]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.714


Epoch 360: 100%|██████████| 391/391 [00:34<00:00, 12.09it/s, acc=0.804, xentropy=0.668]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.716


Epoch 361: 100%|██████████| 391/391 [00:34<00:00, 11.26it/s, acc=0.804, xentropy=0.667]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.716


Epoch 362: 100%|██████████| 391/391 [00:34<00:00, 12.22it/s, acc=0.805, xentropy=0.668]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.716


Epoch 363: 100%|██████████| 391/391 [00:34<00:00, 12.82it/s, acc=0.805, xentropy=0.665]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.717


Epoch 364: 100%|██████████| 391/391 [00:34<00:00, 12.12it/s, acc=0.804, xentropy=0.671]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.716


Epoch 365: 100%|██████████| 391/391 [00:34<00:00, 12.39it/s, acc=0.805, xentropy=0.665]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.713


Epoch 366: 100%|██████████| 391/391 [00:34<00:00, 12.73it/s, acc=0.806, xentropy=0.668]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.714


Epoch 367: 100%|██████████| 391/391 [00:34<00:00, 11.19it/s, acc=0.805, xentropy=0.662]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.716


Epoch 368: 100%|██████████| 391/391 [00:34<00:00, 12.02it/s, acc=0.805, xentropy=0.662]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.716


Epoch 369: 100%|██████████| 391/391 [00:34<00:00, 12.55it/s, acc=0.804, xentropy=0.669]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.714


Epoch 370: 100%|██████████| 391/391 [00:34<00:00, 11.18it/s, acc=0.804, xentropy=0.667]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.714


Epoch 371: 100%|██████████| 391/391 [00:34<00:00, 12.99it/s, acc=0.807, xentropy=0.654]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.714


Epoch 372: 100%|██████████| 391/391 [00:34<00:00, 12.45it/s, acc=0.803, xentropy=0.668]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.714


Epoch 373: 100%|██████████| 391/391 [00:34<00:00, 11.22it/s, acc=0.805, xentropy=0.667]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.715


Epoch 374: 100%|██████████| 391/391 [00:34<00:00, 12.26it/s, acc=0.803, xentropy=0.668]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.715


Epoch 375: 100%|██████████| 391/391 [00:34<00:00, 12.66it/s, acc=0.804, xentropy=0.666]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.715


Epoch 376: 100%|██████████| 391/391 [00:35<00:00, 11.15it/s, acc=0.804, xentropy=0.670]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.714


Epoch 377: 100%|██████████| 391/391 [00:34<00:00, 11.29it/s, acc=0.806, xentropy=0.668]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.716


Epoch 378: 100%|██████████| 391/391 [00:34<00:00, 11.27it/s, acc=0.805, xentropy=0.669]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.716


Epoch 379: 100%|██████████| 391/391 [00:34<00:00, 11.30it/s, acc=0.802, xentropy=0.665]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.714


Epoch 380: 100%|██████████| 391/391 [00:34<00:00, 11.23it/s, acc=0.805, xentropy=0.666]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.715


Epoch 381: 100%|██████████| 391/391 [00:34<00:00, 12.52it/s, acc=0.805, xentropy=0.668]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.716


Epoch 382: 100%|██████████| 391/391 [00:35<00:00, 12.35it/s, acc=0.802, xentropy=0.671]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.714


Epoch 383: 100%|██████████| 391/391 [00:34<00:00, 12.70it/s, acc=0.805, xentropy=0.667]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.714


Epoch 384: 100%|██████████| 391/391 [00:34<00:00, 11.23it/s, acc=0.804, xentropy=0.668]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.716


Epoch 385: 100%|██████████| 391/391 [00:34<00:00, 11.20it/s, acc=0.806, xentropy=0.665]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.716


Epoch 386: 100%|██████████| 391/391 [00:35<00:00, 11.78it/s, acc=0.805, xentropy=0.663]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.715


Epoch 387: 100%|██████████| 391/391 [00:36<00:00, 10.85it/s, acc=0.806, xentropy=0.663]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.715


Epoch 388: 100%|██████████| 391/391 [00:35<00:00, 12.43it/s, acc=0.806, xentropy=0.662]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.714


Epoch 389: 100%|██████████| 391/391 [00:35<00:00, 10.91it/s, acc=0.805, xentropy=0.664]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.714


Epoch 390: 100%|██████████| 391/391 [00:35<00:00, 11.11it/s, acc=0.805, xentropy=0.667]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.715


Epoch 391: 100%|██████████| 391/391 [00:34<00:00, 11.33it/s, acc=0.805, xentropy=0.668]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.715


Epoch 392: 100%|██████████| 391/391 [00:34<00:00, 11.33it/s, acc=0.804, xentropy=0.664]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.714


Epoch 393: 100%|██████████| 391/391 [00:34<00:00, 11.40it/s, acc=0.805, xentropy=0.668]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.715


Epoch 394: 100%|██████████| 391/391 [00:35<00:00, 12.45it/s, acc=0.804, xentropy=0.666]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.714


Epoch 395: 100%|██████████| 391/391 [00:34<00:00, 12.81it/s, acc=0.805, xentropy=0.671]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.713


Epoch 396: 100%|██████████| 391/391 [00:34<00:00, 11.37it/s, acc=0.805, xentropy=0.664]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.715


Epoch 397: 100%|██████████| 391/391 [00:34<00:00, 12.60it/s, acc=0.806, xentropy=0.665]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.717


Epoch 398: 100%|██████████| 391/391 [00:34<00:00, 12.31it/s, acc=0.803, xentropy=0.666]
  0%|          | 0/391 [00:00<?, ?it/s]

test_acc: 0.716


Epoch 399: 100%|██████████| 391/391 [00:34<00:00, 11.27it/s, acc=0.803, xentropy=0.670]


test_acc: 0.716


In [22]:
# Re-run the evaluation helper on the test loader once training has finished.
# The cell displays the value returned by `test`; it agrees with the last
# `test_acc` printed by the training loop.
# NOTE(review): `test` is defined earlier in the notebook — presumably it
# returns top-1 accuracy over the test set; confirm against its definition.
test(testLoader)

0.7156

In [0]:
# Save the trained weights to the mounted Google Drive folder.
import os  # local import: only this cell needs it

checkpoint_path = '/content/gdrive/My Drive/checkpoints/model.pt'

# torch.save does not create missing parent directories; make sure the target
# folder exists so the save cannot fail after the long training run above.
os.makedirs(os.path.dirname(checkpoint_path), exist_ok=True)

# Serialise the parameters from whatever device the model currently lives on.
# The earlier `cnn.cuda()` call moved the model as a side effect and raised on
# a runtime without a GPU; it is not needed in order to write a state_dict.
# When restoring on a CPU-only machine, pass `map_location='cpu'` to torch.load.
torch.save(cnn.state_dict(), checkpoint_path)