# PyTorch Tutorial

PyTorch is a popular deep learning framework, and it is easy to get started with.

In [12]:
import torch
import torch.nn as nn
import torch.nn.functional as F
import torch.optim as optim
import torch.utils.data as data
import torchvision
import torchvision.transforms as transforms
from tqdm import tqdm
import time
import sys

# Training configuration.
BATCH_SIZE = 128  # number of samples per mini-batch handed to the data loaders
NUM_EPOCHS = 10   # number of full passes over the training set

# Seed PyTorch's global RNG so that weight initialisation and the shuffling
# order of the training loader are repeatable across "Restart & Run All".
SEED = 0
torch.manual_seed(SEED)

First, we read the MNIST data, preprocess it, and wrap it in `DataLoader` objects.

In [13]:
# Preprocessing pipeline: convert each image to a tensor, then normalise the
# single channel with mean 0.5 and std 0.5.
normalize = transforms.Normalize(mean=[.5], std=[.5])
transform = transforms.Compose([
    transforms.ToTensor(),
    normalize,
])

# Datasets: the training split triggers the download into ./mnist/; the test
# split is then loaded from the same directory without downloading again.
train_dataset = torchvision.datasets.MNIST(
    root='./mnist/',
    train=True,
    transform=transform,
    download=True,
)
test_dataset = torchvision.datasets.MNIST(
    root='./mnist/',
    train=False,
    transform=transform,
    download=False,
)

# Mini-batch iterators. Only the training data is shuffled.
# NOTE: drop_last=True discards the final incomplete batch, so the test loader
# also skips the trailing samples that do not fill a whole batch.
train_loader = data.DataLoader(
    train_dataset,
    batch_size=BATCH_SIZE,
    shuffle=True,
    drop_last=True,
)
test_loader = data.DataLoader(
    test_dataset,
    batch_size=BATCH_SIZE,
    shuffle=False,
    drop_last=True,
)

Then, we define the model, the objective (loss) function, and the optimizer that we use for classification.

In [14]:
class SimpleNet(nn.Module):
    """Small convolutional classifier for single-channel 28x28 images.

    Architecture: two conv + ReLU + 2x2 max-pool stages followed by three
    fully connected layers (400 -> 120 -> 84 -> 10). For a 28x28 input the
    second pooling stage produces a 16x5x5 feature map per sample, which is
    where the 400 input features of ``fc1`` come from.
    """

    # Per-sample feature-map shape (channels, height, width) expected right
    # before the fully connected layers; 16 * 5 * 5 == 400 == fc1.in_features.
    _FEATURE_SHAPE = (16, 5, 5)

    def __init__(self):
        super().__init__()
        self.conv1 = nn.Conv2d(1, 6, 5, padding=2)   # keeps the 28x28 spatial size
        self.pool1 = nn.MaxPool2d(2)                 # 28x28 -> 14x14
        self.conv2 = nn.Conv2d(6, 16, 5, padding=0)  # 14x14 -> 10x10
        self.pool2 = nn.MaxPool2d(2)                 # 10x10 -> 5x5
        self.fc1 = nn.Linear(400, 120)
        self.fc2 = nn.Linear(120, 84)
        self.fc3 = nn.Linear(84, 10)

    def forward(self, x):
        """Compute class scores for a batch of images.

        Args:
            x: image tensor whose trailing dimensions are (1, 28, 28).

        Returns:
            Tensor with 10 unnormalised scores (logits) per input sample;
            no softmax is applied here.

        Raises:
            RuntimeError: if the convolutional feature map does not have the
                per-sample shape the fully connected layers were sized for
                (i.e. the input images are not 28x28).
        """
        x = self.pool1(F.relu(self.conv1(x)))
        x = self.pool2(F.relu(self.conv2(x)))

        # Guard the flatten: a bare reshape(-1, 400) would silently mix
        # samples together whenever the total element count happens to be a
        # multiple of 400, returning logits for a wrong number of "samples".
        if tuple(x.shape[-3:]) != self._FEATURE_SHAPE:
            raise RuntimeError(
                "SimpleNet expects 1x28x28 inputs; got a feature map of shape "
                "%s per sample instead of %s"
                % (tuple(x.shape[-3:]), self._FEATURE_SHAPE)
            )
        x = x.reshape(-1, 400)

        x = F.relu(self.fc1(x))
        x = F.relu(self.fc2(x))
        return self.fc3(x)

# Instantiate the network.
model = SimpleNet()

# Loss function and optimizer: cross-entropy applied to the model's raw
# output scores, and Adam over all model parameters with its default settings.
criterion = F.cross_entropy
optimizer = optim.Adam(model.parameters())

Next, we can start to train and evaluate!

In [18]:
# train and evaluate
def evaluate_accuracy(model, loader):
    """Return the fraction of samples in ``loader`` that ``model`` classifies correctly.

    The model is switched to eval mode and run without gradient tracking, so
    no autograd graph is built during evaluation. The previous train/eval
    mode is restored afterwards. Accuracy is computed as correct / total over
    all samples, so it stays exact even if batches differ in size.

    Args:
        model: module mapping a batch of images to per-class scores.
        loader: iterable yielding ``(images, labels)`` batches.

    Returns:
        Accuracy as a float in [0, 1]; 0.0 if the loader yields no samples.
    """
    was_training = model.training
    model.eval()
    correct = 0
    total = 0
    try:
        with torch.no_grad():
            for images, labels in loader:
                predictions = model(images).argmax(-1)
                correct += (predictions == labels).sum().item()
                total += labels.size(0)
    finally:
        # Restore whatever mode the caller had the model in.
        model.train(was_training)
    return correct / total if total else 0.0


for epoch in range(NUM_EPOCHS):
    model.train()
    train_err = 0
    train_acc = 0
    t = tqdm(train_loader, leave=True)
    for i, (images, labels) in enumerate(t):
        # forward + backward + optimize
        optimizer.zero_grad()
        # Call the module itself rather than .forward() so registered hooks run.
        y_pred = model(images)
        err = criterion(y_pred, labels)
        err.backward()
        optimizer.step()

        # Running means of loss and accuracy over the batches seen so far
        # in this epoch.
        batch_acc = (labels == y_pred.argmax(-1)).float().mean().item()
        train_err = (train_err * i + err.item()) / (i + 1)
        train_acc = (train_acc * i + batch_acc) / (i + 1)
        t.set_description(
            "Loss: %.4f | Train Set Acc: %.4f |"
            % (train_err, train_acc))

    # evaluate on the test set after every epoch
    test_acc = evaluate_accuracy(model, test_loader)
    # Written to stderr, the stream tqdm's progress bar uses by default.
    print("Test Set Acc: %.4f" % (test_acc), file=sys.stderr)
    
    



  0%|          | 0/468 [00:00<?, ?it/s][A
Loss: 2.3061 | Train Set Acc: 0.1016 |:   0%|          | 0/468 [00:00<?, ?it/s][A
Loss: 2.2971 | Train Set Acc: 0.1094 |:   0%|          | 0/468 [00:00<?, ?it/s][A
Loss: 2.2971 | Train Set Acc: 0.1094 |:   0%|          | 2/468 [00:00<00:27, 16.71it/s][A
Loss: 2.2992 | Train Set Acc: 0.1068 |:   0%|          | 2/468 [00:00<00:27, 16.71it/s][A
Loss: 2.2939 | Train Set Acc: 0.1406 |:   0%|          | 2/468 [00:00<00:27, 16.71it/s][A
Loss: 2.2939 | Train Set Acc: 0.1406 |:   1%|          | 4/468 [00:00<00:27, 16.88it/s][A
Loss: 2.2904 | Train Set Acc: 0.1562 |:   1%|          | 4/468 [00:00<00:27, 16.88it/s][A
Loss: 2.2870 | Train Set Acc: 0.1628 |:   1%|          | 4/468 [00:00<00:27, 16.88it/s][A
Loss: 2.2870 | Train Set Acc: 0.1628 |:   1%|▏         | 6/468 [00:00<00:27, 16.87it/s][A
Loss: 2.2826 | Train Set Acc: 0.1719 |:   1%|▏         | 6/468 [00:00<00:27, 16.87it/s][A
Loss: 2.2780 | Train Set Acc: 0.1777 |:   1%|▏         | 6/468

Loss: 1.2249 | Train Set Acc: 0.6386 |:  13%|█▎        | 62/468 [00:03<00:18, 22.21it/s][A
Loss: 1.2249 | Train Set Acc: 0.6386 |:  14%|█▍        | 65/468 [00:03<00:18, 21.75it/s][A
Loss: 1.2167 | Train Set Acc: 0.6412 |:  14%|█▍        | 65/468 [00:03<00:18, 21.75it/s][A
Loss: 1.2066 | Train Set Acc: 0.6441 |:  14%|█▍        | 65/468 [00:03<00:18, 21.75it/s][A
Loss: 1.1972 | Train Set Acc: 0.6467 |:  14%|█▍        | 65/468 [00:03<00:18, 21.75it/s][A
Loss: 1.1972 | Train Set Acc: 0.6467 |:  15%|█▍        | 68/468 [00:03<00:19, 20.64it/s][A
Loss: 1.1866 | Train Set Acc: 0.6495 |:  15%|█▍        | 68/468 [00:03<00:19, 20.64it/s][A
Loss: 1.1747 | Train Set Acc: 0.6526 |:  15%|█▍        | 68/468 [00:03<00:19, 20.64it/s][A
Loss: 1.1625 | Train Set Acc: 0.6557 |:  15%|█▍        | 68/468 [00:03<00:19, 20.64it/s][A
Loss: 1.1625 | Train Set Acc: 0.6557 |:  15%|█▌        | 71/468 [00:03<00:19, 20.34it/s][A
Loss: 1.1514 | Train Set Acc: 0.6593 |:  15%|█▌        | 71/468 [00:03<00:19, 20

Loss: 0.7802 | Train Set Acc: 0.7691 |:  27%|██▋       | 128/468 [00:06<00:17, 19.45it/s][A
Loss: 0.7758 | Train Set Acc: 0.7703 |:  27%|██▋       | 128/468 [00:06<00:17, 19.45it/s][A
Loss: 0.7714 | Train Set Acc: 0.7715 |:  27%|██▋       | 128/468 [00:06<00:17, 19.45it/s][A
Loss: 0.7714 | Train Set Acc: 0.7715 |:  28%|██▊       | 131/468 [00:06<00:17, 19.75it/s][A
Loss: 0.7670 | Train Set Acc: 0.7728 |:  28%|██▊       | 131/468 [00:06<00:17, 19.75it/s][A
Loss: 0.7629 | Train Set Acc: 0.7738 |:  28%|██▊       | 131/468 [00:06<00:17, 19.75it/s][A
Loss: 0.7593 | Train Set Acc: 0.7747 |:  28%|██▊       | 131/468 [00:06<00:17, 19.75it/s][A
Loss: 0.7593 | Train Set Acc: 0.7747 |:  29%|██▊       | 134/468 [00:06<00:16, 20.08it/s][A
Loss: 0.7547 | Train Set Acc: 0.7760 |:  29%|██▊       | 134/468 [00:06<00:16, 20.08it/s][A
Loss: 0.7506 | Train Set Acc: 0.7773 |:  29%|██▊       | 134/468 [00:06<00:16, 20.08it/s][A
Loss: 0.7465 | Train Set Acc: 0.7785 |:  29%|██▊       | 134/468 [00:0

Loss: 0.5856 | Train Set Acc: 0.8260 |:  41%|████      | 191/468 [00:09<00:12, 21.58it/s][A
Loss: 0.5856 | Train Set Acc: 0.8260 |:  41%|████▏     | 194/468 [00:09<00:13, 20.53it/s][A
Loss: 0.5835 | Train Set Acc: 0.8267 |:  41%|████▏     | 194/468 [00:09<00:13, 20.53it/s][A
Loss: 0.5815 | Train Set Acc: 0.8272 |:  41%|████▏     | 194/468 [00:09<00:13, 20.53it/s][A
Loss: 0.5800 | Train Set Acc: 0.8277 |:  41%|████▏     | 194/468 [00:09<00:13, 20.53it/s][A
Loss: 0.5800 | Train Set Acc: 0.8277 |:  42%|████▏     | 197/468 [00:09<00:13, 20.55it/s][A
Loss: 0.5779 | Train Set Acc: 0.8282 |:  42%|████▏     | 197/468 [00:09<00:13, 20.55it/s][A
Loss: 0.5758 | Train Set Acc: 0.8289 |:  42%|████▏     | 197/468 [00:09<00:13, 20.55it/s][A
Loss: 0.5738 | Train Set Acc: 0.8294 |:  42%|████▏     | 197/468 [00:09<00:13, 20.55it/s][A
Loss: 0.5738 | Train Set Acc: 0.8294 |:  43%|████▎     | 200/468 [00:09<00:12, 20.65it/s][A
Loss: 0.5716 | Train Set Acc: 0.8300 |:  43%|████▎     | 200/468 [00:0

Loss: 0.4741 | Train Set Acc: 0.8587 |:  55%|█████▍    | 257/468 [00:12<00:10, 20.95it/s][A
Loss: 0.4726 | Train Set Acc: 0.8591 |:  55%|█████▍    | 257/468 [00:12<00:10, 20.95it/s][A
Loss: 0.4726 | Train Set Acc: 0.8591 |:  56%|█████▌    | 260/468 [00:12<00:09, 21.65it/s][A
Loss: 0.4712 | Train Set Acc: 0.8595 |:  56%|█████▌    | 260/468 [00:12<00:09, 21.65it/s][A
Loss: 0.4698 | Train Set Acc: 0.8599 |:  56%|█████▌    | 260/468 [00:12<00:09, 21.65it/s][A
Loss: 0.4684 | Train Set Acc: 0.8603 |:  56%|█████▌    | 260/468 [00:12<00:09, 21.65it/s][A
Loss: 0.4684 | Train Set Acc: 0.8603 |:  56%|█████▌    | 263/468 [00:12<00:09, 22.37it/s][A
Loss: 0.4668 | Train Set Acc: 0.8608 |:  56%|█████▌    | 263/468 [00:12<00:09, 22.37it/s][A
Loss: 0.4657 | Train Set Acc: 0.8611 |:  56%|█████▌    | 263/468 [00:12<00:09, 22.37it/s][A
Loss: 0.4644 | Train Set Acc: 0.8615 |:  56%|█████▌    | 263/468 [00:12<00:09, 22.37it/s][A
Loss: 0.4644 | Train Set Acc: 0.8615 |:  57%|█████▋    | 266/468 [00:1

Loss: 0.4052 | Train Set Acc: 0.8794 |:  69%|██████▉   | 323/468 [00:15<00:07, 19.76it/s][A
Loss: 0.4052 | Train Set Acc: 0.8794 |:  69%|██████▉   | 325/468 [00:15<00:07, 19.79it/s][A
Loss: 0.4043 | Train Set Acc: 0.8796 |:  69%|██████▉   | 325/468 [00:15<00:07, 19.79it/s][A
Loss: 0.4035 | Train Set Acc: 0.8798 |:  69%|██████▉   | 325/468 [00:15<00:07, 19.79it/s][A
Loss: 0.4035 | Train Set Acc: 0.8798 |:  70%|██████▉   | 327/468 [00:15<00:07, 19.58it/s][A
Loss: 0.4025 | Train Set Acc: 0.8801 |:  70%|██████▉   | 327/468 [00:15<00:07, 19.58it/s][A
Loss: 0.4016 | Train Set Acc: 0.8804 |:  70%|██████▉   | 327/468 [00:15<00:07, 19.58it/s][A
Loss: 0.4016 | Train Set Acc: 0.8804 |:  70%|███████   | 329/468 [00:15<00:07, 19.43it/s][A
Loss: 0.4008 | Train Set Acc: 0.8806 |:  70%|███████   | 329/468 [00:16<00:07, 19.43it/s][A
Loss: 0.3999 | Train Set Acc: 0.8808 |:  70%|███████   | 329/468 [00:16<00:07, 19.43it/s][A
Loss: 0.3991 | Train Set Acc: 0.8811 |:  70%|███████   | 329/468 [00:1

Loss: 0.3572 | Train Set Acc: 0.8933 |:  83%|████████▎ | 388/468 [00:18<00:04, 18.07it/s][A
Loss: 0.3567 | Train Set Acc: 0.8936 |:  83%|████████▎ | 388/468 [00:18<00:04, 18.07it/s][A
Loss: 0.3561 | Train Set Acc: 0.8938 |:  83%|████████▎ | 388/468 [00:19<00:04, 18.07it/s][A
Loss: 0.3556 | Train Set Acc: 0.8939 |:  83%|████████▎ | 388/468 [00:19<00:04, 18.07it/s][A
Loss: 0.3556 | Train Set Acc: 0.8939 |:  84%|████████▎ | 391/468 [00:19<00:03, 19.40it/s][A
Loss: 0.3547 | Train Set Acc: 0.8942 |:  84%|████████▎ | 391/468 [00:19<00:03, 19.40it/s][A
Loss: 0.3541 | Train Set Acc: 0.8944 |:  84%|████████▎ | 391/468 [00:19<00:03, 19.40it/s][A
Loss: 0.3535 | Train Set Acc: 0.8945 |:  84%|████████▎ | 391/468 [00:19<00:03, 19.40it/s][A
Loss: 0.3535 | Train Set Acc: 0.8945 |:  84%|████████▍ | 394/468 [00:19<00:03, 20.51it/s][A
Loss: 0.3528 | Train Set Acc: 0.8947 |:  84%|████████▍ | 394/468 [00:19<00:03, 20.51it/s][A
Loss: 0.3521 | Train Set Acc: 0.8949 |:  84%|████████▍ | 394/468 [00:1

Loss: 0.3215 | Train Set Acc: 0.9040 |:  96%|█████████▌| 450/468 [00:22<00:00, 18.28it/s][A
Loss: 0.3209 | Train Set Acc: 0.9042 |:  96%|█████████▌| 450/468 [00:22<00:00, 18.28it/s][A
Loss: 0.3209 | Train Set Acc: 0.9042 |:  97%|█████████▋| 452/468 [00:22<00:00, 18.02it/s][A
Loss: 0.3203 | Train Set Acc: 0.9043 |:  97%|█████████▋| 452/468 [00:22<00:00, 18.02it/s][A
Loss: 0.3197 | Train Set Acc: 0.9045 |:  97%|█████████▋| 452/468 [00:22<00:00, 18.02it/s][A
Loss: 0.3197 | Train Set Acc: 0.9045 |:  97%|█████████▋| 454/468 [00:22<00:00, 18.48it/s][A
Loss: 0.3192 | Train Set Acc: 0.9047 |:  97%|█████████▋| 454/468 [00:22<00:00, 18.48it/s][A
Loss: 0.3189 | Train Set Acc: 0.9048 |:  97%|█████████▋| 454/468 [00:22<00:00, 18.48it/s][A
Loss: 0.3183 | Train Set Acc: 0.9049 |:  97%|█████████▋| 454/468 [00:22<00:00, 18.48it/s][A
Loss: 0.3183 | Train Set Acc: 0.9049 |:  98%|█████████▊| 457/468 [00:22<00:00, 19.22it/s][A
Loss: 0.3177 | Train Set Acc: 0.9051 |:  98%|█████████▊| 457/468 [00:2

Loss: 0.0941 | Train Set Acc: 0.9738 |:  10%|▉         | 45/468 [00:02<00:25, 16.69it/s][A
Loss: 0.0929 | Train Set Acc: 0.9742 |:  10%|▉         | 45/468 [00:02<00:25, 16.69it/s][A
Loss: 0.0923 | Train Set Acc: 0.9742 |:  10%|▉         | 45/468 [00:02<00:25, 16.69it/s][A
Loss: 0.0923 | Train Set Acc: 0.9742 |:  10%|█         | 47/468 [00:02<00:25, 16.21it/s][A
Loss: 0.0915 | Train Set Acc: 0.9743 |:  10%|█         | 47/468 [00:02<00:25, 16.21it/s][A
Loss: 0.0914 | Train Set Acc: 0.9740 |:  10%|█         | 47/468 [00:02<00:25, 16.21it/s][A
Loss: 0.0914 | Train Set Acc: 0.9740 |:  10%|█         | 49/468 [00:02<00:25, 16.36it/s][A
Loss: 0.0900 | Train Set Acc: 0.9744 |:  10%|█         | 49/468 [00:02<00:25, 16.36it/s][A
Loss: 0.0892 | Train Set Acc: 0.9747 |:  10%|█         | 49/468 [00:02<00:25, 16.36it/s][A
Loss: 0.0892 | Train Set Acc: 0.9747 |:  11%|█         | 51/468 [00:02<00:25, 16.26it/s][A
Loss: 0.0895 | Train Set Acc: 0.9745 |:  11%|█         | 51/468 [00:02<00:25, 16

Loss: 0.0804 | Train Set Acc: 0.9761 |:  23%|██▎       | 107/468 [00:05<00:17, 20.66it/s][A
Loss: 0.0804 | Train Set Acc: 0.9761 |:  24%|██▎       | 110/468 [00:05<00:17, 20.15it/s][A
Loss: 0.0809 | Train Set Acc: 0.9760 |:  24%|██▎       | 110/468 [00:05<00:17, 20.15it/s][A
Loss: 0.0817 | Train Set Acc: 0.9760 |:  24%|██▎       | 110/468 [00:05<00:17, 20.15it/s][A
Loss: 0.0815 | Train Set Acc: 0.9761 |:  24%|██▎       | 110/468 [00:05<00:17, 20.15it/s][A
Loss: 0.0815 | Train Set Acc: 0.9761 |:  24%|██▍       | 113/468 [00:05<00:17, 20.70it/s][A
Loss: 0.0817 | Train Set Acc: 0.9760 |:  24%|██▍       | 113/468 [00:05<00:17, 20.70it/s][A
Loss: 0.0815 | Train Set Acc: 0.9760 |:  24%|██▍       | 113/468 [00:05<00:17, 20.70it/s][A
Loss: 0.0812 | Train Set Acc: 0.9760 |:  24%|██▍       | 113/468 [00:05<00:17, 20.70it/s][A
Loss: 0.0812 | Train Set Acc: 0.9760 |:  25%|██▍       | 116/468 [00:05<00:17, 20.17it/s][A
Loss: 0.0809 | Train Set Acc: 0.9761 |:  25%|██▍       | 116/468 [00:0

Loss: 0.0832 | Train Set Acc: 0.9745 |:  37%|███▋      | 172/468 [00:08<00:15, 18.64it/s][A
Loss: 0.0832 | Train Set Acc: 0.9745 |:  37%|███▋      | 174/468 [00:08<00:16, 18.06it/s][A
Loss: 0.0831 | Train Set Acc: 0.9746 |:  37%|███▋      | 174/468 [00:08<00:16, 18.06it/s][A
Loss: 0.0828 | Train Set Acc: 0.9747 |:  37%|███▋      | 174/468 [00:08<00:16, 18.06it/s][A
Loss: 0.0828 | Train Set Acc: 0.9747 |:  38%|███▊      | 176/468 [00:08<00:17, 16.92it/s][A
Loss: 0.0826 | Train Set Acc: 0.9748 |:  38%|███▊      | 176/468 [00:09<00:17, 16.92it/s][A
Loss: 0.0826 | Train Set Acc: 0.9748 |:  38%|███▊      | 176/468 [00:09<00:17, 16.92it/s][A
Loss: 0.0826 | Train Set Acc: 0.9748 |:  38%|███▊      | 178/468 [00:09<00:17, 16.94it/s][A
Loss: 0.0824 | Train Set Acc: 0.9748 |:  38%|███▊      | 178/468 [00:09<00:17, 16.94it/s][A
Loss: 0.0829 | Train Set Acc: 0.9747 |:  38%|███▊      | 178/468 [00:09<00:17, 16.94it/s][A
Loss: 0.0829 | Train Set Acc: 0.9747 |:  38%|███▊      | 180/468 [00:0

Loss: 0.0812 | Train Set Acc: 0.9753 |:  50%|█████     | 235/468 [00:12<00:11, 20.36it/s][A
Loss: 0.0811 | Train Set Acc: 0.9753 |:  50%|█████     | 235/468 [00:12<00:11, 20.36it/s][A
Loss: 0.0811 | Train Set Acc: 0.9753 |:  50%|█████     | 235/468 [00:12<00:11, 20.36it/s][A
Loss: 0.0811 | Train Set Acc: 0.9753 |:  51%|█████     | 238/468 [00:12<00:11, 20.15it/s][A
Loss: 0.0811 | Train Set Acc: 0.9753 |:  51%|█████     | 238/468 [00:12<00:11, 20.15it/s][A
Loss: 0.0810 | Train Set Acc: 0.9754 |:  51%|█████     | 238/468 [00:12<00:11, 20.15it/s][A
Loss: 0.0809 | Train Set Acc: 0.9754 |:  51%|█████     | 238/468 [00:12<00:11, 20.15it/s][A
Loss: 0.0809 | Train Set Acc: 0.9754 |:  51%|█████▏    | 241/468 [00:12<00:11, 19.84it/s][A
Loss: 0.0808 | Train Set Acc: 0.9755 |:  51%|█████▏    | 241/468 [00:12<00:11, 19.84it/s][A
Loss: 0.0809 | Train Set Acc: 0.9754 |:  51%|█████▏    | 241/468 [00:12<00:11, 19.84it/s][A
Loss: 0.0809 | Train Set Acc: 0.9754 |:  52%|█████▏    | 243/468 [00:1

Loss: 0.0789 | Train Set Acc: 0.9760 |:  64%|██████▍   | 300/468 [00:15<00:08, 19.10it/s][A
Loss: 0.0788 | Train Set Acc: 0.9760 |:  64%|██████▍   | 300/468 [00:15<00:08, 19.10it/s][A
Loss: 0.0788 | Train Set Acc: 0.9760 |:  64%|██████▍   | 300/468 [00:15<00:08, 19.10it/s][A
Loss: 0.0788 | Train Set Acc: 0.9760 |:  64%|██████▍   | 300/468 [00:15<00:08, 19.10it/s][A
Loss: 0.0788 | Train Set Acc: 0.9760 |:  65%|██████▍   | 303/468 [00:15<00:08, 19.68it/s][A
Loss: 0.0790 | Train Set Acc: 0.9760 |:  65%|██████▍   | 303/468 [00:15<00:08, 19.68it/s][A
Loss: 0.0793 | Train Set Acc: 0.9759 |:  65%|██████▍   | 303/468 [00:15<00:08, 19.68it/s][A
Loss: 0.0793 | Train Set Acc: 0.9759 |:  65%|██████▍   | 303/468 [00:15<00:08, 19.68it/s][A
Loss: 0.0793 | Train Set Acc: 0.9759 |:  65%|██████▌   | 306/468 [00:15<00:08, 20.07it/s][A
Loss: 0.0793 | Train Set Acc: 0.9759 |:  65%|██████▌   | 306/468 [00:15<00:08, 20.07it/s][A
Loss: 0.0793 | Train Set Acc: 0.9759 |:  65%|██████▌   | 306/468 [00:1

Loss: 0.0791 | Train Set Acc: 0.9760 |:  78%|███████▊  | 364/468 [00:18<00:05, 20.08it/s][A
Loss: 0.0791 | Train Set Acc: 0.9760 |:  78%|███████▊  | 364/468 [00:18<00:05, 20.08it/s][A
Loss: 0.0791 | Train Set Acc: 0.9760 |:  78%|███████▊  | 364/468 [00:18<00:05, 20.08it/s][A
Loss: 0.0792 | Train Set Acc: 0.9759 |:  78%|███████▊  | 364/468 [00:18<00:05, 20.08it/s][A
Loss: 0.0792 | Train Set Acc: 0.9759 |:  78%|███████▊  | 367/468 [00:18<00:05, 19.56it/s][A
Loss: 0.0792 | Train Set Acc: 0.9759 |:  78%|███████▊  | 367/468 [00:18<00:05, 19.56it/s][A
Loss: 0.0790 | Train Set Acc: 0.9760 |:  78%|███████▊  | 367/468 [00:18<00:05, 19.56it/s][A
Loss: 0.0790 | Train Set Acc: 0.9760 |:  79%|███████▉  | 369/468 [00:18<00:05, 19.65it/s][A
Loss: 0.0790 | Train Set Acc: 0.9760 |:  79%|███████▉  | 369/468 [00:18<00:05, 19.65it/s][A
Loss: 0.0791 | Train Set Acc: 0.9760 |:  79%|███████▉  | 369/468 [00:18<00:05, 19.65it/s][A
Loss: 0.0791 | Train Set Acc: 0.9760 |:  79%|███████▉  | 371/468 [00:1

Loss: 0.0767 | Train Set Acc: 0.9767 |:  91%|█████████ | 427/468 [00:21<00:01, 21.28it/s][A
Loss: 0.0767 | Train Set Acc: 0.9767 |:  91%|█████████ | 427/468 [00:21<00:01, 21.28it/s][A
Loss: 0.0766 | Train Set Acc: 0.9768 |:  91%|█████████ | 427/468 [00:21<00:01, 21.28it/s][A
Loss: 0.0768 | Train Set Acc: 0.9767 |:  91%|█████████ | 427/468 [00:21<00:01, 21.28it/s][A
Loss: 0.0768 | Train Set Acc: 0.9767 |:  92%|█████████▏| 430/468 [00:21<00:01, 21.29it/s][A
Loss: 0.0768 | Train Set Acc: 0.9767 |:  92%|█████████▏| 430/468 [00:21<00:01, 21.29it/s][A
Loss: 0.0768 | Train Set Acc: 0.9767 |:  92%|█████████▏| 430/468 [00:21<00:01, 21.29it/s][A
Loss: 0.0767 | Train Set Acc: 0.9767 |:  92%|█████████▏| 430/468 [00:21<00:01, 21.29it/s][A
Loss: 0.0767 | Train Set Acc: 0.9767 |:  93%|█████████▎| 433/468 [00:21<00:01, 21.49it/s][A
Loss: 0.0767 | Train Set Acc: 0.9768 |:  93%|█████████▎| 433/468 [00:21<00:01, 21.49it/s][A
Loss: 0.0766 | Train Set Acc: 0.9768 |:  93%|█████████▎| 433/468 [00:2

Loss: 0.0618 | Train Set Acc: 0.9807 |:   4%|▍         | 20/468 [00:01<00:26, 17.12it/s][A
Loss: 0.0623 | Train Set Acc: 0.9808 |:   4%|▍         | 20/468 [00:01<00:26, 17.12it/s][A
Loss: 0.0623 | Train Set Acc: 0.9808 |:   5%|▍         | 22/468 [00:01<00:25, 17.30it/s][A
Loss: 0.0612 | Train Set Acc: 0.9810 |:   5%|▍         | 22/468 [00:01<00:25, 17.30it/s][A
Loss: 0.0644 | Train Set Acc: 0.9805 |:   5%|▍         | 22/468 [00:01<00:25, 17.30it/s][A
Loss: 0.0627 | Train Set Acc: 0.9809 |:   5%|▍         | 22/468 [00:01<00:25, 17.30it/s][A
Loss: 0.0627 | Train Set Acc: 0.9809 |:   5%|▌         | 25/468 [00:01<00:24, 18.37it/s][A
Loss: 0.0611 | Train Set Acc: 0.9814 |:   5%|▌         | 25/468 [00:01<00:24, 18.37it/s][A
Loss: 0.0602 | Train Set Acc: 0.9812 |:   5%|▌         | 25/468 [00:01<00:24, 18.37it/s][A
Loss: 0.0598 | Train Set Acc: 0.9816 |:   5%|▌         | 25/468 [00:01<00:24, 18.37it/s][A
Loss: 0.0598 | Train Set Acc: 0.9816 |:   6%|▌         | 28/468 [00:01<00:22, 19

Loss: 0.0504 | Train Set Acc: 0.9847 |:  18%|█▊        | 83/468 [00:04<00:18, 20.78it/s][A
Loss: 0.0505 | Train Set Acc: 0.9846 |:  18%|█▊        | 83/468 [00:04<00:18, 20.78it/s][A
Loss: 0.0505 | Train Set Acc: 0.9846 |:  18%|█▊        | 86/468 [00:04<00:20, 19.07it/s][A
Loss: 0.0511 | Train Set Acc: 0.9846 |:  18%|█▊        | 86/468 [00:04<00:20, 19.07it/s][A
Loss: 0.0507 | Train Set Acc: 0.9847 |:  18%|█▊        | 86/468 [00:04<00:20, 19.07it/s][A
Loss: 0.0507 | Train Set Acc: 0.9847 |:  19%|█▉        | 88/468 [00:04<00:20, 18.45it/s][A
Loss: 0.0505 | Train Set Acc: 0.9847 |:  19%|█▉        | 88/468 [00:04<00:20, 18.45it/s][A
Loss: 0.0503 | Train Set Acc: 0.9848 |:  19%|█▉        | 88/468 [00:04<00:20, 18.45it/s][A
Loss: 0.0503 | Train Set Acc: 0.9848 |:  19%|█▉        | 90/468 [00:04<00:20, 18.69it/s][A
Loss: 0.0502 | Train Set Acc: 0.9848 |:  19%|█▉        | 90/468 [00:04<00:20, 18.69it/s][A
Loss: 0.0497 | Train Set Acc: 0.9850 |:  19%|█▉        | 90/468 [00:04<00:20, 18

Loss: 0.0514 | Train Set Acc: 0.9844 |:  31%|███▏      | 147/468 [00:07<00:14, 22.49it/s][A
Loss: 0.0514 | Train Set Acc: 0.9844 |:  32%|███▏      | 150/468 [00:07<00:13, 22.84it/s][A
Loss: 0.0515 | Train Set Acc: 0.9843 |:  32%|███▏      | 150/468 [00:07<00:13, 22.84it/s][A
Loss: 0.0515 | Train Set Acc: 0.9843 |:  32%|███▏      | 150/468 [00:07<00:13, 22.84it/s][A
Loss: 0.0517 | Train Set Acc: 0.9843 |:  32%|███▏      | 150/468 [00:07<00:13, 22.84it/s][A
Loss: 0.0517 | Train Set Acc: 0.9843 |:  33%|███▎      | 153/468 [00:07<00:13, 23.03it/s][A
Loss: 0.0515 | Train Set Acc: 0.9843 |:  33%|███▎      | 153/468 [00:07<00:13, 23.03it/s][A
Loss: 0.0515 | Train Set Acc: 0.9844 |:  33%|███▎      | 153/468 [00:07<00:13, 23.03it/s][A
Loss: 0.0515 | Train Set Acc: 0.9843 |:  33%|███▎      | 153/468 [00:07<00:13, 23.03it/s][A
Loss: 0.0515 | Train Set Acc: 0.9843 |:  33%|███▎      | 156/468 [00:07<00:13, 22.44it/s][A
Loss: 0.0515 | Train Set Acc: 0.9843 |:  33%|███▎      | 156/468 [00:0

Loss: 0.0524 | Train Set Acc: 0.9839 |:  46%|████▌     | 213/468 [00:10<00:12, 19.71it/s][A
Loss: 0.0523 | Train Set Acc: 0.9839 |:  46%|████▌     | 213/468 [00:10<00:12, 19.71it/s][A
Loss: 0.0523 | Train Set Acc: 0.9839 |:  46%|████▌     | 216/468 [00:10<00:12, 19.85it/s][A
Loss: 0.0523 | Train Set Acc: 0.9839 |:  46%|████▌     | 216/468 [00:11<00:12, 19.85it/s][A
Loss: 0.0523 | Train Set Acc: 0.9839 |:  46%|████▌     | 216/468 [00:11<00:12, 19.85it/s][A
Loss: 0.0523 | Train Set Acc: 0.9839 |:  47%|████▋     | 218/468 [00:11<00:12, 19.45it/s][A
Loss: 0.0523 | Train Set Acc: 0.9838 |:  47%|████▋     | 218/468 [00:11<00:12, 19.45it/s][A
Loss: 0.0525 | Train Set Acc: 0.9838 |:  47%|████▋     | 218/468 [00:11<00:12, 19.45it/s][A
Loss: 0.0525 | Train Set Acc: 0.9837 |:  47%|████▋     | 218/468 [00:11<00:12, 19.45it/s][A
Loss: 0.0525 | Train Set Acc: 0.9837 |:  47%|████▋     | 221/468 [00:11<00:12, 20.14it/s][A
Loss: 0.0523 | Train Set Acc: 0.9838 |:  47%|████▋     | 221/468 [00:1

Loss: 0.0544 | Train Set Acc: 0.9830 |:  59%|█████▉    | 278/468 [00:14<00:08, 21.64it/s][A
Loss: 0.0544 | Train Set Acc: 0.9830 |:  60%|██████    | 281/468 [00:14<00:09, 20.49it/s][A
Loss: 0.0543 | Train Set Acc: 0.9831 |:  60%|██████    | 281/468 [00:14<00:09, 20.49it/s][A
Loss: 0.0545 | Train Set Acc: 0.9830 |:  60%|██████    | 281/468 [00:14<00:09, 20.49it/s][A
Loss: 0.0544 | Train Set Acc: 0.9830 |:  60%|██████    | 281/468 [00:14<00:09, 20.49it/s][A
Loss: 0.0544 | Train Set Acc: 0.9830 |:  61%|██████    | 284/468 [00:14<00:09, 19.99it/s][A
Loss: 0.0544 | Train Set Acc: 0.9830 |:  61%|██████    | 284/468 [00:14<00:09, 19.99it/s][A
Loss: 0.0543 | Train Set Acc: 0.9830 |:  61%|██████    | 284/468 [00:14<00:09, 19.99it/s][A
Loss: 0.0543 | Train Set Acc: 0.9830 |:  61%|██████    | 284/468 [00:14<00:09, 19.99it/s][A
Loss: 0.0543 | Train Set Acc: 0.9830 |:  61%|██████▏   | 287/468 [00:14<00:09, 19.73it/s][A
Loss: 0.0543 | Train Set Acc: 0.9830 |:  61%|██████▏   | 287/468 [00:1

Loss: 0.0531 | Train Set Acc: 0.9837 |:  72%|███████▏  | 339/468 [00:17<00:07, 18.28it/s][A
Loss: 0.0530 | Train Set Acc: 0.9837 |:  72%|███████▏  | 339/468 [00:17<00:07, 18.28it/s][A
Loss: 0.0530 | Train Set Acc: 0.9837 |:  73%|███████▎  | 342/468 [00:17<00:06, 19.98it/s][A
Loss: 0.0531 | Train Set Acc: 0.9837 |:  73%|███████▎  | 342/468 [00:17<00:06, 19.98it/s][A
Loss: 0.0531 | Train Set Acc: 0.9837 |:  73%|███████▎  | 342/468 [00:17<00:06, 19.98it/s][A
Loss: 0.0531 | Train Set Acc: 0.9837 |:  73%|███████▎  | 342/468 [00:17<00:06, 19.98it/s][A
Loss: 0.0531 | Train Set Acc: 0.9837 |:  74%|███████▎  | 345/468 [00:17<00:05, 21.18it/s][A
Loss: 0.0530 | Train Set Acc: 0.9837 |:  74%|███████▎  | 345/468 [00:17<00:05, 21.18it/s][A
Loss: 0.0532 | Train Set Acc: 0.9836 |:  74%|███████▎  | 345/468 [00:17<00:05, 21.18it/s][A
Loss: 0.0530 | Train Set Acc: 0.9837 |:  74%|███████▎  | 345/468 [00:17<00:05, 21.18it/s][A
Loss: 0.0530 | Train Set Acc: 0.9837 |:  74%|███████▍  | 348/468 [00:1

Loss: 0.0536 | Train Set Acc: 0.9835 |:  86%|████████▌ | 403/468 [00:20<00:03, 18.03it/s][A
Loss: 0.0537 | Train Set Acc: 0.9835 |:  86%|████████▌ | 403/468 [00:20<00:03, 18.03it/s][A
Loss: 0.0538 | Train Set Acc: 0.9835 |:  86%|████████▌ | 403/468 [00:20<00:03, 18.03it/s][A
Loss: 0.0538 | Train Set Acc: 0.9835 |:  87%|████████▋ | 405/468 [00:20<00:03, 17.75it/s][A
Loss: 0.0538 | Train Set Acc: 0.9835 |:  87%|████████▋ | 405/468 [00:20<00:03, 17.75it/s][A
Loss: 0.0538 | Train Set Acc: 0.9835 |:  87%|████████▋ | 405/468 [00:20<00:03, 17.75it/s][A
Loss: 0.0538 | Train Set Acc: 0.9835 |:  87%|████████▋ | 407/468 [00:20<00:03, 17.85it/s][A
Loss: 0.0537 | Train Set Acc: 0.9836 |:  87%|████████▋ | 407/468 [00:20<00:03, 17.85it/s][A
Loss: 0.0538 | Train Set Acc: 0.9835 |:  87%|████████▋ | 407/468 [00:20<00:03, 17.85it/s][A
Loss: 0.0538 | Train Set Acc: 0.9835 |:  87%|████████▋ | 409/468 [00:20<00:03, 18.30it/s][A
Loss: 0.0537 | Train Set Acc: 0.9836 |:  87%|████████▋ | 409/468 [00:2

Loss: 0.0529 | Train Set Acc: 0.9838 |:  99%|█████████▉| 464/468 [00:23<00:00, 21.99it/s][A
Loss: 0.0529 | Train Set Acc: 0.9838 |:  99%|█████████▉| 464/468 [00:23<00:00, 21.99it/s][A
Loss: 0.0529 | Train Set Acc: 0.9839 |:  99%|█████████▉| 464/468 [00:23<00:00, 21.99it/s][A
Loss: 0.0529 | Train Set Acc: 0.9839 |: 100%|█████████▉| 467/468 [00:23<00:00, 22.68it/s][A
Loss: 0.0529 | Train Set Acc: 0.9838 |: 100%|██████████| 468/468 [00:23<00:00, 19.64it/s][A
Test Set Acc: 0.9863

  0%|          | 0/468 [00:00<?, ?it/s][A
Loss: 0.0294 | Train Set Acc: 0.9922 |:   0%|          | 0/468 [00:00<?, ?it/s][A
Loss: 0.0329 | Train Set Acc: 0.9922 |:   0%|          | 0/468 [00:00<?, ?it/s][A
Loss: 0.0329 | Train Set Acc: 0.9922 |:   0%|          | 2/468 [00:00<00:24, 18.74it/s][A
Loss: 0.0372 | Train Set Acc: 0.9922 |:   0%|          | 2/468 [00:00<00:24, 18.74it/s][A
Loss: 0.0294 | Train Set Acc: 0.9941 |:   0%|          | 2/468 [00:00<00:24, 18.74it/s][A
Loss: 0.0294 | Train Set Acc: 0

Loss: 0.0389 | Train Set Acc: 0.9883 |:  12%|█▏        | 58/468 [00:03<00:22, 17.95it/s][A
Loss: 0.0389 | Train Set Acc: 0.9883 |:  12%|█▏        | 58/468 [00:03<00:22, 17.95it/s][A
Loss: 0.0389 | Train Set Acc: 0.9883 |:  13%|█▎        | 60/468 [00:03<00:22, 17.98it/s][A
Loss: 0.0392 | Train Set Acc: 0.9882 |:  13%|█▎        | 60/468 [00:03<00:22, 17.98it/s][A
Loss: 0.0387 | Train Set Acc: 0.9884 |:  13%|█▎        | 60/468 [00:03<00:22, 17.98it/s][A
Loss: 0.0399 | Train Set Acc: 0.9880 |:  13%|█▎        | 60/468 [00:03<00:22, 17.98it/s][A
Loss: 0.0399 | Train Set Acc: 0.9880 |:  13%|█▎        | 63/468 [00:03<00:21, 19.27it/s][A
Loss: 0.0396 | Train Set Acc: 0.9880 |:  13%|█▎        | 63/468 [00:03<00:21, 19.27it/s][A
Loss: 0.0399 | Train Set Acc: 0.9877 |:  13%|█▎        | 63/468 [00:03<00:21, 19.27it/s][A
Loss: 0.0400 | Train Set Acc: 0.9878 |:  13%|█▎        | 63/468 [00:03<00:21, 19.27it/s][A
Loss: 0.0400 | Train Set Acc: 0.9878 |:  14%|█▍        | 66/468 [00:03<00:20, 19

Loss: 0.0418 | Train Set Acc: 0.9872 |:  26%|██▌       | 120/468 [00:06<00:19, 18.12it/s][A
Loss: 0.0418 | Train Set Acc: 0.9872 |:  26%|██▌       | 122/468 [00:06<00:20, 17.26it/s][A
Loss: 0.0426 | Train Set Acc: 0.9870 |:  26%|██▌       | 122/468 [00:06<00:20, 17.26it/s][A
Loss: 0.0425 | Train Set Acc: 0.9871 |:  26%|██▌       | 122/468 [00:06<00:20, 17.26it/s][A
Loss: 0.0425 | Train Set Acc: 0.9871 |:  26%|██▋       | 124/468 [00:06<00:21, 16.10it/s][A
Loss: 0.0426 | Train Set Acc: 0.9870 |:  26%|██▋       | 124/468 [00:06<00:21, 16.10it/s][A
Loss: 0.0424 | Train Set Acc: 0.9870 |:  26%|██▋       | 124/468 [00:06<00:21, 16.10it/s][A
Loss: 0.0424 | Train Set Acc: 0.9870 |:  27%|██▋       | 126/468 [00:06<00:21, 15.78it/s][A
Loss: 0.0423 | Train Set Acc: 0.9870 |:  27%|██▋       | 126/468 [00:06<00:21, 15.78it/s][A
Loss: 0.0424 | Train Set Acc: 0.9869 |:  27%|██▋       | 126/468 [00:06<00:21, 15.78it/s][A
Loss: 0.0424 | Train Set Acc: 0.9869 |:  27%|██▋       | 128/468 [00:0

Loss: 0.0421 | Train Set Acc: 0.9868 |:  40%|███▉      | 185/468 [00:09<00:13, 20.73it/s][A
Loss: 0.0420 | Train Set Acc: 0.9868 |:  40%|███▉      | 185/468 [00:09<00:13, 20.73it/s][A
Loss: 0.0420 | Train Set Acc: 0.9868 |:  40%|███▉      | 185/468 [00:09<00:13, 20.73it/s][A
Loss: 0.0419 | Train Set Acc: 0.9868 |:  40%|███▉      | 185/468 [00:09<00:13, 20.73it/s][A
Loss: 0.0419 | Train Set Acc: 0.9868 |:  40%|████      | 188/468 [00:09<00:13, 21.22it/s][A
Loss: 0.0418 | Train Set Acc: 0.9868 |:  40%|████      | 188/468 [00:09<00:13, 21.22it/s][A
Loss: 0.0419 | Train Set Acc: 0.9867 |:  40%|████      | 188/468 [00:09<00:13, 21.22it/s][A
Loss: 0.0423 | Train Set Acc: 0.9866 |:  40%|████      | 188/468 [00:09<00:13, 21.22it/s][A
Loss: 0.0423 | Train Set Acc: 0.9866 |:  41%|████      | 191/468 [00:09<00:12, 21.67it/s][A
Loss: 0.0424 | Train Set Acc: 0.9866 |:  41%|████      | 191/468 [00:09<00:12, 21.67it/s][A
Loss: 0.0423 | Train Set Acc: 0.9866 |:  41%|████      | 191/468 [00:0

Loss: 0.0418 | Train Set Acc: 0.9866 |:  54%|█████▎    | 251/468 [00:12<00:10, 19.93it/s][A
Loss: 0.0418 | Train Set Acc: 0.9866 |:  54%|█████▎    | 251/468 [00:12<00:10, 19.93it/s][A
Loss: 0.0417 | Train Set Acc: 0.9866 |:  54%|█████▎    | 251/468 [00:12<00:10, 19.93it/s][A
Loss: 0.0417 | Train Set Acc: 0.9866 |:  54%|█████▎    | 251/468 [00:12<00:10, 19.93it/s][A
Loss: 0.0417 | Train Set Acc: 0.9866 |:  54%|█████▍    | 254/468 [00:12<00:10, 20.33it/s][A
Loss: 0.0416 | Train Set Acc: 0.9866 |:  54%|█████▍    | 254/468 [00:12<00:10, 20.33it/s][A
Loss: 0.0416 | Train Set Acc: 0.9866 |:  54%|█████▍    | 254/468 [00:12<00:10, 20.33it/s][A
Loss: 0.0416 | Train Set Acc: 0.9866 |:  54%|█████▍    | 254/468 [00:12<00:10, 20.33it/s][A
Loss: 0.0416 | Train Set Acc: 0.9866 |:  55%|█████▍    | 257/468 [00:12<00:10, 20.16it/s][A
Loss: 0.0415 | Train Set Acc: 0.9866 |:  55%|█████▍    | 257/468 [00:12<00:10, 20.16it/s][A
Loss: 0.0415 | Train Set Acc: 0.9866 |:  55%|█████▍    | 257/468 [00:1

Loss: 0.0433 | Train Set Acc: 0.9860 |:  68%|██████▊   | 316/468 [00:15<00:06, 22.84it/s][A
Loss: 0.0433 | Train Set Acc: 0.9860 |:  68%|██████▊   | 316/468 [00:15<00:06, 22.84it/s][A
Loss: 0.0432 | Train Set Acc: 0.9860 |:  68%|██████▊   | 316/468 [00:15<00:06, 22.84it/s][A
Loss: 0.0432 | Train Set Acc: 0.9861 |:  68%|██████▊   | 316/468 [00:15<00:06, 22.84it/s][A
Loss: 0.0432 | Train Set Acc: 0.9861 |:  68%|██████▊   | 319/468 [00:15<00:06, 23.41it/s][A
Loss: 0.0431 | Train Set Acc: 0.9861 |:  68%|██████▊   | 319/468 [00:15<00:06, 23.41it/s][A
Loss: 0.0432 | Train Set Acc: 0.9861 |:  68%|██████▊   | 319/468 [00:15<00:06, 23.41it/s][A
Loss: 0.0431 | Train Set Acc: 0.9861 |:  68%|██████▊   | 319/468 [00:16<00:06, 23.41it/s][A
Loss: 0.0431 | Train Set Acc: 0.9861 |:  69%|██████▉   | 322/468 [00:16<00:06, 22.90it/s][A
Loss: 0.0431 | Train Set Acc: 0.9861 |:  69%|██████▉   | 322/468 [00:16<00:06, 22.90it/s][A
Loss: 0.0431 | Train Set Acc: 0.9862 |:  69%|██████▉   | 322/468 [00:1

Loss: 0.0429 | Train Set Acc: 0.9863 |:  81%|████████  | 380/468 [00:19<00:04, 19.49it/s][A
Loss: 0.0429 | Train Set Acc: 0.9863 |:  82%|████████▏ | 382/468 [00:19<00:04, 18.88it/s][A
Loss: 0.0428 | Train Set Acc: 0.9863 |:  82%|████████▏ | 382/468 [00:19<00:04, 18.88it/s][A
Loss: 0.0428 | Train Set Acc: 0.9863 |:  82%|████████▏ | 382/468 [00:19<00:04, 18.88it/s][A
Loss: 0.0428 | Train Set Acc: 0.9863 |:  82%|████████▏ | 384/468 [00:19<00:04, 18.89it/s][A
Loss: 0.0429 | Train Set Acc: 0.9863 |:  82%|████████▏ | 384/468 [00:19<00:04, 18.89it/s][A
Loss: 0.0428 | Train Set Acc: 0.9863 |:  82%|████████▏ | 384/468 [00:19<00:04, 18.89it/s][A
Loss: 0.0428 | Train Set Acc: 0.9863 |:  82%|████████▏ | 386/468 [00:19<00:04, 19.12it/s][A
Loss: 0.0428 | Train Set Acc: 0.9863 |:  82%|████████▏ | 386/468 [00:19<00:04, 19.12it/s][A
Loss: 0.0429 | Train Set Acc: 0.9863 |:  82%|████████▏ | 386/468 [00:19<00:04, 19.12it/s][A
Loss: 0.0429 | Train Set Acc: 0.9863 |:  82%|████████▏ | 386/468 [00:1

Loss: 0.0432 | Train Set Acc: 0.9863 |:  95%|█████████▍| 444/468 [00:22<00:01, 22.21it/s][A
Loss: 0.0432 | Train Set Acc: 0.9863 |:  95%|█████████▍| 444/468 [00:22<00:01, 22.21it/s][A
Loss: 0.0432 | Train Set Acc: 0.9863 |:  96%|█████████▌| 447/468 [00:22<00:01, 20.42it/s][A
Loss: 0.0432 | Train Set Acc: 0.9863 |:  96%|█████████▌| 447/468 [00:22<00:01, 20.42it/s][A
Loss: 0.0433 | Train Set Acc: 0.9864 |:  96%|█████████▌| 447/468 [00:22<00:01, 20.42it/s][A
Loss: 0.0432 | Train Set Acc: 0.9864 |:  96%|█████████▌| 447/468 [00:22<00:01, 20.42it/s][A
Loss: 0.0432 | Train Set Acc: 0.9864 |:  96%|█████████▌| 450/468 [00:22<00:00, 19.71it/s][A
Loss: 0.0431 | Train Set Acc: 0.9864 |:  96%|█████████▌| 450/468 [00:22<00:00, 19.71it/s][A
Loss: 0.0431 | Train Set Acc: 0.9864 |:  96%|█████████▌| 450/468 [00:22<00:00, 19.71it/s][A
Loss: 0.0430 | Train Set Acc: 0.9864 |:  96%|█████████▌| 450/468 [00:22<00:00, 19.71it/s][A
Loss: 0.0430 | Train Set Acc: 0.9864 |:  97%|█████████▋| 453/468 [00:2

Loss: 0.0297 | Train Set Acc: 0.9897 |:   8%|▊         | 39/468 [00:01<00:21, 19.97it/s][A
Loss: 0.0293 | Train Set Acc: 0.9900 |:   8%|▊         | 39/468 [00:02<00:21, 19.97it/s][A
Loss: 0.0293 | Train Set Acc: 0.9900 |:   9%|▉         | 42/468 [00:02<00:20, 20.70it/s][A
Loss: 0.0289 | Train Set Acc: 0.9900 |:   9%|▉         | 42/468 [00:02<00:20, 20.70it/s][A
Loss: 0.0285 | Train Set Acc: 0.9902 |:   9%|▉         | 42/468 [00:02<00:20, 20.70it/s][A
Loss: 0.0288 | Train Set Acc: 0.9899 |:   9%|▉         | 42/468 [00:02<00:20, 20.70it/s][A
Loss: 0.0288 | Train Set Acc: 0.9899 |:  10%|▉         | 45/468 [00:02<00:20, 21.15it/s][A
Loss: 0.0297 | Train Set Acc: 0.9896 |:  10%|▉         | 45/468 [00:02<00:20, 21.15it/s][A
Loss: 0.0293 | Train Set Acc: 0.9899 |:  10%|▉         | 45/468 [00:02<00:20, 21.15it/s][A
Loss: 0.0296 | Train Set Acc: 0.9896 |:  10%|▉         | 45/468 [00:02<00:20, 21.15it/s][A
Loss: 0.0296 | Train Set Acc: 0.9896 |:  10%|█         | 48/468 [00:02<00:19, 21

Loss: 0.0320 | Train Set Acc: 0.9894 |:  22%|██▏       | 105/468 [00:05<00:18, 20.09it/s][A
Loss: 0.0318 | Train Set Acc: 0.9895 |:  22%|██▏       | 105/468 [00:05<00:18, 20.09it/s][A
Loss: 0.0317 | Train Set Acc: 0.9895 |:  22%|██▏       | 105/468 [00:05<00:18, 20.09it/s][A
Loss: 0.0317 | Train Set Acc: 0.9895 |:  23%|██▎       | 108/468 [00:05<00:17, 20.37it/s][A
Loss: 0.0323 | Train Set Acc: 0.9894 |:  23%|██▎       | 108/468 [00:05<00:17, 20.37it/s][A
Loss: 0.0324 | Train Set Acc: 0.9893 |:  23%|██▎       | 108/468 [00:05<00:17, 20.37it/s][A
Loss: 0.0322 | Train Set Acc: 0.9894 |:  23%|██▎       | 108/468 [00:05<00:17, 20.37it/s][A
Loss: 0.0322 | Train Set Acc: 0.9894 |:  24%|██▎       | 111/468 [00:05<00:17, 20.60it/s][A
Loss: 0.0327 | Train Set Acc: 0.9893 |:  24%|██▎       | 111/468 [00:05<00:17, 20.60it/s][A
Loss: 0.0328 | Train Set Acc: 0.9892 |:  24%|██▎       | 111/468 [00:05<00:17, 20.60it/s][A
Loss: 0.0327 | Train Set Acc: 0.9892 |:  24%|██▎       | 111/468 [00:0

Loss: 0.0320 | Train Set Acc: 0.9897 |:  36%|███▌      | 168/468 [00:08<00:14, 20.56it/s][A
Loss: 0.0320 | Train Set Acc: 0.9897 |:  37%|███▋      | 171/468 [00:08<00:14, 21.14it/s][A
Loss: 0.0320 | Train Set Acc: 0.9897 |:  37%|███▋      | 171/468 [00:08<00:14, 21.14it/s][A
Loss: 0.0319 | Train Set Acc: 0.9897 |:  37%|███▋      | 171/468 [00:08<00:14, 21.14it/s][A
Loss: 0.0319 | Train Set Acc: 0.9897 |:  37%|███▋      | 171/468 [00:08<00:14, 21.14it/s][A
Loss: 0.0319 | Train Set Acc: 0.9897 |:  37%|███▋      | 174/468 [00:08<00:13, 21.20it/s][A
Loss: 0.0318 | Train Set Acc: 0.9897 |:  37%|███▋      | 174/468 [00:08<00:13, 21.20it/s][A
Loss: 0.0319 | Train Set Acc: 0.9896 |:  37%|███▋      | 174/468 [00:08<00:13, 21.20it/s][A
Loss: 0.0319 | Train Set Acc: 0.9896 |:  37%|███▋      | 174/468 [00:08<00:13, 21.20it/s][A
Loss: 0.0319 | Train Set Acc: 0.9896 |:  38%|███▊      | 177/468 [00:08<00:13, 21.10it/s][A
Loss: 0.0318 | Train Set Acc: 0.9896 |:  38%|███▊      | 177/468 [00:0

Loss: 0.0334 | Train Set Acc: 0.9892 |:  50%|████▉     | 232/468 [00:11<00:11, 19.74it/s][A
Loss: 0.0334 | Train Set Acc: 0.9892 |:  50%|█████     | 234/468 [00:11<00:12, 18.62it/s][A
Loss: 0.0333 | Train Set Acc: 0.9893 |:  50%|█████     | 234/468 [00:11<00:12, 18.62it/s][A
Loss: 0.0332 | Train Set Acc: 0.9893 |:  50%|█████     | 234/468 [00:11<00:12, 18.62it/s][A
Loss: 0.0332 | Train Set Acc: 0.9893 |:  50%|█████     | 236/468 [00:11<00:12, 18.30it/s][A
Loss: 0.0331 | Train Set Acc: 0.9893 |:  50%|█████     | 236/468 [00:11<00:12, 18.30it/s][A
Loss: 0.0333 | Train Set Acc: 0.9893 |:  50%|█████     | 236/468 [00:11<00:12, 18.30it/s][A
Loss: 0.0333 | Train Set Acc: 0.9893 |:  51%|█████     | 238/468 [00:11<00:12, 17.70it/s][A
Loss: 0.0333 | Train Set Acc: 0.9892 |:  51%|█████     | 238/468 [00:11<00:12, 17.70it/s][A
Loss: 0.0334 | Train Set Acc: 0.9892 |:  51%|█████     | 238/468 [00:11<00:12, 17.70it/s][A
Loss: 0.0334 | Train Set Acc: 0.9892 |:  51%|█████▏    | 240/468 [00:1

Loss: 0.0346 | Train Set Acc: 0.9887 |:  63%|██████▎   | 294/468 [00:14<00:08, 21.48it/s][A
Loss: 0.0346 | Train Set Acc: 0.9887 |:  63%|██████▎   | 297/468 [00:14<00:08, 21.03it/s][A
Loss: 0.0346 | Train Set Acc: 0.9888 |:  63%|██████▎   | 297/468 [00:14<00:08, 21.03it/s][A
Loss: 0.0346 | Train Set Acc: 0.9887 |:  63%|██████▎   | 297/468 [00:14<00:08, 21.03it/s][A
Loss: 0.0346 | Train Set Acc: 0.9887 |:  63%|██████▎   | 297/468 [00:14<00:08, 21.03it/s][A
Loss: 0.0346 | Train Set Acc: 0.9887 |:  64%|██████▍   | 300/468 [00:14<00:08, 20.73it/s][A
Loss: 0.0346 | Train Set Acc: 0.9888 |:  64%|██████▍   | 300/468 [00:14<00:08, 20.73it/s][A
Loss: 0.0345 | Train Set Acc: 0.9888 |:  64%|██████▍   | 300/468 [00:14<00:08, 20.73it/s][A
Loss: 0.0345 | Train Set Acc: 0.9888 |:  64%|██████▍   | 300/468 [00:14<00:08, 20.73it/s][A
Loss: 0.0345 | Train Set Acc: 0.9888 |:  65%|██████▍   | 303/468 [00:14<00:08, 20.48it/s][A
Loss: 0.0345 | Train Set Acc: 0.9888 |:  65%|██████▍   | 303/468 [00:1

Loss: 0.0348 | Train Set Acc: 0.9885 |:  77%|███████▋  | 362/468 [00:17<00:05, 18.92it/s][A
Loss: 0.0348 | Train Set Acc: 0.9885 |:  77%|███████▋  | 362/468 [00:17<00:05, 18.92it/s][A
Loss: 0.0350 | Train Set Acc: 0.9885 |:  77%|███████▋  | 362/468 [00:17<00:05, 18.92it/s][A
Loss: 0.0350 | Train Set Acc: 0.9885 |:  77%|███████▋  | 362/468 [00:17<00:05, 18.92it/s][A
Loss: 0.0350 | Train Set Acc: 0.9885 |:  78%|███████▊  | 365/468 [00:17<00:05, 20.05it/s][A
Loss: 0.0350 | Train Set Acc: 0.9885 |:  78%|███████▊  | 365/468 [00:17<00:05, 20.05it/s][A
Loss: 0.0350 | Train Set Acc: 0.9885 |:  78%|███████▊  | 365/468 [00:18<00:05, 20.05it/s][A
Loss: 0.0350 | Train Set Acc: 0.9885 |:  78%|███████▊  | 365/468 [00:18<00:05, 20.05it/s][A
Loss: 0.0350 | Train Set Acc: 0.9885 |:  79%|███████▊  | 368/468 [00:18<00:04, 20.63it/s][A
Loss: 0.0350 | Train Set Acc: 0.9885 |:  79%|███████▊  | 368/468 [00:18<00:04, 20.63it/s][A
Loss: 0.0349 | Train Set Acc: 0.9885 |:  79%|███████▊  | 368/468 [00:1

Loss: 0.0347 | Train Set Acc: 0.9887 |:  91%|█████████ | 425/468 [00:20<00:02, 20.69it/s][A
Loss: 0.0346 | Train Set Acc: 0.9888 |:  91%|█████████ | 425/468 [00:21<00:02, 20.69it/s][A
Loss: 0.0346 | Train Set Acc: 0.9888 |:  91%|█████████▏| 428/468 [00:21<00:01, 20.71it/s][A
Loss: 0.0346 | Train Set Acc: 0.9888 |:  91%|█████████▏| 428/468 [00:21<00:01, 20.71it/s][A
Loss: 0.0345 | Train Set Acc: 0.9888 |:  91%|█████████▏| 428/468 [00:21<00:01, 20.71it/s][A
Loss: 0.0348 | Train Set Acc: 0.9887 |:  91%|█████████▏| 428/468 [00:21<00:01, 20.71it/s][A
Loss: 0.0348 | Train Set Acc: 0.9887 |:  92%|█████████▏| 431/468 [00:21<00:01, 20.55it/s][A
Loss: 0.0348 | Train Set Acc: 0.9887 |:  92%|█████████▏| 431/468 [00:21<00:01, 20.55it/s][A
Loss: 0.0349 | Train Set Acc: 0.9887 |:  92%|█████████▏| 431/468 [00:21<00:01, 20.55it/s][A
Loss: 0.0350 | Train Set Acc: 0.9887 |:  92%|█████████▏| 431/468 [00:21<00:01, 20.55it/s][A
Loss: 0.0350 | Train Set Acc: 0.9887 |:  93%|█████████▎| 434/468 [00:2

Loss: 0.0393 | Train Set Acc: 0.9889 |:   5%|▌         | 24/468 [00:01<00:19, 22.22it/s][A
Loss: 0.0383 | Train Set Acc: 0.9894 |:   5%|▌         | 24/468 [00:01<00:19, 22.22it/s][A
Loss: 0.0372 | Train Set Acc: 0.9898 |:   5%|▌         | 24/468 [00:01<00:19, 22.22it/s][A
Loss: 0.0367 | Train Set Acc: 0.9899 |:   5%|▌         | 24/468 [00:01<00:19, 22.22it/s][A
Loss: 0.0367 | Train Set Acc: 0.9899 |:   6%|▌         | 27/468 [00:01<00:19, 22.79it/s][A
Loss: 0.0370 | Train Set Acc: 0.9894 |:   6%|▌         | 27/468 [00:01<00:19, 22.79it/s][A
Loss: 0.0368 | Train Set Acc: 0.9895 |:   6%|▌         | 27/468 [00:01<00:19, 22.79it/s][A
Loss: 0.0363 | Train Set Acc: 0.9896 |:   6%|▌         | 27/468 [00:01<00:19, 22.79it/s][A
Loss: 0.0363 | Train Set Acc: 0.9896 |:   6%|▋         | 30/468 [00:01<00:18, 23.21it/s][A
Loss: 0.0360 | Train Set Acc: 0.9897 |:   6%|▋         | 30/468 [00:01<00:18, 23.21it/s][A
Loss: 0.0354 | Train Set Acc: 0.9897 |:   6%|▋         | 30/468 [00:01<00:18, 23

Loss: 0.0322 | Train Set Acc: 0.9908 |:  19%|█▊        | 87/468 [00:04<00:21, 17.79it/s][A
Loss: 0.0319 | Train Set Acc: 0.9909 |:  19%|█▊        | 87/468 [00:04<00:21, 17.79it/s][A
Loss: 0.0319 | Train Set Acc: 0.9909 |:  19%|█▉        | 89/468 [00:04<00:21, 17.97it/s][A
Loss: 0.0318 | Train Set Acc: 0.9909 |:  19%|█▉        | 89/468 [00:04<00:21, 17.97it/s][A
Loss: 0.0315 | Train Set Acc: 0.9910 |:  19%|█▉        | 89/468 [00:04<00:21, 17.97it/s][A
Loss: 0.0314 | Train Set Acc: 0.9910 |:  19%|█▉        | 89/468 [00:04<00:21, 17.97it/s][A
Loss: 0.0314 | Train Set Acc: 0.9910 |:  20%|█▉        | 92/468 [00:04<00:20, 18.48it/s][A
Loss: 0.0314 | Train Set Acc: 0.9910 |:  20%|█▉        | 92/468 [00:04<00:20, 18.48it/s][A
Loss: 0.0310 | Train Set Acc: 0.9911 |:  20%|█▉        | 92/468 [00:04<00:20, 18.48it/s][A
Loss: 0.0309 | Train Set Acc: 0.9911 |:  20%|█▉        | 92/468 [00:04<00:20, 18.48it/s][A
Loss: 0.0309 | Train Set Acc: 0.9911 |:  20%|██        | 95/468 [00:04<00:19, 19

Loss: 0.0299 | Train Set Acc: 0.9915 |:  32%|███▏      | 152/468 [00:07<00:15, 20.99it/s][A
Loss: 0.0300 | Train Set Acc: 0.9915 |:  32%|███▏      | 152/468 [00:07<00:15, 20.99it/s][A
Loss: 0.0300 | Train Set Acc: 0.9915 |:  33%|███▎      | 155/468 [00:07<00:15, 20.62it/s][A
Loss: 0.0300 | Train Set Acc: 0.9915 |:  33%|███▎      | 155/468 [00:07<00:15, 20.62it/s][A
Loss: 0.0299 | Train Set Acc: 0.9915 |:  33%|███▎      | 155/468 [00:07<00:15, 20.62it/s][A
Loss: 0.0302 | Train Set Acc: 0.9913 |:  33%|███▎      | 155/468 [00:07<00:15, 20.62it/s][A
Loss: 0.0302 | Train Set Acc: 0.9913 |:  34%|███▍      | 158/468 [00:07<00:15, 20.44it/s][A
Loss: 0.0300 | Train Set Acc: 0.9914 |:  34%|███▍      | 158/468 [00:07<00:15, 20.44it/s][A
Loss: 0.0301 | Train Set Acc: 0.9914 |:  34%|███▍      | 158/468 [00:07<00:15, 20.44it/s][A
Loss: 0.0299 | Train Set Acc: 0.9914 |:  34%|███▍      | 158/468 [00:07<00:15, 20.44it/s][A
Loss: 0.0299 | Train Set Acc: 0.9914 |:  34%|███▍      | 161/468 [00:0

Loss: 0.0283 | Train Set Acc: 0.9917 |:  47%|████▋     | 218/468 [00:10<00:12, 20.31it/s][A
Loss: 0.0282 | Train Set Acc: 0.9917 |:  47%|████▋     | 218/468 [00:10<00:12, 20.31it/s][A
Loss: 0.0282 | Train Set Acc: 0.9917 |:  47%|████▋     | 218/468 [00:10<00:12, 20.31it/s][A
Loss: 0.0282 | Train Set Acc: 0.9917 |:  47%|████▋     | 218/468 [00:10<00:12, 20.31it/s][A
Loss: 0.0282 | Train Set Acc: 0.9917 |:  47%|████▋     | 221/468 [00:10<00:11, 21.17it/s][A
Loss: 0.0282 | Train Set Acc: 0.9917 |:  47%|████▋     | 221/468 [00:10<00:11, 21.17it/s][A
Loss: 0.0282 | Train Set Acc: 0.9916 |:  47%|████▋     | 221/468 [00:11<00:11, 21.17it/s][A
Loss: 0.0281 | Train Set Acc: 0.9916 |:  47%|████▋     | 221/468 [00:11<00:11, 21.17it/s][A
Loss: 0.0281 | Train Set Acc: 0.9916 |:  48%|████▊     | 224/468 [00:11<00:11, 21.77it/s][A
Loss: 0.0281 | Train Set Acc: 0.9917 |:  48%|████▊     | 224/468 [00:11<00:11, 21.77it/s][A
Loss: 0.0281 | Train Set Acc: 0.9917 |:  48%|████▊     | 224/468 [00:1

Loss: 0.0297 | Train Set Acc: 0.9909 |:  60%|██████    | 282/468 [00:13<00:09, 20.42it/s][A
Loss: 0.0296 | Train Set Acc: 0.9910 |:  60%|██████    | 282/468 [00:13<00:09, 20.42it/s][A
Loss: 0.0296 | Train Set Acc: 0.9910 |:  61%|██████    | 285/468 [00:13<00:09, 19.59it/s][A
Loss: 0.0296 | Train Set Acc: 0.9910 |:  61%|██████    | 285/468 [00:14<00:09, 19.59it/s][A
Loss: 0.0296 | Train Set Acc: 0.9909 |:  61%|██████    | 285/468 [00:14<00:09, 19.59it/s][A
Loss: 0.0296 | Train Set Acc: 0.9909 |:  61%|██████▏   | 287/468 [00:14<00:09, 19.22it/s][A
Loss: 0.0297 | Train Set Acc: 0.9909 |:  61%|██████▏   | 287/468 [00:14<00:09, 19.22it/s][A
Loss: 0.0296 | Train Set Acc: 0.9910 |:  61%|██████▏   | 287/468 [00:14<00:09, 19.22it/s][A
Loss: 0.0296 | Train Set Acc: 0.9910 |:  62%|██████▏   | 289/468 [00:14<00:09, 19.18it/s][A
Loss: 0.0296 | Train Set Acc: 0.9910 |:  62%|██████▏   | 289/468 [00:14<00:09, 19.18it/s][A
Loss: 0.0295 | Train Set Acc: 0.9910 |:  62%|██████▏   | 289/468 [00:1

Loss: 0.0288 | Train Set Acc: 0.9910 |:  74%|███████▍  | 348/468 [00:16<00:05, 20.69it/s][A
Loss: 0.0288 | Train Set Acc: 0.9910 |:  74%|███████▍  | 348/468 [00:17<00:05, 20.69it/s][A
Loss: 0.0288 | Train Set Acc: 0.9909 |:  74%|███████▍  | 348/468 [00:17<00:05, 20.69it/s][A
Loss: 0.0288 | Train Set Acc: 0.9910 |:  74%|███████▍  | 348/468 [00:17<00:05, 20.69it/s][A
Loss: 0.0288 | Train Set Acc: 0.9910 |:  75%|███████▌  | 351/468 [00:17<00:05, 20.25it/s][A
Loss: 0.0287 | Train Set Acc: 0.9910 |:  75%|███████▌  | 351/468 [00:17<00:05, 20.25it/s][A
Loss: 0.0287 | Train Set Acc: 0.9910 |:  75%|███████▌  | 351/468 [00:17<00:05, 20.25it/s][A
Loss: 0.0287 | Train Set Acc: 0.9910 |:  75%|███████▌  | 351/468 [00:17<00:05, 20.25it/s][A
Loss: 0.0287 | Train Set Acc: 0.9910 |:  76%|███████▌  | 354/468 [00:17<00:05, 20.82it/s][A
Loss: 0.0286 | Train Set Acc: 0.9910 |:  76%|███████▌  | 354/468 [00:17<00:05, 20.82it/s][A
Loss: 0.0287 | Train Set Acc: 0.9910 |:  76%|███████▌  | 354/468 [00:1

Loss: 0.0286 | Train Set Acc: 0.9910 |:  88%|████████▊ | 410/468 [00:20<00:03, 18.06it/s][A
Loss: 0.0286 | Train Set Acc: 0.9910 |:  88%|████████▊ | 410/468 [00:20<00:03, 18.06it/s][A
Loss: 0.0286 | Train Set Acc: 0.9910 |:  88%|████████▊ | 412/468 [00:20<00:03, 17.92it/s][A
Loss: 0.0287 | Train Set Acc: 0.9910 |:  88%|████████▊ | 412/468 [00:20<00:03, 17.92it/s][A
Loss: 0.0287 | Train Set Acc: 0.9910 |:  88%|████████▊ | 412/468 [00:20<00:03, 17.92it/s][A
Loss: 0.0287 | Train Set Acc: 0.9910 |:  88%|████████▊ | 414/468 [00:20<00:02, 18.25it/s][A
Loss: 0.0286 | Train Set Acc: 0.9910 |:  88%|████████▊ | 414/468 [00:20<00:02, 18.25it/s][A
Loss: 0.0287 | Train Set Acc: 0.9910 |:  88%|████████▊ | 414/468 [00:20<00:02, 18.25it/s][A
Loss: 0.0287 | Train Set Acc: 0.9910 |:  89%|████████▉ | 416/468 [00:20<00:02, 18.45it/s][A
Loss: 0.0287 | Train Set Acc: 0.9910 |:  89%|████████▉ | 416/468 [00:20<00:02, 18.45it/s][A
Loss: 0.0288 | Train Set Acc: 0.9909 |:  89%|████████▉ | 416/468 [00:2

Loss: 0.0173 | Train Set Acc: 0.9955 |:   1%|▏         | 6/468 [00:00<00:20, 22.58it/s][A
Loss: 0.0191 | Train Set Acc: 0.9941 |:   1%|▏         | 6/468 [00:00<00:20, 22.58it/s][A
Loss: 0.0177 | Train Set Acc: 0.9948 |:   1%|▏         | 6/468 [00:00<00:20, 22.58it/s][A
Loss: 0.0177 | Train Set Acc: 0.9948 |:   2%|▏         | 9/468 [00:00<00:19, 22.95it/s][A
Loss: 0.0248 | Train Set Acc: 0.9922 |:   2%|▏         | 9/468 [00:00<00:19, 22.95it/s][A
Loss: 0.0236 | Train Set Acc: 0.9922 |:   2%|▏         | 9/468 [00:00<00:19, 22.95it/s][A
Loss: 0.0236 | Train Set Acc: 0.9922 |:   2%|▏         | 11/468 [00:00<00:21, 21.64it/s][A
Loss: 0.0268 | Train Set Acc: 0.9909 |:   2%|▏         | 11/468 [00:00<00:21, 21.64it/s][A
Loss: 0.0249 | Train Set Acc: 0.9916 |:   2%|▏         | 11/468 [00:00<00:21, 21.64it/s][A
Loss: 0.0249 | Train Set Acc: 0.9916 |:   3%|▎         | 13/468 [00:00<00:22, 20.06it/s][A
Loss: 0.0249 | Train Set Acc: 0.9911 |:   3%|▎         | 13/468 [00:00<00:22, 20.06it/

Loss: 0.0299 | Train Set Acc: 0.9901 |:  15%|█▍        | 70/468 [00:03<00:21, 18.85it/s][A
Loss: 0.0296 | Train Set Acc: 0.9902 |:  15%|█▍        | 70/468 [00:03<00:21, 18.85it/s][A
Loss: 0.0293 | Train Set Acc: 0.9903 |:  15%|█▍        | 70/468 [00:03<00:21, 18.85it/s][A
Loss: 0.0293 | Train Set Acc: 0.9903 |:  15%|█▌        | 72/468 [00:03<00:21, 18.30it/s][A
Loss: 0.0294 | Train Set Acc: 0.9903 |:  15%|█▌        | 72/468 [00:03<00:21, 18.30it/s][A
Loss: 0.0293 | Train Set Acc: 0.9903 |:  15%|█▌        | 72/468 [00:03<00:21, 18.30it/s][A
Loss: 0.0293 | Train Set Acc: 0.9903 |:  16%|█▌        | 74/468 [00:03<00:21, 18.64it/s][A
Loss: 0.0292 | Train Set Acc: 0.9903 |:  16%|█▌        | 74/468 [00:03<00:21, 18.64it/s][A
Loss: 0.0293 | Train Set Acc: 0.9902 |:  16%|█▌        | 74/468 [00:03<00:21, 18.64it/s][A
Loss: 0.0291 | Train Set Acc: 0.9904 |:  16%|█▌        | 74/468 [00:03<00:21, 18.64it/s][A
Loss: 0.0291 | Train Set Acc: 0.9904 |:  16%|█▋        | 77/468 [00:03<00:19, 19

Loss: 0.0267 | Train Set Acc: 0.9910 |:  29%|██▊       | 134/468 [00:06<00:14, 22.89it/s][A
Loss: 0.0267 | Train Set Acc: 0.9910 |:  29%|██▊       | 134/468 [00:06<00:14, 22.89it/s][A
Loss: 0.0267 | Train Set Acc: 0.9910 |:  29%|██▉       | 137/468 [00:06<00:15, 21.86it/s][A
Loss: 0.0266 | Train Set Acc: 0.9911 |:  29%|██▉       | 137/468 [00:06<00:15, 21.86it/s][A
Loss: 0.0265 | Train Set Acc: 0.9912 |:  29%|██▉       | 137/468 [00:06<00:15, 21.86it/s][A
Loss: 0.0265 | Train Set Acc: 0.9912 |:  29%|██▉       | 137/468 [00:06<00:15, 21.86it/s][A
Loss: 0.0265 | Train Set Acc: 0.9912 |:  30%|██▉       | 140/468 [00:06<00:15, 21.11it/s][A
Loss: 0.0267 | Train Set Acc: 0.9912 |:  30%|██▉       | 140/468 [00:06<00:15, 21.11it/s][A
Loss: 0.0269 | Train Set Acc: 0.9911 |:  30%|██▉       | 140/468 [00:06<00:15, 21.11it/s][A
Loss: 0.0268 | Train Set Acc: 0.9911 |:  30%|██▉       | 140/468 [00:06<00:15, 21.11it/s][A
Loss: 0.0268 | Train Set Acc: 0.9911 |:  31%|███       | 143/468 [00:0

Loss: 0.0248 | Train Set Acc: 0.9916 |:  42%|████▏     | 196/468 [00:09<00:15, 17.58it/s][A
Loss: 0.0247 | Train Set Acc: 0.9916 |:  42%|████▏     | 196/468 [00:09<00:15, 17.58it/s][A
Loss: 0.0247 | Train Set Acc: 0.9916 |:  43%|████▎     | 199/468 [00:09<00:14, 18.42it/s][A
Loss: 0.0249 | Train Set Acc: 0.9916 |:  43%|████▎     | 199/468 [00:09<00:14, 18.42it/s][A
Loss: 0.0249 | Train Set Acc: 0.9916 |:  43%|████▎     | 199/468 [00:10<00:14, 18.42it/s][A
Loss: 0.0249 | Train Set Acc: 0.9916 |:  43%|████▎     | 201/468 [00:10<00:14, 18.52it/s][A
Loss: 0.0248 | Train Set Acc: 0.9916 |:  43%|████▎     | 201/468 [00:10<00:14, 18.52it/s][A
Loss: 0.0247 | Train Set Acc: 0.9916 |:  43%|████▎     | 201/468 [00:10<00:14, 18.52it/s][A
Loss: 0.0248 | Train Set Acc: 0.9917 |:  43%|████▎     | 201/468 [00:10<00:14, 18.52it/s][A
Loss: 0.0248 | Train Set Acc: 0.9917 |:  44%|████▎     | 204/468 [00:10<00:13, 19.43it/s][A
Loss: 0.0248 | Train Set Acc: 0.9916 |:  44%|████▎     | 204/468 [00:1

Loss: 0.0246 | Train Set Acc: 0.9918 |:  56%|█████▌    | 260/468 [00:13<00:10, 19.97it/s][A
Loss: 0.0246 | Train Set Acc: 0.9918 |:  56%|█████▌    | 263/468 [00:13<00:10, 19.65it/s][A
Loss: 0.0245 | Train Set Acc: 0.9918 |:  56%|█████▌    | 263/468 [00:13<00:10, 19.65it/s][A
Loss: 0.0245 | Train Set Acc: 0.9918 |:  56%|█████▌    | 263/468 [00:13<00:10, 19.65it/s][A
Loss: 0.0245 | Train Set Acc: 0.9918 |:  57%|█████▋    | 265/468 [00:13<00:10, 19.65it/s][A
Loss: 0.0246 | Train Set Acc: 0.9918 |:  57%|█████▋    | 265/468 [00:13<00:10, 19.65it/s][A
Loss: 0.0247 | Train Set Acc: 0.9918 |:  57%|█████▋    | 265/468 [00:13<00:10, 19.65it/s][A
Loss: 0.0247 | Train Set Acc: 0.9918 |:  57%|█████▋    | 267/468 [00:13<00:10, 19.31it/s][A
Loss: 0.0246 | Train Set Acc: 0.9919 |:  57%|█████▋    | 267/468 [00:13<00:10, 19.31it/s][A
Loss: 0.0247 | Train Set Acc: 0.9918 |:  57%|█████▋    | 267/468 [00:13<00:10, 19.31it/s][A
Loss: 0.0247 | Train Set Acc: 0.9918 |:  57%|█████▋    | 267/468 [00:1

Loss: 0.0238 | Train Set Acc: 0.9919 |:  70%|██████▉   | 327/468 [00:16<00:06, 22.66it/s][A
Loss: 0.0239 | Train Set Acc: 0.9919 |:  70%|██████▉   | 327/468 [00:16<00:06, 22.66it/s][A
Loss: 0.0238 | Train Set Acc: 0.9919 |:  70%|██████▉   | 327/468 [00:16<00:06, 22.66it/s][A
Loss: 0.0238 | Train Set Acc: 0.9919 |:  70%|██████▉   | 327/468 [00:16<00:06, 22.66it/s][A
Loss: 0.0238 | Train Set Acc: 0.9919 |:  71%|███████   | 330/468 [00:16<00:06, 22.15it/s][A
Loss: 0.0238 | Train Set Acc: 0.9919 |:  71%|███████   | 330/468 [00:16<00:06, 22.15it/s][A
Loss: 0.0239 | Train Set Acc: 0.9918 |:  71%|███████   | 330/468 [00:16<00:06, 22.15it/s][A
Loss: 0.0240 | Train Set Acc: 0.9918 |:  71%|███████   | 330/468 [00:16<00:06, 22.15it/s][A
Loss: 0.0240 | Train Set Acc: 0.9918 |:  71%|███████   | 333/468 [00:16<00:06, 22.24it/s][A
Loss: 0.0241 | Train Set Acc: 0.9918 |:  71%|███████   | 333/468 [00:16<00:06, 22.24it/s][A
Loss: 0.0242 | Train Set Acc: 0.9918 |:  71%|███████   | 333/468 [00:1

Loss: 0.0252 | Train Set Acc: 0.9914 |:  83%|████████▎ | 389/468 [00:19<00:04, 18.50it/s][A
Loss: 0.0252 | Train Set Acc: 0.9914 |:  84%|████████▎ | 391/468 [00:19<00:04, 18.37it/s][A
Loss: 0.0252 | Train Set Acc: 0.9914 |:  84%|████████▎ | 391/468 [00:19<00:04, 18.37it/s][A
Loss: 0.0253 | Train Set Acc: 0.9914 |:  84%|████████▎ | 391/468 [00:19<00:04, 18.37it/s][A
Loss: 0.0253 | Train Set Acc: 0.9914 |:  84%|████████▍ | 393/468 [00:19<00:04, 18.63it/s][A
Loss: 0.0254 | Train Set Acc: 0.9914 |:  84%|████████▍ | 393/468 [00:19<00:04, 18.63it/s][A
Loss: 0.0254 | Train Set Acc: 0.9914 |:  84%|████████▍ | 393/468 [00:19<00:04, 18.63it/s][A
Loss: 0.0254 | Train Set Acc: 0.9914 |:  84%|████████▍ | 395/468 [00:19<00:03, 18.72it/s][A
Loss: 0.0254 | Train Set Acc: 0.9914 |:  84%|████████▍ | 395/468 [00:19<00:03, 18.72it/s][A
Loss: 0.0253 | Train Set Acc: 0.9914 |:  84%|████████▍ | 395/468 [00:19<00:03, 18.72it/s][A
Loss: 0.0253 | Train Set Acc: 0.9914 |:  84%|████████▍ | 395/468 [00:1

Loss: 0.0256 | Train Set Acc: 0.9914 |:  97%|█████████▋| 453/468 [00:22<00:00, 21.94it/s][A
Loss: 0.0256 | Train Set Acc: 0.9914 |:  97%|█████████▋| 453/468 [00:22<00:00, 21.94it/s][A
Loss: 0.0256 | Train Set Acc: 0.9914 |:  97%|█████████▋| 456/468 [00:22<00:00, 20.55it/s][A
Loss: 0.0256 | Train Set Acc: 0.9915 |:  97%|█████████▋| 456/468 [00:22<00:00, 20.55it/s][A
Loss: 0.0255 | Train Set Acc: 0.9915 |:  97%|█████████▋| 456/468 [00:22<00:00, 20.55it/s][A
Loss: 0.0255 | Train Set Acc: 0.9915 |:  97%|█████████▋| 456/468 [00:22<00:00, 20.55it/s][A
Loss: 0.0255 | Train Set Acc: 0.9915 |:  98%|█████████▊| 459/468 [00:22<00:00, 20.40it/s][A
Loss: 0.0256 | Train Set Acc: 0.9914 |:  98%|█████████▊| 459/468 [00:22<00:00, 20.40it/s][A
Loss: 0.0256 | Train Set Acc: 0.9914 |:  98%|█████████▊| 459/468 [00:22<00:00, 20.40it/s][A
Loss: 0.0257 | Train Set Acc: 0.9914 |:  98%|█████████▊| 459/468 [00:22<00:00, 20.40it/s][A
Loss: 0.0257 | Train Set Acc: 0.9914 |:  99%|█████████▊| 462/468 [00:2

Loss: 0.0145 | Train Set Acc: 0.9957 |:  10%|█         | 48/468 [00:02<00:21, 19.87it/s][A
Loss: 0.0145 | Train Set Acc: 0.9956 |:  10%|█         | 48/468 [00:02<00:21, 19.87it/s][A
Loss: 0.0151 | Train Set Acc: 0.9954 |:  10%|█         | 48/468 [00:02<00:21, 19.87it/s][A
Loss: 0.0151 | Train Set Acc: 0.9954 |:  11%|█         | 51/468 [00:02<00:20, 20.41it/s][A
Loss: 0.0171 | Train Set Acc: 0.9952 |:  11%|█         | 51/468 [00:02<00:20, 20.41it/s][A
Loss: 0.0174 | Train Set Acc: 0.9950 |:  11%|█         | 51/468 [00:02<00:20, 20.41it/s][A
Loss: 0.0178 | Train Set Acc: 0.9948 |:  11%|█         | 51/468 [00:02<00:20, 20.41it/s][A
Loss: 0.0178 | Train Set Acc: 0.9948 |:  12%|█▏        | 54/468 [00:02<00:19, 20.72it/s][A
Loss: 0.0185 | Train Set Acc: 0.9946 |:  12%|█▏        | 54/468 [00:02<00:19, 20.72it/s][A
Loss: 0.0183 | Train Set Acc: 0.9947 |:  12%|█▏        | 54/468 [00:02<00:19, 20.72it/s][A
Loss: 0.0181 | Train Set Acc: 0.9948 |:  12%|█▏        | 54/468 [00:02<00:19, 20

Loss: 0.0225 | Train Set Acc: 0.9937 |:  24%|██▍       | 114/468 [00:05<00:17, 19.84it/s][A
Loss: 0.0223 | Train Set Acc: 0.9938 |:  24%|██▍       | 114/468 [00:05<00:17, 19.84it/s][A
Loss: 0.0222 | Train Set Acc: 0.9938 |:  24%|██▍       | 114/468 [00:05<00:17, 19.84it/s][A
Loss: 0.0222 | Train Set Acc: 0.9938 |:  24%|██▍       | 114/468 [00:05<00:17, 19.84it/s][A
Loss: 0.0222 | Train Set Acc: 0.9938 |:  25%|██▌       | 117/468 [00:05<00:17, 19.86it/s][A
Loss: 0.0221 | Train Set Acc: 0.9938 |:  25%|██▌       | 117/468 [00:05<00:17, 19.86it/s][A
Loss: 0.0220 | Train Set Acc: 0.9939 |:  25%|██▌       | 117/468 [00:05<00:17, 19.86it/s][A
Loss: 0.0220 | Train Set Acc: 0.9939 |:  25%|██▌       | 119/468 [00:05<00:17, 19.68it/s][A
Loss: 0.0220 | Train Set Acc: 0.9939 |:  25%|██▌       | 119/468 [00:06<00:17, 19.68it/s][A
Loss: 0.0218 | Train Set Acc: 0.9939 |:  25%|██▌       | 119/468 [00:06<00:17, 19.68it/s][A
Loss: 0.0218 | Train Set Acc: 0.9939 |:  26%|██▌       | 121/468 [00:0

Loss: 0.0208 | Train Set Acc: 0.9939 |:  38%|███▊      | 177/468 [00:08<00:13, 21.33it/s][A
Loss: 0.0208 | Train Set Acc: 0.9939 |:  38%|███▊      | 177/468 [00:08<00:13, 21.33it/s][A
Loss: 0.0208 | Train Set Acc: 0.9939 |:  38%|███▊      | 177/468 [00:08<00:13, 21.33it/s][A
Loss: 0.0208 | Train Set Acc: 0.9939 |:  38%|███▊      | 180/468 [00:08<00:13, 21.89it/s][A
Loss: 0.0208 | Train Set Acc: 0.9939 |:  38%|███▊      | 180/468 [00:08<00:13, 21.89it/s][A
Loss: 0.0207 | Train Set Acc: 0.9939 |:  38%|███▊      | 180/468 [00:09<00:13, 21.89it/s][A
Loss: 0.0207 | Train Set Acc: 0.9939 |:  38%|███▊      | 180/468 [00:09<00:13, 21.89it/s][A
Loss: 0.0207 | Train Set Acc: 0.9939 |:  39%|███▉      | 183/468 [00:09<00:13, 21.81it/s][A
Loss: 0.0206 | Train Set Acc: 0.9939 |:  39%|███▉      | 183/468 [00:09<00:13, 21.81it/s][A
Loss: 0.0206 | Train Set Acc: 0.9940 |:  39%|███▉      | 183/468 [00:09<00:13, 21.81it/s][A
Loss: 0.0205 | Train Set Acc: 0.9940 |:  39%|███▉      | 183/468 [00:0

Loss: 0.0208 | Train Set Acc: 0.9938 |:  52%|█████▏    | 242/468 [00:12<00:12, 18.79it/s][A
Loss: 0.0207 | Train Set Acc: 0.9938 |:  52%|█████▏    | 242/468 [00:12<00:12, 18.79it/s][A
Loss: 0.0207 | Train Set Acc: 0.9938 |:  52%|█████▏    | 244/468 [00:12<00:11, 18.88it/s][A
Loss: 0.0207 | Train Set Acc: 0.9938 |:  52%|█████▏    | 244/468 [00:12<00:11, 18.88it/s][A
Loss: 0.0206 | Train Set Acc: 0.9938 |:  52%|█████▏    | 244/468 [00:12<00:11, 18.88it/s][A
Loss: 0.0206 | Train Set Acc: 0.9939 |:  52%|█████▏    | 244/468 [00:12<00:11, 18.88it/s][A
Loss: 0.0206 | Train Set Acc: 0.9939 |:  53%|█████▎    | 247/468 [00:12<00:11, 19.22it/s][A
Loss: 0.0205 | Train Set Acc: 0.9939 |:  53%|█████▎    | 247/468 [00:12<00:11, 19.22it/s][A
Loss: 0.0205 | Train Set Acc: 0.9939 |:  53%|█████▎    | 247/468 [00:12<00:11, 19.22it/s][A
Loss: 0.0205 | Train Set Acc: 0.9939 |:  53%|█████▎    | 249/468 [00:12<00:11, 19.40it/s][A
Loss: 0.0205 | Train Set Acc: 0.9938 |:  53%|█████▎    | 249/468 [00:1

Loss: 0.0210 | Train Set Acc: 0.9937 |:  65%|██████▌   | 306/468 [00:15<00:07, 22.78it/s][A
Loss: 0.0209 | Train Set Acc: 0.9937 |:  65%|██████▌   | 306/468 [00:15<00:07, 22.78it/s][A
Loss: 0.0209 | Train Set Acc: 0.9937 |:  65%|██████▌   | 306/468 [00:15<00:07, 22.78it/s][A
Loss: 0.0209 | Train Set Acc: 0.9937 |:  66%|██████▌   | 309/468 [00:15<00:07, 22.03it/s][A
Loss: 0.0209 | Train Set Acc: 0.9937 |:  66%|██████▌   | 309/468 [00:15<00:07, 22.03it/s][A
Loss: 0.0209 | Train Set Acc: 0.9937 |:  66%|██████▌   | 309/468 [00:15<00:07, 22.03it/s][A
Loss: 0.0208 | Train Set Acc: 0.9937 |:  66%|██████▌   | 309/468 [00:15<00:07, 22.03it/s][A
Loss: 0.0208 | Train Set Acc: 0.9937 |:  67%|██████▋   | 312/468 [00:15<00:07, 21.08it/s][A
Loss: 0.0208 | Train Set Acc: 0.9937 |:  67%|██████▋   | 312/468 [00:15<00:07, 21.08it/s][A
Loss: 0.0208 | Train Set Acc: 0.9937 |:  67%|██████▋   | 312/468 [00:15<00:07, 21.08it/s][A
Loss: 0.0209 | Train Set Acc: 0.9937 |:  67%|██████▋   | 312/468 [00:1

Loss: 0.0211 | Train Set Acc: 0.9935 |:  79%|███████▊  | 368/468 [00:18<00:05, 18.07it/s][A
Loss: 0.0211 | Train Set Acc: 0.9935 |:  79%|███████▉  | 371/468 [00:18<00:05, 18.97it/s][A
Loss: 0.0211 | Train Set Acc: 0.9935 |:  79%|███████▉  | 371/468 [00:18<00:05, 18.97it/s][A
Loss: 0.0212 | Train Set Acc: 0.9934 |:  79%|███████▉  | 371/468 [00:18<00:05, 18.97it/s][A
Loss: 0.0213 | Train Set Acc: 0.9934 |:  79%|███████▉  | 371/468 [00:18<00:05, 18.97it/s][A
Loss: 0.0213 | Train Set Acc: 0.9934 |:  80%|███████▉  | 374/468 [00:18<00:04, 19.66it/s][A
Loss: 0.0213 | Train Set Acc: 0.9934 |:  80%|███████▉  | 374/468 [00:18<00:04, 19.66it/s][A
Loss: 0.0214 | Train Set Acc: 0.9934 |:  80%|███████▉  | 374/468 [00:18<00:04, 19.66it/s][A
Loss: 0.0214 | Train Set Acc: 0.9934 |:  80%|███████▉  | 374/468 [00:18<00:04, 19.66it/s][A
Loss: 0.0214 | Train Set Acc: 0.9934 |:  81%|████████  | 377/468 [00:18<00:04, 20.63it/s][A
Loss: 0.0215 | Train Set Acc: 0.9934 |:  81%|████████  | 377/468 [00:1

Loss: 0.0220 | Train Set Acc: 0.9932 |:  93%|█████████▎| 434/468 [00:21<00:01, 20.58it/s][A
Loss: 0.0220 | Train Set Acc: 0.9932 |:  93%|█████████▎| 437/468 [00:21<00:01, 20.17it/s][A
Loss: 0.0220 | Train Set Acc: 0.9932 |:  93%|█████████▎| 437/468 [00:21<00:01, 20.17it/s][A
Loss: 0.0221 | Train Set Acc: 0.9932 |:  93%|█████████▎| 437/468 [00:21<00:01, 20.17it/s][A
Loss: 0.0223 | Train Set Acc: 0.9931 |:  93%|█████████▎| 437/468 [00:21<00:01, 20.17it/s][A
Loss: 0.0223 | Train Set Acc: 0.9931 |:  94%|█████████▍| 440/468 [00:21<00:01, 19.97it/s][A
Loss: 0.0223 | Train Set Acc: 0.9931 |:  94%|█████████▍| 440/468 [00:21<00:01, 19.97it/s][A
Loss: 0.0222 | Train Set Acc: 0.9931 |:  94%|█████████▍| 440/468 [00:21<00:01, 19.97it/s][A
Loss: 0.0223 | Train Set Acc: 0.9931 |:  94%|█████████▍| 440/468 [00:21<00:01, 19.97it/s][A
Loss: 0.0223 | Train Set Acc: 0.9931 |:  95%|█████████▍| 443/468 [00:21<00:01, 20.08it/s][A
Loss: 0.0223 | Train Set Acc: 0.9931 |:  95%|█████████▍| 443/468 [00:2

Loss: 0.0273 | Train Set Acc: 0.9908 |:   7%|▋         | 33/468 [00:01<00:20, 21.45it/s][A
Loss: 0.0266 | Train Set Acc: 0.9910 |:   7%|▋         | 33/468 [00:01<00:20, 21.45it/s][A
Loss: 0.0262 | Train Set Acc: 0.9913 |:   7%|▋         | 33/468 [00:01<00:20, 21.45it/s][A
Loss: 0.0258 | Train Set Acc: 0.9915 |:   7%|▋         | 33/468 [00:01<00:20, 21.45it/s][A
Loss: 0.0258 | Train Set Acc: 0.9915 |:   8%|▊         | 36/468 [00:01<00:20, 21.55it/s][A
Loss: 0.0252 | Train Set Acc: 0.9918 |:   8%|▊         | 36/468 [00:01<00:20, 21.55it/s][A
Loss: 0.0253 | Train Set Acc: 0.9918 |:   8%|▊         | 36/468 [00:01<00:20, 21.55it/s][A
Loss: 0.0250 | Train Set Acc: 0.9918 |:   8%|▊         | 36/468 [00:01<00:20, 21.55it/s][A
Loss: 0.0250 | Train Set Acc: 0.9918 |:   8%|▊         | 39/468 [00:01<00:20, 21.40it/s][A
Loss: 0.0256 | Train Set Acc: 0.9910 |:   8%|▊         | 39/468 [00:01<00:20, 21.40it/s][A
Loss: 0.0255 | Train Set Acc: 0.9910 |:   8%|▊         | 39/468 [00:01<00:20, 21

Loss: 0.0218 | Train Set Acc: 0.9931 |:  21%|██        | 97/468 [00:04<00:18, 20.29it/s][A
Loss: 0.0220 | Train Set Acc: 0.9930 |:  21%|██        | 97/468 [00:04<00:18, 20.29it/s][A
Loss: 0.0220 | Train Set Acc: 0.9930 |:  21%|██▏       | 100/468 [00:04<00:18, 20.30it/s][A
Loss: 0.0220 | Train Set Acc: 0.9930 |:  21%|██▏       | 100/468 [00:04<00:18, 20.30it/s][A
Loss: 0.0219 | Train Set Acc: 0.9930 |:  21%|██▏       | 100/468 [00:04<00:18, 20.30it/s][A
Loss: 0.0219 | Train Set Acc: 0.9929 |:  21%|██▏       | 100/468 [00:05<00:18, 20.30it/s][A
Loss: 0.0219 | Train Set Acc: 0.9929 |:  22%|██▏       | 103/468 [00:05<00:17, 20.51it/s][A
Loss: 0.0218 | Train Set Acc: 0.9929 |:  22%|██▏       | 103/468 [00:05<00:17, 20.51it/s][A
Loss: 0.0217 | Train Set Acc: 0.9930 |:  22%|██▏       | 103/468 [00:05<00:17, 20.51it/s][A
Loss: 0.0218 | Train Set Acc: 0.9929 |:  22%|██▏       | 103/468 [00:05<00:17, 20.51it/s][A
Loss: 0.0218 | Train Set Acc: 0.9929 |:  23%|██▎       | 106/468 [00:05<

Loss: 0.0201 | Train Set Acc: 0.9935 |:  35%|███▍      | 162/468 [00:08<00:15, 19.38it/s][A
Loss: 0.0200 | Train Set Acc: 0.9935 |:  35%|███▍      | 162/468 [00:08<00:15, 19.38it/s][A
Loss: 0.0200 | Train Set Acc: 0.9935 |:  35%|███▌      | 164/468 [00:08<00:17, 17.12it/s][A
Loss: 0.0199 | Train Set Acc: 0.9936 |:  35%|███▌      | 164/468 [00:08<00:17, 17.12it/s][A
Loss: 0.0198 | Train Set Acc: 0.9936 |:  35%|███▌      | 164/468 [00:08<00:17, 17.12it/s][A
Loss: 0.0198 | Train Set Acc: 0.9936 |:  35%|███▌      | 166/468 [00:08<00:18, 16.29it/s][A
Loss: 0.0198 | Train Set Acc: 0.9936 |:  35%|███▌      | 166/468 [00:08<00:18, 16.29it/s][A
Loss: 0.0197 | Train Set Acc: 0.9936 |:  35%|███▌      | 166/468 [00:08<00:18, 16.29it/s][A
Loss: 0.0197 | Train Set Acc: 0.9936 |:  36%|███▌      | 168/468 [00:08<00:19, 15.46it/s][A
Loss: 0.0196 | Train Set Acc: 0.9937 |:  36%|███▌      | 168/468 [00:08<00:19, 15.46it/s][A
Loss: 0.0196 | Train Set Acc: 0.9937 |:  36%|███▌      | 168/468 [00:0

Loss: 0.0189 | Train Set Acc: 0.9937 |:  48%|████▊     | 223/468 [00:11<00:13, 17.91it/s][A
Loss: 0.0190 | Train Set Acc: 0.9937 |:  48%|████▊     | 223/468 [00:11<00:13, 17.91it/s][A
Loss: 0.0190 | Train Set Acc: 0.9937 |:  48%|████▊     | 225/468 [00:11<00:13, 17.96it/s][A
Loss: 0.0189 | Train Set Acc: 0.9937 |:  48%|████▊     | 225/468 [00:11<00:13, 17.96it/s][A
Loss: 0.0189 | Train Set Acc: 0.9937 |:  48%|████▊     | 225/468 [00:11<00:13, 17.96it/s][A
Loss: 0.0189 | Train Set Acc: 0.9937 |:  49%|████▊     | 227/468 [00:11<00:13, 17.61it/s][A
Loss: 0.0188 | Train Set Acc: 0.9938 |:  49%|████▊     | 227/468 [00:11<00:13, 17.61it/s][A
Loss: 0.0188 | Train Set Acc: 0.9938 |:  49%|████▊     | 227/468 [00:11<00:13, 17.61it/s][A
Loss: 0.0188 | Train Set Acc: 0.9938 |:  49%|████▉     | 229/468 [00:11<00:13, 17.79it/s][A
Loss: 0.0189 | Train Set Acc: 0.9938 |:  49%|████▉     | 229/468 [00:11<00:13, 17.79it/s][A
Loss: 0.0189 | Train Set Acc: 0.9937 |:  49%|████▉     | 229/468 [00:1

Loss: 0.0196 | Train Set Acc: 0.9935 |:  61%|██████    | 286/468 [00:14<00:09, 19.55it/s][A
Loss: 0.0196 | Train Set Acc: 0.9935 |:  62%|██████▏   | 288/468 [00:14<00:09, 19.58it/s][A
Loss: 0.0196 | Train Set Acc: 0.9935 |:  62%|██████▏   | 288/468 [00:14<00:09, 19.58it/s][A
Loss: 0.0199 | Train Set Acc: 0.9935 |:  62%|██████▏   | 288/468 [00:14<00:09, 19.58it/s][A
Loss: 0.0199 | Train Set Acc: 0.9935 |:  62%|██████▏   | 290/468 [00:14<00:09, 19.55it/s][A
Loss: 0.0199 | Train Set Acc: 0.9935 |:  62%|██████▏   | 290/468 [00:14<00:09, 19.55it/s][A
Loss: 0.0199 | Train Set Acc: 0.9935 |:  62%|██████▏   | 290/468 [00:14<00:09, 19.55it/s][A
Loss: 0.0199 | Train Set Acc: 0.9935 |:  62%|██████▏   | 292/468 [00:14<00:08, 19.64it/s][A
Loss: 0.0200 | Train Set Acc: 0.9935 |:  62%|██████▏   | 292/468 [00:14<00:08, 19.64it/s][A
Loss: 0.0200 | Train Set Acc: 0.9934 |:  62%|██████▏   | 292/468 [00:15<00:08, 19.64it/s][A
Loss: 0.0200 | Train Set Acc: 0.9934 |:  63%|██████▎   | 294/468 [00:1

Loss: 0.0196 | Train Set Acc: 0.9937 |:  75%|███████▍  | 349/468 [00:17<00:05, 20.69it/s][A
Loss: 0.0197 | Train Set Acc: 0.9937 |:  75%|███████▍  | 349/468 [00:17<00:05, 20.69it/s][A
Loss: 0.0197 | Train Set Acc: 0.9937 |:  75%|███████▌  | 352/468 [00:17<00:05, 20.46it/s][A
Loss: 0.0197 | Train Set Acc: 0.9937 |:  75%|███████▌  | 352/468 [00:17<00:05, 20.46it/s][A
Loss: 0.0197 | Train Set Acc: 0.9936 |:  75%|███████▌  | 352/468 [00:17<00:05, 20.46it/s][A
Loss: 0.0197 | Train Set Acc: 0.9936 |:  75%|███████▌  | 352/468 [00:18<00:05, 20.46it/s][A
Loss: 0.0197 | Train Set Acc: 0.9936 |:  76%|███████▌  | 355/468 [00:18<00:05, 20.75it/s][A
Loss: 0.0197 | Train Set Acc: 0.9937 |:  76%|███████▌  | 355/468 [00:18<00:05, 20.75it/s][A
Loss: 0.0196 | Train Set Acc: 0.9937 |:  76%|███████▌  | 355/468 [00:18<00:05, 20.75it/s][A
Loss: 0.0197 | Train Set Acc: 0.9937 |:  76%|███████▌  | 355/468 [00:18<00:05, 20.75it/s][A
Loss: 0.0197 | Train Set Acc: 0.9937 |:  76%|███████▋  | 358/468 [00:1

Loss: 0.0202 | Train Set Acc: 0.9933 |:  88%|████████▊ | 414/468 [00:20<00:02, 19.22it/s][A
Loss: 0.0203 | Train Set Acc: 0.9932 |:  88%|████████▊ | 414/468 [00:21<00:02, 19.22it/s][A
Loss: 0.0202 | Train Set Acc: 0.9932 |:  88%|████████▊ | 414/468 [00:21<00:02, 19.22it/s][A
Loss: 0.0202 | Train Set Acc: 0.9932 |:  89%|████████▉ | 416/468 [00:21<00:02, 18.91it/s][A
Loss: 0.0202 | Train Set Acc: 0.9932 |:  89%|████████▉ | 416/468 [00:21<00:02, 18.91it/s][A
Loss: 0.0202 | Train Set Acc: 0.9932 |:  89%|████████▉ | 416/468 [00:21<00:02, 18.91it/s][A
Loss: 0.0202 | Train Set Acc: 0.9932 |:  89%|████████▉ | 418/468 [00:21<00:02, 19.13it/s][A
Loss: 0.0202 | Train Set Acc: 0.9932 |:  89%|████████▉ | 418/468 [00:21<00:02, 19.13it/s][A
Loss: 0.0202 | Train Set Acc: 0.9932 |:  89%|████████▉ | 418/468 [00:21<00:02, 19.13it/s][A
Loss: 0.0203 | Train Set Acc: 0.9932 |:  89%|████████▉ | 418/468 [00:21<00:02, 19.13it/s][A
Loss: 0.0203 | Train Set Acc: 0.9932 |:  90%|████████▉ | 421/468 [00:2

Loss: 0.0103 | Train Set Acc: 0.9974 |:   1%|▏         | 7/468 [00:00<00:22, 20.57it/s][A
Loss: 0.0103 | Train Set Acc: 0.9974 |:   2%|▏         | 9/468 [00:00<00:23, 19.81it/s][A
Loss: 0.0112 | Train Set Acc: 0.9969 |:   2%|▏         | 9/468 [00:00<00:23, 19.81it/s][A
Loss: 0.0105 | Train Set Acc: 0.9972 |:   2%|▏         | 9/468 [00:00<00:23, 19.81it/s][A
Loss: 0.0105 | Train Set Acc: 0.9972 |:   2%|▏         | 11/468 [00:00<00:23, 19.20it/s][A
Loss: 0.0097 | Train Set Acc: 0.9974 |:   2%|▏         | 11/468 [00:00<00:23, 19.20it/s][A
Loss: 0.0116 | Train Set Acc: 0.9970 |:   2%|▏         | 11/468 [00:00<00:23, 19.20it/s][A
Loss: 0.0109 | Train Set Acc: 0.9972 |:   2%|▏         | 11/468 [00:00<00:23, 19.20it/s][A
Loss: 0.0109 | Train Set Acc: 0.9972 |:   3%|▎         | 14/468 [00:00<00:23, 19.52it/s][A
Loss: 0.0112 | Train Set Acc: 0.9969 |:   3%|▎         | 14/468 [00:00<00:23, 19.52it/s][A
Loss: 0.0108 | Train Set Acc: 0.9971 |:   3%|▎         | 14/468 [00:00<00:23, 19.52i

Loss: 0.0117 | Train Set Acc: 0.9965 |:  15%|█▍        | 70/468 [00:03<00:19, 20.13it/s][A
Loss: 0.0129 | Train Set Acc: 0.9964 |:  15%|█▍        | 70/468 [00:03<00:19, 20.13it/s][A
Loss: 0.0129 | Train Set Acc: 0.9964 |:  16%|█▌        | 73/468 [00:03<00:20, 19.60it/s][A
Loss: 0.0130 | Train Set Acc: 0.9962 |:  16%|█▌        | 73/468 [00:03<00:20, 19.60it/s][A
Loss: 0.0129 | Train Set Acc: 0.9962 |:  16%|█▌        | 73/468 [00:03<00:20, 19.60it/s][A
Loss: 0.0128 | Train Set Acc: 0.9963 |:  16%|█▌        | 73/468 [00:03<00:20, 19.60it/s][A
Loss: 0.0128 | Train Set Acc: 0.9963 |:  16%|█▌        | 76/468 [00:03<00:19, 20.46it/s][A
Loss: 0.0128 | Train Set Acc: 0.9963 |:  16%|█▌        | 76/468 [00:03<00:19, 20.46it/s][A
Loss: 0.0130 | Train Set Acc: 0.9963 |:  16%|█▌        | 76/468 [00:03<00:19, 20.46it/s][A
Loss: 0.0130 | Train Set Acc: 0.9961 |:  16%|█▌        | 76/468 [00:03<00:19, 20.46it/s][A
Loss: 0.0130 | Train Set Acc: 0.9961 |:  17%|█▋        | 79/468 [00:03<00:18, 21

Loss: 0.0155 | Train Set Acc: 0.9953 |:  29%|██▉       | 136/468 [00:06<00:17, 19.07it/s][A
Loss: 0.0154 | Train Set Acc: 0.9953 |:  29%|██▉       | 136/468 [00:06<00:17, 19.07it/s][A
Loss: 0.0155 | Train Set Acc: 0.9953 |:  29%|██▉       | 136/468 [00:06<00:17, 19.07it/s][A
Loss: 0.0154 | Train Set Acc: 0.9953 |:  29%|██▉       | 136/468 [00:07<00:17, 19.07it/s][A
Loss: 0.0154 | Train Set Acc: 0.9953 |:  30%|██▉       | 139/468 [00:07<00:16, 19.39it/s][A
Loss: 0.0154 | Train Set Acc: 0.9953 |:  30%|██▉       | 139/468 [00:07<00:16, 19.39it/s][A
Loss: 0.0153 | Train Set Acc: 0.9953 |:  30%|██▉       | 139/468 [00:07<00:16, 19.39it/s][A
Loss: 0.0153 | Train Set Acc: 0.9953 |:  30%|███       | 141/468 [00:07<00:16, 19.42it/s][A
Loss: 0.0153 | Train Set Acc: 0.9953 |:  30%|███       | 141/468 [00:07<00:16, 19.42it/s][A
Loss: 0.0152 | Train Set Acc: 0.9954 |:  30%|███       | 141/468 [00:07<00:16, 19.42it/s][A
Loss: 0.0152 | Train Set Acc: 0.9954 |:  31%|███       | 143/468 [00:0

Loss: 0.0148 | Train Set Acc: 0.9955 |:  43%|████▎     | 199/468 [00:09<00:12, 22.22it/s][A
Loss: 0.0147 | Train Set Acc: 0.9955 |:  43%|████▎     | 199/468 [00:09<00:12, 22.22it/s][A
Loss: 0.0147 | Train Set Acc: 0.9955 |:  43%|████▎     | 199/468 [00:10<00:12, 22.22it/s][A
Loss: 0.0147 | Train Set Acc: 0.9955 |:  43%|████▎     | 202/468 [00:10<00:11, 22.24it/s][A
Loss: 0.0147 | Train Set Acc: 0.9955 |:  43%|████▎     | 202/468 [00:10<00:11, 22.24it/s][A
Loss: 0.0146 | Train Set Acc: 0.9955 |:  43%|████▎     | 202/468 [00:10<00:11, 22.24it/s][A
Loss: 0.0146 | Train Set Acc: 0.9955 |:  43%|████▎     | 202/468 [00:10<00:11, 22.24it/s][A
Loss: 0.0146 | Train Set Acc: 0.9955 |:  44%|████▍     | 205/468 [00:10<00:12, 21.22it/s][A
Loss: 0.0147 | Train Set Acc: 0.9955 |:  44%|████▍     | 205/468 [00:10<00:12, 21.22it/s][A
Loss: 0.0147 | Train Set Acc: 0.9955 |:  44%|████▍     | 205/468 [00:10<00:12, 21.22it/s][A
Loss: 0.0146 | Train Set Acc: 0.9956 |:  44%|████▍     | 205/468 [00:1

Loss: 0.0163 | Train Set Acc: 0.9949 |:  56%|█████▌    | 262/468 [00:13<00:11, 17.47it/s][A
Loss: 0.0163 | Train Set Acc: 0.9949 |:  56%|█████▋    | 264/468 [00:13<00:11, 17.19it/s][A
Loss: 0.0163 | Train Set Acc: 0.9949 |:  56%|█████▋    | 264/468 [00:13<00:11, 17.19it/s][A
Loss: 0.0164 | Train Set Acc: 0.9949 |:  56%|█████▋    | 264/468 [00:13<00:11, 17.19it/s][A
Loss: 0.0164 | Train Set Acc: 0.9949 |:  57%|█████▋    | 266/468 [00:13<00:11, 17.31it/s][A
Loss: 0.0163 | Train Set Acc: 0.9949 |:  57%|█████▋    | 266/468 [00:13<00:11, 17.31it/s][A
Loss: 0.0163 | Train Set Acc: 0.9949 |:  57%|█████▋    | 266/468 [00:13<00:11, 17.31it/s][A
Loss: 0.0163 | Train Set Acc: 0.9949 |:  57%|█████▋    | 268/468 [00:13<00:11, 17.12it/s][A
Loss: 0.0163 | Train Set Acc: 0.9949 |:  57%|█████▋    | 268/468 [00:13<00:11, 17.12it/s][A
Loss: 0.0163 | Train Set Acc: 0.9949 |:  57%|█████▋    | 268/468 [00:13<00:11, 17.12it/s][A
Loss: 0.0163 | Train Set Acc: 0.9949 |:  58%|█████▊    | 270/468 [00:1

Loss: 0.0158 | Train Set Acc: 0.9951 |:  70%|██████▉   | 326/468 [00:16<00:07, 19.74it/s][A
Loss: 0.0158 | Train Set Acc: 0.9951 |:  70%|██████▉   | 326/468 [00:16<00:07, 19.74it/s][A
Loss: 0.0157 | Train Set Acc: 0.9951 |:  70%|██████▉   | 326/468 [00:16<00:07, 19.74it/s][A
Loss: 0.0157 | Train Set Acc: 0.9951 |:  70%|███████   | 328/468 [00:16<00:07, 19.54it/s][A
Loss: 0.0158 | Train Set Acc: 0.9951 |:  70%|███████   | 328/468 [00:16<00:07, 19.54it/s][A
Loss: 0.0158 | Train Set Acc: 0.9951 |:  70%|███████   | 328/468 [00:16<00:07, 19.54it/s][A
Loss: 0.0158 | Train Set Acc: 0.9951 |:  71%|███████   | 330/468 [00:16<00:07, 19.35it/s][A
Loss: 0.0158 | Train Set Acc: 0.9951 |:  71%|███████   | 330/468 [00:16<00:07, 19.35it/s][A
Loss: 0.0158 | Train Set Acc: 0.9951 |:  71%|███████   | 330/468 [00:16<00:07, 19.35it/s][A
Loss: 0.0158 | Train Set Acc: 0.9951 |:  71%|███████   | 332/468 [00:16<00:07, 19.39it/s][A
Loss: 0.0157 | Train Set Acc: 0.9951 |:  71%|███████   | 332/468 [00:1

Loss: 0.0155 | Train Set Acc: 0.9953 |:  83%|████████▎ | 387/468 [00:19<00:03, 20.74it/s][A
Loss: 0.0157 | Train Set Acc: 0.9952 |:  83%|████████▎ | 387/468 [00:19<00:03, 20.74it/s][A
Loss: 0.0157 | Train Set Acc: 0.9952 |:  83%|████████▎ | 390/468 [00:19<00:03, 21.23it/s][A
Loss: 0.0157 | Train Set Acc: 0.9952 |:  83%|████████▎ | 390/468 [00:19<00:03, 21.23it/s][A
Loss: 0.0157 | Train Set Acc: 0.9952 |:  83%|████████▎ | 390/468 [00:19<00:03, 21.23it/s][A
Loss: 0.0157 | Train Set Acc: 0.9952 |:  83%|████████▎ | 390/468 [00:19<00:03, 21.23it/s][A
Loss: 0.0157 | Train Set Acc: 0.9952 |:  84%|████████▍ | 393/468 [00:19<00:03, 21.86it/s][A
Loss: 0.0158 | Train Set Acc: 0.9952 |:  84%|████████▍ | 393/468 [00:19<00:03, 21.86it/s][A
Loss: 0.0158 | Train Set Acc: 0.9952 |:  84%|████████▍ | 393/468 [00:19<00:03, 21.86it/s][A
Loss: 0.0158 | Train Set Acc: 0.9952 |:  84%|████████▍ | 393/468 [00:19<00:03, 21.86it/s][A
Loss: 0.0158 | Train Set Acc: 0.9952 |:  85%|████████▍ | 396/468 [00:1

Loss: 0.0157 | Train Set Acc: 0.9952 |:  97%|█████████▋| 452/468 [00:22<00:00, 18.97it/s][A
Loss: 0.0157 | Train Set Acc: 0.9952 |:  97%|█████████▋| 452/468 [00:22<00:00, 18.97it/s][A
Loss: 0.0157 | Train Set Acc: 0.9952 |:  97%|█████████▋| 454/468 [00:22<00:00, 19.06it/s][A
Loss: 0.0158 | Train Set Acc: 0.9952 |:  97%|█████████▋| 454/468 [00:22<00:00, 19.06it/s][A
Loss: 0.0158 | Train Set Acc: 0.9952 |:  97%|█████████▋| 454/468 [00:22<00:00, 19.06it/s][A
Loss: 0.0158 | Train Set Acc: 0.9952 |:  97%|█████████▋| 456/468 [00:22<00:00, 18.86it/s][A
Loss: 0.0158 | Train Set Acc: 0.9952 |:  97%|█████████▋| 456/468 [00:22<00:00, 18.86it/s][A
Loss: 0.0158 | Train Set Acc: 0.9952 |:  97%|█████████▋| 456/468 [00:23<00:00, 18.86it/s][A
Loss: 0.0158 | Train Set Acc: 0.9952 |:  98%|█████████▊| 458/468 [00:23<00:00, 18.77it/s][A
Loss: 0.0158 | Train Set Acc: 0.9952 |:  98%|█████████▊| 458/468 [00:23<00:00, 18.77it/s][A
Loss: 0.0158 | Train Set Acc: 0.9952 |:  98%|█████████▊| 458/468 [00:2

#### Q5:
Please print the training and testing accuracy.

In [19]:
# Q5: one-line summary of the train/test accuracy.
# NOTE(review): `epoch`, `train_acc` and `test_acc` are not defined in this
# cell -- presumably they are left over from the training-loop cell, so that
# cell must have been run first; confirm on a fresh kernel (Restart & Run All).
print(
    "Epoch: %d Train Acc: %.4f; Test Acc: %.4f"
    % (epoch, train_acc, test_acc)
)

Epoch: 9 Train Acc: 0.9951; Test Acc: 0.9884
