In [44]:
import torch
import torch.nn as nn
import torchvision
import torchvision.transforms as transforms

In [45]:
# Run on the GPU when CUDA is usable, otherwise fall back to the CPU.
if torch.cuda.is_available():
    device = torch.device('cuda')
else:
    device = torch.device('cpu')

In [46]:
# Hyper-parameters and run configuration
seed = 42              # seed for torch's global RNG so reruns start from the same state
input_size = 784       # features per sample fed to the first Linear layer (28*28)
hidden_size = 500      # units in the hidden layer
num_classes = 10       # outputs of the final Linear layer
num_epochs = 20        # full passes over the training loader
# NOTE(review): with batch_size = 1 every optimizer step sees a single sample
# (60000 steps per epoch in the saved training log) - confirm this is intended.
batch_size = 1
learning_rate = 0.001  # lr passed to the Adam optimizer

# Seed before any model or DataLoader is created: weight initialisation and
# the shuffle order both draw from torch's global RNG.
torch.manual_seed(seed);

### MNIST dataset 

In [47]:
# Training split of MNIST (train=True) stored under `root`; download=True lets
# torchvision fetch the files when they are not on disk yet.
# ToTensor is applied to each image when a sample is read.
train_dataset = torchvision.datasets.MNIST(
    root='..//set',
    train=True,
    download=True,
    transform=transforms.ToTensor(),
)

In [48]:
# Test split of MNIST (train=False). No download flag is passed here, so the
# files are expected to be present under `root` already.
# NOTE(review): root is written '..///set' here but '..//set' for the training
# split - presumably the same directory; confirm.
test_dataset = torchvision.datasets.MNIST(
    root='..///set',
    train=False,
    transform=transforms.ToTensor(),
)

In [49]:
# Batch iterators over the two splits, both using `batch_size`.
# The training loader shuffles its samples; the test loader keeps dataset order.
train_loader = torch.utils.data.DataLoader(
    train_dataset,
    batch_size=batch_size,
    shuffle=True,
)

test_loader = torch.utils.data.DataLoader(
    test_dataset,
    batch_size=batch_size,
    shuffle=False,
)

In [None]:
# Load SqueezeNet 1.0 through torch.hub from the pytorch/vision v0.6.0 repo,
# requesting pretrained=True.
# NOTE(review): `model` is rebound to a NeuralNet instance in a later cell
# before any visible cell uses this network, and this cell has no execution
# count - confirm whether it is still needed.
model = torch.hub.load('pytorch/vision:v0.6.0', 'squeezenet1_0', pretrained=True)

### Fully connected neural network

In [None]:
# Preprocessing pipeline: resize to 224, convert to a tensor, then expand the
# leading (channel) axis to 3 while keeping the other two sizes.
# expand() only works here when that leading axis has size 1 - presumably
# single-channel images; confirm.
# NOTE(review): no other visible cell references `scaling`.
scaling = transforms.Compose([
    transforms.Resize(224),
    transforms.ToTensor(),
    transforms.Lambda(lambda img: img.expand(3, -1, -1)),
])

In [50]:
class NeuralNet(nn.Module):
    """Feed-forward network with one hidden layer: Linear -> ReLU -> Linear.

    Args:
        input_size: number of features in each input vector.
        hidden_size: number of units in the hidden layer.
        num_classes: number of values the last layer produces per input.
    """

    def __init__(self, input_size, hidden_size, num_classes):
        super().__init__()
        # Sub-modules are created in the order forward() applies them.
        self.fc1 = nn.Linear(in_features=input_size, out_features=hidden_size)
        self.relu = nn.ReLU()
        self.fc2 = nn.Linear(in_features=hidden_size, out_features=num_classes)

    def forward(self, x):
        """Return the raw outputs of the last layer for ``x`` (no softmax is applied)."""
        hidden = self.relu(self.fc1(x))
        return self.fc2(hidden)

In [51]:
# Build the network from the hyper-parameters, then move it to `device`.
model = NeuralNet(input_size=input_size,
                  hidden_size=hidden_size,
                  num_classes=num_classes)
model = model.to(device)

### Loss and optimizer

In [52]:
# Adam updates every parameter of `model` with step size `learning_rate`;
# the quantity being minimised is the cross-entropy loss.
optimizer = torch.optim.Adam(params=model.parameters(), lr=learning_rate)
criterion = nn.CrossEntropyLoss()

### Train Model

In [None]:
# Train the network: one optimizer step per batch drawn from train_loader.
total_step = len(train_loader)  # batches per epoch, shown in the progress line

# Set training mode explicitly so the loop does not depend on whatever mode
# an earlier cell left the module in.
model.train()

for epoch in range(num_epochs):
    for i, (images, labels) in enumerate(train_loader):
        # Flatten every image to a vector of length input_size (the width the
        # model's first layer was built with) and move both tensors to the
        # configured device
        images = images.reshape(-1, input_size).to(device)
        labels = labels.to(device)

        # Forward pass
        outputs = model(images)
        loss = criterion(outputs, labels)

        # Backpropagation and optimization: clear the previous gradients,
        # compute new ones, then update the parameters
        optimizer.zero_grad()
        loss.backward()
        optimizer.step()

        # Progress line every 100 steps; the value is the loss of the
        # current batch only, not a running average
        if (i+1) % 100 == 0:
            print ('Epoch [{}/{}], Step [{}/{}], Loss: {:.4f}' 
                   .format(epoch+1, num_epochs, i+1, total_step, loss.item()))

Epoch [1/20], Step [100/60000], Loss: 2.6201
Epoch [1/20], Step [200/60000], Loss: 0.9726
Epoch [1/20], Step [300/60000], Loss: 0.0760
Epoch [1/20], Step [400/60000], Loss: 0.0181
Epoch [1/20], Step [500/60000], Loss: 1.9133
Epoch [1/20], Step [600/60000], Loss: 0.0760
Epoch [1/20], Step [700/60000], Loss: 0.1122
Epoch [1/20], Step [800/60000], Loss: 0.0147
Epoch [1/20], Step [900/60000], Loss: 0.3848
Epoch [1/20], Step [1000/60000], Loss: 0.0041
Epoch [1/20], Step [1100/60000], Loss: 1.1265
Epoch [1/20], Step [1200/60000], Loss: 0.6525
Epoch [1/20], Step [1300/60000], Loss: 0.0211
Epoch [1/20], Step [1400/60000], Loss: 0.4906
Epoch [1/20], Step [1500/60000], Loss: 0.0016
Epoch [1/20], Step [1600/60000], Loss: 0.0045
Epoch [1/20], Step [1700/60000], Loss: 1.3407
Epoch [1/20], Step [1800/60000], Loss: 0.0001
Epoch [1/20], Step [1900/60000], Loss: 0.6571
Epoch [1/20], Step [2000/60000], Loss: 0.9784
Epoch [1/20], Step [2100/60000], Loss: 0.0035
Epoch [1/20], Step [2200/60000], Loss: 0.00

Epoch [1/20], Step [17800/60000], Loss: 0.0000
Epoch [1/20], Step [17900/60000], Loss: 0.0024
Epoch [1/20], Step [18000/60000], Loss: 0.0000
Epoch [1/20], Step [18100/60000], Loss: 0.0016
Epoch [1/20], Step [18200/60000], Loss: 0.0001
Epoch [1/20], Step [18300/60000], Loss: 1.1044
Epoch [1/20], Step [18400/60000], Loss: 0.4465
Epoch [1/20], Step [18500/60000], Loss: 0.0158
Epoch [1/20], Step [18600/60000], Loss: 0.0049
Epoch [1/20], Step [18700/60000], Loss: 0.0082
Epoch [1/20], Step [18800/60000], Loss: 0.0024
Epoch [1/20], Step [18900/60000], Loss: 0.0000
Epoch [1/20], Step [19000/60000], Loss: 0.0000
Epoch [1/20], Step [19100/60000], Loss: 0.0000
Epoch [1/20], Step [19200/60000], Loss: 0.0042
Epoch [1/20], Step [19300/60000], Loss: 0.0017
Epoch [1/20], Step [19400/60000], Loss: 0.2010
Epoch [1/20], Step [19500/60000], Loss: 0.0000
Epoch [1/20], Step [19600/60000], Loss: 0.0066
Epoch [1/20], Step [19700/60000], Loss: 0.0738
Epoch [1/20], Step [19800/60000], Loss: 0.0000
Epoch [1/20],

Epoch [1/20], Step [35300/60000], Loss: 0.0001
Epoch [1/20], Step [35400/60000], Loss: 0.0084
Epoch [1/20], Step [35500/60000], Loss: 2.9725
Epoch [1/20], Step [35600/60000], Loss: 4.8266
Epoch [1/20], Step [35700/60000], Loss: 0.0000
Epoch [1/20], Step [35800/60000], Loss: 0.0000
Epoch [1/20], Step [35900/60000], Loss: 0.0537
Epoch [1/20], Step [36000/60000], Loss: 0.0000
Epoch [1/20], Step [36100/60000], Loss: 0.0000
Epoch [1/20], Step [36200/60000], Loss: 2.1155
Epoch [1/20], Step [36300/60000], Loss: 0.0032
Epoch [1/20], Step [36400/60000], Loss: 0.0006
Epoch [1/20], Step [36500/60000], Loss: 1.3712
Epoch [1/20], Step [36600/60000], Loss: 0.0078
Epoch [1/20], Step [36700/60000], Loss: 0.0004
Epoch [1/20], Step [36800/60000], Loss: 0.0010
Epoch [1/20], Step [36900/60000], Loss: 0.0000
Epoch [1/20], Step [37000/60000], Loss: 0.0000
Epoch [1/20], Step [37100/60000], Loss: 0.0009
Epoch [1/20], Step [37200/60000], Loss: 0.0606
Epoch [1/20], Step [37300/60000], Loss: 0.0018
Epoch [1/20],

Epoch [1/20], Step [52800/60000], Loss: 0.0002
Epoch [1/20], Step [52900/60000], Loss: 0.0000
Epoch [1/20], Step [53000/60000], Loss: 0.0204
Epoch [1/20], Step [53100/60000], Loss: 0.0000
Epoch [1/20], Step [53200/60000], Loss: 0.0000
Epoch [1/20], Step [53300/60000], Loss: 0.0000
Epoch [1/20], Step [53400/60000], Loss: 0.0000
Epoch [1/20], Step [53500/60000], Loss: 0.0000
Epoch [1/20], Step [53600/60000], Loss: 0.0001
Epoch [1/20], Step [53700/60000], Loss: 0.0000
Epoch [1/20], Step [53800/60000], Loss: 5.1784
Epoch [1/20], Step [53900/60000], Loss: 0.0028
Epoch [1/20], Step [54000/60000], Loss: 0.0000
Epoch [1/20], Step [54100/60000], Loss: 0.9091
Epoch [1/20], Step [54200/60000], Loss: 0.3173
Epoch [1/20], Step [54300/60000], Loss: 0.0001
Epoch [1/20], Step [54400/60000], Loss: 0.0093
Epoch [1/20], Step [54500/60000], Loss: 0.0186
Epoch [1/20], Step [54600/60000], Loss: 0.0702
Epoch [1/20], Step [54700/60000], Loss: 0.2919
Epoch [1/20], Step [54800/60000], Loss: 0.0010
Epoch [1/20],

Epoch [2/20], Step [10500/60000], Loss: 0.0000
Epoch [2/20], Step [10600/60000], Loss: 0.0040
Epoch [2/20], Step [10700/60000], Loss: 0.0000
Epoch [2/20], Step [10800/60000], Loss: 0.0000
Epoch [2/20], Step [10900/60000], Loss: 0.0000
Epoch [2/20], Step [11000/60000], Loss: 0.0056
Epoch [2/20], Step [11100/60000], Loss: 0.0006
Epoch [2/20], Step [11200/60000], Loss: 0.0000
Epoch [2/20], Step [11300/60000], Loss: 0.0000
Epoch [2/20], Step [11400/60000], Loss: 0.0007
Epoch [2/20], Step [11500/60000], Loss: 0.0001
Epoch [2/20], Step [11600/60000], Loss: 0.0005
Epoch [2/20], Step [11700/60000], Loss: 0.0000
Epoch [2/20], Step [11800/60000], Loss: 0.0000
Epoch [2/20], Step [11900/60000], Loss: 0.0000
Epoch [2/20], Step [12000/60000], Loss: 0.0000
Epoch [2/20], Step [12100/60000], Loss: 0.0000
Epoch [2/20], Step [12200/60000], Loss: 0.0000
Epoch [2/20], Step [12300/60000], Loss: 0.0000
Epoch [2/20], Step [12400/60000], Loss: 0.0000
Epoch [2/20], Step [12500/60000], Loss: 0.0000
Epoch [2/20],

Epoch [2/20], Step [28000/60000], Loss: 0.0000
Epoch [2/20], Step [28100/60000], Loss: 0.0000
Epoch [2/20], Step [28200/60000], Loss: 0.0000
Epoch [2/20], Step [28300/60000], Loss: 0.0000
Epoch [2/20], Step [28400/60000], Loss: 0.0000
Epoch [2/20], Step [28500/60000], Loss: 0.0060
Epoch [2/20], Step [28600/60000], Loss: 0.0000
Epoch [2/20], Step [28700/60000], Loss: 0.0000
Epoch [2/20], Step [28800/60000], Loss: 0.0000
Epoch [2/20], Step [28900/60000], Loss: 0.0000
Epoch [2/20], Step [29000/60000], Loss: 0.0000
Epoch [2/20], Step [29100/60000], Loss: 0.5653
Epoch [2/20], Step [29200/60000], Loss: 0.0000
Epoch [2/20], Step [29300/60000], Loss: 0.0000
Epoch [2/20], Step [29400/60000], Loss: 0.0000
Epoch [2/20], Step [29500/60000], Loss: 0.0000
Epoch [2/20], Step [29600/60000], Loss: 0.0001
Epoch [2/20], Step [29700/60000], Loss: 0.0000
Epoch [2/20], Step [29800/60000], Loss: 0.1479
Epoch [2/20], Step [29900/60000], Loss: 0.0000
Epoch [2/20], Step [30000/60000], Loss: 0.0000
Epoch [2/20],

Epoch [2/20], Step [45500/60000], Loss: 0.0000
Epoch [2/20], Step [45600/60000], Loss: 0.0265
Epoch [2/20], Step [45700/60000], Loss: 0.0000
Epoch [2/20], Step [45800/60000], Loss: 0.0000
Epoch [2/20], Step [45900/60000], Loss: 0.0053
Epoch [2/20], Step [46000/60000], Loss: 0.0000
Epoch [2/20], Step [46100/60000], Loss: 0.0001
Epoch [2/20], Step [46200/60000], Loss: 0.0093
Epoch [2/20], Step [46300/60000], Loss: 0.0000
Epoch [2/20], Step [46400/60000], Loss: 0.0000
Epoch [2/20], Step [46500/60000], Loss: 0.0253
Epoch [2/20], Step [46600/60000], Loss: 0.0000
Epoch [2/20], Step [46700/60000], Loss: 0.0000
Epoch [2/20], Step [46800/60000], Loss: 10.3209
Epoch [2/20], Step [46900/60000], Loss: 0.0000
Epoch [2/20], Step [47000/60000], Loss: 0.0000
Epoch [2/20], Step [47100/60000], Loss: 0.0000
Epoch [2/20], Step [47200/60000], Loss: 0.0008
Epoch [2/20], Step [47300/60000], Loss: 0.5108
Epoch [2/20], Step [47400/60000], Loss: 0.0000
Epoch [2/20], Step [47500/60000], Loss: 0.0042
Epoch [2/20]

Epoch [3/20], Step [3100/60000], Loss: 0.0000
Epoch [3/20], Step [3200/60000], Loss: 0.0000
Epoch [3/20], Step [3300/60000], Loss: 0.0000
Epoch [3/20], Step [3400/60000], Loss: 0.0000
Epoch [3/20], Step [3500/60000], Loss: 0.0000
Epoch [3/20], Step [3600/60000], Loss: 0.0000
Epoch [3/20], Step [3700/60000], Loss: 0.0000
Epoch [3/20], Step [3800/60000], Loss: 0.0000
Epoch [3/20], Step [3900/60000], Loss: 0.0000
Epoch [3/20], Step [4000/60000], Loss: 0.0000
Epoch [3/20], Step [4100/60000], Loss: 0.0000
Epoch [3/20], Step [4200/60000], Loss: 0.0000
Epoch [3/20], Step [4300/60000], Loss: 0.0072
Epoch [3/20], Step [4400/60000], Loss: 0.0000
Epoch [3/20], Step [4500/60000], Loss: 0.0018
Epoch [3/20], Step [4600/60000], Loss: 0.0006
Epoch [3/20], Step [4700/60000], Loss: 0.0005
Epoch [3/20], Step [4800/60000], Loss: 0.0000
Epoch [3/20], Step [4900/60000], Loss: 0.0000
Epoch [3/20], Step [5000/60000], Loss: 0.0000
Epoch [3/20], Step [5100/60000], Loss: 0.2288
Epoch [3/20], Step [5200/60000], L

Epoch [3/20], Step [20700/60000], Loss: 0.0000
Epoch [3/20], Step [20800/60000], Loss: 0.0000
Epoch [3/20], Step [20900/60000], Loss: 0.0000
Epoch [3/20], Step [21000/60000], Loss: 0.0000
Epoch [3/20], Step [21100/60000], Loss: 0.0000
Epoch [3/20], Step [21200/60000], Loss: 0.0017
Epoch [3/20], Step [21300/60000], Loss: 4.7471
Epoch [3/20], Step [21400/60000], Loss: 0.0000
Epoch [3/20], Step [21500/60000], Loss: 0.0000
Epoch [3/20], Step [21600/60000], Loss: 0.0345
Epoch [3/20], Step [21700/60000], Loss: 0.0000
Epoch [3/20], Step [21800/60000], Loss: 0.0000
Epoch [3/20], Step [21900/60000], Loss: 0.0000
Epoch [3/20], Step [22000/60000], Loss: 0.0496
Epoch [3/20], Step [22100/60000], Loss: 0.0000
Epoch [3/20], Step [22200/60000], Loss: 0.0002
Epoch [3/20], Step [22300/60000], Loss: 3.0973
Epoch [3/20], Step [22400/60000], Loss: 0.0000
Epoch [3/20], Step [22500/60000], Loss: 0.0000
Epoch [3/20], Step [22600/60000], Loss: 0.0000
Epoch [3/20], Step [22700/60000], Loss: 0.0000
Epoch [3/20],

Epoch [3/20], Step [38200/60000], Loss: 0.0000
Epoch [3/20], Step [38300/60000], Loss: 0.0000
Epoch [3/20], Step [38400/60000], Loss: 0.0000
Epoch [3/20], Step [38500/60000], Loss: 0.0000
Epoch [3/20], Step [38600/60000], Loss: 0.0000
Epoch [3/20], Step [38700/60000], Loss: 0.0000
Epoch [3/20], Step [38800/60000], Loss: 0.0000
Epoch [3/20], Step [38900/60000], Loss: 0.0000
Epoch [3/20], Step [39000/60000], Loss: 0.0000
Epoch [3/20], Step [39100/60000], Loss: 0.0002
Epoch [3/20], Step [39200/60000], Loss: 0.0000
Epoch [3/20], Step [39300/60000], Loss: 0.0000
Epoch [3/20], Step [39400/60000], Loss: 0.0000
Epoch [3/20], Step [39500/60000], Loss: 0.0000
Epoch [3/20], Step [39600/60000], Loss: 0.0000
Epoch [3/20], Step [39700/60000], Loss: 0.0000
Epoch [3/20], Step [39800/60000], Loss: 0.0000
Epoch [3/20], Step [39900/60000], Loss: 0.0000
Epoch [3/20], Step [40000/60000], Loss: 0.0000
Epoch [3/20], Step [40100/60000], Loss: 0.0000
Epoch [3/20], Step [40200/60000], Loss: 0.0000
Epoch [3/20],

Epoch [3/20], Step [55700/60000], Loss: 0.0132
Epoch [3/20], Step [55800/60000], Loss: 0.0000
Epoch [3/20], Step [55900/60000], Loss: 0.0000
Epoch [3/20], Step [56000/60000], Loss: 0.0000
Epoch [3/20], Step [56100/60000], Loss: 0.0000
Epoch [3/20], Step [56200/60000], Loss: 0.0000
Epoch [3/20], Step [56300/60000], Loss: 0.0000
Epoch [3/20], Step [56400/60000], Loss: 0.0000
Epoch [3/20], Step [56500/60000], Loss: 0.0000
Epoch [3/20], Step [56600/60000], Loss: 0.0000
Epoch [3/20], Step [56700/60000], Loss: 0.0000
Epoch [3/20], Step [56800/60000], Loss: 0.0000
Epoch [3/20], Step [56900/60000], Loss: 0.0010
Epoch [3/20], Step [57000/60000], Loss: 0.0000
Epoch [3/20], Step [57100/60000], Loss: 0.0000
Epoch [3/20], Step [57200/60000], Loss: 0.1371
Epoch [3/20], Step [57300/60000], Loss: 0.0000
Epoch [3/20], Step [57400/60000], Loss: 0.0000
Epoch [3/20], Step [57500/60000], Loss: 0.0000
Epoch [3/20], Step [57600/60000], Loss: 0.0000
Epoch [3/20], Step [57700/60000], Loss: 0.0147
Epoch [3/20],

Epoch [4/20], Step [13400/60000], Loss: 0.0000
Epoch [4/20], Step [13500/60000], Loss: 0.0000
Epoch [4/20], Step [13600/60000], Loss: 0.0000
Epoch [4/20], Step [13700/60000], Loss: 0.0000
Epoch [4/20], Step [13800/60000], Loss: 0.0000
Epoch [4/20], Step [13900/60000], Loss: 0.0009
Epoch [4/20], Step [14000/60000], Loss: 0.0000
Epoch [4/20], Step [14100/60000], Loss: 0.0000
Epoch [4/20], Step [14200/60000], Loss: 0.0000
Epoch [4/20], Step [14300/60000], Loss: 0.0000
Epoch [4/20], Step [14400/60000], Loss: 0.0000
Epoch [4/20], Step [14500/60000], Loss: 0.0000
Epoch [4/20], Step [14600/60000], Loss: 0.0000
Epoch [4/20], Step [14700/60000], Loss: 0.0000
Epoch [4/20], Step [14800/60000], Loss: 0.1871
Epoch [4/20], Step [14900/60000], Loss: 0.0000
Epoch [4/20], Step [15000/60000], Loss: 0.0000
Epoch [4/20], Step [15100/60000], Loss: 0.0000
Epoch [4/20], Step [15200/60000], Loss: 0.0000
Epoch [4/20], Step [15300/60000], Loss: 0.0000
Epoch [4/20], Step [15400/60000], Loss: 0.0000
Epoch [4/20],

Epoch [4/20], Step [30900/60000], Loss: 0.0000
Epoch [4/20], Step [31000/60000], Loss: 0.0000
Epoch [4/20], Step [31100/60000], Loss: 0.0000
Epoch [4/20], Step [31200/60000], Loss: 0.0000
Epoch [4/20], Step [31300/60000], Loss: 0.0000
Epoch [4/20], Step [31400/60000], Loss: 0.0000
Epoch [4/20], Step [31500/60000], Loss: 0.0000
Epoch [4/20], Step [31600/60000], Loss: 0.0000
Epoch [4/20], Step [31700/60000], Loss: 0.0747
Epoch [4/20], Step [31800/60000], Loss: 0.0000
Epoch [4/20], Step [31900/60000], Loss: 0.0000
Epoch [4/20], Step [32000/60000], Loss: 0.0000
Epoch [4/20], Step [32100/60000], Loss: 0.0000
Epoch [4/20], Step [32200/60000], Loss: 0.0000
Epoch [4/20], Step [32300/60000], Loss: 0.0000
Epoch [4/20], Step [32400/60000], Loss: 0.0000
Epoch [4/20], Step [32500/60000], Loss: 0.0000
Epoch [4/20], Step [32600/60000], Loss: 0.0000
Epoch [4/20], Step [32700/60000], Loss: 0.0000
Epoch [4/20], Step [32800/60000], Loss: 0.0000
Epoch [4/20], Step [32900/60000], Loss: 0.0000
Epoch [4/20],

Epoch [4/20], Step [48400/60000], Loss: 0.0000
Epoch [4/20], Step [48500/60000], Loss: 0.0000
Epoch [4/20], Step [48600/60000], Loss: 0.0000
Epoch [4/20], Step [48700/60000], Loss: 0.0005
Epoch [4/20], Step [48800/60000], Loss: 0.1759
Epoch [4/20], Step [48900/60000], Loss: 0.0000
Epoch [4/20], Step [49000/60000], Loss: 0.0000
Epoch [4/20], Step [49100/60000], Loss: 0.0000
Epoch [4/20], Step [49200/60000], Loss: 0.0000
Epoch [4/20], Step [49300/60000], Loss: 0.0000
Epoch [4/20], Step [49400/60000], Loss: 0.0000
Epoch [4/20], Step [49500/60000], Loss: 0.0000
Epoch [4/20], Step [49600/60000], Loss: 0.0000
Epoch [4/20], Step [49700/60000], Loss: 0.0000
Epoch [4/20], Step [49800/60000], Loss: 0.0000
Epoch [4/20], Step [49900/60000], Loss: 0.0000
Epoch [4/20], Step [50000/60000], Loss: 0.0000
Epoch [4/20], Step [50100/60000], Loss: 0.0000
Epoch [4/20], Step [50200/60000], Loss: 0.0000
Epoch [4/20], Step [50300/60000], Loss: 0.0000
Epoch [4/20], Step [50400/60000], Loss: 0.0000
Epoch [4/20],

Epoch [5/20], Step [6000/60000], Loss: 0.0000
Epoch [5/20], Step [6100/60000], Loss: 0.0000
Epoch [5/20], Step [6200/60000], Loss: 1.8086
Epoch [5/20], Step [6300/60000], Loss: 0.0000
Epoch [5/20], Step [6400/60000], Loss: 0.0000
Epoch [5/20], Step [6500/60000], Loss: 0.0000
Epoch [5/20], Step [6600/60000], Loss: 0.0000
Epoch [5/20], Step [6700/60000], Loss: 0.0000
Epoch [5/20], Step [6800/60000], Loss: 0.0000
Epoch [5/20], Step [6900/60000], Loss: 0.0000
Epoch [5/20], Step [7000/60000], Loss: 0.0000
Epoch [5/20], Step [7100/60000], Loss: 0.0000
Epoch [5/20], Step [7200/60000], Loss: 0.0000
Epoch [5/20], Step [7300/60000], Loss: 0.0000
Epoch [5/20], Step [7400/60000], Loss: 0.0000
Epoch [5/20], Step [7500/60000], Loss: 0.0000
Epoch [5/20], Step [7600/60000], Loss: 0.0000
Epoch [5/20], Step [7700/60000], Loss: 0.0000
Epoch [5/20], Step [7800/60000], Loss: 0.0000
Epoch [5/20], Step [7900/60000], Loss: 0.0000
Epoch [5/20], Step [8000/60000], Loss: 0.0000
Epoch [5/20], Step [8100/60000], L

Epoch [5/20], Step [23600/60000], Loss: 0.0000
Epoch [5/20], Step [23700/60000], Loss: 0.0000
Epoch [5/20], Step [23800/60000], Loss: 0.0000
Epoch [5/20], Step [23900/60000], Loss: 0.0000
Epoch [5/20], Step [24000/60000], Loss: 0.0000
Epoch [5/20], Step [24100/60000], Loss: 0.0000
Epoch [5/20], Step [24200/60000], Loss: 0.0000
Epoch [5/20], Step [24300/60000], Loss: 0.0000
Epoch [5/20], Step [24400/60000], Loss: 0.0000
Epoch [5/20], Step [24500/60000], Loss: 0.0000
Epoch [5/20], Step [24600/60000], Loss: 0.0000
Epoch [5/20], Step [24700/60000], Loss: 0.0000
Epoch [5/20], Step [24800/60000], Loss: 0.0000
Epoch [5/20], Step [24900/60000], Loss: 0.0000
Epoch [5/20], Step [25000/60000], Loss: 0.0000
Epoch [5/20], Step [25100/60000], Loss: 0.0000
Epoch [5/20], Step [25200/60000], Loss: 0.3106
Epoch [5/20], Step [25300/60000], Loss: 0.0000
Epoch [5/20], Step [25400/60000], Loss: 0.0000
Epoch [5/20], Step [25500/60000], Loss: 0.0000
Epoch [5/20], Step [25600/60000], Loss: 0.0000
Epoch [5/20],

Epoch [5/20], Step [41100/60000], Loss: 0.0000
Epoch [5/20], Step [41200/60000], Loss: 0.0000
Epoch [5/20], Step [41300/60000], Loss: 0.0000
Epoch [5/20], Step [41400/60000], Loss: 0.0731
Epoch [5/20], Step [41500/60000], Loss: 0.0002
Epoch [5/20], Step [41600/60000], Loss: 0.0000
Epoch [5/20], Step [41700/60000], Loss: 0.0000
Epoch [5/20], Step [41800/60000], Loss: 0.0000
Epoch [5/20], Step [41900/60000], Loss: 0.0000
Epoch [5/20], Step [42000/60000], Loss: 0.0000
Epoch [5/20], Step [42100/60000], Loss: 0.0000
Epoch [5/20], Step [42200/60000], Loss: 0.0000
Epoch [5/20], Step [42300/60000], Loss: 0.0000
Epoch [5/20], Step [42400/60000], Loss: 0.0000
Epoch [5/20], Step [42500/60000], Loss: 0.0000
Epoch [5/20], Step [42600/60000], Loss: 0.0000
Epoch [5/20], Step [42700/60000], Loss: 0.0000
Epoch [5/20], Step [42800/60000], Loss: 0.0000
Epoch [5/20], Step [42900/60000], Loss: 0.0000
Epoch [5/20], Step [43000/60000], Loss: 0.0000
Epoch [5/20], Step [43100/60000], Loss: 0.0000
Epoch [5/20],

Epoch [5/20], Step [58600/60000], Loss: 0.0000
Epoch [5/20], Step [58700/60000], Loss: 0.0000
Epoch [5/20], Step [58800/60000], Loss: 0.0000
Epoch [5/20], Step [58900/60000], Loss: 0.0000
Epoch [5/20], Step [59000/60000], Loss: 0.0000
Epoch [5/20], Step [59100/60000], Loss: 0.0000
Epoch [5/20], Step [59200/60000], Loss: 0.0000
Epoch [5/20], Step [59300/60000], Loss: 0.0000
Epoch [5/20], Step [59400/60000], Loss: 0.0000
Epoch [5/20], Step [59500/60000], Loss: 0.0000
Epoch [5/20], Step [59600/60000], Loss: 0.0000
Epoch [5/20], Step [59700/60000], Loss: 0.0000
Epoch [5/20], Step [59800/60000], Loss: 0.0000
Epoch [5/20], Step [59900/60000], Loss: 0.0000
Epoch [5/20], Step [60000/60000], Loss: 0.0000
Epoch [6/20], Step [100/60000], Loss: 0.0000
Epoch [6/20], Step [200/60000], Loss: 0.0000
Epoch [6/20], Step [300/60000], Loss: 0.0000
Epoch [6/20], Step [400/60000], Loss: 0.6478
Epoch [6/20], Step [500/60000], Loss: 0.0006
Epoch [6/20], Step [600/60000], Loss: 0.0000
Epoch [6/20], Step [700/6

Epoch [6/20], Step [16300/60000], Loss: 0.0000
Epoch [6/20], Step [16400/60000], Loss: 0.0000
Epoch [6/20], Step [16500/60000], Loss: 6.0718
Epoch [6/20], Step [16600/60000], Loss: 8.6293
Epoch [6/20], Step [16700/60000], Loss: 0.0000
Epoch [6/20], Step [16800/60000], Loss: 0.0000
Epoch [6/20], Step [16900/60000], Loss: 0.0000
Epoch [6/20], Step [17000/60000], Loss: 0.0000
Epoch [6/20], Step [17100/60000], Loss: 0.0000
Epoch [6/20], Step [17200/60000], Loss: 0.0000
Epoch [6/20], Step [17300/60000], Loss: 0.0000
Epoch [6/20], Step [17400/60000], Loss: 0.0000
Epoch [6/20], Step [17500/60000], Loss: 0.0000
Epoch [6/20], Step [17600/60000], Loss: 0.0000
Epoch [6/20], Step [17700/60000], Loss: 0.0000
Epoch [6/20], Step [17800/60000], Loss: 0.0000
Epoch [6/20], Step [17900/60000], Loss: 0.0000
Epoch [6/20], Step [18000/60000], Loss: 0.0000
Epoch [6/20], Step [18100/60000], Loss: 0.0000
Epoch [6/20], Step [18200/60000], Loss: 0.0000
Epoch [6/20], Step [18300/60000], Loss: 0.0001
Epoch [6/20],

Epoch [6/20], Step [33800/60000], Loss: 0.0008
Epoch [6/20], Step [33900/60000], Loss: 0.0000
Epoch [6/20], Step [34000/60000], Loss: 0.0000
Epoch [6/20], Step [34100/60000], Loss: 0.0023
Epoch [6/20], Step [34200/60000], Loss: 0.0000
Epoch [6/20], Step [34300/60000], Loss: 0.0000
Epoch [6/20], Step [34400/60000], Loss: 0.0000
Epoch [6/20], Step [34500/60000], Loss: 0.0000
Epoch [6/20], Step [34600/60000], Loss: 0.0000
Epoch [6/20], Step [34700/60000], Loss: 0.0000
Epoch [6/20], Step [34800/60000], Loss: 0.0000
Epoch [6/20], Step [34900/60000], Loss: 0.0000
Epoch [6/20], Step [35000/60000], Loss: 0.0000
Epoch [6/20], Step [35100/60000], Loss: 0.0000
Epoch [6/20], Step [35200/60000], Loss: 0.0000
Epoch [6/20], Step [35300/60000], Loss: 0.0000
Epoch [6/20], Step [35400/60000], Loss: 0.0000
Epoch [6/20], Step [35500/60000], Loss: 0.0000
Epoch [6/20], Step [35600/60000], Loss: 0.0000
Epoch [6/20], Step [35700/60000], Loss: 0.0000
Epoch [6/20], Step [35800/60000], Loss: 0.0000
Epoch [6/20],

Epoch [6/20], Step [51300/60000], Loss: 0.0000
Epoch [6/20], Step [51400/60000], Loss: 0.0000
Epoch [6/20], Step [51500/60000], Loss: 0.0000
Epoch [6/20], Step [51600/60000], Loss: 0.0000
Epoch [6/20], Step [51700/60000], Loss: 0.0000
Epoch [6/20], Step [51800/60000], Loss: 0.0000
Epoch [6/20], Step [51900/60000], Loss: 0.0000
Epoch [6/20], Step [52000/60000], Loss: 0.0000
Epoch [6/20], Step [52100/60000], Loss: 0.0000
Epoch [6/20], Step [52200/60000], Loss: 0.0000
Epoch [6/20], Step [52300/60000], Loss: 0.0000
Epoch [6/20], Step [52400/60000], Loss: 0.0000
Epoch [6/20], Step [52500/60000], Loss: 0.0000
Epoch [6/20], Step [52600/60000], Loss: 0.0000
Epoch [6/20], Step [52700/60000], Loss: 0.0000
Epoch [6/20], Step [52800/60000], Loss: 0.0000
Epoch [6/20], Step [52900/60000], Loss: 0.0000
Epoch [6/20], Step [53000/60000], Loss: 0.0000
Epoch [6/20], Step [53100/60000], Loss: 0.0000
Epoch [6/20], Step [53200/60000], Loss: 0.0000
Epoch [6/20], Step [53300/60000], Loss: 0.0000
Epoch [6/20],

Epoch [7/20], Step [9000/60000], Loss: 6.8657
Epoch [7/20], Step [9100/60000], Loss: 0.0000
Epoch [7/20], Step [9200/60000], Loss: 0.0000
Epoch [7/20], Step [9300/60000], Loss: 0.0000
Epoch [7/20], Step [9400/60000], Loss: 0.0000
Epoch [7/20], Step [9500/60000], Loss: 0.0000
Epoch [7/20], Step [9600/60000], Loss: 0.0000
Epoch [7/20], Step [9700/60000], Loss: 0.0000
Epoch [7/20], Step [9800/60000], Loss: 0.0000
Epoch [7/20], Step [9900/60000], Loss: 0.0000
Epoch [7/20], Step [10000/60000], Loss: 0.0000
Epoch [7/20], Step [10100/60000], Loss: 0.0000
Epoch [7/20], Step [10200/60000], Loss: 0.0000
Epoch [7/20], Step [10300/60000], Loss: 0.0000
Epoch [7/20], Step [10400/60000], Loss: 0.0000
Epoch [7/20], Step [10500/60000], Loss: 0.0000
Epoch [7/20], Step [10600/60000], Loss: 0.0000
Epoch [7/20], Step [10700/60000], Loss: 0.0000
Epoch [7/20], Step [10800/60000], Loss: 0.0000
Epoch [7/20], Step [10900/60000], Loss: 0.0000
Epoch [7/20], Step [11000/60000], Loss: 0.0000
Epoch [7/20], Step [111

Epoch [7/20], Step [26500/60000], Loss: 0.0000
Epoch [7/20], Step [26600/60000], Loss: 0.0000
Epoch [7/20], Step [26700/60000], Loss: 0.0000
Epoch [7/20], Step [26800/60000], Loss: 0.0000
Epoch [7/20], Step [26900/60000], Loss: 0.0000
Epoch [7/20], Step [27000/60000], Loss: 0.0000
Epoch [7/20], Step [27100/60000], Loss: 0.0000
Epoch [7/20], Step [27200/60000], Loss: 0.0000
Epoch [7/20], Step [27300/60000], Loss: 0.0000
Epoch [7/20], Step [27400/60000], Loss: 0.0000
Epoch [7/20], Step [27500/60000], Loss: 0.0000
Epoch [7/20], Step [27600/60000], Loss: 15.3183
Epoch [7/20], Step [27700/60000], Loss: 0.0000
Epoch [7/20], Step [27800/60000], Loss: 0.0000
Epoch [7/20], Step [27900/60000], Loss: 0.0001
Epoch [7/20], Step [28000/60000], Loss: 0.0000
Epoch [7/20], Step [28100/60000], Loss: 0.0000
Epoch [7/20], Step [28200/60000], Loss: 0.0000
Epoch [7/20], Step [28300/60000], Loss: 0.0000
Epoch [7/20], Step [28400/60000], Loss: 0.0000
Epoch [7/20], Step [28500/60000], Loss: 0.0000
Epoch [7/20]

Epoch [7/20], Step [44000/60000], Loss: 0.0000
Epoch [7/20], Step [44100/60000], Loss: 0.0000
Epoch [7/20], Step [44200/60000], Loss: 0.0000
Epoch [7/20], Step [44300/60000], Loss: 0.0000
Epoch [7/20], Step [44400/60000], Loss: 0.0000
Epoch [7/20], Step [44500/60000], Loss: 0.0000
Epoch [7/20], Step [44600/60000], Loss: 0.0000
Epoch [7/20], Step [44700/60000], Loss: 0.0000
Epoch [7/20], Step [44800/60000], Loss: 0.0000
Epoch [7/20], Step [44900/60000], Loss: 0.0000
Epoch [7/20], Step [45000/60000], Loss: 0.0000
Epoch [7/20], Step [45100/60000], Loss: 0.0000
Epoch [7/20], Step [45200/60000], Loss: 0.0000
Epoch [7/20], Step [45300/60000], Loss: 0.0000
Epoch [7/20], Step [45400/60000], Loss: 0.0000
Epoch [7/20], Step [45500/60000], Loss: 0.0000
Epoch [7/20], Step [45600/60000], Loss: 0.0000
Epoch [7/20], Step [45700/60000], Loss: 0.0041
Epoch [7/20], Step [45800/60000], Loss: 0.0000
Epoch [7/20], Step [45900/60000], Loss: 0.0000
Epoch [7/20], Step [46000/60000], Loss: 0.4135
Epoch [7/20],

Epoch [8/20], Step [1500/60000], Loss: 0.0000
Epoch [8/20], Step [1600/60000], Loss: 0.0000
Epoch [8/20], Step [1700/60000], Loss: 0.0000
Epoch [8/20], Step [1800/60000], Loss: 0.0000
Epoch [8/20], Step [1900/60000], Loss: 0.0000
Epoch [8/20], Step [2000/60000], Loss: 0.0055
Epoch [8/20], Step [2100/60000], Loss: 0.0000
Epoch [8/20], Step [2200/60000], Loss: 0.0000
Epoch [8/20], Step [2300/60000], Loss: 0.0000
Epoch [8/20], Step [2400/60000], Loss: 0.0000
Epoch [8/20], Step [2500/60000], Loss: 0.0000
Epoch [8/20], Step [2600/60000], Loss: 0.0000
Epoch [8/20], Step [2700/60000], Loss: 0.0000
Epoch [8/20], Step [2800/60000], Loss: 0.0000
Epoch [8/20], Step [2900/60000], Loss: 0.0000
Epoch [8/20], Step [3000/60000], Loss: 0.0000
Epoch [8/20], Step [3100/60000], Loss: 0.0000
Epoch [8/20], Step [3200/60000], Loss: 0.0000
Epoch [8/20], Step [3300/60000], Loss: 0.0000
Epoch [8/20], Step [3400/60000], Loss: 0.0000
Epoch [8/20], Step [3500/60000], Loss: 0.0000
Epoch [8/20], Step [3600/60000], L

Epoch [8/20], Step [19200/60000], Loss: 0.0000
Epoch [8/20], Step [19300/60000], Loss: 0.0000
Epoch [8/20], Step [19400/60000], Loss: 0.0000
Epoch [8/20], Step [19500/60000], Loss: 0.0000
Epoch [8/20], Step [19600/60000], Loss: 0.0000
Epoch [8/20], Step [19700/60000], Loss: 0.0000
Epoch [8/20], Step [19800/60000], Loss: 0.0000
Epoch [8/20], Step [19900/60000], Loss: 0.0000
Epoch [8/20], Step [20000/60000], Loss: 0.0000
Epoch [8/20], Step [20100/60000], Loss: 0.0000
Epoch [8/20], Step [20200/60000], Loss: 0.0000
Epoch [8/20], Step [20300/60000], Loss: 0.0000
Epoch [8/20], Step [20400/60000], Loss: 0.0000
Epoch [8/20], Step [20500/60000], Loss: 0.0000
Epoch [8/20], Step [20600/60000], Loss: 0.0000
Epoch [8/20], Step [20700/60000], Loss: 0.0000
Epoch [8/20], Step [20800/60000], Loss: 0.0000
Epoch [8/20], Step [20900/60000], Loss: 22.1154
Epoch [8/20], Step [21000/60000], Loss: 0.0000
Epoch [8/20], Step [21100/60000], Loss: 0.0000
Epoch [8/20], Step [21200/60000], Loss: 0.0000
Epoch [8/20]

Epoch [8/20], Step [36700/60000], Loss: 0.0000
Epoch [8/20], Step [36800/60000], Loss: 0.0000
Epoch [8/20], Step [36900/60000], Loss: 0.0000
Epoch [8/20], Step [37000/60000], Loss: 0.0000
Epoch [8/20], Step [37100/60000], Loss: 0.0000
Epoch [8/20], Step [37200/60000], Loss: 0.0000
Epoch [8/20], Step [37300/60000], Loss: 0.0000
Epoch [8/20], Step [37400/60000], Loss: 0.0000
Epoch [8/20], Step [37500/60000], Loss: 0.0000
Epoch [8/20], Step [37600/60000], Loss: 0.0000
Epoch [8/20], Step [37700/60000], Loss: 0.0000
Epoch [8/20], Step [37800/60000], Loss: 0.0000
Epoch [8/20], Step [37900/60000], Loss: 0.0000
Epoch [8/20], Step [38000/60000], Loss: 0.0000
Epoch [8/20], Step [38100/60000], Loss: 0.0000
Epoch [8/20], Step [38200/60000], Loss: 0.0000
Epoch [8/20], Step [38300/60000], Loss: 0.0000
Epoch [8/20], Step [38400/60000], Loss: 0.0000
Epoch [8/20], Step [38500/60000], Loss: 0.0000
Epoch [8/20], Step [38600/60000], Loss: 0.0000
Epoch [8/20], Step [38700/60000], Loss: 0.0000
Epoch [8/20],

Epoch [8/20], Step [54200/60000], Loss: 0.0000
Epoch [8/20], Step [54300/60000], Loss: 0.0000
Epoch [8/20], Step [54400/60000], Loss: 0.0000
Epoch [8/20], Step [54500/60000], Loss: 0.0000
Epoch [8/20], Step [54600/60000], Loss: 0.0000
Epoch [8/20], Step [54700/60000], Loss: 0.0000
Epoch [8/20], Step [54800/60000], Loss: 0.0000
Epoch [8/20], Step [54900/60000], Loss: 0.0000
Epoch [8/20], Step [55000/60000], Loss: 0.0000
Epoch [8/20], Step [55100/60000], Loss: 0.0000
Epoch [8/20], Step [55200/60000], Loss: 0.0000
Epoch [8/20], Step [55300/60000], Loss: 0.0000
Epoch [8/20], Step [55400/60000], Loss: 0.0000
Epoch [8/20], Step [55500/60000], Loss: 0.0000
Epoch [8/20], Step [55600/60000], Loss: 0.0000
Epoch [8/20], Step [55700/60000], Loss: 0.0000
Epoch [8/20], Step [55800/60000], Loss: 0.0000
Epoch [8/20], Step [55900/60000], Loss: 0.0000
Epoch [8/20], Step [56000/60000], Loss: 0.0000
Epoch [8/20], Step [56100/60000], Loss: 0.0000
Epoch [8/20], Step [56200/60000], Loss: 0.0000
Epoch [8/20],

Epoch [9/20], Step [11900/60000], Loss: 0.0000
Epoch [9/20], Step [12000/60000], Loss: 0.0000
Epoch [9/20], Step [12100/60000], Loss: 0.0000
Epoch [9/20], Step [12200/60000], Loss: 0.0000
Epoch [9/20], Step [12300/60000], Loss: 0.0000
Epoch [9/20], Step [12400/60000], Loss: 0.0000
Epoch [9/20], Step [12500/60000], Loss: 0.0000
Epoch [9/20], Step [12600/60000], Loss: 0.0000
Epoch [9/20], Step [12700/60000], Loss: 0.0000
Epoch [9/20], Step [12800/60000], Loss: 0.0000
Epoch [9/20], Step [12900/60000], Loss: 0.0000
Epoch [9/20], Step [13000/60000], Loss: 0.0000
Epoch [9/20], Step [13100/60000], Loss: 0.0000
Epoch [9/20], Step [13200/60000], Loss: 0.0000
Epoch [9/20], Step [13300/60000], Loss: 0.0000
Epoch [9/20], Step [13400/60000], Loss: 0.0000
Epoch [9/20], Step [13500/60000], Loss: 0.0000
Epoch [9/20], Step [13600/60000], Loss: 0.0000
Epoch [9/20], Step [13700/60000], Loss: 0.0000
Epoch [9/20], Step [13800/60000], Loss: 0.0000
Epoch [9/20], Step [13900/60000], Loss: 0.0000
Epoch [9/20],

Epoch [9/20], Step [29400/60000], Loss: 0.0000
Epoch [9/20], Step [29500/60000], Loss: 0.0000
Epoch [9/20], Step [29600/60000], Loss: 0.0000
Epoch [9/20], Step [29700/60000], Loss: 0.0000
Epoch [9/20], Step [29800/60000], Loss: 0.0000
Epoch [9/20], Step [29900/60000], Loss: 0.0000
Epoch [9/20], Step [30000/60000], Loss: 0.0000
Epoch [9/20], Step [30100/60000], Loss: 0.0000
Epoch [9/20], Step [30200/60000], Loss: 0.0000
Epoch [9/20], Step [30300/60000], Loss: 0.0000
Epoch [9/20], Step [30400/60000], Loss: 0.0000
Epoch [9/20], Step [30500/60000], Loss: 0.0000
Epoch [9/20], Step [30600/60000], Loss: 0.0000
Epoch [9/20], Step [30700/60000], Loss: 0.0000
Epoch [9/20], Step [30800/60000], Loss: 0.0000
Epoch [9/20], Step [30900/60000], Loss: 0.0000
Epoch [9/20], Step [31000/60000], Loss: 0.0000
Epoch [9/20], Step [31100/60000], Loss: 0.0000
Epoch [9/20], Step [31200/60000], Loss: 0.0000
Epoch [9/20], Step [31300/60000], Loss: 0.0000
Epoch [9/20], Step [31400/60000], Loss: 0.0000
Epoch [9/20],

Epoch [9/20], Step [46900/60000], Loss: 0.0000
Epoch [9/20], Step [47000/60000], Loss: 0.0000
Epoch [9/20], Step [47100/60000], Loss: 0.0000
Epoch [9/20], Step [47200/60000], Loss: 0.0000
Epoch [9/20], Step [47300/60000], Loss: 0.0000
Epoch [9/20], Step [47400/60000], Loss: 0.0000
Epoch [9/20], Step [47500/60000], Loss: 0.0000
Epoch [9/20], Step [47600/60000], Loss: 0.0000
Epoch [9/20], Step [47700/60000], Loss: 0.0000
Epoch [9/20], Step [47800/60000], Loss: 0.0000
Epoch [9/20], Step [47900/60000], Loss: 0.0000
Epoch [9/20], Step [48000/60000], Loss: 0.0000
Epoch [9/20], Step [48100/60000], Loss: 0.0000
Epoch [9/20], Step [48200/60000], Loss: 0.0000
Epoch [9/20], Step [48300/60000], Loss: 0.0000
Epoch [9/20], Step [48400/60000], Loss: 0.0000
Epoch [9/20], Step [48500/60000], Loss: 0.0390
Epoch [9/20], Step [48600/60000], Loss: 0.0000
Epoch [9/20], Step [48700/60000], Loss: 0.0000
Epoch [9/20], Step [48800/60000], Loss: 0.0000
Epoch [9/20], Step [48900/60000], Loss: 0.0000
Epoch [9/20],

Epoch [10/20], Step [4400/60000], Loss: 0.0000
Epoch [10/20], Step [4500/60000], Loss: 0.0000
Epoch [10/20], Step [4600/60000], Loss: 0.0000
Epoch [10/20], Step [4700/60000], Loss: 0.0000
Epoch [10/20], Step [4800/60000], Loss: 0.0000
Epoch [10/20], Step [4900/60000], Loss: 0.0000
Epoch [10/20], Step [5000/60000], Loss: 0.0000
Epoch [10/20], Step [5100/60000], Loss: 0.0000
Epoch [10/20], Step [5200/60000], Loss: 0.0000
Epoch [10/20], Step [5300/60000], Loss: 0.0000
Epoch [10/20], Step [5400/60000], Loss: 0.0000
Epoch [10/20], Step [5500/60000], Loss: 0.0000
Epoch [10/20], Step [5600/60000], Loss: 0.0000
Epoch [10/20], Step [5700/60000], Loss: 0.0000
Epoch [10/20], Step [5800/60000], Loss: 0.0000
Epoch [10/20], Step [5900/60000], Loss: 0.0000
Epoch [10/20], Step [6000/60000], Loss: 0.0000
Epoch [10/20], Step [6100/60000], Loss: 0.0000
Epoch [10/20], Step [6200/60000], Loss: 0.0000
Epoch [10/20], Step [6300/60000], Loss: 0.0000
Epoch [10/20], Step [6400/60000], Loss: 0.0000
Epoch [10/20]

Epoch [10/20], Step [21600/60000], Loss: 0.0000
Epoch [10/20], Step [21700/60000], Loss: 0.0000
Epoch [10/20], Step [21800/60000], Loss: 0.0000
Epoch [10/20], Step [21900/60000], Loss: 0.0000
Epoch [10/20], Step [22000/60000], Loss: 0.0000
Epoch [10/20], Step [22100/60000], Loss: 0.0000
Epoch [10/20], Step [22200/60000], Loss: 0.0000
Epoch [10/20], Step [22300/60000], Loss: 0.0000
Epoch [10/20], Step [22400/60000], Loss: 0.0000
Epoch [10/20], Step [22500/60000], Loss: 0.0000
Epoch [10/20], Step [22600/60000], Loss: 0.0000
Epoch [10/20], Step [22700/60000], Loss: 0.0000
Epoch [10/20], Step [22800/60000], Loss: 0.0000
Epoch [10/20], Step [22900/60000], Loss: 0.0000
Epoch [10/20], Step [23000/60000], Loss: 0.0000
Epoch [10/20], Step [23100/60000], Loss: 0.0000
Epoch [10/20], Step [23200/60000], Loss: 0.0000
Epoch [10/20], Step [23300/60000], Loss: 0.0000
Epoch [10/20], Step [23400/60000], Loss: 0.0000
Epoch [10/20], Step [23500/60000], Loss: 0.0000
Epoch [10/20], Step [23600/60000], Loss:

Epoch [10/20], Step [38700/60000], Loss: 0.0000
Epoch [10/20], Step [38800/60000], Loss: 0.0000
Epoch [10/20], Step [38900/60000], Loss: 0.0000
Epoch [10/20], Step [39000/60000], Loss: 0.0000
Epoch [10/20], Step [39100/60000], Loss: 0.0000
Epoch [10/20], Step [39200/60000], Loss: 0.0000
Epoch [10/20], Step [39300/60000], Loss: 0.0000
Epoch [10/20], Step [39400/60000], Loss: 0.0000
Epoch [10/20], Step [39500/60000], Loss: 0.0000
Epoch [10/20], Step [39600/60000], Loss: 0.0000
Epoch [10/20], Step [39700/60000], Loss: 0.0000
Epoch [10/20], Step [39800/60000], Loss: 0.0000
Epoch [10/20], Step [39900/60000], Loss: 0.0000
Epoch [10/20], Step [40000/60000], Loss: 0.0017
Epoch [10/20], Step [40100/60000], Loss: 0.0000
Epoch [10/20], Step [40200/60000], Loss: 0.0000
Epoch [10/20], Step [40300/60000], Loss: 0.0000
Epoch [10/20], Step [40400/60000], Loss: 0.0000
Epoch [10/20], Step [40500/60000], Loss: 0.0000
Epoch [10/20], Step [40600/60000], Loss: 0.0000
Epoch [10/20], Step [40700/60000], Loss:

Epoch [10/20], Step [55800/60000], Loss: 0.0000
Epoch [10/20], Step [55900/60000], Loss: 0.0000
Epoch [10/20], Step [56000/60000], Loss: 0.0000
Epoch [10/20], Step [56100/60000], Loss: 0.0000
Epoch [10/20], Step [56200/60000], Loss: 0.0000
Epoch [10/20], Step [56300/60000], Loss: 0.0042
Epoch [10/20], Step [56400/60000], Loss: 0.0000
Epoch [10/20], Step [56500/60000], Loss: 0.0000
Epoch [10/20], Step [56600/60000], Loss: 0.0000
Epoch [10/20], Step [56700/60000], Loss: 0.0000
Epoch [10/20], Step [56800/60000], Loss: 0.0000
Epoch [10/20], Step [56900/60000], Loss: 0.0000
Epoch [10/20], Step [57000/60000], Loss: 0.0000
Epoch [10/20], Step [57100/60000], Loss: 0.0000
Epoch [10/20], Step [57200/60000], Loss: 0.0000
Epoch [10/20], Step [57300/60000], Loss: 0.0000
Epoch [10/20], Step [57400/60000], Loss: 0.0000
Epoch [10/20], Step [57500/60000], Loss: 0.0000
Epoch [10/20], Step [57600/60000], Loss: 0.0000
Epoch [10/20], Step [57700/60000], Loss: 0.0000
Epoch [10/20], Step [57800/60000], Loss:

Epoch [11/20], Step [13100/60000], Loss: 0.0037
Epoch [11/20], Step [13200/60000], Loss: 0.0000
Epoch [11/20], Step [13300/60000], Loss: 0.0000
Epoch [11/20], Step [13400/60000], Loss: 0.1084
Epoch [11/20], Step [13500/60000], Loss: 0.0000
Epoch [11/20], Step [13600/60000], Loss: 0.1951
Epoch [11/20], Step [13700/60000], Loss: 0.0000
Epoch [11/20], Step [13800/60000], Loss: 0.0000
Epoch [11/20], Step [13900/60000], Loss: 0.0094
Epoch [11/20], Step [14000/60000], Loss: 0.0000
Epoch [11/20], Step [14100/60000], Loss: 0.0000
Epoch [11/20], Step [14200/60000], Loss: 0.0000
Epoch [11/20], Step [14300/60000], Loss: 0.0000
Epoch [11/20], Step [14400/60000], Loss: 0.0000
Epoch [11/20], Step [14500/60000], Loss: 0.0000
Epoch [11/20], Step [14600/60000], Loss: 0.0000
Epoch [11/20], Step [14700/60000], Loss: 0.0001
Epoch [11/20], Step [14800/60000], Loss: 0.0000
Epoch [11/20], Step [14900/60000], Loss: 0.0000
Epoch [11/20], Step [15000/60000], Loss: 0.0000
Epoch [11/20], Step [15100/60000], Loss:

Epoch [11/20], Step [30200/60000], Loss: 0.0000
Epoch [11/20], Step [30300/60000], Loss: 0.0000
Epoch [11/20], Step [30400/60000], Loss: 0.0000
Epoch [11/20], Step [30500/60000], Loss: 0.0000
Epoch [11/20], Step [30600/60000], Loss: 0.0000
Epoch [11/20], Step [30700/60000], Loss: 0.0000
Epoch [11/20], Step [30800/60000], Loss: 0.0000
Epoch [11/20], Step [30900/60000], Loss: 0.0000
Epoch [11/20], Step [31000/60000], Loss: 0.0000
Epoch [11/20], Step [31100/60000], Loss: 0.0000
Epoch [11/20], Step [31200/60000], Loss: 0.0000
Epoch [11/20], Step [31300/60000], Loss: 0.0000
Epoch [11/20], Step [31400/60000], Loss: 0.0000
Epoch [11/20], Step [31500/60000], Loss: 0.0000
Epoch [11/20], Step [31600/60000], Loss: 0.0000
Epoch [11/20], Step [31700/60000], Loss: 0.0000
Epoch [11/20], Step [31800/60000], Loss: 0.0000
Epoch [11/20], Step [31900/60000], Loss: 0.0000
Epoch [11/20], Step [32000/60000], Loss: 0.0000
Epoch [11/20], Step [32100/60000], Loss: 0.0000
Epoch [11/20], Step [32200/60000], Loss:

Epoch [11/20], Step [47300/60000], Loss: 0.0000
Epoch [11/20], Step [47400/60000], Loss: 0.0000
Epoch [11/20], Step [47500/60000], Loss: 0.0000
Epoch [11/20], Step [47600/60000], Loss: 0.0000
Epoch [11/20], Step [47700/60000], Loss: 0.0000
Epoch [11/20], Step [47800/60000], Loss: 0.0000
Epoch [11/20], Step [47900/60000], Loss: 0.0000
Epoch [11/20], Step [48000/60000], Loss: 0.0000
Epoch [11/20], Step [48100/60000], Loss: 0.0000
Epoch [11/20], Step [48200/60000], Loss: 0.0000
Epoch [11/20], Step [48300/60000], Loss: 0.0000
Epoch [11/20], Step [48400/60000], Loss: 0.0000
Epoch [11/20], Step [48500/60000], Loss: 0.0000
Epoch [11/20], Step [48600/60000], Loss: 0.0000
Epoch [11/20], Step [48700/60000], Loss: 0.0000
Epoch [11/20], Step [48800/60000], Loss: 0.0000
Epoch [11/20], Step [48900/60000], Loss: 0.0000
Epoch [11/20], Step [49000/60000], Loss: 0.0000
Epoch [11/20], Step [49100/60000], Loss: 0.0000
Epoch [11/20], Step [49200/60000], Loss: 0.0000
Epoch [11/20], Step [49300/60000], Loss:

Epoch [12/20], Step [4500/60000], Loss: 0.0000
Epoch [12/20], Step [4600/60000], Loss: 0.0000
Epoch [12/20], Step [4700/60000], Loss: 0.0000
Epoch [12/20], Step [4800/60000], Loss: 0.0000
Epoch [12/20], Step [4900/60000], Loss: 0.0000
Epoch [12/20], Step [5000/60000], Loss: 0.0000
Epoch [12/20], Step [5100/60000], Loss: 0.0000
Epoch [12/20], Step [5200/60000], Loss: 0.0000
Epoch [12/20], Step [5300/60000], Loss: 0.0000
Epoch [12/20], Step [5400/60000], Loss: 0.0000
Epoch [12/20], Step [5500/60000], Loss: 0.0000
Epoch [12/20], Step [5600/60000], Loss: 0.0000
Epoch [12/20], Step [5700/60000], Loss: 0.0000
Epoch [12/20], Step [5800/60000], Loss: 0.0000
Epoch [12/20], Step [5900/60000], Loss: 0.0000
Epoch [12/20], Step [6000/60000], Loss: 0.0000
Epoch [12/20], Step [6100/60000], Loss: 0.0000
Epoch [12/20], Step [6200/60000], Loss: 0.0000
Epoch [12/20], Step [6300/60000], Loss: 0.0000
Epoch [12/20], Step [6400/60000], Loss: 0.0000
Epoch [12/20], Step [6500/60000], Loss: 0.0000
Epoch [12/20]

Epoch [12/20], Step [21700/60000], Loss: 0.0000
Epoch [12/20], Step [21800/60000], Loss: 0.0000
Epoch [12/20], Step [21900/60000], Loss: 0.0000
Epoch [12/20], Step [22000/60000], Loss: 0.0000
Epoch [12/20], Step [22100/60000], Loss: 0.0000
Epoch [12/20], Step [22200/60000], Loss: 0.0000
Epoch [12/20], Step [22300/60000], Loss: 0.0000
Epoch [12/20], Step [22400/60000], Loss: 0.0000
Epoch [12/20], Step [22500/60000], Loss: 0.0000
Epoch [12/20], Step [22600/60000], Loss: 0.0000
Epoch [12/20], Step [22700/60000], Loss: 0.0000
Epoch [12/20], Step [22800/60000], Loss: 0.0000
Epoch [12/20], Step [22900/60000], Loss: 0.0000
Epoch [12/20], Step [23000/60000], Loss: 1.6542
Epoch [12/20], Step [23100/60000], Loss: 0.0000
Epoch [12/20], Step [23200/60000], Loss: 0.0000
Epoch [12/20], Step [23300/60000], Loss: 0.0000
Epoch [12/20], Step [23400/60000], Loss: 0.0000
Epoch [12/20], Step [23500/60000], Loss: 0.0000
Epoch [12/20], Step [23600/60000], Loss: 0.0000
Epoch [12/20], Step [23700/60000], Loss:

Epoch [12/20], Step [38800/60000], Loss: 0.0000
Epoch [12/20], Step [38900/60000], Loss: 0.0000
Epoch [12/20], Step [39000/60000], Loss: 0.4961
Epoch [12/20], Step [39100/60000], Loss: 0.0000
Epoch [12/20], Step [39200/60000], Loss: 0.0000
Epoch [12/20], Step [39300/60000], Loss: 0.0000
Epoch [12/20], Step [39400/60000], Loss: 0.0000
Epoch [12/20], Step [39500/60000], Loss: 0.0000
Epoch [12/20], Step [39600/60000], Loss: 0.0000
Epoch [12/20], Step [39700/60000], Loss: 0.0000
Epoch [12/20], Step [39800/60000], Loss: 0.0000
Epoch [12/20], Step [39900/60000], Loss: 0.0000
Epoch [12/20], Step [40000/60000], Loss: 0.0000
Epoch [12/20], Step [40100/60000], Loss: 0.0000
Epoch [12/20], Step [40200/60000], Loss: 0.0000
Epoch [12/20], Step [40300/60000], Loss: 0.0000
Epoch [12/20], Step [40400/60000], Loss: 0.0000
Epoch [12/20], Step [40500/60000], Loss: 0.0000
Epoch [12/20], Step [40600/60000], Loss: 0.0000
Epoch [12/20], Step [40700/60000], Loss: 0.0000
Epoch [12/20], Step [40800/60000], Loss:

Epoch [12/20], Step [55900/60000], Loss: 0.0000
Epoch [12/20], Step [56000/60000], Loss: 0.0000
Epoch [12/20], Step [56100/60000], Loss: 0.0000
Epoch [12/20], Step [56200/60000], Loss: 0.0000
Epoch [12/20], Step [56300/60000], Loss: 0.0000
Epoch [12/20], Step [56400/60000], Loss: 0.0000
Epoch [12/20], Step [56500/60000], Loss: 0.0000
Epoch [12/20], Step [56600/60000], Loss: 0.0000
Epoch [12/20], Step [56700/60000], Loss: 0.0000
Epoch [12/20], Step [56800/60000], Loss: 0.0000
Epoch [12/20], Step [56900/60000], Loss: 0.0000
Epoch [12/20], Step [57000/60000], Loss: 0.0000
Epoch [12/20], Step [57100/60000], Loss: 0.0000
Epoch [12/20], Step [57200/60000], Loss: 0.0000
Epoch [12/20], Step [57300/60000], Loss: 0.0000
Epoch [12/20], Step [57400/60000], Loss: 0.0000
Epoch [12/20], Step [57500/60000], Loss: 0.0000
Epoch [12/20], Step [57600/60000], Loss: 0.0000
Epoch [12/20], Step [57700/60000], Loss: 0.0000
Epoch [12/20], Step [57800/60000], Loss: 0.0035
Epoch [12/20], Step [57900/60000], Loss:

Epoch [13/20], Step [13200/60000], Loss: 0.0000
Epoch [13/20], Step [13300/60000], Loss: 0.0000
Epoch [13/20], Step [13400/60000], Loss: 0.0000
Epoch [13/20], Step [13500/60000], Loss: 0.0000
Epoch [13/20], Step [13600/60000], Loss: 0.0000
Epoch [13/20], Step [13700/60000], Loss: 0.0000
Epoch [13/20], Step [13800/60000], Loss: 0.0000
Epoch [13/20], Step [13900/60000], Loss: 0.0000
Epoch [13/20], Step [14000/60000], Loss: 0.0000
Epoch [13/20], Step [14100/60000], Loss: 0.0000
Epoch [13/20], Step [14200/60000], Loss: 0.0000
Epoch [13/20], Step [14300/60000], Loss: 0.0000
Epoch [13/20], Step [14400/60000], Loss: 0.0000
Epoch [13/20], Step [14500/60000], Loss: 0.0000
Epoch [13/20], Step [14600/60000], Loss: 0.0000
Epoch [13/20], Step [14700/60000], Loss: 0.0000
Epoch [13/20], Step [14800/60000], Loss: 0.0000
Epoch [13/20], Step [14900/60000], Loss: 0.0000
Epoch [13/20], Step [15000/60000], Loss: 0.0000
Epoch [13/20], Step [15100/60000], Loss: 0.0000
Epoch [13/20], Step [15200/60000], Loss:

Epoch [13/20], Step [30300/60000], Loss: 0.0000
Epoch [13/20], Step [30400/60000], Loss: 0.0000
Epoch [13/20], Step [30500/60000], Loss: 0.0000
Epoch [13/20], Step [30600/60000], Loss: 0.0000
Epoch [13/20], Step [30700/60000], Loss: 0.0000
Epoch [13/20], Step [30800/60000], Loss: 0.0000
Epoch [13/20], Step [30900/60000], Loss: 0.0000
Epoch [13/20], Step [31000/60000], Loss: 0.0000
Epoch [13/20], Step [31100/60000], Loss: 0.0000
Epoch [13/20], Step [31200/60000], Loss: 0.0000
Epoch [13/20], Step [31300/60000], Loss: 0.0000
Epoch [13/20], Step [31400/60000], Loss: 0.0000
Epoch [13/20], Step [31500/60000], Loss: 0.0000
Epoch [13/20], Step [31600/60000], Loss: 0.0000
Epoch [13/20], Step [31700/60000], Loss: 0.0000
Epoch [13/20], Step [31800/60000], Loss: 0.0000
Epoch [13/20], Step [31900/60000], Loss: 0.0000
Epoch [13/20], Step [32000/60000], Loss: 0.0000
Epoch [13/20], Step [32100/60000], Loss: 0.0000
Epoch [13/20], Step [32200/60000], Loss: 0.0000
Epoch [13/20], Step [32300/60000], Loss:

Epoch [13/20], Step [47400/60000], Loss: 0.0000
Epoch [13/20], Step [47500/60000], Loss: 0.0000
Epoch [13/20], Step [47600/60000], Loss: 0.0000
Epoch [13/20], Step [47700/60000], Loss: 0.0000
Epoch [13/20], Step [47800/60000], Loss: 0.0000
Epoch [13/20], Step [47900/60000], Loss: 0.0000
Epoch [13/20], Step [48000/60000], Loss: 0.0000
Epoch [13/20], Step [48100/60000], Loss: 0.0000
Epoch [13/20], Step [48200/60000], Loss: 0.0000
Epoch [13/20], Step [48300/60000], Loss: 0.0000
Epoch [13/20], Step [48400/60000], Loss: 0.0000
Epoch [13/20], Step [48500/60000], Loss: 0.0000
Epoch [13/20], Step [48600/60000], Loss: 0.0000
Epoch [13/20], Step [48700/60000], Loss: 0.0000
Epoch [13/20], Step [48800/60000], Loss: 0.0000
Epoch [13/20], Step [48900/60000], Loss: 0.0000
Epoch [13/20], Step [49000/60000], Loss: 0.0000
Epoch [13/20], Step [49100/60000], Loss: 0.0000
Epoch [13/20], Step [49200/60000], Loss: 0.0000
Epoch [13/20], Step [49300/60000], Loss: 0.0000
Epoch [13/20], Step [49400/60000], Loss:

Epoch [14/20], Step [4600/60000], Loss: 0.0000
Epoch [14/20], Step [4700/60000], Loss: 0.0000
Epoch [14/20], Step [4800/60000], Loss: 0.0000
Epoch [14/20], Step [4900/60000], Loss: 0.0000
Epoch [14/20], Step [5000/60000], Loss: 0.0000
Epoch [14/20], Step [5100/60000], Loss: 0.0000
Epoch [14/20], Step [5200/60000], Loss: 0.0000
Epoch [14/20], Step [5300/60000], Loss: 0.0000
Epoch [14/20], Step [5400/60000], Loss: 0.0000
Epoch [14/20], Step [5500/60000], Loss: 0.0000
Epoch [14/20], Step [5600/60000], Loss: 0.0000
Epoch [14/20], Step [5700/60000], Loss: 0.0000
Epoch [14/20], Step [5800/60000], Loss: 0.0000
Epoch [14/20], Step [5900/60000], Loss: 0.0000
Epoch [14/20], Step [6000/60000], Loss: 0.0000
Epoch [14/20], Step [6100/60000], Loss: 0.0000
Epoch [14/20], Step [6200/60000], Loss: 0.0000
Epoch [14/20], Step [6300/60000], Loss: 0.0000
Epoch [14/20], Step [6400/60000], Loss: 0.0000
Epoch [14/20], Step [6500/60000], Loss: 0.0000
Epoch [14/20], Step [6600/60000], Loss: 0.0000
Epoch [14/20]

Epoch [14/20], Step [21800/60000], Loss: 0.0000
Epoch [14/20], Step [21900/60000], Loss: 0.0000
Epoch [14/20], Step [22000/60000], Loss: 0.0000
Epoch [14/20], Step [22100/60000], Loss: 0.0000
Epoch [14/20], Step [22200/60000], Loss: 0.0000
Epoch [14/20], Step [22300/60000], Loss: 0.0000
Epoch [14/20], Step [22400/60000], Loss: 0.0000
Epoch [14/20], Step [22500/60000], Loss: 0.0000
Epoch [14/20], Step [22600/60000], Loss: 0.0000
Epoch [14/20], Step [22700/60000], Loss: 0.0000
Epoch [14/20], Step [22800/60000], Loss: 0.0000
Epoch [14/20], Step [22900/60000], Loss: 0.0000
Epoch [14/20], Step [23000/60000], Loss: 0.0000
Epoch [14/20], Step [23100/60000], Loss: 0.0000
Epoch [14/20], Step [23200/60000], Loss: 0.0000
Epoch [14/20], Step [23300/60000], Loss: 0.0000
Epoch [14/20], Step [23400/60000], Loss: 0.0000
Epoch [14/20], Step [23500/60000], Loss: 0.0000
Epoch [14/20], Step [23600/60000], Loss: 0.0000
Epoch [14/20], Step [23700/60000], Loss: 0.0000
Epoch [14/20], Step [23800/60000], Loss:

Epoch [14/20], Step [38900/60000], Loss: 0.0000
Epoch [14/20], Step [39000/60000], Loss: 0.0000
Epoch [14/20], Step [39100/60000], Loss: 0.0000
Epoch [14/20], Step [39200/60000], Loss: 0.0000
Epoch [14/20], Step [39300/60000], Loss: 0.0000
Epoch [14/20], Step [39400/60000], Loss: 0.0000
Epoch [14/20], Step [39500/60000], Loss: 0.0000
Epoch [14/20], Step [39600/60000], Loss: 0.0000
Epoch [14/20], Step [39700/60000], Loss: 0.0000
Epoch [14/20], Step [39800/60000], Loss: 0.0000
Epoch [14/20], Step [39900/60000], Loss: 0.0000
Epoch [14/20], Step [40000/60000], Loss: 0.0000
Epoch [14/20], Step [40100/60000], Loss: 0.0000
Epoch [14/20], Step [40200/60000], Loss: 0.0000
Epoch [14/20], Step [40300/60000], Loss: 0.0000
Epoch [14/20], Step [40400/60000], Loss: 0.0000
Epoch [14/20], Step [40500/60000], Loss: 0.0000
Epoch [14/20], Step [40600/60000], Loss: 0.0000
Epoch [14/20], Step [40700/60000], Loss: 0.0000
Epoch [14/20], Step [40800/60000], Loss: 0.0000
Epoch [14/20], Step [40900/60000], Loss:

Epoch [14/20], Step [56000/60000], Loss: 0.0000
Epoch [14/20], Step [56100/60000], Loss: 0.0000
Epoch [14/20], Step [56200/60000], Loss: 0.0000
Epoch [14/20], Step [56300/60000], Loss: 0.0000
Epoch [14/20], Step [56400/60000], Loss: 0.0000
Epoch [14/20], Step [56500/60000], Loss: 0.0000
Epoch [14/20], Step [56600/60000], Loss: 0.0000
Epoch [14/20], Step [56700/60000], Loss: 0.0000
Epoch [14/20], Step [56800/60000], Loss: 0.0000
Epoch [14/20], Step [56900/60000], Loss: 0.0000
Epoch [14/20], Step [57000/60000], Loss: 0.0000
Epoch [14/20], Step [57100/60000], Loss: 0.0000
Epoch [14/20], Step [57200/60000], Loss: 0.0000
Epoch [14/20], Step [57300/60000], Loss: 0.0000
Epoch [14/20], Step [57400/60000], Loss: 0.0000
Epoch [14/20], Step [57500/60000], Loss: 0.0000
Epoch [14/20], Step [57600/60000], Loss: 0.0000
Epoch [14/20], Step [57700/60000], Loss: 0.0000
Epoch [14/20], Step [57800/60000], Loss: 0.0000
Epoch [14/20], Step [57900/60000], Loss: 0.0000
Epoch [14/20], Step [58000/60000], Loss:

Epoch [15/20], Step [13300/60000], Loss: 0.0000
Epoch [15/20], Step [13400/60000], Loss: 0.0000
Epoch [15/20], Step [13500/60000], Loss: 0.0000
Epoch [15/20], Step [13600/60000], Loss: 0.0000
Epoch [15/20], Step [13700/60000], Loss: 0.0000
Epoch [15/20], Step [13800/60000], Loss: 0.0000
Epoch [15/20], Step [13900/60000], Loss: 0.0000
Epoch [15/20], Step [14000/60000], Loss: 0.0000
Epoch [15/20], Step [14100/60000], Loss: 0.0000
Epoch [15/20], Step [14200/60000], Loss: 0.0000
Epoch [15/20], Step [14300/60000], Loss: 0.0000
Epoch [15/20], Step [14400/60000], Loss: 0.0000
Epoch [15/20], Step [14500/60000], Loss: 0.0000
Epoch [15/20], Step [14600/60000], Loss: 0.0000
Epoch [15/20], Step [14700/60000], Loss: 0.0000
Epoch [15/20], Step [14800/60000], Loss: 0.0000
Epoch [15/20], Step [14900/60000], Loss: 0.0000
Epoch [15/20], Step [15000/60000], Loss: 0.0000
Epoch [15/20], Step [15100/60000], Loss: 0.0000
Epoch [15/20], Step [15200/60000], Loss: 0.0000
Epoch [15/20], Step [15300/60000], Loss:

Epoch [15/20], Step [30400/60000], Loss: 0.0000
Epoch [15/20], Step [30500/60000], Loss: 0.0000
Epoch [15/20], Step [30600/60000], Loss: 0.0000
Epoch [15/20], Step [30700/60000], Loss: 0.0000
Epoch [15/20], Step [30800/60000], Loss: 0.0000
Epoch [15/20], Step [30900/60000], Loss: 0.0000
Epoch [15/20], Step [31000/60000], Loss: 0.0000
Epoch [15/20], Step [31100/60000], Loss: 0.0000
Epoch [15/20], Step [31200/60000], Loss: 0.0000
Epoch [15/20], Step [31300/60000], Loss: 0.0000
Epoch [15/20], Step [31400/60000], Loss: 0.0000
Epoch [15/20], Step [31500/60000], Loss: 0.0000
Epoch [15/20], Step [31600/60000], Loss: 0.0008
Epoch [15/20], Step [31700/60000], Loss: 0.0000
Epoch [15/20], Step [31800/60000], Loss: 0.0000
Epoch [15/20], Step [31900/60000], Loss: 0.0000
Epoch [15/20], Step [32000/60000], Loss: 0.0000
Epoch [15/20], Step [32100/60000], Loss: 0.0000
Epoch [15/20], Step [32200/60000], Loss: 0.0000
Epoch [15/20], Step [32300/60000], Loss: 0.0000
Epoch [15/20], Step [32400/60000], Loss:

Epoch [15/20], Step [47500/60000], Loss: 0.0000
Epoch [15/20], Step [47600/60000], Loss: 0.0000
Epoch [15/20], Step [47700/60000], Loss: 0.0000
Epoch [15/20], Step [47800/60000], Loss: 0.0000
Epoch [15/20], Step [47900/60000], Loss: 0.0000
Epoch [15/20], Step [48000/60000], Loss: 0.0000
Epoch [15/20], Step [48100/60000], Loss: 0.0000
Epoch [15/20], Step [48200/60000], Loss: 0.0000
Epoch [15/20], Step [48300/60000], Loss: 0.0000
Epoch [15/20], Step [48400/60000], Loss: 0.0000
Epoch [15/20], Step [48500/60000], Loss: 0.0000
Epoch [15/20], Step [48600/60000], Loss: 0.0000
Epoch [15/20], Step [48700/60000], Loss: 0.0000
Epoch [15/20], Step [48800/60000], Loss: 0.0000
Epoch [15/20], Step [48900/60000], Loss: 0.0000
Epoch [15/20], Step [49000/60000], Loss: 0.0000
Epoch [15/20], Step [49100/60000], Loss: 0.0000
Epoch [15/20], Step [49200/60000], Loss: 0.0000
Epoch [15/20], Step [49300/60000], Loss: 0.0000
Epoch [15/20], Step [49400/60000], Loss: 0.0000
Epoch [15/20], Step [49500/60000], Loss:

Epoch [16/20], Step [4700/60000], Loss: 0.0000
Epoch [16/20], Step [4800/60000], Loss: 0.0000
Epoch [16/20], Step [4900/60000], Loss: 0.0000
Epoch [16/20], Step [5000/60000], Loss: 0.0000
Epoch [16/20], Step [5100/60000], Loss: 0.0000
Epoch [16/20], Step [5200/60000], Loss: 0.0000
Epoch [16/20], Step [5300/60000], Loss: 0.0000
Epoch [16/20], Step [5400/60000], Loss: 0.0000
Epoch [16/20], Step [5500/60000], Loss: 0.0000
Epoch [16/20], Step [5600/60000], Loss: 0.0000
Epoch [16/20], Step [5700/60000], Loss: 0.0000
Epoch [16/20], Step [5800/60000], Loss: 0.0000
Epoch [16/20], Step [5900/60000], Loss: 0.0000
Epoch [16/20], Step [6000/60000], Loss: 0.0000
Epoch [16/20], Step [6100/60000], Loss: 2.8234
Epoch [16/20], Step [6200/60000], Loss: 0.0000
Epoch [16/20], Step [6300/60000], Loss: 0.0000
Epoch [16/20], Step [6400/60000], Loss: 0.0000
Epoch [16/20], Step [6500/60000], Loss: 0.0000
Epoch [16/20], Step [6600/60000], Loss: 0.0000
Epoch [16/20], Step [6700/60000], Loss: 0.0000
Epoch [16/20]

Epoch [16/20], Step [21900/60000], Loss: 0.0000
Epoch [16/20], Step [22000/60000], Loss: 0.0000
Epoch [16/20], Step [22100/60000], Loss: 0.0000
Epoch [16/20], Step [22200/60000], Loss: 0.0000
Epoch [16/20], Step [22300/60000], Loss: 0.0000
Epoch [16/20], Step [22400/60000], Loss: 0.0000
Epoch [16/20], Step [22500/60000], Loss: 0.0000
Epoch [16/20], Step [22600/60000], Loss: 0.0000
Epoch [16/20], Step [22700/60000], Loss: 0.0000
Epoch [16/20], Step [22800/60000], Loss: 0.0000
Epoch [16/20], Step [22900/60000], Loss: 0.0000
Epoch [16/20], Step [23000/60000], Loss: 0.0000
Epoch [16/20], Step [23100/60000], Loss: 0.0000
Epoch [16/20], Step [23200/60000], Loss: 0.0000
Epoch [16/20], Step [23300/60000], Loss: 0.0000
Epoch [16/20], Step [23400/60000], Loss: 0.0000
Epoch [16/20], Step [23500/60000], Loss: 0.0000
Epoch [16/20], Step [23600/60000], Loss: 0.0000
Epoch [16/20], Step [23700/60000], Loss: 0.0000
Epoch [16/20], Step [23800/60000], Loss: 0.0000
Epoch [16/20], Step [23900/60000], Loss:

Epoch [16/20], Step [39000/60000], Loss: 0.0000
Epoch [16/20], Step [39100/60000], Loss: 0.0000
Epoch [16/20], Step [39200/60000], Loss: 0.0000
Epoch [16/20], Step [39300/60000], Loss: 0.0000
Epoch [16/20], Step [39400/60000], Loss: 0.0000
Epoch [16/20], Step [39500/60000], Loss: 0.0000
Epoch [16/20], Step [39600/60000], Loss: 0.0000
Epoch [16/20], Step [39700/60000], Loss: 0.0000
Epoch [16/20], Step [39800/60000], Loss: 0.0000
Epoch [16/20], Step [39900/60000], Loss: 0.0000
Epoch [16/20], Step [40000/60000], Loss: 0.0000
Epoch [16/20], Step [40100/60000], Loss: 0.0000


In [None]:
# Test the model
# Measures classification accuracy over every batch yielded by `test_loader`,
# then writes the model's parameters to disk.

# Put the model in inference mode so that any mode-dependent layers
# (e.g. dropout / batch-norm, if the model has them) use evaluation behaviour.
model.eval()

# In the test phase, don't need to compute gradients (for memory efficiency)
with torch.no_grad():
    correct = 0
    total = 0
    for images, labels in test_loader:
        # Flatten each image to a 28*28-element row so it matches the
        # fully connected input layer.
        images = images.reshape(-1, 28*28).to(device)
        labels = labels.to(device)
        outputs = model(images)
        # Index of the largest score along dim 1 is the predicted class.
        # `.data` is not needed here: autograd is already disabled by no_grad().
        _, predicted = torch.max(outputs, 1)
        total += labels.size(0)
        correct += (predicted == labels).sum().item()

    print('Accuracy of the network on the 10000 test images: {} %'.format(100 * correct / total))

# Save the model checkpoint
# Only the parameters (state_dict) are stored, not the full module object.
torch.save(model.state_dict(), 'model.ckpt')

### Confusion Matrix