In [7]:
from __future__ import print_function
import argparse
import torch
import torch.utils.data
from torch import nn, optim
from torch.nn import functional as F
from torchvision import datasets, transforms
from torchvision.utils import save_image

"""
parser = argparse.ArgumentParser(description='VAE MNIST Example')
parser.add_argument('--batch-size', type=int, default=128, metavar='N',
                    help='input batch size for training (default: 128)')
parser.add_argument('--epochs', type=int, default=10, metavar='N',
                    help='number of epochs to train (default: 10)')
parser.add_argument('--no-cuda', action='store_true', default=False,
                    help='enables CUDA training')
parser.add_argument('--seed', type=int, default=1, metavar='S',
                    help='random seed (default: 1)')
parser.add_argument('--log-interval', type=int, default=10, metavar='N',
                    help='how many batches to wait before logging training status')
args = parser.parse_args()
args.cuda = not args.no_cuda and torch.cuda.is_available()
"""


cuda = True
batch_size = 128
epochs = 10
seed = 1
log_interval = 10




#torch.manual_seed(args.seed)
torch.manual_seed(seed)

#device = torch.device("cuda" if args.cuda else "cpu")
device = torch.device("cuda" if cuda else "cpu")

#kwargs = {'num_workers': 1, 'pin_memory': True} if args.cuda else {}
kwargs = {'num_workers': 1, 'pin_memory': True} if cuda else {}
train_loader = torch.utils.data.DataLoader(
    datasets.MNIST('../data', train=True, download=True,
                   transform=transforms.ToTensor()),
    batch_size=batch_size, shuffle=True, **kwargs)
test_loader = torch.utils.data.DataLoader(
    datasets.MNIST('../data', train=False, transform=transforms.ToTensor()),
    batch_size=batch_size, shuffle=True, **kwargs)


class VAE(nn.Module):
    """Fully connected variational autoencoder.

    The encoder is one hidden ReLU layer followed by two parallel linear
    heads that produce the mean and the log-variance of the latent code.
    The decoder is one hidden ReLU layer followed by a sigmoid output layer.

    Args:
        input_dim: Number of features per flattened input sample
            (default 784).
        hidden_dim: Width of the hidden layer in both encoder and decoder
            (default 400).
        latent_dim: Size of the latent code (default 20).
    """

    def __init__(self, input_dim=784, hidden_dim=400, latent_dim=20):
        super(VAE, self).__init__()

        # Remembered so forward() can flatten inputs to the right width.
        self.input_dim = input_dim

        # Layers are created in the same order as before so that seeded
        # initialisation is unchanged for the default sizes.
        self.fc1 = nn.Linear(input_dim, hidden_dim)
        self.fc21 = nn.Linear(hidden_dim, latent_dim)   # mean head
        self.fc22 = nn.Linear(hidden_dim, latent_dim)   # log-variance head
        self.fc3 = nn.Linear(latent_dim, hidden_dim)
        self.fc4 = nn.Linear(hidden_dim, input_dim)

    def encode(self, x):
        """Return ``(mu, logvar)`` for a batch of flattened inputs ``x``."""
        h1 = F.relu(self.fc1(x))
        return self.fc21(h1), self.fc22(h1)

    def reparameterize(self, mu, logvar):
        """Draw a latent code from ``mu`` and ``logvar``.

        In training mode this returns ``mu + eps * std`` with
        ``std = exp(0.5 * logvar)`` and ``eps`` standard-normal noise, so the
        sample stays differentiable w.r.t. ``mu`` and ``logvar``. In eval mode
        it returns ``mu`` unchanged.
        """
        if self.training:
            std = torch.exp(0.5*logvar)
            eps = torch.randn_like(std)
            return eps.mul(std).add_(mu)
        else:
            return mu

    def decode(self, z):
        """Map latent codes ``z`` to reconstructions with values in [0, 1]."""
        h3 = F.relu(self.fc3(z))
        # torch.sigmoid replaces the F.sigmoid alias, which older PyTorch
        # releases flag as deprecated.
        return torch.sigmoid(self.fc4(h3))

    def forward(self, x):
        """Encode, sample and decode ``x``.

        ``x`` is flattened to ``(-1, input_dim)`` before encoding.

        Returns:
            Tuple ``(reconstruction, mu, logvar)``.
        """
        mu, logvar = self.encode(x.view(-1, self.input_dim))
        z = self.reparameterize(mu, logvar)
        return self.decode(z), mu, logvar


# Build the network, move its parameters to the selected device, and attach
# an Adam optimiser with learning rate 1e-3 to those parameters.
model = VAE()
model = model.to(device)
optimizer = optim.Adam(params=model.parameters(), lr=1e-3)


# Reconstruction + KL divergence losses summed over all elements and batch
def loss_function(recon_x, x, mu, logvar):
    """Return the VAE loss: reconstruction BCE plus KL divergence.

    Both terms are summed (not averaged) over every element of the batch,
    so callers divide by the number of samples to get a per-sample value.

    Args:
        recon_x: Reconstruction probabilities in [0, 1], i.e. the decoder
            output *after* the sigmoid. For raw logits use
            ``binary_cross_entropy_with_logits`` instead.
        x: Target batch; reshaped to the shape of ``recon_x``.
        mu: Latent means.
        logvar: Latent log-variances.

    Returns:
        Scalar tensor ``BCE + KLD``.
    """
    # reduction='sum' is the current spelling of the deprecated
    # size_average=False. view_as keeps the target aligned with the
    # reconstruction without hard-coding the flattened image size.
    bce = F.binary_cross_entropy(recon_x, x.view_as(recon_x), reduction='sum')

    # see Appendix B from VAE paper:
    # Kingma and Welling. Auto-Encoding Variational Bayes. ICLR, 2014
    # https://arxiv.org/abs/1312.6114
    # KLD = -0.5 * sum(1 + log(sigma^2) - mu^2 - sigma^2)
    kld = -0.5 * torch.sum(1 + logvar - mu.pow(2) - logvar.exp())

    return bce + kld


def train(epoch, debug=True):
    """Run one optimisation pass over ``train_loader``.

    Uses the module-level ``model``, ``optimizer``, ``device``,
    ``loss_function`` and ``log_interval``.

    Args:
        epoch: Epoch number, used only in the printed progress messages.
        debug: When true (the default, which keeps the existing output), print
            the latent variances and the per-sample loss for *every* batch.
            Pass ``False`` to keep only the ``log_interval`` progress lines
            and the end-of-epoch summary.
    """
    model.train()
    train_loss = 0
    for batch_idx, (data, _) in enumerate(train_loader):
        data = data.to(device)
        optimizer.zero_grad()
        recon_batch, mu, logvar = model(data)
        loss = loss_function(recon_batch, data, mu, logvar)
        # Read the scalar once and reuse it for every print and for the
        # running total, instead of calling .item() repeatedly.
        batch_loss = loss.item()
        if debug:
            print("var: "+str(torch.exp(logvar)))
            print("loss: "+str(batch_loss/len(data)))
        loss.backward()
        train_loss += batch_loss
        optimizer.step()
        if batch_idx % log_interval == 0:
            print('Train Epoch: {} [{}/{} ({:.0f}%)]\tLoss: {:.6f}'.format(
                epoch, batch_idx * len(data), len(train_loader.dataset),
                100. * batch_idx / len(train_loader),
                batch_loss / len(data)))

    # The loss is summed over samples, so divide by the dataset size to get
    # the average per-sample loss for the epoch.
    print('====> Epoch: {} Average loss: {:.4f}'.format(
          epoch, train_loss / len(train_loader.dataset)))


def test(epoch):
    """Evaluate the model on ``test_loader`` and save a reconstruction grid.

    Uses the module-level ``model``, ``device`` and ``loss_function``. For the
    first batch, up to 8 inputs and their reconstructions are written to
    ``results/reconstruction_<epoch>.png``. The ``results/`` directory is not
    created here, so it is expected to exist already.

    Args:
        epoch: Epoch number, used only in the output file name.
    """
    model.eval()
    test_loss = 0
    with torch.no_grad():
        for i, (data, _) in enumerate(test_loader):
            data = data.to(device)
            recon_batch, mu, logvar = model(data)
            test_loss += loss_function(recon_batch, data, mu, logvar).item()
            if i == 0:
                n = min(data.size(0), 8)
                # Reshape using the actual batch, not the configured
                # batch_size: the two differ when the batch is short, and
                # view(batch_size, ...) would then raise.
                comparison = torch.cat([data[:n],
                                        recon_batch.view_as(data)[:n]])
                save_image(comparison.cpu(),
                           'results/reconstruction_' + str(epoch) + '.png', nrow=n)

    # Loss is summed over samples; normalise to a per-sample average.
    test_loss /= len(test_loader.dataset)
    print('====> Test set loss: {:.4f}'.format(test_loss))


# Main driver: for each epoch, train, evaluate, then decode 64 random latent
# vectors and save them as an image grid under results/.
for epoch in range(1, epochs + 1):
    train(epoch)
    test(epoch)
    with torch.no_grad():
        # Latent codes drawn from a standard normal, created on the CPU and
        # then moved to the model's device.
        prior_noise = torch.randn(64, 20).to(device)
        sample = model.decode(prior_noise).cpu()
        sample_path = 'results/sample_{}.png'.format(epoch)
        save_image(sample.view(64, 1, 28, 28), sample_path)

var: tensor([[ 1.1782,  0.8515,  1.0940,  ...,  0.8643,  0.9668,  0.9706],
        [ 1.0580,  0.9721,  0.9502,  ...,  0.9682,  0.9837,  0.9705],
        [ 1.1617,  0.9663,  0.9707,  ...,  0.9858,  0.9584,  0.9860],
        ...,
        [ 1.1230,  0.9552,  1.0000,  ...,  0.9267,  0.9816,  0.9507],
        [ 1.1661,  0.9986,  1.0591,  ...,  1.0481,  0.9561,  1.0799],
        [ 1.1048,  0.9539,  1.0786,  ...,  0.9627,  0.9527,  1.0502]], device='cuda:0')
loss: 550.533935546875
var: tensor([[ 1.0796,  0.7673,  0.8584,  ...,  0.7815,  0.8559,  0.9554],
        [ 1.0496,  0.8532,  0.9247,  ...,  0.8541,  0.9616,  0.8868],
        [ 1.0548,  0.8855,  0.8624,  ...,  0.8406,  0.9457,  0.9093],
        ...,
        [ 1.1076,  0.8541,  0.9705,  ...,  0.8133,  0.9215,  0.8864],
        [ 1.0507,  0.7393,  0.8018,  ...,  0.7745,  0.9037,  0.8419],
        [ 1.0024,  0.8035,  0.8333,  ...,  0.7731,  0.8878,  0.9596]], device='cuda:0')
loss: 524.7174072265625
var: tensor([[ 1.0780,  0.8557,  0.9668, 

var: tensor([[ 1.5859,  1.6430,  1.4111,  ...,  1.3620,  1.1278,  0.8353],
        [ 1.4167,  1.4803,  1.3889,  ...,  1.2685,  1.1509,  0.9777],
        [ 1.4834,  1.8299,  1.3650,  ...,  1.5066,  1.2126,  0.8945],
        ...,
        [ 1.6243,  1.9405,  1.4895,  ...,  1.4984,  1.2933,  0.9524],
        [ 1.5460,  1.9276,  1.5649,  ...,  1.4637,  1.5014,  0.9884],
        [ 1.5007,  1.5791,  1.3014,  ...,  1.3473,  1.1413,  0.9949]], device='cuda:0')
loss: 220.20741271972656
var: tensor([[ 1.4040,  1.5361,  1.2334,  ...,  1.2398,  1.1023,  0.9822],
        [ 1.3588,  1.4225,  1.2145,  ...,  1.2251,  1.0788,  0.8691],
        [ 1.3687,  1.7626,  1.3418,  ...,  1.3020,  1.1215,  0.8474],
        ...,
        [ 1.4469,  1.3419,  1.2859,  ...,  1.1433,  1.0060,  0.9948],
        [ 1.4815,  1.8467,  1.4196,  ...,  1.3137,  1.1842,  0.9544],
        [ 1.4554,  1.6248,  1.2514,  ...,  1.3272,  1.2012,  0.9049]], device='cuda:0')
loss: 223.70199584960938
var: tensor([[ 1.5477,  1.8109,  1.576

var: tensor([[ 1.1523,  1.1899,  1.0071,  ...,  1.1061,  0.7179,  0.6374],
        [ 1.1782,  1.2283,  1.0857,  ...,  1.1342,  0.7627,  0.6110],
        [ 1.0658,  1.0671,  0.9766,  ...,  1.0289,  0.7757,  0.6138],
        ...,
        [ 1.0651,  0.9063,  0.8659,  ...,  1.0302,  0.7206,  0.6343],
        [ 1.1603,  1.2113,  1.0775,  ...,  1.0216,  0.8757,  0.6295],
        [ 1.4675,  1.4463,  1.3603,  ...,  1.2301,  0.7238,  0.5573]], device='cuda:0')
loss: 211.1358642578125
var: tensor([[ 1.8680,  2.0850,  1.7268,  ...,  1.6558,  0.9745,  0.7404],
        [ 1.0522,  1.0734,  0.8216,  ...,  1.0911,  0.5792,  0.4718],
        [ 1.2601,  1.2490,  1.2196,  ...,  1.2174,  0.8189,  0.6956],
        ...,
        [ 1.1002,  1.0152,  1.0039,  ...,  0.9733,  0.8285,  0.8280],
        [ 1.1645,  1.0774,  1.0529,  ...,  1.0688,  0.7447,  0.5355],
        [ 1.1152,  1.1028,  1.0897,  ...,  1.1131,  0.8071,  0.6224]], device='cuda:0')
loss: 208.5605926513672
var: tensor([[ 1.1093,  1.0400,  0.9618,

loss: 190.5810546875
var: tensor([[ 0.7874,  0.8682,  0.7015,  ...,  0.8210,  0.4784,  0.4372],
        [ 0.8112,  0.9667,  0.7262,  ...,  0.8170,  0.4265,  0.4021],
        [ 0.7408,  0.9174,  0.7282,  ...,  0.7974,  0.3430,  0.3140],
        ...,
        [ 0.9803,  1.4119,  0.9244,  ...,  0.7706,  0.7163,  0.7107],
        [ 0.9238,  1.1974,  1.0405,  ...,  0.8919,  0.5536,  0.4909],
        [ 0.9248,  1.1978,  0.7726,  ...,  0.7495,  0.5674,  0.5599]], device='cuda:0')
loss: 195.196044921875
var: tensor([[ 0.9543,  1.2895,  1.0196,  ...,  0.8769,  0.7165,  0.6714],
        [ 0.8630,  1.0724,  0.8558,  ...,  0.7366,  0.3835,  0.3533],
        [ 0.8394,  0.9853,  0.8398,  ...,  0.8326,  0.4486,  0.3953],
        ...,
        [ 0.8532,  0.9804,  0.8920,  ...,  0.8665,  0.4608,  0.4860],
        [ 0.8779,  1.1167,  0.8902,  ...,  0.9565,  0.6477,  0.6119],
        [ 0.9851,  1.1518,  0.9218,  ...,  0.9093,  0.6425,  0.5768]], device='cuda:0')
loss: 197.09439086914062
var: tensor([[ 0.86

var: tensor([[ 0.6765,  0.8642,  0.5525,  ...,  0.8365,  0.3528,  0.5015],
        [ 0.7098,  0.8609,  0.6346,  ...,  0.8410,  0.4057,  0.6210],
        [ 0.4990,  0.5623,  0.2982,  ...,  0.5307,  0.2512,  0.4217],
        ...,
        [ 0.5758,  0.8077,  0.4441,  ...,  0.7541,  0.3555,  0.4822],
        [ 0.4926,  0.5940,  0.3455,  ...,  0.5660,  0.2362,  0.4103],
        [ 0.4930,  0.6393,  0.2370,  ...,  0.5560,  0.2510,  0.3542]], device='cuda:0')
loss: 182.35888671875
var: tensor([[ 0.5749,  0.5986,  0.3213,  ...,  0.7275,  0.3070,  0.3726],
        [ 0.6261,  0.8977,  0.3882,  ...,  0.6766,  0.2997,  0.4459],
        [ 0.5528,  0.7494,  0.3460,  ...,  0.7526,  0.2959,  0.3979],
        ...,
        [ 0.5300,  0.6791,  0.2963,  ...,  0.5714,  0.3039,  0.4384],
        [ 0.6435,  0.8430,  0.5070,  ...,  0.7275,  0.2637,  0.4985],
        [ 0.6892,  0.8131,  0.5769,  ...,  0.7349,  0.3843,  0.6533]], device='cuda:0')
loss: 183.93333435058594
var: tensor([[ 0.6589,  1.0118,  0.5934, 

var: tensor([[ 0.5216,  0.3513,  0.2644,  ...,  0.4748,  0.3262,  0.4240],
        [ 0.4905,  0.5479,  0.2945,  ...,  0.4689,  0.2666,  0.4769],
        [ 0.6767,  0.9298,  0.3862,  ...,  0.5823,  0.3582,  0.4407],
        ...,
        [ 0.4995,  0.6307,  0.2911,  ...,  0.4920,  0.2202,  0.3859],
        [ 0.2808,  0.2386,  0.1105,  ...,  0.2428,  0.0943,  0.1759],
        [ 0.7398,  0.8737,  0.5419,  ...,  0.6884,  0.4696,  0.6506]], device='cuda:0')
loss: 175.52027893066406
var: tensor([[ 0.3117,  0.3795,  0.1346,  ...,  0.2971,  0.1486,  0.2520],
        [ 0.6938,  0.8704,  0.4354,  ...,  0.7092,  0.4102,  0.6212],
        [ 0.6351,  0.7203,  0.4357,  ...,  0.6238,  0.4571,  0.6257],
        ...,
        [ 0.6182,  0.8763,  0.5928,  ...,  0.6768,  0.4995,  0.7227],
        [ 0.5007,  0.6119,  0.3793,  ...,  0.5294,  0.2709,  0.4388],
        [ 0.5755,  0.8221,  0.4134,  ...,  0.6051,  0.3876,  0.5441]], device='cuda:0')
loss: 168.2433624267578
var: tensor([[ 0.4865,  0.4922,  0.2264

loss: 162.8747100830078
var: tensor([[ 0.6929,  0.5402,  0.3805,  ...,  0.5352,  0.3084,  0.4229],
        [ 0.4195,  0.3908,  0.3222,  ...,  0.3843,  0.2269,  0.3525],
        [ 0.3980,  0.3594,  0.2181,  ...,  0.4218,  0.2611,  0.3118],
        ...,
        [ 0.3821,  0.3708,  0.3444,  ...,  0.4423,  0.4970,  0.4411],
        [ 0.3735,  0.3596,  0.2971,  ...,  0.3125,  0.2668,  0.3833],
        [ 0.5691,  0.4810,  0.4142,  ...,  0.4822,  0.4647,  0.5255]], device='cuda:0')
loss: 164.44338989257812
var: tensor([[ 0.4486,  0.3704,  0.2741,  ...,  0.3662,  0.3456,  0.4095],
        [ 0.5208,  0.5995,  0.4663,  ...,  0.5527,  0.4379,  0.5374],
        [ 0.3254,  0.3273,  0.2213,  ...,  0.3094,  0.1500,  0.2044],
        ...,
        [ 0.3931,  0.4270,  0.2633,  ...,  0.3945,  0.1749,  0.2272],
        [ 0.6132,  0.5693,  0.4371,  ...,  0.6348,  0.3460,  0.5476],
        [ 0.2665,  0.2204,  0.1155,  ...,  0.2616,  0.1681,  0.1505]], device='cuda:0')
loss: 160.41531372070312
var: tensor([[

var: tensor([[ 0.5344,  0.5445,  0.4658,  ...,  0.5866,  0.4523,  0.5670],
        [ 0.4362,  0.5012,  0.3520,  ...,  0.5571,  0.3247,  0.4522],
        [ 0.2874,  0.2593,  0.2702,  ...,  0.3738,  0.2886,  0.3268],
        ...,
        [ 0.5959,  0.6123,  0.4978,  ...,  0.6849,  0.4104,  0.4791],
        [ 0.2871,  0.2724,  0.2514,  ...,  0.3747,  0.2865,  0.3372],
        [ 0.4829,  0.4602,  0.3044,  ...,  0.5477,  0.3646,  0.4496]], device='cuda:0')
loss: 158.7930450439453
var: tensor([[ 0.2829,  0.2994,  0.2038,  ...,  0.4525,  0.1822,  0.2988],
        [ 0.2421,  0.1919,  0.1353,  ...,  0.2911,  0.1436,  0.2095],
        [ 0.4352,  0.3549,  0.2470,  ...,  0.5828,  0.3063,  0.3462],
        ...,
        [ 0.5336,  0.5553,  0.4276,  ...,  0.6262,  0.3940,  0.4474],
        [ 0.3884,  0.2989,  0.2093,  ...,  0.4039,  0.2336,  0.2728],
        [ 0.2642,  0.2354,  0.2288,  ...,  0.3536,  0.2076,  0.2801]], device='cuda:0')
loss: 156.0472412109375
var: tensor([[ 0.3714,  0.3800,  0.2850,

var: tensor([[ 0.3218,  0.3934,  0.2565,  ...,  0.5298,  0.3167,  0.4560],
        [ 0.4005,  0.3106,  0.2349,  ...,  0.4576,  0.3066,  0.3458],
        [ 0.3912,  0.3761,  0.3256,  ...,  0.6470,  0.4073,  0.4468],
        ...,
        [ 0.3617,  0.2542,  0.1819,  ...,  0.4321,  0.2365,  0.3131],
        [ 0.3763,  0.3246,  0.2041,  ...,  0.5384,  0.2885,  0.2939],
        [ 0.5563,  0.5180,  0.3398,  ...,  0.6950,  0.4049,  0.4181]], device='cuda:0')
loss: 152.64608764648438
var: tensor([[ 0.2402,  0.3184,  0.2021,  ...,  0.4797,  0.2723,  0.3313],
        [ 0.3240,  0.3098,  0.2762,  ...,  0.5679,  0.3808,  0.3839],
        [ 0.2877,  0.4097,  0.2628,  ...,  0.5660,  0.2832,  0.3200],
        ...,
        [ 0.2677,  0.1885,  0.1940,  ...,  0.3935,  0.2250,  0.2344],
        [ 0.3070,  0.4105,  0.2515,  ...,  0.5036,  0.3550,  0.4560],
        [ 0.5905,  0.4893,  0.4328,  ...,  0.6837,  0.4686,  0.4782]], device='cuda:0')
loss: 151.07965087890625
var: tensor([[ 0.2702,  0.2925,  0.166

loss: 146.11549377441406
var: tensor([[ 0.1500,  0.1560,  0.1344,  ...,  0.4261,  0.1618,  0.2454],
        [ 0.2862,  0.4685,  0.2510,  ...,  0.6659,  0.4068,  0.4711],
        [ 0.3571,  0.2661,  0.1917,  ...,  0.6428,  0.2404,  0.3407],
        ...,
        [ 0.2247,  0.3737,  0.2097,  ...,  0.5420,  0.3268,  0.3878],
        [ 0.3502,  0.2237,  0.1646,  ...,  0.4977,  0.1618,  0.3015],
        [ 0.3222,  0.2208,  0.1719,  ...,  0.4960,  0.3615,  0.3290]], device='cuda:0')
loss: 150.77090454101562
var: tensor([[ 0.1819,  0.1314,  0.1037,  ...,  0.3097,  0.1430,  0.1902],
        [ 0.2915,  0.4053,  0.2211,  ...,  0.5842,  0.2674,  0.4700],
        [ 0.2668,  0.2176,  0.1543,  ...,  0.6004,  0.2259,  0.3231],
        ...,
        [ 0.2023,  0.1953,  0.1041,  ...,  0.2886,  0.1567,  0.2101],
        [ 0.3887,  0.3354,  0.2658,  ...,  0.6613,  0.3132,  0.4335],
        [ 0.3373,  0.3412,  0.3085,  ...,  0.6020,  0.3651,  0.4521]], device='cuda:0')
loss: 145.27828979492188
var: tensor([

var: tensor([[ 0.2648,  0.1790,  0.2499,  ...,  0.3427,  0.3118,  0.2703],
        [ 0.3295,  0.3726,  0.2079,  ...,  0.4420,  0.2734,  0.2890],
        [ 0.1699,  0.1061,  0.1195,  ...,  0.2603,  0.2298,  0.1881],
        ...,
        [ 0.2467,  0.1993,  0.1911,  ...,  0.3669,  0.2414,  0.2757],
        [ 0.3537,  0.4019,  0.3508,  ...,  0.5038,  0.4239,  0.3499],
        [ 0.3832,  0.4506,  0.3181,  ...,  0.4489,  0.3781,  0.3363]], device='cuda:0')
loss: 143.3829345703125
var: tensor([[ 0.1583,  0.2082,  0.1824,  ...,  0.3713,  0.2381,  0.1775],
        [ 0.2025,  0.1835,  0.1111,  ...,  0.2518,  0.1920,  0.1788],
        [ 0.2530,  0.1836,  0.1869,  ...,  0.4598,  0.3336,  0.3518],
        ...,
        [ 0.1601,  0.0975,  0.1380,  ...,  0.2934,  0.2284,  0.1916],
        [ 0.1181,  0.1042,  0.1590,  ...,  0.2865,  0.2250,  0.1836],
        [ 0.1565,  0.1648,  0.1798,  ...,  0.3370,  0.2845,  0.2211]], device='cuda:0')
loss: 141.4600372314453
var: tensor([[ 0.1970,  0.1546,  0.1442,

var: tensor([[ 0.2073,  0.1376,  0.1082,  ...,  0.2327,  0.1782,  0.1854],
        [ 0.1125,  0.0989,  0.0593,  ...,  0.1510,  0.1096,  0.1291],
        [ 0.1867,  0.1548,  0.1481,  ...,  0.3028,  0.2414,  0.2335],
        ...,
        [ 0.2162,  0.2049,  0.1286,  ...,  0.3560,  0.3167,  0.3171],
        [ 0.4597,  0.4478,  0.3253,  ...,  0.5599,  0.4531,  0.5091],
        [ 0.2154,  0.1984,  0.1351,  ...,  0.3199,  0.2141,  0.2286]], device='cuda:0')
loss: 142.81106567382812
var: tensor([[ 0.1718,  0.1769,  0.1353,  ...,  0.3244,  0.2133,  0.1803],
        [ 0.2422,  0.3469,  0.2316,  ...,  0.4772,  0.3924,  0.3342],
        [ 0.1463,  0.2180,  0.1274,  ...,  0.2900,  0.2414,  0.1855],
        ...,
        [ 0.2323,  0.3093,  0.1566,  ...,  0.3705,  0.2587,  0.2548],
        [ 0.1389,  0.1273,  0.0984,  ...,  0.2525,  0.1507,  0.1556],
        [ 0.2239,  0.2356,  0.1962,  ...,  0.3475,  0.2597,  0.2065]], device='cuda:0')
loss: 144.26031494140625
var: tensor([[ 0.2953,  0.3354,  0.183

var: tensor([[ 0.3611,  0.3315,  0.2786,  ...,  0.4684,  0.3078,  0.3003],
        [ 0.3254,  0.2752,  0.2334,  ...,  0.4879,  0.3241,  0.3871],
        [ 0.2189,  0.1980,  0.1816,  ...,  0.3177,  0.2129,  0.2766],
        ...,
        [ 0.3592,  0.3871,  0.2975,  ...,  0.4667,  0.3701,  0.3404],
        [ 0.1739,  0.2002,  0.1890,  ...,  0.3072,  0.1994,  0.2006],
        [ 0.1204,  0.1294,  0.1005,  ...,  0.2317,  0.1559,  0.1629]], device='cuda:0')
loss: 139.35568237304688
var: tensor([[ 0.2402,  0.2338,  0.1729,  ...,  0.3590,  0.3405,  0.3779],
        [ 0.2177,  0.2626,  0.1647,  ...,  0.3977,  0.1888,  0.2346],
        [ 0.1491,  0.1687,  0.1791,  ...,  0.2404,  0.1759,  0.1477],
        ...,
        [ 0.1751,  0.1488,  0.1429,  ...,  0.3498,  0.1759,  0.2132],
        [ 0.1963,  0.2267,  0.1352,  ...,  0.3102,  0.1772,  0.1990],
        [ 0.1589,  0.1886,  0.1175,  ...,  0.3030,  0.2010,  0.2197]], device='cuda:0')
loss: 138.56924438476562
var: tensor([[ 0.2902,  0.4377,  0.292

var: tensor([[ 0.0799,  0.0551,  0.0355,  ...,  0.1169,  0.0686,  0.1016],
        [ 0.2927,  0.2678,  0.1666,  ...,  0.3718,  0.2930,  0.3089],
        [ 0.1782,  0.1793,  0.1025,  ...,  0.2274,  0.1620,  0.1377],
        ...,
        [ 0.1192,  0.1334,  0.0771,  ...,  0.2028,  0.1645,  0.1443],
        [ 0.1996,  0.1799,  0.0862,  ...,  0.2918,  0.1668,  0.1680],
        [ 0.1225,  0.1411,  0.1224,  ...,  0.1930,  0.1699,  0.1723]], device='cuda:0')
loss: 134.13189697265625
var: tensor([[ 0.2592,  0.1785,  0.1505,  ...,  0.3257,  0.2759,  0.2651],
        [ 0.2065,  0.1238,  0.1351,  ...,  0.2569,  0.2071,  0.1477],
        [ 0.1152,  0.1558,  0.0740,  ...,  0.2100,  0.1687,  0.1924],
        ...,
        [ 0.2685,  0.2353,  0.1694,  ...,  0.3522,  0.2769,  0.2412],
        [ 0.1142,  0.1446,  0.1305,  ...,  0.2183,  0.1783,  0.1529],
        [ 0.2325,  0.2213,  0.2005,  ...,  0.3179,  0.3254,  0.2806]], device='cuda:0')
loss: 139.4166259765625
var: tensor([[ 0.2546,  0.3049,  0.1994

var: tensor([[ 0.1043,  0.0640,  0.0593,  ...,  0.1926,  0.0903,  0.0845],
        [ 0.0615,  0.0402,  0.0590,  ...,  0.1213,  0.0561,  0.0639],
        [ 0.1085,  0.1249,  0.1484,  ...,  0.2227,  0.1690,  0.1476],
        ...,
        [ 0.1122,  0.0764,  0.0887,  ...,  0.1565,  0.1055,  0.0885],
        [ 0.1149,  0.0892,  0.1044,  ...,  0.2036,  0.1382,  0.0973],
        [ 0.1301,  0.1085,  0.1450,  ...,  0.2007,  0.1390,  0.0968]], device='cuda:0')
loss: 133.88613891601562
var: tensor([[ 0.2061,  0.1488,  0.1370,  ...,  0.3195,  0.1660,  0.1459],
        [ 0.3178,  0.2259,  0.1815,  ...,  0.3450,  0.2343,  0.2040],
        [ 0.2197,  0.1496,  0.1361,  ...,  0.3088,  0.1672,  0.1497],
        ...,
        [ 0.1415,  0.1179,  0.1129,  ...,  0.2468,  0.1935,  0.2231],
        [ 0.2809,  0.2784,  0.2307,  ...,  0.4454,  0.3005,  0.3268],
        [ 0.1136,  0.1117,  0.1360,  ...,  0.2228,  0.1552,  0.1554]], device='cuda:0')
loss: 132.0762939453125
var: tensor([[ 0.2799,  0.1594,  0.1442

var: tensor([[ 0.1973,  0.2709,  0.1850,  ...,  0.2869,  0.2129,  0.1873],
        [ 0.3118,  0.2974,  0.2254,  ...,  0.4224,  0.3565,  0.3341],
        [ 0.1802,  0.1686,  0.1181,  ...,  0.2186,  0.1979,  0.1478],
        ...,
        [ 0.2123,  0.1611,  0.0987,  ...,  0.2371,  0.1900,  0.1360],
        [ 0.1832,  0.1413,  0.1048,  ...,  0.1959,  0.1829,  0.1510],
        [ 0.0507,  0.0519,  0.0397,  ...,  0.0932,  0.0952,  0.0670]], device='cuda:0')
loss: 128.00001525878906
var: tensor([[ 0.2669,  0.2276,  0.1857,  ...,  0.2801,  0.2408,  0.1785],
        [ 0.0704,  0.0866,  0.0609,  ...,  0.0977,  0.1148,  0.0903],
        [ 0.2109,  0.1521,  0.1181,  ...,  0.2032,  0.1742,  0.1255],
        ...,
        [ 0.1087,  0.1300,  0.0923,  ...,  0.1963,  0.1979,  0.1470],
        [ 0.1811,  0.2128,  0.1731,  ...,  0.2787,  0.2127,  0.1958],
        [ 0.1634,  0.2250,  0.1173,  ...,  0.1911,  0.1708,  0.1458]], device='cuda:0')
loss: 133.46530151367188
var: tensor([[ 0.1938,  0.2021,  0.111

loss: 130.6473388671875
var: tensor([[ 0.1538,  0.1896,  0.1522,  ...,  0.2213,  0.2080,  0.1322],
        [ 0.2358,  0.2815,  0.1763,  ...,  0.2707,  0.2742,  0.2850],
        [ 0.2136,  0.1677,  0.1279,  ...,  0.1881,  0.1646,  0.1429],
        ...,
        [ 0.1471,  0.1314,  0.1120,  ...,  0.1595,  0.1454,  0.0948],
        [ 0.1842,  0.2903,  0.1690,  ...,  0.2362,  0.2454,  0.2267],
        [ 0.1027,  0.1178,  0.1058,  ...,  0.1523,  0.1323,  0.1277]], device='cuda:0')
loss: 129.21214294433594
var: tensor([[ 0.1040,  0.0827,  0.0524,  ...,  0.1054,  0.0883,  0.0630],
        [ 0.1922,  0.3081,  0.2223,  ...,  0.2976,  0.2996,  0.2252],
        [ 0.1621,  0.1740,  0.1056,  ...,  0.2279,  0.2047,  0.1552],
        ...,
        [ 0.1209,  0.1914,  0.1403,  ...,  0.1688,  0.1843,  0.1502],
        [ 0.1409,  0.1103,  0.0856,  ...,  0.1273,  0.1039,  0.1340],
        [ 0.0788,  0.0649,  0.0408,  ...,  0.0877,  0.0691,  0.0617]], device='cuda:0')
loss: 131.5867156982422
var: tensor([[ 

====> Test set loss: 119.9020
var: tensor([[ 0.0798,  0.2270,  0.1105,  ...,  0.1579,  0.1228,  0.1097],
        [ 0.1621,  0.2173,  0.0993,  ...,  0.2211,  0.1614,  0.1401],
        [ 0.1639,  0.1871,  0.1128,  ...,  0.2313,  0.1497,  0.1767],
        ...,
        [ 0.1329,  0.1161,  0.0626,  ...,  0.1573,  0.0969,  0.0805],
        [ 0.1394,  0.0950,  0.0578,  ...,  0.1537,  0.0860,  0.0879],
        [ 0.1530,  0.1223,  0.0614,  ...,  0.1142,  0.0789,  0.0828]], device='cuda:0')
loss: 126.50235748291016
var: tensor([[ 0.3606,  0.3281,  0.2102,  ...,  0.3160,  0.2264,  0.2401],
        [ 0.1459,  0.2338,  0.1181,  ...,  0.1733,  0.1490,  0.1190],
        [ 0.1100,  0.0894,  0.0486,  ...,  0.1107,  0.0716,  0.0727],
        ...,
        [ 0.1205,  0.0950,  0.0556,  ...,  0.1466,  0.0815,  0.0853],
        [ 0.1155,  0.1312,  0.0823,  ...,  0.1561,  0.1008,  0.0962],
        [ 0.0998,  0.1525,  0.0644,  ...,  0.1782,  0.1299,  0.1260]], device='cuda:0')
loss: 127.91333770751953
var: ten

var: tensor([[ 0.1158,  0.1226,  0.0980,  ...,  0.1398,  0.1095,  0.0893],
        [ 0.1584,  0.1001,  0.0961,  ...,  0.1304,  0.1275,  0.1241],
        [ 0.1110,  0.0771,  0.0652,  ...,  0.1276,  0.0721,  0.1060],
        ...,
        [ 0.1231,  0.1273,  0.1358,  ...,  0.1411,  0.1143,  0.1186],
        [ 0.1017,  0.1205,  0.0976,  ...,  0.1293,  0.1408,  0.1048],
        [ 0.1299,  0.1421,  0.1135,  ...,  0.1971,  0.1401,  0.1267]], device='cuda:0')
loss: 131.67727661132812
var: tensor([[ 0.1662,  0.2056,  0.1231,  ...,  0.1774,  0.1283,  0.1319],
        [ 0.0377,  0.0340,  0.0397,  ...,  0.0471,  0.0434,  0.0477],
        [ 0.2706,  0.1991,  0.1563,  ...,  0.2316,  0.1862,  0.1755],
        ...,
        [ 0.1031,  0.0828,  0.0834,  ...,  0.1209,  0.1034,  0.1193],
        [ 0.1044,  0.0877,  0.0705,  ...,  0.0963,  0.0677,  0.0890],
        [ 0.0940,  0.0891,  0.0717,  ...,  0.1310,  0.0959,  0.1121]], device='cuda:0')
loss: 124.4809799194336
var: tensor([[ 0.0652,  0.0777,  0.0568

var: tensor([[ 0.1884,  0.1294,  0.0940,  ...,  0.2254,  0.1630,  0.1302],
        [ 0.0783,  0.0704,  0.0586,  ...,  0.1125,  0.1006,  0.0970],
        [ 0.1562,  0.0918,  0.0835,  ...,  0.1283,  0.1438,  0.1026],
        ...,
        [ 0.1310,  0.0921,  0.0717,  ...,  0.1484,  0.1227,  0.1397],
        [ 0.0904,  0.0725,  0.0544,  ...,  0.1107,  0.0792,  0.1176],
        [ 0.1146,  0.1043,  0.0968,  ...,  0.1336,  0.1015,  0.1140]], device='cuda:0')
loss: 128.39491271972656
var: tensor([[ 0.1666,  0.1394,  0.0824,  ...,  0.1531,  0.1301,  0.1370],
        [ 0.2266,  0.1863,  0.1165,  ...,  0.1905,  0.1600,  0.1606],
        [ 0.2934,  0.2207,  0.1552,  ...,  0.2704,  0.1832,  0.1883],
        ...,
        [ 0.0961,  0.0832,  0.0588,  ...,  0.1419,  0.0892,  0.1116],
        [ 0.0745,  0.1028,  0.1021,  ...,  0.1343,  0.1430,  0.1282],
        [ 0.1264,  0.1271,  0.0765,  ...,  0.1415,  0.1431,  0.1183]], device='cuda:0')
loss: 123.57833862304688
var: tensor([[ 0.1113,  0.1294,  0.130

var: tensor([[ 0.1159,  0.1914,  0.0993,  ...,  0.2116,  0.1538,  0.1558],
        [ 0.1721,  0.1633,  0.0977,  ...,  0.2044,  0.1337,  0.1909],
        [ 0.1544,  0.1592,  0.1039,  ...,  0.1829,  0.1681,  0.1563],
        ...,
        [ 0.1146,  0.1410,  0.0613,  ...,  0.1968,  0.1214,  0.1039],
        [ 0.0598,  0.0947,  0.0686,  ...,  0.1384,  0.1080,  0.0965],
        [ 0.1077,  0.1269,  0.0827,  ...,  0.1771,  0.1331,  0.1547]], device='cuda:0')
loss: 129.33180236816406
var: tensor([[ 0.0873,  0.1148,  0.1010,  ...,  0.1559,  0.1159,  0.1222],
        [ 0.1448,  0.1712,  0.0968,  ...,  0.2184,  0.2198,  0.2050],
        [ 0.0415,  0.0526,  0.0250,  ...,  0.0779,  0.0636,  0.0858],
        ...,
        [ 0.0962,  0.1047,  0.0833,  ...,  0.1589,  0.1170,  0.1252],
        [ 0.1722,  0.1690,  0.0958,  ...,  0.2841,  0.1482,  0.1651],
        [ 0.0814,  0.1408,  0.1286,  ...,  0.1703,  0.1333,  0.1405]], device='cuda:0')
loss: 125.19691467285156
var: tensor([[ 0.1285,  0.2327,  0.144

var: tensor([[ 0.0462,  0.0465,  0.0534,  ...,  0.1022,  0.0720,  0.0844],
        [ 0.2354,  0.2781,  0.1807,  ...,  0.2349,  0.2373,  0.2360],
        [ 0.0750,  0.1182,  0.0868,  ...,  0.1240,  0.1004,  0.0874],
        ...,
        [ 0.0552,  0.0825,  0.0847,  ...,  0.1349,  0.1430,  0.0981],
        [ 0.1078,  0.1074,  0.0749,  ...,  0.1681,  0.1504,  0.1185],
        [ 0.0624,  0.0912,  0.0615,  ...,  0.1395,  0.1330,  0.1009]], device='cuda:0')
loss: 124.41822814941406
var: tensor([[ 0.1323,  0.0730,  0.0573,  ...,  0.1370,  0.1012,  0.0823],
        [ 0.1490,  0.2234,  0.1642,  ...,  0.2440,  0.2332,  0.1879],
        [ 0.1253,  0.1191,  0.0894,  ...,  0.2075,  0.1512,  0.1525],
        ...,
        [ 0.1129,  0.1010,  0.0672,  ...,  0.1608,  0.1316,  0.1021],
        [ 0.1674,  0.1335,  0.0768,  ...,  0.2337,  0.1994,  0.1294],
        [ 0.1531,  0.2089,  0.1673,  ...,  0.2488,  0.2431,  0.1921]], device='cuda:0')
loss: 129.78041076660156
var: tensor([[ 0.2861,  0.2221,  0.148

var: tensor([[ 0.0843,  0.0722,  0.0448,  ...,  0.0747,  0.0893,  0.1071],
        [ 0.1650,  0.1828,  0.1157,  ...,  0.2239,  0.1630,  0.1414],
        [ 0.1221,  0.0965,  0.0728,  ...,  0.1844,  0.1176,  0.1311],
        ...,
        [ 0.0946,  0.1359,  0.1510,  ...,  0.1310,  0.1383,  0.1176],
        [ 0.0942,  0.1297,  0.0758,  ...,  0.1327,  0.1178,  0.1243],
        [ 0.1232,  0.0941,  0.0628,  ...,  0.1206,  0.0870,  0.0953]], device='cuda:0')
loss: 122.64205932617188
var: tensor([[ 0.1611,  0.1115,  0.0850,  ...,  0.1424,  0.1255,  0.1310],
        [ 0.1245,  0.1154,  0.0706,  ...,  0.1660,  0.1155,  0.0989],
        [ 0.1400,  0.1325,  0.0899,  ...,  0.2010,  0.1396,  0.1228],
        ...,
        [ 0.0595,  0.0753,  0.0648,  ...,  0.0769,  0.0537,  0.0734],
        [ 0.1347,  0.1364,  0.0879,  ...,  0.1431,  0.1137,  0.0898],
        [ 0.1035,  0.0940,  0.0498,  ...,  0.1052,  0.0795,  0.0662]], device='cuda:0')
loss: 123.64157104492188
var: tensor([[ 0.1080,  0.0865,  0.062

var: tensor([[ 0.0655,  0.0801,  0.0520,  ...,  0.0829,  0.0760,  0.1030],
        [ 0.1171,  0.1360,  0.0615,  ...,  0.1171,  0.0917,  0.1009],
        [ 0.1457,  0.2432,  0.1576,  ...,  0.2133,  0.2004,  0.1734],
        ...,
        [ 0.0638,  0.1277,  0.0698,  ...,  0.1277,  0.1056,  0.1242],
        [ 0.0917,  0.1488,  0.0791,  ...,  0.1580,  0.1032,  0.1382],
        [ 0.1881,  0.1398,  0.0995,  ...,  0.2043,  0.1388,  0.1452]], device='cuda:0')
loss: 124.72734832763672
var: tensor([[ 0.1226,  0.1181,  0.0701,  ...,  0.1392,  0.1002,  0.1208],
        [ 0.1422,  0.1844,  0.1211,  ...,  0.3120,  0.1652,  0.2340],
        [ 0.1354,  0.1244,  0.0721,  ...,  0.1971,  0.1146,  0.1360],
        ...,
        [ 0.0974,  0.2625,  0.1611,  ...,  0.2005,  0.1770,  0.1789],
        [ 0.1201,  0.1119,  0.0760,  ...,  0.1409,  0.0999,  0.1277],
        [ 0.1486,  0.3012,  0.1848,  ...,  0.2813,  0.2128,  0.2223]], device='cuda:0')
loss: 123.73063659667969
var: tensor([[ 0.0706,  0.1016,  0.061

var: tensor([[ 0.0901,  0.1261,  0.0756,  ...,  0.1216,  0.0885,  0.1165],
        [ 0.1096,  0.1066,  0.0602,  ...,  0.1100,  0.0659,  0.1196],
        [ 0.0809,  0.0960,  0.0778,  ...,  0.1028,  0.0860,  0.1433],
        ...,
        [ 0.1237,  0.1452,  0.1015,  ...,  0.2003,  0.1344,  0.1808],
        [ 0.1773,  0.1622,  0.1279,  ...,  0.2104,  0.1599,  0.1866],
        [ 0.1405,  0.1793,  0.1270,  ...,  0.2231,  0.1514,  0.1699]], device='cuda:0')
loss: 128.55007934570312
var: tensor([[ 0.1063,  0.1785,  0.1043,  ...,  0.1641,  0.1135,  0.1486],
        [ 0.0922,  0.0925,  0.1040,  ...,  0.1572,  0.1070,  0.1522],
        [ 0.0998,  0.1051,  0.0715,  ...,  0.1060,  0.0953,  0.0902],
        ...,
        [ 0.0444,  0.0534,  0.0498,  ...,  0.0653,  0.0761,  0.0719],
        [ 0.1459,  0.2228,  0.1531,  ...,  0.1672,  0.1739,  0.1465],
        [ 0.1272,  0.1155,  0.0840,  ...,  0.1232,  0.0781,  0.1122]], device='cuda:0')
loss: 125.09326171875
var: tensor([[ 0.0618,  0.0964,  0.0971, 

var: tensor([[ 0.2282,  0.2346,  0.1238,  ...,  0.2244,  0.1862,  0.2096],
        [ 0.0516,  0.0770,  0.0535,  ...,  0.1112,  0.1212,  0.1342],
        [ 0.0950,  0.1122,  0.0747,  ...,  0.1297,  0.1081,  0.1072],
        ...,
        [ 0.0534,  0.1177,  0.0604,  ...,  0.1089,  0.0817,  0.1027],
        [ 0.1195,  0.1168,  0.0880,  ...,  0.1473,  0.1362,  0.1309],
        [ 0.0730,  0.0758,  0.0639,  ...,  0.1120,  0.1036,  0.1782]], device='cuda:0')
loss: 118.50933837890625
var: tensor([[ 0.0838,  0.1449,  0.0994,  ...,  0.1251,  0.1190,  0.1248],
        [ 0.1006,  0.1087,  0.0642,  ...,  0.1718,  0.1017,  0.1217],
        [ 0.1238,  0.1628,  0.1256,  ...,  0.1770,  0.1558,  0.1536],
        ...,
        [ 0.0875,  0.1065,  0.0821,  ...,  0.1523,  0.1199,  0.1704],
        [ 0.1236,  0.1042,  0.0719,  ...,  0.1317,  0.1233,  0.1148],
        [ 0.2321,  0.2289,  0.1694,  ...,  0.2265,  0.1764,  0.2239]], device='cuda:0')
loss: 118.76591491699219
var: tensor([[ 0.0958,  0.1226,  0.102

var: tensor([[ 0.1421,  0.1210,  0.1007,  ...,  0.1461,  0.1421,  0.1365],
        [ 0.0915,  0.0871,  0.0655,  ...,  0.1382,  0.1103,  0.1045],
        [ 0.2309,  0.1826,  0.1244,  ...,  0.1897,  0.1554,  0.1556],
        ...,
        [ 0.1162,  0.0849,  0.0765,  ...,  0.1320,  0.1113,  0.1474],
        [ 0.1029,  0.0970,  0.0706,  ...,  0.1364,  0.1368,  0.1025],
        [ 0.1169,  0.1363,  0.0771,  ...,  0.1680,  0.1038,  0.1191]], device='cuda:0')
loss: 120.3469009399414
var: tensor([[ 0.0519,  0.0329,  0.0298,  ...,  0.0585,  0.0430,  0.0765],
        [ 0.1099,  0.0922,  0.0801,  ...,  0.1648,  0.0896,  0.1284],
        [ 0.1574,  0.1764,  0.1315,  ...,  0.2130,  0.1825,  0.1910],
        ...,
        [ 0.1276,  0.1310,  0.0985,  ...,  0.1379,  0.1314,  0.1113],
        [ 0.0660,  0.1006,  0.0776,  ...,  0.1360,  0.1091,  0.1201],
        [ 0.0749,  0.0830,  0.0876,  ...,  0.0994,  0.1187,  0.1276]], device='cuda:0')
loss: 123.831298828125
var: tensor([[ 0.0835,  0.0978,  0.0821, 

var: tensor([[ 0.1087,  0.1127,  0.0742,  ...,  0.1379,  0.1177,  0.0721],
        [ 0.1146,  0.1410,  0.1034,  ...,  0.1576,  0.1610,  0.1508],
        [ 0.0949,  0.0762,  0.0490,  ...,  0.0949,  0.0754,  0.0546],
        ...,
        [ 0.1612,  0.1567,  0.1166,  ...,  0.1653,  0.1435,  0.1380],
        [ 0.1309,  0.1183,  0.1014,  ...,  0.1804,  0.1434,  0.0999],
        [ 0.0751,  0.0747,  0.0727,  ...,  0.1206,  0.0890,  0.0967]], device='cuda:0')
loss: 117.98685455322266
var: tensor([[ 0.1478,  0.1060,  0.0912,  ...,  0.1817,  0.1081,  0.1097],
        [ 0.1544,  0.1736,  0.1195,  ...,  0.2077,  0.1715,  0.1156],
        [ 0.1231,  0.1212,  0.0746,  ...,  0.1582,  0.1080,  0.1092],
        ...,
        [ 0.1553,  0.1425,  0.1192,  ...,  0.1606,  0.1250,  0.1339],
        [ 0.0920,  0.1080,  0.0678,  ...,  0.1148,  0.0966,  0.0829],
        [ 0.0606,  0.0975,  0.0574,  ...,  0.1239,  0.0848,  0.0781]], device='cuda:0')
loss: 120.49422454833984
var: tensor([[ 0.0941,  0.1219,  0.064

var: tensor([[ 0.0891,  0.2262,  0.1307,  ...,  0.1826,  0.1677,  0.1448],
        [ 0.1519,  0.1167,  0.0877,  ...,  0.1429,  0.1012,  0.1817],
        [ 0.1332,  0.1351,  0.0924,  ...,  0.1662,  0.1288,  0.1121],
        ...,
        [ 0.1524,  0.1468,  0.0894,  ...,  0.1756,  0.1106,  0.1240],
        [ 0.0744,  0.0612,  0.0696,  ...,  0.0761,  0.0728,  0.0900],
        [ 0.0841,  0.1423,  0.0763,  ...,  0.1295,  0.1037,  0.1283]], device='cuda:0')
loss: 119.95726776123047
var: tensor([[ 0.0553,  0.0856,  0.0541,  ...,  0.1132,  0.0713,  0.0966],
        [ 0.1234,  0.2348,  0.1256,  ...,  0.1721,  0.1394,  0.1446],
        [ 0.1182,  0.0848,  0.0709,  ...,  0.1247,  0.0811,  0.0967],
        ...,
        [ 0.1665,  0.0796,  0.0736,  ...,  0.1244,  0.0764,  0.1009],
        [ 0.0978,  0.0804,  0.0793,  ...,  0.1463,  0.1040,  0.1323],
        [ 0.0759,  0.0715,  0.0682,  ...,  0.1284,  0.0765,  0.1105]], device='cuda:0')
loss: 120.98863220214844
var: tensor([[ 0.1276,  0.0769,  0.064

var: tensor([[ 0.0964,  0.0891,  0.0584,  ...,  0.0992,  0.0943,  0.0916],
        [ 0.1140,  0.1048,  0.0662,  ...,  0.1313,  0.1140,  0.0771],
        [ 0.0684,  0.0866,  0.0511,  ...,  0.0997,  0.0709,  0.0704],
        ...,
        [ 0.2292,  0.2070,  0.1150,  ...,  0.2142,  0.1598,  0.1695],
        [ 0.0587,  0.0630,  0.0578,  ...,  0.1093,  0.0952,  0.1072],
        [ 0.0561,  0.0470,  0.0514,  ...,  0.0597,  0.0624,  0.0913]], device='cuda:0')
loss: 121.15462493896484
var: tensor([[ 0.1721,  0.1679,  0.1148,  ...,  0.1784,  0.1558,  0.1153],
        [ 0.1510,  0.0792,  0.0726,  ...,  0.1146,  0.0922,  0.1117],
        [ 0.1073,  0.0968,  0.0789,  ...,  0.1342,  0.1416,  0.1064],
        ...,
        [ 0.1034,  0.0944,  0.0770,  ...,  0.1295,  0.1102,  0.1014],
        [ 0.0885,  0.1078,  0.0870,  ...,  0.1374,  0.1117,  0.0895],
        [ 0.0904,  0.0601,  0.0584,  ...,  0.1332,  0.1289,  0.0926]], device='cuda:0')
loss: 121.53187561035156
var: tensor([[ 0.0722,  0.0809,  0.053

var: tensor([[ 0.0632,  0.0948,  0.0778,  ...,  0.1051,  0.0997,  0.1033],
        [ 0.0515,  0.1036,  0.0966,  ...,  0.1001,  0.1059,  0.1030],
        [ 0.0599,  0.1022,  0.0691,  ...,  0.0871,  0.0843,  0.0877],
        ...,
        [ 0.0780,  0.0714,  0.0495,  ...,  0.0698,  0.0613,  0.0884],
        [ 0.0945,  0.1184,  0.0842,  ...,  0.1510,  0.1197,  0.1592],
        [ 0.0605,  0.0799,  0.0609,  ...,  0.0740,  0.0796,  0.0781]], device='cuda:0')
loss: 119.46731567382812
var: tensor([[ 0.0874,  0.1030,  0.0704,  ...,  0.0984,  0.0990,  0.0803],
        [ 0.0988,  0.1002,  0.0807,  ...,  0.1253,  0.1301,  0.1353],
        [ 0.1959,  0.2175,  0.1092,  ...,  0.1829,  0.1568,  0.1547],
        ...,
        [ 0.1644,  0.1057,  0.0922,  ...,  0.1208,  0.0992,  0.1504],
        [ 0.0731,  0.1787,  0.1279,  ...,  0.1196,  0.1266,  0.1357],
        [ 0.0885,  0.0925,  0.0774,  ...,  0.0944,  0.0849,  0.0985]], device='cuda:0')
loss: 115.8714599609375
var: tensor([[ 0.0379,  0.0438,  0.0332

var: tensor([[ 0.1247,  0.1093,  0.0762,  ...,  0.1283,  0.0984,  0.1008],
        [ 0.1428,  0.1212,  0.0876,  ...,  0.1922,  0.1243,  0.1167],
        [ 0.2104,  0.1981,  0.1306,  ...,  0.2037,  0.1635,  0.1796],
        ...,
        [ 0.0996,  0.0946,  0.0606,  ...,  0.0969,  0.0862,  0.1079],
        [ 0.1532,  0.1670,  0.1105,  ...,  0.1792,  0.1462,  0.1560],
        [ 0.1019,  0.1192,  0.0795,  ...,  0.1362,  0.1333,  0.1637]], device='cuda:0')
loss: 123.18246459960938
var: tensor([[ 0.1135,  0.1037,  0.0879,  ...,  0.1636,  0.0937,  0.1234],
        [ 0.0860,  0.0760,  0.0588,  ...,  0.1561,  0.1107,  0.0807],
        [ 0.0838,  0.1172,  0.1139,  ...,  0.1302,  0.1168,  0.0902],
        ...,
        [ 0.1485,  0.1557,  0.1104,  ...,  0.1939,  0.1486,  0.1649],
        [ 0.0580,  0.0826,  0.0785,  ...,  0.1303,  0.1094,  0.0950],
        [ 0.1830,  0.1343,  0.1083,  ...,  0.1636,  0.1193,  0.1398]], device='cuda:0')
loss: 115.44300842285156
var: tensor([[ 0.0774,  0.1231,  0.105

var: tensor([[ 0.0985,  0.0748,  0.0441,  ...,  0.1007,  0.0816,  0.0901],
        [ 0.1576,  0.2195,  0.0961,  ...,  0.1541,  0.1367,  0.1533],
        [ 0.0818,  0.0888,  0.0699,  ...,  0.1172,  0.1151,  0.1095],
        ...,
        [ 0.0784,  0.1073,  0.0427,  ...,  0.0956,  0.0697,  0.0994],
        [ 0.0620,  0.0684,  0.0530,  ...,  0.0871,  0.0781,  0.0753],
        [ 0.1893,  0.1818,  0.1010,  ...,  0.1789,  0.1512,  0.1282]], device='cuda:0')
loss: 121.62622833251953
var: tensor([[ 0.0891,  0.0959,  0.0488,  ...,  0.1114,  0.0661,  0.0797],
        [ 0.0707,  0.1077,  0.0593,  ...,  0.1649,  0.1173,  0.1082],
        [ 0.1193,  0.1460,  0.0850,  ...,  0.1767,  0.1426,  0.0885],
        ...,
        [ 0.0681,  0.1089,  0.0745,  ...,  0.1279,  0.1323,  0.1050],
        [ 0.1057,  0.1124,  0.0833,  ...,  0.1078,  0.1184,  0.0817],
        [ 0.0623,  0.0886,  0.0427,  ...,  0.1149,  0.0701,  0.0739]], device='cuda:0')
loss: 117.66133880615234
var: tensor([[ 0.0939,  0.0848,  0.055

var: tensor([[ 0.0966,  0.1286,  0.0688,  ...,  0.1051,  0.1054,  0.1491],
        [ 0.0740,  0.0817,  0.0373,  ...,  0.0830,  0.0555,  0.0870],
        [ 0.0809,  0.2632,  0.1301,  ...,  0.1699,  0.1546,  0.1636],
        ...,
        [ 0.0832,  0.1068,  0.0584,  ...,  0.1005,  0.0954,  0.1038],
        [ 0.1500,  0.1638,  0.0919,  ...,  0.2131,  0.1722,  0.1277],
        [ 0.1176,  0.1133,  0.0701,  ...,  0.1637,  0.0983,  0.1121]], device='cuda:0')
loss: 115.8741226196289
var: tensor([[ 0.1787,  0.2487,  0.1048,  ...,  0.1689,  0.1439,  0.1431],
        [ 0.2434,  0.1995,  0.1084,  ...,  0.2209,  0.1604,  0.1696],
        [ 0.1659,  0.1394,  0.1007,  ...,  0.1428,  0.1120,  0.1501],
        ...,
        [ 0.1176,  0.0960,  0.0552,  ...,  0.1029,  0.0930,  0.0963],
        [ 0.0684,  0.1222,  0.0572,  ...,  0.0847,  0.0953,  0.1021],
        [ 0.1123,  0.1139,  0.0555,  ...,  0.1272,  0.0917,  0.0990]], device='cuda:0')
loss: 122.1640853881836
var: tensor([[ 0.1047,  0.0938,  0.0467,

var: tensor([[ 0.0886,  0.0755,  0.0678,  ...,  0.0882,  0.0828,  0.1134],
        [ 0.0685,  0.0958,  0.0652,  ...,  0.1004,  0.0997,  0.1110],
        [ 0.1588,  0.1230,  0.0934,  ...,  0.1613,  0.1204,  0.1420],
        ...,
        [ 0.0681,  0.0868,  0.0485,  ...,  0.0957,  0.0928,  0.0891],
        [ 0.0909,  0.1112,  0.0656,  ...,  0.0954,  0.1193,  0.1286],
        [ 0.1242,  0.1415,  0.0826,  ...,  0.1476,  0.1215,  0.1235]], device='cuda:0')
loss: 117.5843276977539
var: tensor([[ 0.0643,  0.0859,  0.0612,  ...,  0.0991,  0.1042,  0.1160],
        [ 0.0739,  0.0697,  0.0535,  ...,  0.0907,  0.0871,  0.0941],
        [ 0.1142,  0.1126,  0.0693,  ...,  0.1021,  0.0752,  0.1025],
        ...,
        [ 0.0497,  0.0568,  0.0445,  ...,  0.0780,  0.0615,  0.0823],
        [ 0.0570,  0.1127,  0.0620,  ...,  0.0951,  0.0790,  0.0789],
        [ 0.0569,  0.1015,  0.0636,  ...,  0.0799,  0.0715,  0.0879]], device='cuda:0')
loss: 116.12383270263672
var: tensor([[ 0.1399,  0.1158,  0.0644

====> Test set loss: 106.8811
var: tensor([[ 0.0903,  0.1201,  0.1041,  ...,  0.1548,  0.1008,  0.1257],
        [ 0.1000,  0.0757,  0.0695,  ...,  0.1235,  0.0774,  0.1096],
        [ 0.0893,  0.0849,  0.0932,  ...,  0.0976,  0.0858,  0.0874],
        ...,
        [ 0.0798,  0.1009,  0.0949,  ...,  0.1428,  0.1082,  0.1243],
        [ 0.0470,  0.0624,  0.0651,  ...,  0.0885,  0.0722,  0.0648],
        [ 0.0781,  0.1112,  0.1315,  ...,  0.0968,  0.1039,  0.0952]], device='cuda:0')
loss: 117.23515319824219
var: tensor([[ 0.0575,  0.0876,  0.0577,  ...,  0.0890,  0.0636,  0.0707],
        [ 0.1109,  0.0630,  0.0586,  ...,  0.0884,  0.0657,  0.0765],
        [ 0.0909,  0.1136,  0.1016,  ...,  0.0953,  0.0873,  0.0872],
        ...,
        [ 0.0615,  0.0642,  0.0527,  ...,  0.0918,  0.0809,  0.0859],
        [ 0.0873,  0.0920,  0.0862,  ...,  0.1187,  0.1188,  0.1098],
        [ 0.1350,  0.1161,  0.1213,  ...,  0.1139,  0.1209,  0.1066]], device='cuda:0')
loss: 118.35233306884766
var: ten

var: tensor([[ 0.0842,  0.0826,  0.0580,  ...,  0.1136,  0.0890,  0.0858],
        [ 0.0571,  0.0622,  0.0472,  ...,  0.0785,  0.0680,  0.0520],
        [ 0.0671,  0.0701,  0.0523,  ...,  0.1129,  0.0715,  0.0728],
        ...,
        [ 0.0704,  0.0954,  0.0698,  ...,  0.1155,  0.0905,  0.0694],
        [ 0.0918,  0.1047,  0.0766,  ...,  0.1152,  0.0903,  0.0930],
        [ 0.0600,  0.0611,  0.0518,  ...,  0.0822,  0.0640,  0.0868]], device='cuda:0')
loss: 114.30518341064453
var: tensor([[ 0.0723,  0.1071,  0.0781,  ...,  0.1513,  0.0948,  0.0926],
        [ 0.1250,  0.1298,  0.1057,  ...,  0.1460,  0.1256,  0.1242],
        [ 0.0973,  0.0924,  0.0779,  ...,  0.1216,  0.0935,  0.0883],
        ...,
        [ 0.0888,  0.0602,  0.0523,  ...,  0.1003,  0.0784,  0.0798],
        [ 0.1496,  0.1872,  0.1003,  ...,  0.1731,  0.1317,  0.1324],
        [ 0.0680,  0.1078,  0.0755,  ...,  0.1347,  0.0938,  0.0907]], device='cuda:0')
loss: 115.87199401855469
var: tensor([[ 0.0701,  0.1933,  0.144

var: tensor([[ 0.2309,  0.1522,  0.1137,  ...,  0.1731,  0.1426,  0.1448],
        [ 0.1224,  0.0987,  0.0545,  ...,  0.1275,  0.0932,  0.0722],
        [ 0.0642,  0.0723,  0.0640,  ...,  0.1039,  0.1172,  0.0928],
        ...,
        [ 0.0640,  0.0829,  0.0574,  ...,  0.1058,  0.0890,  0.0691],
        [ 0.1068,  0.0915,  0.0801,  ...,  0.1121,  0.1078,  0.0839],
        [ 0.0863,  0.0695,  0.0459,  ...,  0.1030,  0.0746,  0.0829]], device='cuda:0')
loss: 115.74210357666016
var: tensor([[ 0.0928,  0.2091,  0.1362,  ...,  0.1454,  0.1421,  0.1306],
        [ 0.0741,  0.0963,  0.0828,  ...,  0.0951,  0.1077,  0.0790],
        [ 0.1013,  0.0834,  0.0727,  ...,  0.0931,  0.0994,  0.0822],
        ...,
        [ 0.1373,  0.1042,  0.0655,  ...,  0.1369,  0.1274,  0.0755],
        [ 0.1060,  0.1277,  0.1097,  ...,  0.1347,  0.1451,  0.0977],
        [ 0.0960,  0.1054,  0.0752,  ...,  0.1242,  0.1391,  0.0879]], device='cuda:0')
loss: 118.4056396484375
var: tensor([[ 0.0867,  0.0997,  0.0766

var: tensor([[ 0.0876,  0.0800,  0.0573,  ...,  0.0918,  0.0883,  0.0749],
        [ 0.1107,  0.0626,  0.0474,  ...,  0.1122,  0.0660,  0.0908],
        [ 0.0647,  0.0613,  0.0422,  ...,  0.1078,  0.0682,  0.0690],
        ...,
        [ 0.0782,  0.1233,  0.0779,  ...,  0.1369,  0.0943,  0.0833],
        [ 0.0464,  0.0362,  0.0343,  ...,  0.0664,  0.0719,  0.0572],
        [ 0.0715,  0.0842,  0.0516,  ...,  0.1389,  0.0735,  0.0847]], device='cuda:0')
loss: 115.06472778320312
var: tensor([[ 0.0613,  0.0553,  0.0470,  ...,  0.0796,  0.0922,  0.0752],
        [ 0.0778,  0.0707,  0.0597,  ...,  0.0815,  0.0891,  0.1078],
        [ 0.1225,  0.0951,  0.0486,  ...,  0.1633,  0.1115,  0.1019],
        ...,
        [ 0.0852,  0.0457,  0.0374,  ...,  0.0757,  0.0709,  0.0582],
        [ 0.0569,  0.0579,  0.0370,  ...,  0.0974,  0.0782,  0.0880],
        [ 0.1283,  0.0951,  0.0607,  ...,  0.1520,  0.0976,  0.0730]], device='cuda:0')
loss: 116.9495849609375
var: tensor([[ 0.1110,  0.1349,  0.0846

loss: 114.95245361328125
var: tensor([[ 0.0312,  0.0341,  0.0337,  ...,  0.0564,  0.0344,  0.0813],
        [ 0.0830,  0.0916,  0.0585,  ...,  0.1058,  0.0810,  0.0945],
        [ 0.0549,  0.0642,  0.0539,  ...,  0.0960,  0.0570,  0.1015],
        ...,
        [ 0.0488,  0.0878,  0.0573,  ...,  0.0795,  0.0720,  0.0874],
        [ 0.0478,  0.0481,  0.0501,  ...,  0.0609,  0.0551,  0.0924],
        [ 0.0758,  0.0601,  0.0542,  ...,  0.0899,  0.0594,  0.1036]], device='cuda:0')
loss: 115.3641586303711
var: tensor([[ 0.0702,  0.0577,  0.0474,  ...,  0.0605,  0.0455,  0.0913],
        [ 0.0514,  0.0729,  0.0557,  ...,  0.0998,  0.0861,  0.0976],
        [ 0.0873,  0.1487,  0.0724,  ...,  0.1358,  0.0949,  0.1296],
        ...,
        [ 0.0341,  0.0364,  0.0429,  ...,  0.0631,  0.0499,  0.0930],
        [ 0.1059,  0.1033,  0.0591,  ...,  0.1397,  0.0939,  0.0905],
        [ 0.1538,  0.1697,  0.1195,  ...,  0.1803,  0.1158,  0.1471]], device='cuda:0')
loss: 110.31698608398438
var: tensor([[

var: tensor([[ 0.1422,  0.1463,  0.0880,  ...,  0.1462,  0.1209,  0.1330],
        [ 0.0580,  0.0690,  0.0410,  ...,  0.0934,  0.0557,  0.0801],
        [ 0.0985,  0.0908,  0.0971,  ...,  0.0970,  0.0837,  0.0917],
        ...,
        [ 0.0806,  0.0907,  0.0734,  ...,  0.1033,  0.0912,  0.0833],
        [ 0.0532,  0.0942,  0.0474,  ...,  0.0803,  0.0499,  0.0714],
        [ 0.0820,  0.1486,  0.0926,  ...,  0.1220,  0.0885,  0.1098]], device='cuda:0')
loss: 111.28326416015625
var: tensor([[ 0.0574,  0.0602,  0.0544,  ...,  0.0717,  0.0947,  0.0823],
        [ 0.1049,  0.1098,  0.0716,  ...,  0.1469,  0.0953,  0.1118],
        [ 0.1198,  0.1163,  0.0545,  ...,  0.1113,  0.0743,  0.0893],
        ...,
        [ 0.1170,  0.1103,  0.0526,  ...,  0.1324,  0.0960,  0.1028],
        [ 0.0755,  0.0802,  0.0641,  ...,  0.0991,  0.1072,  0.0803],
        [ 0.2468,  0.2132,  0.1145,  ...,  0.2229,  0.1663,  0.1769]], device='cuda:0')
loss: 117.03300476074219
var: tensor([[ 0.0739,  0.0972,  0.066

var: tensor([[ 0.0566,  0.0885,  0.0552,  ...,  0.0826,  0.0742,  0.0944],
        [ 0.0487,  0.0682,  0.0490,  ...,  0.0768,  0.0570,  0.0586],
        [ 0.1769,  0.1328,  0.1130,  ...,  0.1715,  0.1016,  0.1254],
        ...,
        [ 0.0438,  0.0664,  0.0784,  ...,  0.0844,  0.0684,  0.0549],
        [ 0.1192,  0.1298,  0.0788,  ...,  0.1522,  0.1352,  0.0774],
        [ 0.0944,  0.0711,  0.0566,  ...,  0.1086,  0.0794,  0.0745]], device='cuda:0')
loss: 115.74842071533203
var: tensor([[ 0.1239,  0.1123,  0.0727,  ...,  0.1336,  0.1106,  0.0966],
        [ 0.0779,  0.0860,  0.0614,  ...,  0.1114,  0.0868,  0.0585],
        [ 0.0741,  0.1111,  0.1070,  ...,  0.0966,  0.0956,  0.0870],
        ...,
        [ 0.0740,  0.1122,  0.0732,  ...,  0.1455,  0.0867,  0.1128],
        [ 0.1478,  0.0885,  0.0620,  ...,  0.1274,  0.0883,  0.0946],
        [ 0.0619,  0.0838,  0.0720,  ...,  0.0811,  0.0734,  0.0562]], device='cuda:0')
loss: 115.7939453125
var: tensor([[ 0.0940,  0.0784,  0.0548,  

var: tensor([[ 0.1075,  0.1028,  0.0589,  ...,  0.1171,  0.0876,  0.0941],
        [ 0.0442,  0.1040,  0.0547,  ...,  0.0814,  0.0741,  0.0795],
        [ 0.0709,  0.1171,  0.0614,  ...,  0.0985,  0.0793,  0.0925],
        ...,
        [ 0.0684,  0.1213,  0.0751,  ...,  0.1014,  0.1035,  0.0954],
        [ 0.0577,  0.0770,  0.0730,  ...,  0.0947,  0.0911,  0.0676],
        [ 0.0535,  0.0621,  0.0359,  ...,  0.0679,  0.0502,  0.0930]], device='cuda:0')
loss: 111.84814453125
var: tensor([[ 0.0424,  0.0659,  0.0328,  ...,  0.0879,  0.0876,  0.0811],
        [ 0.0740,  0.1691,  0.0923,  ...,  0.1392,  0.1091,  0.1194],
        [ 0.0715,  0.0700,  0.0528,  ...,  0.0946,  0.0846,  0.0817],
        ...,
        [ 0.0753,  0.2395,  0.1266,  ...,  0.1818,  0.1500,  0.1823],
        [ 0.0681,  0.0785,  0.0475,  ...,  0.0928,  0.0891,  0.0825],
        [ 0.1150,  0.1095,  0.0560,  ...,  0.0999,  0.0990,  0.0873]], device='cuda:0')
loss: 108.68892669677734
var: tensor([[ 0.0373,  0.0593,  0.0340, 

loss: 117.10725402832031
var: tensor([[ 0.0748,  0.0491,  0.0591,  ...,  0.0713,  0.0539,  0.0566],
        [ 0.1089,  0.0701,  0.0868,  ...,  0.1059,  0.0761,  0.0846],
        [ 0.0406,  0.0423,  0.0509,  ...,  0.0714,  0.0598,  0.0528],
        ...,
        [ 0.0702,  0.0654,  0.0616,  ...,  0.0835,  0.0542,  0.0699],
        [ 0.0732,  0.0649,  0.0722,  ...,  0.1030,  0.0584,  0.0832],
        [ 0.0581,  0.0543,  0.0570,  ...,  0.0730,  0.0535,  0.0739]], device='cuda:0')
loss: 116.57991790771484
var: tensor([[ 0.0816,  0.1079,  0.0846,  ...,  0.1331,  0.0903,  0.1232],
        [ 0.0959,  0.1819,  0.1338,  ...,  0.1710,  0.1125,  0.1538],
        [ 0.0345,  0.0429,  0.0582,  ...,  0.0534,  0.0604,  0.0565],
        ...,
        [ 0.0791,  0.0628,  0.0672,  ...,  0.1210,  0.1004,  0.0908],
        [ 0.0581,  0.0663,  0.0542,  ...,  0.0960,  0.0677,  0.1188],
        [ 0.0585,  0.0524,  0.0609,  ...,  0.0901,  0.0761,  0.0847]], device='cuda:0')
loss: 115.38731384277344
var: tensor([

var: tensor([[ 0.0856,  0.0810,  0.0598,  ...,  0.1148,  0.0888,  0.0823],
        [ 0.0710,  0.0478,  0.0455,  ...,  0.0886,  0.0525,  0.0671],
        [ 0.0755,  0.0783,  0.0708,  ...,  0.1254,  0.0927,  0.0874],
        ...,
        [ 0.0890,  0.0730,  0.0633,  ...,  0.1276,  0.0742,  0.0863],
        [ 0.0770,  0.0680,  0.0754,  ...,  0.1041,  0.0816,  0.0846],
        [ 0.0881,  0.1065,  0.0858,  ...,  0.0927,  0.0725,  0.0802]], device='cuda:0')
loss: 111.31430053710938
var: tensor([[ 0.0513,  0.0682,  0.0495,  ...,  0.0793,  0.0543,  0.0592],
        [ 0.0776,  0.0969,  0.0996,  ...,  0.1052,  0.0893,  0.0908],
        [ 0.0720,  0.0718,  0.0620,  ...,  0.0890,  0.0687,  0.0742],
        ...,
        [ 0.0516,  0.0801,  0.0596,  ...,  0.0846,  0.0625,  0.0609],
        [ 0.0610,  0.1951,  0.1258,  ...,  0.1663,  0.1379,  0.1645],
        [ 0.0551,  0.1100,  0.0617,  ...,  0.1130,  0.0756,  0.0918]], device='cuda:0')
loss: 110.1442642211914
var: tensor([[ 0.1051,  0.1088,  0.0666

var: tensor([[ 0.0628,  0.0337,  0.0433,  ...,  0.0769,  0.0476,  0.0683],
        [ 0.0786,  0.0975,  0.0572,  ...,  0.1414,  0.0722,  0.1004],
        [ 0.0862,  0.0854,  0.0639,  ...,  0.1344,  0.0855,  0.0889],
        ...,
        [ 0.0831,  0.0614,  0.0512,  ...,  0.0909,  0.0669,  0.0744],
        [ 0.0622,  0.0819,  0.0730,  ...,  0.1079,  0.0839,  0.0934],
        [ 0.0719,  0.0781,  0.0692,  ...,  0.0949,  0.0930,  0.0984]], device='cuda:0')
loss: 116.919189453125
var: tensor([[ 0.1177,  0.1239,  0.0806,  ...,  0.1300,  0.1108,  0.0815],
        [ 0.0881,  0.0815,  0.0487,  ...,  0.1125,  0.0599,  0.0812],
        [ 0.0796,  0.0539,  0.0406,  ...,  0.0831,  0.0427,  0.0745],
        ...,
        [ 0.0903,  0.0646,  0.0549,  ...,  0.1000,  0.0649,  0.1048],
        [ 0.0578,  0.0659,  0.0521,  ...,  0.0914,  0.0483,  0.0686],
        [ 0.2614,  0.1981,  0.0969,  ...,  0.1980,  0.1535,  0.1606]], device='cuda:0')
loss: 115.88372039794922
var: tensor([[ 0.1789,  0.1549,  0.1168,

loss: 113.06412506103516
var: tensor([[ 0.0877,  0.0887,  0.0666,  ...,  0.0957,  0.0781,  0.1008],
        [ 0.0491,  0.0837,  0.0920,  ...,  0.0844,  0.0780,  0.0589],
        [ 0.0932,  0.0893,  0.0786,  ...,  0.1196,  0.0842,  0.1150],
        ...,
        [ 0.0736,  0.1004,  0.0816,  ...,  0.0880,  0.0825,  0.0877],
        [ 0.0805,  0.1040,  0.1144,  ...,  0.1008,  0.1056,  0.0854],
        [ 0.1061,  0.1205,  0.0767,  ...,  0.1225,  0.1067,  0.0774]], device='cuda:0')
loss: 115.91743469238281
var: tensor([[ 0.1120,  0.1254,  0.0864,  ...,  0.1078,  0.1241,  0.0851],
        [ 0.1221,  0.1885,  0.1219,  ...,  0.1694,  0.1355,  0.1597],
        [ 0.0899,  0.0947,  0.0689,  ...,  0.0881,  0.0778,  0.1138],
        ...,
        [ 0.1801,  0.2274,  0.1136,  ...,  0.1748,  0.1516,  0.1515],
        [ 0.0661,  0.0785,  0.0649,  ...,  0.1130,  0.0787,  0.0988],
        [ 0.1230,  0.1045,  0.0775,  ...,  0.1300,  0.1028,  0.1132]], device='cuda:0')
loss: 112.14698791503906
var: tensor([

        [ 0.0488,  0.0783,  0.0492,  ...,  0.0905,  0.0605,  0.0656]], device='cuda:0')
loss: 111.2768325805664
var: tensor([[ 0.0805,  0.0895,  0.0672,  ...,  0.0863,  0.1114,  0.0826],
        [ 0.1428,  0.1430,  0.0774,  ...,  0.1508,  0.1139,  0.1130],
        [ 0.0921,  0.1312,  0.0720,  ...,  0.1090,  0.1209,  0.0953],
        ...,
        [ 0.2303,  0.2222,  0.0879,  ...,  0.1664,  0.1564,  0.1337],
        [ 0.0600,  0.1696,  0.1376,  ...,  0.1401,  0.1384,  0.1317],
        [ 0.0662,  0.1094,  0.0948,  ...,  0.0785,  0.0886,  0.0740]], device='cuda:0')
loss: 110.40440368652344
var: tensor([[ 0.1399,  0.1923,  0.0852,  ...,  0.1767,  0.1394,  0.1224],
        [ 0.0831,  0.0631,  0.0529,  ...,  0.0803,  0.1035,  0.0788],
        [ 0.1003,  0.1047,  0.0676,  ...,  0.1055,  0.0847,  0.0893],
        ...,
        [ 0.1169,  0.0855,  0.0485,  ...,  0.0780,  0.0737,  0.0786],
        [ 0.0542,  0.0666,  0.0504,  ...,  0.0798,  0.0847,  0.0643],
        [ 0.0856,  0.0958,  0.0699,  ..

var: tensor([[ 0.0500,  0.0491,  0.0408,  ...,  0.0703,  0.0775,  0.0544],
        [ 0.0913,  0.1649,  0.1125,  ...,  0.1592,  0.1278,  0.1299],
        [ 0.0650,  0.0987,  0.0828,  ...,  0.0760,  0.0735,  0.0576],
        ...,
        [ 0.0447,  0.0465,  0.0382,  ...,  0.0598,  0.0675,  0.0467],
        [ 0.0742,  0.0631,  0.0477,  ...,  0.0856,  0.0759,  0.0659],
        [ 0.0821,  0.0589,  0.0459,  ...,  0.1110,  0.0896,  0.0787]], device='cuda:0')
loss: 116.87761688232422
var: tensor([[ 0.0858,  0.0699,  0.0381,  ...,  0.0946,  0.0579,  0.0505],
        [ 0.0887,  0.0678,  0.0357,  ...,  0.0618,  0.0503,  0.0703],
        [ 0.0716,  0.0766,  0.0601,  ...,  0.0959,  0.0808,  0.0724],
        ...,
        [ 0.0817,  0.0639,  0.0350,  ...,  0.0702,  0.0439,  0.0470],
        [ 0.0807,  0.0925,  0.0826,  ...,  0.0968,  0.0996,  0.0715],
        [ 0.0656,  0.0595,  0.0374,  ...,  0.0911,  0.0529,  0.0555]], device='cuda:0')
loss: 110.1270751953125
var: tensor([[ 0.0749,  0.0716,  0.0476

var: tensor([[ 0.0804,  0.0604,  0.0627,  ...,  0.0927,  0.0660,  0.0894],
        [ 0.0968,  0.0825,  0.1112,  ...,  0.1120,  0.0919,  0.1138],
        [ 0.0993,  0.0926,  0.0636,  ...,  0.0934,  0.0734,  0.0704],
        ...,
        [ 0.0602,  0.0637,  0.0751,  ...,  0.0831,  0.0997,  0.0788],
        [ 0.2362,  0.1447,  0.0932,  ...,  0.1866,  0.1444,  0.1558],
        [ 0.0814,  0.0964,  0.0912,  ...,  0.1333,  0.1229,  0.0967]], device='cuda:0')
loss: 117.86289978027344
var: tensor([[ 0.0764,  0.0690,  0.0438,  ...,  0.0751,  0.0622,  0.0565],
        [ 0.0559,  0.0610,  0.0642,  ...,  0.0592,  0.0819,  0.0581],
        [ 0.0885,  0.1372,  0.0896,  ...,  0.1306,  0.1259,  0.0962],
        ...,
        [ 0.0850,  0.0912,  0.0783,  ...,  0.1133,  0.0894,  0.0911],
        [ 0.0722,  0.2132,  0.1600,  ...,  0.1859,  0.1571,  0.1781],
        [ 0.1002,  0.0942,  0.0821,  ...,  0.1279,  0.0998,  0.0832]], device='cuda:0')
loss: 111.90663146972656
var: tensor([[ 0.1081,  0.0869,  0.066

var: tensor([[ 0.0562,  0.0879,  0.0530,  ...,  0.1161,  0.0745,  0.0732],
        [ 0.0460,  0.0420,  0.0353,  ...,  0.0655,  0.0714,  0.0546],
        [ 0.0400,  0.0352,  0.0323,  ...,  0.0493,  0.0750,  0.0638],
        ...,
        [ 0.0830,  0.1449,  0.0553,  ...,  0.1479,  0.0986,  0.0797],
        [ 0.0885,  0.1182,  0.0529,  ...,  0.1080,  0.0708,  0.0912],
        [ 0.1142,  0.1019,  0.0890,  ...,  0.1105,  0.0895,  0.0987]], device='cuda:0')
loss: 109.46456146240234
var: tensor([[ 0.0946,  0.0778,  0.0584,  ...,  0.1001,  0.0647,  0.0753],
        [ 0.0476,  0.0689,  0.0719,  ...,  0.1029,  0.0592,  0.0709],
        [ 0.1089,  0.1191,  0.0576,  ...,  0.1208,  0.0977,  0.0727],
        ...,
        [ 0.1129,  0.1356,  0.0587,  ...,  0.1342,  0.0927,  0.0803],
        [ 0.1769,  0.2129,  0.0928,  ...,  0.1995,  0.1445,  0.1694],
        [ 0.0988,  0.1170,  0.0645,  ...,  0.0981,  0.0821,  0.0723]], device='cuda:0')
loss: 115.8231430053711
var: tensor([[ 0.0690,  0.0685,  0.0455

var: tensor([[ 0.0461,  0.0641,  0.0514,  ...,  0.0801,  0.0672,  0.0551],
        [ 0.0592,  0.0688,  0.0741,  ...,  0.1153,  0.0830,  0.0661],
        [ 0.0921,  0.0912,  0.0876,  ...,  0.1465,  0.0886,  0.0973],
        ...,
        [ 0.0268,  0.0285,  0.0325,  ...,  0.0525,  0.0548,  0.0398],
        [ 0.1008,  0.0849,  0.0798,  ...,  0.1250,  0.0999,  0.0853],
        [ 0.0527,  0.0505,  0.0544,  ...,  0.0689,  0.0686,  0.0601]], device='cuda:0')
loss: 111.24981689453125
var: tensor([[ 0.0853,  0.0659,  0.0623,  ...,  0.1116,  0.0679,  0.0743],
        [ 0.0498,  0.0557,  0.0584,  ...,  0.0808,  0.0638,  0.0721],
        [ 0.1100,  0.0522,  0.0384,  ...,  0.0647,  0.0541,  0.0719],
        ...,
        [ 0.0607,  0.0689,  0.0857,  ...,  0.0753,  0.0688,  0.0591],
        [ 0.1309,  0.0766,  0.0708,  ...,  0.1209,  0.0783,  0.0803],
        [ 0.0956,  0.1800,  0.1288,  ...,  0.1780,  0.1314,  0.1536]], device='cuda:0')
loss: 111.58296203613281
var: tensor([[ 0.0470,  0.0452,  0.055

var: tensor([[ 0.0600,  0.0627,  0.0458,  ...,  0.0639,  0.0721,  0.0491],
        [ 0.1647,  0.1736,  0.0835,  ...,  0.1311,  0.1434,  0.1174],
        [ 0.0973,  0.0808,  0.0499,  ...,  0.1159,  0.0774,  0.0829],
        ...,
        [ 0.0347,  0.0511,  0.0401,  ...,  0.0672,  0.0643,  0.0506],
        [ 0.0788,  0.0992,  0.0471,  ...,  0.0854,  0.0787,  0.0504],
        [ 0.0608,  0.0927,  0.0596,  ...,  0.0859,  0.0726,  0.0603]], device='cuda:0')
loss: 111.14790344238281
var: tensor([[ 0.0506,  0.0796,  0.0640,  ...,  0.0885,  0.0920,  0.0725],
        [ 0.1636,  0.2158,  0.0899,  ...,  0.1738,  0.1611,  0.1399],
        [ 0.0815,  0.1071,  0.0505,  ...,  0.1143,  0.0918,  0.0709],
        ...,
        [ 0.0481,  0.1519,  0.1162,  ...,  0.1164,  0.1408,  0.1221],
        [ 0.0432,  0.0557,  0.0437,  ...,  0.0590,  0.0859,  0.0520],
        [ 0.1110,  0.1813,  0.1059,  ...,  0.1374,  0.1277,  0.1347]], device='cuda:0')
loss: 111.44050598144531
var: tensor([[ 0.1218,  0.0658,  0.048

var: tensor([[ 0.0628,  0.0741,  0.0513,  ...,  0.1072,  0.0847,  0.0625],
        [ 0.0668,  0.0777,  0.0570,  ...,  0.1101,  0.0629,  0.0726],
        [ 0.0986,  0.0904,  0.0699,  ...,  0.1127,  0.1067,  0.0611],
        ...,
        [ 0.0251,  0.0533,  0.0434,  ...,  0.0639,  0.0646,  0.0477],
        [ 0.0659,  0.1593,  0.1422,  ...,  0.1491,  0.1391,  0.0822],
        [ 0.1171,  0.1222,  0.0718,  ...,  0.1005,  0.0951,  0.0728]], device='cuda:0')
loss: 113.80101776123047
var: tensor([[ 0.0565,  0.0642,  0.0469,  ...,  0.0803,  0.0559,  0.0408],
        [ 0.0708,  0.1878,  0.1463,  ...,  0.1738,  0.1226,  0.1240],
        [ 0.0630,  0.0758,  0.0466,  ...,  0.0706,  0.0955,  0.0394],
        ...,
        [ 0.0379,  0.0516,  0.0501,  ...,  0.0518,  0.0993,  0.0366],
        [ 0.0513,  0.0716,  0.0710,  ...,  0.0895,  0.0846,  0.0522],
        [ 0.0737,  0.0713,  0.0522,  ...,  0.1208,  0.0733,  0.0556]], device='cuda:0')
loss: 113.08482360839844
var: tensor([[ 0.0485,  0.0572,  0.054

var: tensor([[ 0.0726,  0.0917,  0.0706,  ...,  0.1140,  0.0833,  0.0859],
        [ 0.1077,  0.1311,  0.0707,  ...,  0.1148,  0.0865,  0.0878],
        [ 0.0629,  0.0615,  0.0542,  ...,  0.0862,  0.0705,  0.0598],
        ...,
        [ 0.0675,  0.0665,  0.0945,  ...,  0.0995,  0.0833,  0.0643],
        [ 0.0827,  0.0817,  0.0676,  ...,  0.0943,  0.0770,  0.0697],
        [ 0.0550,  0.0411,  0.0489,  ...,  0.0842,  0.0414,  0.0640]], device='cuda:0')
loss: 115.29399871826172
var: tensor([[ 0.0525,  0.0753,  0.0408,  ...,  0.0853,  0.0536,  0.0608],
        [ 0.0566,  0.0592,  0.0650,  ...,  0.1093,  0.0638,  0.0651],
        [ 0.0725,  0.0575,  0.0420,  ...,  0.0840,  0.0568,  0.0604],
        ...,
        [ 0.2531,  0.1710,  0.1016,  ...,  0.2151,  0.1873,  0.1484],
        [ 0.0599,  0.0656,  0.0465,  ...,  0.0770,  0.0548,  0.0771],
        [ 0.0840,  0.0576,  0.0516,  ...,  0.1006,  0.0575,  0.0793]], device='cuda:0')
loss: 113.02757263183594
var: tensor([[ 0.0962,  0.0721,  0.058

loss: 114.95018005371094
var: tensor([[ 0.0470,  0.0437,  0.0550,  ...,  0.0633,  0.0489,  0.0625],
        [ 0.0785,  0.1177,  0.0440,  ...,  0.1252,  0.0845,  0.0645],
        [ 0.0536,  0.0739,  0.0480,  ...,  0.0931,  0.0653,  0.0615],
        ...,
        [ 0.0872,  0.0764,  0.0547,  ...,  0.1205,  0.0772,  0.0798],
        [ 0.2222,  0.2097,  0.0810,  ...,  0.1974,  0.1754,  0.1294],
        [ 0.0533,  0.0555,  0.0551,  ...,  0.0798,  0.0785,  0.0676]], device='cuda:0')
loss: 110.48460388183594
var: tensor([[ 0.0910,  0.1054,  0.0590,  ...,  0.1260,  0.1069,  0.0665],
        [ 0.0658,  0.0866,  0.0575,  ...,  0.1051,  0.0846,  0.0708],
        [ 0.0645,  0.0502,  0.0434,  ...,  0.0833,  0.0735,  0.0621],
        ...,
        [ 0.0796,  0.1246,  0.0468,  ...,  0.1103,  0.0929,  0.0650],
        [ 0.0558,  0.1213,  0.0937,  ...,  0.1138,  0.1264,  0.1001],
        [ 0.0686,  0.0388,  0.0438,  ...,  0.0645,  0.0600,  0.0606]], device='cuda:0')
loss: 111.06893920898438
var: tensor([

var: tensor([[ 0.0568,  0.0818,  0.0639,  ...,  0.0868,  0.0882,  0.0946],
        [ 0.0631,  0.0726,  0.0563,  ...,  0.0864,  0.0859,  0.0639],
        [ 0.0623,  0.0689,  0.0596,  ...,  0.0760,  0.0697,  0.0674],
        ...,
        [ 0.0561,  0.0621,  0.0481,  ...,  0.0704,  0.0569,  0.0594],
        [ 0.0323,  0.0657,  0.0452,  ...,  0.0621,  0.0754,  0.0606],
        [ 0.0387,  0.0454,  0.0516,  ...,  0.0704,  0.0907,  0.0740]], device='cuda:0')
loss: 112.24855041503906
var: tensor([[ 0.0767,  0.1975,  0.1285,  ...,  0.1543,  0.1143,  0.1585],
        [ 0.0824,  0.1312,  0.0618,  ...,  0.1147,  0.0717,  0.0973],
        [ 0.0449,  0.0752,  0.0679,  ...,  0.0832,  0.0849,  0.0594],
        ...,
        [ 0.1467,  0.2046,  0.0864,  ...,  0.1406,  0.1176,  0.1105],
        [ 0.0777,  0.0907,  0.0767,  ...,  0.0910,  0.0752,  0.0811],
        [ 0.0760,  0.1019,  0.0644,  ...,  0.0906,  0.0886,  0.0774]], device='cuda:0')
loss: 109.85098266601562
var: tensor([[ 0.0419,  0.1093,  0.045

var: tensor([[ 0.0725,  0.0816,  0.0549,  ...,  0.0868,  0.0703,  0.1013],
        [ 0.0645,  0.0790,  0.0557,  ...,  0.1241,  0.0671,  0.0619],
        [ 0.0496,  0.0546,  0.0490,  ...,  0.0880,  0.1000,  0.0524],
        ...,
        [ 0.0498,  0.0533,  0.0413,  ...,  0.1275,  0.0706,  0.0693],
        [ 0.0503,  0.0421,  0.0418,  ...,  0.1147,  0.0610,  0.0686],
        [ 0.0647,  0.1746,  0.1318,  ...,  0.1926,  0.1267,  0.1619]], device='cuda:0')
loss: 109.98819732666016
var: tensor([[ 0.0433,  0.0410,  0.0314,  ...,  0.0760,  0.0614,  0.0528],
        [ 0.0364,  0.0452,  0.0377,  ...,  0.0781,  0.0445,  0.0495],
        [ 0.0540,  0.0467,  0.0478,  ...,  0.0798,  0.0786,  0.0631],
        ...,
        [ 0.0405,  0.0490,  0.0406,  ...,  0.0872,  0.0666,  0.0569],
        [ 0.1015,  0.1075,  0.0736,  ...,  0.1397,  0.0780,  0.1156],
        [ 0.0443,  0.0472,  0.0405,  ...,  0.0760,  0.0629,  0.0549]], device='cuda:0')
loss: 112.67774200439453
var: tensor([[ 0.0818,  0.0693,  0.049

loss: 114.36190795898438
var: tensor([[ 0.0451,  0.0596,  0.0427,  ...,  0.0906,  0.0524,  0.0628],
        [ 0.1827,  0.1692,  0.0735,  ...,  0.1978,  0.1569,  0.1361],
        [ 0.0689,  0.0787,  0.0600,  ...,  0.1328,  0.0675,  0.0831],
        ...,
        [ 0.0503,  0.0615,  0.0614,  ...,  0.0671,  0.0622,  0.0528],
        [ 0.0528,  0.0793,  0.0581,  ...,  0.0953,  0.0727,  0.0673],
        [ 0.0585,  0.0563,  0.0474,  ...,  0.0925,  0.0750,  0.0661]], device='cuda:0')
loss: 108.26148986816406
var: tensor([[ 0.0799,  0.0877,  0.0762,  ...,  0.1101,  0.0751,  0.0870],
        [ 0.0977,  0.1993,  0.1206,  ...,  0.1846,  0.1540,  0.1517],
        [ 0.0542,  0.0555,  0.0439,  ...,  0.0868,  0.0749,  0.0694],
        ...,
        [ 0.0393,  0.0554,  0.0435,  ...,  0.0800,  0.0787,  0.0875],
        [ 0.0337,  0.0595,  0.0702,  ...,  0.0777,  0.0862,  0.0519],
        [ 0.0758,  0.0515,  0.0470,  ...,  0.1001,  0.0602,  0.0584]], device='cuda:0')
loss: 112.19412231445312
var: tensor([

var: tensor([[ 0.0609,  0.0684,  0.0601,  ...,  0.0757,  0.0683,  0.0605],
        [ 0.0390,  0.0476,  0.0430,  ...,  0.0538,  0.0777,  0.0747],
        [ 0.0484,  0.0745,  0.0542,  ...,  0.0732,  0.0578,  0.0697],
        ...,
        [ 0.0784,  0.0636,  0.0527,  ...,  0.0711,  0.0638,  0.0850],
        [ 0.0401,  0.0437,  0.0389,  ...,  0.0471,  0.0635,  0.0431],
        [ 0.0777,  0.0605,  0.0608,  ...,  0.0743,  0.0489,  0.0871]], device='cuda:0')
loss: 107.22459411621094
var: tensor([[ 0.0440,  0.0646,  0.0497,  ...,  0.0682,  0.0542,  0.0560],
        [ 0.0624,  0.0658,  0.0590,  ...,  0.0786,  0.0667,  0.0673],
        [ 0.0320,  0.0533,  0.0321,  ...,  0.0864,  0.0685,  0.0581],
        ...,
        [ 0.0404,  0.0710,  0.0539,  ...,  0.0569,  0.0584,  0.0586],
        [ 0.0751,  0.0920,  0.0625,  ...,  0.0907,  0.0670,  0.0728],
        [ 0.0745,  0.0658,  0.0410,  ...,  0.0924,  0.0470,  0.0535]], device='cuda:0')
loss: 114.68283081054688
var: tensor([[ 0.0617,  0.0771,  0.059

var: tensor([[ 0.0441,  0.0506,  0.0304,  ...,  0.0582,  0.0868,  0.0492],
        [ 0.0733,  0.0718,  0.0377,  ...,  0.1272,  0.1068,  0.0527],
        [ 0.0380,  0.0667,  0.0337,  ...,  0.0843,  0.0912,  0.0766],
        ...,
        [ 0.0541,  0.0615,  0.0397,  ...,  0.0771,  0.0751,  0.1083],
        [ 0.0529,  0.0551,  0.0387,  ...,  0.0835,  0.1014,  0.0701],
        [ 0.0775,  0.0669,  0.0325,  ...,  0.0751,  0.0686,  0.0827]], device='cuda:0')
loss: 111.93504333496094
var: tensor([[ 0.0531,  0.0597,  0.0337,  ...,  0.0721,  0.0534,  0.0579],
        [ 0.0640,  0.0960,  0.0587,  ...,  0.0812,  0.0713,  0.0691],
        [ 0.0630,  0.1813,  0.1117,  ...,  0.1670,  0.1606,  0.1421],
        ...,
        [ 0.0489,  0.0630,  0.0485,  ...,  0.0803,  0.0895,  0.0750],
        [ 0.0464,  0.0546,  0.0519,  ...,  0.0762,  0.0881,  0.0815],
        [ 0.0404,  0.0354,  0.0317,  ...,  0.0580,  0.0537,  0.0508]], device='cuda:0')
loss: 111.6052017211914
var: tensor([[ 0.0749,  0.0636,  0.0295

loss: 108.3156509399414
var: tensor([[ 0.0599,  0.1280,  0.0620,  ...,  0.1407,  0.0915,  0.0695],
        [ 0.0545,  0.0562,  0.0421,  ...,  0.0732,  0.0723,  0.0491],
        [ 0.0634,  0.0637,  0.0477,  ...,  0.0865,  0.0750,  0.0673],
        ...,
        [ 0.0660,  0.0580,  0.0266,  ...,  0.0753,  0.0545,  0.0538],
        [ 0.0448,  0.0569,  0.0386,  ...,  0.0594,  0.0430,  0.0461],
        [ 0.0454,  0.1584,  0.1031,  ...,  0.1653,  0.1593,  0.1135]], device='cuda:0')
loss: 111.6851806640625
var: tensor([[ 0.0950,  0.0928,  0.0488,  ...,  0.0917,  0.0712,  0.0603],
        [ 0.0807,  0.1478,  0.0595,  ...,  0.1391,  0.1132,  0.0702],
        [ 0.0267,  0.0422,  0.0281,  ...,  0.0566,  0.0367,  0.0411],
        ...,
        [ 0.0585,  0.0567,  0.0516,  ...,  0.0895,  0.0626,  0.0585],
        [ 0.0412,  0.0503,  0.0461,  ...,  0.0727,  0.0690,  0.0538],
        [ 0.0802,  0.0810,  0.0560,  ...,  0.1178,  0.1131,  0.0509]], device='cuda:0')
loss: 113.02381896972656
var: tensor([[ 

var: tensor([[ 0.0661,  0.0701,  0.0465,  ...,  0.0937,  0.0736,  0.1169],
        [ 0.1335,  0.1258,  0.0704,  ...,  0.1138,  0.0951,  0.0825],
        [ 0.0910,  0.0986,  0.0403,  ...,  0.0805,  0.0553,  0.0726],
        ...,
        [ 0.0430,  0.1077,  0.0423,  ...,  0.0839,  0.0504,  0.0567],
        [ 0.0382,  0.0593,  0.0437,  ...,  0.0536,  0.0638,  0.0436],
        [ 0.0443,  0.0599,  0.0387,  ...,  0.0596,  0.0457,  0.0510]], device='cuda:0')
loss: 108.58782196044922
var: tensor([[ 0.1108,  0.1939,  0.1192,  ...,  0.1644,  0.1316,  0.1514],
        [ 0.0583,  0.1035,  0.0903,  ...,  0.1127,  0.0855,  0.0728],
        [ 0.0473,  0.0550,  0.0412,  ...,  0.0502,  0.0483,  0.0345],
        ...,
        [ 0.1488,  0.0839,  0.0486,  ...,  0.1108,  0.0565,  0.0835],
        [ 0.0812,  0.0918,  0.0556,  ...,  0.1093,  0.1032,  0.0830],
        [ 0.0648,  0.0793,  0.0486,  ...,  0.0650,  0.0598,  0.0625]], device='cuda:0')
loss: 109.72782897949219
var: tensor([[ 0.1015,  0.1217,  0.054

var: tensor([[ 0.1072,  0.1777,  0.1319,  ...,  0.1659,  0.1342,  0.1461],
        [ 0.0656,  0.0730,  0.0505,  ...,  0.0811,  0.0551,  0.0862],
        [ 0.1087,  0.0813,  0.0581,  ...,  0.0936,  0.0653,  0.0866],
        ...,
        [ 0.0712,  0.0580,  0.0601,  ...,  0.0992,  0.0626,  0.0806],
        [ 0.0404,  0.0478,  0.0455,  ...,  0.0639,  0.0551,  0.0489],
        [ 0.0534,  0.0919,  0.0604,  ...,  0.0757,  0.0661,  0.0610]], device='cuda:0')
loss: 109.76848602294922
var: tensor([[ 0.0598,  0.0370,  0.0296,  ...,  0.0586,  0.0372,  0.0535],
        [ 0.1094,  0.0708,  0.0503,  ...,  0.0837,  0.0513,  0.0731],
        [ 0.0432,  0.0710,  0.0422,  ...,  0.0553,  0.0623,  0.0578],
        ...,
        [ 0.0640,  0.1020,  0.0486,  ...,  0.0955,  0.0679,  0.0723],
        [ 0.0443,  0.0557,  0.0491,  ...,  0.0492,  0.0810,  0.0455],
        [ 0.0777,  0.0625,  0.0502,  ...,  0.0844,  0.0581,  0.0663]], device='cuda:0')
loss: 111.93211364746094
var: tensor([[ 0.0326,  0.0430,  0.026

loss: 107.9942626953125
var: tensor([[ 0.0596,  0.0534,  0.0446,  ...,  0.0662,  0.0556,  0.0636],
        [ 0.0828,  0.0633,  0.0560,  ...,  0.0754,  0.0747,  0.0746],
        [ 0.0696,  0.0888,  0.0573,  ...,  0.0889,  0.0665,  0.0839],
        ...,
        [ 0.0526,  0.0574,  0.0425,  ...,  0.0543,  0.0777,  0.0846],
        [ 0.0532,  0.0806,  0.0871,  ...,  0.0696,  0.0760,  0.0647],
        [ 0.0725,  0.1014,  0.0941,  ...,  0.0912,  0.0885,  0.0945]], device='cuda:0')
loss: 108.44580078125
var: tensor([[ 0.0551,  0.1009,  0.0583,  ...,  0.0738,  0.0808,  0.0864],
        [ 0.0881,  0.0916,  0.0542,  ...,  0.1003,  0.0888,  0.0682],
        [ 0.0552,  0.0817,  0.0634,  ...,  0.0861,  0.0713,  0.0911],
        ...,
        [ 0.0518,  0.0505,  0.0487,  ...,  0.0492,  0.0836,  0.0420],
        [ 0.0839,  0.0687,  0.0714,  ...,  0.0804,  0.0770,  0.0809],
        [ 0.0866,  0.1224,  0.0701,  ...,  0.0929,  0.0886,  0.0827]], device='cuda:0')
loss: 112.66441345214844
var: tensor([[ 0.

var: tensor([[ 0.1222,  0.1259,  0.0629,  ...,  0.0958,  0.0927,  0.0959],
        [ 0.0460,  0.0649,  0.0546,  ...,  0.0722,  0.0686,  0.0512],
        [ 0.0579,  0.0498,  0.0336,  ...,  0.0795,  0.0454,  0.0647],
        ...,
        [ 0.0821,  0.0971,  0.0568,  ...,  0.1011,  0.0832,  0.0632],
        [ 0.2003,  0.1774,  0.0852,  ...,  0.1482,  0.1443,  0.1489],
        [ 0.0743,  0.1150,  0.0470,  ...,  0.0906,  0.0830,  0.0729]], device='cuda:0')
loss: 109.28620147705078
var: tensor([[ 0.0646,  0.0459,  0.0440,  ...,  0.0715,  0.0430,  0.0529],
        [ 0.0433,  0.0544,  0.0339,  ...,  0.0512,  0.0371,  0.0468],
        [ 0.0535,  0.0407,  0.0433,  ...,  0.0527,  0.0448,  0.0455],
        ...,
        [ 0.1263,  0.1208,  0.0693,  ...,  0.1105,  0.1149,  0.0770],
        [ 0.0658,  0.0855,  0.0558,  ...,  0.0859,  0.0677,  0.0792],
        [ 0.1175,  0.1533,  0.0702,  ...,  0.1224,  0.1117,  0.0858]], device='cuda:0')
loss: 109.62202453613281
var: tensor([[ 0.0524,  0.0501,  0.037

loss: 105.99962615966797
var: tensor([[ 0.0990,  0.0929,  0.0545,  ...,  0.0839,  0.0676,  0.0821],
        [ 0.0433,  0.0447,  0.0445,  ...,  0.0592,  0.0583,  0.0611],
        [ 0.1093,  0.0910,  0.0572,  ...,  0.1024,  0.0689,  0.0810],
        ...,
        [ 0.0518,  0.0551,  0.0475,  ...,  0.0881,  0.0683,  0.1035],
        [ 0.0431,  0.0677,  0.0441,  ...,  0.0798,  0.0513,  0.0538],
        [ 0.1748,  0.2175,  0.0807,  ...,  0.1819,  0.1510,  0.1454]], device='cuda:0')
loss: 107.84664916992188
var: tensor([[ 0.0402,  0.0416,  0.0374,  ...,  0.0550,  0.0548,  0.0470],
        [ 0.0635,  0.0722,  0.0572,  ...,  0.0900,  0.0651,  0.0585],
        [ 0.0423,  0.0494,  0.0372,  ...,  0.0567,  0.0519,  0.0508],
        ...,
        [ 0.0674,  0.0556,  0.0480,  ...,  0.0698,  0.0411,  0.0880],
        [ 0.0771,  0.1527,  0.0820,  ...,  0.1219,  0.0907,  0.1109],
        [ 0.0498,  0.0883,  0.0842,  ...,  0.0957,  0.0629,  0.0663]], device='cuda:0')
loss: 112.90152740478516
var: tensor([

var: tensor([[ 0.0451,  0.1541,  0.1132,  ...,  0.1494,  0.1269,  0.1348],
        [ 0.0562,  0.0460,  0.0503,  ...,  0.0918,  0.0846,  0.0853],
        [ 0.0719,  0.0930,  0.0715,  ...,  0.0945,  0.0855,  0.0675],
        ...,
        [ 0.0414,  0.0321,  0.0337,  ...,  0.0951,  0.0647,  0.0878],
        [ 0.0684,  0.0876,  0.0768,  ...,  0.0933,  0.0793,  0.0695],
        [ 0.0394,  0.0917,  0.0741,  ...,  0.1003,  0.0865,  0.0721]], device='cuda:0')
loss: 116.66316223144531
var: tensor([[ 0.0550,  0.0516,  0.0472,  ...,  0.0718,  0.0623,  0.0531],
        [ 0.0966,  0.0649,  0.0567,  ...,  0.1239,  0.0769,  0.0756],
        [ 0.0316,  0.0373,  0.0374,  ...,  0.0601,  0.0601,  0.0394],
        ...,
        [ 0.0430,  0.0464,  0.0386,  ...,  0.0760,  0.0600,  0.0512],
        [ 0.0713,  0.0443,  0.0421,  ...,  0.0848,  0.0463,  0.0702],
        [ 0.0516,  0.0948,  0.0628,  ...,  0.1153,  0.1155,  0.1062]], device='cuda:0')
loss: 108.46623229980469
var: tensor([[ 0.0486,  0.0579,  0.031

loss: 114.20599365234375
var: tensor([[ 0.0556,  0.0747,  0.0518,  ...,  0.1144,  0.0584,  0.0755],
        [ 0.1567,  0.0833,  0.0569,  ...,  0.1433,  0.0808,  0.1017],
        [ 0.0778,  0.0907,  0.0624,  ...,  0.1142,  0.0920,  0.0795],
        ...,
        [ 0.1010,  0.0529,  0.0523,  ...,  0.0918,  0.0481,  0.0830],
        [ 0.0840,  0.0551,  0.0476,  ...,  0.0997,  0.0529,  0.0768],
        [ 0.0753,  0.0851,  0.0563,  ...,  0.0789,  0.0739,  0.0585]], device='cuda:0')
loss: 111.17068481445312
var: tensor([[ 0.1181,  0.1812,  0.1151,  ...,  0.2117,  0.1273,  0.1461],
        [ 0.1260,  0.0755,  0.0585,  ...,  0.1044,  0.0746,  0.0804],
        [ 0.0480,  0.0550,  0.0440,  ...,  0.0932,  0.0693,  0.0734],
        ...,
        [ 0.0617,  0.0850,  0.0542,  ...,  0.1077,  0.0705,  0.0662],
        [ 0.0685,  0.0899,  0.0726,  ...,  0.1393,  0.0952,  0.0783],
        [ 0.0471,  0.0501,  0.0368,  ...,  0.0737,  0.0665,  0.0600]], device='cuda:0')
loss: 109.54129028320312
var: tensor([

var: tensor([[ 0.0428,  0.0565,  0.0433,  ...,  0.0556,  0.0545,  0.0686],
        [ 0.0475,  0.0600,  0.0550,  ...,  0.0627,  0.0876,  0.0769],
        [ 0.0450,  0.0621,  0.0449,  ...,  0.0769,  0.0736,  0.0935],
        ...,
        [ 0.0483,  0.0867,  0.0540,  ...,  0.0675,  0.0543,  0.0639],
        [ 0.0360,  0.0711,  0.0408,  ...,  0.0646,  0.0455,  0.0455],
        [ 0.1746,  0.1492,  0.0700,  ...,  0.1635,  0.1168,  0.1176]], device='cuda:0')
loss: 113.95613861083984
var: tensor([[ 0.0457,  0.0559,  0.0599,  ...,  0.0575,  0.0456,  0.0353],
        [ 0.0437,  0.0624,  0.0501,  ...,  0.0659,  0.0627,  0.0697],
        [ 0.0634,  0.0829,  0.0593,  ...,  0.0788,  0.0511,  0.0701],
        ...,
        [ 0.0916,  0.0817,  0.0799,  ...,  0.0914,  0.0739,  0.0983],
        [ 0.0704,  0.0878,  0.0657,  ...,  0.0886,  0.0658,  0.0587],
        [ 0.0577,  0.0690,  0.0481,  ...,  0.0641,  0.0509,  0.0750]], device='cuda:0')
loss: 114.49578094482422
var: tensor([[ 0.0352,  0.0689,  0.037

loss: 110.19932556152344
var: tensor([[ 0.0565,  0.0723,  0.0467,  ...,  0.0876,  0.0461,  0.0725],
        [ 0.0629,  0.0858,  0.0516,  ...,  0.0929,  0.0729,  0.0765],
        [ 0.0545,  0.0609,  0.0445,  ...,  0.0889,  0.0585,  0.0657],
        ...,
        [ 0.0811,  0.0614,  0.0555,  ...,  0.0750,  0.0447,  0.0721],
        [ 0.0255,  0.0346,  0.0279,  ...,  0.0462,  0.0443,  0.0475],
        [ 0.1030,  0.0616,  0.0429,  ...,  0.0728,  0.0431,  0.0633]], device='cuda:0')
loss: 112.80530548095703
var: tensor([[ 0.0461,  0.0574,  0.0447,  ...,  0.0640,  0.0741,  0.0585],
        [ 0.0518,  0.0891,  0.0478,  ...,  0.0741,  0.0653,  0.0709],
        [ 0.0356,  0.0483,  0.0340,  ...,  0.0694,  0.0455,  0.0766],
        ...,
        [ 0.0511,  0.0679,  0.0498,  ...,  0.0727,  0.0795,  0.0714],
        [ 0.0459,  0.0424,  0.0301,  ...,  0.0752,  0.0445,  0.0629],
        [ 0.0823,  0.0797,  0.0484,  ...,  0.0947,  0.0781,  0.0675]], device='cuda:0')
loss: 110.90689849853516
var: tensor([

var: tensor([[ 0.0576,  0.0979,  0.0436,  ...,  0.0816,  0.0539,  0.1091],
        [ 0.0883,  0.0603,  0.0565,  ...,  0.0916,  0.0560,  0.0902],
        [ 0.1085,  0.1096,  0.0480,  ...,  0.1204,  0.0718,  0.0919],
        ...,
        [ 0.0482,  0.2269,  0.1368,  ...,  0.1860,  0.1154,  0.1644],
        [ 0.0542,  0.0806,  0.0415,  ...,  0.0771,  0.0566,  0.0575],
        [ 0.1497,  0.1469,  0.0629,  ...,  0.1559,  0.1065,  0.1307]], device='cuda:0')
loss: 109.54251098632812
var: tensor([[ 0.0552,  0.0859,  0.0746,  ...,  0.0969,  0.0738,  0.0763],
        [ 0.0531,  0.1187,  0.0574,  ...,  0.0879,  0.0690,  0.1034],
        [ 0.0700,  0.1198,  0.0573,  ...,  0.0990,  0.0762,  0.0664],
        ...,
        [ 0.0536,  0.0611,  0.0457,  ...,  0.0943,  0.0419,  0.0657],
        [ 0.0375,  0.0490,  0.0458,  ...,  0.0660,  0.0693,  0.0642],
        [ 0.0971,  0.1129,  0.0560,  ...,  0.1329,  0.0746,  0.0935]], device='cuda:0')
loss: 114.12417602539062
var: tensor([[ 0.0582,  0.0718,  0.042

var: tensor([[ 0.0356,  0.0484,  0.0306,  ...,  0.0754,  0.0556,  0.0523],
        [ 0.0978,  0.0902,  0.0685,  ...,  0.1249,  0.0772,  0.1012],
        [ 0.0332,  0.0379,  0.0315,  ...,  0.0754,  0.0681,  0.0803],
        ...,
        [ 0.0769,  0.0973,  0.0505,  ...,  0.1235,  0.0976,  0.0675],
        [ 0.0625,  0.0881,  0.0723,  ...,  0.1150,  0.0780,  0.0858],
        [ 0.0651,  0.0662,  0.0455,  ...,  0.0840,  0.0482,  0.0701]], device='cuda:0')
loss: 110.90158081054688
var: tensor([[ 0.1119,  0.1028,  0.0815,  ...,  0.1103,  0.0844,  0.0849],
        [ 0.0595,  0.0628,  0.0543,  ...,  0.1049,  0.0708,  0.0731],
        [ 0.0461,  0.0399,  0.0316,  ...,  0.0761,  0.0517,  0.0830],
        ...,
        [ 0.0585,  0.0699,  0.0569,  ...,  0.1058,  0.0719,  0.0825],
        [ 0.0713,  0.0677,  0.0460,  ...,  0.0906,  0.0673,  0.0548],
        [ 0.0756,  0.0808,  0.0615,  ...,  0.0974,  0.0880,  0.0703]], device='cuda:0')
loss: 110.34622192382812
var: tensor([[ 0.0852,  0.1053,  0.060

var: tensor([[ 0.0727,  0.0790,  0.0766,  ...,  0.1125,  0.0865,  0.0687],
        [ 0.0359,  0.0793,  0.0560,  ...,  0.0920,  0.0709,  0.0755],
        [ 0.0735,  0.0628,  0.0847,  ...,  0.1024,  0.0810,  0.0835],
        ...,
        [ 0.0341,  0.0448,  0.0393,  ...,  0.0578,  0.0908,  0.0504],
        [ 0.0455,  0.0485,  0.0417,  ...,  0.0546,  0.0671,  0.0478],
        [ 0.0520,  0.0734,  0.0508,  ...,  0.0971,  0.0901,  0.0923]], device='cuda:0')
loss: 108.11622619628906
var: tensor([[ 0.0885,  0.1058,  0.0929,  ...,  0.1091,  0.1120,  0.0785],
        [ 0.0643,  0.0485,  0.0440,  ...,  0.0791,  0.0502,  0.0593],
        [ 0.0712,  0.1203,  0.0582,  ...,  0.1242,  0.1097,  0.0734],
        ...,
        [ 0.0421,  0.0578,  0.0483,  ...,  0.0930,  0.0695,  0.0553],
        [ 0.0515,  0.0706,  0.0702,  ...,  0.0696,  0.0576,  0.0642],
        [ 0.0475,  0.0858,  0.0458,  ...,  0.0863,  0.0596,  0.0701]], device='cuda:0')
loss: 113.95130920410156
var: tensor([[ 0.0628,  0.1101,  0.079

var: tensor([[ 0.0434,  0.0542,  0.0357,  ...,  0.0732,  0.0684,  0.0629],
        [ 0.0430,  0.0492,  0.0528,  ...,  0.0577,  0.0935,  0.0500],
        [ 0.0553,  0.0708,  0.0441,  ...,  0.0813,  0.0716,  0.0589],
        ...,
        [ 0.0591,  0.0881,  0.0455,  ...,  0.0898,  0.0632,  0.0725],
        [ 0.0761,  0.0909,  0.0753,  ...,  0.0968,  0.0811,  0.0754],
        [ 0.0497,  0.1760,  0.1539,  ...,  0.1529,  0.1361,  0.1382]], device='cuda:0')
loss: 107.66681671142578
var: tensor([[ 0.0839,  0.1771,  0.1220,  ...,  0.1645,  0.1047,  0.1671],
        [ 0.0437,  0.0526,  0.0465,  ...,  0.0780,  0.0532,  0.0684],
        [ 0.0752,  0.0810,  0.0405,  ...,  0.0950,  0.0983,  0.0536],
        ...,
        [ 0.0541,  0.0793,  0.0385,  ...,  0.0648,  0.0767,  0.0615],
        [ 0.0495,  0.0775,  0.0421,  ...,  0.0801,  0.0595,  0.0764],
        [ 0.0420,  0.0604,  0.0505,  ...,  0.0504,  0.0972,  0.0529]], device='cuda:0')
loss: 108.31490325927734
var: tensor([[ 0.0632,  0.0698,  0.053

var: tensor([[ 0.0711,  0.2201,  0.1706,  ...,  0.2271,  0.1602,  0.2446],
        [ 0.0438,  0.0415,  0.0343,  ...,  0.0485,  0.0564,  0.0648],
        [ 0.0670,  0.0726,  0.0359,  ...,  0.0927,  0.0637,  0.0576],
        ...,
        [ 0.1613,  0.1486,  0.1010,  ...,  0.1838,  0.1374,  0.1585],
        [ 0.0995,  0.1159,  0.0567,  ...,  0.1153,  0.0988,  0.0885],
        [ 0.0670,  0.1051,  0.0787,  ...,  0.0906,  0.0749,  0.0896]], device='cuda:0')
loss: 112.39920806884766
var: tensor([[ 0.0832,  0.1726,  0.0958,  ...,  0.1586,  0.1197,  0.1129],
        [ 0.0331,  0.0443,  0.0313,  ...,  0.0447,  0.0618,  0.0473],
        [ 0.0433,  0.0749,  0.0436,  ...,  0.0766,  0.0674,  0.0641],
        ...,
        [ 0.1058,  0.1172,  0.0680,  ...,  0.1458,  0.1040,  0.0950],
        [ 0.1458,  0.0920,  0.0509,  ...,  0.1030,  0.0987,  0.0869],
        [ 0.1479,  0.0743,  0.0517,  ...,  0.0970,  0.0670,  0.0923]], device='cuda:0')
loss: 107.00897979736328
var: tensor([[ 0.1068,  0.0631,  0.041

loss: 108.96638488769531
var: tensor([[ 0.0474,  0.0515,  0.0424,  ...,  0.0671,  0.0594,  0.0626],
        [ 0.0849,  0.0804,  0.0550,  ...,  0.1313,  0.0788,  0.0494],
        [ 0.0627,  0.0633,  0.0426,  ...,  0.0613,  0.0806,  0.0483],
        ...,
        [ 0.0685,  0.0794,  0.0633,  ...,  0.0875,  0.0891,  0.0757],
        [ 0.1336,  0.1646,  0.0970,  ...,  0.1952,  0.1614,  0.1244],
        [ 0.0567,  0.0907,  0.0533,  ...,  0.1086,  0.0878,  0.0545]], device='cuda:0')
loss: 112.3749008178711
var: tensor([[ 0.0781,  0.0709,  0.0404,  ...,  0.0885,  0.0653,  0.0626],
        [ 0.1380,  0.2007,  0.1014,  ...,  0.1665,  0.1394,  0.1118],
        [ 0.0471,  0.0649,  0.0424,  ...,  0.0745,  0.0514,  0.0424],
        ...,
        [ 0.0695,  0.0534,  0.0333,  ...,  0.0994,  0.0745,  0.0352],
        [ 0.0714,  0.0502,  0.0484,  ...,  0.0747,  0.0553,  0.0716],
        [ 0.0397,  0.0503,  0.0443,  ...,  0.0475,  0.0553,  0.0395]], device='cuda:0')
loss: 111.29524993896484
var: tensor([[

var: tensor([[ 0.0585,  0.1700,  0.1386,  ...,  0.1860,  0.1096,  0.1354],
        [ 0.0453,  0.0681,  0.0626,  ...,  0.0968,  0.0614,  0.0593],
        [ 0.0512,  0.0925,  0.0663,  ...,  0.0867,  0.0630,  0.0659],
        ...,
        [ 0.0507,  0.0536,  0.0540,  ...,  0.0853,  0.0359,  0.0585],
        [ 0.0283,  0.0332,  0.0329,  ...,  0.0589,  0.0466,  0.0433],
        [ 0.0352,  0.0380,  0.0387,  ...,  0.0757,  0.0754,  0.0485]], device='cuda:0')
loss: 110.42401123046875
var: tensor([[ 0.0503,  0.0966,  0.0720,  ...,  0.0820,  0.0647,  0.0513],
        [ 0.1614,  0.0874,  0.0690,  ...,  0.1227,  0.0770,  0.0973],
        [ 0.0701,  0.0917,  0.0750,  ...,  0.1120,  0.0667,  0.0660],
        ...,
        [ 0.0588,  0.0516,  0.0462,  ...,  0.0876,  0.0456,  0.0426],
        [ 0.1411,  0.1089,  0.0932,  ...,  0.1408,  0.0947,  0.1302],
        [ 0.0539,  0.0617,  0.0614,  ...,  0.0856,  0.0658,  0.0594]], device='cuda:0')
loss: 111.40492248535156
var: tensor([[ 0.0816,  0.1000,  0.067

var: tensor([[ 0.0551,  0.1016,  0.0515,  ...,  0.0845,  0.0805,  0.0654],
        [ 0.1528,  0.1767,  0.1084,  ...,  0.1918,  0.1378,  0.1447],
        [ 0.0488,  0.0788,  0.0603,  ...,  0.1101,  0.0578,  0.0629],
        ...,
        [ 0.0630,  0.0808,  0.0508,  ...,  0.1123,  0.0723,  0.0698],
        [ 0.0345,  0.0498,  0.0509,  ...,  0.0878,  0.0553,  0.0500],
        [ 0.0635,  0.0522,  0.0558,  ...,  0.0957,  0.0575,  0.0588]], device='cuda:0')
loss: 110.59707641601562
var: tensor([[ 0.0390,  0.0584,  0.0556,  ...,  0.0635,  0.0786,  0.0523],
        [ 0.0924,  0.0594,  0.0558,  ...,  0.1246,  0.0620,  0.0687],
        [ 0.1416,  0.2102,  0.0947,  ...,  0.1987,  0.1245,  0.1373],
        ...,
        [ 0.0298,  0.0425,  0.0450,  ...,  0.0472,  0.0779,  0.0482],
        [ 0.0732,  0.0415,  0.0494,  ...,  0.0709,  0.0384,  0.0486],
        [ 0.1212,  0.1407,  0.0781,  ...,  0.1903,  0.1244,  0.1176]], device='cuda:0')
loss: 107.58586883544922
var: tensor([[ 0.0586,  0.0587,  0.067

var: tensor([[ 0.0854,  0.1741,  0.0762,  ...,  0.1246,  0.0851,  0.0831],
        [ 0.0575,  0.0903,  0.0480,  ...,  0.0861,  0.0711,  0.0729],
        [ 0.0360,  0.0513,  0.0393,  ...,  0.0586,  0.0393,  0.0498],
        ...,
        [ 0.1203,  0.1042,  0.0746,  ...,  0.1208,  0.1128,  0.0770],
        [ 0.0431,  0.0666,  0.0464,  ...,  0.0470,  0.0853,  0.0582],
        [ 0.0568,  0.0938,  0.0472,  ...,  0.1031,  0.0658,  0.0844]], device='cuda:0')
loss: 109.83172607421875
var: tensor([[ 0.0466,  0.0758,  0.0583,  ...,  0.0921,  0.0644,  0.0846],
        [ 0.0485,  0.0713,  0.0804,  ...,  0.0628,  0.0488,  0.0481],
        [ 0.0587,  0.0773,  0.0486,  ...,  0.0806,  0.0744,  0.1061],
        ...,
        [ 0.0811,  0.0670,  0.0583,  ...,  0.0856,  0.0655,  0.0866],
        [ 0.0900,  0.0838,  0.0522,  ...,  0.1064,  0.0625,  0.0849],
        [ 0.1886,  0.1631,  0.0781,  ...,  0.1961,  0.1449,  0.1385]], device='cuda:0')
loss: 110.19145202636719
var: tensor([[ 0.0429,  0.0897,  0.051

loss: 108.35936737060547
var: tensor([[ 0.0420,  0.0663,  0.0464,  ...,  0.0813,  0.0445,  0.0741],
        [ 0.0550,  0.0606,  0.0656,  ...,  0.0696,  0.0579,  0.0620],
        [ 0.0386,  0.0596,  0.0469,  ...,  0.0704,  0.0569,  0.0810],
        ...,
        [ 0.0491,  0.0299,  0.0285,  ...,  0.0571,  0.0284,  0.0422],
        [ 0.0506,  0.0351,  0.0256,  ...,  0.0702,  0.0415,  0.0622],
        [ 0.1039,  0.0994,  0.0602,  ...,  0.1286,  0.0785,  0.0974]], device='cuda:0')
loss: 110.26141357421875
var: tensor([[ 0.0574,  0.0719,  0.0410,  ...,  0.0943,  0.0893,  0.0580],
        [ 0.0470,  0.0553,  0.0514,  ...,  0.0752,  0.0585,  0.0661],
        [ 0.0659,  0.0442,  0.0393,  ...,  0.0821,  0.0737,  0.0794],
        ...,
        [ 0.0529,  0.0818,  0.0698,  ...,  0.0813,  0.0593,  0.0660],
        [ 0.0360,  0.0386,  0.0413,  ...,  0.0747,  0.0686,  0.0853],
        [ 0.0741,  0.1294,  0.0594,  ...,  0.1278,  0.1000,  0.0828]], device='cuda:0')
loss: 110.4359130859375
var: tensor([[

var: tensor([[ 0.0478,  0.0608,  0.0371,  ...,  0.0947,  0.0731,  0.0836],
        [ 0.0667,  0.0851,  0.0465,  ...,  0.1147,  0.0875,  0.0429],
        [ 0.0512,  0.1974,  0.1580,  ...,  0.1583,  0.1277,  0.0933],
        ...,
        [ 0.1504,  0.1475,  0.0832,  ...,  0.1942,  0.1250,  0.1738],
        [ 0.0523,  0.0707,  0.0443,  ...,  0.0762,  0.0905,  0.0722],
        [ 0.1150,  0.0940,  0.0740,  ...,  0.1037,  0.0884,  0.0769]], device='cuda:0')
loss: 113.90997314453125
var: tensor([[ 0.0418,  0.0556,  0.0536,  ...,  0.0526,  0.0618,  0.0455],
        [ 0.0548,  0.0663,  0.0636,  ...,  0.0742,  0.0728,  0.0482],
        [ 0.0348,  0.0521,  0.0325,  ...,  0.0798,  0.0621,  0.0547],
        ...,
        [ 0.1317,  0.2126,  0.1047,  ...,  0.2015,  0.1429,  0.1750],
        [ 0.0440,  0.0488,  0.0350,  ...,  0.0625,  0.0533,  0.0533],
        [ 0.0323,  0.0591,  0.0409,  ...,  0.0759,  0.0697,  0.0600]], device='cuda:0')
loss: 111.57255554199219
var: tensor([[ 0.0496,  0.0741,  0.055

var: tensor([[ 0.0709,  0.0648,  0.0459,  ...,  0.0870,  0.0562,  0.0699],
        [ 0.0209,  0.0398,  0.0283,  ...,  0.0485,  0.0712,  0.0358],
        [ 0.0810,  0.0661,  0.0385,  ...,  0.0903,  0.0505,  0.0673],
        ...,
        [ 0.0853,  0.0946,  0.0454,  ...,  0.0862,  0.0852,  0.0769],
        [ 0.0857,  0.1001,  0.0522,  ...,  0.0959,  0.0839,  0.0960],
        [ 0.0790,  0.0483,  0.0380,  ...,  0.0918,  0.0464,  0.0656]], device='cuda:0')
loss: 108.53689575195312
var: tensor([[ 0.0607,  0.0942,  0.0410,  ...,  0.0851,  0.0814,  0.0669],
        [ 0.0324,  0.0531,  0.0390,  ...,  0.0646,  0.0701,  0.0404],
        [ 0.0588,  0.0627,  0.0358,  ...,  0.0832,  0.0564,  0.0610],
        ...,
        [ 0.0504,  0.0505,  0.0291,  ...,  0.0798,  0.0532,  0.0525],
        [ 0.0342,  0.0825,  0.0471,  ...,  0.0849,  0.0572,  0.0607],
        [ 0.0460,  0.0667,  0.0406,  ...,  0.0760,  0.0521,  0.0458]], device='cuda:0')
loss: 110.20054626464844
var: tensor([[ 0.0597,  0.0371,  0.027

var: tensor([[ 0.0554,  0.0564,  0.0493,  ...,  0.0914,  0.0689,  0.0881],
        [ 0.0588,  0.0849,  0.0457,  ...,  0.0835,  0.0676,  0.0820],
        [ 0.0444,  0.0381,  0.0313,  ...,  0.0539,  0.0465,  0.0618],
        ...,
        [ 0.0701,  0.0753,  0.0682,  ...,  0.0964,  0.0941,  0.0754],
        [ 0.0514,  0.0543,  0.0489,  ...,  0.0869,  0.0715,  0.0699],
        [ 0.0683,  0.0851,  0.0374,  ...,  0.1217,  0.1163,  0.0589]], device='cuda:0')
loss: 109.30279541015625
var: tensor([[ 0.0411,  0.0526,  0.0454,  ...,  0.0701,  0.1024,  0.0762],
        [ 0.1094,  0.2216,  0.1409,  ...,  0.1982,  0.1484,  0.1612],
        [ 0.0493,  0.1358,  0.1030,  ...,  0.1114,  0.1666,  0.1483],
        ...,
        [ 0.0542,  0.0513,  0.0454,  ...,  0.0752,  0.0664,  0.0612],
        [ 0.1723,  0.1816,  0.0991,  ...,  0.2189,  0.1743,  0.1637],
        [ 0.0497,  0.0731,  0.0456,  ...,  0.0816,  0.0648,  0.0709]], device='cuda:0')
loss: 107.08883666992188
var: tensor([[ 0.0911,  0.0818,  0.062

var: tensor([[ 0.0850,  0.0771,  0.0580,  ...,  0.1161,  0.1106,  0.1360],
        [ 0.0515,  0.0575,  0.0497,  ...,  0.0817,  0.0933,  0.0690],
        [ 0.0558,  0.0394,  0.0418,  ...,  0.0671,  0.0695,  0.0623],
        ...,
        [ 0.0740,  0.1038,  0.0741,  ...,  0.1089,  0.1139,  0.0948],
        [ 0.0711,  0.0567,  0.0411,  ...,  0.0924,  0.0958,  0.0903],
        [ 0.0394,  0.0622,  0.0530,  ...,  0.0949,  0.0934,  0.0874]], device='cuda:0')
loss: 107.95016479492188
var: tensor([[ 0.0712,  0.0858,  0.0473,  ...,  0.1055,  0.0949,  0.0769],
        [ 0.0630,  0.0524,  0.0478,  ...,  0.0854,  0.0840,  0.0944],
        [ 0.0298,  0.0474,  0.0351,  ...,  0.0612,  0.0754,  0.0588],
        ...,
        [ 0.0530,  0.0734,  0.0416,  ...,  0.0804,  0.1034,  0.0935],
        [ 0.0562,  0.0564,  0.0394,  ...,  0.0790,  0.0690,  0.0740],
        [ 0.0522,  0.1792,  0.1354,  ...,  0.1623,  0.1462,  0.1513]], device='cuda:0')
loss: 108.16997528076172
var: tensor([[ 0.0436,  0.0844,  0.085

var: tensor([[ 0.0395,  0.0499,  0.0421,  ...,  0.0659,  0.0703,  0.0540],
        [ 0.0379,  0.0429,  0.0472,  ...,  0.0633,  0.0642,  0.0660],
        [ 0.0504,  0.0460,  0.0326,  ...,  0.0618,  0.0627,  0.0609],
        ...,
        [ 0.0933,  0.0837,  0.0501,  ...,  0.0858,  0.0689,  0.0706],
        [ 0.0302,  0.0791,  0.0567,  ...,  0.0778,  0.0683,  0.0817],
        [ 0.0340,  0.0362,  0.0444,  ...,  0.0578,  0.0545,  0.0514]], device='cuda:0')
loss: 110.52682495117188
var: tensor([[ 0.0883,  0.1285,  0.0698,  ...,  0.0957,  0.1091,  0.0814],
        [ 0.1006,  0.0739,  0.0408,  ...,  0.0940,  0.0706,  0.0736],
        [ 0.0396,  0.0356,  0.0372,  ...,  0.0513,  0.0588,  0.0465],
        ...,
        [ 0.0741,  0.0608,  0.0364,  ...,  0.0889,  0.0846,  0.0470],
        [ 0.0401,  0.0456,  0.0391,  ...,  0.0815,  0.0702,  0.0780],
        [ 0.0867,  0.1178,  0.0530,  ...,  0.0856,  0.0758,  0.0814]], device='cuda:0')
loss: 108.43382263183594
var: tensor([[ 0.0334,  0.0486,  0.040

var: tensor([[ 0.1533,  0.1615,  0.0580,  ...,  0.1706,  0.1199,  0.1381],
        [ 0.0932,  0.1940,  0.1180,  ...,  0.1685,  0.1383,  0.2217],
        [ 0.0505,  0.0793,  0.0745,  ...,  0.0832,  0.0844,  0.0590],
        ...,
        [ 0.0348,  0.0452,  0.0242,  ...,  0.0641,  0.0404,  0.0493],
        [ 0.0301,  0.0576,  0.0391,  ...,  0.0739,  0.0560,  0.0562],
        [ 0.0725,  0.0658,  0.0417,  ...,  0.0918,  0.0711,  0.0593]], device='cuda:0')
loss: 110.02336120605469
var: tensor([[ 0.0334,  0.0567,  0.0297,  ...,  0.0838,  0.0482,  0.0624],
        [ 0.0335,  0.0457,  0.0357,  ...,  0.0611,  0.0523,  0.0516],
        [ 0.0493,  0.0768,  0.0317,  ...,  0.0843,  0.0594,  0.0654],
        ...,
        [ 0.0946,  0.1081,  0.0466,  ...,  0.1014,  0.0790,  0.0545],
        [ 0.0802,  0.0705,  0.0364,  ...,  0.0666,  0.0412,  0.0619],
        [ 0.0762,  0.1098,  0.0484,  ...,  0.1357,  0.0904,  0.0811]], device='cuda:0')
loss: 110.57672882080078
var: tensor([[ 0.0755,  0.0938,  0.055

loss: 108.59345245361328
var: tensor([[ 0.0653,  0.0833,  0.0473,  ...,  0.1253,  0.0735,  0.0698],
        [ 0.0933,  0.0639,  0.0478,  ...,  0.0998,  0.0625,  0.0776],
        [ 0.0974,  0.0974,  0.0526,  ...,  0.1032,  0.0838,  0.0797],
        ...,
        [ 0.0535,  0.0857,  0.0435,  ...,  0.0928,  0.0702,  0.1156],
        [ 0.0641,  0.0849,  0.0649,  ...,  0.0739,  0.0665,  0.0624],
        [ 0.0522,  0.0737,  0.0521,  ...,  0.0931,  0.0811,  0.0553]], device='cuda:0')
loss: 109.8223876953125
var: tensor([[ 0.0860,  0.0796,  0.0412,  ...,  0.1012,  0.0597,  0.0686],
        [ 0.0980,  0.0537,  0.0410,  ...,  0.0824,  0.0499,  0.0605],
        [ 0.0437,  0.0562,  0.0435,  ...,  0.0777,  0.0744,  0.0631],
        ...,
        [ 0.0343,  0.0388,  0.0432,  ...,  0.0661,  0.0603,  0.0444],
        [ 0.0876,  0.0711,  0.0389,  ...,  0.0820,  0.0472,  0.0707],
        [ 0.0561,  0.0517,  0.0402,  ...,  0.0689,  0.0804,  0.0453]], device='cuda:0')
loss: 110.23533630371094
var: tensor([[

var: tensor([[ 0.0613,  0.0885,  0.0427,  ...,  0.0917,  0.0683,  0.0603],
        [ 0.0423,  0.0644,  0.0505,  ...,  0.0689,  0.0567,  0.0621],
        [ 0.0490,  0.0744,  0.0336,  ...,  0.0661,  0.0573,  0.0571],
        ...,
        [ 0.0514,  0.1139,  0.0521,  ...,  0.1051,  0.0756,  0.0608],
        [ 0.1455,  0.0949,  0.0590,  ...,  0.0773,  0.0551,  0.0735],
        [ 0.0778,  0.1479,  0.0465,  ...,  0.0940,  0.1150,  0.0673]], device='cuda:0')
loss: 108.73172760009766
var: tensor([[ 0.0986,  0.0570,  0.0489,  ...,  0.0528,  0.0414,  0.0484],
        [ 0.0474,  0.0799,  0.0637,  ...,  0.0832,  0.0588,  0.0535],
        [ 0.0855,  0.1401,  0.0454,  ...,  0.1002,  0.0885,  0.0822],
        ...,
        [ 0.0670,  0.0757,  0.0634,  ...,  0.0683,  0.0630,  0.0551],
        [ 0.0783,  0.0638,  0.0614,  ...,  0.0608,  0.0498,  0.0653],
        [ 0.0562,  0.0905,  0.0522,  ...,  0.0668,  0.0842,  0.0546]], device='cuda:0')
loss: 104.32618713378906
var: tensor([[ 0.0880,  0.0682,  0.050

var: tensor([[ 0.0436,  0.0472,  0.0442,  ...,  0.0627,  0.0721,  0.0468],
        [ 0.0442,  0.0602,  0.0344,  ...,  0.0798,  0.0606,  0.0570],
        [ 0.0651,  0.0841,  0.0764,  ...,  0.0984,  0.0851,  0.0644],
        ...,
        [ 0.1313,  0.1114,  0.0578,  ...,  0.1149,  0.1070,  0.0756],
        [ 0.0619,  0.0902,  0.0774,  ...,  0.0605,  0.0698,  0.0641],
        [ 0.0775,  0.1010,  0.0389,  ...,  0.1123,  0.0844,  0.1090]], device='cuda:0')
loss: 108.38078308105469
var: tensor([[ 0.0270,  0.0650,  0.0380,  ...,  0.0551,  0.0554,  0.0510],
        [ 0.0760,  0.0479,  0.0364,  ...,  0.0604,  0.0471,  0.0567],
        [ 0.0698,  0.1543,  0.0939,  ...,  0.1378,  0.1317,  0.1559],
        ...,
        [ 0.0908,  0.0680,  0.0490,  ...,  0.0844,  0.0861,  0.0731],
        [ 0.0439,  0.0685,  0.0424,  ...,  0.0666,  0.0606,  0.0591],
        [ 0.0382,  0.0651,  0.0372,  ...,  0.0636,  0.0489,  0.0506]], device='cuda:0')
loss: 110.60246276855469
var: tensor([[ 0.0847,  0.0643,  0.059

var: tensor([[ 0.0447,  0.0784,  0.0599,  ...,  0.0672,  0.0745,  0.0717],
        [ 0.0417,  0.0689,  0.0355,  ...,  0.0725,  0.0641,  0.0732],
        [ 0.0987,  0.0865,  0.0581,  ...,  0.1091,  0.0811,  0.0681],
        ...,
        [ 0.0811,  0.0731,  0.0662,  ...,  0.0663,  0.0657,  0.0809],
        [ 0.0530,  0.0478,  0.0406,  ...,  0.0505,  0.0343,  0.0620],
        [ 0.0570,  0.0704,  0.0515,  ...,  0.0898,  0.0649,  0.0633]], device='cuda:0')
loss: 111.06135559082031
var: tensor([[ 0.0576,  0.1470,  0.1043,  ...,  0.1239,  0.1333,  0.1724],
        [ 0.0951,  0.0811,  0.0470,  ...,  0.0787,  0.0605,  0.0713],
        [ 0.0721,  0.0653,  0.0682,  ...,  0.0644,  0.0711,  0.0647],
        ...,
        [ 0.0397,  0.0528,  0.0378,  ...,  0.0648,  0.0639,  0.0695],
        [ 0.0472,  0.0568,  0.0411,  ...,  0.0762,  0.0551,  0.0700],
        [ 0.0631,  0.0892,  0.0643,  ...,  0.0837,  0.0731,  0.0679]], device='cuda:0')
loss: 109.01512145996094
var: tensor([[ 0.0550,  0.0705,  0.059

var: tensor([[ 0.0334,  0.0443,  0.0525,  ...,  0.0547,  0.0790,  0.0654],
        [ 0.0439,  0.0433,  0.0483,  ...,  0.0475,  0.0536,  0.0477],
        [ 0.0505,  0.0578,  0.0486,  ...,  0.0628,  0.0651,  0.0428],
        ...,
        [ 0.0336,  0.0484,  0.0554,  ...,  0.0690,  0.0495,  0.0455],
        [ 0.0526,  0.0945,  0.0889,  ...,  0.0671,  0.0758,  0.0772],
        [ 0.0588,  0.0513,  0.0668,  ...,  0.0509,  0.0483,  0.0787]], device='cuda:0')
loss: 113.32673645019531
var: tensor([[ 0.0521,  0.0624,  0.0518,  ...,  0.0869,  0.0770,  0.0797],
        [ 0.0463,  0.0591,  0.0527,  ...,  0.0599,  0.0681,  0.0648],
        [ 0.0734,  0.0741,  0.0696,  ...,  0.0861,  0.0745,  0.0784],
        ...,
        [ 0.0518,  0.1028,  0.0850,  ...,  0.0764,  0.0732,  0.0751],
        [ 0.0395,  0.0532,  0.0534,  ...,  0.0818,  0.0911,  0.0835],
        [ 0.0546,  0.0780,  0.0402,  ...,  0.0789,  0.0882,  0.0547]], device='cuda:0')
loss: 110.62776184082031
var: tensor([[ 0.0452,  0.0835,  0.069

var: tensor([[ 0.0829,  0.1273,  0.0735,  ...,  0.1189,  0.1137,  0.0989],
        [ 0.0607,  0.0848,  0.0538,  ...,  0.0772,  0.0929,  0.0822],
        [ 0.0694,  0.1718,  0.1091,  ...,  0.1479,  0.1301,  0.1557],
        ...,
        [ 0.0560,  0.0648,  0.0599,  ...,  0.0654,  0.0734,  0.0547],
        [ 0.0776,  0.0967,  0.0644,  ...,  0.0855,  0.0857,  0.0689],
        [ 0.0392,  0.0456,  0.0430,  ...,  0.0635,  0.0784,  0.0627]], device='cuda:0')
loss: 106.75596618652344
var: tensor([[ 0.0596,  0.1289,  0.1024,  ...,  0.0803,  0.0969,  0.0705],
        [ 0.0684,  0.0457,  0.0508,  ...,  0.0704,  0.0649,  0.0786],
        [ 0.0520,  0.0510,  0.0424,  ...,  0.0628,  0.0734,  0.0502],
        ...,
        [ 0.0520,  0.1280,  0.1049,  ...,  0.1149,  0.1551,  0.1148],
        [ 0.1618,  0.1373,  0.0756,  ...,  0.1497,  0.1548,  0.1623],
        [ 0.0335,  0.0706,  0.0447,  ...,  0.0551,  0.0579,  0.0572]], device='cuda:0')
loss: 107.69316864013672
var: tensor([[ 0.0630,  0.1709,  0.123

var: tensor([[ 0.0353,  0.0602,  0.0524,  ...,  0.0790,  0.0800,  0.0597],
        [ 0.0777,  0.0923,  0.0807,  ...,  0.1026,  0.1067,  0.0697],
        [ 0.0421,  0.0589,  0.0477,  ...,  0.0667,  0.0556,  0.0615],
        ...,
        [ 0.1357,  0.1709,  0.0723,  ...,  0.1784,  0.1539,  0.1554],
        [ 0.0593,  0.0551,  0.0392,  ...,  0.0796,  0.0568,  0.0637],
        [ 0.0484,  0.0721,  0.0473,  ...,  0.0793,  0.0635,  0.0664]], device='cuda:0')
loss: 109.62332153320312
var: tensor([[ 0.0620,  0.0744,  0.0431,  ...,  0.0901,  0.0694,  0.0659],
        [ 0.1155,  0.1193,  0.0631,  ...,  0.1271,  0.1113,  0.1044],
        [ 0.0460,  0.0536,  0.0458,  ...,  0.0733,  0.0436,  0.0754],
        ...,
        [ 0.0499,  0.0432,  0.0370,  ...,  0.0557,  0.0344,  0.0749],
        [ 0.0438,  0.0593,  0.0416,  ...,  0.0866,  0.0792,  0.0579],
        [ 0.1411,  0.1271,  0.0936,  ...,  0.1574,  0.0880,  0.1284]], device='cuda:0')
loss: 108.64727783203125
var: tensor([[ 0.0339,  0.0423,  0.034

var: tensor([[ 0.0568,  0.0510,  0.0525,  ...,  0.0687,  0.0661,  0.0716],
        [ 0.0681,  0.0605,  0.0571,  ...,  0.0719,  0.0652,  0.0727],
        [ 0.0448,  0.0653,  0.0609,  ...,  0.0723,  0.0819,  0.0725],
        ...,
        [ 0.0416,  0.0753,  0.0514,  ...,  0.0712,  0.0465,  0.0640],
        [ 0.0401,  0.1358,  0.1203,  ...,  0.1346,  0.1055,  0.1443],
        [ 0.0725,  0.0879,  0.0534,  ...,  0.0893,  0.0764,  0.0766]], device='cuda:0')
loss: 104.92214965820312
var: tensor([[ 0.0416,  0.0662,  0.0619,  ...,  0.0647,  0.0656,  0.0870],
        [ 0.0416,  0.0452,  0.0454,  ...,  0.0568,  0.0590,  0.0758],
        [ 0.0491,  0.0546,  0.0512,  ...,  0.0849,  0.0682,  0.0737],
        ...,
        [ 0.1648,  0.1870,  0.0961,  ...,  0.2118,  0.1591,  0.1742],
        [ 0.0450,  0.0816,  0.0528,  ...,  0.0886,  0.0845,  0.1303],
        [ 0.0390,  0.0353,  0.0365,  ...,  0.0417,  0.0381,  0.0634]], device='cuda:0')
loss: 105.6235122680664
var: tensor([[ 0.0366,  0.0557,  0.0521

var: tensor([[ 0.0302,  0.0452,  0.0193,  ...,  0.0529,  0.0497,  0.0401],
        [ 0.0214,  0.0474,  0.0289,  ...,  0.0339,  0.0754,  0.0385],
        [ 0.0355,  0.0643,  0.0247,  ...,  0.0454,  0.0460,  0.0445],
        ...,
        [ 0.0366,  0.0477,  0.0289,  ...,  0.0485,  0.0551,  0.0408],
        [ 0.0840,  0.1184,  0.0688,  ...,  0.1236,  0.0895,  0.0864],
        [ 0.0457,  0.0896,  0.0508,  ...,  0.0610,  0.0636,  0.0675]], device='cuda:0')
loss: 110.02686309814453
var: tensor([[ 0.0344,  0.0822,  0.0400,  ...,  0.0636,  0.0694,  0.0888],
        [ 0.0616,  0.1012,  0.0363,  ...,  0.1016,  0.0782,  0.0664],
        [ 0.0225,  0.0466,  0.0272,  ...,  0.0308,  0.0611,  0.0354],
        ...,
        [ 0.0648,  0.0854,  0.0450,  ...,  0.0864,  0.0714,  0.0651],
        [ 0.0467,  0.1144,  0.0520,  ...,  0.0805,  0.0661,  0.0819],
        [ 0.0422,  0.0840,  0.0469,  ...,  0.0709,  0.0602,  0.0571]], device='cuda:0')
loss: 110.1129150390625
var: tensor([[ 0.0510,  0.0772,  0.0588

var: tensor([[ 0.0735,  0.1177,  0.0482,  ...,  0.1084,  0.1058,  0.0893],
        [ 0.0660,  0.1216,  0.0535,  ...,  0.1120,  0.1216,  0.0887],
        [ 0.0599,  0.1759,  0.1479,  ...,  0.1643,  0.1998,  0.2037],
        ...,
        [ 0.0729,  0.0816,  0.0484,  ...,  0.0934,  0.0797,  0.0901],
        [ 0.0843,  0.0780,  0.0594,  ...,  0.1005,  0.0891,  0.0738],
        [ 0.0494,  0.0839,  0.0565,  ...,  0.0998,  0.0812,  0.0742]], device='cuda:0')
loss: 107.02304077148438
var: tensor([[ 0.0878,  0.1093,  0.0527,  ...,  0.0845,  0.0892,  0.0770],
        [ 0.1619,  0.1556,  0.0857,  ...,  0.1839,  0.1442,  0.1294],
        [ 0.0994,  0.1128,  0.0520,  ...,  0.1001,  0.1133,  0.0895],
        ...,
        [ 0.0759,  0.0574,  0.0397,  ...,  0.0781,  0.0838,  0.0625],
        [ 0.1554,  0.1909,  0.0923,  ...,  0.1831,  0.1572,  0.1477],
        [ 0.0535,  0.0563,  0.0407,  ...,  0.0762,  0.0688,  0.0587]], device='cuda:0')
loss: 106.87799072265625
var: tensor([[ 0.0544,  0.0884,  0.054

var: tensor([[ 0.0565,  0.0459,  0.0342,  ...,  0.0582,  0.0579,  0.0663],
        [ 0.1095,  0.1289,  0.0760,  ...,  0.1411,  0.0866,  0.1154],
        [ 0.0397,  0.0498,  0.0277,  ...,  0.0666,  0.0455,  0.0622],
        ...,
        [ 0.0459,  0.0411,  0.0287,  ...,  0.0442,  0.0454,  0.0516],
        [ 0.0501,  0.0453,  0.0251,  ...,  0.0477,  0.0377,  0.0433],
        [ 0.0392,  0.0445,  0.0465,  ...,  0.0583,  0.0476,  0.0684]], device='cuda:0')
loss: 108.89205932617188
var: tensor([[ 0.0349,  0.0520,  0.0312,  ...,  0.0534,  0.0390,  0.0499],
        [ 0.0935,  0.0652,  0.0377,  ...,  0.0896,  0.0589,  0.0821],
        [ 0.0263,  0.0324,  0.0345,  ...,  0.0389,  0.0553,  0.0438],
        ...,
        [ 0.0244,  0.0346,  0.0299,  ...,  0.0372,  0.0636,  0.0555],
        [ 0.0458,  0.0534,  0.0290,  ...,  0.0570,  0.0359,  0.0508],
        [ 0.0660,  0.1123,  0.0382,  ...,  0.1003,  0.0910,  0.0737]], device='cuda:0')
loss: 108.59378051757812
var: tensor([[ 0.0491,  0.1194,  0.103

var: tensor([[ 0.0330,  0.0459,  0.0357,  ...,  0.0545,  0.0781,  0.0370],
        [ 0.0551,  0.0599,  0.0401,  ...,  0.0900,  0.0698,  0.0581],
        [ 0.0563,  0.0737,  0.0500,  ...,  0.0896,  0.0784,  0.0527],
        ...,
        [ 0.0465,  0.0429,  0.0288,  ...,  0.0496,  0.0518,  0.0581],
        [ 0.0448,  0.0528,  0.0414,  ...,  0.0687,  0.0684,  0.0478],
        [ 0.0440,  0.0574,  0.0567,  ...,  0.0741,  0.0944,  0.0578]], device='cuda:0')
loss: 112.4071273803711
var: tensor([[ 0.1398,  0.1101,  0.0765,  ...,  0.1589,  0.1287,  0.1070],
        [ 0.0387,  0.0446,  0.0581,  ...,  0.0791,  0.0846,  0.0564],
        [ 0.0615,  0.0561,  0.0318,  ...,  0.0745,  0.0565,  0.0504],
        ...,
        [ 0.0503,  0.0476,  0.0419,  ...,  0.0607,  0.0809,  0.0512],
        [ 0.0448,  0.0621,  0.0661,  ...,  0.0619,  0.1103,  0.0510],
        [ 0.0445,  0.0437,  0.0471,  ...,  0.0640,  0.1159,  0.0693]], device='cuda:0')
loss: 112.33026123046875
var: tensor([[ 0.0366,  0.0515,  0.0492

var: tensor([[ 0.0364,  0.0734,  0.0512,  ...,  0.0791,  0.0615,  0.0655],
        [ 0.0499,  0.1119,  0.0459,  ...,  0.1012,  0.0941,  0.0789],
        [ 0.0771,  0.0905,  0.0623,  ...,  0.1056,  0.0864,  0.0730],
        ...,
        [ 0.0635,  0.0713,  0.0524,  ...,  0.1006,  0.0685,  0.0689],
        [ 0.0479,  0.0494,  0.0387,  ...,  0.0562,  0.0800,  0.0444],
        [ 0.0347,  0.0466,  0.0313,  ...,  0.0558,  0.0499,  0.0437]], device='cuda:0')
loss: 109.36404418945312
var: tensor([[ 0.0300,  0.0454,  0.0410,  ...,  0.0514,  0.0583,  0.0461],
        [ 0.0595,  0.1332,  0.0866,  ...,  0.1048,  0.0690,  0.0769],
        [ 0.0533,  0.0916,  0.0474,  ...,  0.1051,  0.0799,  0.0776],
        ...,
        [ 0.0867,  0.0498,  0.0666,  ...,  0.0855,  0.0512,  0.0832],
        [ 0.0434,  0.0707,  0.0507,  ...,  0.0983,  0.0566,  0.0604],
        [ 0.0287,  0.0423,  0.0313,  ...,  0.0489,  0.0330,  0.0404]], device='cuda:0')
loss: 111.11650848388672
var: tensor([[ 0.0367,  0.0562,  0.038

var: tensor([[ 0.0579,  0.0605,  0.0505,  ...,  0.0644,  0.0523,  0.0490],
        [ 0.0391,  0.0707,  0.0483,  ...,  0.0811,  0.0411,  0.0518],
        [ 0.1054,  0.0676,  0.0501,  ...,  0.0924,  0.0713,  0.0753],
        ...,
        [ 0.0444,  0.0654,  0.0388,  ...,  0.0704,  0.0783,  0.0751],
        [ 0.0386,  0.0768,  0.0558,  ...,  0.0638,  0.0605,  0.0515],
        [ 0.0418,  0.0510,  0.0308,  ...,  0.0615,  0.0591,  0.0349]], device='cuda:0')
loss: 111.26844787597656
var: tensor([[ 0.0523,  0.0714,  0.0389,  ...,  0.0766,  0.0480,  0.0619],
        [ 0.0865,  0.0620,  0.0552,  ...,  0.0962,  0.0552,  0.0740],
        [ 0.0481,  0.0784,  0.0479,  ...,  0.0720,  0.0627,  0.0720],
        ...,
        [ 0.0465,  0.0777,  0.0323,  ...,  0.0788,  0.0560,  0.0626],
        [ 0.0823,  0.0913,  0.0639,  ...,  0.1051,  0.0688,  0.0607],
        [ 0.0489,  0.0584,  0.0458,  ...,  0.0602,  0.0709,  0.0566]], device='cuda:0')
loss: 110.47630310058594
var: tensor([[ 0.0475,  0.0724,  0.063

var: tensor([[ 0.0711,  0.0707,  0.0401,  ...,  0.1250,  0.0852,  0.0686],
        [ 0.0423,  0.0453,  0.0426,  ...,  0.0616,  0.0406,  0.0496],
        [ 0.0483,  0.0455,  0.0363,  ...,  0.0512,  0.0469,  0.0598],
        ...,
        [ 0.0486,  0.0545,  0.0321,  ...,  0.0766,  0.0798,  0.0587],
        [ 0.0572,  0.0576,  0.0401,  ...,  0.0793,  0.0570,  0.0565],
        [ 0.0364,  0.0451,  0.0275,  ...,  0.0426,  0.0570,  0.0651]], device='cuda:0')
loss: 110.7046127319336
var: tensor([[ 0.0894,  0.0739,  0.0546,  ...,  0.1014,  0.0769,  0.0754],
        [ 0.0630,  0.0913,  0.0553,  ...,  0.1077,  0.0925,  0.0839],
        [ 0.0432,  0.0588,  0.0438,  ...,  0.0600,  0.0673,  0.0498],
        ...,
        [ 0.0824,  0.1050,  0.0393,  ...,  0.1222,  0.0828,  0.1074],
        [ 0.0771,  0.0558,  0.0436,  ...,  0.0759,  0.0495,  0.0671],
        [ 0.0565,  0.0488,  0.0417,  ...,  0.0804,  0.0655,  0.0964]], device='cuda:0')
loss: 109.13894653320312
var: tensor([[ 0.0630,  0.0648,  0.0483

var: tensor([[ 0.0294,  0.0355,  0.0282,  ...,  0.0436,  0.0357,  0.0455],
        [ 0.0845,  0.0611,  0.0404,  ...,  0.0776,  0.0495,  0.0702],
        [ 0.0466,  0.0504,  0.0412,  ...,  0.0714,  0.0818,  0.0617],
        ...,
        [ 0.0794,  0.0833,  0.0518,  ...,  0.1223,  0.0743,  0.0726],
        [ 0.0525,  0.2072,  0.1381,  ...,  0.1970,  0.1538,  0.1752],
        [ 0.0972,  0.0787,  0.0759,  ...,  0.1088,  0.0573,  0.0892]], device='cuda:0')
loss: 111.1264877319336
var: tensor([[ 0.0550,  0.1064,  0.0734,  ...,  0.0858,  0.0624,  0.0651],
        [ 0.0414,  0.0582,  0.0400,  ...,  0.0707,  0.0439,  0.0520],
        [ 0.0479,  0.0769,  0.0501,  ...,  0.0775,  0.0653,  0.0583],
        ...,
        [ 0.0394,  0.0449,  0.0386,  ...,  0.0687,  0.0511,  0.0598],
        [ 0.1670,  0.1728,  0.0795,  ...,  0.1967,  0.1265,  0.1800],
        [ 0.0436,  0.0681,  0.0483,  ...,  0.0788,  0.0605,  0.0694]], device='cuda:0')
loss: 109.16954803466797
var: tensor([[ 0.0555,  0.0641,  0.0391

var: tensor([[ 0.0490,  0.0745,  0.0387,  ...,  0.0859,  0.0783,  0.0661],
        [ 0.0361,  0.0556,  0.0554,  ...,  0.0487,  0.0669,  0.0433],
        [ 0.0529,  0.0962,  0.0680,  ...,  0.0911,  0.0833,  0.0689],
        ...,
        [ 0.0969,  0.0509,  0.0450,  ...,  0.0556,  0.0617,  0.0728],
        [ 0.1972,  0.1752,  0.1049,  ...,  0.2773,  0.1876,  0.1864],
        [ 0.0550,  0.0484,  0.0246,  ...,  0.0585,  0.0486,  0.0673]], device='cuda:0')
loss: 105.25686645507812
var: tensor([[ 0.0577,  0.0529,  0.0303,  ...,  0.0784,  0.0688,  0.0436],
        [ 0.0946,  0.0820,  0.0597,  ...,  0.1044,  0.0781,  0.0919],
        [ 0.0576,  0.0956,  0.0461,  ...,  0.1258,  0.1282,  0.0824],
        ...,
        [ 0.0745,  0.1054,  0.0462,  ...,  0.1164,  0.1223,  0.0721],
        [ 0.1036,  0.1122,  0.0514,  ...,  0.1460,  0.1458,  0.0970],
        [ 0.1869,  0.1612,  0.0826,  ...,  0.2318,  0.1653,  0.1960]], device='cuda:0')
loss: 103.98670196533203
var: tensor([[ 0.0402,  0.0569,  0.038

var: tensor([[ 0.0650,  0.0808,  0.0443,  ...,  0.0707,  0.0967,  0.0529],
        [ 0.0669,  0.1115,  0.0413,  ...,  0.1048,  0.0628,  0.0734],
        [ 0.1208,  0.1209,  0.0535,  ...,  0.1493,  0.1092,  0.0954],
        ...,
        [ 0.1647,  0.1508,  0.0820,  ...,  0.2008,  0.1354,  0.1220],
        [ 0.0605,  0.1989,  0.1576,  ...,  0.1875,  0.1300,  0.1036],
        [ 0.1467,  0.1512,  0.1159,  ...,  0.2015,  0.1165,  0.1490]], device='cuda:0')
loss: 106.46163940429688
var: tensor([[ 0.0346,  0.0521,  0.0376,  ...,  0.0912,  0.0759,  0.0691],
        [ 0.0357,  0.0479,  0.0327,  ...,  0.0457,  0.0894,  0.0461],
        [ 0.0304,  0.0438,  0.0347,  ...,  0.0548,  0.0723,  0.0388],
        ...,
        [ 0.0514,  0.0665,  0.0437,  ...,  0.0508,  0.0741,  0.0407],
        [ 0.0979,  0.0682,  0.0446,  ...,  0.0927,  0.0557,  0.0841],
        [ 0.0483,  0.0644,  0.0498,  ...,  0.0848,  0.0525,  0.0801]], device='cuda:0')
loss: 108.39611053466797
var: tensor([[ 0.0793,  0.2336,  0.154

var: tensor([[ 0.0551,  0.0674,  0.0551,  ...,  0.0925,  0.0652,  0.0709],
        [ 0.0402,  0.0422,  0.0461,  ...,  0.0771,  0.0528,  0.0435],
        [ 0.0732,  0.0535,  0.0353,  ...,  0.0683,  0.0411,  0.0667],
        ...,
        [ 0.0842,  0.0954,  0.0654,  ...,  0.1056,  0.0794,  0.0633],
        [ 0.0395,  0.0623,  0.0452,  ...,  0.0584,  0.0626,  0.0397],
        [ 0.0244,  0.0408,  0.0306,  ...,  0.0390,  0.0421,  0.0365]], device='cuda:0')
loss: 110.17521667480469
var: tensor([[ 0.0873,  0.0660,  0.0582,  ...,  0.1153,  0.0509,  0.1106],
        [ 0.0299,  0.0669,  0.0426,  ...,  0.0660,  0.0483,  0.0462],
        [ 0.0370,  0.0567,  0.0432,  ...,  0.0630,  0.0685,  0.0504],
        ...,
        [ 0.0309,  0.0575,  0.0437,  ...,  0.0730,  0.0638,  0.0752],
        [ 0.0416,  0.0355,  0.0326,  ...,  0.0485,  0.0391,  0.0357],
        [ 0.0384,  0.0556,  0.0358,  ...,  0.1010,  0.0511,  0.0708]], device='cuda:0')
loss: 104.59062194824219
var: tensor([[ 0.1018,  0.0591,  0.040

var: tensor([[ 0.2256,  0.1564,  0.0902,  ...,  0.2373,  0.1449,  0.2117],
        [ 0.0710,  0.1691,  0.1238,  ...,  0.1685,  0.0912,  0.1133],
        [ 0.0882,  0.0741,  0.0491,  ...,  0.0939,  0.0549,  0.0645],
        ...,
        [ 0.0442,  0.0438,  0.0317,  ...,  0.0716,  0.0546,  0.0674],
        [ 0.0524,  0.1751,  0.1396,  ...,  0.1684,  0.1022,  0.0925],
        [ 0.0450,  0.0581,  0.0421,  ...,  0.0553,  0.0592,  0.0897]], device='cuda:0')
loss: 105.57784271240234
var: tensor([[ 0.0410,  0.0537,  0.0318,  ...,  0.0672,  0.0501,  0.0398],
        [ 0.0495,  0.0573,  0.0426,  ...,  0.0803,  0.0547,  0.0541],
        [ 0.0829,  0.0861,  0.0477,  ...,  0.1086,  0.0664,  0.0834],
        ...,
        [ 0.0350,  0.0461,  0.0324,  ...,  0.0619,  0.0436,  0.0612],
        [ 0.0531,  0.0620,  0.0418,  ...,  0.0524,  0.0551,  0.0427],
        [ 0.0718,  0.0799,  0.0530,  ...,  0.1004,  0.0620,  0.0715]], device='cuda:0')
loss: 109.78619384765625
var: tensor([[ 0.1315,  0.0883,  0.058

var: tensor([[ 0.0310,  0.0474,  0.0452,  ...,  0.0414,  0.0723,  0.0561],
        [ 0.0386,  0.0612,  0.0346,  ...,  0.0448,  0.0464,  0.0445],
        [ 0.0441,  0.0550,  0.0555,  ...,  0.0386,  0.0812,  0.0404],
        ...,
        [ 0.0564,  0.0909,  0.0606,  ...,  0.0615,  0.0587,  0.0610],
        [ 0.1318,  0.1342,  0.0637,  ...,  0.1553,  0.1148,  0.1290],
        [ 0.0699,  0.0476,  0.0376,  ...,  0.0751,  0.0612,  0.0691]], device='cuda:0')
loss: 108.35425567626953
var: tensor([[ 0.0372,  0.0421,  0.0449,  ...,  0.0523,  0.0674,  0.0621],
        [ 0.0328,  0.0587,  0.0478,  ...,  0.0625,  0.0588,  0.0430],
        [ 0.0444,  0.0671,  0.0560,  ...,  0.0674,  0.0664,  0.0687],
        ...,
        [ 0.0636,  0.0956,  0.0551,  ...,  0.0835,  0.1026,  0.0629],
        [ 0.0745,  0.0676,  0.0426,  ...,  0.1197,  0.0866,  0.0620],
        [ 0.0398,  0.0778,  0.0476,  ...,  0.0519,  0.0610,  0.0583]], device='cuda:0')
loss: 111.39003499348958
====> Epoch: 6 Average loss: 108.7701


loss: 108.71510314941406
var: tensor([[ 0.0476,  0.0694,  0.0394,  ...,  0.0680,  0.0669,  0.0614],
        [ 0.0600,  0.0895,  0.0831,  ...,  0.0592,  0.0861,  0.0545],
        [ 0.0508,  0.0553,  0.0399,  ...,  0.0810,  0.0471,  0.0542],
        ...,
        [ 0.1021,  0.0792,  0.0500,  ...,  0.0982,  0.0783,  0.0662],
        [ 0.0615,  0.1230,  0.0565,  ...,  0.0748,  0.1000,  0.0745],
        [ 0.0430,  0.0786,  0.0652,  ...,  0.1044,  0.0685,  0.0736]], device='cuda:0')
loss: 107.5784912109375
var: tensor([[ 0.1083,  0.0726,  0.0599,  ...,  0.0924,  0.0855,  0.0813],
        [ 0.1293,  0.0670,  0.0633,  ...,  0.0879,  0.0831,  0.0625],
        [ 0.0704,  0.0569,  0.0439,  ...,  0.0968,  0.0711,  0.1195],
        ...,
        [ 0.0444,  0.0379,  0.0284,  ...,  0.0536,  0.0547,  0.0322],
        [ 0.0452,  0.1551,  0.1388,  ...,  0.1353,  0.1582,  0.1632],
        [ 0.0340,  0.0486,  0.0486,  ...,  0.0611,  0.0529,  0.0463]], device='cuda:0')
loss: 103.96499633789062
var: tensor([[

var: tensor([[ 0.0530,  0.1211,  0.0639,  ...,  0.0838,  0.0738,  0.0603],
        [ 0.0480,  0.0721,  0.0405,  ...,  0.0670,  0.0708,  0.0628],
        [ 0.0347,  0.0549,  0.0343,  ...,  0.0752,  0.0508,  0.0485],
        ...,
        [ 0.0829,  0.0940,  0.0603,  ...,  0.0934,  0.0769,  0.0565],
        [ 0.0500,  0.0758,  0.0462,  ...,  0.0864,  0.0792,  0.0499],
        [ 0.0387,  0.0635,  0.0453,  ...,  0.0682,  0.0736,  0.0506]], device='cuda:0')
loss: 103.78857421875
var: tensor([[ 0.0668,  0.1331,  0.0906,  ...,  0.0983,  0.0879,  0.0830],
        [ 0.0679,  0.1465,  0.0702,  ...,  0.1318,  0.1124,  0.0830],
        [ 0.0307,  0.0448,  0.0240,  ...,  0.0790,  0.0866,  0.0648],
        ...,
        [ 0.0786,  0.1114,  0.0624,  ...,  0.1480,  0.1296,  0.0862],
        [ 0.0468,  0.0814,  0.0584,  ...,  0.0975,  0.0633,  0.0698],
        [ 0.0759,  0.0617,  0.0449,  ...,  0.0884,  0.0645,  0.0798]], device='cuda:0')
loss: 106.31603240966797
var: tensor([[ 0.0580,  0.0771,  0.0555, 

var: tensor([[ 0.0490,  0.0515,  0.0515,  ...,  0.0719,  0.0711,  0.0531],
        [ 0.2094,  0.1223,  0.0961,  ...,  0.2136,  0.1429,  0.1835],
        [ 0.0665,  0.0912,  0.0539,  ...,  0.0954,  0.0785,  0.0687],
        ...,
        [ 0.1068,  0.1090,  0.0573,  ...,  0.1154,  0.1112,  0.0749],
        [ 0.0889,  0.0868,  0.0469,  ...,  0.0900,  0.0852,  0.0679],
        [ 0.1232,  0.1758,  0.0813,  ...,  0.1577,  0.0996,  0.1353]], device='cuda:0')
loss: 110.75684356689453
var: tensor([[ 0.0680,  0.0763,  0.0658,  ...,  0.0831,  0.0858,  0.0840],
        [ 0.0806,  0.0739,  0.0341,  ...,  0.0932,  0.0792,  0.0968],
        [ 0.0586,  0.0632,  0.0440,  ...,  0.0772,  0.0632,  0.0497],
        ...,
        [ 0.0287,  0.0444,  0.0297,  ...,  0.0637,  0.0651,  0.0697],
        [ 0.0612,  0.0975,  0.0854,  ...,  0.0760,  0.1081,  0.0635],
        [ 0.0246,  0.0310,  0.0275,  ...,  0.0410,  0.0436,  0.0497]], device='cuda:0')
loss: 109.83828735351562
var: tensor([[ 0.0656,  0.1118,  0.045

var: tensor([[ 0.0317,  0.0542,  0.0419,  ...,  0.0686,  0.0607,  0.0512],
        [ 0.0594,  0.0644,  0.0426,  ...,  0.0866,  0.0577,  0.0591],
        [ 0.0978,  0.0910,  0.0552,  ...,  0.1099,  0.0986,  0.0865],
        ...,
        [ 0.0962,  0.0839,  0.0428,  ...,  0.1243,  0.1081,  0.0833],
        [ 0.1118,  0.1473,  0.0936,  ...,  0.1845,  0.1245,  0.1806],
        [ 0.0993,  0.0857,  0.0518,  ...,  0.0887,  0.0999,  0.0708]], device='cuda:0')
loss: 109.55985260009766
var: tensor([[ 0.0387,  0.0515,  0.0652,  ...,  0.0817,  0.0643,  0.0448],
        [ 0.0559,  0.0478,  0.0339,  ...,  0.0675,  0.0589,  0.0540],
        [ 0.0946,  0.1002,  0.0614,  ...,  0.1167,  0.1147,  0.0880],
        ...,
        [ 0.0620,  0.0982,  0.1042,  ...,  0.0977,  0.0852,  0.0973],
        [ 0.0358,  0.0360,  0.0299,  ...,  0.0577,  0.0519,  0.0434],
        [ 0.0742,  0.0909,  0.0475,  ...,  0.0985,  0.1036,  0.0756]], device='cuda:0')
loss: 110.52667236328125
var: tensor([[ 0.0810,  0.0483,  0.042

var: tensor([[ 0.0857,  0.0688,  0.0547,  ...,  0.1293,  0.0739,  0.0948],
        [ 0.0945,  0.0771,  0.0475,  ...,  0.1067,  0.0793,  0.0698],
        [ 0.0418,  0.1269,  0.0672,  ...,  0.1463,  0.0814,  0.1346],
        ...,
        [ 0.0494,  0.0632,  0.0438,  ...,  0.0906,  0.0603,  0.0671],
        [ 0.0320,  0.0436,  0.0389,  ...,  0.0632,  0.0477,  0.0534],
        [ 0.0366,  0.0633,  0.0817,  ...,  0.0882,  0.0586,  0.0597]], device='cuda:0')
loss: 108.31442260742188
var: tensor([[ 0.0511,  0.0997,  0.0449,  ...,  0.0869,  0.0744,  0.0851],
        [ 0.0259,  0.0733,  0.0482,  ...,  0.0798,  0.0427,  0.0673],
        [ 0.0645,  0.1324,  0.0476,  ...,  0.1320,  0.1091,  0.0828],
        ...,
        [ 0.0695,  0.1202,  0.0554,  ...,  0.1323,  0.1332,  0.0992],
        [ 0.0368,  0.0475,  0.0460,  ...,  0.0579,  0.0565,  0.0654],
        [ 0.0496,  0.0776,  0.0502,  ...,  0.0816,  0.0601,  0.0750]], device='cuda:0')
loss: 110.16172790527344
var: tensor([[ 0.0300,  0.0490,  0.043

var: tensor([[ 0.0478,  0.0481,  0.0403,  ...,  0.0785,  0.0617,  0.0451],
        [ 0.0811,  0.1051,  0.0501,  ...,  0.0918,  0.0832,  0.0740],
        [ 0.0855,  0.1934,  0.0994,  ...,  0.1626,  0.1300,  0.1821],
        ...,
        [ 0.1655,  0.1984,  0.0797,  ...,  0.2237,  0.1794,  0.1647],
        [ 0.0902,  0.0736,  0.0564,  ...,  0.1074,  0.0787,  0.0681],
        [ 0.0608,  0.0571,  0.0374,  ...,  0.0772,  0.0538,  0.0656]], device='cuda:0')
loss: 108.36398315429688
var: tensor([[ 0.0745,  0.1278,  0.0472,  ...,  0.1113,  0.1226,  0.0704],
        [ 0.0631,  0.0954,  0.0409,  ...,  0.0878,  0.0958,  0.0691],
        [ 0.0444,  0.0678,  0.0728,  ...,  0.0934,  0.0829,  0.0565],
        ...,
        [ 0.0379,  0.0442,  0.0351,  ...,  0.0652,  0.0819,  0.0728],
        [ 0.0615,  0.0741,  0.0460,  ...,  0.0577,  0.0580,  0.0615],
        [ 0.0930,  0.0849,  0.0619,  ...,  0.1009,  0.1034,  0.0653]], device='cuda:0')
loss: 105.50724792480469
var: tensor([[ 0.0552,  0.0832,  0.053

var: tensor([[ 0.0763,  0.1813,  0.1030,  ...,  0.1747,  0.1284,  0.1732],
        [ 0.0862,  0.1972,  0.1133,  ...,  0.1710,  0.1153,  0.1603],
        [ 0.0918,  0.1309,  0.0370,  ...,  0.1061,  0.1101,  0.0676],
        ...,
        [ 0.0536,  0.1342,  0.1308,  ...,  0.1411,  0.1305,  0.1169],
        [ 0.0684,  0.0818,  0.0367,  ...,  0.0750,  0.0677,  0.0585],
        [ 0.0535,  0.0805,  0.0564,  ...,  0.0888,  0.0919,  0.0767]], device='cuda:0')
loss: 100.81494140625
var: tensor([[ 0.0421,  0.0454,  0.0364,  ...,  0.0504,  0.0477,  0.0444],
        [ 0.0512,  0.0882,  0.0529,  ...,  0.0786,  0.0734,  0.0690],
        [ 0.0505,  0.0735,  0.0484,  ...,  0.0563,  0.0527,  0.0462],
        ...,
        [ 0.0587,  0.0946,  0.0557,  ...,  0.0697,  0.0663,  0.0565],
        [ 0.0455,  0.0887,  0.0589,  ...,  0.0913,  0.0687,  0.0811],
        [ 0.0360,  0.0394,  0.0358,  ...,  0.0485,  0.0445,  0.0480]], device='cuda:0')
loss: 108.72848510742188
var: tensor([[ 0.0518,  0.0569,  0.0397, 

var: tensor([[ 0.0924,  0.0713,  0.0488,  ...,  0.1018,  0.0625,  0.0880],
        [ 0.0294,  0.0458,  0.0316,  ...,  0.0503,  0.0447,  0.0571],
        [ 0.0918,  0.1419,  0.0617,  ...,  0.1650,  0.0976,  0.1156],
        ...,
        [ 0.0722,  0.0930,  0.0711,  ...,  0.1009,  0.0852,  0.0657],
        [ 0.0302,  0.0524,  0.0384,  ...,  0.0591,  0.0588,  0.0541],
        [ 0.0584,  0.1072,  0.0522,  ...,  0.0830,  0.0888,  0.0679]], device='cuda:0')
loss: 105.8228759765625
var: tensor([[ 0.1254,  0.0942,  0.0620,  ...,  0.1086,  0.0792,  0.0803],
        [ 0.0444,  0.0597,  0.0428,  ...,  0.0589,  0.0474,  0.0575],
        [ 0.0401,  0.0649,  0.0448,  ...,  0.0689,  0.0616,  0.0630],
        ...,
        [ 0.0501,  0.0888,  0.0613,  ...,  0.0937,  0.0691,  0.0804],
        [ 0.0473,  0.0654,  0.0437,  ...,  0.0570,  0.0652,  0.0562],
        [ 0.0283,  0.0392,  0.0337,  ...,  0.0470,  0.0652,  0.0510]], device='cuda:0')
loss: 108.91632080078125
var: tensor([[ 0.0435,  0.0566,  0.0406

var: tensor([[ 0.0411,  0.0381,  0.0356,  ...,  0.0385,  0.0415,  0.0650],
        [ 0.0408,  0.0555,  0.0337,  ...,  0.0460,  0.0328,  0.0409],
        [ 0.0366,  0.0520,  0.0436,  ...,  0.0388,  0.0395,  0.0481],
        ...,
        [ 0.0448,  0.0679,  0.0417,  ...,  0.0834,  0.0564,  0.0651],
        [ 0.0351,  0.0615,  0.0406,  ...,  0.0897,  0.0453,  0.0876],
        [ 0.0567,  0.0764,  0.0416,  ...,  0.0656,  0.0600,  0.0580]], device='cuda:0')
loss: 105.99248504638672
var: tensor([[ 0.0747,  0.0582,  0.0252,  ...,  0.0593,  0.0373,  0.0653],
        [ 0.1367,  0.1795,  0.0665,  ...,  0.1660,  0.1133,  0.1515],
        [ 0.0600,  0.0889,  0.0753,  ...,  0.0850,  0.0774,  0.0665],
        ...,
        [ 0.0414,  0.0593,  0.0357,  ...,  0.0579,  0.0461,  0.0451],
        [ 0.0511,  0.0728,  0.0299,  ...,  0.0880,  0.0546,  0.0694],
        [ 0.0380,  0.0743,  0.0471,  ...,  0.0481,  0.0365,  0.0516]], device='cuda:0')
loss: 108.95703125
var: tensor([[ 0.0582,  0.0581,  0.0404,  ..

var: tensor([[ 0.0344,  0.0736,  0.0357,  ...,  0.0883,  0.0516,  0.0581],
        [ 0.0315,  0.0443,  0.0384,  ...,  0.0458,  0.0543,  0.0386],
        [ 0.0351,  0.0474,  0.0387,  ...,  0.0565,  0.0687,  0.0529],
        ...,
        [ 0.0961,  0.0458,  0.0330,  ...,  0.0856,  0.0453,  0.0809],
        [ 0.0388,  0.0394,  0.0369,  ...,  0.0501,  0.0585,  0.0507],
        [ 0.0619,  0.0812,  0.0502,  ...,  0.1145,  0.0631,  0.0671]], device='cuda:0')
loss: 109.07630920410156
var: tensor([[ 0.0288,  0.0733,  0.0394,  ...,  0.0906,  0.0536,  0.0863],
        [ 0.0556,  0.0703,  0.0581,  ...,  0.0758,  0.0680,  0.0645],
        [ 0.0447,  0.0544,  0.0471,  ...,  0.0722,  0.0618,  0.0598],
        ...,
        [ 0.1112,  0.1331,  0.0943,  ...,  0.1826,  0.1049,  0.1435],
        [ 0.0290,  0.0398,  0.0181,  ...,  0.0651,  0.0455,  0.0520],
        [ 0.0415,  0.0664,  0.0416,  ...,  0.0605,  0.0639,  0.0588]], device='cuda:0')
loss: 107.58789825439453
var: tensor([[ 0.0588,  0.1003,  0.038

var: tensor([[ 0.0560,  0.1177,  0.0455,  ...,  0.0997,  0.0948,  0.0684],
        [ 0.0525,  0.0512,  0.0287,  ...,  0.0759,  0.0613,  0.0661],
        [ 0.0370,  0.0756,  0.0366,  ...,  0.0946,  0.0651,  0.0501],
        ...,
        [ 0.0415,  0.0681,  0.0554,  ...,  0.0552,  0.0801,  0.0622],
        [ 0.0680,  0.0941,  0.0495,  ...,  0.0722,  0.0718,  0.0639],
        [ 0.0415,  0.0638,  0.0455,  ...,  0.0609,  0.0505,  0.0492]], device='cuda:0')
loss: 107.35704040527344
var: tensor([[ 0.0456,  0.0747,  0.0392,  ...,  0.1004,  0.0954,  0.0819],
        [ 0.0399,  0.0544,  0.0301,  ...,  0.0627,  0.0566,  0.0594],
        [ 0.0481,  0.0518,  0.0460,  ...,  0.0603,  0.0556,  0.0705],
        ...,
        [ 0.0526,  0.1005,  0.0568,  ...,  0.0625,  0.0675,  0.0639],
        [ 0.0358,  0.0732,  0.0311,  ...,  0.0586,  0.0466,  0.0510],
        [ 0.1212,  0.1157,  0.0440,  ...,  0.1240,  0.0881,  0.0938]], device='cuda:0')
loss: 108.70781707763672
var: tensor([[ 0.0299,  0.0644,  0.037

var: tensor([[ 0.0381,  0.1194,  0.1124,  ...,  0.1164,  0.1291,  0.0970],
        [ 0.0582,  0.0576,  0.0386,  ...,  0.0673,  0.0484,  0.0476],
        [ 0.0333,  0.0537,  0.0508,  ...,  0.0740,  0.0563,  0.0655],
        ...,
        [ 0.0298,  0.0411,  0.0314,  ...,  0.0524,  0.0524,  0.0415],
        [ 0.0566,  0.1066,  0.0586,  ...,  0.1005,  0.0800,  0.0810],
        [ 0.0868,  0.0461,  0.0394,  ...,  0.1083,  0.0566,  0.0722]], device='cuda:0')
loss: 108.5016860961914
var: tensor([[ 0.0395,  0.0620,  0.0364,  ...,  0.0630,  0.0440,  0.0831],
        [ 0.0344,  0.0513,  0.0538,  ...,  0.0609,  0.1109,  0.0668],
        [ 0.0428,  0.0609,  0.0395,  ...,  0.0622,  0.0488,  0.0524],
        ...,
        [ 0.0424,  0.0880,  0.0789,  ...,  0.0805,  0.0882,  0.0703],
        [ 0.0329,  0.0497,  0.0374,  ...,  0.0679,  0.0503,  0.0668],
        [ 0.0711,  0.1162,  0.0396,  ...,  0.1050,  0.1094,  0.0660]], device='cuda:0')
loss: 108.75437927246094
var: tensor([[ 0.1194,  0.0525,  0.0501

var: tensor([[ 0.0381,  0.0504,  0.0367,  ...,  0.0668,  0.0563,  0.0546],
        [ 0.0347,  0.0402,  0.0300,  ...,  0.0463,  0.0530,  0.0381],
        [ 0.0288,  0.0406,  0.0232,  ...,  0.0539,  0.0464,  0.0382],
        ...,
        [ 0.0446,  0.0454,  0.0418,  ...,  0.0450,  0.0532,  0.0620],
        [ 0.0688,  0.1117,  0.0414,  ...,  0.0854,  0.0870,  0.0560],
        [ 0.1720,  0.1467,  0.0569,  ...,  0.1853,  0.1463,  0.1482]], device='cuda:0')
loss: 108.66706848144531
var: tensor([[ 0.2005,  0.1437,  0.0598,  ...,  0.2020,  0.1512,  0.1911],
        [ 0.0586,  0.0987,  0.0380,  ...,  0.0783,  0.0703,  0.0505],
        [ 0.0672,  0.0777,  0.0350,  ...,  0.0698,  0.0498,  0.0590],
        ...,
        [ 0.0554,  0.0457,  0.0268,  ...,  0.0279,  0.0590,  0.0431],
        [ 0.0650,  0.0515,  0.0444,  ...,  0.0727,  0.0611,  0.0565],
        [ 0.0601,  0.0531,  0.0376,  ...,  0.0914,  0.0600,  0.0801]], device='cuda:0')
loss: 105.50289916992188
var: tensor([[ 0.0490,  0.0431,  0.029

var: tensor([[ 0.0364,  0.0471,  0.0425,  ...,  0.0600,  0.0670,  0.0470],
        [ 0.0724,  0.0454,  0.0458,  ...,  0.0698,  0.0496,  0.0869],
        [ 0.0328,  0.0675,  0.0463,  ...,  0.0849,  0.0636,  0.0491],
        ...,
        [ 0.0553,  0.0739,  0.0693,  ...,  0.0927,  0.0768,  0.0587],
        [ 0.0369,  0.0533,  0.0526,  ...,  0.0499,  0.0674,  0.0472],
        [ 0.0613,  0.1094,  0.0525,  ...,  0.1423,  0.0919,  0.0795]], device='cuda:0')
loss: 109.98474884033203
var: tensor([[ 0.0347,  0.0638,  0.0662,  ...,  0.0816,  0.0630,  0.0565],
        [ 0.0286,  0.0431,  0.0234,  ...,  0.0544,  0.0606,  0.0459],
        [ 0.0424,  0.0860,  0.0512,  ...,  0.0775,  0.0453,  0.0553],
        ...,
        [ 0.0768,  0.0600,  0.0419,  ...,  0.0925,  0.0823,  0.0692],
        [ 0.0452,  0.0670,  0.0452,  ...,  0.0835,  0.0559,  0.0495],
        [ 0.0465,  0.1136,  0.0494,  ...,  0.0830,  0.0610,  0.0610]], device='cuda:0')
loss: 111.00740814208984
var: tensor([[ 0.0461,  0.0566,  0.038

var: tensor([[ 0.0529,  0.0614,  0.0820,  ...,  0.0838,  0.0980,  0.0479],
        [ 0.0337,  0.0624,  0.0493,  ...,  0.1045,  0.0699,  0.0898],
        [ 0.0482,  0.1435,  0.1206,  ...,  0.1965,  0.1467,  0.1438],
        ...,
        [ 0.0515,  0.0571,  0.0593,  ...,  0.0877,  0.0686,  0.0643],
        [ 0.0377,  0.0601,  0.0450,  ...,  0.0871,  0.0708,  0.0654],
        [ 0.0275,  0.0509,  0.0435,  ...,  0.0777,  0.0712,  0.0585]], device='cuda:0')
loss: 105.2137451171875
var: tensor([[ 0.0885,  0.0647,  0.0352,  ...,  0.0999,  0.0592,  0.0565],
        [ 0.0783,  0.0461,  0.0355,  ...,  0.0646,  0.0428,  0.0505],
        [ 0.0372,  0.0741,  0.0740,  ...,  0.0949,  0.0887,  0.0474],
        ...,
        [ 0.0405,  0.0530,  0.0395,  ...,  0.0657,  0.0500,  0.0389],
        [ 0.0477,  0.0756,  0.0363,  ...,  0.0908,  0.0687,  0.0528],
        [ 0.0581,  0.0996,  0.0871,  ...,  0.0930,  0.0956,  0.0611]], device='cuda:0')
loss: 109.1243667602539
var: tensor([[ 0.0409,  0.0439,  0.0566,

var: tensor([[ 0.1017,  0.1531,  0.0750,  ...,  0.1629,  0.1153,  0.1646],
        [ 0.0251,  0.0581,  0.0586,  ...,  0.0829,  0.0763,  0.0551],
        [ 0.0582,  0.0796,  0.0729,  ...,  0.0970,  0.0907,  0.0638],
        ...,
        [ 0.0454,  0.0707,  0.0304,  ...,  0.0780,  0.0542,  0.0452],
        [ 0.0419,  0.0693,  0.0379,  ...,  0.0751,  0.0711,  0.0762],
        [ 0.0468,  0.0618,  0.0350,  ...,  0.0732,  0.0612,  0.0587]], device='cuda:0')
loss: 106.12820434570312
var: tensor([[ 0.0523,  0.0847,  0.0375,  ...,  0.0914,  0.1045,  0.0421],
        [ 0.0273,  0.0493,  0.0497,  ...,  0.0736,  0.0704,  0.0593],
        [ 0.0274,  0.0766,  0.0437,  ...,  0.1039,  0.0659,  0.0619],
        ...,
        [ 0.1098,  0.1318,  0.0649,  ...,  0.1868,  0.0943,  0.1104],
        [ 0.0313,  0.0607,  0.0590,  ...,  0.0783,  0.0845,  0.0554],
        [ 0.0525,  0.0891,  0.0354,  ...,  0.0838,  0.0930,  0.0571]], device='cuda:0')
loss: 104.45381164550781
var: tensor([[ 0.1482,  0.1584,  0.054

var: tensor([[ 0.1202,  0.1902,  0.0683,  ...,  0.1748,  0.1094,  0.1239],
        [ 0.2289,  0.1860,  0.0643,  ...,  0.2075,  0.1523,  0.1472],
        [ 0.0486,  0.0590,  0.0432,  ...,  0.0797,  0.0620,  0.0610],
        ...,
        [ 0.0371,  0.0796,  0.0440,  ...,  0.0917,  0.0726,  0.0716],
        [ 0.0374,  0.0694,  0.0352,  ...,  0.0777,  0.0474,  0.0607],
        [ 0.0830,  0.0581,  0.0577,  ...,  0.1238,  0.0717,  0.0851]], device='cuda:0')
loss: 109.77911376953125
var: tensor([[ 0.1121,  0.0463,  0.0410,  ...,  0.0854,  0.0529,  0.0783],
        [ 0.0314,  0.0507,  0.0278,  ...,  0.0557,  0.0616,  0.0354],
        [ 0.0495,  0.0652,  0.0429,  ...,  0.0903,  0.0668,  0.0340],
        ...,
        [ 0.0471,  0.0471,  0.0412,  ...,  0.1001,  0.0528,  0.0648],
        [ 0.0258,  0.0566,  0.0255,  ...,  0.0628,  0.0578,  0.0482],
        [ 0.1861,  0.2203,  0.0770,  ...,  0.2417,  0.1637,  0.2063]], device='cuda:0')
loss: 108.68203735351562
var: tensor([[ 0.0408,  0.0611,  0.048

var: tensor([[ 0.0431,  0.0830,  0.0423,  ...,  0.0577,  0.0548,  0.0536],
        [ 0.0411,  0.0520,  0.0364,  ...,  0.0635,  0.0388,  0.0747],
        [ 0.0437,  0.0348,  0.0335,  ...,  0.0885,  0.0539,  0.0564],
        ...,
        [ 0.0448,  0.0575,  0.0271,  ...,  0.0498,  0.0407,  0.0681],
        [ 0.0723,  0.0390,  0.0300,  ...,  0.0820,  0.0358,  0.0850],
        [ 0.0349,  0.0547,  0.0394,  ...,  0.0505,  0.0648,  0.0647]], device='cuda:0')
loss: 109.58587646484375
var: tensor([[ 0.0287,  0.0340,  0.0230,  ...,  0.0441,  0.0341,  0.0356],
        [ 0.0305,  0.0539,  0.0453,  ...,  0.0715,  0.0543,  0.0521],
        [ 0.0329,  0.0565,  0.0283,  ...,  0.0350,  0.0425,  0.0381],
        ...,
        [ 0.0969,  0.0509,  0.0452,  ...,  0.1175,  0.0533,  0.0982],
        [ 0.0985,  0.1054,  0.0619,  ...,  0.0981,  0.0857,  0.0728],
        [ 0.0588,  0.0967,  0.0518,  ...,  0.0965,  0.0718,  0.0796]], device='cuda:0')
loss: 109.44192504882812
var: tensor([[ 0.1364,  0.1546,  0.119

var: tensor([[ 0.0348,  0.0571,  0.0389,  ...,  0.0422,  0.0714,  0.0604],
        [ 0.0455,  0.0410,  0.0284,  ...,  0.0444,  0.0474,  0.0474],
        [ 0.0468,  0.0765,  0.0458,  ...,  0.0489,  0.0719,  0.0670],
        ...,
        [ 0.0353,  0.0568,  0.0375,  ...,  0.0633,  0.0543,  0.0565],
        [ 0.0813,  0.1024,  0.0481,  ...,  0.0883,  0.1152,  0.0623],
        [ 0.0396,  0.0567,  0.0489,  ...,  0.0570,  0.0597,  0.0840]], device='cuda:0')
loss: 110.90010070800781
var: tensor([[ 0.0379,  0.0531,  0.0331,  ...,  0.0452,  0.0474,  0.0600],
        [ 0.0474,  0.0729,  0.0359,  ...,  0.0811,  0.0628,  0.0661],
        [ 0.0360,  0.0833,  0.0331,  ...,  0.0545,  0.0594,  0.0568],
        ...,
        [ 0.0523,  0.0752,  0.0287,  ...,  0.0617,  0.0599,  0.0563],
        [ 0.1317,  0.0904,  0.0545,  ...,  0.0967,  0.0796,  0.0839],
        [ 0.0335,  0.0550,  0.0293,  ...,  0.0607,  0.0357,  0.0521]], device='cuda:0')
loss: 105.04368591308594
var: tensor([[ 0.0389,  0.0599,  0.031

var: tensor([[ 0.0487,  0.0665,  0.0442,  ...,  0.0617,  0.0658,  0.0738],
        [ 0.0668,  0.0703,  0.0525,  ...,  0.0728,  0.0736,  0.0676],
        [ 0.0464,  0.0503,  0.0569,  ...,  0.0638,  0.0613,  0.0765],
        ...,
        [ 0.0308,  0.0609,  0.0473,  ...,  0.0598,  0.0655,  0.0525],
        [ 0.0524,  0.0682,  0.0393,  ...,  0.0802,  0.0696,  0.0622],
        [ 0.0564,  0.0731,  0.0417,  ...,  0.0540,  0.0745,  0.0616]], device='cuda:0')
loss: 108.5981216430664
var: tensor([[ 0.1574,  0.1855,  0.1064,  ...,  0.2080,  0.1475,  0.1458],
        [ 0.0450,  0.0747,  0.0351,  ...,  0.0711,  0.0641,  0.0681],
        [ 0.0651,  0.1376,  0.0578,  ...,  0.0809,  0.0930,  0.1137],
        ...,
        [ 0.0414,  0.0707,  0.0452,  ...,  0.0829,  0.0970,  0.0703],
        [ 0.0292,  0.0606,  0.0428,  ...,  0.0656,  0.0628,  0.0655],
        [ 0.0543,  0.1255,  0.0641,  ...,  0.0788,  0.1013,  0.0771]], device='cuda:0')
loss: 104.42076110839844
var: tensor([[ 0.0305,  0.0455,  0.0365

var: tensor([[ 0.0447,  0.0434,  0.0292,  ...,  0.0489,  0.0515,  0.0403],
        [ 0.0540,  0.1183,  0.0785,  ...,  0.1082,  0.0778,  0.0699],
        [ 0.0520,  0.0425,  0.0386,  ...,  0.0801,  0.0585,  0.0464],
        ...,
        [ 0.0491,  0.1056,  0.0410,  ...,  0.0887,  0.0710,  0.0546],
        [ 0.0599,  0.0701,  0.0471,  ...,  0.0813,  0.0705,  0.0562],
        [ 0.0558,  0.0910,  0.0653,  ...,  0.0645,  0.0608,  0.0437]], device='cuda:0')
loss: 109.57048797607422
var: tensor([[ 0.0741,  0.0778,  0.0778,  ...,  0.0744,  0.1005,  0.0608],
        [ 0.0448,  0.0953,  0.0719,  ...,  0.0693,  0.0774,  0.0565],
        [ 0.1082,  0.1299,  0.0475,  ...,  0.1376,  0.0986,  0.0606],
        ...,
        [ 0.0333,  0.0604,  0.0375,  ...,  0.0691,  0.0477,  0.0557],
        [ 0.0554,  0.0587,  0.0402,  ...,  0.0759,  0.0701,  0.0769],
        [ 0.0324,  0.0421,  0.0373,  ...,  0.0458,  0.0613,  0.0340]], device='cuda:0')
loss: 107.34703826904297
var: tensor([[ 0.0579,  0.0673,  0.051

var: tensor([[ 0.0425,  0.0545,  0.0231,  ...,  0.0430,  0.0484,  0.0382],
        [ 0.0773,  0.0771,  0.0445,  ...,  0.0818,  0.0753,  0.0808],
        [ 0.0815,  0.0511,  0.0343,  ...,  0.0865,  0.0488,  0.0530],
        ...,
        [ 0.0351,  0.0694,  0.0315,  ...,  0.0538,  0.0466,  0.0533],
        [ 0.0464,  0.0806,  0.0331,  ...,  0.0574,  0.0484,  0.0392],
        [ 0.0867,  0.0510,  0.0327,  ...,  0.0468,  0.0472,  0.0512]], device='cuda:0')
loss: 110.89646911621094
var: tensor([[ 0.0493,  0.0649,  0.0311,  ...,  0.0468,  0.0498,  0.0431],
        [ 0.0479,  0.0561,  0.0399,  ...,  0.0747,  0.0550,  0.0484],
        [ 0.0411,  0.0587,  0.0408,  ...,  0.0681,  0.0564,  0.0584],
        ...,
        [ 0.0537,  0.0703,  0.0295,  ...,  0.0681,  0.0500,  0.0479],
        [ 0.0769,  0.0707,  0.0421,  ...,  0.0579,  0.0594,  0.0554],
        [ 0.0436,  0.0683,  0.0455,  ...,  0.0508,  0.0684,  0.0543]], device='cuda:0')
loss: 111.20826721191406
var: tensor([[ 0.0410,  0.0561,  0.033

var: tensor([[ 0.1521,  0.1098,  0.0755,  ...,  0.1232,  0.0962,  0.1016],
        [ 0.0345,  0.1694,  0.1207,  ...,  0.1451,  0.1008,  0.1052],
        [ 0.1004,  0.1162,  0.0463,  ...,  0.1283,  0.0959,  0.0640],
        ...,
        [ 0.0362,  0.0447,  0.0313,  ...,  0.0870,  0.0339,  0.0588],
        [ 0.0856,  0.1028,  0.0474,  ...,  0.0935,  0.0806,  0.0662],
        [ 0.0483,  0.0766,  0.0414,  ...,  0.0863,  0.0444,  0.0585]], device='cuda:0')
loss: 110.72100830078125
var: tensor([[ 0.0954,  0.0567,  0.0413,  ...,  0.0509,  0.0460,  0.0545],
        [ 0.0914,  0.0490,  0.0244,  ...,  0.0795,  0.0353,  0.0642],
        [ 0.0483,  0.0846,  0.0472,  ...,  0.0667,  0.0559,  0.0653],
        ...,
        [ 0.0399,  0.0607,  0.0323,  ...,  0.0627,  0.0460,  0.0487],
        [ 0.0568,  0.0752,  0.0430,  ...,  0.0695,  0.0527,  0.0628],
        [ 0.0345,  0.0556,  0.0435,  ...,  0.0600,  0.0415,  0.0631]], device='cuda:0')
loss: 112.09400177001953
var: tensor([[ 0.0377,  0.0756,  0.036

var: tensor([[ 0.0390,  0.0800,  0.0461,  ...,  0.0651,  0.0675,  0.0519],
        [ 0.0334,  0.0896,  0.0717,  ...,  0.0643,  0.0806,  0.0535],
        [ 0.0727,  0.0804,  0.0473,  ...,  0.0757,  0.0644,  0.0599],
        ...,
        [ 0.0672,  0.1168,  0.0541,  ...,  0.0953,  0.0965,  0.0645],
        [ 0.0640,  0.1881,  0.0526,  ...,  0.0920,  0.0806,  0.0695],
        [ 0.0431,  0.0644,  0.0409,  ...,  0.0862,  0.0526,  0.0483]], device='cuda:0')
loss: 111.08333587646484
var: tensor([[ 0.0348,  0.0709,  0.0454,  ...,  0.0484,  0.0659,  0.0357],
        [ 0.0272,  0.0544,  0.0291,  ...,  0.0471,  0.0595,  0.0438],
        [ 0.0907,  0.1960,  0.1015,  ...,  0.1558,  0.1241,  0.1511],
        ...,
        [ 0.1081,  0.1831,  0.0618,  ...,  0.1423,  0.1199,  0.0887],
        [ 0.0848,  0.0831,  0.0449,  ...,  0.0989,  0.0638,  0.0842],
        [ 0.0394,  0.0596,  0.0412,  ...,  0.0721,  0.0476,  0.0469]], device='cuda:0')
loss: 103.31181335449219
var: tensor([[ 0.0984,  0.0738,  0.041

var: tensor([[ 0.0388,  0.0626,  0.0424,  ...,  0.0584,  0.0448,  0.0740],
        [ 0.0675,  0.0676,  0.0457,  ...,  0.0869,  0.0423,  0.0814],
        [ 0.0338,  0.0802,  0.0477,  ...,  0.0680,  0.0501,  0.0644],
        ...,
        [ 0.0468,  0.0663,  0.0379,  ...,  0.0623,  0.0464,  0.0568],
        [ 0.0617,  0.1708,  0.1072,  ...,  0.1550,  0.1026,  0.1341],
        [ 0.0544,  0.0470,  0.0316,  ...,  0.0626,  0.0404,  0.0597]], device='cuda:0')
loss: 109.52824401855469
var: tensor([[ 0.0646,  0.0704,  0.0444,  ...,  0.0817,  0.0525,  0.0748],
        [ 0.0471,  0.1132,  0.0459,  ...,  0.0895,  0.0645,  0.0794],
        [ 0.0439,  0.0447,  0.0398,  ...,  0.0616,  0.0442,  0.0521],
        ...,
        [ 0.0387,  0.0532,  0.0367,  ...,  0.0581,  0.0453,  0.0435],
        [ 0.0332,  0.0819,  0.0545,  ...,  0.0799,  0.0572,  0.0616],
        [ 0.0416,  0.0532,  0.0524,  ...,  0.0855,  0.0428,  0.0821]], device='cuda:0')
loss: 109.44654083251953
var: tensor([[ 0.0682,  0.0739,  0.043

loss: 103.12821960449219
var: tensor([[ 0.0345,  0.0730,  0.0497,  ...,  0.0565,  0.0499,  0.0548],
        [ 0.0314,  0.0464,  0.0343,  ...,  0.0701,  0.0429,  0.0503],
        [ 0.0417,  0.0459,  0.0274,  ...,  0.0510,  0.0504,  0.0351],
        ...,
        [ 0.0740,  0.0712,  0.0365,  ...,  0.0846,  0.0774,  0.0551],
        [ 0.0266,  0.0431,  0.0356,  ...,  0.0338,  0.0532,  0.0408],
        [ 0.0459,  0.0875,  0.0446,  ...,  0.0710,  0.0784,  0.0623]], device='cuda:0')
loss: 105.72908020019531
var: tensor([[ 0.0351,  0.0567,  0.0365,  ...,  0.0573,  0.0480,  0.0617],
        [ 0.0369,  0.0540,  0.0426,  ...,  0.0537,  0.0422,  0.0348],
        [ 0.0502,  0.0494,  0.0392,  ...,  0.0775,  0.0567,  0.0556],
        ...,
        [ 0.0516,  0.0345,  0.0341,  ...,  0.0437,  0.0434,  0.0435],
        [ 0.1152,  0.1753,  0.0680,  ...,  0.1566,  0.1129,  0.1492],
        [ 0.0900,  0.0424,  0.0389,  ...,  0.0656,  0.0491,  0.0540]], device='cuda:0')
loss: 104.4196548461914
var: tensor([[

var: tensor([[ 0.0446,  0.0930,  0.0405,  ...,  0.0794,  0.0794,  0.0493],
        [ 0.0454,  0.0755,  0.0704,  ...,  0.0917,  0.0827,  0.0548],
        [ 0.0317,  0.0445,  0.0220,  ...,  0.0701,  0.0652,  0.0441],
        ...,
        [ 0.0501,  0.0546,  0.0479,  ...,  0.0592,  0.0739,  0.0644],
        [ 0.0312,  0.0379,  0.0311,  ...,  0.0510,  0.0872,  0.0406],
        [ 0.0499,  0.0444,  0.0286,  ...,  0.0486,  0.0607,  0.0486]], device='cuda:0')
loss: 109.256103515625
var: tensor([[ 0.0467,  0.0674,  0.0338,  ...,  0.0972,  0.0744,  0.0545],
        [ 0.0511,  0.1036,  0.0508,  ...,  0.1169,  0.0870,  0.0751],
        [ 0.0348,  0.0560,  0.0489,  ...,  0.0557,  0.0772,  0.0741],
        ...,
        [ 0.0470,  0.0683,  0.0493,  ...,  0.0706,  0.0616,  0.0498],
        [ 0.0484,  0.0776,  0.0499,  ...,  0.0872,  0.0723,  0.0707],
        [ 0.0466,  0.1339,  0.1159,  ...,  0.1428,  0.1054,  0.1014]], device='cuda:0')
loss: 103.21591186523438
var: tensor([[ 0.0405,  0.0507,  0.0432,

var: tensor([[ 0.0554,  0.0903,  0.0578,  ...,  0.0856,  0.0712,  0.0722],
        [ 0.0610,  0.1301,  0.0612,  ...,  0.0820,  0.0746,  0.1019],
        [ 0.0279,  0.0551,  0.0317,  ...,  0.0660,  0.0774,  0.0454],
        ...,
        [ 0.0511,  0.0738,  0.0529,  ...,  0.0723,  0.0630,  0.0556],
        [ 0.0324,  0.0555,  0.0415,  ...,  0.0531,  0.0632,  0.0437],
        [ 0.0470,  0.0537,  0.0381,  ...,  0.0593,  0.0625,  0.0484]], device='cuda:0')
loss: 110.7216796875
var: tensor([[ 0.0567,  0.1251,  0.0385,  ...,  0.0954,  0.0778,  0.0719],
        [ 0.0301,  0.0624,  0.0414,  ...,  0.0859,  0.0565,  0.0582],
        [ 0.0434,  0.1072,  0.0392,  ...,  0.0746,  0.0568,  0.0765],
        ...,
        [ 0.0365,  0.0559,  0.0399,  ...,  0.0654,  0.0684,  0.0384],
        [ 0.0561,  0.0761,  0.0438,  ...,  0.0880,  0.0685,  0.0636],
        [ 0.0800,  0.0670,  0.0414,  ...,  0.0811,  0.0498,  0.0622]], device='cuda:0')
loss: 106.63783264160156
var: tensor([[ 0.0469,  0.1358,  0.1043,  

var: tensor([[ 0.0469,  0.1323,  0.1493,  ...,  0.1250,  0.1424,  0.1054],
        [ 0.0551,  0.1259,  0.0448,  ...,  0.0904,  0.0760,  0.0635],
        [ 0.0374,  0.0519,  0.0510,  ...,  0.0731,  0.0489,  0.0711],
        ...,
        [ 0.0790,  0.0813,  0.0681,  ...,  0.0691,  0.0674,  0.0825],
        [ 0.1727,  0.2210,  0.0840,  ...,  0.1749,  0.1811,  0.1310],
        [ 0.0982,  0.1137,  0.0682,  ...,  0.0890,  0.0853,  0.0828]], device='cuda:0')
loss: 106.91236877441406
var: tensor([[ 0.0349,  0.0599,  0.0470,  ...,  0.0623,  0.0525,  0.0505],
        [ 0.0368,  0.0574,  0.0404,  ...,  0.0746,  0.0412,  0.0601],
        [ 0.0567,  0.0649,  0.0521,  ...,  0.0703,  0.0588,  0.0571],
        ...,
        [ 0.0489,  0.0586,  0.0529,  ...,  0.0526,  0.0515,  0.0309],
        [ 0.0587,  0.1062,  0.0583,  ...,  0.1018,  0.1051,  0.0753],
        [ 0.0407,  0.0675,  0.0364,  ...,  0.0861,  0.0579,  0.0566]], device='cuda:0')
loss: 103.38291931152344
var: tensor([[ 0.1906,  0.1807,  0.087

var: tensor([[ 0.0447,  0.1067,  0.0584,  ...,  0.0880,  0.0568,  0.0941],
        [ 0.0319,  0.0442,  0.0369,  ...,  0.0729,  0.0732,  0.0787],
        [ 0.0583,  0.1816,  0.0870,  ...,  0.1428,  0.0747,  0.0948],
        ...,
        [ 0.0471,  0.0589,  0.0415,  ...,  0.0934,  0.0748,  0.0631],
        [ 0.0329,  0.0579,  0.0512,  ...,  0.0707,  0.0615,  0.0619],
        [ 0.0401,  0.0683,  0.0460,  ...,  0.0762,  0.0380,  0.0504]], device='cuda:0')
loss: 108.40234375
var: tensor([[ 0.0435,  0.0580,  0.0486,  ...,  0.0688,  0.0655,  0.0514],
        [ 0.0300,  0.0633,  0.0410,  ...,  0.0779,  0.0700,  0.0724],
        [ 0.0570,  0.0873,  0.0736,  ...,  0.1097,  0.0758,  0.0644],
        ...,
        [ 0.0206,  0.0337,  0.0313,  ...,  0.0382,  0.0587,  0.0473],
        [ 0.0666,  0.0640,  0.0449,  ...,  0.0925,  0.0610,  0.1184],
        [ 0.0405,  0.1122,  0.0518,  ...,  0.0942,  0.0635,  0.0773]], device='cuda:0')
loss: 105.45645141601562
var: tensor([[ 0.0610,  0.1055,  0.0401,  ..

loss: 111.02203369140625
var: tensor([[ 0.0835,  0.0606,  0.0602,  ...,  0.0791,  0.0671,  0.0898],
        [ 0.0417,  0.1149,  0.0826,  ...,  0.1260,  0.1238,  0.1216],
        [ 0.0547,  0.0866,  0.0654,  ...,  0.0914,  0.0815,  0.0757],
        ...,
        [ 0.0331,  0.0382,  0.0296,  ...,  0.0675,  0.0467,  0.0407],
        [ 0.0357,  0.0395,  0.0415,  ...,  0.0620,  0.0741,  0.0513],
        [ 0.1073,  0.0716,  0.0545,  ...,  0.1097,  0.0536,  0.1147]], device='cuda:0')
loss: 109.53485107421875
var: tensor([[ 0.0396,  0.0710,  0.0439,  ...,  0.0635,  0.0689,  0.0596],
        [ 0.0291,  0.1437,  0.1334,  ...,  0.1531,  0.1228,  0.1408],
        [ 0.0427,  0.0729,  0.0561,  ...,  0.0979,  0.0794,  0.0523],
        ...,
        [ 0.0551,  0.0772,  0.0591,  ...,  0.0798,  0.0826,  0.0798],
        [ 0.0420,  0.0758,  0.0434,  ...,  0.1091,  0.0860,  0.0623],
        [ 0.0586,  0.1671,  0.1159,  ...,  0.1835,  0.1208,  0.1804]], device='cuda:0')
loss: 109.00330352783203
var: tensor([

var: tensor([[ 0.0511,  0.0902,  0.0700,  ...,  0.0789,  0.0693,  0.0451],
        [ 0.1252,  0.1572,  0.0547,  ...,  0.1637,  0.0931,  0.0766],
        [ 0.0752,  0.0836,  0.0588,  ...,  0.0852,  0.0790,  0.0649],
        ...,
        [ 0.1220,  0.0963,  0.0398,  ...,  0.0956,  0.0687,  0.0650],
        [ 0.0571,  0.0976,  0.0394,  ...,  0.0640,  0.0664,  0.0500],
        [ 0.0798,  0.0454,  0.0303,  ...,  0.0550,  0.0450,  0.0533]], device='cuda:0')
loss: 104.57190704345703
var: tensor([[ 0.1005,  0.0929,  0.0444,  ...,  0.1022,  0.0970,  0.0519],
        [ 0.0565,  0.0568,  0.0395,  ...,  0.0899,  0.0529,  0.0604],
        [ 0.0501,  0.2215,  0.1178,  ...,  0.2438,  0.1063,  0.1173],
        ...,
        [ 0.0555,  0.0683,  0.0382,  ...,  0.0754,  0.0537,  0.0488],
        [ 0.0704,  0.1508,  0.0368,  ...,  0.0924,  0.0965,  0.0570],
        [ 0.0669,  0.0757,  0.0274,  ...,  0.0782,  0.0536,  0.0520]], device='cuda:0')
loss: 108.69357299804688
var: tensor([[ 0.0378,  0.0991,  0.061

var: tensor([[ 0.0395,  0.1063,  0.0584,  ...,  0.0688,  0.0670,  0.0565],
        [ 0.0521,  0.0802,  0.0626,  ...,  0.0962,  0.0855,  0.0706],
        [ 0.0399,  0.0666,  0.0497,  ...,  0.0694,  0.0448,  0.0688],
        ...,
        [ 0.0610,  0.1061,  0.0689,  ...,  0.1143,  0.1115,  0.0644],
        [ 0.0703,  0.0650,  0.0512,  ...,  0.0816,  0.0544,  0.0734],
        [ 0.0546,  0.1343,  0.0598,  ...,  0.1175,  0.1143,  0.0693]], device='cuda:0')
loss: 105.80033874511719
var: tensor([[ 0.0226,  0.0444,  0.0506,  ...,  0.0612,  0.0674,  0.0588],
        [ 0.0695,  0.0689,  0.0672,  ...,  0.0860,  0.0799,  0.0710],
        [ 0.1307,  0.0866,  0.0690,  ...,  0.0880,  0.0822,  0.0741],
        ...,
        [ 0.0632,  0.0759,  0.0617,  ...,  0.0856,  0.0675,  0.0634],
        [ 0.1211,  0.1319,  0.1358,  ...,  0.1967,  0.1079,  0.1113],
        [ 0.0517,  0.1129,  0.0594,  ...,  0.1002,  0.0755,  0.0761]], device='cuda:0')
loss: 109.05068969726562
var: tensor([[ 0.0288,  0.0370,  0.047

var: tensor([[ 0.0547,  0.0719,  0.0368,  ...,  0.0731,  0.0594,  0.0601],
        [ 0.0479,  0.0608,  0.0435,  ...,  0.0727,  0.0767,  0.0514],
        [ 0.0382,  0.0363,  0.0232,  ...,  0.0476,  0.0376,  0.0504],
        ...,
        [ 0.0681,  0.0581,  0.0446,  ...,  0.0595,  0.0535,  0.0566],
        [ 0.0554,  0.1235,  0.1097,  ...,  0.1223,  0.1503,  0.0973],
        [ 0.1340,  0.0870,  0.0734,  ...,  0.0973,  0.0975,  0.0785]], device='cuda:0')
loss: 107.76325988769531
var: tensor([[ 0.0598,  0.0709,  0.0610,  ...,  0.0749,  0.0908,  0.0498],
        [ 0.1123,  0.0695,  0.0475,  ...,  0.0852,  0.0832,  0.0889],
        [ 0.0315,  0.0369,  0.0279,  ...,  0.0486,  0.0525,  0.0266],
        ...,
        [ 0.0671,  0.1479,  0.0509,  ...,  0.1119,  0.1260,  0.0929],
        [ 0.0568,  0.0638,  0.0401,  ...,  0.0489,  0.0972,  0.0499],
        [ 0.0392,  0.0850,  0.0584,  ...,  0.0750,  0.0716,  0.0719]], device='cuda:0')
loss: 107.84814453125
var: tensor([[ 0.0832,  0.1517,  0.0609, 

var: tensor([[ 0.0422,  0.0633,  0.0397,  ...,  0.0701,  0.0537,  0.0601],
        [ 0.0676,  0.1083,  0.0331,  ...,  0.1066,  0.0845,  0.0531],
        [ 0.0382,  0.0651,  0.0325,  ...,  0.0710,  0.0548,  0.0681],
        ...,
        [ 0.0337,  0.0412,  0.0221,  ...,  0.0430,  0.0459,  0.0347],
        [ 0.0398,  0.0680,  0.0239,  ...,  0.0527,  0.0504,  0.0345],
        [ 0.0544,  0.0706,  0.0577,  ...,  0.0722,  0.0627,  0.0454]], device='cuda:0')
loss: 109.12220764160156
var: tensor([[ 0.0314,  0.0339,  0.0242,  ...,  0.0379,  0.0645,  0.0432],
        [ 0.0421,  0.0614,  0.0282,  ...,  0.0399,  0.0777,  0.0466],
        [ 0.0542,  0.0664,  0.0294,  ...,  0.0700,  0.0565,  0.0489],
        ...,
        [ 0.0831,  0.0911,  0.0480,  ...,  0.0955,  0.0757,  0.0993],
        [ 0.0742,  0.0629,  0.0361,  ...,  0.0747,  0.0709,  0.0598],
        [ 0.0649,  0.1091,  0.0709,  ...,  0.0695,  0.0749,  0.0475]], device='cuda:0')
loss: 106.06950378417969
var: tensor([[ 0.0491,  0.0640,  0.026

var: tensor([[ 0.0407,  0.0652,  0.0349,  ...,  0.0620,  0.0514,  0.0602],
        [ 0.0339,  0.0457,  0.0463,  ...,  0.0472,  0.0615,  0.0420],
        [ 0.0351,  0.0494,  0.0403,  ...,  0.0739,  0.0515,  0.0744],
        ...,
        [ 0.0426,  0.0454,  0.0425,  ...,  0.0731,  0.0544,  0.0451],
        [ 0.0339,  0.0787,  0.0424,  ...,  0.0633,  0.0505,  0.0522],
        [ 0.0303,  0.0312,  0.0369,  ...,  0.0435,  0.0552,  0.0385]], device='cuda:0')
loss: 111.31057739257812
var: tensor([[ 0.0506,  0.0665,  0.0363,  ...,  0.0813,  0.0403,  0.0656],
        [ 0.0590,  0.1132,  0.0553,  ...,  0.0919,  0.0714,  0.0713],
        [ 0.0852,  0.0657,  0.0386,  ...,  0.0892,  0.0506,  0.0730],
        ...,
        [ 0.0491,  0.0794,  0.0473,  ...,  0.0782,  0.0707,  0.0577],
        [ 0.0731,  0.1534,  0.0762,  ...,  0.1620,  0.0762,  0.0849],
        [ 0.0476,  0.0813,  0.0561,  ...,  0.0946,  0.0610,  0.0700]], device='cuda:0')
loss: 107.00230407714844
var: tensor([[ 0.0385,  0.0789,  0.046

var: tensor([[ 0.0658,  0.1061,  0.0347,  ...,  0.0847,  0.0926,  0.0564],
        [ 0.0476,  0.0641,  0.0352,  ...,  0.0745,  0.0630,  0.0610],
        [ 0.0588,  0.1679,  0.1352,  ...,  0.1746,  0.1149,  0.0993],
        ...,
        [ 0.0377,  0.0599,  0.0399,  ...,  0.0612,  0.0556,  0.0370],
        [ 0.0388,  0.0579,  0.0444,  ...,  0.0544,  0.0452,  0.0416],
        [ 0.1218,  0.1548,  0.0697,  ...,  0.1863,  0.1130,  0.0948]], device='cuda:0')
loss: 104.9298095703125
var: tensor([[ 0.0547,  0.1151,  0.0566,  ...,  0.0972,  0.0760,  0.0677],
        [ 0.0302,  0.0505,  0.0299,  ...,  0.0566,  0.0509,  0.0403],
        [ 0.0836,  0.1538,  0.1066,  ...,  0.1763,  0.1241,  0.1470],
        ...,
        [ 0.0540,  0.0873,  0.0390,  ...,  0.0856,  0.0642,  0.0638],
        [ 0.0450,  0.0659,  0.0330,  ...,  0.0615,  0.0551,  0.0518],
        [ 0.0611,  0.1054,  0.0510,  ...,  0.0952,  0.0823,  0.0660]], device='cuda:0')
loss: 105.70570373535156
var: tensor([[ 0.0365,  0.0524,  0.0426

var: tensor([[ 0.1351,  0.0568,  0.0514,  ...,  0.0797,  0.0680,  0.0926],
        [ 0.0471,  0.2014,  0.1413,  ...,  0.1952,  0.1466,  0.1775],
        [ 0.0277,  0.0873,  0.0460,  ...,  0.0643,  0.0793,  0.0527],
        ...,
        [ 0.0216,  0.0757,  0.0340,  ...,  0.0534,  0.0578,  0.0492],
        [ 0.1706,  0.2040,  0.0804,  ...,  0.1980,  0.1647,  0.1736],
        [ 0.0463,  0.0931,  0.0718,  ...,  0.0775,  0.0864,  0.0568]], device='cuda:0')
loss: 107.42019653320312
var: tensor([[ 0.0399,  0.0349,  0.0189,  ...,  0.0505,  0.0492,  0.0454],
        [ 0.0372,  0.0662,  0.0405,  ...,  0.0592,  0.0718,  0.0457],
        [ 0.0411,  0.0474,  0.0355,  ...,  0.0628,  0.0560,  0.0533],
        ...,
        [ 0.0251,  0.0422,  0.0339,  ...,  0.0647,  0.0464,  0.0444],
        [ 0.0575,  0.0786,  0.0440,  ...,  0.1169,  0.0879,  0.1128],
        [ 0.0504,  0.0489,  0.0473,  ...,  0.0544,  0.0799,  0.0516]], device='cuda:0')
loss: 106.97085571289062
var: tensor([[ 0.0385,  0.0873,  0.057

var: tensor([[ 0.2343,  0.1729,  0.0587,  ...,  0.2171,  0.1466,  0.1392],
        [ 0.0378,  0.0789,  0.0462,  ...,  0.0857,  0.0628,  0.0744],
        [ 0.0526,  0.0523,  0.0444,  ...,  0.0733,  0.0516,  0.0731],
        ...,
        [ 0.1656,  0.1650,  0.0643,  ...,  0.2566,  0.1553,  0.1456],
        [ 0.0489,  0.0726,  0.0423,  ...,  0.0905,  0.0549,  0.0695],
        [ 0.0378,  0.0514,  0.0454,  ...,  0.0509,  0.0731,  0.0517]], device='cuda:0')
loss: 105.88005828857422
var: tensor([[ 0.0518,  0.1371,  0.0993,  ...,  0.1649,  0.1144,  0.1681],
        [ 0.0534,  0.1212,  0.0588,  ...,  0.0889,  0.0699,  0.0727],
        [ 0.0950,  0.1014,  0.0507,  ...,  0.1481,  0.1104,  0.0702],
        ...,
        [ 0.0334,  0.0617,  0.0499,  ...,  0.0875,  0.0471,  0.0626],
        [ 0.0305,  0.0437,  0.0309,  ...,  0.0553,  0.0600,  0.0611],
        [ 0.0583,  0.0982,  0.0557,  ...,  0.1073,  0.0798,  0.0690]], device='cuda:0')
loss: 106.80306243896484
var: tensor([[ 0.0342,  0.0414,  0.035

var: tensor([[ 0.0441,  0.0441,  0.0386,  ...,  0.0501,  0.0511,  0.0588],
        [ 0.0502,  0.0652,  0.0433,  ...,  0.0748,  0.0592,  0.0885],
        [ 0.0573,  0.0782,  0.0566,  ...,  0.0707,  0.0619,  0.0921],
        ...,
        [ 0.0339,  0.0497,  0.0395,  ...,  0.0533,  0.0503,  0.0883],
        [ 0.1041,  0.2001,  0.0959,  ...,  0.1966,  0.1257,  0.1951],
        [ 0.0489,  0.0537,  0.0300,  ...,  0.0582,  0.0473,  0.0506]], device='cuda:0')
loss: 111.06504821777344
var: tensor([[ 0.0956,  0.1110,  0.0459,  ...,  0.1113,  0.0980,  0.0793],
        [ 0.1341,  0.1594,  0.0584,  ...,  0.1723,  0.1319,  0.1236],
        [ 0.0565,  0.0876,  0.0608,  ...,  0.1222,  0.0721,  0.0731],
        ...,
        [ 0.0390,  0.0506,  0.0458,  ...,  0.0413,  0.0536,  0.0470],
        [ 0.0856,  0.0825,  0.0492,  ...,  0.1016,  0.0652,  0.0777],
        [ 0.0544,  0.0640,  0.0368,  ...,  0.0769,  0.0847,  0.0948]], device='cuda:0')
loss: 107.37297821044922
var: tensor([[ 0.1225,  0.1834,  0.072

loss: 112.36624908447266
var: tensor([[ 0.0524,  0.0530,  0.0348,  ...,  0.0668,  0.0630,  0.0814],
        [ 0.0366,  0.0732,  0.0459,  ...,  0.0883,  0.0622,  0.0756],
        [ 0.2344,  0.1900,  0.0835,  ...,  0.2373,  0.1866,  0.2266],
        ...,
        [ 0.0689,  0.0397,  0.0337,  ...,  0.0656,  0.0441,  0.0820],
        [ 0.2075,  0.1845,  0.0941,  ...,  0.2694,  0.1924,  0.2164],
        [ 0.0415,  0.0808,  0.0355,  ...,  0.0802,  0.0541,  0.0776]], device='cuda:0')
loss: 107.45944213867188
var: tensor([[ 0.0315,  0.0338,  0.0218,  ...,  0.0339,  0.0689,  0.0433],
        [ 0.0506,  0.0803,  0.0401,  ...,  0.0653,  0.0559,  0.0639],
        [ 0.1034,  0.0526,  0.0519,  ...,  0.0944,  0.0541,  0.0740],
        ...,
        [ 0.0436,  0.0437,  0.0382,  ...,  0.0728,  0.0646,  0.0529],
        [ 0.0701,  0.0605,  0.0440,  ...,  0.0950,  0.0611,  0.0589],
        [ 0.0358,  0.0732,  0.0354,  ...,  0.0713,  0.0413,  0.0702]], device='cuda:0')
loss: 105.53601837158203
var: tensor([

var: tensor([[ 0.0335,  0.0440,  0.0484,  ...,  0.0709,  0.0408,  0.0338],
        [ 0.0421,  0.0528,  0.0534,  ...,  0.0735,  0.0573,  0.0566],
        [ 0.0751,  0.0850,  0.0505,  ...,  0.0941,  0.0859,  0.0493],
        ...,
        [ 0.0432,  0.0667,  0.0473,  ...,  0.0540,  0.0814,  0.0470],
        [ 0.0410,  0.0453,  0.0367,  ...,  0.0477,  0.0390,  0.0483],
        [ 0.0461,  0.0740,  0.0404,  ...,  0.0742,  0.0756,  0.0626]], device='cuda:0')
loss: 104.0659408569336
var: tensor([[ 0.0448,  0.0320,  0.0313,  ...,  0.0378,  0.0325,  0.0335],
        [ 0.0903,  0.0553,  0.0353,  ...,  0.0949,  0.0506,  0.0684],
        [ 0.0545,  0.0529,  0.0436,  ...,  0.0946,  0.0813,  0.0583],
        ...,
        [ 0.0365,  0.0444,  0.0483,  ...,  0.0455,  0.0686,  0.0430],
        [ 0.0590,  0.0626,  0.0497,  ...,  0.0831,  0.0536,  0.0678],
        [ 0.0600,  0.0535,  0.0515,  ...,  0.0773,  0.0553,  0.0818]], device='cuda:0')
loss: 110.66847229003906
var: tensor([[ 0.0758,  0.0880,  0.0707

var: tensor([[ 0.0661,  0.0519,  0.0438,  ...,  0.0663,  0.0578,  0.0775],
        [ 0.0339,  0.0568,  0.0395,  ...,  0.0685,  0.0493,  0.0641],
        [ 0.0330,  0.0428,  0.0321,  ...,  0.0644,  0.0473,  0.0493],
        ...,
        [ 0.0423,  0.0508,  0.0302,  ...,  0.0738,  0.0510,  0.0697],
        [ 0.0523,  0.0990,  0.0389,  ...,  0.0989,  0.0965,  0.0650],
        [ 0.0419,  0.0411,  0.0378,  ...,  0.0704,  0.0428,  0.0472]], device='cuda:0')
loss: 106.71920013427734
var: tensor([[ 0.0576,  0.0728,  0.0336,  ...,  0.0938,  0.0742,  0.0620],
        [ 0.0471,  0.0704,  0.0380,  ...,  0.0606,  0.0536,  0.0557],
        [ 0.1310,  0.1241,  0.0429,  ...,  0.2379,  0.1247,  0.1248],
        ...,
        [ 0.0561,  0.0623,  0.0387,  ...,  0.1148,  0.0602,  0.0541],
        [ 0.0380,  0.0445,  0.0307,  ...,  0.0664,  0.0550,  0.0604],
        [ 0.0318,  0.0461,  0.0293,  ...,  0.0578,  0.0435,  0.0567]], device='cuda:0')
loss: 108.01734161376953
var: tensor([[ 0.0345,  0.0486,  0.026

var: tensor([[ 0.0443,  0.0896,  0.0356,  ...,  0.0758,  0.0709,  0.0527],
        [ 0.0754,  0.0506,  0.0313,  ...,  0.0840,  0.0582,  0.0453],
        [ 0.0300,  0.0391,  0.0371,  ...,  0.0695,  0.0589,  0.0619],
        ...,
        [ 0.0679,  0.0668,  0.0426,  ...,  0.0956,  0.0675,  0.0595],
        [ 0.0700,  0.0771,  0.0466,  ...,  0.0992,  0.0979,  0.0647],
        [ 0.0544,  0.1033,  0.0798,  ...,  0.0816,  0.0877,  0.0518]], device='cuda:0')
loss: 107.1039810180664
var: tensor([[ 0.0916,  0.0579,  0.0386,  ...,  0.0948,  0.0762,  0.0827],
        [ 0.0624,  0.0445,  0.0438,  ...,  0.0490,  0.0434,  0.0426],
        [ 0.0693,  0.0456,  0.0298,  ...,  0.0597,  0.0455,  0.0477],
        ...,
        [ 0.0414,  0.0447,  0.0350,  ...,  0.0709,  0.0598,  0.0530],
        [ 0.0340,  0.0545,  0.0755,  ...,  0.0787,  0.0630,  0.0427],
        [ 0.0553,  0.0639,  0.0409,  ...,  0.0701,  0.0727,  0.0629]], device='cuda:0')
loss: 104.92973327636719
var: tensor([[ 0.0439,  0.0772,  0.0324

var: tensor([[ 0.0380,  0.0728,  0.0515,  ...,  0.0762,  0.0567,  0.0623],
        [ 0.0484,  0.1449,  0.0922,  ...,  0.1252,  0.0731,  0.0952],
        [ 0.0721,  0.0736,  0.0533,  ...,  0.0716,  0.0493,  0.0772],
        ...,
        [ 0.0702,  0.0913,  0.0827,  ...,  0.1285,  0.0703,  0.1223],
        [ 0.0468,  0.1467,  0.1402,  ...,  0.1462,  0.0960,  0.1313],
        [ 0.0281,  0.0595,  0.0324,  ...,  0.0471,  0.0419,  0.0518]], device='cuda:0')
loss: 103.6361312866211
var: tensor([[ 0.0446,  0.0726,  0.0404,  ...,  0.0778,  0.0498,  0.0726],
        [ 0.0424,  0.0509,  0.0358,  ...,  0.0571,  0.0441,  0.0477],
        [ 0.0340,  0.0477,  0.0343,  ...,  0.0972,  0.0596,  0.0635],
        ...,
        [ 0.0422,  0.0864,  0.0516,  ...,  0.1046,  0.0610,  0.0769],
        [ 0.0431,  0.1321,  0.0631,  ...,  0.1079,  0.0624,  0.0878],
        [ 0.0589,  0.0967,  0.0383,  ...,  0.0942,  0.0724,  0.0805]], device='cuda:0')
loss: 108.13673400878906
var: tensor([[ 0.0673,  0.0888,  0.0768

var: tensor([[ 0.0401,  0.0342,  0.0340,  ...,  0.0735,  0.0447,  0.0513],
        [ 0.0364,  0.0475,  0.0494,  ...,  0.0798,  0.0405,  0.0603],
        [ 0.0282,  0.0515,  0.0439,  ...,  0.0443,  0.0736,  0.0445],
        ...,
        [ 0.0614,  0.0849,  0.0549,  ...,  0.0835,  0.0912,  0.0637],
        [ 0.1054,  0.0655,  0.0457,  ...,  0.0954,  0.0712,  0.0999],
        [ 0.0430,  0.1491,  0.0733,  ...,  0.1115,  0.0772,  0.1158]], device='cuda:0')
loss: 106.97704315185547
var: tensor([[ 0.0657,  0.0759,  0.0493,  ...,  0.0836,  0.0639,  0.0736],
        [ 0.0374,  0.1149,  0.1118,  ...,  0.1562,  0.0819,  0.1082],
        [ 0.0527,  0.1261,  0.0537,  ...,  0.1135,  0.0849,  0.0710],
        ...,
        [ 0.0483,  0.0594,  0.0396,  ...,  0.0663,  0.0535,  0.0616],
        [ 0.1438,  0.1488,  0.0675,  ...,  0.2639,  0.1546,  0.1807],
        [ 0.0363,  0.1037,  0.0460,  ...,  0.0754,  0.0597,  0.0737]], device='cuda:0')
loss: 102.48534393310547
var: tensor([[ 0.0249,  0.0561,  0.033

var: tensor([[ 0.0734,  0.1142,  0.0850,  ...,  0.1001,  0.1474,  0.0854],
        [ 0.0780,  0.0861,  0.0434,  ...,  0.1130,  0.0997,  0.0562],
        [ 0.0432,  0.1272,  0.1152,  ...,  0.1182,  0.0781,  0.0759],
        ...,
        [ 0.0445,  0.0604,  0.0268,  ...,  0.0707,  0.0469,  0.0392],
        [ 0.0651,  0.1305,  0.0472,  ...,  0.0964,  0.0838,  0.0610],
        [ 0.0425,  0.0347,  0.0284,  ...,  0.0655,  0.0443,  0.0473]], device='cuda:0')
loss: 104.6588134765625
var: tensor([[ 0.0340,  0.0297,  0.0145,  ...,  0.0439,  0.0409,  0.0352],
        [ 0.0588,  0.0723,  0.0437,  ...,  0.1192,  0.0597,  0.0912],
        [ 0.0366,  0.0576,  0.0302,  ...,  0.0925,  0.0725,  0.0521],
        ...,
        [ 0.0372,  0.0576,  0.0382,  ...,  0.0696,  0.0618,  0.0444],
        [ 0.0424,  0.0583,  0.0430,  ...,  0.0786,  0.0543,  0.0656],
        [ 0.0481,  0.1050,  0.0552,  ...,  0.0742,  0.0599,  0.0585]], device='cuda:0')
loss: 109.54591369628906
var: tensor([[ 0.0514,  0.0596,  0.0355

var: tensor([[ 0.0374,  0.0363,  0.0302,  ...,  0.0453,  0.0610,  0.0683],
        [ 0.0428,  0.0473,  0.0550,  ...,  0.0510,  0.0588,  0.0541],
        [ 0.0874,  0.0618,  0.0400,  ...,  0.0798,  0.0595,  0.0776],
        ...,
        [ 0.0623,  0.1040,  0.0392,  ...,  0.1102,  0.1204,  0.0644],
        [ 0.0972,  0.0945,  0.0487,  ...,  0.1114,  0.0630,  0.0917],
        [ 0.0317,  0.0615,  0.0389,  ...,  0.0719,  0.0519,  0.0702]], device='cuda:0')
loss: 109.89408111572266
var: tensor([[ 0.1008,  0.0857,  0.0425,  ...,  0.0845,  0.0722,  0.0811],
        [ 0.0570,  0.0697,  0.0475,  ...,  0.0896,  0.1035,  0.0617],
        [ 0.0608,  0.1573,  0.0437,  ...,  0.0892,  0.1176,  0.0743],
        ...,
        [ 0.0365,  0.1833,  0.1542,  ...,  0.1621,  0.1596,  0.1696],
        [ 0.0422,  0.0585,  0.0249,  ...,  0.0570,  0.0819,  0.0291],
        [ 0.0390,  0.0921,  0.0714,  ...,  0.0734,  0.0794,  0.0763]], device='cuda:0')
loss: 104.5858154296875
var: tensor([[ 0.0309,  0.0421,  0.0354

var: tensor([[ 0.0248,  0.0428,  0.0297,  ...,  0.0450,  0.0466,  0.0292],
        [ 0.0506,  0.0692,  0.0537,  ...,  0.1115,  0.0805,  0.0719],
        [ 0.0535,  0.1801,  0.0908,  ...,  0.1284,  0.0887,  0.1384],
        ...,
        [ 0.0468,  0.0771,  0.0475,  ...,  0.0533,  0.0536,  0.0507],
        [ 0.0255,  0.0578,  0.0330,  ...,  0.0525,  0.0516,  0.0465],
        [ 0.0422,  0.0775,  0.0899,  ...,  0.0739,  0.0522,  0.0558]], device='cuda:0')
loss: 104.74153137207031
var: tensor([[ 0.0302,  0.0516,  0.0404,  ...,  0.0581,  0.0455,  0.0751],
        [ 0.0563,  0.0835,  0.0411,  ...,  0.1029,  0.0585,  0.0742],
        [ 0.0623,  0.1120,  0.0454,  ...,  0.1022,  0.0639,  0.0600],
        ...,
        [ 0.0597,  0.1028,  0.0451,  ...,  0.1060,  0.0879,  0.0700],
        [ 0.0518,  0.0594,  0.0513,  ...,  0.0812,  0.0490,  0.0823],
        [ 0.0439,  0.0620,  0.0379,  ...,  0.0484,  0.0585,  0.0481]], device='cuda:0')
loss: 103.10343933105469
var: tensor([[ 0.0380,  0.1025,  0.066

var: tensor([[ 0.0669,  0.0293,  0.0354,  ...,  0.0473,  0.0344,  0.0499],
        [ 0.0329,  0.0512,  0.0280,  ...,  0.0665,  0.0394,  0.0787],
        [ 0.0389,  0.0383,  0.0403,  ...,  0.0612,  0.0649,  0.0547],
        ...,
        [ 0.0317,  0.0378,  0.0259,  ...,  0.0502,  0.0399,  0.0398],
        [ 0.0341,  0.0393,  0.0329,  ...,  0.0504,  0.0394,  0.0710],
        [ 0.0448,  0.0546,  0.0431,  ...,  0.0666,  0.0829,  0.0560]], device='cuda:0')
loss: 107.25231170654297
var: tensor([[ 0.0372,  0.0415,  0.0390,  ...,  0.0486,  0.0780,  0.0520],
        [ 0.0474,  0.0514,  0.0316,  ...,  0.0847,  0.0570,  0.0869],
        [ 0.0528,  0.1156,  0.0433,  ...,  0.0947,  0.0861,  0.0734],
        ...,
        [ 0.0671,  0.0652,  0.0480,  ...,  0.1148,  0.0665,  0.0883],
        [ 0.0398,  0.0429,  0.0389,  ...,  0.0767,  0.0588,  0.0778],
        [ 0.0391,  0.0438,  0.0408,  ...,  0.0481,  0.0430,  0.0572]], device='cuda:0')
loss: 109.47689819335938
var: tensor([[ 0.0400,  0.0566,  0.025

var: tensor([[ 0.0395,  0.1802,  0.1669,  ...,  0.2133,  0.1623,  0.1944],
        [ 0.0414,  0.0637,  0.0535,  ...,  0.0728,  0.0572,  0.0643],
        [ 0.0379,  0.0644,  0.0434,  ...,  0.0483,  0.0578,  0.0522],
        ...,
        [ 0.0721,  0.0790,  0.0532,  ...,  0.1139,  0.0715,  0.0857],
        [ 0.0509,  0.0785,  0.0816,  ...,  0.0781,  0.0697,  0.0619],
        [ 0.0755,  0.0949,  0.0460,  ...,  0.1073,  0.0847,  0.0624]], device='cuda:0')
loss: 101.97489929199219
var: tensor([[ 0.0461,  0.0585,  0.0459,  ...,  0.0985,  0.0696,  0.0660],
        [ 0.0791,  0.0862,  0.0490,  ...,  0.1115,  0.0831,  0.0817],
        [ 0.0445,  0.0683,  0.0398,  ...,  0.0667,  0.0642,  0.0610],
        ...,
        [ 0.0408,  0.0293,  0.0393,  ...,  0.0640,  0.0486,  0.0633],
        [ 0.0506,  0.0402,  0.0475,  ...,  0.0534,  0.0545,  0.0563],
        [ 0.0508,  0.1024,  0.0621,  ...,  0.0894,  0.0749,  0.0761]], device='cuda:0')
loss: 110.87666320800781
var: tensor([[ 0.0618,  0.0940,  0.067

var: tensor([[ 0.0542,  0.0474,  0.0290,  ...,  0.0627,  0.0527,  0.0478],
        [ 0.0802,  0.0726,  0.0345,  ...,  0.0982,  0.0520,  0.0747],
        [ 0.0626,  0.0871,  0.0352,  ...,  0.0960,  0.0610,  0.0641],
        ...,
        [ 0.0600,  0.1151,  0.0455,  ...,  0.0733,  0.0669,  0.0657],
        [ 0.0853,  0.0830,  0.0500,  ...,  0.0900,  0.0687,  0.0797],
        [ 0.0488,  0.0577,  0.0442,  ...,  0.0596,  0.0611,  0.0580]], device='cuda:0')
loss: 105.1029052734375
var: tensor([[ 0.1678,  0.1206,  0.0520,  ...,  0.1572,  0.1077,  0.0970],
        [ 0.0501,  0.0671,  0.0543,  ...,  0.1107,  0.0473,  0.0813],
        [ 0.0456,  0.0822,  0.0399,  ...,  0.0872,  0.0746,  0.0476],
        ...,
        [ 0.0489,  0.0631,  0.0257,  ...,  0.0462,  0.0511,  0.0472],
        [ 0.0570,  0.0820,  0.0326,  ...,  0.1107,  0.0684,  0.0617],
        [ 0.0404,  0.0710,  0.0407,  ...,  0.0614,  0.0851,  0.0476]], device='cuda:0')
loss: 104.44358825683594
var: tensor([[ 0.0295,  0.0296,  0.0211

var: tensor([[ 0.0826,  0.0676,  0.0695,  ...,  0.0943,  0.0610,  0.0823],
        [ 0.0303,  0.0411,  0.0272,  ...,  0.0554,  0.0360,  0.0347],
        [ 0.1970,  0.1539,  0.0660,  ...,  0.2047,  0.1230,  0.1480],
        ...,
        [ 0.0426,  0.0429,  0.0305,  ...,  0.0676,  0.0612,  0.0435],
        [ 0.0589,  0.0745,  0.0366,  ...,  0.0987,  0.0820,  0.0503],
        [ 0.0344,  0.0543,  0.0381,  ...,  0.0798,  0.0499,  0.0635]], device='cuda:0')
loss: 107.21147918701172
var: tensor([[ 0.0279,  0.0316,  0.0325,  ...,  0.0602,  0.0475,  0.0492],
        [ 0.0886,  0.1622,  0.1021,  ...,  0.2177,  0.1058,  0.1327],
        [ 0.0698,  0.0910,  0.0473,  ...,  0.1089,  0.0749,  0.0507],
        ...,
        [ 0.0663,  0.0857,  0.0394,  ...,  0.0821,  0.0576,  0.0620],
        [ 0.0635,  0.1173,  0.0569,  ...,  0.1000,  0.0718,  0.0713],
        [ 0.0405,  0.0507,  0.0329,  ...,  0.0669,  0.0585,  0.0534]], device='cuda:0')
loss: 102.78276062011719
var: tensor([[ 0.0357,  0.0344,  0.043

loss: 104.54702758789062
var: tensor([[ 0.0371,  0.0556,  0.0423,  ...,  0.0941,  0.0611,  0.0656],
        [ 0.0558,  0.1017,  0.0469,  ...,  0.1110,  0.0770,  0.0661],
        [ 0.0613,  0.0518,  0.0377,  ...,  0.1062,  0.0613,  0.0688],
        ...,
        [ 0.0493,  0.0547,  0.0432,  ...,  0.0839,  0.0598,  0.0714],
        [ 0.0337,  0.0625,  0.0259,  ...,  0.0807,  0.0735,  0.0447],
        [ 0.0356,  0.0503,  0.0455,  ...,  0.0683,  0.0511,  0.0518]], device='cuda:0')
loss: 109.02842712402344
var: tensor([[ 0.2120,  0.1895,  0.0692,  ...,  0.2371,  0.1464,  0.1425],
        [ 0.0325,  0.0414,  0.0535,  ...,  0.0702,  0.0558,  0.0416],
        [ 0.0431,  0.0576,  0.0375,  ...,  0.0907,  0.0712,  0.0834],
        ...,
        [ 0.0381,  0.0659,  0.0283,  ...,  0.0768,  0.0497,  0.0603],
        [ 0.0941,  0.1463,  0.0489,  ...,  0.1984,  0.0966,  0.1112],
        [ 0.0473,  0.0690,  0.0458,  ...,  0.0999,  0.0808,  0.0712]], device='cuda:0')
loss: 99.61549377441406
var: tensor([[

var: tensor([[ 0.0445,  0.0573,  0.0415,  ...,  0.0392,  0.0550,  0.0416],
        [ 0.0815,  0.0825,  0.0391,  ...,  0.0994,  0.0594,  0.0957],
        [ 0.0345,  0.0661,  0.0353,  ...,  0.0477,  0.0447,  0.0695],
        ...,
        [ 0.1768,  0.1966,  0.0793,  ...,  0.2121,  0.1706,  0.1775],
        [ 0.0437,  0.0766,  0.0341,  ...,  0.0766,  0.0483,  0.0881],
        [ 0.0603,  0.0846,  0.0365,  ...,  0.0881,  0.0823,  0.0667]], device='cuda:0')
loss: 106.74958801269531
var: tensor([[ 0.0834,  0.1026,  0.0504,  ...,  0.0839,  0.0675,  0.0756],
        [ 0.0478,  0.0536,  0.0478,  ...,  0.0649,  0.0526,  0.0688],
        [ 0.0356,  0.0484,  0.0357,  ...,  0.0494,  0.0495,  0.0406],
        ...,
        [ 0.0923,  0.0968,  0.0604,  ...,  0.0816,  0.0570,  0.1206],
        [ 0.0305,  0.0436,  0.0293,  ...,  0.0310,  0.0367,  0.0443],
        [ 0.0317,  0.0639,  0.0297,  ...,  0.0472,  0.0439,  0.0628]], device='cuda:0')
loss: 108.72834777832031
var: tensor([[ 0.0434,  0.0446,  0.031

var: tensor([[ 0.0538,  0.0710,  0.0699,  ...,  0.0525,  0.0729,  0.0543],
        [ 0.0344,  0.0531,  0.0417,  ...,  0.0711,  0.0418,  0.0566],
        [ 0.0421,  0.0915,  0.0708,  ...,  0.0860,  0.0664,  0.0740],
        ...,
        [ 0.0452,  0.0526,  0.0539,  ...,  0.0601,  0.0566,  0.0533],
        [ 0.0349,  0.0387,  0.0426,  ...,  0.0496,  0.0523,  0.0490],
        [ 0.0499,  0.0788,  0.0358,  ...,  0.0763,  0.0722,  0.0654]], device='cuda:0')
loss: 108.42860412597656
var: tensor([[ 0.0267,  0.0414,  0.0289,  ...,  0.0477,  0.0349,  0.0542],
        [ 0.0561,  0.0782,  0.0518,  ...,  0.0971,  0.0634,  0.0873],
        [ 0.0503,  0.1069,  0.0704,  ...,  0.0748,  0.0666,  0.0645],
        ...,
        [ 0.0431,  0.0534,  0.0317,  ...,  0.1008,  0.0526,  0.0539],
        [ 0.0538,  0.1025,  0.0764,  ...,  0.0857,  0.0769,  0.0706],
        [ 0.0502,  0.0845,  0.0383,  ...,  0.0625,  0.0628,  0.0589]], device='cuda:0')
loss: 104.70609283447266
var: tensor([[ 0.0327,  0.0667,  0.029

====> Test set loss: 97.1050
var: tensor([[ 0.0543,  0.0951,  0.0451,  ...,  0.0811,  0.0946,  0.0742],
        [ 0.0697,  0.0739,  0.0490,  ...,  0.0729,  0.0806,  0.0703],
        [ 0.0246,  0.0470,  0.0371,  ...,  0.0331,  0.0566,  0.0345],
        ...,
        [ 0.0414,  0.1498,  0.1047,  ...,  0.1191,  0.1202,  0.1243],
        [ 0.1427,  0.1633,  0.0709,  ...,  0.1321,  0.1073,  0.1528],
        [ 0.0364,  0.0705,  0.0494,  ...,  0.0420,  0.0656,  0.0716]], device='cuda:0')
loss: 108.21339416503906
var: tensor([[ 0.0658,  0.0482,  0.0418,  ...,  0.0799,  0.0514,  0.0839],
        [ 0.0387,  0.1095,  0.0818,  ...,  0.0515,  0.0645,  0.0826],
        [ 0.0467,  0.1120,  0.0553,  ...,  0.0831,  0.0732,  0.0765],
        ...,
        [ 0.0383,  0.0374,  0.0270,  ...,  0.0319,  0.0395,  0.0523],
        [ 0.0443,  0.0756,  0.0466,  ...,  0.0764,  0.0557,  0.0704],
        [ 0.0511,  0.0636,  0.0416,  ...,  0.0687,  0.0704,  0.0747]], device='cuda:0')
loss: 102.82398986816406
var: tens

var: tensor([[ 0.0267,  0.0370,  0.0346,  ...,  0.0473,  0.0563,  0.0554],
        [ 0.0393,  0.0848,  0.0476,  ...,  0.0773,  0.0582,  0.0620],
        [ 0.0812,  0.1549,  0.0914,  ...,  0.1260,  0.0857,  0.1326],
        ...,
        [ 0.0675,  0.1029,  0.0552,  ...,  0.0756,  0.0787,  0.0673],
        [ 0.0280,  0.0323,  0.0297,  ...,  0.0421,  0.0523,  0.0394],
        [ 0.1348,  0.1457,  0.0951,  ...,  0.1781,  0.1174,  0.1370]], device='cuda:0')
loss: 109.77488708496094
var: tensor([[ 0.0741,  0.0642,  0.0595,  ...,  0.0739,  0.0562,  0.0610],
        [ 0.0528,  0.0548,  0.0294,  ...,  0.0593,  0.0638,  0.0451],
        [ 0.0364,  0.0682,  0.0581,  ...,  0.0548,  0.0571,  0.0537],
        ...,
        [ 0.0486,  0.1851,  0.1394,  ...,  0.1779,  0.1301,  0.1991],
        [ 0.0533,  0.0387,  0.0313,  ...,  0.0426,  0.0509,  0.0692],
        [ 0.0317,  0.0393,  0.0313,  ...,  0.0423,  0.0511,  0.0347]], device='cuda:0')
loss: 106.76164245605469
var: tensor([[ 0.0362,  0.0672,  0.064

var: tensor([[ 0.0750,  0.0543,  0.0421,  ...,  0.1007,  0.0503,  0.0672],
        [ 0.0434,  0.0670,  0.0255,  ...,  0.0741,  0.0517,  0.0458],
        [ 0.0611,  0.0584,  0.0398,  ...,  0.0748,  0.0576,  0.0452],
        ...,
        [ 0.1033,  0.0577,  0.0350,  ...,  0.0860,  0.0539,  0.0734],
        [ 0.0692,  0.0690,  0.0401,  ...,  0.0802,  0.0572,  0.0510],
        [ 0.0410,  0.0927,  0.0366,  ...,  0.0643,  0.0556,  0.0614]], device='cuda:0')
loss: 106.50601196289062
var: tensor([[ 0.0364,  0.0971,  0.0439,  ...,  0.1021,  0.0569,  0.0645],
        [ 0.0582,  0.1444,  0.0449,  ...,  0.1444,  0.1077,  0.0890],
        [ 0.1077,  0.1655,  0.0626,  ...,  0.1576,  0.0806,  0.1255],
        ...,
        [ 0.0477,  0.0673,  0.0435,  ...,  0.0753,  0.0495,  0.0584],
        [ 0.0467,  0.0594,  0.0377,  ...,  0.0705,  0.0368,  0.0817],
        [ 0.0308,  0.0590,  0.0338,  ...,  0.0793,  0.0395,  0.0618]], device='cuda:0')
loss: 105.93170928955078
var: tensor([[ 0.0510,  0.1119,  0.044

var: tensor([[ 0.0358,  0.0665,  0.0240,  ...,  0.0772,  0.0593,  0.0416],
        [ 0.0665,  0.0675,  0.0372,  ...,  0.0943,  0.0876,  0.0699],
        [ 0.0328,  0.0475,  0.0250,  ...,  0.0448,  0.0946,  0.0348],
        ...,
        [ 0.1599,  0.1607,  0.0578,  ...,  0.2120,  0.1799,  0.1125],
        [ 0.0329,  0.0813,  0.0457,  ...,  0.1056,  0.0942,  0.0958],
        [ 0.0386,  0.0922,  0.0475,  ...,  0.0763,  0.0725,  0.0554]], device='cuda:0')
loss: 106.1276626586914
var: tensor([[ 0.0569,  0.0582,  0.0267,  ...,  0.0672,  0.0876,  0.0592],
        [ 0.0276,  0.0942,  0.0341,  ...,  0.0661,  0.0764,  0.0494],
        [ 0.0273,  0.0373,  0.0240,  ...,  0.0516,  0.0527,  0.0329],
        ...,
        [ 0.0393,  0.1366,  0.0404,  ...,  0.0969,  0.0932,  0.0674],
        [ 0.0459,  0.0746,  0.0567,  ...,  0.0671,  0.0861,  0.0485],
        [ 0.0331,  0.0572,  0.0381,  ...,  0.0782,  0.0725,  0.0489]], device='cuda:0')
loss: 109.21045684814453
var: tensor([[ 0.0432,  0.0699,  0.0364

var: tensor([[ 0.0409,  0.1103,  0.0433,  ...,  0.0773,  0.0679,  0.0549],
        [ 0.0380,  0.0481,  0.0273,  ...,  0.0519,  0.0826,  0.0382],
        [ 0.0408,  0.0669,  0.0529,  ...,  0.0620,  0.0780,  0.0530],
        ...,
        [ 0.0287,  0.0482,  0.0364,  ...,  0.0538,  0.0740,  0.0419],
        [ 0.0613,  0.0728,  0.0340,  ...,  0.0822,  0.0557,  0.0577],
        [ 0.1052,  0.1016,  0.0506,  ...,  0.1219,  0.0877,  0.0547]], device='cuda:0')
loss: 104.73931121826172
var: tensor([[ 0.0341,  0.0663,  0.0338,  ...,  0.0944,  0.0583,  0.0489],
        [ 0.0519,  0.0972,  0.0410,  ...,  0.0571,  0.0574,  0.0676],
        [ 0.0609,  0.0715,  0.0378,  ...,  0.0775,  0.0492,  0.0551],
        ...,
        [ 0.0486,  0.0367,  0.0354,  ...,  0.0567,  0.0322,  0.0387],
        [ 0.0512,  0.0640,  0.0327,  ...,  0.0584,  0.0598,  0.0278],
        [ 0.0541,  0.0779,  0.0647,  ...,  0.0797,  0.0839,  0.0488]], device='cuda:0')
loss: 105.32852172851562
var: tensor([[ 0.0625,  0.0679,  0.039

var: tensor([[ 0.0390,  0.0491,  0.0278,  ...,  0.0489,  0.0466,  0.0672],
        [ 0.0800,  0.0531,  0.0292,  ...,  0.0767,  0.0561,  0.0660],
        [ 0.1180,  0.1996,  0.0702,  ...,  0.1826,  0.1005,  0.1426],
        ...,
        [ 0.0768,  0.0674,  0.0336,  ...,  0.0737,  0.0475,  0.0787],
        [ 0.0458,  0.1720,  0.0809,  ...,  0.1583,  0.0785,  0.0909],
        [ 0.0863,  0.1566,  0.0474,  ...,  0.1784,  0.1217,  0.0927]], device='cuda:0')
loss: 103.61827850341797
var: tensor([[ 0.0277,  0.0441,  0.0416,  ...,  0.0426,  0.0797,  0.0435],
        [ 0.0501,  0.0594,  0.0302,  ...,  0.0853,  0.0611,  0.0513],
        [ 0.0449,  0.0578,  0.0242,  ...,  0.0456,  0.0499,  0.0415],
        ...,
        [ 0.0955,  0.0755,  0.0507,  ...,  0.0839,  0.0530,  0.0816],
        [ 0.1263,  0.1026,  0.0457,  ...,  0.0974,  0.0851,  0.0704],
        [ 0.0317,  0.0592,  0.0390,  ...,  0.0515,  0.0877,  0.0377]], device='cuda:0')
loss: 109.9372787475586
var: tensor([[ 0.0527,  0.0856,  0.0393

loss: 110.51097106933594
var: tensor([[ 0.0407,  0.0618,  0.0330,  ...,  0.0580,  0.0411,  0.0764],
        [ 0.0463,  0.1042,  0.0523,  ...,  0.0890,  0.0681,  0.0757],
        [ 0.0829,  0.0600,  0.0347,  ...,  0.0963,  0.0537,  0.0715],
        ...,
        [ 0.0510,  0.0884,  0.0727,  ...,  0.0785,  0.0672,  0.0786],
        [ 0.0339,  0.0464,  0.0241,  ...,  0.0609,  0.0520,  0.0436],
        [ 0.0834,  0.0678,  0.0450,  ...,  0.0884,  0.0950,  0.0583]], device='cuda:0')
loss: 102.37150573730469
var: tensor([[ 0.0270,  0.0344,  0.0250,  ...,  0.0327,  0.0308,  0.0484],
        [ 0.2016,  0.1623,  0.0675,  ...,  0.1927,  0.1383,  0.1259],
        [ 0.0157,  0.0279,  0.0201,  ...,  0.0302,  0.0377,  0.0296],
        ...,
        [ 0.0445,  0.0790,  0.0369,  ...,  0.0630,  0.0685,  0.0661],
        [ 0.0494,  0.0661,  0.0947,  ...,  0.1012,  0.0740,  0.0658],
        [ 0.0549,  0.0576,  0.0352,  ...,  0.0542,  0.0617,  0.0525]], device='cuda:0')
loss: 109.7590560913086
var: tensor([[

var: tensor([[ 0.0396,  0.0498,  0.0277,  ...,  0.0603,  0.0634,  0.0518],
        [ 0.0608,  0.0700,  0.0484,  ...,  0.0940,  0.0726,  0.0658],
        [ 0.0336,  0.0564,  0.0308,  ...,  0.0762,  0.0504,  0.0563],
        ...,
        [ 0.0610,  0.0840,  0.0444,  ...,  0.0868,  0.0623,  0.0593],
        [ 0.0693,  0.0708,  0.0375,  ...,  0.0977,  0.0908,  0.0532],
        [ 0.0514,  0.1227,  0.0445,  ...,  0.1099,  0.0842,  0.0916]], device='cuda:0')
loss: 108.09584045410156
var: tensor([[ 0.0446,  0.0653,  0.0320,  ...,  0.0502,  0.0524,  0.0383],
        [ 0.0373,  0.0484,  0.0386,  ...,  0.0556,  0.0427,  0.0505],
        [ 0.0413,  0.0517,  0.0469,  ...,  0.0550,  0.0537,  0.0355],
        ...,
        [ 0.1094,  0.1332,  0.0477,  ...,  0.1635,  0.1175,  0.0959],
        [ 0.0352,  0.0656,  0.0326,  ...,  0.0653,  0.0518,  0.0679],
        [ 0.0443,  0.0659,  0.0263,  ...,  0.0601,  0.0478,  0.0546]], device='cuda:0')
loss: 106.9482421875
var: tensor([[ 0.0267,  0.0377,  0.0302,  

loss: 104.42977142333984
var: tensor([[ 0.0618,  0.0710,  0.0594,  ...,  0.0717,  0.0830,  0.0507],
        [ 0.0453,  0.1135,  0.0428,  ...,  0.0994,  0.0734,  0.0705],
        [ 0.0532,  0.1427,  0.0932,  ...,  0.1597,  0.0980,  0.1325],
        ...,
        [ 0.0469,  0.0423,  0.0327,  ...,  0.0585,  0.0359,  0.0446],
        [ 0.0251,  0.0356,  0.0170,  ...,  0.0383,  0.0424,  0.0314],
        [ 0.0249,  0.0734,  0.0344,  ...,  0.0770,  0.0535,  0.0712]], device='cuda:0')
loss: 105.24732208251953
var: tensor([[ 0.0295,  0.0423,  0.0239,  ...,  0.0441,  0.0600,  0.0492],
        [ 0.0246,  0.0593,  0.0371,  ...,  0.1060,  0.0551,  0.0619],
        [ 0.0412,  0.0367,  0.0320,  ...,  0.0694,  0.0512,  0.0429],
        ...,
        [ 0.0303,  0.0532,  0.0280,  ...,  0.0894,  0.0612,  0.0897],
        [ 0.0611,  0.1344,  0.0391,  ...,  0.1451,  0.0924,  0.0870],
        [ 0.0388,  0.0591,  0.0214,  ...,  0.0780,  0.0500,  0.0519]], device='cuda:0')
loss: 109.49845123291016
var: tensor([

loss: 106.73446655273438
var: tensor([[ 0.0468,  0.0501,  0.0377,  ...,  0.0832,  0.0511,  0.0605],
        [ 0.0326,  0.0395,  0.0188,  ...,  0.0414,  0.0443,  0.0441],
        [ 0.0426,  0.0569,  0.0389,  ...,  0.0842,  0.0527,  0.0711],
        ...,
        [ 0.0663,  0.1448,  0.0607,  ...,  0.0801,  0.0775,  0.1315],
        [ 0.0298,  0.0420,  0.0410,  ...,  0.0656,  0.0495,  0.0369],
        [ 0.0576,  0.1152,  0.0389,  ...,  0.0929,  0.0666,  0.0837]], device='cuda:0')
loss: 102.0401382446289
var: tensor([[ 0.0342,  0.0404,  0.0161,  ...,  0.0378,  0.0372,  0.0341],
        [ 0.0353,  0.0516,  0.0306,  ...,  0.0469,  0.0445,  0.0570],
        [ 0.0625,  0.0786,  0.0515,  ...,  0.0731,  0.0641,  0.0589],
        ...,
        [ 0.0556,  0.0601,  0.0416,  ...,  0.0760,  0.0512,  0.0691],
        [ 0.0500,  0.0746,  0.0618,  ...,  0.0730,  0.0736,  0.0514],
        [ 0.0757,  0.0864,  0.0313,  ...,  0.1109,  0.0980,  0.0553]], device='cuda:0')
loss: 108.17739868164062
var: tensor([[

var: tensor([[ 0.1230,  0.1226,  0.0869,  ...,  0.1753,  0.1029,  0.1556],
        [ 0.0450,  0.0396,  0.0289,  ...,  0.0417,  0.0556,  0.0525],
        [ 0.0509,  0.0681,  0.0256,  ...,  0.0685,  0.0681,  0.0610],
        ...,
        [ 0.0624,  0.0737,  0.0488,  ...,  0.0650,  0.0763,  0.0795],
        [ 0.0790,  0.1053,  0.0283,  ...,  0.0919,  0.0914,  0.0643],
        [ 0.0542,  0.0710,  0.0293,  ...,  0.0571,  0.0752,  0.0519]], device='cuda:0')
loss: 102.91575622558594
var: tensor([[ 0.0344,  0.0440,  0.0316,  ...,  0.0500,  0.0614,  0.0677],
        [ 0.0359,  0.0467,  0.0356,  ...,  0.0516,  0.0684,  0.0566],
        [ 0.0255,  0.0323,  0.0251,  ...,  0.0448,  0.0413,  0.0489],
        ...,
        [ 0.0230,  0.0344,  0.0296,  ...,  0.0442,  0.0644,  0.0512],
        [ 0.0245,  0.0532,  0.0231,  ...,  0.0726,  0.0515,  0.0502],
        [ 0.0331,  0.0637,  0.0409,  ...,  0.0594,  0.0801,  0.0540]], device='cuda:0')
loss: 106.22464752197266
var: tensor([[ 0.0334,  0.0857,  0.037

var: tensor([[ 0.0676,  0.0970,  0.0913,  ...,  0.1072,  0.1023,  0.0732],
        [ 0.0484,  0.0422,  0.0272,  ...,  0.0557,  0.0390,  0.0483],
        [ 0.0510,  0.0450,  0.0297,  ...,  0.0738,  0.0515,  0.0527],
        ...,
        [ 0.0571,  0.0525,  0.0464,  ...,  0.0838,  0.0604,  0.0392],
        [ 0.0468,  0.0969,  0.0703,  ...,  0.0939,  0.0707,  0.0627],
        [ 0.0976,  0.0525,  0.0291,  ...,  0.0716,  0.0335,  0.0613]], device='cuda:0')
loss: 104.72727966308594
var: tensor([[ 0.0514,  0.0626,  0.0338,  ...,  0.0827,  0.0494,  0.0805],
        [ 0.0558,  0.0526,  0.0348,  ...,  0.0697,  0.0717,  0.0488],
        [ 0.0516,  0.0480,  0.0481,  ...,  0.0783,  0.0601,  0.0610],
        ...,
        [ 0.0466,  0.0449,  0.0237,  ...,  0.0455,  0.0446,  0.0433],
        [ 0.0856,  0.1186,  0.0361,  ...,  0.1054,  0.0930,  0.0697],
        [ 0.0830,  0.0787,  0.0407,  ...,  0.1114,  0.0777,  0.0827]], device='cuda:0')
loss: 102.78085327148438
var: tensor([[ 0.0443,  0.0452,  0.028

var: tensor([[ 0.0371,  0.0476,  0.0292,  ...,  0.0639,  0.0568,  0.0515],
        [ 0.0461,  0.0668,  0.0365,  ...,  0.0620,  0.0529,  0.0420],
        [ 0.0422,  0.0581,  0.0365,  ...,  0.0645,  0.0630,  0.0599],
        ...,
        [ 0.0355,  0.0593,  0.0305,  ...,  0.0566,  0.0475,  0.0762],
        [ 0.0402,  0.0562,  0.0394,  ...,  0.0444,  0.0471,  0.0495],
        [ 0.0276,  0.0376,  0.0443,  ...,  0.0542,  0.0597,  0.0403]], device='cuda:0')
loss: 105.12335205078125
var: tensor([[ 0.0515,  0.0534,  0.0315,  ...,  0.0679,  0.0455,  0.0674],
        [ 0.0296,  0.0524,  0.0271,  ...,  0.0586,  0.0347,  0.0552],
        [ 0.0476,  0.0722,  0.0294,  ...,  0.0748,  0.0543,  0.0580],
        ...,
        [ 0.0799,  0.0720,  0.0644,  ...,  0.0853,  0.0593,  0.0801],
        [ 0.0265,  0.0478,  0.0357,  ...,  0.0525,  0.0745,  0.0391],
        [ 0.0613,  0.1261,  0.0800,  ...,  0.1895,  0.0937,  0.1345]], device='cuda:0')
loss: 107.21654510498047
var: tensor([[ 0.0362,  0.0562,  0.044

var: tensor([[ 0.0263,  0.0520,  0.0511,  ...,  0.0659,  0.0610,  0.0901],
        [ 0.0266,  0.0525,  0.0362,  ...,  0.0579,  0.0597,  0.0605],
        [ 0.0377,  0.0571,  0.0284,  ...,  0.0691,  0.0459,  0.0569],
        ...,
        [ 0.0331,  0.0539,  0.0442,  ...,  0.0700,  0.0729,  0.0665],
        [ 0.0278,  0.0826,  0.0471,  ...,  0.0518,  0.0822,  0.0508],
        [ 0.0522,  0.0691,  0.0401,  ...,  0.0796,  0.0658,  0.0781]], device='cuda:0')
loss: 103.77491760253906
var: tensor([[ 0.0238,  0.0514,  0.0497,  ...,  0.0589,  0.0720,  0.0537],
        [ 0.0174,  0.0269,  0.0231,  ...,  0.0427,  0.0301,  0.0282],
        [ 0.0523,  0.1837,  0.0661,  ...,  0.1328,  0.0837,  0.1140],
        ...,
        [ 0.0480,  0.0890,  0.0378,  ...,  0.0715,  0.0715,  0.0731],
        [ 0.0320,  0.0394,  0.0407,  ...,  0.0644,  0.0560,  0.0666],
        [ 0.0294,  0.0471,  0.0353,  ...,  0.0438,  0.0661,  0.0412]], device='cuda:0')
loss: 105.02857208251953
var: tensor([[ 0.0458,  0.0818,  0.040

var: tensor([[ 0.0380,  0.1037,  0.0361,  ...,  0.0615,  0.0672,  0.0622],
        [ 0.0466,  0.0721,  0.0376,  ...,  0.0921,  0.0547,  0.0729],
        [ 0.0456,  0.0818,  0.0370,  ...,  0.1068,  0.0768,  0.0742],
        ...,
        [ 0.0903,  0.1073,  0.0388,  ...,  0.1274,  0.1027,  0.0818],
        [ 0.0334,  0.0467,  0.0281,  ...,  0.0624,  0.0473,  0.0487],
        [ 0.0847,  0.0798,  0.0641,  ...,  0.1001,  0.0791,  0.0889]], device='cuda:0')
loss: 107.04118347167969
var: tensor([[ 0.0691,  0.1885,  0.0544,  ...,  0.1981,  0.0891,  0.1153],
        [ 0.0582,  0.0997,  0.0482,  ...,  0.1080,  0.0882,  0.0754],
        [ 0.0369,  0.1174,  0.0555,  ...,  0.0622,  0.0695,  0.0557],
        ...,
        [ 0.0245,  0.0544,  0.0357,  ...,  0.0790,  0.0621,  0.0483],
        [ 0.0290,  0.0314,  0.0260,  ...,  0.0503,  0.0295,  0.0430],
        [ 0.0476,  0.0768,  0.0406,  ...,  0.0913,  0.0732,  0.0558]], device='cuda:0')
loss: 108.2008056640625
var: tensor([[ 0.0373,  0.0571,  0.0566

var: tensor([[ 0.0475,  0.0829,  0.0526,  ...,  0.0859,  0.0735,  0.0487],
        [ 0.0456,  0.0655,  0.0381,  ...,  0.0963,  0.0643,  0.0566],
        [ 0.0344,  0.0770,  0.0443,  ...,  0.0836,  0.0533,  0.0575],
        ...,
        [ 0.0607,  0.0732,  0.0381,  ...,  0.1114,  0.0644,  0.0815],
        [ 0.0538,  0.0571,  0.0437,  ...,  0.0895,  0.0595,  0.0708],
        [ 0.0636,  0.1267,  0.0352,  ...,  0.1079,  0.0645,  0.1029]], device='cuda:0')
loss: 109.20050811767578
var: tensor([[ 0.0435,  0.0607,  0.0439,  ...,  0.0703,  0.0557,  0.0538],
        [ 0.0596,  0.0697,  0.0448,  ...,  0.0953,  0.0542,  0.0804],
        [ 0.0380,  0.0541,  0.0474,  ...,  0.0620,  0.0592,  0.0461],
        ...,
        [ 0.0380,  0.0503,  0.0411,  ...,  0.0516,  0.0494,  0.0550],
        [ 0.0350,  0.0499,  0.0333,  ...,  0.0475,  0.0505,  0.0534],
        [ 0.0360,  0.0478,  0.0374,  ...,  0.0356,  0.0514,  0.0469]], device='cuda:0')
loss: 105.60771179199219
var: tensor([[ 0.0317,  0.0519,  0.030

var: tensor([[ 0.1200,  0.0553,  0.0409,  ...,  0.0931,  0.0575,  0.1154],
        [ 0.2119,  0.2015,  0.0791,  ...,  0.1683,  0.1456,  0.1950],
        [ 0.0497,  0.0545,  0.0286,  ...,  0.0471,  0.0503,  0.0428],
        ...,
        [ 0.0588,  0.0502,  0.0270,  ...,  0.0546,  0.0452,  0.0648],
        [ 0.0464,  0.0630,  0.0296,  ...,  0.0633,  0.0507,  0.0587],
        [ 0.0250,  0.0389,  0.0316,  ...,  0.0371,  0.0562,  0.0434]], device='cuda:0')
loss: 104.22496032714844
var: tensor([[ 0.0599,  0.0813,  0.0402,  ...,  0.0690,  0.0531,  0.0844],
        [ 0.0413,  0.0572,  0.0331,  ...,  0.0714,  0.0515,  0.0739],
        [ 0.0432,  0.0610,  0.0325,  ...,  0.0547,  0.0543,  0.0522],
        ...,
        [ 0.1744,  0.1622,  0.0626,  ...,  0.2211,  0.1524,  0.2009],
        [ 0.0418,  0.0659,  0.0310,  ...,  0.0929,  0.0613,  0.0563],
        [ 0.0694,  0.0802,  0.0396,  ...,  0.0881,  0.0802,  0.0812]], device='cuda:0')
loss: 104.32799530029297
var: tensor([[ 0.0489,  0.0775,  0.041

====> Test set loss: 97.2699


In [12]:
# Threshold demo: flag every entry of x that is strictly greater than the
# entry of t at the same position, then convert the mask to floats.
t = torch.tensor([[1, 1], [1, 1]])
x = torch.tensor([[1, 2], [3, 4]])
x = torch.gt(x, t).float()  # element-wise x > t, cast to 0./1.
x

tensor([[ 0.,  1.],
        [ 1.,  1.]])

In [None]:
# Bare expression: in a notebook this echoes the repr of the training
# DataLoader built at the top of the file (no output is recorded for this cell).
train_loader

In [5]:
# Walk through every batch produced by train_loader and report the Python
# type and the shape of the image tensor; the labels are ignored.
for batch_idx, (data, _) in enumerate(train_loader):
    # One print call with a newline separator emits the same two lines
    # as two separate print calls would.
    print(type(data), data.shape, sep="\n")
    # A flattened view, data.view(-1, 784), could be inspected here as well.

<class 'torch.Tensor'>
torch.Size([128, 1, 28, 28])
<class 'torch.Tensor'>
torch.Size([128, 1, 28, 28])
<class 'torch.Tensor'>
torch.Size([128, 1, 28, 28])
<class 'torch.Tensor'>
torch.Size([128, 1, 28, 28])
<class 'torch.Tensor'>
torch.Size([128, 1, 28, 28])
<class 'torch.Tensor'>
torch.Size([128, 1, 28, 28])
<class 'torch.Tensor'>
torch.Size([128, 1, 28, 28])
<class 'torch.Tensor'>
torch.Size([128, 1, 28, 28])
<class 'torch.Tensor'>
torch.Size([128, 1, 28, 28])
<class 'torch.Tensor'>
torch.Size([128, 1, 28, 28])
<class 'torch.Tensor'>
torch.Size([128, 1, 28, 28])
<class 'torch.Tensor'>
torch.Size([128, 1, 28, 28])
<class 'torch.Tensor'>
torch.Size([128, 1, 28, 28])
<class 'torch.Tensor'>
torch.Size([128, 1, 28, 28])
<class 'torch.Tensor'>
torch.Size([128, 1, 28, 28])
<class 'torch.Tensor'>
torch.Size([128, 1, 28, 28])
<class 'torch.Tensor'>
torch.Size([128, 1, 28, 28])
<class 'torch.Tensor'>
torch.Size([128, 1, 28, 28])
<class 'torch.Tensor'>
torch.Size([128, 1, 28, 28])
<class 'torc

<class 'torch.Tensor'>
torch.Size([128, 1, 28, 28])
<class 'torch.Tensor'>
torch.Size([128, 1, 28, 28])
<class 'torch.Tensor'>
torch.Size([128, 1, 28, 28])
<class 'torch.Tensor'>
torch.Size([128, 1, 28, 28])
<class 'torch.Tensor'>
torch.Size([128, 1, 28, 28])
<class 'torch.Tensor'>
torch.Size([128, 1, 28, 28])
<class 'torch.Tensor'>
torch.Size([128, 1, 28, 28])
<class 'torch.Tensor'>
torch.Size([128, 1, 28, 28])
<class 'torch.Tensor'>
torch.Size([128, 1, 28, 28])
<class 'torch.Tensor'>
torch.Size([128, 1, 28, 28])
<class 'torch.Tensor'>
torch.Size([128, 1, 28, 28])
<class 'torch.Tensor'>
torch.Size([128, 1, 28, 28])
<class 'torch.Tensor'>
torch.Size([128, 1, 28, 28])
<class 'torch.Tensor'>
torch.Size([128, 1, 28, 28])
<class 'torch.Tensor'>
torch.Size([128, 1, 28, 28])
<class 'torch.Tensor'>
torch.Size([128, 1, 28, 28])
<class 'torch.Tensor'>
torch.Size([128, 1, 28, 28])
<class 'torch.Tensor'>
torch.Size([128, 1, 28, 28])
<class 'torch.Tensor'>
torch.Size([128, 1, 28, 28])
<class 'torc

<class 'torch.Tensor'>
torch.Size([128, 1, 28, 28])
<class 'torch.Tensor'>
torch.Size([128, 1, 28, 28])
<class 'torch.Tensor'>
torch.Size([128, 1, 28, 28])
<class 'torch.Tensor'>
torch.Size([128, 1, 28, 28])
<class 'torch.Tensor'>
torch.Size([128, 1, 28, 28])
<class 'torch.Tensor'>
torch.Size([128, 1, 28, 28])
<class 'torch.Tensor'>
torch.Size([128, 1, 28, 28])
<class 'torch.Tensor'>
torch.Size([128, 1, 28, 28])
<class 'torch.Tensor'>
torch.Size([128, 1, 28, 28])
<class 'torch.Tensor'>
torch.Size([128, 1, 28, 28])
<class 'torch.Tensor'>
torch.Size([128, 1, 28, 28])
<class 'torch.Tensor'>
torch.Size([128, 1, 28, 28])
<class 'torch.Tensor'>
torch.Size([128, 1, 28, 28])
<class 'torch.Tensor'>
torch.Size([128, 1, 28, 28])
<class 'torch.Tensor'>
torch.Size([128, 1, 28, 28])
<class 'torch.Tensor'>
torch.Size([128, 1, 28, 28])
<class 'torch.Tensor'>
torch.Size([128, 1, 28, 28])
<class 'torch.Tensor'>
torch.Size([128, 1, 28, 28])
<class 'torch.Tensor'>
torch.Size([128, 1, 28, 28])
<class 'torc