In [2]:
link = 'D:/users/Marko/downloads/mirna/'

# Imports

In [3]:
%load_ext tensorboard

In [4]:
import sys
#sys.path.insert(0,'/content/drive/MyDrive/Marko/master')
sys.path.insert(0, link)
import numpy as np
import matplotlib.pyplot as plt

#import tensorflow as tf

import torch
import torch.optim as optim
import torch.nn as nn
import torch.distributions as dist

from torch.nn import functional as F
from torchinfo import summary
from torch.utils.tensorboard import SummaryWriter
from torch.utils.data import Dataset, DataLoader
from torch.autograd import Variable

from sklearn.preprocessing import OneHotEncoder

from tqdm import tqdm
from tqdm import trange

import datetime
import math


writer = SummaryWriter(f"{link}/saved_models/new/HVAE2/tensorboard")

In [5]:
DEVICE = torch.device("cuda" if torch.cuda.is_available() else "cpu")

In [6]:
DEVICE

device(type='cuda')

# Model Classes

In [7]:
class diva_args:

    def __init__(self, z1_dim=1000, z2_dim=1000, d_dim=45, x_dim=7500, y_dim=2,
                 h_dim = 600, h2_dim = 600, number_components = 500,
                 beta=1, rec_alpha = 100, rec_beta = 20, 
                 rec_gamma = 1, warmup = 1, prewarmup = 1):

        self.z1_dim = z1_dim
        self.z2_dim = z2_dim
        self.d_dim = d_dim
        self.x_dim = x_dim
        self.y_dim = y_dim
        
        self.h_dim = h_dim
        self.h2_dim = h2_dim
        
        self.number_components = number_components
        
        self.beta = beta
        self.rec_alpha = rec_alpha
        self.rec_beta = rec_beta
        self.rec_gamma = rec_gamma
        self.warmup = warmup
        self.prewarmup = prewarmup


## Dataset Class

In [8]:
class MicroRNADataset(Dataset):

    def __init__(self, ds='train', create_encodings=False, use_subset=False):
        
        # loading images
        self.images = np.load(f'{link}/data/modmirbase_{ds}_images.npz')['arr_0']/255
        
        
        # loading labels
        print('Loading Labels! (~10s)')     
        ohe = OneHotEncoder(categories='auto', sparse=False)
        labels = np.load(f'{link}/data/modmirbase_{ds}_labels.npz')['arr_0']
        self.labels = ohe.fit_transform(labels)
        
        # loading encoded images
        print("loading encodings")
        if create_encodings:
            x_len, x_bar, x_col = self.get_encoded_values(self.images, ds)
        else:
            x_len = np.load(f'{link}/data/modmirbase_{ds}_images_len3.npz')
            x_bar = np.load(f'{link}/data/modmirbase_{ds}_images_bar3.npz')
            x_col = np.load(f'{link}/data/modmirbase_{ds}_images_col3.npz')
        
        self.x_len = x_len
        self.x_bar = x_bar
        self.x_col = x_col
        
        
        self.mountain = np.load(f'{link}/data/modmirbase_{ds}_mountain.npy')
        
        
        # loading names
        print('Loading Names! (~5s)')
        names =  np.load(f'{link}/data/modmirbase_{ds}_names.npz')['arr_0']
        names = [i.decode('utf-8') for i in names]
        self.species = ['mmu', 'prd', 'hsa', 'ptr', 'efu', 'cbn', 'gma', 'pma',
                        'cel', 'gga', 'ipu', 'ptc', 'mdo', 'cgr', 'bta', 'cin', 
                        'ppy', 'ssc', 'ath', 'cfa', 'osa', 'mtr', 'gra', 'mml',
                        'stu', 'bdi', 'rno', 'oan', 'dre', 'aca', 'eca', 'chi',
                        'bmo', 'ggo', 'aly', 'dps', 'mdm', 'ame', 'ppc', 'ssa',
                        'ppt', 'tca', 'dme', 'sbi']
        # assigning a species label to each observation from species
        # with more than 200 observations from past research
        self.names = []
        for i in names:
            append = False
            for j in self.species:
                if j in i.lower():
                    self.names.append(j)
                    append = True
                    break
            if not append:
                if 'random' in i.lower() or i.isdigit():
                    self.names.append('hsa')
                else:
                    self.names.append('notfound')
        
        # performing one hot encoding
        ohe = OneHotEncoder(categories='auto', sparse=False)
        
       
        
        self.names_ohe = ohe.fit_transform(np.array(self.names).reshape(-1,1))
          
        if use_subset:    
            idxes = [i == 'hsa' and np.random.choice([True, False]) for i in self.names]
            self.names_ohe = self.names_ohe[idxes]
            self.labels = self.labels[idxes]
            self.images = self.images[idxes]
            self.x_len = self.x_len[idxes]
            self.x_col = self.x_col[idxes]
            self.x_bar = self.x_bar[idxes]
            self.mountain = self.mountain[idxes]
    
    def __len__(self):
        return(self.images.shape[0])

    def __getitem__(self, idx):
        d = self.names_ohe[idx]
        y = self.labels[idx]
        x = self.images[idx]
        x = np.transpose(x, (2,0,1))
        x_len = self.x_len[idx]
        x_col = self.x_col[idx]
        x_bar = self.x_bar[idx]
        mount = self.mountain[idx]                        
        return (x, y, d, x_len, x_col, x_bar, mount)


    def get_encoded_values(self, x, ds):
        """
        given an image or batch of images
        returns length of strand, length of bars and colors of bars
        """
        n = x.shape[0]
        x = np.transpose(x, (0,3,1,2))
        out_len = np.zeros((n), dtype=np.uint8)
        out_col = np.zeros((n,5,2,100), dtype=np.uint8)
        out_bar = np.zeros((n,2,100), dtype=np.uint8)

        for i in range(n):
            if i % 100 == 0:
                print(f'at {i} out of {n}')
            rna_len = 0
            broke = False
            for j in range(100):
                if (x[i,:,12,j] == np.array([1,1,1])).all():
                    out_len[i] = rna_len
                    broke = True
                    break
                else:
                    rna_len += 1
                    # check color of bars
                    out_col[i, self.get_color(x[i,:,12,j]), 0, j] = 1 
                    out_col[i, self.get_color(x[i,:,13,j]), 1, j] = 1
                    # check length of bars
                    len1 = 0
                    # loop until white pixel
                    while not (x[i,:,12-len1,j] == np.array([1.,1.,1.])).all():
                        len1 += 1
                        if 13-len1 == 0:
                            break
                    out_bar[i, 0, j] = len1

                    len2 = 0
                    while not (x[i,:,13+len2,j] == np.array([1.,1.,1.])).all():
                        len2 += 1
                        if 13+len2 == 25:
                            break
                    out_bar[i, 1, j] = len2
            if not broke:
                out_len[i] = rna_len


        with open(f'{link}/data/modmirbase_{ds}_images_len3.npz', 'wb') as f:
            np.save(f, out_len)
        with open(f'{link}/data/modmirbase_{ds}_images_col3.npz', 'wb') as f:
            np.save(f, out_col)
        with open(f'{link}/data/modmirbase_{ds}_images_bar3.npz', 'wb') as f:
            np.save(f, out_bar)
        

        return out_len, out_bar, out_col

    def get_color(self, pixel):
        """
        returns the encoded value for a pixel
        """
        if (pixel == np.array([0,0,0])).all():  
            return 0 # black
        elif (pixel == np.array([1,0,0])).all():  
            return 1 # red
        elif (pixel == np.array([0,0,1])).all():  
            return 2 # blue
        elif (pixel == np.array([0,1,0])).all():  
            return 3 # green
        elif (pixel == np.array([1,1,0])).all():  
            return 4 # yellow
        else:
            print("Something wrong!")


## Decoder classes

In [15]:
# Decoders
class px(nn.Module):
    def __init__(self, d_dim, x_dim, y_dim, z1_dim, z2_dim, 
                 h_dim, h2_dim, dim0=2000, dim1=1200, dim2=400):
        super(px, self).__init__()

        
        # p(z1|z2)
        
        self.p_z1 = nn.Sequential(nn.Linear(z2_dim+200, h2_dim),
                                  nn.ReLU(),
                                  nn.Linear(h2_dim, h2_dim),
                                  nn.ReLU())
        self.mu_z1 = nn.Sequential(nn.Linear(h2_dim, z1_dim))
        self.si_z1 = nn.Sequential(nn.Linear(h2_dim, z1_dim), nn.Softplus())
        
        
        # p(x|z1,z2,m)
        
        self.px_z1 = nn.Sequential(nn.Linear(z1_dim, h_dim),
                                   nn.ReLU())
        self.px_z2 = nn.Sequential(nn.Linear(z2_dim+200, h_dim),
                                   nn.ReLU())
        # seperate decoders for length of RNA, color and size of bars
        self.fc_col = nn.Sequential(nn.Linear(2*h_dim, 600),
                                    nn.ReLU())
        self.dc_col1 = nn.Sequential(nn.ConvTranspose2d(in_channels=12, out_channels=48, 
                                                       kernel_size=4, stride=(2,2), padding=(1,1)),  
                                     nn.ReLU())
        self.dc_col2 = nn.Sequential(nn.ConvTranspose2d(in_channels=48, out_channels=48,
                                                       kernel_size=3, stride=(1,1), padding=(1,1)),
                                     nn.ReLU())
        self.dc_col3 = nn.Sequential(nn.ConvTranspose2d(in_channels=48, out_channels=96,
                                                        kernel_size=3, stride=(1,1), padding=(1,1)),
                                     nn.ReLU())
        self.dc_col4 = nn.Sequential(nn.ConvTranspose2d(in_channels=96, out_channels=96,
                                                        kernel_size=3, stride=(1,1), padding=(1,1)),
                                     nn.ReLU())
        self.dc_col5 = nn.Sequential(nn.ConvTranspose2d(in_channels=96, out_channels=5,
                                                        kernel_size=3, stride=(1,1), padding=(1,1)),
                                     nn.Softmax(dim=1))
        
        self.fc_bar = nn.Sequential(nn.Linear(2*h_dim, dim1),  
                                    nn.ReLU(),
                                    nn.Linear(dim1, dim2),
                                    nn.ReLU(),
                                    nn.Dropout(0.2))
        
        self.fc_len = nn.Sequential(nn.Linear(2*h_dim, dim1),  
                                    nn.ReLU(),
                                    nn.Linear(dim1, dim2),
                                    nn.ReLU(),
                                    nn.Dropout(0.2))
#         self.fc3 = nn.Sequential(nn.Linear(dim1, dim2, bias=False),
#                                  nn.ReLU())
        
        # Predicting length and color of each bar
        #self.color = nn.Sequential(nn.Conv1d(1,5, kernel_size=1, bias=False), 
                                  # nn.Softmax(dim=1))

        
        # Predicting the length of each bar
        self.length_bar_top = nn.Sequential(nn.Linear(dim2,100), nn.Softplus())
        self.length_bar_bot = nn.Sequential(nn.Linear(dim2,100), nn.Softplus())
        #self.length_bar_scale = nn.Sequential(nn.Conv1d(100, 1, kernel_size = 3, padding = 'same', bias=False), nn.Sigmoid())
        
        # Predicting length of the RNA strand
        self.length_RNA = nn.Sequential(nn.Linear(dim2,400), nn.ReLU(),nn.Linear(400,1), nn.Softplus())
        #self.length_RNA_scale = nn.Sequential(nn.Linear(400,1, bias=False), nn.Sigmoid())
        
    def forward(self, z1, mz2):
        
        # p(z1|z2)
        pz1 = self.p_z1(mz2)
        pz1_m = self.mu_z1(pz1)
        pz1_s = self.si_z1(pz1)
        
        # p(x|z1,z2,m)
        hz1 = self.px_z1(z1)
        hz2 = self.px_z2(mz2)
        h = torch.cat([hz1,hz2],1)
        
        len_RNA = self.fc_len(h)
        len_RNA = self.length_RNA(len_RNA)
        len_RNA_sc = nn.Parameter(torch.tensor([1.])).to(DEVICE)

        
        len_bar = self.fc_bar(h)
        len_bar = torch.cat([self.length_bar_top(len_bar)[:,None,:],self.length_bar_bot(len_bar)[:,None,:]], dim=1) 
        len_bar_sc = nn.Parameter(torch.tensor([1.])).to(DEVICE)

        col = self.fc_col(h)
        col = col.reshape(-1,12,1,50)
        col1 = self.dc_col1(col)
        col2 = self.dc_col2(col1) + col1
        col3 = self.dc_col3(col2)
        col4 = self.dc_col4(col3) + col3
        col_bar = self.dc_col5(col4)
        
        
        return len_RNA, len_RNA_sc, len_bar, len_bar_sc, col_bar, pz1_m, pz1_s

    def reconstruct_image(self, len_RNA, var_RNA, len_bar, var_bar ,col_bar, sample=False):
        """
        reconstructs RNA image given output from decoder
        even indexes of len_bar and col_bar   -> top
        uneven indexes of len_bar and col_bar -> bottom
        function does not support sampling yet
        color reconstructions: 0: black
                               1: red
                               2: blue
                               3: green
                               4: yellow
        """
        color_dict = {
                  0: np.array([0,0,0]), # black
                  1: np.array([1,0,0]), # red
                  3: np.array([0,1,0]), # green
                  2: np.array([0,0,1]), # blue
                  4: np.array([1,1,0])  # yellow
                  }
    
        
        len_RNA = len_RNA.cpu().numpy()
        var_RNA = var_RNA.cpu().numpy()
        #.reshape((100,))
        len_bar = len_bar.cpu().numpy()
        var_bar = var_bar.cpu().numpy()
        col_bar = col_bar.cpu().numpy()
        n = len_RNA.shape[0]
        output = np.ones((n,25,100,3))

        for i in range(n):
            if sample:
                limit = int(np.round(np.random.normal(loc=len_RNA[i], scale=var_RNA[i])))
            else:
                limit = int(np.round(len_RNA[i]))
            limit = min(100, limit)
            for j in range(limit):
                if sample:
                    _len_bar_1 = int(np.round(np.random.normal(loc=len_bar[i,0,j], scale=var_bar[i,0,j])))
                    _len_bar_2 = int(np.round(np.random.normal(loc=len_bar[i,1,j], scale=var_bar[i,1,j])))
                    _col_bar_1 = np.random.choice(np.arange(5), p = col_bar[i, :, 2*j])
                    _col_bar_2 = np.random.choice(np.arange(5), p = col_bar[i,:, 2*j+1])
                else:
                    _len_bar_1 = int(np.round(len_bar[i,0,j])) 
                    _len_bar_2 = int(np.round(len_bar[i,1,j]))
                    _col_bar_1 = np.argmax(col_bar[i,:,0,j])
                    _col_bar_2 = np.argmax(col_bar[i,:,1,j])
                
                h1 = max(0,13-_len_bar_1)
                # paint upper bar
                output[i, h1:13, j] = color_dict[_col_bar_1]
                h2 = min(25,13+_len_bar_2)
                # paint lower bar
                output[i, 13:h2, j] = color_dict[_col_bar_2]
        
        
        return output


In [16]:
int(np.round(3.7, 0))
int(3.7)

3

In [17]:
# pzy_ = pzy(45, 7500, 2, 32,32,32)
# summary(pzy_, (1,2))
pzy_ = px(45, 7500, 2, 500,500,500,500)
summary(pzy_, [(1,500),(1,700)])

Layer (type:depth-idx)                   Output Shape              Param #
px                                       --                        --
├─Sequential: 1-1                        [1, 500]                  --
│    └─Linear: 2-1                       [1, 500]                  350,500
│    └─ReLU: 2-2                         [1, 500]                  --
│    └─Linear: 2-3                       [1, 500]                  250,500
│    └─ReLU: 2-4                         [1, 500]                  --
├─Sequential: 1-2                        [1, 500]                  --
│    └─Linear: 2-5                       [1, 500]                  250,500
├─Sequential: 1-3                        [1, 500]                  --
│    └─Linear: 2-6                       [1, 500]                  250,500
│    └─Softplus: 2-7                     [1, 500]                  --
├─Sequential: 1-4                        [1, 500]                  --
│    └─Linear: 2-8                       [1, 500]                

## Endcoder Classes

In [18]:
#pzy_.reconstruct_image(torch.zeros((1,100)), torch.zeros((1,13,200)), torch.zeros(1,5,200)).shape

In [19]:
class qz(nn.Module):
    def __init__(self, d_dim, x_dim, y_dim, z1_dim ,z2_dim, h_dim, h2_dim):
        super(qz, self).__init__()

        # q(z2 | x)
        self.encoder_z2 = nn.Sequential(
            nn.Conv2d(3, 32, kernel_size=3, stride=1, padding = 'valid',bias=False),
            nn.ReLU(),
            nn.Conv2d(32, 64, kernel_size=3, stride=1, padding = 'valid',bias=False),
            nn.ReLU(),
            nn.MaxPool2d(2, 2),
            nn.Conv2d(64, 128, kernel_size=3, stride=1, padding = 'valid', bias=False),
            nn.ReLU(), 
#             nn.Conv2d(128, 128, kernel_size=3, stride=1, padding = 'same', bias=False),
#             nn.ReLU(), 
            nn.MaxPool2d(2, 2),
            nn.Conv2d(128, 256, kernel_size=3, stride=1, bias=False),
            nn.ReLU(), 
            nn.MaxPool2d(2, 2),
        )
        
        self.mu_z2 = nn.Sequential(nn.Linear(2560, z2_dim))
        self.si_z2 = nn.Sequential(nn.Linear(2560, z2_dim), nn.Softplus())
        
        
        # q(z1 | x, z2)
        self.encoder_z1 = nn.Sequential(
            nn.Conv2d(3, 32, kernel_size=3, stride=1, padding = 'valid',bias=False),
            nn.ReLU(),
            nn.Conv2d(32, 64, kernel_size=3, stride=1, padding = 'valid',bias=False),
            nn.ReLU(),
            nn.MaxPool2d(2, 2),
            nn.Conv2d(64, 128, kernel_size=3, stride=1, padding = 'valid', bias=False),
            nn.ReLU(), 
#             nn.Conv2d(128, 128, kernel_size=3, stride=1, padding = 'same', bias=False),
#             nn.ReLU(), 
            nn.MaxPool2d(2, 2),
            nn.Conv2d(128, 256, kernel_size=3, stride=1, bias=False),
            nn.ReLU(), 
            nn.MaxPool2d(2, 2),
        )
        
        self.fc_z2 = nn.Sequential(nn.Linear(z2_dim+200, h_dim), nn.ReLU())
        self.fc_z1 = nn.Sequential(nn.Linear(2560, h_dim), nn.ReLU())
        
        self.fc_z1_z2 = nn.Sequential(nn.Linear(2*h_dim, h2_dim), nn.ReLU())
        
        self.mu_z1 = nn.Sequential(nn.Linear(h2_dim, z1_dim))
        self.si_z1 = nn.Sequential(nn.Linear(h2_dim, z1_dim), nn.Softplus())

#         torch.nn.init.xavier_uniform_(self.encoder[0].weight)
#         torch.nn.init.xavier_uniform_(self.encoder[3].weight)
#         torch.nn.init.xavier_uniform_(self.fc11[0].weight)
#         self.fc11[0].bias.data.zero_()
#         torch.nn.init.xavier_uniform_(self.fc12[0].weight)
#         self.fc12[0].bias.data.zero_()
    
    def q_z2(self, x):
        z2 = self.encoder_z2(x)
        z2 = z2.view(-1, 2560)
        z2_m = self.mu_z2(z2) 
        z2_s = self.si_z2(z2)
        
        return z2_m, z2_s
    
    def forward(self, x, m):
        
        # q(z2 | x) & m
        z2_m, z2_s = self.q_z2(x)
        # reparameterization trick
        qz2 = dist.Normal(z2_m, z2_s)
        z2 = qz2.rsample()
        # z2 & m
        mz2 = torch.cat([z2, m],1)
        
        
        
        # q(z1 | x, z2, m)
        z1 = self.encoder_z1(x)
        z1 = z1.view(-1, 2560)
        z1 = self.fc_z1(z1)
        
        mz2_ = self.fc_z2(mz2)
        
        z1 = torch.cat([mz2_, z1],1)
        z1 = self.fc_z1_z2(z1)
        z1_m = self.mu_z1(z1)
        z1_s = self.si_z1(z1)
        
        qz1 = dist.Normal(z1_m, z1_s)
        z1 = qz1.rsample()
        
        
        #z_loc = self.fc11(h)
        #z_scale = self.fc12(h) + 1e-7

        return z1, z2, mz2, z1_m, z1_s, z2_m, z2_s




In [20]:
a = torch.tensor([[1,2,3],[4,5,6]])
b = torch.tensor([[1,3],[4,6]])

torch.cat([a,b],1)

tensor([[1, 2, 3, 1, 3],
        [4, 5, 6, 4, 6]])

In [21]:
enc = qz(128,10,10,10,500,400,400)
enc(torch.zeros((1,3,25,100)), torch.zeros((1,200)))
summary(enc, [(1,3,25,100),(1,200)])

Layer (type:depth-idx)                   Output Shape              Param #
qz                                       --                        --
├─Sequential: 1-1                        [1, 256, 1, 10]           --
│    └─Conv2d: 2-1                       [1, 32, 23, 98]           864
│    └─ReLU: 2-2                         [1, 32, 23, 98]           --
│    └─Conv2d: 2-3                       [1, 64, 21, 96]           18,432
│    └─ReLU: 2-4                         [1, 64, 21, 96]           --
│    └─MaxPool2d: 2-5                    [1, 64, 10, 48]           --
│    └─Conv2d: 2-6                       [1, 128, 8, 46]           73,728
│    └─ReLU: 2-7                         [1, 128, 8, 46]           --
│    └─MaxPool2d: 2-8                    [1, 128, 4, 23]           --
│    └─Conv2d: 2-9                       [1, 256, 2, 21]           294,912
│    └─ReLU: 2-10                        [1, 256, 2, 21]           --
│    └─MaxPool2d: 2-11                   [1, 256, 1, 10]           --
├

In [22]:
def log_Normal_diag(x, mean, std, average=False, dim=None):
    log_var = 2*torch.log(std)
    log_normal = -0.5 * ( log_var + torch.pow( x - mean, 2 ) / torch.exp( log_var ) )
    if average:
        return torch.mean( log_normal, dim )
    else:
        return torch.sum( log_normal, dim )

## Full model class

In [23]:
class HVAE(nn.Module):
    def __init__(self, args):
        super(HVAE, self).__init__()
        self.z1_dim = args.z1_dim
        self.z2_dim = args.z2_dim
        self.d_dim = args.d_dim
        self.x_dim = args.x_dim
        self.y_dim = args.y_dim
        self.h_dim = args.h_dim
        self.h2_dim = args.h2_dim
        self.number_components = args.number_components
        
        #d_dim, x_dim, y_dim, z1_dim ,z2_dim, h_dim, h2_dim
        self.px = px(self.d_dim, self.x_dim, self.y_dim, self.z1_dim, self.z2_dim, 
                     self.h_dim, self.h2_dim)
        
        self.qz = qz(self.d_dim, self.x_dim, self.y_dim, self.z1_dim, self.z2_dim, 
                     self.h_dim, self.h2_dim)
        

        self.beta = args.beta
        
        self.rec_alpha = args.rec_alpha
        self.rec_beta = args.rec_beta
        self.rec_gamma = args.rec_gamma

        self.warmup = args.warmup
        self.prewarmup = args.prewarmup
        
        self.add_pseudoinputs()
        
        self.lqz1 = []
        self.lqz2 = []
        self.lpz1 = []
        self.lpz2 = []
        
        self.bar = []
        self.len = []
        self.col = []
        
        self.cuda()

    def forward(self, d, x, y, m):
        # Encode
        z1, z2, mz2, z1_m, z1_s, z2_m, z2_s = self.qz(x, m)
        # Decode
        x_len, x_len_scale, x_bar, x_bar_scale, x_col, pz1_m, pz1_s = self.px(z1, mz2)
        
        return x_len, x_len_scale, x_bar, x_bar_scale, x_col, z1, z2, z1_m, z1_s, z2_m, z2_s, pz1_m, pz1_s
    
    
    def log_p_z2(self, z2):
        C = self.number_components
        
        X = self.means(self.idle_input).view(-1,3,25,100)
        
        pz2_m, pz2_s = self.qz.q_z2(X)
        
        z_expand = z2.unsqueeze(1)
        means = pz2_m.unsqueeze(0)
        stds = pz2_s.unsqueeze(0)
        
        a = log_Normal_diag(z_expand, means, stds, dim=2) - math.log(C)
        a_max, _ = torch.max(a,1)
        
        log_prior = (a_max + torch.log(torch.sum(torch.exp(a-a_max.unsqueeze(1)),1)))
        
        return log_prior
    
    def loss_function(self, d, x, y, m, out_len, out_bar, out_col):
        
        x_len, x_len_scale, x_bar, x_bar_scale, x_col, z1, z2, z1_m, z1_s, z2_m, z2_s, pz1_m, pz1_s = self.forward(d, x, y, m)
        
        # Reconstruction Loss
        mask = (1 - F.one_hot(torch.round(out_len).to(torch.int64)-1, 100).cumsum(dim=1)[:,None,None,:])
        mask1 = (1 - F.one_hot(torch.round(out_len).to(torch.int64)-1, 100).cumsum(dim=1)[:,None,:]).repeat(1,2,1)

        x_col = mask.repeat(1,5,2,1)*x_col
        
#         x_gap = x_col[:,0,:]
#         x_nuc = x_col[:,1:,:]
                
        
        
        dist_len = dist.Normal(x_len, x_len_scale+1e-7)
        log_len = dist_len.log_prob(out_len[:,None]).mean()
        
        
        mse_bar = ((((x_bar - out_bar)**2)*mask1).sum(dim=(1,2))/(mask1.sum(dim=(1,2)))).sum()#.detach().item()
        
        max_bar = torch.argmax(x_col, dim=1)
        acc_bar = (((max_bar==torch.argmax(out_col, dim=1))*mask1).sum((1,2))/out_len).sum()
        acc_bar2 = (((max_bar==torch.argsort(out_col, dim=1)[:,1,:,:])*mask1).sum((1,2))/out_len).sum() + acc_bar
        
        RE_len = -log_len
        RE_bar = mse_bar#-log_bar
        RE_col = F.cross_entropy(x_col, out_col, reduction='sum')
          
            
        # KL loss
        KL_p_z1 = log_Normal_diag(z1, pz1_m, pz1_s, dim=1).sum()
        KL_q_z1 = log_Normal_diag(z1, z1_m, z1_s, dim=1).sum()
        KL_p_z2 = self.log_p_z2(z2).sum()
        KL_q_z2 = log_Normal_diag(z2, z2_m, z2_s, dim=1).sum()
        KL = -(KL_p_z1 + KL_p_z2 - KL_q_z1 - KL_q_z2)
        #print(KL_p_z1.shape,KL_p_z2.shape,KL_q_z1.shape,KL_q_z2.shape)
        
        
#         self.lpz1.append(KL_p_z1.detach().item())
#         self.lpz2.append(KL_p_z2.detach().item())
#         self.lqz1.append(KL_q_z1.detach().item())
#         self.lqz2.append(KL_q_z2.detach().item())
        
#         self.bar.append(RE_bar.detach())
#         self.col.append(RE_col.detach())
#         self.len.append(RE_len.detach())
        
        
        return self.rec_alpha * RE_len \
                  + self.rec_beta * RE_bar \
                  + self.rec_gamma * RE_col \
                  + self.beta * KL, \
                  RE_bar, RE_len, RE_col, mse_bar, acc_bar, acc_bar2
    
    def add_pseudoinputs(self):
        # TODO: rework pseudo generation based on reconstruction
        nonlinearity = nn.Hardtanh(min_val=0.0, max_val=1.0)
        self.means = nn.Sequential(nn.Linear(self.number_components, 3*25*100, bias=False), nonlinearity)
        self.idle_input = Variable(torch.eye(self.number_components, self.number_components), requires_grad=False).to(DEVICE)

In [24]:
a = dist.Normal(0,1)
a.log_prob(torch.tensor(10))

tensor(-50.9189)

In [25]:
default_args = diva_args()
enc = HVAE(default_args)
summary(enc,[ (1,1),(1,3,25,100),(1,1),(1,200)])

Layer (type:depth-idx)                   Output Shape              Param #
HVAE                                     --                        --
├─px: 1-1                                --                        (recursive)
│    └─Sequential: 2-1                   --                        (recursive)
│    │    └─Linear: 3-1                  --                        (recursive)
│    │    └─ReLU: 3-2                    --                        --
│    │    └─Linear: 3-3                  --                        (recursive)
│    │    └─ReLU: 3-4                    --                        --
│    └─Sequential: 2-2                   --                        (recursive)
│    │    └─Linear: 3-5                  --                        (recursive)
│    └─Sequential: 2-3                   --                        (recursive)
│    │    └─Linear: 3-6                  --                        (recursive)
│    │    └─Softplus: 3-7                --                        --
│    └─Sequen

# Training the model

## Loading dataset

In [26]:
RNA_dataset = MicroRNADataset(create_encodings=False)

Loading Labels! (~10s)
loading encodings
Loading Names! (~5s)


In [27]:
RNA_dataset_test = MicroRNADataset('test', create_encodings=False)

Loading Labels! (~10s)
loading encodings
Loading Names! (~5s)


In [28]:
RNA_dataset.x_bar.shape, RNA_dataset.x_col.shape 

((34721, 2, 100), (34721, 5, 2, 100))

In [29]:
def train_single_epoch(train_loader, model, optimizer, epoch):
    model.train()
    train_loss = 0
    epoch_bar_loss = 0
    epoch_col_loss = 0
    epoch_len_loss = 0
    no_batches = 0
    train_corr = 0
    mse_bar = 0
    acc_bar = 0
    acc_bar2 = 0
    pbar = tqdm(enumerate(train_loader), unit="batch", 
                                     desc=f'Epoch {epoch}')
    for batch_idx, (x, y, d, x_len, x_col, x_bar, m) in pbar:
        # To device
        x, y, d , x_len, x_bar, x_col, m= x.to(DEVICE), y.to(DEVICE), d.to(DEVICE), x_len.to(DEVICE), x_bar.to(DEVICE), x_col.to(DEVICE), m.to(DEVICE)

        optimizer.zero_grad()
        loss, bar_loss, len_loss, col_loss, mse, acc, acc2 = model.loss_function(d.float(), x.float(), y.float(), m.float(), x_len.float(), x_bar.float(), x_col.float())
      
        loss.backward()
        optimizer.step()
        pbar.set_postfix(loss=loss.item()/x.shape[0])
        train_loss += loss
        epoch_bar_loss += bar_loss
        epoch_col_loss += col_loss
        epoch_len_loss += len_loss
        mse_bar += mse
        acc_bar += acc
        acc_bar2 += acc2
        no_batches += 1

    train_loss /= len(train_loader.dataset)
    epoch_bar_loss /= len(train_loader.dataset)
    epoch_len_loss /= len(train_loader.dataset)
    epoch_col_loss /= len(train_loader.dataset)
    acc_bar /= len(train_loader.dataset)
    acc_bar2 /= len(train_loader.dataset)
    mse_bar /= len(train_loader.dataset)
    
    return train_loss, epoch_bar_loss, epoch_len_loss, epoch_col_loss, mse_bar, acc_bar, acc_bar2

In [30]:
def test_single_epoch(test_loader, model, epoch):
    model.eval()
    test_loss = 0
    epoch_bar_loss = 0
    epoch_col_loss = 0
    epoch_len_loss = 0
    mse_bar = 0
    acc_bar = 0   
    acc_bar2 = 0
    with torch.no_grad():
        for batch_idx, (x,y,d,x_len,x_col,x_bar, m) in enumerate(test_loader):
            x, y, d, x_len, x_bar, x_col, m = x.to(DEVICE), y.to(DEVICE), d.to(DEVICE), x_len.to(DEVICE), x_bar.to(DEVICE), x_col.to(DEVICE), m.to(DEVICE)
            loss, bar_loss, len_loss, col_loss, mse, acc, acc2 = model.loss_function(d.float(), x.float(), y.float(),m.float(),x_len.float(),x_bar.float(),x_col.float())
            test_loss += loss
            epoch_bar_loss += bar_loss
            epoch_col_loss += col_loss
            epoch_len_loss += len_loss
            mse_bar += mse
            acc_bar += acc
            acc_bar2 += acc2
    test_loss /= len(test_loader.dataset)
    epoch_bar_loss /= len(test_loader.dataset)
    epoch_len_loss /= len(test_loader.dataset)
    epoch_col_loss /= len(test_loader.dataset)
    acc_bar /= len(test_loader.dataset)
    acc_bar2 /= len(test_loader.dataset)
    mse_bar /= len(test_loader.dataset)
    
    return test_loss, epoch_bar_loss, epoch_len_loss, epoch_col_loss, mse_bar, acc_bar, acc_bar2
  

In [31]:
def train(args, train_loader, test_loader, diva, optimizer, end_epoch, start_epoch=0, save_folder='sd_1.0.0',save_interval=5):
    
    epoch_loss_sup = []
    test_loss = []
    
    for epoch in range(start_epoch+1, end_epoch+1):
        diva.beta = min([args.beta, args.beta * (epoch - args.prewarmup * 1.) / (args.warmup)])
        if epoch< args.prewarmup:
            diva.beta = args.beta/args.prewarmup
        train_loss, avg_loss_bar, avg_loss_len, avg_loss_col, mtr, atr, atr2 = train_single_epoch(train_loader, diva, optimizer, epoch)
        str_loss_sup = train_loss
        epoch_loss_sup.append(train_loss)
        str_print = "epoch {}: avg train loss {:.2f}".format(epoch, str_loss_sup)
        str_print += ", bar train loss {:.3f}".format(avg_loss_bar)
        str_print += ", len train loss {:.3f}".format(avg_loss_len)
        str_print += ", col train loss {:.3f}".format(avg_loss_col)
        print(str_print)

        rec_loss_train = diva.rec_alpha * avg_loss_len + diva.rec_beta * avg_loss_bar + diva.rec_gamma * avg_loss_col
        dis_loss_train = train_loss - rec_loss_train

        test_lss, avg_loss_bar_test, avg_loss_len_test, avg_loss_col_test, mte, ate, ate2 = test_single_epoch(test_loader, diva, epoch)
        test_loss.append(test_lss)
       
        str_print = "epoch {}: avg test  loss {:.2f}".format(epoch, test_lss)
        str_print += ", bar  test loss {:.3f}".format(avg_loss_bar_test)
        str_print += ", len  test loss {:.3f}".format(avg_loss_len_test)
        str_print += ", col  test loss {:.3f}".format(avg_loss_col_test)
        print(str_print)

        rec_loss_test = diva.rec_alpha * avg_loss_len_test + diva.rec_beta * avg_loss_bar_test + diva.rec_gamma * avg_loss_col_test
        dis_loss_test = test_lss - rec_loss_test

        if writer is not None:
            
            writer.add_scalars("Total_Loss", {'train': train_loss, 'test': test_lss} ,epoch)
            writer.add_scalars("Reconstruction_vs_Disentanglement",{'rec':rec_loss_train, 'dis':dis_loss_train}, epoch)
            writer.add_scalars("bar_mse",{'train': mtr, 'test':mte}, epoch)
            writer.add_scalars("bar_acc",{'train-top1': atr, 'test-top1':ate, 'train-top2': atr2, 'test-top2':ate2}, epoch)

        if epoch % save_interval == 0:
            save_reconstructions(epoch, test_loader, diva, name=save_folder)
            save_reconstructions(epoch, train_loader, diva, name=save_folder, estr='tr')
        
        
        if epoch % 50 == 0:
            torch.save(diva.state_dict(), f'{link}/saved_models/{save_folder}/checkpoints/{epoch}.pth')

    if writer is not None:
        writer.flush()

    epoch_loss_sup = [i.detach().cpu().numpy() for i in epoch_loss_sup]
    test_loss = [i.detach().cpu().numpy() for i in test_loss]
    return epoch_loss_sup, test_loss

In [32]:
def save_reconstructions(epoch, test_loader, diva, name='diva', estr=''):
    a = next(enumerate(test_loader))
    with torch.no_grad():
        diva.eval()
        d = a[1][2][:10].to(DEVICE).float()
        x = a[1][0][:10].to(DEVICE).float()
        y = a[1][1][:10].to(DEVICE).float()
        m = a[1][-1][:10].to(DEVICE).float()
        x_1, x_1var, x_2, x_2var, x_3 ,z1, z2, z1_m, z1_s, z2_m, z2_s, pz1_m, pz1_s = diva(d,x,y,m)
        out = diva.px.reconstruct_image(x_1, x_1var, x_2, x_2var, x_3)

    plt.figure(figsize=(80,20))
    fig, ax = plt.subplots(nrows=10, ncols=2)

    ax[0,0].set_title("Original")
    ax[0,1].set_title("Reconstructed")

    for i in range(10):
        ax[i, 1].imshow(out[i])
        ax[i, 0].imshow(x[i].cpu().permute(1,2,0))
        ax[i, 0].xaxis.set_visible(False)
        ax[i, 0].yaxis.set_visible(False)
        ax[i, 1].xaxis.set_visible(False)
        ax[i, 1].yaxis.set_visible(False)
    fig.tight_layout(pad=0.1)
    plt.savefig(f'{link}/saved_models/{name}/reconstructions/e{epoch}{estr}.png')
    plt.close('all')

In [33]:
DEVICE

device(type='cuda')

## Model Training

In [34]:
default_args = diva_args(prewarmup=0, number_components=50)

In [35]:
diva = HVAE(default_args).to(DEVICE)

In [36]:
#diva.load_state_dict(torch.load(f'{link}/saved_models/VAE10/checkpoints/905.pth'))

In [37]:
train_loader = DataLoader(RNA_dataset, batch_size=128, shuffle=True)
test_loader = DataLoader(RNA_dataset_test, batch_size=128)

In [38]:
#optimizer = optim.SGD(diva.parameters(), lr=0.00001, momentum=0.1, nesterov=True)
optimizer = optim.Adam(diva.parameters(), lr=0.001)

In [39]:
RNA_dataset.x_len.min(), RNA_dataset.x_len.max()

(10, 100)

In [40]:
writer.flush()

In [41]:
diva.rec_gamma = 3

In [42]:
%tensorboard  --logdir="D:/users/Marko/downloads/mirna/saved_models/new/HVAE2/tensorboard/"

Reusing TensorBoard on port 6006 (pid 16804), started 16:38:08 ago. (Use '!kill 16804' to kill it.)

In [43]:
lss, lss_t = train(default_args, train_loader, test_loader, diva, optimizer, 500, 0, save_folder="new/HVAE2",save_interval=5)

Epoch 1: 272batch [00:33,  8.01batch/s, loss=684]  


epoch 1: avg train loss 762.05, bar train loss 10.645, len train loss 0.407, col train loss 168.432
epoch 1: avg test  loss 680.26, bar  test loss 8.483, len  test loss 0.049, col  test loss 167.091


Epoch 2: 272batch [00:31,  8.77batch/s, loss=616]


epoch 2: avg train loss 674.00, bar train loss 8.165, len train loss 0.058, col train loss 166.647


Epoch 3: 1batch [00:00,  8.70batch/s, loss=643]

epoch 2: avg test  loss 656.69, bar  test loss 7.473, len  test loss 0.056, col  test loss 165.165


Epoch 3: 272batch [00:31,  8.73batch/s, loss=621]


epoch 3: avg train loss 641.39, bar train loss 6.802, len train loss 0.062, col train loss 163.893


Epoch 4: 1batch [00:00,  8.62batch/s, loss=623]

epoch 3: avg test  loss 624.72, bar  test loss 6.096, len  test loss 0.054, col  test loss 163.143


Epoch 4: 272batch [00:31,  8.73batch/s, loss=667]


epoch 4: avg train loss 621.52, bar train loss 5.946, len train loss 0.061, col train loss 162.706


Epoch 5: 1batch [00:00,  8.62batch/s, loss=626]

epoch 4: avg test  loss 611.16, bar  test loss 5.472, len  test loss 0.054, col  test loss 162.414


Epoch 5: 272batch [00:31,  8.73batch/s, loss=638]


epoch 5: avg train loss 610.55, bar train loss 5.530, len train loss 0.052, col train loss 161.974
epoch 5: avg test  loss 604.04, bar  test loss 5.197, len  test loss 0.060, col  test loss 161.762


Epoch 6: 272batch [00:31,  8.73batch/s, loss=616]


epoch 6: avg train loss 602.98, bar train loss 5.226, len train loss 0.052, col train loss 161.363


Epoch 7: 1batch [00:00,  8.70batch/s, loss=603]

epoch 6: avg test  loss 593.83, bar  test loss 4.875, len  test loss 0.039, col  test loss 161.095


Epoch 7: 272batch [00:31,  8.73batch/s, loss=572]


epoch 7: avg train loss 597.69, bar train loss 5.003, len train loss 0.057, col train loss 160.864


Epoch 8: 1batch [00:00,  8.70batch/s, loss=571]

epoch 7: avg test  loss 588.08, bar  test loss 4.630, len  test loss 0.039, col  test loss 160.671


Epoch 8: 272batch [00:31,  8.61batch/s, loss=643]


epoch 8: avg train loss 592.19, bar train loss 4.813, len train loss 0.051, col train loss 160.409


Epoch 9: 1batch [00:00,  8.47batch/s, loss=583]

epoch 8: avg test  loss 590.46, bar  test loss 4.464, len  test loss 0.108, col  test loss 160.306


Epoch 9: 272batch [00:31,  8.60batch/s, loss=624]


epoch 9: avg train loss 588.52, bar train loss 4.661, len train loss 0.054, col train loss 160.074


Epoch 10: 1batch [00:00,  8.47batch/s, loss=607]

epoch 9: avg test  loss 581.09, bar  test loss 4.399, len  test loss 0.030, col  test loss 160.093


Epoch 10: 272batch [00:31,  8.64batch/s, loss=631]


epoch 10: avg train loss 584.24, bar train loss 4.529, len train loss 0.046, col train loss 159.781
epoch 10: avg test  loss 578.16, bar  test loss 4.143, len  test loss 0.040, col  test loss 159.858


Epoch 11: 272batch [00:31,  8.69batch/s, loss=589]


epoch 11: avg train loss 581.29, bar train loss 4.419, len train loss 0.046, col train loss 159.517


Epoch 12: 1batch [00:00,  8.62batch/s, loss=604]

epoch 11: avg test  loss 576.74, bar  test loss 4.231, len  test loss 0.027, col  test loss 159.478


Epoch 12: 272batch [00:31,  8.66batch/s, loss=602]


epoch 12: avg train loss 579.54, bar train loss 4.327, len train loss 0.052, col train loss 159.311


Epoch 13: 1batch [00:00,  8.55batch/s, loss=600]

epoch 12: avg test  loss 578.92, bar  test loss 4.128, len  test loss 0.088, col  test loss 159.398


Epoch 13: 272batch [00:31,  8.63batch/s, loss=678]


epoch 13: avg train loss 576.59, bar train loss 4.242, len train loss 0.047, col train loss 159.052


Epoch 14: 1batch [00:00,  8.55batch/s, loss=609]

epoch 13: avg test  loss 576.65, bar  test loss 4.024, len  test loss 0.044, col  test loss 159.098


Epoch 14: 272batch [00:31,  8.64batch/s, loss=566]


epoch 14: avg train loss 574.27, bar train loss 4.159, len train loss 0.048, col train loss 158.797


Epoch 15: 1batch [00:00,  8.62batch/s, loss=582]

epoch 14: avg test  loss 567.53, bar  test loss 3.805, len  test loss 0.047, col  test loss 158.921


Epoch 15: 272batch [00:31,  8.65batch/s, loss=587]


epoch 15: avg train loss 571.89, bar train loss 4.085, len train loss 0.045, col train loss 158.588
epoch 15: avg test  loss 565.18, bar  test loss 3.721, len  test loss 0.034, col  test loss 158.723


Epoch 16: 272batch [00:31,  8.64batch/s, loss=653]


epoch 16: avg train loss 570.12, bar train loss 4.035, len train loss 0.043, col train loss 158.396


Epoch 17: 1batch [00:00,  8.55batch/s, loss=558]

epoch 16: avg test  loss 562.46, bar  test loss 3.690, len  test loss 0.025, col  test loss 158.387


Epoch 17: 272batch [00:31,  8.64batch/s, loss=556]


epoch 17: avg train loss 568.19, bar train loss 3.979, len train loss 0.041, col train loss 158.167


Epoch 18: 1batch [00:00,  8.55batch/s, loss=552]

epoch 17: avg test  loss 564.13, bar  test loss 3.660, len  test loss 0.052, col  test loss 158.393


Epoch 18: 272batch [00:31,  8.63batch/s, loss=543]


epoch 18: avg train loss 566.62, bar train loss 3.925, len train loss 0.041, col train loss 158.004


Epoch 19: 1batch [00:00,  8.55batch/s, loss=588]

epoch 18: avg test  loss 562.18, bar  test loss 3.592, len  test loss 0.040, col  test loss 158.311


Epoch 19: 272batch [00:31,  8.63batch/s, loss=588]


epoch 19: avg train loss 564.98, bar train loss 3.868, len train loss 0.042, col train loss 157.796


Epoch 20: 1batch [00:00,  8.55batch/s, loss=581]

epoch 19: avg test  loss 563.27, bar  test loss 3.558, len  test loss 0.086, col  test loss 158.069


Epoch 20: 272batch [00:31,  8.63batch/s, loss=532]


epoch 20: avg train loss 562.92, bar train loss 3.815, len train loss 0.038, col train loss 157.620
epoch 20: avg test  loss 572.07, bar  test loss 3.554, len  test loss 0.171, col  test loss 158.192


Epoch 21: 272batch [00:31,  8.62batch/s, loss=580]


epoch 21: avg train loss 561.20, bar train loss 3.773, len train loss 0.035, col train loss 157.465


Epoch 22: 1batch [00:00,  8.62batch/s, loss=580]

epoch 21: avg test  loss 580.83, bar  test loss 3.506, len  test loss 0.275, col  test loss 157.730


Epoch 22: 272batch [00:31,  8.64batch/s, loss=538]


epoch 22: avg train loss 560.17, bar train loss 3.727, len train loss 0.037, col train loss 157.309


Epoch 23: 1batch [00:00,  8.62batch/s, loss=566]

epoch 22: avg test  loss 571.01, bar  test loss 3.422, len  test loss 0.198, col  test loss 157.744


Epoch 23: 272batch [00:31,  8.60batch/s, loss=546]


epoch 23: avg train loss 558.31, bar train loss 3.688, len train loss 0.032, col train loss 157.140


Epoch 24: 1batch [00:00,  8.40batch/s, loss=567]

epoch 23: avg test  loss 591.38, bar  test loss 3.375, len  test loss 0.411, col  test loss 157.486


Epoch 24: 272batch [00:31,  8.59batch/s, loss=538]


epoch 24: avg train loss 557.00, bar train loss 3.636, len train loss 0.032, col train loss 157.023


Epoch 25: 1batch [00:00,  8.55batch/s, loss=560]

epoch 24: avg test  loss 581.06, bar  test loss 3.358, len  test loss 0.295, col  test loss 157.438


Epoch 25: 272batch [00:31,  8.58batch/s, loss=574]


epoch 25: avg train loss 556.09, bar train loss 3.614, len train loss 0.032, col train loss 156.860
epoch 25: avg test  loss 584.79, bar  test loss 3.368, len  test loss 0.350, col  test loss 157.442


Epoch 26: 272batch [00:31,  8.58batch/s, loss=560]


epoch 26: avg train loss 554.70, bar train loss 3.580, len train loss 0.030, col train loss 156.720


Epoch 27: 1batch [00:00,  8.47batch/s, loss=548]

epoch 26: avg test  loss 587.92, bar  test loss 3.310, len  test loss 0.393, col  test loss 157.325


Epoch 27: 272batch [00:31,  8.58batch/s, loss=600]


epoch 27: avg train loss 553.60, bar train loss 3.546, len train loss 0.029, col train loss 156.596


Epoch 28: 1batch [00:00,  8.55batch/s, loss=574]

epoch 27: avg test  loss 609.76, bar  test loss 3.328, len  test loss 0.614, col  test loss 157.452


Epoch 28: 272batch [00:31,  8.58batch/s, loss=624]


epoch 28: avg train loss 552.54, bar train loss 3.511, len train loss 0.028, col train loss 156.526


Epoch 29: 1batch [00:00,  8.55batch/s, loss=545]

epoch 28: avg test  loss 577.24, bar  test loss 3.275, len  test loss 0.300, col  test loss 157.148


Epoch 29: 272batch [00:31,  8.58batch/s, loss=583]


epoch 29: avg train loss 551.51, bar train loss 3.483, len train loss 0.028, col train loss 156.356


Epoch 30: 1batch [00:00,  8.55batch/s, loss=573]

epoch 29: avg test  loss 588.81, bar  test loss 3.242, len  test loss 0.428, col  test loss 157.128


Epoch 30: 272batch [00:31,  8.59batch/s, loss=514]


epoch 30: avg train loss 550.59, bar train loss 3.457, len train loss 0.027, col train loss 156.244
epoch 30: avg test  loss 595.53, bar  test loss 3.254, len  test loss 0.491, col  test loss 157.190


Epoch 31: 272batch [00:31,  8.57batch/s, loss=516]


epoch 31: avg train loss 549.71, bar train loss 3.430, len train loss 0.028, col train loss 156.121


Epoch 32: 1batch [00:00,  8.47batch/s, loss=531]

epoch 31: avg test  loss 598.00, bar  test loss 3.237, len  test loss 0.511, col  test loss 156.951


Epoch 32: 272batch [00:31,  8.58batch/s, loss=536]


epoch 32: avg train loss 548.80, bar train loss 3.404, len train loss 0.027, col train loss 156.037


Epoch 33: 1batch [00:00,  8.47batch/s, loss=547]

epoch 32: avg test  loss 590.17, bar  test loss 3.221, len  test loss 0.438, col  test loss 157.043


Epoch 33: 272batch [00:31,  8.58batch/s, loss=563]


epoch 33: avg train loss 547.83, bar train loss 3.369, len train loss 0.028, col train loss 155.915


Epoch 34: 1batch [00:00,  8.40batch/s, loss=561]

epoch 33: avg test  loss 584.35, bar  test loss 3.184, len  test loss 0.389, col  test loss 157.004


Epoch 34: 272batch [00:31,  8.56batch/s, loss=563]


epoch 34: avg train loss 546.91, bar train loss 3.350, len train loss 0.027, col train loss 155.779


Epoch 35: 1batch [00:00,  8.47batch/s, loss=542]

epoch 34: avg test  loss 583.56, bar  test loss 3.182, len  test loss 0.383, col  test loss 156.941


Epoch 35: 272batch [00:31,  8.58batch/s, loss=564]


epoch 35: avg train loss 546.41, bar train loss 3.330, len train loss 0.027, col train loss 155.719
epoch 35: avg test  loss 600.85, bar  test loss 3.166, len  test loss 0.545, col  test loss 157.218


Epoch 36: 272batch [00:31,  8.58batch/s, loss=561]


epoch 36: avg train loss 545.51, bar train loss 3.306, len train loss 0.027, col train loss 155.593


Epoch 37: 1batch [00:00,  8.47batch/s, loss=543]

epoch 36: avg test  loss 587.73, bar  test loss 3.181, len  test loss 0.433, col  test loss 156.878


Epoch 37: 272batch [00:31,  8.57batch/s, loss=599]


epoch 37: avg train loss 544.72, bar train loss 3.284, len train loss 0.026, col train loss 155.501


Epoch 38: 1batch [00:00,  8.47batch/s, loss=559]

epoch 37: avg test  loss 581.41, bar  test loss 3.196, len  test loss 0.369, col  test loss 156.904


Epoch 38: 272batch [00:31,  8.56batch/s, loss=560]


epoch 38: avg train loss 543.89, bar train loss 3.261, len train loss 0.027, col train loss 155.392


Epoch 39: 1batch [00:00,  8.40batch/s, loss=543]

epoch 38: avg test  loss 585.66, bar  test loss 3.112, len  test loss 0.429, col  test loss 156.886


Epoch 39: 272batch [00:31,  8.53batch/s, loss=554]


epoch 39: avg train loss 542.82, bar train loss 3.236, len train loss 0.025, col train loss 155.280


Epoch 40: 1batch [00:00,  8.40batch/s, loss=556]

epoch 39: avg test  loss 594.20, bar  test loss 3.158, len  test loss 0.512, col  test loss 156.908


Epoch 40: 272batch [00:32,  8.49batch/s, loss=544]


epoch 40: avg train loss 542.53, bar train loss 3.222, len train loss 0.027, col train loss 155.210
epoch 40: avg test  loss 588.76, bar  test loss 3.146, len  test loss 0.449, col  test loss 156.554


Epoch 41: 272batch [00:32,  8.41batch/s, loss=579]


epoch 41: avg train loss 541.74, bar train loss 3.198, len train loss 0.027, col train loss 155.117


Epoch 42: 1batch [00:00,  8.26batch/s, loss=530]

epoch 41: avg test  loss 583.25, bar  test loss 3.119, len  test loss 0.411, col  test loss 156.613


Epoch 42: 272batch [00:32,  8.34batch/s, loss=569]


epoch 42: avg train loss 541.02, bar train loss 3.186, len train loss 0.025, col train loss 155.012


Epoch 43: 1batch [00:00,  8.13batch/s, loss=561]

epoch 42: avg test  loss 578.73, bar  test loss 3.108, len  test loss 0.361, col  test loss 156.809


Epoch 43: 272batch [00:33,  8.15batch/s, loss=556]


epoch 43: avg train loss 540.35, bar train loss 3.161, len train loss 0.026, col train loss 154.919


Epoch 44: 1batch [00:00,  8.20batch/s, loss=564]

epoch 43: avg test  loss 588.35, bar  test loss 3.153, len  test loss 0.461, col  test loss 156.677


Epoch 44: 272batch [00:32,  8.32batch/s, loss=557]


epoch 44: avg train loss 539.60, bar train loss 3.143, len train loss 0.026, col train loss 154.820


Epoch 45: 1batch [00:00,  8.20batch/s, loss=537]

epoch 44: avg test  loss 576.75, bar  test loss 3.086, len  test loss 0.344, col  test loss 156.668


Epoch 45: 272batch [00:32,  8.31batch/s, loss=567]


epoch 45: avg train loss 538.89, bar train loss 3.126, len train loss 0.025, col train loss 154.740
epoch 45: avg test  loss 587.66, bar  test loss 3.081, len  test loss 0.463, col  test loss 156.534


Epoch 46: 272batch [00:32,  8.30batch/s, loss=606]


epoch 46: avg train loss 538.25, bar train loss 3.113, len train loss 0.025, col train loss 154.643


Epoch 47: 1batch [00:00,  8.26batch/s, loss=562]

epoch 46: avg test  loss 601.98, bar  test loss 3.064, len  test loss 0.598, col  test loss 156.855


Epoch 47: 272batch [00:32,  8.31batch/s, loss=532]


epoch 47: avg train loss 537.60, bar train loss 3.095, len train loss 0.024, col train loss 154.544


Epoch 48: 1batch [00:00,  8.13batch/s, loss=528]

epoch 47: avg test  loss 584.76, bar  test loss 3.100, len  test loss 0.426, col  test loss 156.795


Epoch 48: 272batch [00:32,  8.29batch/s, loss=554]


epoch 48: avg train loss 537.13, bar train loss 3.074, len train loss 0.026, col train loss 154.491


Epoch 49: 1batch [00:00,  8.26batch/s, loss=560]

epoch 48: avg test  loss 594.34, bar  test loss 3.093, len  test loss 0.492, col  test loss 156.842


Epoch 49: 272batch [00:32,  8.29batch/s, loss=583]


epoch 49: avg train loss 536.66, bar train loss 3.065, len train loss 0.026, col train loss 154.417


Epoch 50: 1batch [00:00,  8.26batch/s, loss=537]

epoch 49: avg test  loss 583.92, bar  test loss 3.061, len  test loss 0.433, col  test loss 156.455


Epoch 50: 272batch [00:32,  8.29batch/s, loss=578]


epoch 50: avg train loss 535.70, bar train loss 3.042, len train loss 0.024, col train loss 154.313
epoch 50: avg test  loss 594.68, bar  test loss 3.136, len  test loss 0.526, col  test loss 156.678


Epoch 51: 272batch [00:32,  8.28batch/s, loss=548]


epoch 51: avg train loss 535.32, bar train loss 3.030, len train loss 0.025, col train loss 154.231


Epoch 52: 1batch [00:00,  8.20batch/s, loss=555]

epoch 51: avg test  loss 583.33, bar  test loss 3.079, len  test loss 0.417, col  test loss 156.457


Epoch 52: 272batch [00:32,  8.28batch/s, loss=507]


epoch 52: avg train loss 535.02, bar train loss 3.022, len train loss 0.025, col train loss 154.166


Epoch 53: 1batch [00:00,  8.20batch/s, loss=537]

epoch 52: avg test  loss 592.41, bar  test loss 3.128, len  test loss 0.510, col  test loss 156.689


Epoch 53: 272batch [00:32,  8.27batch/s, loss=530]


epoch 53: avg train loss 534.01, bar train loss 3.000, len train loss 0.024, col train loss 154.039


Epoch 54: 1batch [00:00,  8.26batch/s, loss=545]

epoch 53: avg test  loss 582.70, bar  test loss 3.051, len  test loss 0.422, col  test loss 156.594


Epoch 54: 272batch [00:32,  8.27batch/s, loss=537]


epoch 54: avg train loss 533.65, bar train loss 2.988, len train loss 0.024, col train loss 154.007


Epoch 55: 1batch [00:00,  8.33batch/s, loss=545]

epoch 54: avg test  loss 584.98, bar  test loss 3.055, len  test loss 0.441, col  test loss 156.558


Epoch 55: 272batch [00:32,  8.26batch/s, loss=511]


epoch 55: avg train loss 532.94, bar train loss 2.969, len train loss 0.023, col train loss 153.907
epoch 55: avg test  loss 593.04, bar  test loss 3.089, len  test loss 0.520, col  test loss 156.665


Epoch 56: 272batch [00:32,  8.27batch/s, loss=558]


epoch 56: avg train loss 532.43, bar train loss 2.956, len train loss 0.024, col train loss 153.842


Epoch 57: 1batch [00:00,  8.13batch/s, loss=519]

epoch 56: avg test  loss 588.24, bar  test loss 3.086, len  test loss 0.479, col  test loss 156.551


Epoch 57: 272batch [00:32,  8.25batch/s, loss=490]


epoch 57: avg train loss 532.13, bar train loss 2.949, len train loss 0.024, col train loss 153.758


Epoch 58: 1batch [00:00,  8.33batch/s, loss=523]

epoch 57: avg test  loss 579.38, bar  test loss 3.065, len  test loss 0.381, col  test loss 156.609


Epoch 58: 272batch [00:32,  8.26batch/s, loss=585]


epoch 58: avg train loss 531.46, bar train loss 2.933, len train loss 0.024, col train loss 153.665


Epoch 59: 1batch [00:00,  8.13batch/s, loss=538]

epoch 58: avg test  loss 581.92, bar  test loss 3.044, len  test loss 0.411, col  test loss 156.869


Epoch 59: 272batch [00:33,  8.24batch/s, loss=564]


epoch 59: avg train loss 531.04, bar train loss 2.925, len train loss 0.023, col train loss 153.614


Epoch 60: 1batch [00:00,  8.20batch/s, loss=509]

epoch 59: avg test  loss 580.29, bar  test loss 3.042, len  test loss 0.397, col  test loss 156.681


Epoch 60: 272batch [00:33,  8.24batch/s, loss=557]


epoch 60: avg train loss 530.65, bar train loss 2.917, len train loss 0.024, col train loss 153.542
epoch 60: avg test  loss 585.00, bar  test loss 3.062, len  test loss 0.447, col  test loss 156.614


Epoch 61: 272batch [00:33,  8.18batch/s, loss=592]


epoch 61: avg train loss 529.93, bar train loss 2.893, len train loss 0.024, col train loss 153.452


Epoch 62: 1batch [00:00,  8.06batch/s, loss=516]

epoch 61: avg test  loss 584.69, bar  test loss 3.064, len  test loss 0.427, col  test loss 156.872


Epoch 62: 272batch [00:33,  8.22batch/s, loss=553]


epoch 62: avg train loss 529.67, bar train loss 2.889, len train loss 0.024, col train loss 153.384


Epoch 63: 1batch [00:00,  8.13batch/s, loss=545]

epoch 62: avg test  loss 577.17, bar  test loss 3.070, len  test loss 0.357, col  test loss 156.770


Epoch 63: 272batch [00:33,  8.23batch/s, loss=521]


epoch 63: avg train loss 529.05, bar train loss 2.876, len train loss 0.023, col train loss 153.295


Epoch 64: 1batch [00:00,  8.20batch/s, loss=506]

epoch 63: avg test  loss 580.62, bar  test loss 3.072, len  test loss 0.392, col  test loss 156.778


Epoch 64: 272batch [00:33,  8.22batch/s, loss=505]


epoch 64: avg train loss 528.77, bar train loss 2.869, len train loss 0.023, col train loss 153.256


Epoch 65: 1batch [00:00,  8.20batch/s, loss=517]

epoch 64: avg test  loss 583.39, bar  test loss 3.063, len  test loss 0.425, col  test loss 156.567


Epoch 65: 272batch [00:33,  8.22batch/s, loss=563]


epoch 65: avg train loss 527.87, bar train loss 2.853, len train loss 0.022, col train loss 153.134
epoch 65: avg test  loss 591.31, bar  test loss 3.083, len  test loss 0.508, col  test loss 156.589


Epoch 66: 272batch [00:33,  8.21batch/s, loss=558]


epoch 66: avg train loss 527.65, bar train loss 2.842, len train loss 0.023, col train loss 153.098


Epoch 67: 1batch [00:00,  8.13batch/s, loss=510]

epoch 66: avg test  loss 585.95, bar  test loss 3.084, len  test loss 0.451, col  test loss 156.758


Epoch 67: 272batch [00:33,  8.22batch/s, loss=566]


epoch 67: avg train loss 527.25, bar train loss 2.832, len train loss 0.023, col train loss 153.060


Epoch 68: 1batch [00:00,  8.26batch/s, loss=547]

epoch 67: avg test  loss 586.47, bar  test loss 3.063, len  test loss 0.460, col  test loss 156.716


Epoch 68: 272batch [00:33,  8.20batch/s, loss=571]


epoch 68: avg train loss 526.88, bar train loss 2.827, len train loss 0.023, col train loss 152.993


Epoch 69: 1batch [00:00,  8.20batch/s, loss=535]

epoch 68: avg test  loss 591.43, bar  test loss 3.115, len  test loss 0.503, col  test loss 156.792


Epoch 69: 272batch [00:33,  8.19batch/s, loss=535]


epoch 69: avg train loss 526.38, bar train loss 2.809, len train loss 0.023, col train loss 152.912


Epoch 70: 1batch [00:00,  8.13batch/s, loss=520]

epoch 69: avg test  loss 595.08, bar  test loss 3.099, len  test loss 0.535, col  test loss 156.908


Epoch 70: 272batch [00:33,  8.19batch/s, loss=519]


epoch 70: avg train loss 525.99, bar train loss 2.805, len train loss 0.023, col train loss 152.859
epoch 70: avg test  loss 588.20, bar  test loss 3.141, len  test loss 0.441, col  test loss 157.054


Epoch 71: 272batch [00:33,  8.20batch/s, loss=542]


epoch 71: avg train loss 525.53, bar train loss 2.793, len train loss 0.023, col train loss 152.775


Epoch 72: 1batch [00:00,  8.13batch/s, loss=512]

epoch 71: avg test  loss 586.86, bar  test loss 3.081, len  test loss 0.455, col  test loss 156.835


Epoch 72: 272batch [00:33,  8.20batch/s, loss=560]


epoch 72: avg train loss 525.16, bar train loss 2.782, len train loss 0.022, col train loss 152.739


Epoch 73: 1batch [00:00,  8.33batch/s, loss=521]

epoch 72: avg test  loss 592.35, bar  test loss 3.097, len  test loss 0.505, col  test loss 156.951


Epoch 73: 272batch [00:33,  8.20batch/s, loss=504]


epoch 73: avg train loss 524.87, bar train loss 2.780, len train loss 0.023, col train loss 152.671


Epoch 74: 1batch [00:00,  8.13batch/s, loss=529]

epoch 73: avg test  loss 594.82, bar  test loss 3.081, len  test loss 0.518, col  test loss 156.784


Epoch 74: 272batch [00:33,  8.21batch/s, loss=539]


epoch 74: avg train loss 524.63, bar train loss 2.768, len train loss 0.023, col train loss 152.631


Epoch 75: 1batch [00:00,  8.20batch/s, loss=517]

epoch 74: avg test  loss 593.21, bar  test loss 3.105, len  test loss 0.487, col  test loss 156.913


Epoch 75: 272batch [00:33,  8.21batch/s, loss=516]


epoch 75: avg train loss 524.04, bar train loss 2.754, len train loss 0.023, col train loss 152.552
epoch 75: avg test  loss 595.00, bar  test loss 3.126, len  test loss 0.526, col  test loss 157.078


Epoch 76: 272batch [00:33,  8.18batch/s, loss=549]


epoch 76: avg train loss 523.65, bar train loss 2.747, len train loss 0.023, col train loss 152.491


Epoch 77: 1batch [00:00,  8.00batch/s, loss=522]

epoch 76: avg test  loss 585.56, bar  test loss 3.103, len  test loss 0.429, col  test loss 156.799


Epoch 77: 272batch [00:33,  8.19batch/s, loss=525]


epoch 77: avg train loss 523.13, bar train loss 2.736, len train loss 0.022, col train loss 152.415


Epoch 78: 1batch [00:00,  8.20batch/s, loss=543]

epoch 77: avg test  loss 603.23, bar  test loss 3.116, len  test loss 0.580, col  test loss 156.803


Epoch 78: 272batch [00:33,  8.19batch/s, loss=572]


epoch 78: avg train loss 522.76, bar train loss 2.730, len train loss 0.022, col train loss 152.339


Epoch 79: 1batch [00:00,  8.13batch/s, loss=544]

epoch 78: avg test  loss 592.47, bar  test loss 3.138, len  test loss 0.489, col  test loss 157.240


Epoch 79: 272batch [00:33,  8.10batch/s, loss=535]


epoch 79: avg train loss 522.47, bar train loss 2.726, len train loss 0.022, col train loss 152.313


Epoch 80: 1batch [00:00,  8.06batch/s, loss=527]

epoch 79: avg test  loss 587.44, bar  test loss 3.094, len  test loss 0.438, col  test loss 157.217


Epoch 80: 272batch [00:33,  8.17batch/s, loss=545]


epoch 80: avg train loss 522.30, bar train loss 2.717, len train loss 0.022, col train loss 152.274
epoch 80: avg test  loss 595.23, bar  test loss 3.137, len  test loss 0.534, col  test loss 157.036


Epoch 81: 272batch [00:33,  8.15batch/s, loss=589]


epoch 81: avg train loss 521.59, bar train loss 2.705, len train loss 0.021, col train loss 152.180


Epoch 82: 1batch [00:00,  8.06batch/s, loss=509]

epoch 81: avg test  loss 593.71, bar  test loss 3.138, len  test loss 0.509, col  test loss 156.998


Epoch 82: 272batch [00:33,  8.15batch/s, loss=512]


epoch 82: avg train loss 521.28, bar train loss 2.693, len train loss 0.022, col train loss 152.135


Epoch 83: 1batch [00:00,  7.41batch/s, loss=525]

epoch 82: avg test  loss 589.43, bar  test loss 3.120, len  test loss 0.463, col  test loss 157.128


Epoch 83: 272batch [00:33,  8.13batch/s, loss=541]


epoch 83: avg train loss 521.15, bar train loss 2.691, len train loss 0.022, col train loss 152.121


Epoch 84: 1batch [00:00,  8.13batch/s, loss=507]

epoch 83: avg test  loss 586.78, bar  test loss 3.108, len  test loss 0.444, col  test loss 157.018


Epoch 84: 272batch [00:33,  8.13batch/s, loss=489]


epoch 84: avg train loss 520.63, bar train loss 2.681, len train loss 0.021, col train loss 152.029


Epoch 85: 1batch [00:00,  8.13batch/s, loss=521]

epoch 84: avg test  loss 591.32, bar  test loss 3.155, len  test loss 0.456, col  test loss 157.311


Epoch 85: 272batch [00:33,  8.10batch/s, loss=525]


epoch 85: avg train loss 520.17, bar train loss 2.669, len train loss 0.021, col train loss 151.974
epoch 85: avg test  loss 592.84, bar  test loss 3.142, len  test loss 0.500, col  test loss 157.131


Epoch 86: 272batch [00:33,  8.11batch/s, loss=563]


epoch 86: avg train loss 520.01, bar train loss 2.668, len train loss 0.021, col train loss 151.929


Epoch 87: 1batch [00:00,  8.13batch/s, loss=524]

epoch 86: avg test  loss 591.92, bar  test loss 3.120, len  test loss 0.487, col  test loss 157.121


Epoch 87: 272batch [00:33,  8.10batch/s, loss=510]


epoch 87: avg train loss 519.65, bar train loss 2.659, len train loss 0.021, col train loss 151.869


Epoch 88: 1batch [00:00,  8.06batch/s, loss=504]

epoch 87: avg test  loss 589.44, bar  test loss 3.135, len  test loss 0.467, col  test loss 157.023


Epoch 88: 272batch [00:33,  8.12batch/s, loss=508]


epoch 88: avg train loss 519.17, bar train loss 2.650, len train loss 0.021, col train loss 151.780


Epoch 89: 1batch [00:00,  8.00batch/s, loss=530]

epoch 88: avg test  loss 600.68, bar  test loss 3.159, len  test loss 0.555, col  test loss 157.293


Epoch 89: 272batch [00:33,  8.11batch/s, loss=528]


epoch 89: avg train loss 518.87, bar train loss 2.644, len train loss 0.021, col train loss 151.750


Epoch 90: 1batch [00:00,  8.13batch/s, loss=518]

epoch 89: avg test  loss 593.91, bar  test loss 3.180, len  test loss 0.498, col  test loss 157.126


Epoch 90: 272batch [00:33,  8.08batch/s, loss=524]


epoch 90: avg train loss 518.76, bar train loss 2.640, len train loss 0.022, col train loss 151.716
epoch 90: avg test  loss 586.50, bar  test loss 3.158, len  test loss 0.436, col  test loss 157.203


Epoch 91: 272batch [00:33,  8.12batch/s, loss=510]


epoch 91: avg train loss 517.96, bar train loss 2.626, len train loss 0.020, col train loss 151.608


Epoch 92: 1batch [00:00,  7.69batch/s, loss=511]

epoch 91: avg test  loss 594.62, bar  test loss 3.163, len  test loss 0.510, col  test loss 157.229


Epoch 92: 272batch [00:33,  8.09batch/s, loss=498]


epoch 92: avg train loss 517.81, bar train loss 2.622, len train loss 0.021, col train loss 151.601


Epoch 93: 1batch [00:00,  8.20batch/s, loss=504]

epoch 92: avg test  loss 592.91, bar  test loss 3.159, len  test loss 0.494, col  test loss 157.141


Epoch 93: 272batch [00:33,  8.06batch/s, loss=507]


epoch 93: avg train loss 517.76, bar train loss 2.615, len train loss 0.021, col train loss 151.568


Epoch 94: 1batch [00:00,  8.00batch/s, loss=490]

epoch 93: avg test  loss 592.79, bar  test loss 3.179, len  test loss 0.480, col  test loss 157.318


Epoch 94: 272batch [00:33,  8.08batch/s, loss=548]


epoch 94: avg train loss 517.41, bar train loss 2.611, len train loss 0.020, col train loss 151.522


Epoch 95: 1batch [00:00,  8.00batch/s, loss=551]

epoch 94: avg test  loss 590.92, bar  test loss 3.165, len  test loss 0.470, col  test loss 157.217


Epoch 95: 272batch [00:33,  8.09batch/s, loss=544]


epoch 95: avg train loss 516.87, bar train loss 2.600, len train loss 0.021, col train loss 151.437
epoch 95: avg test  loss 590.55, bar  test loss 3.172, len  test loss 0.447, col  test loss 157.162


Epoch 96: 272batch [00:33,  8.11batch/s, loss=533]


epoch 96: avg train loss 517.01, bar train loss 2.609, len train loss 0.021, col train loss 151.409


Epoch 97: 1batch [00:00,  8.13batch/s, loss=520]

epoch 96: avg test  loss 591.98, bar  test loss 3.168, len  test loss 0.478, col  test loss 157.426


Epoch 97: 272batch [00:33,  8.10batch/s, loss=545]


epoch 97: avg train loss 516.46, bar train loss 2.594, len train loss 0.020, col train loss 151.365


Epoch 98: 1batch [00:00,  8.00batch/s, loss=511]

epoch 97: avg test  loss 597.39, bar  test loss 3.162, len  test loss 0.525, col  test loss 157.269


Epoch 98: 272batch [00:33,  8.07batch/s, loss=511]


epoch 98: avg train loss 516.25, bar train loss 2.591, len train loss 0.021, col train loss 151.303


Epoch 99: 1batch [00:00,  8.00batch/s, loss=517]

epoch 98: avg test  loss 594.41, bar  test loss 3.165, len  test loss 0.487, col  test loss 157.401


Epoch 99: 272batch [00:33,  8.06batch/s, loss=527]


epoch 99: avg train loss 516.02, bar train loss 2.583, len train loss 0.020, col train loss 151.285


Epoch 100: 1batch [00:00,  8.13batch/s, loss=512]

epoch 99: avg test  loss 588.83, bar  test loss 3.157, len  test loss 0.450, col  test loss 157.273


Epoch 100: 272batch [00:33,  8.07batch/s, loss=503]


epoch 100: avg train loss 515.47, bar train loss 2.573, len train loss 0.021, col train loss 151.193
epoch 100: avg test  loss 585.59, bar  test loss 3.185, len  test loss 0.405, col  test loss 157.411


Epoch 101: 272batch [00:33,  8.04batch/s, loss=529]


epoch 101: avg train loss 515.58, bar train loss 2.575, len train loss 0.020, col train loss 151.212


Epoch 102: 1batch [00:00,  7.94batch/s, loss=534]

epoch 101: avg test  loss 592.72, bar  test loss 3.197, len  test loss 0.477, col  test loss 157.435


Epoch 102: 272batch [00:33,  8.06batch/s, loss=518]


epoch 102: avg train loss 514.93, bar train loss 2.561, len train loss 0.020, col train loss 151.118


Epoch 103: 1batch [00:00,  8.00batch/s, loss=517]

epoch 102: avg test  loss 592.43, bar  test loss 3.204, len  test loss 0.481, col  test loss 157.328


Epoch 103: 272batch [00:33,  8.03batch/s, loss=546]


epoch 103: avg train loss 514.79, bar train loss 2.556, len train loss 0.020, col train loss 151.089


Epoch 104: 1batch [00:00,  7.94batch/s, loss=514]

epoch 103: avg test  loss 594.36, bar  test loss 3.203, len  test loss 0.490, col  test loss 157.563


Epoch 104: 272batch [00:33,  8.02batch/s, loss=488]


epoch 104: avg train loss 514.46, bar train loss 2.548, len train loss 0.021, col train loss 151.022


Epoch 105: 1batch [00:00,  8.13batch/s, loss=503]

epoch 104: avg test  loss 589.75, bar  test loss 3.195, len  test loss 0.438, col  test loss 157.622


Epoch 105: 272batch [00:34,  7.98batch/s, loss=516]


epoch 105: avg train loss 514.22, bar train loss 2.546, len train loss 0.019, col train loss 151.009
epoch 105: avg test  loss 593.83, bar  test loss 3.206, len  test loss 0.485, col  test loss 157.540


Epoch 106: 272batch [00:33,  8.02batch/s, loss=536]


epoch 106: avg train loss 513.91, bar train loss 2.541, len train loss 0.020, col train loss 150.939


Epoch 107: 1batch [00:00,  7.81batch/s, loss=519]

epoch 106: avg test  loss 591.24, bar  test loss 3.195, len  test loss 0.463, col  test loss 157.534


Epoch 107: 272batch [00:33,  8.00batch/s, loss=559]


epoch 107: avg train loss 513.94, bar train loss 2.541, len train loss 0.020, col train loss 150.945


Epoch 108: 1batch [00:00,  7.94batch/s, loss=499]

epoch 107: avg test  loss 587.58, bar  test loss 3.212, len  test loss 0.427, col  test loss 157.529


Epoch 108: 272batch [00:34,  7.98batch/s, loss=547]


epoch 108: avg train loss 513.49, bar train loss 2.531, len train loss 0.020, col train loss 150.871


Epoch 109: 1batch [00:00,  7.94batch/s, loss=507]

epoch 108: avg test  loss 603.35, bar  test loss 3.227, len  test loss 0.583, col  test loss 157.566


Epoch 109: 272batch [00:33,  8.00batch/s, loss=513]


epoch 109: avg train loss 513.28, bar train loss 2.527, len train loss 0.020, col train loss 150.831


Epoch 110: 1batch [00:00,  8.00batch/s, loss=506]

epoch 109: avg test  loss 598.82, bar  test loss 3.245, len  test loss 0.477, col  test loss 157.561


Epoch 110: 272batch [00:33,  8.00batch/s, loss=528]


epoch 110: avg train loss 513.37, bar train loss 2.529, len train loss 0.020, col train loss 150.826
epoch 110: avg test  loss 598.59, bar  test loss 3.220, len  test loss 0.492, col  test loss 157.585


Epoch 111: 272batch [00:33,  8.00batch/s, loss=506]


epoch 111: avg train loss 512.75, bar train loss 2.518, len train loss 0.019, col train loss 150.749


Epoch 112: 1batch [00:00,  7.94batch/s, loss=521]

epoch 111: avg test  loss 600.43, bar  test loss 3.232, len  test loss 0.539, col  test loss 157.544


Epoch 112: 272batch [00:34,  7.99batch/s, loss=515]


epoch 112: avg train loss 512.77, bar train loss 2.514, len train loss 0.020, col train loss 150.757


Epoch 113: 1batch [00:00,  7.94batch/s, loss=520]

epoch 112: avg test  loss 596.85, bar  test loss 3.240, len  test loss 0.507, col  test loss 157.634


Epoch 113: 272batch [00:34,  7.98batch/s, loss=526]


epoch 113: avg train loss 512.25, bar train loss 2.508, len train loss 0.020, col train loss 150.650


Epoch 114: 1batch [00:00,  7.94batch/s, loss=494]

epoch 113: avg test  loss 593.50, bar  test loss 3.235, len  test loss 0.473, col  test loss 157.662


Epoch 114: 272batch [00:34,  7.98batch/s, loss=488]


epoch 114: avg train loss 512.06, bar train loss 2.505, len train loss 0.019, col train loss 150.632


Epoch 115: 1batch [00:00,  7.81batch/s, loss=536]

epoch 114: avg test  loss 586.86, bar  test loss 3.235, len  test loss 0.411, col  test loss 157.648


Epoch 115: 272batch [00:34,  7.97batch/s, loss=549]


epoch 115: avg train loss 511.88, bar train loss 2.498, len train loss 0.020, col train loss 150.569
epoch 115: avg test  loss 589.01, bar  test loss 3.252, len  test loss 0.417, col  test loss 157.700


Epoch 116: 272batch [00:34,  7.99batch/s, loss=508]


epoch 116: avg train loss 511.57, bar train loss 2.498, len train loss 0.019, col train loss 150.514


Epoch 117: 1batch [00:00,  8.00batch/s, loss=520]

epoch 116: avg test  loss 594.51, bar  test loss 3.257, len  test loss 0.454, col  test loss 157.852


Epoch 117: 272batch [00:34,  7.98batch/s, loss=514]


epoch 117: avg train loss 511.41, bar train loss 2.490, len train loss 0.020, col train loss 150.504


Epoch 118: 1batch [00:00,  7.87batch/s, loss=513]

epoch 117: avg test  loss 597.96, bar  test loss 3.277, len  test loss 0.514, col  test loss 157.687


Epoch 118: 272batch [00:34,  7.97batch/s, loss=529]


epoch 118: avg train loss 511.18, bar train loss 2.487, len train loss 0.019, col train loss 150.476


Epoch 119: 1batch [00:00,  7.87batch/s, loss=490]

epoch 118: avg test  loss 593.27, bar  test loss 3.251, len  test loss 0.474, col  test loss 157.633


Epoch 119: 272batch [00:34,  7.96batch/s, loss=515]


epoch 119: avg train loss 510.94, bar train loss 2.481, len train loss 0.019, col train loss 150.437


Epoch 120: 1batch [00:00,  7.87batch/s, loss=509]

epoch 119: avg test  loss 597.49, bar  test loss 3.242, len  test loss 0.509, col  test loss 157.684


Epoch 120: 272batch [00:34,  7.95batch/s, loss=507]


epoch 120: avg train loss 510.81, bar train loss 2.479, len train loss 0.019, col train loss 150.409
epoch 120: avg test  loss 594.65, bar  test loss 3.280, len  test loss 0.480, col  test loss 157.804


Epoch 121: 272batch [00:34,  7.95batch/s, loss=492]


epoch 121: avg train loss 510.65, bar train loss 2.480, len train loss 0.019, col train loss 150.342


Epoch 122: 1batch [00:00,  7.87batch/s, loss=494]

epoch 121: avg test  loss 596.29, bar  test loss 3.266, len  test loss 0.495, col  test loss 157.719


Epoch 122: 272batch [00:34,  7.97batch/s, loss=562]


epoch 122: avg train loss 510.40, bar train loss 2.472, len train loss 0.019, col train loss 150.349


Epoch 123: 1batch [00:00,  8.00batch/s, loss=508]

epoch 122: avg test  loss 598.86, bar  test loss 3.268, len  test loss 0.507, col  test loss 158.264


Epoch 123: 272batch [00:34,  7.95batch/s, loss=587]


epoch 123: avg train loss 510.16, bar train loss 2.465, len train loss 0.019, col train loss 150.310


Epoch 124: 1batch [00:00,  7.87batch/s, loss=509]

epoch 123: avg test  loss 594.91, bar  test loss 3.258, len  test loss 0.465, col  test loss 157.731


Epoch 124: 272batch [00:34,  7.94batch/s, loss=509]


epoch 124: avg train loss 509.85, bar train loss 2.458, len train loss 0.019, col train loss 150.271


Epoch 125: 1batch [00:00,  8.00batch/s, loss=507]

epoch 124: avg test  loss 593.54, bar  test loss 3.256, len  test loss 0.466, col  test loss 157.820


Epoch 125: 272batch [00:34,  7.90batch/s, loss=548]


epoch 125: avg train loss 509.86, bar train loss 2.460, len train loss 0.019, col train loss 150.264
epoch 125: avg test  loss 592.74, bar  test loss 3.277, len  test loss 0.453, col  test loss 158.131


Epoch 126: 272batch [00:34,  7.92batch/s, loss=544]


epoch 126: avg train loss 509.35, bar train loss 2.451, len train loss 0.019, col train loss 150.187


Epoch 127: 1batch [00:00,  7.75batch/s, loss=511]

epoch 126: avg test  loss 602.00, bar  test loss 3.266, len  test loss 0.550, col  test loss 157.846


Epoch 127: 272batch [00:34,  7.92batch/s, loss=537]


epoch 127: avg train loss 509.47, bar train loss 2.456, len train loss 0.019, col train loss 150.160


Epoch 128: 1batch [00:00,  7.75batch/s, loss=511]

epoch 127: avg test  loss 595.42, bar  test loss 3.288, len  test loss 0.473, col  test loss 157.945


Epoch 128: 272batch [00:34,  7.89batch/s, loss=523]


epoch 128: avg train loss 509.28, bar train loss 2.451, len train loss 0.019, col train loss 150.141


Epoch 129: 1batch [00:00,  7.94batch/s, loss=511]

epoch 128: avg test  loss 596.42, bar  test loss 3.291, len  test loss 0.478, col  test loss 157.929


Epoch 129: 272batch [00:34,  7.89batch/s, loss=517]


epoch 129: avg train loss 508.96, bar train loss 2.446, len train loss 0.019, col train loss 150.088


Epoch 130: 1batch [00:00,  7.69batch/s, loss=524]

epoch 129: avg test  loss 595.07, bar  test loss 3.281, len  test loss 0.481, col  test loss 158.004


Epoch 130: 272batch [00:34,  7.91batch/s, loss=525]


epoch 130: avg train loss 508.67, bar train loss 2.441, len train loss 0.019, col train loss 150.039
epoch 130: avg test  loss 593.85, bar  test loss 3.304, len  test loss 0.436, col  test loss 157.988


Epoch 131: 272batch [00:34,  7.89batch/s, loss=514]


epoch 131: avg train loss 508.60, bar train loss 2.439, len train loss 0.019, col train loss 150.021


Epoch 132: 1batch [00:00,  7.87batch/s, loss=528]

epoch 131: avg test  loss 594.96, bar  test loss 3.304, len  test loss 0.472, col  test loss 157.954


Epoch 132: 272batch [00:34,  7.88batch/s, loss=589]


epoch 132: avg train loss 508.28, bar train loss 2.434, len train loss 0.018, col train loss 149.975


Epoch 133: 1batch [00:00,  7.81batch/s, loss=512]

epoch 132: avg test  loss 604.62, bar  test loss 3.301, len  test loss 0.550, col  test loss 157.987


Epoch 133: 272batch [00:34,  7.88batch/s, loss=483]


epoch 133: avg train loss 508.23, bar train loss 2.428, len train loss 0.018, col train loss 150.007


Epoch 134: 1batch [00:00,  7.75batch/s, loss=526]

epoch 133: avg test  loss 597.49, bar  test loss 3.315, len  test loss 0.471, col  test loss 157.997


Epoch 134: 272batch [00:34,  7.88batch/s, loss=517]


epoch 134: avg train loss 508.13, bar train loss 2.431, len train loss 0.018, col train loss 149.955


Epoch 135: 1batch [00:00,  7.46batch/s, loss=501]

epoch 134: avg test  loss 598.09, bar  test loss 3.301, len  test loss 0.502, col  test loss 158.065


Epoch 135: 272batch [00:34,  7.87batch/s, loss=537]


epoch 135: avg train loss 507.64, bar train loss 2.426, len train loss 0.018, col train loss 149.866
epoch 135: avg test  loss 597.76, bar  test loss 3.318, len  test loss 0.488, col  test loss 158.103


Epoch 136: 272batch [00:34,  7.86batch/s, loss=525]


epoch 136: avg train loss 507.69, bar train loss 2.422, len train loss 0.018, col train loss 149.859


Epoch 137: 1batch [00:00,  7.87batch/s, loss=491]

epoch 136: avg test  loss 598.04, bar  test loss 3.303, len  test loss 0.498, col  test loss 158.020


Epoch 137: 272batch [00:34,  7.85batch/s, loss=523]


epoch 137: avg train loss 507.32, bar train loss 2.414, len train loss 0.018, col train loss 149.836


Epoch 138: 1batch [00:00,  7.81batch/s, loss=506]

epoch 137: avg test  loss 599.17, bar  test loss 3.319, len  test loss 0.509, col  test loss 158.011


Epoch 138: 272batch [00:34,  7.86batch/s, loss=525]


epoch 138: avg train loss 507.22, bar train loss 2.409, len train loss 0.018, col train loss 149.807


Epoch 139: 1batch [00:00,  7.58batch/s, loss=487]

epoch 138: avg test  loss 593.09, bar  test loss 3.309, len  test loss 0.450, col  test loss 158.031


Epoch 139: 272batch [00:34,  7.85batch/s, loss=501]


epoch 139: avg train loss 506.93, bar train loss 2.406, len train loss 0.018, col train loss 149.777


Epoch 140: 1batch [00:00,  7.81batch/s, loss=515]

epoch 139: avg test  loss 595.83, bar  test loss 3.344, len  test loss 0.471, col  test loss 158.143


Epoch 140: 272batch [00:34,  7.84batch/s, loss=487]


epoch 140: avg train loss 507.02, bar train loss 2.407, len train loss 0.018, col train loss 149.773
epoch 140: avg test  loss 598.32, bar  test loss 3.321, len  test loss 0.489, col  test loss 158.132


Epoch 141: 272batch [00:34,  7.84batch/s, loss=520]


epoch 141: avg train loss 506.59, bar train loss 2.399, len train loss 0.018, col train loss 149.739


Epoch 142: 1batch [00:00,  7.69batch/s, loss=502]

epoch 141: avg test  loss 593.79, bar  test loss 3.320, len  test loss 0.455, col  test loss 158.054


Epoch 142: 272batch [00:34,  7.85batch/s, loss=521]


epoch 142: avg train loss 506.69, bar train loss 2.401, len train loss 0.018, col train loss 149.706


Epoch 143: 1batch [00:00,  7.75batch/s, loss=523]

epoch 142: avg test  loss 598.44, bar  test loss 3.321, len  test loss 0.489, col  test loss 158.053


Epoch 143: 272batch [00:34,  7.84batch/s, loss=508]


epoch 143: avg train loss 506.37, bar train loss 2.397, len train loss 0.018, col train loss 149.671


Epoch 144: 1batch [00:00,  7.81batch/s, loss=486]

epoch 143: avg test  loss 594.73, bar  test loss 3.332, len  test loss 0.437, col  test loss 158.191


Epoch 144: 272batch [00:34,  7.85batch/s, loss=503]


epoch 144: avg train loss 506.51, bar train loss 2.405, len train loss 0.018, col train loss 149.658


Epoch 145: 1batch [00:00,  7.69batch/s, loss=491]

epoch 144: avg test  loss 596.04, bar  test loss 3.339, len  test loss 0.467, col  test loss 158.172


Epoch 145: 272batch [00:34,  7.82batch/s, loss=518]


epoch 145: avg train loss 506.23, bar train loss 2.393, len train loss 0.017, col train loss 149.638
epoch 145: avg test  loss 593.56, bar  test loss 3.339, len  test loss 0.446, col  test loss 158.180


Epoch 146: 272batch [00:34,  7.82batch/s, loss=521]


epoch 146: avg train loss 505.84, bar train loss 2.389, len train loss 0.018, col train loss 149.569


Epoch 147: 1batch [00:00,  7.69batch/s, loss=523]

epoch 146: avg test  loss 596.23, bar  test loss 3.360, len  test loss 0.456, col  test loss 158.449


Epoch 147: 272batch [00:34,  7.81batch/s, loss=479]


epoch 147: avg train loss 505.73, bar train loss 2.386, len train loss 0.018, col train loss 149.551


Epoch 148: 1batch [00:00,  7.81batch/s, loss=502]

epoch 147: avg test  loss 601.45, bar  test loss 3.359, len  test loss 0.518, col  test loss 158.327


Epoch 148: 272batch [00:34,  7.82batch/s, loss=504]


epoch 148: avg train loss 505.61, bar train loss 2.385, len train loss 0.018, col train loss 149.514


Epoch 149: 1batch [00:00,  7.63batch/s, loss=499]

epoch 148: avg test  loss 593.72, bar  test loss 3.344, len  test loss 0.449, col  test loss 158.195


Epoch 149: 272batch [00:34,  7.80batch/s, loss=559]


epoch 149: avg train loss 505.51, bar train loss 2.379, len train loss 0.018, col train loss 149.520


Epoch 150: 1batch [00:00,  7.52batch/s, loss=484]

epoch 149: avg test  loss 600.02, bar  test loss 3.342, len  test loss 0.488, col  test loss 158.290


Epoch 150: 272batch [00:34,  7.79batch/s, loss=561]


epoch 150: avg train loss 505.34, bar train loss 2.379, len train loss 0.018, col train loss 149.457
epoch 150: avg test  loss 593.16, bar  test loss 3.344, len  test loss 0.435, col  test loss 158.200


Epoch 151: 272batch [00:34,  7.82batch/s, loss=543]


epoch 151: avg train loss 505.35, bar train loss 2.380, len train loss 0.018, col train loss 149.460


Epoch 152: 1batch [00:00,  7.75batch/s, loss=498]

epoch 151: avg test  loss 605.83, bar  test loss 3.368, len  test loss 0.538, col  test loss 158.367


Epoch 152: 272batch [00:34,  7.79batch/s, loss=530]


epoch 152: avg train loss 505.29, bar train loss 2.383, len train loss 0.017, col train loss 149.451


Epoch 153: 1batch [00:00,  7.81batch/s, loss=501]

epoch 152: avg test  loss 591.37, bar  test loss 3.366, len  test loss 0.410, col  test loss 158.373


Epoch 153: 272batch [00:34,  7.82batch/s, loss=504]


epoch 153: avg train loss 504.80, bar train loss 2.366, len train loss 0.018, col train loss 149.408


Epoch 154: 1batch [00:00,  7.58batch/s, loss=502]

epoch 153: avg test  loss 603.54, bar  test loss 3.371, len  test loss 0.535, col  test loss 158.451


Epoch 154: 272batch [00:35,  7.72batch/s, loss=554]


epoch 154: avg train loss 504.50, bar train loss 2.367, len train loss 0.017, col train loss 149.324


Epoch 155: 1batch [00:00,  6.25batch/s, loss=476]

epoch 154: avg test  loss 599.98, bar  test loss 3.364, len  test loss 0.502, col  test loss 158.335


Epoch 155: 272batch [00:35,  7.74batch/s, loss=510]


epoch 155: avg train loss 504.57, bar train loss 2.361, len train loss 0.017, col train loss 149.403
epoch 155: avg test  loss 602.60, bar  test loss 3.393, len  test loss 0.511, col  test loss 158.448


Epoch 156: 272batch [00:34,  7.80batch/s, loss=508]


epoch 156: avg train loss 504.64, bar train loss 2.363, len train loss 0.017, col train loss 149.354


Epoch 157: 1batch [00:00,  7.63batch/s, loss=502]

epoch 156: avg test  loss 598.23, bar  test loss 3.377, len  test loss 0.475, col  test loss 158.256


Epoch 157: 272batch [00:35,  7.76batch/s, loss=517]


epoch 157: avg train loss 504.39, bar train loss 2.366, len train loss 0.017, col train loss 149.303


Epoch 158: 1batch [00:00,  7.58batch/s, loss=508]

epoch 157: avg test  loss 598.24, bar  test loss 3.387, len  test loss 0.475, col  test loss 158.514


Epoch 158: 272batch [00:35,  7.74batch/s, loss=487]


epoch 158: avg train loss 504.05, bar train loss 2.358, len train loss 0.017, col train loss 149.258


Epoch 159: 1batch [00:00,  7.81batch/s, loss=510]

epoch 158: avg test  loss 600.25, bar  test loss 3.372, len  test loss 0.499, col  test loss 158.464


Epoch 159: 272batch [00:35,  7.74batch/s, loss=493]


epoch 159: avg train loss 503.78, bar train loss 2.354, len train loss 0.017, col train loss 149.185


Epoch 160: 1batch [00:00,  7.75batch/s, loss=480]

epoch 159: avg test  loss 603.66, bar  test loss 3.397, len  test loss 0.513, col  test loss 158.430


Epoch 160: 272batch [00:35,  7.76batch/s, loss=469]


epoch 160: avg train loss 503.76, bar train loss 2.350, len train loss 0.017, col train loss 149.216
epoch 160: avg test  loss 602.84, bar  test loss 3.384, len  test loss 0.521, col  test loss 158.412


Epoch 161: 272batch [00:35,  7.75batch/s, loss=503]


epoch 161: avg train loss 503.69, bar train loss 2.350, len train loss 0.017, col train loss 149.212


Epoch 162: 1batch [00:00,  7.58batch/s, loss=506]

epoch 161: avg test  loss 601.35, bar  test loss 3.370, len  test loss 0.487, col  test loss 158.414


Epoch 162: 272batch [00:35,  7.75batch/s, loss=480]


epoch 162: avg train loss 503.49, bar train loss 2.351, len train loss 0.016, col train loss 149.147


Epoch 163: 1batch [00:00,  7.69batch/s, loss=496]

epoch 162: avg test  loss 606.78, bar  test loss 3.413, len  test loss 0.561, col  test loss 158.482


Epoch 163: 272batch [00:35,  7.73batch/s, loss=506]


epoch 163: avg train loss 503.56, bar train loss 2.349, len train loss 0.017, col train loss 149.169


Epoch 164: 1batch [00:00,  7.63batch/s, loss=497]

epoch 163: avg test  loss 603.10, bar  test loss 3.411, len  test loss 0.518, col  test loss 158.710


Epoch 164: 272batch [00:35,  7.73batch/s, loss=540]


epoch 164: avg train loss 503.08, bar train loss 2.337, len train loss 0.017, col train loss 149.126


Epoch 165: 1batch [00:00,  7.75batch/s, loss=521]

epoch 164: avg test  loss 602.85, bar  test loss 3.405, len  test loss 0.497, col  test loss 158.945


Epoch 165: 272batch [00:35,  7.73batch/s, loss=481]


epoch 165: avg train loss 503.49, bar train loss 2.344, len train loss 0.017, col train loss 149.170
epoch 165: avg test  loss 599.47, bar  test loss 3.413, len  test loss 0.474, col  test loss 158.708


Epoch 166: 272batch [00:35,  7.76batch/s, loss=493]


epoch 166: avg train loss 503.01, bar train loss 2.340, len train loss 0.016, col train loss 149.065


Epoch 167: 1batch [00:00,  7.75batch/s, loss=500]

epoch 166: avg test  loss 604.81, bar  test loss 3.432, len  test loss 0.533, col  test loss 158.541


Epoch 167: 272batch [00:35,  7.74batch/s, loss=474]


epoch 167: avg train loss 502.81, bar train loss 2.334, len train loss 0.016, col train loss 149.048


Epoch 168: 1batch [00:00,  7.75batch/s, loss=500]

epoch 167: avg test  loss 604.06, bar  test loss 3.403, len  test loss 0.486, col  test loss 158.553


Epoch 168: 272batch [00:35,  7.73batch/s, loss=533]


epoch 168: avg train loss 502.77, bar train loss 2.334, len train loss 0.016, col train loss 149.029


Epoch 169: 1batch [00:00,  7.63batch/s, loss=496]

epoch 168: avg test  loss 597.96, bar  test loss 3.432, len  test loss 0.460, col  test loss 158.707


Epoch 169: 272batch [00:35,  7.71batch/s, loss=497]


epoch 169: avg train loss 502.60, bar train loss 2.331, len train loss 0.017, col train loss 149.004


Epoch 170: 1batch [00:00,  7.81batch/s, loss=474]

epoch 169: avg test  loss 601.36, bar  test loss 3.433, len  test loss 0.496, col  test loss 158.588


Epoch 170: 272batch [00:35,  7.70batch/s, loss=519]


epoch 170: avg train loss 502.71, bar train loss 2.338, len train loss 0.017, col train loss 149.023
epoch 170: avg test  loss 597.03, bar  test loss 3.419, len  test loss 0.453, col  test loss 158.604


Epoch 171: 272batch [00:35,  7.65batch/s, loss=481]


epoch 171: avg train loss 502.61, bar train loss 2.328, len train loss 0.017, col train loss 149.010


Epoch 172: 1batch [00:00,  7.69batch/s, loss=506]

epoch 171: avg test  loss 595.90, bar  test loss 3.432, len  test loss 0.440, col  test loss 158.688


Epoch 172: 272batch [00:35,  7.73batch/s, loss=503]


epoch 172: avg train loss 502.32, bar train loss 2.329, len train loss 0.016, col train loss 148.967


Epoch 173: 1batch [00:00,  7.52batch/s, loss=481]

epoch 172: avg test  loss 601.58, bar  test loss 3.422, len  test loss 0.491, col  test loss 158.589


Epoch 173: 272batch [00:35,  7.70batch/s, loss=534]


epoch 173: avg train loss 502.02, bar train loss 2.326, len train loss 0.016, col train loss 148.893


Epoch 174: 1batch [00:00,  7.81batch/s, loss=514]

epoch 173: avg test  loss 600.28, bar  test loss 3.427, len  test loss 0.484, col  test loss 158.734


Epoch 174: 272batch [00:35,  7.68batch/s, loss=533]


epoch 174: avg train loss 502.15, bar train loss 2.322, len train loss 0.016, col train loss 148.916


Epoch 175: 0batch [00:00, ?batch/s, loss=513]

epoch 174: avg test  loss 602.67, bar  test loss 3.431, len  test loss 0.507, col  test loss 158.699


Epoch 175: 272batch [00:35,  7.65batch/s, loss=532]


epoch 175: avg train loss 501.90, bar train loss 2.323, len train loss 0.017, col train loss 148.872
epoch 175: avg test  loss 601.10, bar  test loss 3.436, len  test loss 0.491, col  test loss 158.675


Epoch 176: 272batch [00:35,  7.71batch/s, loss=465]


epoch 176: avg train loss 501.91, bar train loss 2.321, len train loss 0.016, col train loss 148.883


Epoch 177: 1batch [00:00,  7.69batch/s, loss=526]

epoch 176: avg test  loss 602.61, bar  test loss 3.461, len  test loss 0.500, col  test loss 158.723


Epoch 177: 272batch [00:35,  7.70batch/s, loss=529]


epoch 177: avg train loss 501.82, bar train loss 2.323, len train loss 0.016, col train loss 148.858


Epoch 178: 1batch [00:00,  7.52batch/s, loss=487]

epoch 177: avg test  loss 600.78, bar  test loss 3.452, len  test loss 0.478, col  test loss 158.561


Epoch 178: 272batch [00:35,  7.67batch/s, loss=496]


epoch 178: avg train loss 501.59, bar train loss 2.317, len train loss 0.016, col train loss 148.806


Epoch 179: 1batch [00:00,  7.69batch/s, loss=517]

epoch 178: avg test  loss 595.14, bar  test loss 3.437, len  test loss 0.428, col  test loss 158.734


Epoch 179: 272batch [00:35,  7.68batch/s, loss=468]


epoch 179: avg train loss 501.17, bar train loss 2.310, len train loss 0.016, col train loss 148.751


Epoch 180: 1batch [00:00,  7.52batch/s, loss=498]

epoch 179: avg test  loss 605.47, bar  test loss 3.446, len  test loss 0.532, col  test loss 158.637


Epoch 180: 272batch [00:35,  7.68batch/s, loss=492]


epoch 180: avg train loss 501.28, bar train loss 2.310, len train loss 0.016, col train loss 148.765
epoch 180: avg test  loss 607.17, bar  test loss 3.451, len  test loss 0.526, col  test loss 158.796


Epoch 181: 272batch [00:35,  7.68batch/s, loss=548]


epoch 181: avg train loss 501.21, bar train loss 2.312, len train loss 0.016, col train loss 148.737


Epoch 182: 0batch [00:00, ?batch/s, loss=493]

epoch 181: avg test  loss 597.10, bar  test loss 3.442, len  test loss 0.450, col  test loss 158.635


Epoch 182: 272batch [00:35,  7.68batch/s, loss=551]


epoch 182: avg train loss 501.08, bar train loss 2.305, len train loss 0.016, col train loss 148.745


Epoch 183: 0batch [00:00, ?batch/s]

epoch 182: avg test  loss 595.90, bar  test loss 3.463, len  test loss 0.427, col  test loss 158.744


Epoch 183: 272batch [00:35,  7.65batch/s, loss=516]


epoch 183: avg train loss 500.96, bar train loss 2.299, len train loss 0.015, col train loss 148.739


Epoch 184: 0batch [00:00, ?batch/s]

epoch 183: avg test  loss 600.52, bar  test loss 3.455, len  test loss 0.473, col  test loss 158.780


Epoch 184: 272batch [00:35,  7.62batch/s, loss=535]


epoch 184: avg train loss 500.81, bar train loss 2.300, len train loss 0.016, col train loss 148.700


Epoch 185: 1batch [00:00,  7.63batch/s, loss=501]

epoch 184: avg test  loss 596.90, bar  test loss 3.466, len  test loss 0.434, col  test loss 158.773


Epoch 185: 272batch [00:35,  7.65batch/s, loss=490]


epoch 185: avg train loss 501.00, bar train loss 2.307, len train loss 0.016, col train loss 148.723
epoch 185: avg test  loss 606.31, bar  test loss 3.482, len  test loss 0.518, col  test loss 158.781


Epoch 186: 272batch [00:35,  7.66batch/s, loss=486]


epoch 186: avg train loss 500.65, bar train loss 2.298, len train loss 0.016, col train loss 148.675


Epoch 187: 1batch [00:00,  7.41batch/s, loss=510]

epoch 186: avg test  loss 604.31, bar  test loss 3.483, len  test loss 0.510, col  test loss 158.706


Epoch 187: 272batch [00:35,  7.65batch/s, loss=536]


epoch 187: avg train loss 500.70, bar train loss 2.299, len train loss 0.015, col train loss 148.666


Epoch 188: 1batch [00:00,  7.58batch/s, loss=497]

epoch 187: avg test  loss 600.91, bar  test loss 3.469, len  test loss 0.470, col  test loss 158.716


Epoch 188: 272batch [00:35,  7.65batch/s, loss=521]


epoch 188: avg train loss 500.59, bar train loss 2.299, len train loss 0.015, col train loss 148.677


Epoch 189: 1batch [00:00,  7.81batch/s, loss=508]

epoch 188: avg test  loss 598.62, bar  test loss 3.482, len  test loss 0.453, col  test loss 158.801


Epoch 189: 272batch [00:35,  7.61batch/s, loss=515]


epoch 189: avg train loss 500.37, bar train loss 2.293, len train loss 0.016, col train loss 148.624


Epoch 190: 1batch [00:00,  7.19batch/s, loss=495]

epoch 189: avg test  loss 601.00, bar  test loss 3.475, len  test loss 0.478, col  test loss 158.849


Epoch 190: 272batch [00:34,  7.82batch/s, loss=546]


epoch 190: avg train loss 500.38, bar train loss 2.297, len train loss 0.016, col train loss 148.589
epoch 190: avg test  loss 600.44, bar  test loss 3.494, len  test loss 0.453, col  test loss 158.882


Epoch 191: 272batch [00:34,  7.85batch/s, loss=534]


epoch 191: avg train loss 500.37, bar train loss 2.292, len train loss 0.016, col train loss 148.588


Epoch 192: 1batch [00:00,  7.69batch/s, loss=499]

epoch 191: avg test  loss 605.43, bar  test loss 3.486, len  test loss 0.519, col  test loss 158.878


Epoch 192: 272batch [00:34,  7.86batch/s, loss=558]


epoch 192: avg train loss 499.94, bar train loss 2.288, len train loss 0.015, col train loss 148.544


Epoch 193: 1batch [00:00,  7.81batch/s, loss=515]

epoch 192: avg test  loss 604.26, bar  test loss 3.492, len  test loss 0.508, col  test loss 158.813


Epoch 193: 272batch [00:34,  7.87batch/s, loss=556]


epoch 193: avg train loss 499.89, bar train loss 2.286, len train loss 0.015, col train loss 148.528


Epoch 194: 1batch [00:00,  7.75batch/s, loss=505]

epoch 193: avg test  loss 606.73, bar  test loss 3.498, len  test loss 0.523, col  test loss 158.828


Epoch 194: 272batch [00:34,  7.82batch/s, loss=464]


epoch 194: avg train loss 499.81, bar train loss 2.286, len train loss 0.016, col train loss 148.506


Epoch 195: 1batch [00:00,  7.75batch/s, loss=516]

epoch 194: avg test  loss 603.36, bar  test loss 3.498, len  test loss 0.483, col  test loss 159.009


Epoch 195: 272batch [00:34,  7.84batch/s, loss=493]


epoch 195: avg train loss 499.83, bar train loss 2.283, len train loss 0.016, col train loss 148.544
epoch 195: avg test  loss 604.83, bar  test loss 3.518, len  test loss 0.511, col  test loss 158.893


Epoch 196: 272batch [00:34,  7.86batch/s, loss=464]


epoch 196: avg train loss 499.48, bar train loss 2.282, len train loss 0.016, col train loss 148.459


Epoch 197: 1batch [00:00,  7.75batch/s, loss=476]

epoch 196: avg test  loss 608.76, bar  test loss 3.517, len  test loss 0.540, col  test loss 158.928


Epoch 197: 272batch [00:34,  7.84batch/s, loss=484]


epoch 197: avg train loss 499.53, bar train loss 2.281, len train loss 0.015, col train loss 148.462


Epoch 198: 1batch [00:00,  7.63batch/s, loss=504]

epoch 197: avg test  loss 605.44, bar  test loss 3.498, len  test loss 0.520, col  test loss 158.853


Epoch 198: 272batch [00:34,  7.85batch/s, loss=518]


epoch 198: avg train loss 499.16, bar train loss 2.276, len train loss 0.015, col train loss 148.394


Epoch 199: 1batch [00:00,  7.75batch/s, loss=469]

epoch 198: avg test  loss 599.27, bar  test loss 3.517, len  test loss 0.453, col  test loss 158.951


Epoch 199: 272batch [00:34,  7.85batch/s, loss=526]


epoch 199: avg train loss 499.38, bar train loss 2.278, len train loss 0.016, col train loss 148.412


Epoch 200: 1batch [00:00,  7.52batch/s, loss=499]

epoch 199: avg test  loss 604.47, bar  test loss 3.528, len  test loss 0.504, col  test loss 158.942


Epoch 200: 272batch [00:34,  7.84batch/s, loss=481]


epoch 200: avg train loss 499.11, bar train loss 2.276, len train loss 0.015, col train loss 148.389
epoch 200: avg test  loss 602.58, bar  test loss 3.542, len  test loss 0.475, col  test loss 159.123


Epoch 201: 272batch [00:34,  7.83batch/s, loss=519]


epoch 201: avg train loss 499.09, bar train loss 2.274, len train loss 0.015, col train loss 148.404


Epoch 202: 1batch [00:00,  7.69batch/s, loss=518]

epoch 201: avg test  loss 602.43, bar  test loss 3.517, len  test loss 0.480, col  test loss 159.065


Epoch 202: 272batch [00:34,  7.82batch/s, loss=483]


epoch 202: avg train loss 499.01, bar train loss 2.274, len train loss 0.015, col train loss 148.360


Epoch 203: 1batch [00:00,  7.41batch/s, loss=499]

epoch 202: avg test  loss 601.00, bar  test loss 3.508, len  test loss 0.469, col  test loss 158.866


Epoch 203: 272batch [00:34,  7.81batch/s, loss=500]


epoch 203: avg train loss 499.01, bar train loss 2.274, len train loss 0.015, col train loss 148.367


Epoch 204: 1batch [00:00,  7.69batch/s, loss=489]

epoch 203: avg test  loss 598.42, bar  test loss 3.498, len  test loss 0.441, col  test loss 159.001


Epoch 204: 272batch [00:35,  7.77batch/s, loss=505]


epoch 204: avg train loss 498.95, bar train loss 2.272, len train loss 0.015, col train loss 148.363


Epoch 205: 1batch [00:00,  8.00batch/s, loss=505]

epoch 204: avg test  loss 605.12, bar  test loss 3.517, len  test loss 0.497, col  test loss 158.990


Epoch 205: 272batch [00:34,  7.80batch/s, loss=508]


epoch 205: avg train loss 498.76, bar train loss 2.269, len train loss 0.015, col train loss 148.306
epoch 205: avg test  loss 600.05, bar  test loss 3.518, len  test loss 0.444, col  test loss 159.030


Epoch 206: 272batch [00:34,  7.79batch/s, loss=542]


epoch 206: avg train loss 498.59, bar train loss 2.265, len train loss 0.015, col train loss 148.312


Epoch 207: 1batch [00:00,  7.81batch/s, loss=500]

epoch 206: avg test  loss 599.38, bar  test loss 3.522, len  test loss 0.447, col  test loss 158.976


Epoch 207: 272batch [00:34,  7.78batch/s, loss=529]


epoch 207: avg train loss 498.56, bar train loss 2.263, len train loss 0.015, col train loss 148.316


Epoch 208: 1batch [00:00,  7.58batch/s, loss=501]

epoch 207: avg test  loss 605.89, bar  test loss 3.535, len  test loss 0.506, col  test loss 159.078


Epoch 208: 272batch [00:35,  7.77batch/s, loss=484]


epoch 208: avg train loss 498.41, bar train loss 2.262, len train loss 0.015, col train loss 148.268


Epoch 209: 1batch [00:00,  7.58batch/s, loss=484]

epoch 208: avg test  loss 602.62, bar  test loss 3.522, len  test loss 0.470, col  test loss 158.942


Epoch 209: 272batch [00:35,  7.77batch/s, loss=502]


epoch 209: avg train loss 498.42, bar train loss 2.260, len train loss 0.015, col train loss 148.317


Epoch 210: 1batch [00:00,  7.41batch/s, loss=506]

epoch 209: avg test  loss 602.70, bar  test loss 3.535, len  test loss 0.480, col  test loss 158.988


Epoch 210: 272batch [00:35,  7.77batch/s, loss=523]


epoch 210: avg train loss 498.50, bar train loss 2.260, len train loss 0.016, col train loss 148.288
epoch 210: avg test  loss 605.96, bar  test loss 3.533, len  test loss 0.509, col  test loss 159.067


Epoch 211: 272batch [00:35,  7.77batch/s, loss=503]


epoch 211: avg train loss 498.13, bar train loss 2.254, len train loss 0.015, col train loss 148.235


Epoch 212: 1batch [00:00,  7.58batch/s, loss=490]

epoch 211: avg test  loss 602.97, bar  test loss 3.547, len  test loss 0.472, col  test loss 158.977


Epoch 212: 272batch [00:35,  7.77batch/s, loss=469]


epoch 212: avg train loss 498.04, bar train loss 2.253, len train loss 0.015, col train loss 148.218


Epoch 213: 1batch [00:00,  7.75batch/s, loss=494]

epoch 212: avg test  loss 606.79, bar  test loss 3.542, len  test loss 0.503, col  test loss 159.183


Epoch 213: 272batch [00:35,  7.76batch/s, loss=519]


epoch 213: avg train loss 497.89, bar train loss 2.253, len train loss 0.015, col train loss 148.160


Epoch 214: 1batch [00:00,  7.87batch/s, loss=493]

epoch 213: avg test  loss 604.03, bar  test loss 3.568, len  test loss 0.481, col  test loss 159.194


Epoch 214: 272batch [00:35,  7.75batch/s, loss=483]


epoch 214: avg train loss 498.07, bar train loss 2.257, len train loss 0.015, col train loss 148.214


Epoch 215: 1batch [00:00,  7.52batch/s, loss=503]

epoch 214: avg test  loss 603.61, bar  test loss 3.554, len  test loss 0.482, col  test loss 159.075


Epoch 215: 272batch [00:35,  7.73batch/s, loss=521]


epoch 215: avg train loss 497.77, bar train loss 2.251, len train loss 0.015, col train loss 148.174
epoch 215: avg test  loss 600.97, bar  test loss 3.564, len  test loss 0.457, col  test loss 159.133


Epoch 216: 272batch [00:35,  7.75batch/s, loss=497]


epoch 216: avg train loss 497.89, bar train loss 2.250, len train loss 0.015, col train loss 148.208


Epoch 217: 1batch [00:00,  7.69batch/s, loss=493]

epoch 216: avg test  loss 606.46, bar  test loss 3.560, len  test loss 0.510, col  test loss 159.119


Epoch 217: 272batch [00:35,  7.76batch/s, loss=538]


epoch 217: avg train loss 497.71, bar train loss 2.250, len train loss 0.015, col train loss 148.131


Epoch 218: 1batch [00:00,  7.58batch/s, loss=513]

epoch 217: avg test  loss 605.27, bar  test loss 3.562, len  test loss 0.501, col  test loss 159.164


Epoch 218: 272batch [00:35,  7.70batch/s, loss=522]


epoch 218: avg train loss 497.45, bar train loss 2.246, len train loss 0.014, col train loss 148.122


Epoch 219: 1batch [00:00,  7.63batch/s, loss=474]

epoch 218: avg test  loss 604.39, bar  test loss 3.562, len  test loss 0.485, col  test loss 159.230


Epoch 219: 272batch [00:35,  7.73batch/s, loss=551]


epoch 219: avg train loss 497.44, bar train loss 2.246, len train loss 0.015, col train loss 148.080


Epoch 220: 1batch [00:00,  7.52batch/s, loss=491]

epoch 219: avg test  loss 599.75, bar  test loss 3.577, len  test loss 0.445, col  test loss 159.143


Epoch 220: 272batch [00:35,  7.66batch/s, loss=488]


epoch 220: avg train loss 497.56, bar train loss 2.243, len train loss 0.015, col train loss 148.146
epoch 220: avg test  loss 607.75, bar  test loss 3.568, len  test loss 0.519, col  test loss 159.131


Epoch 221: 272batch [00:35,  7.76batch/s, loss=491]


epoch 221: avg train loss 497.31, bar train loss 2.241, len train loss 0.015, col train loss 148.078


Epoch 222: 1batch [00:00,  7.75batch/s, loss=496]

epoch 221: avg test  loss 603.60, bar  test loss 3.581, len  test loss 0.478, col  test loss 159.240


Epoch 222: 272batch [00:35,  7.75batch/s, loss=508]


epoch 222: avg train loss 497.38, bar train loss 2.243, len train loss 0.015, col train loss 148.103


Epoch 223: 1batch [00:00,  7.52batch/s, loss=498]

epoch 222: avg test  loss 611.68, bar  test loss 3.579, len  test loss 0.554, col  test loss 159.214


Epoch 223: 272batch [00:35,  7.73batch/s, loss=497]


epoch 223: avg train loss 496.95, bar train loss 2.240, len train loss 0.015, col train loss 148.008


Epoch 224: 1batch [00:00,  7.87batch/s, loss=503]

epoch 223: avg test  loss 604.19, bar  test loss 3.575, len  test loss 0.483, col  test loss 159.186


Epoch 224: 272batch [00:35,  7.70batch/s, loss=505]


epoch 224: avg train loss 497.04, bar train loss 2.241, len train loss 0.015, col train loss 148.015


Epoch 225: 1batch [00:00,  7.81batch/s, loss=502]

epoch 224: avg test  loss 608.80, bar  test loss 3.584, len  test loss 0.521, col  test loss 159.158


Epoch 225: 272batch [00:35,  7.69batch/s, loss=514]


epoch 225: avg train loss 497.08, bar train loss 2.239, len train loss 0.014, col train loss 148.061
epoch 225: avg test  loss 605.06, bar  test loss 3.575, len  test loss 0.487, col  test loss 159.203


Epoch 226: 272batch [00:35,  7.70batch/s, loss=476]


epoch 226: avg train loss 497.06, bar train loss 2.237, len train loss 0.015, col train loss 148.025


Epoch 227: 1batch [00:00,  7.41batch/s, loss=471]

epoch 226: avg test  loss 605.23, bar  test loss 3.580, len  test loss 0.488, col  test loss 159.217


Epoch 227: 272batch [00:35,  7.68batch/s, loss=478]


epoch 227: avg train loss 497.12, bar train loss 2.238, len train loss 0.014, col train loss 148.062


Epoch 228: 1batch [00:00,  7.35batch/s, loss=490]

epoch 227: avg test  loss 604.30, bar  test loss 3.576, len  test loss 0.470, col  test loss 159.260


Epoch 228: 272batch [00:35,  7.70batch/s, loss=492]


epoch 228: avg train loss 496.99, bar train loss 2.234, len train loss 0.015, col train loss 148.041


Epoch 229: 1batch [00:00,  7.58batch/s, loss=502]

epoch 228: avg test  loss 605.53, bar  test loss 3.580, len  test loss 0.490, col  test loss 159.269


Epoch 229: 272batch [00:35,  7.57batch/s, loss=499]


epoch 229: avg train loss 496.61, bar train loss 2.231, len train loss 0.014, col train loss 147.973


Epoch 230: 1batch [00:00,  7.52batch/s, loss=492]

epoch 229: avg test  loss 609.81, bar  test loss 3.590, len  test loss 0.529, col  test loss 159.453


Epoch 230: 272batch [00:35,  7.64batch/s, loss=490]


epoch 230: avg train loss 496.49, bar train loss 2.226, len train loss 0.014, col train loss 147.963
epoch 230: avg test  loss 609.75, bar  test loss 3.616, len  test loss 0.527, col  test loss 159.327


Epoch 231: 272batch [00:35,  7.61batch/s, loss=500]


epoch 231: avg train loss 496.44, bar train loss 2.229, len train loss 0.014, col train loss 147.956


Epoch 232: 1batch [00:00,  7.58batch/s, loss=505]

epoch 231: avg test  loss 606.29, bar  test loss 3.582, len  test loss 0.504, col  test loss 159.234


Epoch 232: 272batch [00:35,  7.65batch/s, loss=501]


epoch 232: avg train loss 496.41, bar train loss 2.220, len train loss 0.014, col train loss 147.983


Epoch 233: 1batch [00:00,  7.52batch/s, loss=479]

epoch 232: avg test  loss 609.44, bar  test loss 3.599, len  test loss 0.529, col  test loss 159.253


Epoch 233: 272batch [00:35,  7.67batch/s, loss=510]


epoch 233: avg train loss 496.34, bar train loss 2.226, len train loss 0.014, col train loss 147.914


Epoch 234: 1batch [00:00,  7.52batch/s, loss=481]

epoch 233: avg test  loss 605.60, bar  test loss 3.583, len  test loss 0.490, col  test loss 159.278


Epoch 234: 272batch [00:35,  7.67batch/s, loss=517]


epoch 234: avg train loss 496.29, bar train loss 2.221, len train loss 0.014, col train loss 147.952


Epoch 235: 1batch [00:00,  7.63batch/s, loss=472]

epoch 234: avg test  loss 609.04, bar  test loss 3.612, len  test loss 0.517, col  test loss 159.433


Epoch 235: 272batch [00:35,  7.66batch/s, loss=474]


epoch 235: avg train loss 496.24, bar train loss 2.221, len train loss 0.014, col train loss 147.931
epoch 235: avg test  loss 608.01, bar  test loss 3.592, len  test loss 0.516, col  test loss 159.298


Epoch 236: 272batch [00:35,  7.67batch/s, loss=483]


epoch 236: avg train loss 496.02, bar train loss 2.220, len train loss 0.014, col train loss 147.875


Epoch 237: 1batch [00:00,  7.58batch/s, loss=503]

epoch 236: avg test  loss 610.23, bar  test loss 3.617, len  test loss 0.532, col  test loss 159.403


Epoch 237: 272batch [00:35,  7.64batch/s, loss=482]


epoch 237: avg train loss 496.08, bar train loss 2.219, len train loss 0.014, col train loss 147.874


Epoch 238: 1batch [00:00,  7.58batch/s, loss=497]

epoch 237: avg test  loss 605.80, bar  test loss 3.602, len  test loss 0.491, col  test loss 159.314


Epoch 238: 272batch [00:35,  7.64batch/s, loss=501]


epoch 238: avg train loss 495.88, bar train loss 2.217, len train loss 0.014, col train loss 147.849


Epoch 239: 1batch [00:00,  7.52batch/s, loss=494]

epoch 238: avg test  loss 608.44, bar  test loss 3.619, len  test loss 0.513, col  test loss 159.389


Epoch 239: 272batch [00:35,  7.63batch/s, loss=512]


epoch 239: avg train loss 495.81, bar train loss 2.219, len train loss 0.014, col train loss 147.824


Epoch 240: 1batch [00:00,  7.81batch/s, loss=485]

epoch 239: avg test  loss 607.54, bar  test loss 3.604, len  test loss 0.499, col  test loss 159.426


Epoch 240: 272batch [00:35,  7.63batch/s, loss=508]


epoch 240: avg train loss 495.63, bar train loss 2.209, len train loss 0.014, col train loss 147.826
epoch 240: avg test  loss 603.64, bar  test loss 3.608, len  test loss 0.466, col  test loss 159.212


Epoch 241: 272batch [00:35,  7.64batch/s, loss=486]


epoch 241: avg train loss 495.62, bar train loss 2.212, len train loss 0.015, col train loss 147.786


Epoch 242: 1batch [00:00,  7.46batch/s, loss=482]

epoch 241: avg test  loss 601.89, bar  test loss 3.609, len  test loss 0.450, col  test loss 159.421


Epoch 242: 272batch [00:35,  7.62batch/s, loss=512]


epoch 242: avg train loss 495.58, bar train loss 2.214, len train loss 0.014, col train loss 147.796


Epoch 243: 1batch [00:00,  7.46batch/s, loss=506]

epoch 242: avg test  loss 609.94, bar  test loss 3.633, len  test loss 0.516, col  test loss 159.504


Epoch 243: 272batch [00:35,  7.60batch/s, loss=463]


epoch 243: avg train loss 495.94, bar train loss 2.214, len train loss 0.015, col train loss 147.871


Epoch 244: 1batch [00:00,  7.35batch/s, loss=503]

epoch 243: avg test  loss 604.37, bar  test loss 3.630, len  test loss 0.465, col  test loss 159.378


Epoch 244: 272batch [00:35,  7.57batch/s, loss=468]


epoch 244: avg train loss 495.65, bar train loss 2.211, len train loss 0.014, col train loss 147.847


Epoch 245: 1batch [00:00,  7.52batch/s, loss=488]

epoch 244: avg test  loss 604.60, bar  test loss 3.622, len  test loss 0.469, col  test loss 159.593


Epoch 245: 272batch [00:35,  7.57batch/s, loss=523]


epoch 245: avg train loss 495.51, bar train loss 2.209, len train loss 0.014, col train loss 147.784
epoch 245: avg test  loss 602.93, bar  test loss 3.639, len  test loss 0.451, col  test loss 159.408


Epoch 246: 272batch [00:35,  7.61batch/s, loss=493]


epoch 246: avg train loss 495.34, bar train loss 2.207, len train loss 0.014, col train loss 147.772


Epoch 247: 1batch [00:00,  7.19batch/s, loss=508]

epoch 246: avg test  loss 607.55, bar  test loss 3.629, len  test loss 0.499, col  test loss 159.515


Epoch 247: 272batch [00:35,  7.60batch/s, loss=510]


epoch 247: avg train loss 495.25, bar train loss 2.208, len train loss 0.014, col train loss 147.734


Epoch 248: 1batch [00:00,  7.46batch/s, loss=472]

epoch 247: avg test  loss 611.54, bar  test loss 3.630, len  test loss 0.533, col  test loss 159.343


Epoch 248: 272batch [00:35,  7.58batch/s, loss=522]


epoch 248: avg train loss 495.41, bar train loss 2.208, len train loss 0.014, col train loss 147.781


Epoch 249: 1batch [00:00,  7.58batch/s, loss=496]

epoch 248: avg test  loss 610.07, bar  test loss 3.658, len  test loss 0.515, col  test loss 159.529


Epoch 249: 272batch [00:35,  7.58batch/s, loss=489]


epoch 249: avg train loss 495.00, bar train loss 2.200, len train loss 0.014, col train loss 147.740


Epoch 250: 1batch [00:00,  7.41batch/s, loss=499]

epoch 249: avg test  loss 603.99, bar  test loss 3.626, len  test loss 0.462, col  test loss 159.441


Epoch 250: 272batch [00:35,  7.57batch/s, loss=537]


epoch 250: avg train loss 495.08, bar train loss 2.202, len train loss 0.014, col train loss 147.735
epoch 250: avg test  loss 610.26, bar  test loss 3.644, len  test loss 0.517, col  test loss 159.581


Epoch 251: 272batch [00:35,  7.56batch/s, loss=452]


epoch 251: avg train loss 495.15, bar train loss 2.205, len train loss 0.014, col train loss 147.715


Epoch 252: 1batch [00:00,  7.58batch/s, loss=485]

epoch 251: avg test  loss 607.91, bar  test loss 3.644, len  test loss 0.496, col  test loss 159.406


Epoch 252: 272batch [00:35,  7.57batch/s, loss=492]


epoch 252: avg train loss 495.06, bar train loss 2.204, len train loss 0.014, col train loss 147.697


Epoch 253: 1batch [00:00,  7.46batch/s, loss=499]

epoch 252: avg test  loss 613.02, bar  test loss 3.638, len  test loss 0.553, col  test loss 159.465


Epoch 253: 272batch [00:35,  7.57batch/s, loss=470]


epoch 253: avg train loss 494.65, bar train loss 2.193, len train loss 0.014, col train loss 147.672


Epoch 254: 1batch [00:00,  7.14batch/s, loss=475]

epoch 253: avg test  loss 612.25, bar  test loss 3.657, len  test loss 0.542, col  test loss 159.554


Epoch 254: 272batch [00:35,  7.56batch/s, loss=523]


epoch 254: avg train loss 494.68, bar train loss 2.194, len train loss 0.014, col train loss 147.668


Epoch 255: 1batch [00:00,  7.58batch/s, loss=482]

epoch 254: avg test  loss 605.36, bar  test loss 3.652, len  test loss 0.475, col  test loss 159.475


Epoch 255: 272batch [00:36,  7.53batch/s, loss=510]


epoch 255: avg train loss 494.68, bar train loss 2.194, len train loss 0.014, col train loss 147.650
epoch 255: avg test  loss 606.92, bar  test loss 3.671, len  test loss 0.482, col  test loss 159.520


Epoch 256: 272batch [00:35,  7.57batch/s, loss=486]


epoch 256: avg train loss 494.63, bar train loss 2.192, len train loss 0.013, col train loss 147.664


Epoch 257: 1batch [00:00,  7.41batch/s, loss=507]

epoch 256: avg test  loss 607.85, bar  test loss 3.640, len  test loss 0.497, col  test loss 159.443


Epoch 257: 272batch [00:35,  7.56batch/s, loss=521]


epoch 257: avg train loss 494.33, bar train loss 2.189, len train loss 0.014, col train loss 147.614


Epoch 258: 1batch [00:00,  7.69batch/s, loss=492]

epoch 257: avg test  loss 607.29, bar  test loss 3.624, len  test loss 0.473, col  test loss 159.488


Epoch 258: 272batch [00:36,  7.53batch/s, loss=495]


epoch 258: avg train loss 494.58, bar train loss 2.196, len train loss 0.013, col train loss 147.628


Epoch 259: 1batch [00:00,  7.14batch/s, loss=491]

epoch 258: avg test  loss 604.32, bar  test loss 3.648, len  test loss 0.456, col  test loss 159.494


Epoch 259: 272batch [00:36,  7.53batch/s, loss=502]


epoch 259: avg train loss 494.53, bar train loss 2.193, len train loss 0.014, col train loss 147.612


Epoch 260: 1batch [00:00,  7.52batch/s, loss=497]

epoch 259: avg test  loss 610.28, bar  test loss 3.680, len  test loss 0.512, col  test loss 159.589


Epoch 260: 272batch [00:36,  7.43batch/s, loss=483]


epoch 260: avg train loss 494.25, bar train loss 2.188, len train loss 0.013, col train loss 147.580
epoch 260: avg test  loss 608.13, bar  test loss 3.678, len  test loss 0.493, col  test loss 159.790


Epoch 261: 272batch [00:37,  7.21batch/s, loss=545]


epoch 261: avg train loss 494.67, bar train loss 2.192, len train loss 0.014, col train loss 147.699


Epoch 262: 0batch [00:00, ?batch/s]

epoch 261: avg test  loss 613.13, bar  test loss 3.675, len  test loss 0.535, col  test loss 159.790


Epoch 262: 272batch [00:36,  7.44batch/s, loss=509]


epoch 262: avg train loss 494.04, bar train loss 2.185, len train loss 0.014, col train loss 147.541


Epoch 263: 0batch [00:00, ?batch/s]

epoch 262: avg test  loss 611.00, bar  test loss 3.665, len  test loss 0.525, col  test loss 159.516


Epoch 263: 272batch [00:37,  7.28batch/s, loss=521]


epoch 263: avg train loss 494.37, bar train loss 2.190, len train loss 0.013, col train loss 147.609


Epoch 264: 1batch [00:00,  7.09batch/s, loss=468]

epoch 263: avg test  loss 607.31, bar  test loss 3.686, len  test loss 0.483, col  test loss 159.578


Epoch 264: 272batch [00:37,  7.30batch/s, loss=501]


epoch 264: avg train loss 494.05, bar train loss 2.184, len train loss 0.014, col train loss 147.547


Epoch 265: 1batch [00:00,  7.35batch/s, loss=509]

epoch 264: avg test  loss 611.78, bar  test loss 3.666, len  test loss 0.514, col  test loss 159.441


Epoch 265: 272batch [00:37,  7.31batch/s, loss=502]


epoch 265: avg train loss 493.94, bar train loss 2.182, len train loss 0.014, col train loss 147.522
epoch 265: avg test  loss 607.32, bar  test loss 3.663, len  test loss 0.484, col  test loss 159.562


Epoch 266: 272batch [00:37,  7.30batch/s, loss=469]


epoch 266: avg train loss 493.97, bar train loss 2.182, len train loss 0.013, col train loss 147.554


Epoch 267: 1batch [00:00,  7.30batch/s, loss=501]

epoch 266: avg test  loss 608.45, bar  test loss 3.696, len  test loss 0.493, col  test loss 159.688


Epoch 267: 272batch [00:37,  7.30batch/s, loss=484]


epoch 267: avg train loss 493.68, bar train loss 2.175, len train loss 0.013, col train loss 147.498


Epoch 268: 1batch [00:00,  7.19batch/s, loss=498]

epoch 267: avg test  loss 609.63, bar  test loss 3.688, len  test loss 0.500, col  test loss 159.553


Epoch 268: 272batch [00:37,  7.32batch/s, loss=467]


epoch 268: avg train loss 493.99, bar train loss 2.181, len train loss 0.014, col train loss 147.551


Epoch 269: 1batch [00:00,  7.09batch/s, loss=496]

epoch 268: avg test  loss 609.66, bar  test loss 3.669, len  test loss 0.502, col  test loss 159.618


Epoch 269: 272batch [00:37,  7.27batch/s, loss=513]


epoch 269: avg train loss 493.70, bar train loss 2.178, len train loss 0.013, col train loss 147.477


Epoch 270: 1batch [00:00,  7.25batch/s, loss=493]

epoch 269: avg test  loss 606.31, bar  test loss 3.683, len  test loss 0.474, col  test loss 159.616


Epoch 270: 272batch [00:37,  7.27batch/s, loss=529]


epoch 270: avg train loss 493.55, bar train loss 2.177, len train loss 0.013, col train loss 147.452
epoch 270: avg test  loss 611.72, bar  test loss 3.696, len  test loss 0.529, col  test loss 159.586


Epoch 271: 272batch [00:37,  7.32batch/s, loss=467]


epoch 271: avg train loss 493.70, bar train loss 2.180, len train loss 0.013, col train loss 147.498


Epoch 272: 1batch [00:00,  7.52batch/s, loss=516]

epoch 271: avg test  loss 606.25, bar  test loss 3.669, len  test loss 0.479, col  test loss 159.680


Epoch 272: 272batch [00:37,  7.25batch/s, loss=484]


epoch 272: avg train loss 493.64, bar train loss 2.177, len train loss 0.013, col train loss 147.500


Epoch 273: 1batch [00:00,  7.19batch/s, loss=500]

epoch 272: avg test  loss 611.75, bar  test loss 3.686, len  test loss 0.527, col  test loss 159.664


Epoch 273: 272batch [00:37,  7.28batch/s, loss=564]


epoch 273: avg train loss 493.49, bar train loss 2.174, len train loss 0.013, col train loss 147.470


Epoch 274: 1batch [00:00,  6.76batch/s, loss=498]

epoch 273: avg test  loss 607.71, bar  test loss 3.691, len  test loss 0.482, col  test loss 159.745


Epoch 274: 272batch [00:37,  7.27batch/s, loss=513]


epoch 274: avg train loss 493.56, bar train loss 2.179, len train loss 0.013, col train loss 147.462


Epoch 275: 1batch [00:00,  7.30batch/s, loss=504]

epoch 274: avg test  loss 611.54, bar  test loss 3.710, len  test loss 0.519, col  test loss 159.790


Epoch 275: 272batch [00:37,  7.26batch/s, loss=487]


epoch 275: avg train loss 493.45, bar train loss 2.176, len train loss 0.014, col train loss 147.456
epoch 275: avg test  loss 607.88, bar  test loss 3.697, len  test loss 0.484, col  test loss 159.769


Epoch 276: 272batch [00:37,  7.27batch/s, loss=515]


epoch 276: avg train loss 493.20, bar train loss 2.166, len train loss 0.014, col train loss 147.396


Epoch 277: 1batch [00:00,  7.30batch/s, loss=483]

epoch 276: avg test  loss 610.17, bar  test loss 3.699, len  test loss 0.509, col  test loss 159.618


Epoch 277: 272batch [00:37,  7.27batch/s, loss=488]


epoch 277: avg train loss 493.17, bar train loss 2.170, len train loss 0.013, col train loss 147.391


Epoch 278: 1batch [00:00,  7.52batch/s, loss=511]

epoch 277: avg test  loss 611.07, bar  test loss 3.712, len  test loss 0.507, col  test loss 159.778


Epoch 278: 272batch [00:37,  7.28batch/s, loss=527]


epoch 278: avg train loss 493.20, bar train loss 2.167, len train loss 0.013, col train loss 147.427


Epoch 279: 1batch [00:00,  7.52batch/s, loss=478]

epoch 278: avg test  loss 609.46, bar  test loss 3.719, len  test loss 0.488, col  test loss 159.707


Epoch 279: 272batch [00:37,  7.26batch/s, loss=482]


epoch 279: avg train loss 493.56, bar train loss 2.176, len train loss 0.013, col train loss 147.484


Epoch 280: 1batch [00:00,  7.25batch/s, loss=495]

epoch 279: avg test  loss 608.09, bar  test loss 3.709, len  test loss 0.484, col  test loss 159.705


Epoch 280: 272batch [00:37,  7.25batch/s, loss=486]


epoch 280: avg train loss 493.26, bar train loss 2.173, len train loss 0.013, col train loss 147.430
epoch 280: avg test  loss 609.29, bar  test loss 3.696, len  test loss 0.499, col  test loss 159.697


Epoch 281: 272batch [00:37,  7.26batch/s, loss=531]


epoch 281: avg train loss 493.26, bar train loss 2.172, len train loss 0.013, col train loss 147.444


Epoch 282: 1batch [00:00,  7.09batch/s, loss=482]

epoch 281: avg test  loss 609.46, bar  test loss 3.692, len  test loss 0.499, col  test loss 159.707


Epoch 282: 272batch [00:37,  7.27batch/s, loss=505]


epoch 282: avg train loss 492.85, bar train loss 2.164, len train loss 0.013, col train loss 147.343


Epoch 283: 1batch [00:00,  7.04batch/s, loss=498]

epoch 282: avg test  loss 609.78, bar  test loss 3.695, len  test loss 0.504, col  test loss 159.669


Epoch 283: 272batch [00:37,  7.25batch/s, loss=548]


epoch 283: avg train loss 492.92, bar train loss 2.164, len train loss 0.013, col train loss 147.367


Epoch 284: 1batch [00:00,  7.09batch/s, loss=481]

epoch 283: avg test  loss 606.83, bar  test loss 3.700, len  test loss 0.476, col  test loss 159.774


Epoch 284: 272batch [00:37,  7.26batch/s, loss=520]


epoch 284: avg train loss 492.93, bar train loss 2.166, len train loss 0.013, col train loss 147.378


Epoch 285: 1batch [00:00,  6.99batch/s, loss=511]

epoch 284: avg test  loss 609.09, bar  test loss 3.729, len  test loss 0.490, col  test loss 159.774


Epoch 285: 272batch [00:37,  7.23batch/s, loss=517]


epoch 285: avg train loss 492.88, bar train loss 2.165, len train loss 0.013, col train loss 147.366
epoch 285: avg test  loss 605.90, bar  test loss 3.704, len  test loss 0.465, col  test loss 159.650


Epoch 286: 272batch [00:37,  7.24batch/s, loss=490]


epoch 286: avg train loss 492.79, bar train loss 2.163, len train loss 0.013, col train loss 147.351


Epoch 287: 1batch [00:00,  6.85batch/s, loss=468]

epoch 286: avg test  loss 608.19, bar  test loss 3.733, len  test loss 0.483, col  test loss 159.743


Epoch 287: 272batch [00:37,  7.24batch/s, loss=530]


epoch 287: avg train loss 492.85, bar train loss 2.165, len train loss 0.013, col train loss 147.352


Epoch 288: 1batch [00:00,  7.09batch/s, loss=484]

epoch 287: avg test  loss 608.22, bar  test loss 3.717, len  test loss 0.479, col  test loss 159.636


Epoch 288: 272batch [00:37,  7.23batch/s, loss=473]


epoch 288: avg train loss 492.62, bar train loss 2.162, len train loss 0.013, col train loss 147.301


Epoch 289: 1batch [00:00,  7.30batch/s, loss=483]

epoch 288: avg test  loss 609.11, bar  test loss 3.718, len  test loss 0.480, col  test loss 159.597


Epoch 289: 272batch [00:37,  7.22batch/s, loss=477]


epoch 289: avg train loss 492.62, bar train loss 2.161, len train loss 0.013, col train loss 147.307


Epoch 290: 1batch [00:00,  7.09batch/s, loss=519]

epoch 289: avg test  loss 610.32, bar  test loss 3.737, len  test loss 0.501, col  test loss 159.930


Epoch 290: 272batch [00:37,  7.21batch/s, loss=463]


epoch 290: avg train loss 492.60, bar train loss 2.161, len train loss 0.013, col train loss 147.318
epoch 290: avg test  loss 605.26, bar  test loss 3.727, len  test loss 0.449, col  test loss 159.840


Epoch 291: 272batch [00:37,  7.24batch/s, loss=518]


epoch 291: avg train loss 492.48, bar train loss 2.160, len train loss 0.013, col train loss 147.289


Epoch 292: 1batch [00:00,  7.04batch/s, loss=489]

epoch 291: avg test  loss 611.87, bar  test loss 3.729, len  test loss 0.498, col  test loss 159.835


Epoch 292: 272batch [00:37,  7.25batch/s, loss=503]


epoch 292: avg train loss 492.80, bar train loss 2.164, len train loss 0.014, col train loss 147.324


Epoch 293: 1batch [00:00,  7.25batch/s, loss=482]

epoch 292: avg test  loss 609.16, bar  test loss 3.740, len  test loss 0.484, col  test loss 159.852


Epoch 293: 272batch [00:37,  7.23batch/s, loss=514]


epoch 293: avg train loss 492.39, bar train loss 2.160, len train loss 0.013, col train loss 147.261


Epoch 294: 1batch [00:00,  7.14batch/s, loss=487]

epoch 293: avg test  loss 610.39, bar  test loss 3.724, len  test loss 0.499, col  test loss 159.755


Epoch 294: 272batch [00:37,  7.19batch/s, loss=538]


epoch 294: avg train loss 492.30, bar train loss 2.157, len train loss 0.013, col train loss 147.254


Epoch 295: 0batch [00:00, ?batch/s]

epoch 294: avg test  loss 611.51, bar  test loss 3.743, len  test loss 0.509, col  test loss 159.750


Epoch 295: 272batch [00:38,  7.16batch/s, loss=537]


epoch 295: avg train loss 492.33, bar train loss 2.160, len train loss 0.013, col train loss 147.232
epoch 295: avg test  loss 606.67, bar  test loss 3.725, len  test loss 0.455, col  test loss 159.794


Epoch 296: 272batch [00:37,  7.20batch/s, loss=498]


epoch 296: avg train loss 492.30, bar train loss 2.158, len train loss 0.013, col train loss 147.254


Epoch 297: 1batch [00:00,  7.04batch/s, loss=476]

epoch 296: avg test  loss 611.30, bar  test loss 3.738, len  test loss 0.509, col  test loss 159.700


Epoch 297: 272batch [00:37,  7.23batch/s, loss=493]


epoch 297: avg train loss 492.07, bar train loss 2.152, len train loss 0.013, col train loss 147.220


Epoch 298: 1batch [00:00,  7.41batch/s, loss=490]

epoch 297: avg test  loss 608.87, bar  test loss 3.753, len  test loss 0.475, col  test loss 159.927


Epoch 298: 272batch [00:37,  7.21batch/s, loss=505]


epoch 298: avg train loss 492.23, bar train loss 2.154, len train loss 0.013, col train loss 147.251


Epoch 299: 1batch [00:00,  7.14batch/s, loss=501]

epoch 298: avg test  loss 609.12, bar  test loss 3.748, len  test loss 0.476, col  test loss 159.837


Epoch 299: 272batch [00:37,  7.21batch/s, loss=478]


epoch 299: avg train loss 492.12, bar train loss 2.154, len train loss 0.013, col train loss 147.227


Epoch 300: 1batch [00:00,  6.99batch/s, loss=490]

epoch 299: avg test  loss 612.76, bar  test loss 3.758, len  test loss 0.517, col  test loss 159.822


Epoch 300: 272batch [00:37,  7.19batch/s, loss=446]


epoch 300: avg train loss 492.07, bar train loss 2.153, len train loss 0.013, col train loss 147.218
epoch 300: avg test  loss 612.67, bar  test loss 3.773, len  test loss 0.515, col  test loss 159.858


Epoch 301: 272batch [00:37,  7.16batch/s, loss=515]


epoch 301: avg train loss 492.15, bar train loss 2.158, len train loss 0.013, col train loss 147.201


Epoch 302: 1batch [00:00,  7.46batch/s, loss=490]

epoch 301: avg test  loss 610.78, bar  test loss 3.763, len  test loss 0.498, col  test loss 159.903


Epoch 302: 272batch [00:38,  7.16batch/s, loss=540]


epoch 302: avg train loss 491.84, bar train loss 2.147, len train loss 0.013, col train loss 147.170


Epoch 303: 1batch [00:00,  7.14batch/s, loss=499]

epoch 302: avg test  loss 608.79, bar  test loss 3.736, len  test loss 0.478, col  test loss 159.810


Epoch 303: 272batch [00:37,  7.17batch/s, loss=510]


epoch 303: avg train loss 491.91, bar train loss 2.150, len train loss 0.013, col train loss 147.164


Epoch 304: 1batch [00:00,  6.99batch/s, loss=492]

epoch 303: avg test  loss 608.63, bar  test loss 3.745, len  test loss 0.475, col  test loss 159.839


Epoch 304: 272batch [00:37,  7.17batch/s, loss=465]


epoch 304: avg train loss 491.92, bar train loss 2.148, len train loss 0.013, col train loss 147.225


Epoch 305: 1batch [00:00,  7.04batch/s, loss=476]

epoch 304: avg test  loss 610.92, bar  test loss 3.762, len  test loss 0.502, col  test loss 159.788


Epoch 305: 272batch [00:37,  7.16batch/s, loss=494]


epoch 305: avg train loss 491.90, bar train loss 2.149, len train loss 0.013, col train loss 147.189
epoch 305: avg test  loss 613.15, bar  test loss 3.771, len  test loss 0.519, col  test loss 160.015


Epoch 306: 272batch [00:37,  7.18batch/s, loss=485]


epoch 306: avg train loss 491.85, bar train loss 2.149, len train loss 0.013, col train loss 147.189


Epoch 307: 1batch [00:00,  7.19batch/s, loss=486]

epoch 306: avg test  loss 609.37, bar  test loss 3.749, len  test loss 0.483, col  test loss 159.805


Epoch 307: 272batch [00:38,  7.15batch/s, loss=488]


epoch 307: avg train loss 491.70, bar train loss 2.148, len train loss 0.012, col train loss 147.158


Epoch 308: 1batch [00:00,  7.14batch/s, loss=499]

epoch 307: avg test  loss 608.80, bar  test loss 3.771, len  test loss 0.477, col  test loss 159.939


Epoch 308: 272batch [00:38,  7.15batch/s, loss=506]


epoch 308: avg train loss 491.59, bar train loss 2.144, len train loss 0.013, col train loss 147.147


Epoch 309: 1batch [00:00,  7.09batch/s, loss=494]

epoch 308: avg test  loss 606.94, bar  test loss 3.759, len  test loss 0.461, col  test loss 159.829


Epoch 309: 272batch [00:38,  7.12batch/s, loss=496]


epoch 309: avg train loss 491.53, bar train loss 2.145, len train loss 0.012, col train loss 147.130


Epoch 310: 1batch [00:00,  6.71batch/s, loss=473]

epoch 309: avg test  loss 614.29, bar  test loss 3.753, len  test loss 0.532, col  test loss 159.914


Epoch 310: 272batch [00:38,  7.14batch/s, loss=476]


epoch 310: avg train loss 491.42, bar train loss 2.139, len train loss 0.013, col train loss 147.112
epoch 310: avg test  loss 609.99, bar  test loss 3.773, len  test loss 0.486, col  test loss 160.005


Epoch 311: 272batch [00:38,  7.14batch/s, loss=517]


epoch 311: avg train loss 491.49, bar train loss 2.144, len train loss 0.013, col train loss 147.116


Epoch 312: 1batch [00:00,  6.80batch/s, loss=469]

epoch 311: avg test  loss 612.85, bar  test loss 3.761, len  test loss 0.513, col  test loss 160.040


Epoch 312: 272batch [00:38,  7.13batch/s, loss=532]


epoch 312: avg train loss 491.47, bar train loss 2.141, len train loss 0.013, col train loss 147.119


Epoch 313: 1batch [00:00,  7.46batch/s, loss=489]

epoch 312: avg test  loss 615.46, bar  test loss 3.789, len  test loss 0.533, col  test loss 159.958


Epoch 313: 272batch [00:38,  7.14batch/s, loss=515]


epoch 313: avg train loss 491.55, bar train loss 2.139, len train loss 0.013, col train loss 147.167


Epoch 314: 1batch [00:00,  7.04batch/s, loss=491]

epoch 313: avg test  loss 611.03, bar  test loss 3.771, len  test loss 0.496, col  test loss 159.947


Epoch 314: 272batch [00:38,  7.14batch/s, loss=486]


epoch 314: avg train loss 491.14, bar train loss 2.135, len train loss 0.013, col train loss 147.080


Epoch 315: 1batch [00:00,  6.80batch/s, loss=513]

epoch 314: avg test  loss 608.84, bar  test loss 3.780, len  test loss 0.472, col  test loss 159.922


Epoch 315: 272batch [00:38,  7.11batch/s, loss=494]


epoch 315: avg train loss 491.25, bar train loss 2.139, len train loss 0.013, col train loss 147.079
epoch 315: avg test  loss 614.25, bar  test loss 3.751, len  test loss 0.532, col  test loss 159.918


Epoch 316: 272batch [00:38,  7.13batch/s, loss=511]


epoch 316: avg train loss 491.20, bar train loss 2.137, len train loss 0.013, col train loss 147.090


Epoch 317: 1batch [00:00,  6.90batch/s, loss=516]

epoch 316: avg test  loss 613.44, bar  test loss 3.764, len  test loss 0.516, col  test loss 160.124


Epoch 317: 272batch [00:38,  7.04batch/s, loss=487]


epoch 317: avg train loss 491.33, bar train loss 2.138, len train loss 0.013, col train loss 147.118


Epoch 318: 1batch [00:00,  6.71batch/s, loss=495]

epoch 317: avg test  loss 612.15, bar  test loss 3.776, len  test loss 0.508, col  test loss 159.939


Epoch 318: 272batch [00:38,  7.08batch/s, loss=506]


epoch 318: avg train loss 491.17, bar train loss 2.137, len train loss 0.013, col train loss 147.075


Epoch 319: 1batch [00:00,  7.25batch/s, loss=481]

epoch 318: avg test  loss 615.50, bar  test loss 3.785, len  test loss 0.529, col  test loss 160.083


Epoch 319: 272batch [00:38,  7.11batch/s, loss=542]


epoch 319: avg train loss 491.57, bar train loss 2.143, len train loss 0.013, col train loss 147.171


Epoch 320: 1batch [00:00,  6.99batch/s, loss=470]

epoch 319: avg test  loss 615.24, bar  test loss 3.778, len  test loss 0.532, col  test loss 160.061


Epoch 320: 272batch [00:38,  7.11batch/s, loss=482]


epoch 320: avg train loss 491.07, bar train loss 2.134, len train loss 0.012, col train loss 147.079
epoch 320: avg test  loss 609.43, bar  test loss 3.783, len  test loss 0.476, col  test loss 160.049


Epoch 321: 272batch [00:38,  7.08batch/s, loss=513]


epoch 321: avg train loss 490.91, bar train loss 2.131, len train loss 0.012, col train loss 147.057


Epoch 322: 1batch [00:00,  6.90batch/s, loss=486]

epoch 321: avg test  loss 611.77, bar  test loss 3.781, len  test loss 0.497, col  test loss 159.956


Epoch 322: 272batch [00:38,  7.08batch/s, loss=491]


epoch 322: avg train loss 491.35, bar train loss 2.139, len train loss 0.013, col train loss 147.117


Epoch 323: 1batch [00:00,  6.99batch/s, loss=479]

epoch 322: avg test  loss 612.77, bar  test loss 3.783, len  test loss 0.510, col  test loss 159.884


Epoch 323: 272batch [00:38,  7.09batch/s, loss=447]


epoch 323: avg train loss 491.10, bar train loss 2.140, len train loss 0.013, col train loss 147.035


Epoch 324: 1batch [00:00,  7.30batch/s, loss=485]

epoch 323: avg test  loss 615.50, bar  test loss 3.775, len  test loss 0.539, col  test loss 159.957


Epoch 324: 272batch [00:38,  7.06batch/s, loss=514]


epoch 324: avg train loss 490.55, bar train loss 2.126, len train loss 0.012, col train loss 146.967


Epoch 325: 1batch [00:00,  7.41batch/s, loss=485]

epoch 324: avg test  loss 610.75, bar  test loss 3.802, len  test loss 0.485, col  test loss 159.981


Epoch 325: 272batch [00:38,  7.04batch/s, loss=497]


epoch 325: avg train loss 490.55, bar train loss 2.123, len train loss 0.012, col train loss 146.991
epoch 325: avg test  loss 611.36, bar  test loss 3.811, len  test loss 0.488, col  test loss 160.023


Epoch 326: 272batch [00:38,  7.07batch/s, loss=473]


epoch 326: avg train loss 490.79, bar train loss 2.131, len train loss 0.012, col train loss 147.020


Epoch 327: 1batch [00:00,  7.19batch/s, loss=471]

epoch 326: avg test  loss 608.99, bar  test loss 3.798, len  test loss 0.469, col  test loss 160.086


Epoch 327: 272batch [00:38,  7.05batch/s, loss=495]


epoch 327: avg train loss 490.71, bar train loss 2.129, len train loss 0.012, col train loss 147.015


Epoch 328: 1batch [00:00,  7.14batch/s, loss=493]

epoch 327: avg test  loss 613.99, bar  test loss 3.781, len  test loss 0.520, col  test loss 160.018


Epoch 328: 272batch [00:38,  7.05batch/s, loss=503]


epoch 328: avg train loss 490.69, bar train loss 2.126, len train loss 0.013, col train loss 146.997


Epoch 329: 1batch [00:00,  6.99batch/s, loss=490]

epoch 328: avg test  loss 615.68, bar  test loss 3.815, len  test loss 0.535, col  test loss 160.009


Epoch 329: 272batch [00:38,  7.07batch/s, loss=507]


epoch 329: avg train loss 490.80, bar train loss 2.131, len train loss 0.012, col train loss 147.022


Epoch 330: 1batch [00:00,  6.94batch/s, loss=480]

epoch 329: avg test  loss 612.96, bar  test loss 3.806, len  test loss 0.509, col  test loss 160.113


Epoch 330: 272batch [00:38,  7.07batch/s, loss=477]


epoch 330: avg train loss 490.51, bar train loss 2.124, len train loss 0.012, col train loss 146.986
epoch 330: avg test  loss 617.63, bar  test loss 3.802, len  test loss 0.555, col  test loss 160.102


Epoch 331: 272batch [00:38,  7.06batch/s, loss=477]


epoch 331: avg train loss 490.81, bar train loss 2.126, len train loss 0.013, col train loss 147.073


Epoch 332: 1batch [00:00,  6.90batch/s, loss=511]

epoch 331: avg test  loss 615.07, bar  test loss 3.806, len  test loss 0.529, col  test loss 160.101


Epoch 332: 272batch [00:38,  7.04batch/s, loss=527]


epoch 332: avg train loss 490.86, bar train loss 2.131, len train loss 0.013, col train loss 147.061


Epoch 333: 1batch [00:00,  7.04batch/s, loss=493]

epoch 332: avg test  loss 614.68, bar  test loss 3.787, len  test loss 0.528, col  test loss 160.033


Epoch 333: 272batch [00:38,  7.02batch/s, loss=473]


epoch 333: avg train loss 490.61, bar train loss 2.127, len train loss 0.012, col train loss 147.001


Epoch 334: 1batch [00:00,  7.14batch/s, loss=464]

epoch 333: avg test  loss 615.49, bar  test loss 3.812, len  test loss 0.529, col  test loss 160.100


Epoch 334: 272batch [00:38,  7.02batch/s, loss=535]


epoch 334: avg train loss 490.35, bar train loss 2.124, len train loss 0.012, col train loss 146.950


Epoch 335: 1batch [00:00,  6.94batch/s, loss=500]

epoch 334: avg test  loss 611.96, bar  test loss 3.824, len  test loss 0.495, col  test loss 160.069


Epoch 335: 272batch [00:38,  7.04batch/s, loss=525]


epoch 335: avg train loss 490.65, bar train loss 2.129, len train loss 0.012, col train loss 146.998
epoch 335: avg test  loss 617.32, bar  test loss 3.820, len  test loss 0.547, col  test loss 160.202


Epoch 336: 272batch [00:38,  7.02batch/s, loss=506]


epoch 336: avg train loss 490.40, bar train loss 2.126, len train loss 0.012, col train loss 146.947


Epoch 337: 1batch [00:00,  6.94batch/s, loss=502]

epoch 336: avg test  loss 613.73, bar  test loss 3.819, len  test loss 0.509, col  test loss 160.125


Epoch 337: 272batch [00:38,  7.04batch/s, loss=511]


epoch 337: avg train loss 490.42, bar train loss 2.126, len train loss 0.012, col train loss 146.964


Epoch 338: 1batch [00:00,  6.94batch/s, loss=497]

epoch 337: avg test  loss 610.85, bar  test loss 3.798, len  test loss 0.488, col  test loss 160.067


Epoch 338: 272batch [00:38,  7.02batch/s, loss=512]


epoch 338: avg train loss 490.40, bar train loss 2.122, len train loss 0.013, col train loss 146.972


Epoch 339: 1batch [00:00,  6.71batch/s, loss=480]

epoch 338: avg test  loss 615.98, bar  test loss 3.833, len  test loss 0.534, col  test loss 160.165


Epoch 339: 272batch [00:38,  7.01batch/s, loss=494]


epoch 339: avg train loss 490.41, bar train loss 2.125, len train loss 0.013, col train loss 146.963


Epoch 340: 1batch [00:00,  6.85batch/s, loss=462]

epoch 339: avg test  loss 613.90, bar  test loss 3.797, len  test loss 0.517, col  test loss 160.120


Epoch 340: 272batch [00:38,  7.01batch/s, loss=516]


epoch 340: avg train loss 490.03, bar train loss 2.121, len train loss 0.013, col train loss 146.850
epoch 340: avg test  loss 614.08, bar  test loss 3.821, len  test loss 0.516, col  test loss 160.151


Epoch 341: 272batch [00:39,  6.88batch/s, loss=488]


epoch 341: avg train loss 490.29, bar train loss 2.126, len train loss 0.012, col train loss 146.925


Epoch 342: 1batch [00:00,  7.04batch/s, loss=496]

epoch 341: avg test  loss 613.38, bar  test loss 3.821, len  test loss 0.502, col  test loss 160.169


Epoch 342: 272batch [00:38,  6.98batch/s, loss=446]


epoch 342: avg train loss 490.12, bar train loss 2.118, len train loss 0.012, col train loss 146.909


Epoch 343: 1batch [00:00,  6.67batch/s, loss=469]

epoch 342: avg test  loss 614.67, bar  test loss 3.844, len  test loss 0.515, col  test loss 160.177


Epoch 343: 272batch [00:39,  6.93batch/s, loss=477]


epoch 343: avg train loss 489.99, bar train loss 2.117, len train loss 0.012, col train loss 146.902


Epoch 344: 0batch [00:00, ?batch/s, loss=500]

epoch 343: avg test  loss 615.20, bar  test loss 3.847, len  test loss 0.515, col  test loss 160.210


Epoch 344: 272batch [00:38,  6.99batch/s, loss=475]


epoch 344: avg train loss 490.35, bar train loss 2.121, len train loss 0.013, col train loss 146.960


Epoch 345: 1batch [00:00,  6.90batch/s, loss=473]

epoch 344: avg test  loss 609.25, bar  test loss 3.839, len  test loss 0.461, col  test loss 160.241


Epoch 345: 272batch [00:38,  7.02batch/s, loss=482]


epoch 345: avg train loss 490.05, bar train loss 2.121, len train loss 0.012, col train loss 146.908
epoch 345: avg test  loss 615.71, bar  test loss 3.841, len  test loss 0.524, col  test loss 160.189


Epoch 346: 272batch [00:38,  7.02batch/s, loss=513]


epoch 346: avg train loss 489.87, bar train loss 2.119, len train loss 0.012, col train loss 146.840


Epoch 347: 0batch [00:00, ?batch/s]

epoch 346: avg test  loss 616.06, bar  test loss 3.836, len  test loss 0.511, col  test loss 160.165


Epoch 347: 272batch [00:38,  7.03batch/s, loss=485]


epoch 347: avg train loss 490.06, bar train loss 2.119, len train loss 0.012, col train loss 146.914


Epoch 348: 1batch [00:00,  6.94batch/s, loss=486]

epoch 347: avg test  loss 614.60, bar  test loss 3.854, len  test loss 0.503, col  test loss 160.460


Epoch 348: 272batch [00:38,  7.03batch/s, loss=498]


epoch 348: avg train loss 489.95, bar train loss 2.119, len train loss 0.012, col train loss 146.881


Epoch 349: 1batch [00:00,  6.99batch/s, loss=482]

epoch 348: avg test  loss 614.10, bar  test loss 3.850, len  test loss 0.510, col  test loss 160.086


Epoch 349: 272batch [00:38,  7.01batch/s, loss=497]


epoch 349: avg train loss 489.81, bar train loss 2.113, len train loss 0.012, col train loss 146.869


Epoch 350: 1batch [00:00,  7.09batch/s, loss=480]

epoch 349: avg test  loss 611.07, bar  test loss 3.846, len  test loss 0.482, col  test loss 160.081


Epoch 350: 272batch [00:38,  7.03batch/s, loss=460]


epoch 350: avg train loss 489.83, bar train loss 2.117, len train loss 0.012, col train loss 146.871
epoch 350: avg test  loss 616.14, bar  test loss 3.844, len  test loss 0.523, col  test loss 160.155


Epoch 351: 272batch [00:38,  7.01batch/s, loss=498]


epoch 351: avg train loss 489.91, bar train loss 2.117, len train loss 0.012, col train loss 146.880


Epoch 352: 1batch [00:00,  6.94batch/s, loss=482]

epoch 351: avg test  loss 616.32, bar  test loss 3.843, len  test loss 0.530, col  test loss 160.111


Epoch 352: 272batch [00:38,  7.02batch/s, loss=494]


epoch 352: avg train loss 489.72, bar train loss 2.112, len train loss 0.012, col train loss 146.864


Epoch 353: 1batch [00:00,  6.54batch/s, loss=494]

epoch 352: avg test  loss 611.00, bar  test loss 3.809, len  test loss 0.481, col  test loss 160.089


Epoch 353: 272batch [00:38,  7.00batch/s, loss=515]


epoch 353: avg train loss 489.66, bar train loss 2.112, len train loss 0.012, col train loss 146.841


Epoch 354: 1batch [00:00,  6.71batch/s, loss=487]

epoch 353: avg test  loss 612.97, bar  test loss 3.848, len  test loss 0.500, col  test loss 160.120


Epoch 354: 272batch [00:38,  7.04batch/s, loss=540]


epoch 354: avg train loss 489.64, bar train loss 2.115, len train loss 0.012, col train loss 146.816


Epoch 355: 1batch [00:00,  6.67batch/s, loss=488]

epoch 354: avg test  loss 612.78, bar  test loss 3.849, len  test loss 0.492, col  test loss 160.207


Epoch 355: 272batch [00:38,  7.02batch/s, loss=494]


epoch 355: avg train loss 489.42, bar train loss 2.106, len train loss 0.012, col train loss 146.801
epoch 355: avg test  loss 615.41, bar  test loss 3.846, len  test loss 0.518, col  test loss 160.188


Epoch 356: 272batch [00:38,  7.00batch/s, loss=510]


epoch 356: avg train loss 489.53, bar train loss 2.112, len train loss 0.012, col train loss 146.811


Epoch 357: 1batch [00:00,  6.85batch/s, loss=475]

epoch 356: avg test  loss 613.11, bar  test loss 3.857, len  test loss 0.495, col  test loss 160.208


Epoch 357: 272batch [00:38,  6.98batch/s, loss=498]


epoch 357: avg train loss 489.52, bar train loss 2.111, len train loss 0.012, col train loss 146.818


Epoch 358: 1batch [00:00,  6.90batch/s, loss=515]

epoch 357: avg test  loss 611.81, bar  test loss 3.875, len  test loss 0.476, col  test loss 160.281


Epoch 358: 272batch [00:39,  6.96batch/s, loss=481]


epoch 358: avg train loss 489.54, bar train loss 2.109, len train loss 0.012, col train loss 146.817


Epoch 359: 1batch [00:00,  6.49batch/s, loss=471]

epoch 358: avg test  loss 613.77, bar  test loss 3.862, len  test loss 0.502, col  test loss 160.194


Epoch 359: 272batch [00:38,  6.99batch/s, loss=473]


epoch 359: avg train loss 489.18, bar train loss 2.104, len train loss 0.012, col train loss 146.762


Epoch 360: 1batch [00:00,  7.30batch/s, loss=483]

epoch 359: avg test  loss 617.74, bar  test loss 3.861, len  test loss 0.542, col  test loss 160.254


Epoch 360: 272batch [00:38,  6.99batch/s, loss=498]


epoch 360: avg train loss 489.42, bar train loss 2.105, len train loss 0.012, col train loss 146.832
epoch 360: avg test  loss 613.45, bar  test loss 3.857, len  test loss 0.498, col  test loss 160.225


Epoch 361: 272batch [00:38,  6.98batch/s, loss=497]


epoch 361: avg train loss 489.49, bar train loss 2.110, len train loss 0.012, col train loss 146.809


Epoch 362: 1batch [00:00,  6.90batch/s, loss=491]

epoch 361: avg test  loss 610.70, bar  test loss 3.853, len  test loss 0.474, col  test loss 160.191


Epoch 362: 272batch [00:38,  6.99batch/s, loss=503]


epoch 362: avg train loss 489.26, bar train loss 2.104, len train loss 0.012, col train loss 146.794


Epoch 363: 1batch [00:00,  6.71batch/s, loss=478]

epoch 362: avg test  loss 613.62, bar  test loss 3.859, len  test loss 0.500, col  test loss 160.205


Epoch 363: 272batch [00:38,  6.97batch/s, loss=506]


epoch 363: avg train loss 489.54, bar train loss 2.110, len train loss 0.012, col train loss 146.834


Epoch 364: 1batch [00:00,  6.76batch/s, loss=480]

epoch 363: avg test  loss 613.06, bar  test loss 3.849, len  test loss 0.496, col  test loss 160.230


Epoch 364: 272batch [00:39,  6.92batch/s, loss=499]


epoch 364: avg train loss 489.24, bar train loss 2.106, len train loss 0.012, col train loss 146.760


Epoch 365: 1batch [00:00,  7.09batch/s, loss=490]

epoch 364: avg test  loss 613.51, bar  test loss 3.863, len  test loss 0.500, col  test loss 160.228


Epoch 365: 272batch [00:39,  6.97batch/s, loss=503]


epoch 365: avg train loss 489.13, bar train loss 2.105, len train loss 0.012, col train loss 146.761
epoch 365: avg test  loss 613.58, bar  test loss 3.879, len  test loss 0.494, col  test loss 160.308


Epoch 366: 272batch [00:38,  6.98batch/s, loss=447]


epoch 366: avg train loss 489.24, bar train loss 2.110, len train loss 0.012, col train loss 146.756


Epoch 367: 1batch [00:00,  7.04batch/s, loss=489]

epoch 366: avg test  loss 617.08, bar  test loss 3.867, len  test loss 0.536, col  test loss 160.200


Epoch 367: 272batch [00:38,  6.99batch/s, loss=509]


epoch 367: avg train loss 489.09, bar train loss 2.101, len train loss 0.012, col train loss 146.740


Epoch 368: 1batch [00:00,  6.85batch/s, loss=481]

epoch 367: avg test  loss 614.80, bar  test loss 3.890, len  test loss 0.506, col  test loss 160.335


Epoch 368: 272batch [00:39,  6.97batch/s, loss=524]


epoch 368: avg train loss 489.19, bar train loss 2.101, len train loss 0.012, col train loss 146.785


Epoch 369: 1batch [00:00,  7.14batch/s, loss=490]

epoch 368: avg test  loss 611.59, bar  test loss 3.862, len  test loss 0.482, col  test loss 160.310


Epoch 369: 272batch [00:39,  6.96batch/s, loss=492]


epoch 369: avg train loss 488.86, bar train loss 2.099, len train loss 0.012, col train loss 146.703


Epoch 370: 1batch [00:00,  6.80batch/s, loss=492]

epoch 369: avg test  loss 614.16, bar  test loss 3.880, len  test loss 0.498, col  test loss 160.282


Epoch 370: 272batch [00:39,  6.95batch/s, loss=482]


epoch 370: avg train loss 489.08, bar train loss 2.102, len train loss 0.012, col train loss 146.756
epoch 370: avg test  loss 612.06, bar  test loss 3.845, len  test loss 0.483, col  test loss 160.264


Epoch 371: 272batch [00:39,  6.95batch/s, loss=504]


epoch 371: avg train loss 489.08, bar train loss 2.101, len train loss 0.012, col train loss 146.759


Epoch 372: 1batch [00:00,  6.90batch/s, loss=487]

epoch 371: avg test  loss 617.28, bar  test loss 3.887, len  test loss 0.530, col  test loss 160.331


Epoch 372: 272batch [00:39,  6.91batch/s, loss=492]


epoch 372: avg train loss 489.12, bar train loss 2.101, len train loss 0.012, col train loss 146.795


Epoch 373: 1batch [00:00,  7.04batch/s, loss=489]

epoch 372: avg test  loss 615.61, bar  test loss 3.884, len  test loss 0.514, col  test loss 160.344


Epoch 373: 272batch [00:39,  6.92batch/s, loss=534]


epoch 373: avg train loss 488.94, bar train loss 2.099, len train loss 0.012, col train loss 146.735


Epoch 374: 1batch [00:00,  7.30batch/s, loss=474]

epoch 373: avg test  loss 614.53, bar  test loss 3.878, len  test loss 0.506, col  test loss 160.250


Epoch 374: 272batch [00:39,  6.97batch/s, loss=479]


epoch 374: avg train loss 488.85, bar train loss 2.097, len train loss 0.012, col train loss 146.741


Epoch 375: 0batch [00:00, ?batch/s]

epoch 374: avg test  loss 616.40, bar  test loss 3.871, len  test loss 0.522, col  test loss 160.283


Epoch 375: 272batch [00:39,  6.89batch/s, loss=470]


epoch 375: avg train loss 488.82, bar train loss 2.094, len train loss 0.012, col train loss 146.728
epoch 375: avg test  loss 613.11, bar  test loss 3.876, len  test loss 0.488, col  test loss 160.317


Epoch 376: 272batch [00:39,  6.92batch/s, loss=547]


epoch 376: avg train loss 488.93, bar train loss 2.100, len train loss 0.012, col train loss 146.735


Epoch 377: 1batch [00:00,  6.45batch/s, loss=471]

epoch 376: avg test  loss 614.52, bar  test loss 3.874, len  test loss 0.506, col  test loss 160.266


Epoch 377: 272batch [00:39,  6.92batch/s, loss=534]


epoch 377: avg train loss 488.84, bar train loss 2.098, len train loss 0.012, col train loss 146.712


Epoch 378: 1batch [00:00,  6.67batch/s, loss=476]

epoch 377: avg test  loss 611.48, bar  test loss 3.879, len  test loss 0.472, col  test loss 160.406


Epoch 378: 272batch [00:39,  6.91batch/s, loss=502]


epoch 378: avg train loss 488.82, bar train loss 2.096, len train loss 0.013, col train loss 146.698


Epoch 379: 1batch [00:00,  6.62batch/s, loss=498]

epoch 378: avg test  loss 616.52, bar  test loss 3.905, len  test loss 0.522, col  test loss 160.374


Epoch 379: 272batch [00:39,  6.90batch/s, loss=479]


epoch 379: avg train loss 488.70, bar train loss 2.094, len train loss 0.012, col train loss 146.690


Epoch 380: 1batch [00:00,  7.25batch/s, loss=499]

epoch 379: avg test  loss 615.76, bar  test loss 3.902, len  test loss 0.510, col  test loss 160.414


Epoch 380: 272batch [00:39,  6.92batch/s, loss=482]


epoch 380: avg train loss 488.77, bar train loss 2.093, len train loss 0.012, col train loss 146.733
epoch 380: avg test  loss 617.22, bar  test loss 3.888, len  test loss 0.529, col  test loss 160.215


Epoch 381: 272batch [00:39,  6.91batch/s, loss=471]


epoch 381: avg train loss 488.75, bar train loss 2.095, len train loss 0.012, col train loss 146.714


Epoch 382: 1batch [00:00,  7.25batch/s, loss=490]

epoch 381: avg test  loss 615.05, bar  test loss 3.885, len  test loss 0.507, col  test loss 160.404


Epoch 382: 272batch [00:39,  6.90batch/s, loss=493]


epoch 382: avg train loss 488.64, bar train loss 2.094, len train loss 0.012, col train loss 146.674


Epoch 383: 1batch [00:00,  6.71batch/s, loss=487]

epoch 382: avg test  loss 614.81, bar  test loss 3.907, len  test loss 0.502, col  test loss 160.391


Epoch 383: 272batch [00:39,  6.90batch/s, loss=462]


epoch 383: avg train loss 488.64, bar train loss 2.093, len train loss 0.012, col train loss 146.702


Epoch 384: 1batch [00:00,  6.25batch/s, loss=463]

epoch 383: avg test  loss 614.49, bar  test loss 3.891, len  test loss 0.501, col  test loss 160.220


Epoch 384: 272batch [00:39,  6.89batch/s, loss=476]


epoch 384: avg train loss 488.56, bar train loss 2.090, len train loss 0.012, col train loss 146.685


Epoch 385: 1batch [00:00,  6.99batch/s, loss=491]

epoch 384: avg test  loss 613.56, bar  test loss 3.914, len  test loss 0.480, col  test loss 160.326


Epoch 385: 272batch [00:39,  6.88batch/s, loss=514]


epoch 385: avg train loss 488.54, bar train loss 2.095, len train loss 0.012, col train loss 146.647
epoch 385: avg test  loss 613.57, bar  test loss 3.903, len  test loss 0.491, col  test loss 160.302


Epoch 386: 272batch [00:39,  6.89batch/s, loss=479]


epoch 386: avg train loss 488.55, bar train loss 2.090, len train loss 0.012, col train loss 146.688


Epoch 387: 1batch [00:00,  7.14batch/s, loss=485]

epoch 386: avg test  loss 617.30, bar  test loss 3.916, len  test loss 0.524, col  test loss 160.371


Epoch 387: 272batch [00:39,  6.92batch/s, loss=489]


epoch 387: avg train loss 488.54, bar train loss 2.091, len train loss 0.011, col train loss 146.700


Epoch 388: 1batch [00:00,  6.85batch/s, loss=482]

epoch 387: avg test  loss 616.96, bar  test loss 3.898, len  test loss 0.525, col  test loss 160.303


Epoch 388: 272batch [00:39,  6.91batch/s, loss=485]


epoch 388: avg train loss 488.20, bar train loss 2.081, len train loss 0.012, col train loss 146.644


Epoch 389: 1batch [00:00,  6.71batch/s, loss=485]

epoch 388: avg test  loss 617.96, bar  test loss 3.904, len  test loss 0.532, col  test loss 160.409


Epoch 389: 272batch [00:39,  6.88batch/s, loss=503]


epoch 389: avg train loss 488.45, bar train loss 2.090, len train loss 0.012, col train loss 146.656


Epoch 390: 1batch [00:00,  6.62batch/s, loss=490]

epoch 389: avg test  loss 616.47, bar  test loss 3.908, len  test loss 0.506, col  test loss 160.423


Epoch 390: 272batch [00:39,  6.86batch/s, loss=524]


epoch 390: avg train loss 488.37, bar train loss 2.086, len train loss 0.012, col train loss 146.680
epoch 390: avg test  loss 615.42, bar  test loss 3.912, len  test loss 0.493, col  test loss 160.836


Epoch 391: 272batch [00:39,  6.89batch/s, loss=474]


epoch 391: avg train loss 488.57, bar train loss 2.092, len train loss 0.012, col train loss 146.705


Epoch 392: 1batch [00:00,  6.99batch/s, loss=476]

epoch 391: avg test  loss 617.02, bar  test loss 3.914, len  test loss 0.524, col  test loss 160.367


Epoch 392: 272batch [00:39,  6.81batch/s, loss=490]


epoch 392: avg train loss 488.31, bar train loss 2.083, len train loss 0.012, col train loss 146.656


Epoch 393: 1batch [00:00,  6.90batch/s, loss=482]

epoch 392: avg test  loss 616.15, bar  test loss 3.924, len  test loss 0.510, col  test loss 160.344


Epoch 393: 272batch [00:39,  6.87batch/s, loss=511]


epoch 393: avg train loss 488.19, bar train loss 2.087, len train loss 0.012, col train loss 146.603


Epoch 394: 1batch [00:00,  6.58batch/s, loss=472]

epoch 393: avg test  loss 615.71, bar  test loss 3.938, len  test loss 0.501, col  test loss 160.510


Epoch 394: 272batch [00:39,  6.87batch/s, loss=470]


epoch 394: avg train loss 488.36, bar train loss 2.088, len train loss 0.012, col train loss 146.644


Epoch 395: 1batch [00:00,  6.14batch/s, loss=486]

epoch 394: avg test  loss 611.54, bar  test loss 3.937, len  test loss 0.462, col  test loss 160.466


Epoch 395: 272batch [00:39,  6.87batch/s, loss=492]


epoch 395: avg train loss 488.03, bar train loss 2.080, len train loss 0.012, col train loss 146.601
epoch 395: avg test  loss 613.72, bar  test loss 3.887, len  test loss 0.491, col  test loss 160.381


Epoch 396: 272batch [00:39,  6.87batch/s, loss=478]


epoch 396: avg train loss 488.17, bar train loss 2.080, len train loss 0.012, col train loss 146.650


Epoch 397: 1batch [00:00,  6.62batch/s, loss=495]

epoch 396: avg test  loss 613.15, bar  test loss 3.914, len  test loss 0.486, col  test loss 160.253


Epoch 397: 272batch [00:39,  6.85batch/s, loss=493]


epoch 397: avg train loss 488.02, bar train loss 2.081, len train loss 0.012, col train loss 146.602


Epoch 398: 0batch [00:00, ?batch/s, loss=493]

epoch 397: avg test  loss 614.38, bar  test loss 3.920, len  test loss 0.494, col  test loss 160.354


Epoch 398: 272batch [00:39,  6.86batch/s, loss=517]


epoch 398: avg train loss 488.24, bar train loss 2.088, len train loss 0.012, col train loss 146.627


Epoch 399: 1batch [00:00,  6.49batch/s, loss=487]

epoch 398: avg test  loss 616.58, bar  test loss 3.938, len  test loss 0.498, col  test loss 160.429


Epoch 399: 272batch [00:39,  6.86batch/s, loss=491]


epoch 399: avg train loss 488.20, bar train loss 2.081, len train loss 0.012, col train loss 146.653


Epoch 400: 1batch [00:00,  6.99batch/s, loss=510]

epoch 399: avg test  loss 616.60, bar  test loss 3.925, len  test loss 0.509, col  test loss 160.425


Epoch 400: 272batch [00:39,  6.86batch/s, loss=518]


epoch 400: avg train loss 488.06, bar train loss 2.084, len train loss 0.011, col train loss 146.587
epoch 400: avg test  loss 615.35, bar  test loss 3.912, len  test loss 0.507, col  test loss 160.364


Epoch 401: 272batch [00:39,  6.83batch/s, loss=466]


epoch 401: avg train loss 488.11, bar train loss 2.077, len train loss 0.012, col train loss 146.678


Epoch 402: 1batch [00:00,  7.09batch/s, loss=496]

epoch 401: avg test  loss 614.48, bar  test loss 3.903, len  test loss 0.499, col  test loss 160.408


Epoch 402: 272batch [00:39,  6.87batch/s, loss=469]


epoch 402: avg train loss 488.06, bar train loss 2.083, len train loss 0.012, col train loss 146.587


Epoch 403: 1batch [00:00,  6.80batch/s, loss=504]

epoch 402: avg test  loss 611.66, bar  test loss 3.930, len  test loss 0.462, col  test loss 160.310


Epoch 403: 272batch [00:39,  6.85batch/s, loss=504]


epoch 403: avg train loss 487.94, bar train loss 2.079, len train loss 0.011, col train loss 146.603


Epoch 404: 1batch [00:00,  7.19batch/s, loss=482]

epoch 403: avg test  loss 618.26, bar  test loss 3.937, len  test loss 0.527, col  test loss 160.476


Epoch 404: 272batch [00:39,  6.80batch/s, loss=489]


epoch 404: avg train loss 488.20, bar train loss 2.080, len train loss 0.012, col train loss 146.678


Epoch 405: 1batch [00:00,  6.80batch/s, loss=493]

epoch 404: avg test  loss 615.93, bar  test loss 3.931, len  test loss 0.492, col  test loss 160.521


Epoch 405: 272batch [00:39,  6.83batch/s, loss=527]


epoch 405: avg train loss 487.85, bar train loss 2.078, len train loss 0.012, col train loss 146.576
epoch 405: avg test  loss 616.59, bar  test loss 3.928, len  test loss 0.511, col  test loss 160.421


Epoch 406: 272batch [00:39,  6.85batch/s, loss=512]


epoch 406: avg train loss 488.03, bar train loss 2.080, len train loss 0.012, col train loss 146.627


Epoch 407: 1batch [00:00,  6.90batch/s, loss=474]

epoch 406: avg test  loss 612.97, bar  test loss 3.908, len  test loss 0.479, col  test loss 160.541


Epoch 407: 272batch [00:39,  6.85batch/s, loss=476]


epoch 407: avg train loss 487.79, bar train loss 2.076, len train loss 0.011, col train loss 146.576


Epoch 408: 1batch [00:00,  7.30batch/s, loss=517]

epoch 407: avg test  loss 616.15, bar  test loss 3.937, len  test loss 0.497, col  test loss 160.480


Epoch 408: 272batch [00:40,  6.78batch/s, loss=474]


epoch 408: avg train loss 487.85, bar train loss 2.073, len train loss 0.011, col train loss 146.619


Epoch 409: 1batch [00:00,  6.85batch/s, loss=491]

epoch 408: avg test  loss 618.16, bar  test loss 3.932, len  test loss 0.517, col  test loss 160.702


Epoch 409: 272batch [00:40,  6.79batch/s, loss=522]


epoch 409: avg train loss 487.90, bar train loss 2.077, len train loss 0.012, col train loss 146.601


Epoch 410: 1batch [00:00,  6.80batch/s, loss=485]

epoch 409: avg test  loss 612.99, bar  test loss 3.916, len  test loss 0.471, col  test loss 160.574


Epoch 410: 272batch [00:40,  6.78batch/s, loss=524]


epoch 410: avg train loss 487.98, bar train loss 2.082, len train loss 0.012, col train loss 146.599
epoch 410: avg test  loss 613.49, bar  test loss 3.926, len  test loss 0.480, col  test loss 160.429


Epoch 411: 272batch [00:39,  6.84batch/s, loss=523]


epoch 411: avg train loss 487.81, bar train loss 2.077, len train loss 0.012, col train loss 146.572


Epoch 412: 1batch [00:00,  6.67batch/s, loss=477]

epoch 411: avg test  loss 618.59, bar  test loss 3.940, len  test loss 0.525, col  test loss 160.453


Epoch 412: 272batch [00:39,  6.83batch/s, loss=497]


epoch 412: avg train loss 487.61, bar train loss 2.075, len train loss 0.012, col train loss 146.535


Epoch 413: 1batch [00:00,  6.76batch/s, loss=474]

epoch 412: avg test  loss 617.65, bar  test loss 3.935, len  test loss 0.518, col  test loss 160.586


Epoch 413: 272batch [00:40,  6.76batch/s, loss=448]


epoch 413: avg train loss 487.70, bar train loss 2.078, len train loss 0.011, col train loss 146.545


Epoch 414: 1batch [00:00,  6.76batch/s, loss=495]

epoch 413: avg test  loss 612.48, bar  test loss 3.933, len  test loss 0.465, col  test loss 160.453


Epoch 414: 272batch [00:40,  6.79batch/s, loss=519]


epoch 414: avg train loss 487.61, bar train loss 2.074, len train loss 0.011, col train loss 146.537


Epoch 415: 1batch [00:00,  6.71batch/s, loss=496]

epoch 414: avg test  loss 615.02, bar  test loss 3.931, len  test loss 0.493, col  test loss 160.482


Epoch 415: 272batch [00:40,  6.80batch/s, loss=528]


epoch 415: avg train loss 487.60, bar train loss 2.070, len train loss 0.011, col train loss 146.564
epoch 415: avg test  loss 611.45, bar  test loss 3.952, len  test loss 0.456, col  test loss 160.505


Epoch 416: 272batch [00:40,  6.80batch/s, loss=494]


epoch 416: avg train loss 487.44, bar train loss 2.072, len train loss 0.011, col train loss 146.505


Epoch 417: 1batch [00:00,  6.45batch/s, loss=480]

epoch 416: avg test  loss 616.42, bar  test loss 3.970, len  test loss 0.501, col  test loss 160.521


Epoch 417: 272batch [00:40,  6.79batch/s, loss=475]


epoch 417: avg train loss 487.65, bar train loss 2.076, len train loss 0.011, col train loss 146.542


Epoch 418: 1batch [00:00,  6.54batch/s, loss=484]

epoch 417: avg test  loss 615.21, bar  test loss 3.942, len  test loss 0.496, col  test loss 160.502


Epoch 418: 272batch [00:40,  6.78batch/s, loss=514]


epoch 418: avg train loss 487.55, bar train loss 2.071, len train loss 0.011, col train loss 146.546


Epoch 419: 1batch [00:00,  6.67batch/s, loss=471]

epoch 418: avg test  loss 613.18, bar  test loss 3.939, len  test loss 0.470, col  test loss 160.447


Epoch 419: 272batch [00:40,  6.77batch/s, loss=455]


epoch 419: avg train loss 487.45, bar train loss 2.073, len train loss 0.011, col train loss 146.503


Epoch 420: 1batch [00:00,  6.67batch/s, loss=505]

epoch 419: avg test  loss 615.10, bar  test loss 3.934, len  test loss 0.496, col  test loss 160.470


Epoch 420: 272batch [00:40,  6.78batch/s, loss=483]


epoch 420: avg train loss 487.68, bar train loss 2.077, len train loss 0.012, col train loss 146.553
epoch 420: avg test  loss 614.84, bar  test loss 3.976, len  test loss 0.483, col  test loss 160.464


Epoch 421: 272batch [00:40,  6.79batch/s, loss=482]


epoch 421: avg train loss 487.62, bar train loss 2.070, len train loss 0.012, col train loss 146.580


Epoch 422: 0batch [00:00, ?batch/s, loss=477]

epoch 421: avg test  loss 614.63, bar  test loss 3.956, len  test loss 0.483, col  test loss 160.556


Epoch 422: 272batch [00:40,  6.76batch/s, loss=501]


epoch 422: avg train loss 487.65, bar train loss 2.073, len train loss 0.011, col train loss 146.574


Epoch 423: 1batch [00:00,  6.71batch/s, loss=474]

epoch 422: avg test  loss 617.54, bar  test loss 3.966, len  test loss 0.513, col  test loss 160.498


Epoch 423: 272batch [00:40,  6.70batch/s, loss=468]


epoch 423: avg train loss 487.77, bar train loss 2.077, len train loss 0.012, col train loss 146.547


Epoch 424: 1batch [00:00,  7.04batch/s, loss=505]

epoch 423: avg test  loss 615.53, bar  test loss 3.943, len  test loss 0.496, col  test loss 160.587


Epoch 424: 272batch [00:40,  6.80batch/s, loss=485]


epoch 424: avg train loss 487.46, bar train loss 2.068, len train loss 0.011, col train loss 146.547


Epoch 425: 1batch [00:00,  6.54batch/s, loss=473]

epoch 424: avg test  loss 614.37, bar  test loss 3.945, len  test loss 0.484, col  test loss 160.434


Epoch 425: 272batch [00:40,  6.77batch/s, loss=475]


epoch 425: avg train loss 487.61, bar train loss 2.071, len train loss 0.011, col train loss 146.575
epoch 425: avg test  loss 618.74, bar  test loss 3.954, len  test loss 0.528, col  test loss 160.561


Epoch 426: 272batch [00:39,  6.83batch/s, loss=420]


epoch 426: avg train loss 487.40, bar train loss 2.071, len train loss 0.011, col train loss 146.518


Epoch 427: 1batch [00:00,  6.54batch/s, loss=480]

epoch 426: avg test  loss 616.72, bar  test loss 3.982, len  test loss 0.493, col  test loss 160.898


Epoch 427: 272batch [00:39,  6.94batch/s, loss=511]


epoch 427: avg train loss 487.55, bar train loss 2.073, len train loss 0.012, col train loss 146.530


Epoch 428: 1batch [00:00,  6.90batch/s, loss=482]

epoch 427: avg test  loss 614.22, bar  test loss 3.951, len  test loss 0.480, col  test loss 160.657


Epoch 428: 272batch [00:39,  6.93batch/s, loss=492]


epoch 428: avg train loss 487.35, bar train loss 2.066, len train loss 0.011, col train loss 146.513


Epoch 429: 1batch [00:00,  6.76batch/s, loss=493]

epoch 428: avg test  loss 616.08, bar  test loss 3.953, len  test loss 0.497, col  test loss 160.508


Epoch 429: 272batch [00:39,  6.86batch/s, loss=499]


epoch 429: avg train loss 487.36, bar train loss 2.069, len train loss 0.011, col train loss 146.508


Epoch 430: 1batch [00:00,  6.80batch/s, loss=486]

epoch 429: avg test  loss 614.02, bar  test loss 3.959, len  test loss 0.479, col  test loss 160.448


Epoch 430: 272batch [00:39,  6.89batch/s, loss=511]


epoch 430: avg train loss 487.44, bar train loss 2.071, len train loss 0.011, col train loss 146.523
epoch 430: avg test  loss 617.45, bar  test loss 3.952, len  test loss 0.511, col  test loss 160.582


Epoch 431: 272batch [00:39,  6.92batch/s, loss=479]


epoch 431: avg train loss 487.28, bar train loss 2.067, len train loss 0.012, col train loss 146.494


Epoch 432: 1batch [00:00,  6.62batch/s, loss=478]

epoch 431: avg test  loss 615.80, bar  test loss 3.965, len  test loss 0.485, col  test loss 160.512


Epoch 432: 272batch [00:39,  6.89batch/s, loss=486]


epoch 432: avg train loss 487.46, bar train loss 2.068, len train loss 0.011, col train loss 146.563


Epoch 433: 1batch [00:00,  6.94batch/s, loss=469]

epoch 432: avg test  loss 614.73, bar  test loss 3.972, len  test loss 0.478, col  test loss 160.666


Epoch 433: 272batch [00:39,  6.88batch/s, loss=483]


epoch 433: avg train loss 487.30, bar train loss 2.069, len train loss 0.011, col train loss 146.490


Epoch 434: 1batch [00:00,  6.99batch/s, loss=497]

epoch 433: avg test  loss 614.92, bar  test loss 3.975, len  test loss 0.479, col  test loss 160.653


Epoch 434: 272batch [00:39,  6.92batch/s, loss=476]


epoch 434: avg train loss 487.23, bar train loss 2.066, len train loss 0.011, col train loss 146.495


Epoch 435: 1batch [00:00,  6.62batch/s, loss=503]

epoch 434: avg test  loss 612.84, bar  test loss 3.991, len  test loss 0.461, col  test loss 160.670


Epoch 435: 272batch [00:39,  6.89batch/s, loss=498]


epoch 435: avg train loss 487.25, bar train loss 2.064, len train loss 0.011, col train loss 146.512
epoch 435: avg test  loss 613.54, bar  test loss 3.981, len  test loss 0.463, col  test loss 160.606


Epoch 436: 272batch [00:39,  6.90batch/s, loss=455]


epoch 436: avg train loss 487.21, bar train loss 2.066, len train loss 0.012, col train loss 146.477


Epoch 437: 1batch [00:00,  6.76batch/s, loss=483]

epoch 436: avg test  loss 614.64, bar  test loss 3.980, len  test loss 0.480, col  test loss 160.639


Epoch 437: 272batch [00:39,  6.89batch/s, loss=534]


epoch 437: avg train loss 487.09, bar train loss 2.066, len train loss 0.011, col train loss 146.452


Epoch 438: 1batch [00:00,  6.66batch/s, loss=488]

epoch 437: avg test  loss 617.27, bar  test loss 3.972, len  test loss 0.507, col  test loss 160.507


Epoch 438: 272batch [00:39,  6.89batch/s, loss=456]


epoch 438: avg train loss 487.15, bar train loss 2.066, len train loss 0.011, col train loss 146.479


Epoch 439: 1batch [00:00,  7.19batch/s, loss=467]

epoch 438: avg test  loss 616.28, bar  test loss 3.957, len  test loss 0.502, col  test loss 160.586


Epoch 439: 272batch [00:39,  6.86batch/s, loss=481]


epoch 439: avg train loss 487.09, bar train loss 2.062, len train loss 0.011, col train loss 146.490


Epoch 440: 1batch [00:00,  6.62batch/s, loss=488]

epoch 439: avg test  loss 617.87, bar  test loss 3.976, len  test loss 0.506, col  test loss 160.536


Epoch 440: 272batch [00:39,  6.90batch/s, loss=508]


epoch 440: avg train loss 487.19, bar train loss 2.065, len train loss 0.012, col train loss 146.482
epoch 440: avg test  loss 620.24, bar  test loss 3.987, len  test loss 0.533, col  test loss 160.636


Epoch 441: 272batch [00:39,  6.85batch/s, loss=553]


epoch 441: avg train loss 487.14, bar train loss 2.064, len train loss 0.011, col train loss 146.488


Epoch 442: 1batch [00:00,  6.17batch/s, loss=495]

epoch 441: avg test  loss 615.21, bar  test loss 3.969, len  test loss 0.487, col  test loss 160.554


Epoch 442: 272batch [00:39,  6.86batch/s, loss=538]


epoch 442: avg train loss 486.94, bar train loss 2.062, len train loss 0.011, col train loss 146.453


Epoch 443: 1batch [00:00,  6.58batch/s, loss=499]

epoch 442: avg test  loss 616.95, bar  test loss 3.974, len  test loss 0.502, col  test loss 160.693


Epoch 443: 272batch [00:39,  6.84batch/s, loss=485]


epoch 443: avg train loss 487.17, bar train loss 2.065, len train loss 0.012, col train loss 146.473


Epoch 444: 1batch [00:00,  7.30batch/s, loss=485]

epoch 443: avg test  loss 621.25, bar  test loss 3.995, len  test loss 0.533, col  test loss 160.796


Epoch 444: 272batch [00:39,  6.83batch/s, loss=486]


epoch 444: avg train loss 487.19, bar train loss 2.066, len train loss 0.012, col train loss 146.489


Epoch 445: 1batch [00:00,  6.80batch/s, loss=489]

epoch 444: avg test  loss 616.00, bar  test loss 3.975, len  test loss 0.493, col  test loss 160.577


Epoch 445: 272batch [00:39,  6.81batch/s, loss=488]


epoch 445: avg train loss 487.07, bar train loss 2.063, len train loss 0.011, col train loss 146.482
epoch 445: avg test  loss 619.50, bar  test loss 3.975, len  test loss 0.526, col  test loss 160.652


Epoch 446: 272batch [00:39,  6.88batch/s, loss=461]


epoch 446: avg train loss 486.92, bar train loss 2.058, len train loss 0.011, col train loss 146.440


Epoch 447: 1batch [00:00,  6.99batch/s, loss=480]

epoch 446: avg test  loss 619.22, bar  test loss 3.982, len  test loss 0.526, col  test loss 160.652


Epoch 447: 272batch [00:39,  6.86batch/s, loss=489]


epoch 447: avg train loss 486.93, bar train loss 2.063, len train loss 0.011, col train loss 146.431


Epoch 448: 1batch [00:00,  6.45batch/s, loss=477]

epoch 447: avg test  loss 618.92, bar  test loss 4.003, len  test loss 0.514, col  test loss 160.675


Epoch 448: 272batch [00:40,  6.76batch/s, loss=458]


epoch 448: avg train loss 487.12, bar train loss 2.060, len train loss 0.011, col train loss 146.515


Epoch 449: 1batch [00:00,  6.80batch/s, loss=488]

epoch 448: avg test  loss 618.81, bar  test loss 3.991, len  test loss 0.516, col  test loss 160.705


Epoch 449: 272batch [00:39,  6.85batch/s, loss=488]


epoch 449: avg train loss 486.89, bar train loss 2.059, len train loss 0.011, col train loss 146.460


Epoch 450: 1batch [00:00,  6.94batch/s, loss=496]

epoch 449: avg test  loss 615.10, bar  test loss 3.980, len  test loss 0.481, col  test loss 160.648


Epoch 450: 272batch [00:39,  6.85batch/s, loss=488]


epoch 450: avg train loss 486.91, bar train loss 2.064, len train loss 0.011, col train loss 146.420
epoch 450: avg test  loss 617.13, bar  test loss 3.995, len  test loss 0.498, col  test loss 160.719


Epoch 451: 272batch [00:39,  6.84batch/s, loss=511]


epoch 451: avg train loss 486.86, bar train loss 2.059, len train loss 0.011, col train loss 146.434


Epoch 452: 1batch [00:00,  6.90batch/s, loss=490]

epoch 451: avg test  loss 616.57, bar  test loss 3.976, len  test loss 0.503, col  test loss 160.554


Epoch 452: 272batch [00:39,  6.89batch/s, loss=459]


epoch 452: avg train loss 486.94, bar train loss 2.060, len train loss 0.011, col train loss 146.465


Epoch 453: 1batch [00:00,  6.67batch/s, loss=486]

epoch 452: avg test  loss 616.55, bar  test loss 4.004, len  test loss 0.493, col  test loss 160.656


Epoch 453: 272batch [00:39,  6.80batch/s, loss=492]


epoch 453: avg train loss 486.72, bar train loss 2.055, len train loss 0.011, col train loss 146.424


Epoch 454: 1batch [00:00,  7.09batch/s, loss=483]

epoch 453: avg test  loss 617.06, bar  test loss 4.006, len  test loss 0.497, col  test loss 160.727


Epoch 454: 272batch [00:39,  6.87batch/s, loss=497]


epoch 454: avg train loss 486.72, bar train loss 2.054, len train loss 0.011, col train loss 146.428


Epoch 455: 1batch [00:00,  6.62batch/s, loss=500]

epoch 454: avg test  loss 617.66, bar  test loss 4.012, len  test loss 0.501, col  test loss 160.722


Epoch 455: 272batch [00:39,  6.81batch/s, loss=494]


epoch 455: avg train loss 486.58, bar train loss 2.054, len train loss 0.011, col train loss 146.398
epoch 455: avg test  loss 619.41, bar  test loss 3.978, len  test loss 0.525, col  test loss 160.548


Epoch 456: 272batch [00:39,  6.83batch/s, loss=452]


epoch 456: avg train loss 486.76, bar train loss 2.055, len train loss 0.011, col train loss 146.449


Epoch 457: 1batch [00:00,  6.67batch/s, loss=477]

epoch 456: avg test  loss 617.24, bar  test loss 3.975, len  test loss 0.507, col  test loss 160.662


Epoch 457: 272batch [00:39,  6.84batch/s, loss=488]


epoch 457: avg train loss 486.91, bar train loss 2.063, len train loss 0.011, col train loss 146.433


Epoch 458: 0batch [00:00, ?batch/s, loss=503]

epoch 457: avg test  loss 613.45, bar  test loss 4.002, len  test loss 0.464, col  test loss 160.609


Epoch 458: 272batch [00:39,  6.81batch/s, loss=481]


epoch 458: avg train loss 486.68, bar train loss 2.057, len train loss 0.011, col train loss 146.406


Epoch 459: 0batch [00:00, ?batch/s, loss=505]

epoch 458: avg test  loss 615.34, bar  test loss 4.001, len  test loss 0.482, col  test loss 160.659


Epoch 459: 272batch [00:40,  6.79batch/s, loss=507]


epoch 459: avg train loss 486.54, bar train loss 2.053, len train loss 0.011, col train loss 146.384


Epoch 460: 1batch [00:00,  6.10batch/s, loss=477]

epoch 459: avg test  loss 616.52, bar  test loss 3.980, len  test loss 0.498, col  test loss 160.684


Epoch 460: 272batch [00:40,  6.78batch/s, loss=464]


epoch 460: avg train loss 486.66, bar train loss 2.052, len train loss 0.011, col train loss 146.428
epoch 460: avg test  loss 616.48, bar  test loss 3.991, len  test loss 0.493, col  test loss 160.682


Epoch 461: 272batch [00:39,  6.81batch/s, loss=472]


epoch 461: avg train loss 486.86, bar train loss 2.059, len train loss 0.011, col train loss 146.453


Epoch 462: 0batch [00:00, ?batch/s, loss=520]

epoch 461: avg test  loss 617.53, bar  test loss 3.992, len  test loss 0.501, col  test loss 160.685


Epoch 462: 272batch [00:40,  6.78batch/s, loss=477]


epoch 462: avg train loss 486.64, bar train loss 2.055, len train loss 0.011, col train loss 146.401


Epoch 463: 1batch [00:00,  6.80batch/s, loss=484]

epoch 462: avg test  loss 616.30, bar  test loss 3.983, len  test loss 0.494, col  test loss 160.608


Epoch 463: 272batch [00:40,  6.79batch/s, loss=516]


epoch 463: avg train loss 486.63, bar train loss 2.049, len train loss 0.011, col train loss 146.435


Epoch 464: 0batch [00:00, ?batch/s, loss=473]

epoch 463: avg test  loss 615.47, bar  test loss 3.991, len  test loss 0.481, col  test loss 160.663


Epoch 464: 272batch [00:40,  6.77batch/s, loss=489]


epoch 464: avg train loss 486.64, bar train loss 2.053, len train loss 0.011, col train loss 146.435


Epoch 465: 0batch [00:00, ?batch/s]

epoch 464: avg test  loss 617.23, bar  test loss 4.036, len  test loss 0.493, col  test loss 160.738


Epoch 465: 272batch [00:40,  6.77batch/s, loss=518]


epoch 465: avg train loss 486.56, bar train loss 2.053, len train loss 0.011, col train loss 146.400
epoch 465: avg test  loss 617.10, bar  test loss 3.994, len  test loss 0.494, col  test loss 160.687


Epoch 466: 272batch [00:40,  6.78batch/s, loss=499]


epoch 466: avg train loss 486.36, bar train loss 2.049, len train loss 0.011, col train loss 146.364


Epoch 467: 1batch [00:00,  6.62batch/s, loss=482]

epoch 466: avg test  loss 616.44, bar  test loss 4.016, len  test loss 0.490, col  test loss 160.707


Epoch 467: 272batch [00:40,  6.78batch/s, loss=524]


epoch 467: avg train loss 486.45, bar train loss 2.051, len train loss 0.011, col train loss 146.377


Epoch 468: 1batch [00:00,  6.54batch/s, loss=464]

epoch 467: avg test  loss 614.76, bar  test loss 4.006, len  test loss 0.473, col  test loss 160.710


Epoch 468: 272batch [00:40,  6.78batch/s, loss=511]


epoch 468: avg train loss 486.44, bar train loss 2.051, len train loss 0.011, col train loss 146.376


Epoch 469: 1batch [00:00,  6.71batch/s, loss=472]

epoch 468: avg test  loss 618.07, bar  test loss 4.014, len  test loss 0.506, col  test loss 160.747


Epoch 469: 272batch [00:39,  6.80batch/s, loss=562]


epoch 469: avg train loss 486.45, bar train loss 2.051, len train loss 0.011, col train loss 146.386


Epoch 470: 1batch [00:00,  6.85batch/s, loss=468]

epoch 469: avg test  loss 616.79, bar  test loss 4.007, len  test loss 0.491, col  test loss 160.670


Epoch 470: 272batch [00:40,  6.79batch/s, loss=538]


epoch 470: avg train loss 486.45, bar train loss 2.054, len train loss 0.011, col train loss 146.370
epoch 470: avg test  loss 618.35, bar  test loss 4.006, len  test loss 0.510, col  test loss 160.637


Epoch 471: 272batch [00:39,  6.82batch/s, loss=513]


epoch 471: avg train loss 486.39, bar train loss 2.045, len train loss 0.011, col train loss 146.399


Epoch 472: 0batch [00:00, ?batch/s, loss=478]

epoch 471: avg test  loss 618.88, bar  test loss 3.998, len  test loss 0.513, col  test loss 160.666


Epoch 472: 272batch [00:39,  6.80batch/s, loss=483]


epoch 472: avg train loss 486.57, bar train loss 2.052, len train loss 0.011, col train loss 146.420


Epoch 473: 1batch [00:00,  6.80batch/s, loss=494]

epoch 472: avg test  loss 616.90, bar  test loss 4.005, len  test loss 0.496, col  test loss 160.697


Epoch 473: 272batch [00:40,  6.80batch/s, loss=468]


epoch 473: avg train loss 486.35, bar train loss 2.051, len train loss 0.011, col train loss 146.345


Epoch 474: 1batch [00:00,  6.76batch/s, loss=488]

epoch 473: avg test  loss 618.70, bar  test loss 4.041, len  test loss 0.503, col  test loss 160.820


Epoch 474: 272batch [00:40,  6.68batch/s, loss=447]


epoch 474: avg train loss 486.53, bar train loss 2.054, len train loss 0.011, col train loss 146.396


Epoch 475: 1batch [00:00,  6.49batch/s, loss=497]

epoch 474: avg test  loss 615.06, bar  test loss 4.014, len  test loss 0.472, col  test loss 160.862


Epoch 475: 272batch [00:41,  6.62batch/s, loss=468]


epoch 475: avg train loss 486.37, bar train loss 2.048, len train loss 0.011, col train loss 146.385
epoch 475: avg test  loss 617.78, bar  test loss 3.998, len  test loss 0.505, col  test loss 160.716


Epoch 476: 272batch [00:41,  6.62batch/s, loss=487]


epoch 476: avg train loss 486.52, bar train loss 2.050, len train loss 0.011, col train loss 146.416


Epoch 477: 0batch [00:00, ?batch/s, loss=486]

epoch 476: avg test  loss 614.08, bar  test loss 4.003, len  test loss 0.463, col  test loss 160.749


Epoch 477: 272batch [00:41,  6.63batch/s, loss=493]


epoch 477: avg train loss 486.51, bar train loss 2.049, len train loss 0.011, col train loss 146.421


Epoch 478: 1batch [00:00,  6.71batch/s, loss=492]

epoch 477: avg test  loss 617.74, bar  test loss 4.004, len  test loss 0.502, col  test loss 160.717


Epoch 478: 272batch [00:40,  6.64batch/s, loss=473]


epoch 478: avg train loss 486.46, bar train loss 2.049, len train loss 0.011, col train loss 146.405


Epoch 479: 1batch [00:00,  6.45batch/s, loss=490]

epoch 478: avg test  loss 617.29, bar  test loss 4.005, len  test loss 0.496, col  test loss 160.816


Epoch 479: 272batch [00:41,  6.63batch/s, loss=487]


epoch 479: avg train loss 486.30, bar train loss 2.047, len train loss 0.011, col train loss 146.362


Epoch 480: 1batch [00:00,  6.80batch/s, loss=498]

epoch 479: avg test  loss 616.81, bar  test loss 4.032, len  test loss 0.488, col  test loss 160.753


Epoch 480: 272batch [00:41,  6.60batch/s, loss=492]


epoch 480: avg train loss 486.40, bar train loss 2.048, len train loss 0.011, col train loss 146.392
epoch 480: avg test  loss 618.64, bar  test loss 4.011, len  test loss 0.509, col  test loss 160.776


Epoch 481: 272batch [00:41,  6.62batch/s, loss=482]


epoch 481: avg train loss 486.35, bar train loss 2.043, len train loss 0.011, col train loss 146.408


Epoch 482: 1batch [00:00,  6.33batch/s, loss=484]

epoch 481: avg test  loss 617.80, bar  test loss 4.033, len  test loss 0.495, col  test loss 160.827


Epoch 482: 272batch [00:41,  6.62batch/s, loss=473]


epoch 482: avg train loss 486.24, bar train loss 2.045, len train loss 0.011, col train loss 146.362


Epoch 483: 1batch [00:00,  6.41batch/s, loss=499]

epoch 482: avg test  loss 617.13, bar  test loss 4.034, len  test loss 0.489, col  test loss 160.866


Epoch 483: 272batch [00:41,  6.61batch/s, loss=488]


epoch 483: avg train loss 486.22, bar train loss 2.046, len train loss 0.011, col train loss 146.372


Epoch 484: 0batch [00:00, ?batch/s, loss=494]

epoch 483: avg test  loss 618.81, bar  test loss 4.017, len  test loss 0.507, col  test loss 160.682


Epoch 484: 272batch [00:41,  6.60batch/s, loss=525]


epoch 484: avg train loss 486.25, bar train loss 2.046, len train loss 0.011, col train loss 146.371


Epoch 485: 1batch [00:00,  6.45batch/s, loss=485]

epoch 484: avg test  loss 617.35, bar  test loss 4.034, len  test loss 0.492, col  test loss 160.761


Epoch 485: 272batch [00:41,  6.61batch/s, loss=446]


epoch 485: avg train loss 486.16, bar train loss 2.043, len train loss 0.011, col train loss 146.344
epoch 485: avg test  loss 616.81, bar  test loss 3.997, len  test loss 0.490, col  test loss 160.625


Epoch 486: 272batch [00:41,  6.57batch/s, loss=524]


epoch 486: avg train loss 486.10, bar train loss 2.045, len train loss 0.011, col train loss 146.327


Epoch 487: 1batch [00:00,  6.67batch/s, loss=478]

epoch 486: avg test  loss 618.66, bar  test loss 4.035, len  test loss 0.505, col  test loss 160.749


Epoch 487: 272batch [00:41,  6.62batch/s, loss=474]


epoch 487: avg train loss 486.23, bar train loss 2.045, len train loss 0.011, col train loss 146.384


Epoch 488: 1batch [00:00,  6.85batch/s, loss=503]

epoch 487: avg test  loss 621.31, bar  test loss 4.029, len  test loss 0.532, col  test loss 160.754


Epoch 488: 272batch [00:41,  6.60batch/s, loss=505]


epoch 488: avg train loss 486.18, bar train loss 2.043, len train loss 0.011, col train loss 146.368


Epoch 489: 1batch [00:00,  6.37batch/s, loss=482]

epoch 488: avg test  loss 620.35, bar  test loss 4.029, len  test loss 0.521, col  test loss 160.800


Epoch 489: 272batch [00:41,  6.57batch/s, loss=519]


epoch 489: avg train loss 486.28, bar train loss 2.045, len train loss 0.011, col train loss 146.397


Epoch 490: 1batch [00:00,  6.49batch/s, loss=490]

epoch 489: avg test  loss 622.17, bar  test loss 4.020, len  test loss 0.544, col  test loss 160.732


Epoch 490: 272batch [00:42,  6.35batch/s, loss=467]


epoch 490: avg train loss 486.28, bar train loss 2.045, len train loss 0.011, col train loss 146.393
epoch 490: avg test  loss 619.03, bar  test loss 4.026, len  test loss 0.510, col  test loss 160.879


Epoch 491: 272batch [00:42,  6.41batch/s, loss=478]


epoch 491: avg train loss 486.17, bar train loss 2.044, len train loss 0.011, col train loss 146.365


Epoch 492: 1batch [00:00,  6.10batch/s, loss=469]

epoch 491: avg test  loss 617.39, bar  test loss 4.043, len  test loss 0.488, col  test loss 160.782


Epoch 492: 272batch [00:41,  6.55batch/s, loss=537]


epoch 492: avg train loss 485.89, bar train loss 2.034, len train loss 0.011, col train loss 146.340


Epoch 493: 1batch [00:00,  6.45batch/s, loss=493]

epoch 492: avg test  loss 619.52, bar  test loss 4.013, len  test loss 0.517, col  test loss 160.652


Epoch 493: 272batch [00:41,  6.55batch/s, loss=482]


epoch 493: avg train loss 486.08, bar train loss 2.044, len train loss 0.011, col train loss 146.337


Epoch 494: 1batch [00:00,  6.49batch/s, loss=498]

epoch 493: avg test  loss 616.95, bar  test loss 4.028, len  test loss 0.490, col  test loss 160.820


Epoch 494: 272batch [00:41,  6.56batch/s, loss=511]


epoch 494: avg train loss 486.09, bar train loss 2.045, len train loss 0.011, col train loss 146.354


Epoch 495: 0batch [00:00, ?batch/s]

epoch 494: avg test  loss 621.29, bar  test loss 4.046, len  test loss 0.528, col  test loss 160.826


Epoch 495: 272batch [00:41,  6.55batch/s, loss=511]


epoch 495: avg train loss 485.90, bar train loss 2.040, len train loss 0.011, col train loss 146.306
epoch 495: avg test  loss 616.70, bar  test loss 4.044, len  test loss 0.484, col  test loss 160.812


Epoch 496: 272batch [00:41,  6.56batch/s, loss=498]


epoch 496: avg train loss 486.12, bar train loss 2.039, len train loss 0.011, col train loss 146.384


Epoch 497: 1batch [00:00,  6.54batch/s, loss=491]

epoch 496: avg test  loss 618.62, bar  test loss 4.056, len  test loss 0.497, col  test loss 160.942


Epoch 497: 272batch [00:41,  6.55batch/s, loss=471]


epoch 497: avg train loss 486.30, bar train loss 2.044, len train loss 0.011, col train loss 146.425


Epoch 498: 0batch [00:00, ?batch/s, loss=494]

epoch 497: avg test  loss 615.84, bar  test loss 4.031, len  test loss 0.476, col  test loss 160.825


Epoch 498: 272batch [00:41,  6.55batch/s, loss=481]


epoch 498: avg train loss 486.25, bar train loss 2.042, len train loss 0.011, col train loss 146.410


Epoch 499: 1batch [00:00,  6.25batch/s, loss=475]

epoch 498: avg test  loss 615.28, bar  test loss 4.016, len  test loss 0.474, col  test loss 160.724


Epoch 499: 272batch [00:41,  6.50batch/s, loss=483]


epoch 499: avg train loss 486.12, bar train loss 2.041, len train loss 0.011, col train loss 146.377


Epoch 500: 0batch [00:00, ?batch/s, loss=471]

epoch 499: avg test  loss 619.31, bar  test loss 4.049, len  test loss 0.505, col  test loss 160.823


Epoch 500: 272batch [00:41,  6.55batch/s, loss=534]


epoch 500: avg train loss 486.10, bar train loss 2.043, len train loss 0.011, col train loss 146.359
epoch 500: avg test  loss 618.11, bar  test loss 4.031, len  test loss 0.499, col  test loss 160.768


In [44]:
lss, lss_t = train(default_args, train_loader, test_loader, diva, optimizer, 1000,500,save_folder="new/HVAE2",save_interval=5)

Epoch 501: 272batch [00:31,  8.60batch/s, loss=466]


epoch 501: avg train loss 486.28, bar train loss 2.043, len train loss 0.011, col train loss 146.432


Epoch 502: 1batch [00:00,  8.40batch/s, loss=502]

epoch 501: avg test  loss 617.89, bar  test loss 4.047, len  test loss 0.492, col  test loss 160.964


Epoch 502: 272batch [00:31,  8.57batch/s, loss=461]


epoch 502: avg train loss 485.94, bar train loss 2.038, len train loss 0.011, col train loss 146.323


Epoch 503: 1batch [00:00,  8.47batch/s, loss=493]

epoch 502: avg test  loss 617.96, bar  test loss 4.054, len  test loss 0.493, col  test loss 160.880


Epoch 503: 272batch [00:31,  8.58batch/s, loss=480]


epoch 503: avg train loss 485.91, bar train loss 2.035, len train loss 0.011, col train loss 146.346


Epoch 504: 1batch [00:00,  8.40batch/s, loss=487]

epoch 503: avg test  loss 619.42, bar  test loss 4.043, len  test loss 0.508, col  test loss 160.795


Epoch 504: 272batch [00:31,  8.58batch/s, loss=447]


epoch 504: avg train loss 485.77, bar train loss 2.036, len train loss 0.011, col train loss 146.298


Epoch 505: 1batch [00:00,  8.40batch/s, loss=494]

epoch 504: avg test  loss 617.36, bar  test loss 4.046, len  test loss 0.489, col  test loss 160.782


Epoch 505: 272batch [00:31,  8.58batch/s, loss=469]


epoch 505: avg train loss 485.85, bar train loss 2.031, len train loss 0.011, col train loss 146.361
epoch 505: avg test  loss 618.64, bar  test loss 4.045, len  test loss 0.501, col  test loss 160.832


Epoch 506: 272batch [00:31,  8.58batch/s, loss=503]


epoch 506: avg train loss 485.87, bar train loss 2.039, len train loss 0.011, col train loss 146.305


Epoch 507: 1batch [00:00,  8.40batch/s, loss=509]

epoch 506: avg test  loss 619.46, bar  test loss 4.054, len  test loss 0.505, col  test loss 160.922


Epoch 507: 272batch [00:31,  8.57batch/s, loss=518]


epoch 507: avg train loss 486.00, bar train loss 2.040, len train loss 0.011, col train loss 146.361


Epoch 508: 1batch [00:00,  8.55batch/s, loss=476]

epoch 507: avg test  loss 617.36, bar  test loss 4.059, len  test loss 0.483, col  test loss 160.936


Epoch 508: 272batch [00:31,  8.59batch/s, loss=500]


epoch 508: avg train loss 486.15, bar train loss 2.044, len train loss 0.011, col train loss 146.375


Epoch 509: 1batch [00:00,  8.40batch/s, loss=482]

epoch 508: avg test  loss 618.08, bar  test loss 4.027, len  test loss 0.495, col  test loss 160.800


Epoch 509: 272batch [00:31,  8.59batch/s, loss=480]


epoch 509: avg train loss 485.74, bar train loss 2.038, len train loss 0.011, col train loss 146.286


Epoch 510: 1batch [00:00,  8.40batch/s, loss=500]

epoch 509: avg test  loss 620.10, bar  test loss 4.045, len  test loss 0.516, col  test loss 160.817


Epoch 510: 272batch [00:31,  8.58batch/s, loss=478]


epoch 510: avg train loss 485.85, bar train loss 2.037, len train loss 0.011, col train loss 146.301
epoch 510: avg test  loss 618.26, bar  test loss 4.050, len  test loss 0.496, col  test loss 160.822


Epoch 511: 272batch [00:31,  8.58batch/s, loss=487]


epoch 511: avg train loss 485.63, bar train loss 2.034, len train loss 0.011, col train loss 146.293


Epoch 512: 1batch [00:00,  8.47batch/s, loss=468]

epoch 511: avg test  loss 619.75, bar  test loss 4.056, len  test loss 0.509, col  test loss 160.873


Epoch 512: 272batch [00:31,  8.58batch/s, loss=456]


epoch 512: avg train loss 485.96, bar train loss 2.035, len train loss 0.011, col train loss 146.376


Epoch 513: 1batch [00:00,  8.40batch/s, loss=501]

epoch 512: avg test  loss 622.40, bar  test loss 4.054, len  test loss 0.533, col  test loss 160.904


Epoch 513: 272batch [00:31,  8.58batch/s, loss=510]


epoch 513: avg train loss 485.91, bar train loss 2.040, len train loss 0.011, col train loss 146.328


Epoch 514: 1batch [00:00,  8.40batch/s, loss=496]

epoch 513: avg test  loss 619.46, bar  test loss 4.048, len  test loss 0.506, col  test loss 160.870


Epoch 514: 272batch [00:31,  8.57batch/s, loss=530]


epoch 514: avg train loss 485.88, bar train loss 2.037, len train loss 0.011, col train loss 146.326


Epoch 515: 1batch [00:00,  8.47batch/s, loss=479]

epoch 514: avg test  loss 620.03, bar  test loss 4.034, len  test loss 0.514, col  test loss 160.939


Epoch 515: 272batch [00:31,  8.57batch/s, loss=502]


epoch 515: avg train loss 485.83, bar train loss 2.037, len train loss 0.011, col train loss 146.317
epoch 515: avg test  loss 620.24, bar  test loss 4.035, len  test loss 0.519, col  test loss 160.867


Epoch 516: 272batch [00:31,  8.56batch/s, loss=522]


epoch 516: avg train loss 485.72, bar train loss 2.028, len train loss 0.011, col train loss 146.342


Epoch 517: 1batch [00:00,  8.33batch/s, loss=496]

epoch 516: avg test  loss 616.71, bar  test loss 4.052, len  test loss 0.479, col  test loss 160.814


Epoch 517: 272batch [00:31,  8.57batch/s, loss=464]


epoch 517: avg train loss 485.77, bar train loss 2.037, len train loss 0.011, col train loss 146.309


Epoch 518: 1batch [00:00,  8.40batch/s, loss=490]

epoch 517: avg test  loss 620.71, bar  test loss 4.083, len  test loss 0.513, col  test loss 160.950


Epoch 518: 272batch [00:31,  8.56batch/s, loss=448]


epoch 518: avg train loss 485.82, bar train loss 2.033, len train loss 0.011, col train loss 146.333


Epoch 519: 1batch [00:00,  8.20batch/s, loss=472]

epoch 518: avg test  loss 619.28, bar  test loss 4.042, len  test loss 0.510, col  test loss 160.764


Epoch 519: 272batch [00:31,  8.57batch/s, loss=470]


epoch 519: avg train loss 485.70, bar train loss 2.032, len train loss 0.011, col train loss 146.302


Epoch 520: 1batch [00:00,  8.33batch/s, loss=467]

epoch 519: avg test  loss 620.93, bar  test loss 4.074, len  test loss 0.516, col  test loss 160.993


Epoch 520: 272batch [00:31,  8.57batch/s, loss=489]


epoch 520: avg train loss 485.49, bar train loss 2.027, len train loss 0.011, col train loss 146.288
epoch 520: avg test  loss 617.58, bar  test loss 4.064, len  test loss 0.485, col  test loss 160.927


Epoch 521: 272batch [00:31,  8.57batch/s, loss=501]


epoch 521: avg train loss 485.71, bar train loss 2.031, len train loss 0.011, col train loss 146.325


Epoch 522: 1batch [00:00,  8.47batch/s, loss=477]

epoch 521: avg test  loss 620.07, bar  test loss 4.063, len  test loss 0.511, col  test loss 160.853


Epoch 522: 272batch [00:31,  8.59batch/s, loss=482]


epoch 522: avg train loss 485.55, bar train loss 2.029, len train loss 0.011, col train loss 146.277


Epoch 523: 1batch [00:00,  8.47batch/s, loss=461]

epoch 522: avg test  loss 620.09, bar  test loss 4.053, len  test loss 0.513, col  test loss 160.805


Epoch 523: 272batch [00:31,  8.59batch/s, loss=502]


epoch 523: avg train loss 485.54, bar train loss 2.031, len train loss 0.011, col train loss 146.258


Epoch 524: 1batch [00:00,  8.26batch/s, loss=474]

epoch 523: avg test  loss 617.83, bar  test loss 4.080, len  test loss 0.487, col  test loss 160.924


Epoch 524: 272batch [00:31,  8.60batch/s, loss=480]


epoch 524: avg train loss 485.60, bar train loss 2.031, len train loss 0.011, col train loss 146.295


Epoch 525: 1batch [00:00,  8.47batch/s, loss=493]

epoch 524: avg test  loss 616.97, bar  test loss 4.089, len  test loss 0.474, col  test loss 160.823


Epoch 525: 272batch [00:31,  8.59batch/s, loss=465]


epoch 525: avg train loss 485.97, bar train loss 2.036, len train loss 0.011, col train loss 146.366
epoch 525: avg test  loss 619.94, bar  test loss 4.087, len  test loss 0.504, col  test loss 160.924


Epoch 526: 272batch [00:31,  8.58batch/s, loss=502]


epoch 526: avg train loss 485.77, bar train loss 2.032, len train loss 0.011, col train loss 146.335


Epoch 527: 1batch [00:00,  8.33batch/s, loss=491]

epoch 526: avg test  loss 616.30, bar  test loss 4.064, len  test loss 0.467, col  test loss 161.040


Epoch 527: 272batch [00:31,  8.58batch/s, loss=503]


epoch 527: avg train loss 485.75, bar train loss 2.028, len train loss 0.011, col train loss 146.355


Epoch 528: 1batch [00:00,  8.40batch/s, loss=462]

epoch 527: avg test  loss 617.82, bar  test loss 4.051, len  test loss 0.490, col  test loss 160.905


Epoch 528: 272batch [00:31,  8.58batch/s, loss=499]


epoch 528: avg train loss 485.76, bar train loss 2.038, len train loss 0.011, col train loss 146.305


Epoch 529: 1batch [00:00,  8.33batch/s, loss=468]

epoch 528: avg test  loss 618.94, bar  test loss 4.056, len  test loss 0.503, col  test loss 160.803


Epoch 529: 272batch [00:31,  8.58batch/s, loss=483]


epoch 529: avg train loss 485.52, bar train loss 2.028, len train loss 0.011, col train loss 146.278


Epoch 530: 1batch [00:00,  8.26batch/s, loss=482]

epoch 529: avg test  loss 618.53, bar  test loss 4.078, len  test loss 0.492, col  test loss 160.956


Epoch 530: 272batch [00:31,  8.58batch/s, loss=499]


epoch 530: avg train loss 485.58, bar train loss 2.031, len train loss 0.011, col train loss 146.287
epoch 530: avg test  loss 618.29, bar  test loss 4.061, len  test loss 0.491, col  test loss 160.940


Epoch 531: 272batch [00:31,  8.58batch/s, loss=488]


epoch 531: avg train loss 485.79, bar train loss 2.030, len train loss 0.011, col train loss 146.350


Epoch 532: 1batch [00:00,  8.47batch/s, loss=463]

epoch 531: avg test  loss 619.58, bar  test loss 4.064, len  test loss 0.503, col  test loss 160.974


Epoch 532: 272batch [00:31,  8.57batch/s, loss=462]


epoch 532: avg train loss 485.79, bar train loss 2.034, len train loss 0.011, col train loss 146.347


Epoch 533: 1batch [00:00,  8.47batch/s, loss=477]

epoch 532: avg test  loss 618.90, bar  test loss 4.082, len  test loss 0.493, col  test loss 160.937


Epoch 533: 272batch [00:31,  8.58batch/s, loss=508]


epoch 533: avg train loss 485.73, bar train loss 2.031, len train loss 0.011, col train loss 146.325


Epoch 534: 1batch [00:00,  8.40batch/s, loss=473]

epoch 533: avg test  loss 616.88, bar  test loss 4.060, len  test loss 0.477, col  test loss 160.999


Epoch 534: 272batch [00:31,  8.58batch/s, loss=476]


epoch 534: avg train loss 485.68, bar train loss 2.033, len train loss 0.011, col train loss 146.319


Epoch 535: 1batch [00:00,  8.33batch/s, loss=504]

epoch 534: avg test  loss 617.21, bar  test loss 4.065, len  test loss 0.481, col  test loss 160.869


Epoch 535: 272batch [00:31,  8.58batch/s, loss=483]


epoch 535: avg train loss 485.42, bar train loss 2.023, len train loss 0.011, col train loss 146.286
epoch 535: avg test  loss 619.36, bar  test loss 4.088, len  test loss 0.499, col  test loss 161.002


Epoch 536: 272batch [00:31,  8.57batch/s, loss=473]


epoch 536: avg train loss 485.70, bar train loss 2.027, len train loss 0.011, col train loss 146.352


Epoch 537: 1batch [00:00,  8.40batch/s, loss=501]

epoch 536: avg test  loss 619.76, bar  test loss 4.092, len  test loss 0.499, col  test loss 160.888


Epoch 537: 272batch [00:31,  8.58batch/s, loss=474]


epoch 537: avg train loss 485.71, bar train loss 2.032, len train loss 0.011, col train loss 146.331


Epoch 538: 1batch [00:00,  8.40batch/s, loss=479]

epoch 537: avg test  loss 621.45, bar  test loss 4.095, len  test loss 0.517, col  test loss 160.917


Epoch 538: 272batch [00:31,  8.56batch/s, loss=503]


epoch 538: avg train loss 485.72, bar train loss 2.026, len train loss 0.011, col train loss 146.364


Epoch 539: 1batch [00:00,  8.26batch/s, loss=480]

epoch 538: avg test  loss 618.19, bar  test loss 4.075, len  test loss 0.483, col  test loss 161.157


Epoch 539: 41batch [00:04,  8.43batch/s, loss=479]


KeyboardInterrupt: 

In [None]:
lss2, lss_t2 = train(default_args, train_loader, test_loader, diva, optimizer, 1000, 500, save_folder="VAEFC")

In [None]:
lss, lss_t = train(default_args, train_loader, test_loader, diva, optimizer, 1600, 1000, save_folder="VAEFC")

In [None]:
def plot_loss_acc(lss, lss_t):
    fig,ax = plt.subplots()
    ax.plot(lss, label="train loss")
    ax.plot(lss_t, label = "test loss")
    #ax1 = ax.twinx()
    #ax1.plot(yacc, label = "train accuracy", ls='--')
    #ax1.plot(yacc_t, label = "test accuracy", ls='--')

    lines, labels = ax.get_legend_handles_labels()
    #lines2, labels2 = ax1.get_legend_handles_labels()

    ax.legend(lines, labels)

In [None]:
plot_loss_acc(lss, lss_t)

In [None]:
plot_loss_acc(lss3, lss_t3, yacc3, yacc_t3)

In [None]:
def plot_change_latent_var(diva, lat_space="y", var_idx=[0,1,2,3,4,5,6,7], step = 5):
    a = next(enumerate(test_loader))
    with torch.no_grad():
        diva.eval()
        d = a[1][2][:len(var_idx)].to(DEVICE).float()
        x = a[1][0][:len(var_idx)].to(DEVICE).float()
        y = a[1][1][:len(var_idx)].to(DEVICE).float()

        zx, zx_sc = diva.qzx(x)
        zy, zy_sc = diva.qzy(x)
        zd, zd_sc =  diva.qzd(x)

        print(torch.max(zy), torch.min(zy), "sdmax:", torch.max(zy_sc))

        out = change(zx, zy, zd, var_idx, lat_space, diva, step)
    
    fig, ax = plt.subplots(ncols=out.shape[0],nrows=len(var_idx),figsize=(10*4*out.shape[0],10*len(var_idx)))
    for i in range(out.shape[0]):
      for j in range(len(var_idx)):
        ax[j,i].imshow(out[i,j])

In [None]:
def change(zx, zy, zd, idx, lat = "y", model=diva, step = 2):
    
    dif = np.arange(-30,15,step)
    print(torch.max(zy), torch.min(zy))
    out = np.zeros((dif.shape[0], len(idx), 25, 100 ,3))  
    #print(zy.shape, dif.shape[0])
    for i in range(dif.shape[0]):
      for j in range(len(idx)):
        if lat == "y":
            zy[j,idx] = dif[i]
        elif lat == "x":
            zx[j,idx] = dif[i]
        elif lat == "d":
            zd[j,idx] = dif[i]
        len_, bar, col = model.px(zd[j],zx[j],zy[j])
        out[i,j] = model.px.reconstruct_image(len_[None,:], bar, col)
    
    return out



In [None]:
plot_change_latent_var(diva)

In [None]:
fig,ax = plt.subplots()
ax.plot(np.arange(50,120), [i.cpu().detach().numpy() for i in lss2], label="train loss")
ax.plot(np.arange(50,120), [i.cpu().detach().numpy() for i in lss_t2], label = "testloss")
ax1 = ax.twinx()
ax1.plot(np.arange(50,120), yacc2, label = "train")
ax1.plot(np.arange(50,120), yacc_t2, label = "test")

plt.legend()

In [None]:
fig,ax = plt.subplots()
ax.plot(np.arange(120,180), [i.cpu().detach().numpy() for i in lss3], label="train loss")
ax.plot(np.arange(120,180), [i.cpu().detach().numpy() for i in lss_t3], label = "testloss")
ax1 = ax.twinx()
ax1.plot(np.arange(120,180), yacc3, label = "train",c='green')
ax1.plot(np.arange(120,180), yacc_t3, label = "test")

plt.legend()

# Model Evaluation

## Sampling from trained model

In [None]:
def plot_latent_space(lat_space="y"):
    '''
    lat_space: y, d, x
    '''

    

In [None]:
plot(x, out, 0)

In [None]:
fig, ax = plt.subplots(nrows=3, ncols=3)
for i in range(9):
  ax[i//3, i%3].imshow(x[i].cpu().permute(1,2,0))
  
plt.savefig('divastamporg.png')