In [1]:
%matplotlib inline

In [2]:
import os
import random
import sys
import codecs
import torch
import torch.autograd as autograd
import torch.nn as nn
import torch.nn.functional as F
import torch.optim as optim
import torch.utils.data as Data

from torchtext import data
from torchtext import datasets
from torchtext.vocab import GloVe

SEED = 1

torch.set_num_threads(8)
random.seed(SEED)
torch.manual_seed(SEED)

<torch._C.Generator at 0x7f55016f07e0>

In [3]:
# input: a sequence of tokens, and a token_to_index dictionary
# output: a LongTensor variable to encode the sequence of idxs
def prepare_sequence(seq, to_ix, cuda=False):
    var = autograd.Variable(torch.LongTensor([to_ix[w] for w in seq.split(' ')]).cuda())
    return var

def prepare_label(label,label_to_ix, cuda=False):
    var = autograd.Variable(torch.LongTensor([label_to_ix[label]]).cuda())
    return var

def build_token_to_ix(sentences):
    token_to_ix = dict()
    print(len(sentences))
    for sent in sentences:
        for token in sent.split(' '):
            if token not in token_to_ix:
                token_to_ix[token] = len(token_to_ix)
    token_to_ix['<pad>'] = len(token_to_ix)
    return token_to_ix

def build_label_to_ix(labels):
    label_to_ix = dict()
    for label in labels:
        if label not in label_to_ix:
            label_to_ix[label] = len(label_to_ix)

In [4]:
def load_IMDB_data():
    file_pos = './datasets/IMDB/imdb.pos'
    file_neg = './datasets/IMDB/imdb.neg'
    print('loading MR data from',file_pos,'and',file_neg)

    pos_sents = codecs.open(file_pos, 'r', 'utf8').read().split('\n')
    neg_sents = codecs.open(file_neg, 'r', 'utf8').read().split('\n')

    random.seed(SEED)
    random.shuffle(pos_sents)
    random.shuffle(neg_sents)

    print(len(pos_sents))
    print(len(neg_sents))

    train_data = [(sent,1) for sent in pos_sents[:210000]] + [(sent, 0) for sent in neg_sents[:210000]]
    dev_data = [(sent, 1) for sent in pos_sents[210000:270000]] + [(sent, 0) for sent in neg_sents[210000:270000]]
    test_data = [(sent, 1) for sent in pos_sents[270000:]] + [(sent, 0) for sent in neg_sents[270000:]]


    random.shuffle(train_data)
    random.shuffle(dev_data)
    random.shuffle(test_data)

    print('train:',len(train_data),'dev:',len(dev_data),'test:',len(test_data))

    word_to_ix = build_token_to_ix([s for s,_ in train_data+dev_data+test_data])
    label_to_ix = {0:0,1:1}
    print('vocab size:',len(word_to_ix),'label size:',len(label_to_ix))
    print('loading data done!')
    return train_data,dev_data,test_data,word_to_ix,label_to_ix

In [5]:
class LSTMClassifier(nn.Module):
    def __init__(self, embedding_dim, hidden_dim, vocab_size, label_size):
        super(LSTMClassifier, self).__init__()
        self.hidden_dim = hidden_dim
        self.word_embeddings = nn.Embedding(vocab_size, embedding_dim)
        self.lstm = nn.LSTM(embedding_dim, hidden_dim)
        self.hidden2label = nn.Linear(hidden_dim, label_size)
        self.hidden = self.init_hidden()

    def init_hidden(self):
        # the first is the hidden h
        # the second is the cell  c
        return (autograd.Variable(torch.zeros(1, 1, self.hidden_dim).cuda()),
                autograd.Variable(torch.zeros(1, 1, self.hidden_dim).cuda()))

    def forward(self, sentence):
        embeds = self.word_embeddings(sentence)
        x = embeds.view(len(sentence), 1, -1)
        lstm_out, self.hidden = self.lstm(x, self.hidden)
        y  = self.hidden2label(lstm_out[-1])
        log_probs = F.log_softmax(y)
        return log_probs

In [6]:
def get_accuracy(truth, pred):
    assert len(truth)==len(pred)
    right = 0
    for i in range(len(truth)):
        if truth[i]==pred[i]:
            right += 1.0
    return right/len(truth)

*GloVe: Global Vectors for Word Representation*

* https://nlp.stanford.edu/projects/glove/
* https://github.com/spro/practical-pytorch/blob/master/glove-word-vectors/glove-word-vectors.ipynb

In [7]:
# glove = GloVe(name='6B', dim=100)

# print('Loaded {} words'.format(len(glove.itos)))

# def get_word(word):
#     return glove.vectors[glove.stoi[word]]

# print('Embedding len: {}'.format(get_word('the').shape[0]))

In [8]:
def train():
    train_data, dev_data, test_data, word_to_ix, label_to_ix = load_IMDB_data()
    EMBEDDING_DIM = 50
    HIDDEN_DIM = 50
    EPOCH = 100
    best_dev_acc = 0.0
    model = LSTMClassifier(embedding_dim=EMBEDDING_DIM,hidden_dim=HIDDEN_DIM,
                           vocab_size=len(word_to_ix),label_size=len(label_to_ix)).cuda()
    loss_function = nn.NLLLoss()
    optimizer = optim.Adam(model.parameters(),lr = 1e-3)
    #optimizer = torch.optim.SGD(model.parameters(), lr = 1e-2)
    no_up = 0
    for i in range(EPOCH):
        random.shuffle(train_data)
        print('epoch: %d start!' % i)
        train_epoch(model, train_data, loss_function, optimizer, word_to_ix, label_to_ix, i)
        print('now best dev acc:',best_dev_acc)
        dev_acc = evaluate(model,dev_data,loss_function,word_to_ix,label_to_ix,'dev')
        test_acc = evaluate(model, test_data, loss_function, word_to_ix, label_to_ix, 'test')
        if dev_acc > best_dev_acc:
            best_dev_acc = dev_acc
            os.system('rm mr_best_model_acc_*.model')
            print('New Best Dev!!!')
            torch.save(model.state_dict(), 'best_models/mr_best_model_acc_' + str(int(test_acc*10000)) + '.model')
            no_up = 0
        else:
            no_up += 1
            if no_up >= 10:
                exit()

def evaluate(model, data, loss_function, word_to_ix, label_to_ix, name ='dev'):
    model.eval()
    avg_loss = 0.0
    truth_res = []
    pred_res = []

    for sent, label in data:
        truth_res.append(label_to_ix[label])
        # detaching it from its history on the last instance.
        model.hidden = model.init_hidden()
        sent = prepare_sequence(sent, word_to_ix)
        label = prepare_label(label, label_to_ix)
        pred = model(sent)
        pred_label = pred.data.max(1)[1].cpu().numpy()
        pred_res.append(pred_label)
        # model.zero_grad() # should I keep this when I am evaluating the model?
        loss = loss_function(pred, label)
        avg_loss += loss.data[0]
    avg_loss /= len(data)
    acc = get_accuracy(truth_res, pred_res)
    print(name + ' avg_loss:%g train acc:%g' % (avg_loss, acc ))
    return acc

In [None]:
def train_epoch(model, train_data, loss_function, optimizer, word_to_ix, label_to_ix, i):
    model.train()
    
    avg_loss = 0.0
    count = 0
    truth_res = []
    pred_res = []
    batch_sent = []

    for sent, label in train_data:
        truth_res.append(label_to_ix[label])
        # detaching it from its history on the last instance.
        model.hidden = model.init_hidden()
        sent = prepare_sequence(sent, word_to_ix)
        label = prepare_label(label, label_to_ix)
        pred = model(sent)
        pred_label = pred.data.max(1)[1].cpu().numpy()
        pred_res.append(pred_label)
        model.zero_grad()
        loss = loss_function(pred, label)
        avg_loss += loss.data[0]
        count += 1
        if count % 500 == 0:
            print('epoch: %d iterations: %d loss :%g' % (i, count, loss.data[0]))

        loss.backward()
        optimizer.step()
    avg_loss /= len(train_data)
    print('epoch: %d done! \n train avg_loss:%g , acc:%g'%(i, avg_loss, get_accuracy(truth_res,pred_res)))

In [None]:
train()

('loading MR data from', './datasets/IMDB/imdb.pos', 'and', './datasets/IMDB/imdb.neg')
300001
300001
('train:', 420000, 'dev:', 120000, 'test:', 60002)
600002
('vocab size:', 139300, 'label size:', 2)
loading data done!
epoch: 0 start!
epoch: 0 iterations: 500 loss :1.003
epoch: 0 iterations: 1000 loss :0.877521
epoch: 0 iterations: 1500 loss :0.651214
epoch: 0 iterations: 2000 loss :0.900085
epoch: 0 iterations: 2500 loss :0.926793
epoch: 0 iterations: 3000 loss :0.743511
epoch: 0 iterations: 3500 loss :0.330643
epoch: 0 iterations: 4000 loss :0.64402
epoch: 0 iterations: 4500 loss :0.42271
epoch: 0 iterations: 5000 loss :0.82321
epoch: 0 iterations: 5500 loss :0.083346
epoch: 0 iterations: 6000 loss :0.242063
epoch: 0 iterations: 6500 loss :0.77371
epoch: 0 iterations: 7000 loss :1.05399
epoch: 0 iterations: 7500 loss :1.70051
epoch: 0 iterations: 8000 loss :0.952174
epoch: 0 iterations: 8500 loss :0.67163
epoch: 0 iterations: 9000 loss :0.053081
epoch: 0 iterations: 9500 loss :0.40

epoch: 0 iterations: 96000 loss :0.532229
epoch: 0 iterations: 96500 loss :2.25317
epoch: 0 iterations: 97000 loss :1.07608
epoch: 0 iterations: 97500 loss :0.209075
epoch: 0 iterations: 98000 loss :1.05468
epoch: 0 iterations: 98500 loss :0.235083
epoch: 0 iterations: 99000 loss :0.00518775
epoch: 0 iterations: 99500 loss :0.0536507
epoch: 0 iterations: 100000 loss :0.133067
epoch: 0 iterations: 100500 loss :0.450593
epoch: 0 iterations: 101000 loss :0.570038
epoch: 0 iterations: 101500 loss :0.188487
epoch: 0 iterations: 102000 loss :3.17398
epoch: 0 iterations: 102500 loss :0.0128675
epoch: 0 iterations: 103000 loss :0.496278
epoch: 0 iterations: 103500 loss :0.0128152
epoch: 0 iterations: 104000 loss :0.408552
epoch: 0 iterations: 104500 loss :0.603786
epoch: 0 iterations: 105000 loss :0.396291
epoch: 0 iterations: 105500 loss :0.226057
epoch: 0 iterations: 106000 loss :0.0525239
epoch: 0 iterations: 106500 loss :0.344116
epoch: 0 iterations: 107000 loss :0.122477
epoch: 0 iteratio

epoch: 0 iterations: 191000 loss :0.0369941
epoch: 0 iterations: 191500 loss :0.587561
epoch: 0 iterations: 192000 loss :0.279566
epoch: 0 iterations: 192500 loss :0.0745373
epoch: 0 iterations: 193000 loss :0.00697327
epoch: 0 iterations: 193500 loss :0.663794
epoch: 0 iterations: 194000 loss :0.0330119
epoch: 0 iterations: 194500 loss :0.0217905
epoch: 0 iterations: 195000 loss :0.225823
epoch: 0 iterations: 195500 loss :0.0183609
epoch: 0 iterations: 196000 loss :0.0558445
epoch: 0 iterations: 196500 loss :0.362035
epoch: 0 iterations: 197000 loss :0.13039
epoch: 0 iterations: 197500 loss :1.07984
epoch: 0 iterations: 198000 loss :0.020242
epoch: 0 iterations: 198500 loss :0.271303
epoch: 0 iterations: 199000 loss :0.873755
epoch: 0 iterations: 199500 loss :0.0173371
epoch: 0 iterations: 200000 loss :0.0671794
epoch: 0 iterations: 200500 loss :0.377833
epoch: 0 iterations: 201000 loss :0.81986
epoch: 0 iterations: 201500 loss :0.0841663
epoch: 0 iterations: 202000 loss :0.290764
epo

epoch: 0 iterations: 286000 loss :0.0470574
epoch: 0 iterations: 286500 loss :0.733554
epoch: 0 iterations: 287000 loss :0.506438
epoch: 0 iterations: 287500 loss :0.0597062
epoch: 0 iterations: 288000 loss :0.188412
epoch: 0 iterations: 288500 loss :0.0108535
epoch: 0 iterations: 289000 loss :0.0446422
epoch: 0 iterations: 289500 loss :0.00561547
epoch: 0 iterations: 290000 loss :0.00128818
epoch: 0 iterations: 290500 loss :0.0028441
epoch: 0 iterations: 291000 loss :0.719369
epoch: 0 iterations: 291500 loss :0.112605
epoch: 0 iterations: 292000 loss :0.0110965
epoch: 0 iterations: 292500 loss :0.545538
epoch: 0 iterations: 293000 loss :0.218368
epoch: 0 iterations: 293500 loss :0.098435
epoch: 0 iterations: 294000 loss :2.07287
epoch: 0 iterations: 294500 loss :0.462462
epoch: 0 iterations: 295000 loss :0.01121
epoch: 0 iterations: 295500 loss :0.0239338
epoch: 0 iterations: 296000 loss :0.0226022
epoch: 0 iterations: 296500 loss :0.640602
epoch: 0 iterations: 297000 loss :0.445294
e

epoch: 0 iterations: 380500 loss :0.762107
epoch: 0 iterations: 381000 loss :0.0859309
epoch: 0 iterations: 381500 loss :2.53266
epoch: 0 iterations: 382000 loss :0.136538
epoch: 0 iterations: 382500 loss :0.0599158
epoch: 0 iterations: 383000 loss :0.0333769
epoch: 0 iterations: 383500 loss :0.759584
epoch: 0 iterations: 384000 loss :0.530454
epoch: 0 iterations: 384500 loss :0.00597978
epoch: 0 iterations: 385000 loss :0.669453
epoch: 0 iterations: 385500 loss :1.50037
epoch: 0 iterations: 386000 loss :1.81833
epoch: 0 iterations: 386500 loss :0.445652
epoch: 0 iterations: 387000 loss :0.0367496
epoch: 0 iterations: 387500 loss :0.20261
epoch: 0 iterations: 388000 loss :0.649222
epoch: 0 iterations: 388500 loss :0.0049746
epoch: 0 iterations: 389000 loss :0.596345
epoch: 0 iterations: 389500 loss :0.141341
epoch: 0 iterations: 390000 loss :0.135478
epoch: 0 iterations: 390500 loss :0.0524539
epoch: 0 iterations: 391000 loss :0.588154
epoch: 0 iterations: 391500 loss :0.02124
epoch: 0

epoch: 1 iterations: 54000 loss :0.0609045
epoch: 1 iterations: 54500 loss :0.00594258
epoch: 1 iterations: 55000 loss :0.645926
epoch: 1 iterations: 55500 loss :0.0735204
epoch: 1 iterations: 56000 loss :0.00471544
epoch: 1 iterations: 56500 loss :0.194472
epoch: 1 iterations: 57000 loss :0.0483602
epoch: 1 iterations: 57500 loss :0.00555634
epoch: 1 iterations: 58000 loss :0.0231297
epoch: 1 iterations: 58500 loss :0.0026474
epoch: 1 iterations: 59000 loss :0.00144458
epoch: 1 iterations: 59500 loss :0.0355017
epoch: 1 iterations: 60000 loss :0.0788051
epoch: 1 iterations: 60500 loss :0.0634056
epoch: 1 iterations: 61000 loss :0.0722837
epoch: 1 iterations: 61500 loss :0.0152822
epoch: 1 iterations: 62000 loss :0.111862
epoch: 1 iterations: 62500 loss :0.254177
epoch: 1 iterations: 63000 loss :0.0104599
epoch: 1 iterations: 63500 loss :1.46876
epoch: 1 iterations: 64000 loss :0.0181911
epoch: 1 iterations: 64500 loss :1.17425
epoch: 1 iterations: 65000 loss :0.0393149
epoch: 1 iterat

epoch: 1 iterations: 149500 loss :0.724699
epoch: 1 iterations: 150000 loss :0.62234
epoch: 1 iterations: 150500 loss :0.463721
epoch: 1 iterations: 151000 loss :0.00228882
epoch: 1 iterations: 151500 loss :2.25139
epoch: 1 iterations: 152000 loss :0.00975633
epoch: 1 iterations: 152500 loss :0.0737408
epoch: 1 iterations: 153000 loss :0.0436677
epoch: 1 iterations: 153500 loss :0.103777
epoch: 1 iterations: 154000 loss :0.54253
epoch: 1 iterations: 154500 loss :1.33116
epoch: 1 iterations: 155000 loss :0.0607666
epoch: 1 iterations: 155500 loss :1.00859
epoch: 1 iterations: 156000 loss :2.25442
epoch: 1 iterations: 156500 loss :0.674149
epoch: 1 iterations: 157000 loss :1.30573
epoch: 1 iterations: 157500 loss :0.00688291
epoch: 1 iterations: 158000 loss :2.01848
epoch: 1 iterations: 158500 loss :0.130661
epoch: 1 iterations: 159000 loss :0.0133785
epoch: 1 iterations: 159500 loss :0.68325
epoch: 1 iterations: 160000 loss :0.220456
epoch: 1 iterations: 160500 loss :0.199217
epoch: 1 i

epoch: 1 iterations: 244500 loss :0.204702
epoch: 1 iterations: 245000 loss :0.0172985
epoch: 1 iterations: 245500 loss :0.391148
epoch: 1 iterations: 246000 loss :0.0282959
epoch: 1 iterations: 246500 loss :0.0413665
epoch: 1 iterations: 247000 loss :0.0154316
epoch: 1 iterations: 247500 loss :1.61271
epoch: 1 iterations: 248000 loss :0.425256
epoch: 1 iterations: 248500 loss :0.0052402
epoch: 1 iterations: 249000 loss :0.0118206
epoch: 1 iterations: 249500 loss :0.0567212
epoch: 1 iterations: 250000 loss :0.0413041
epoch: 1 iterations: 250500 loss :0.921108
epoch: 1 iterations: 251000 loss :0.735774
epoch: 1 iterations: 251500 loss :0.531655
epoch: 1 iterations: 252000 loss :0.601263
epoch: 1 iterations: 252500 loss :0.108734
epoch: 1 iterations: 253000 loss :0.0147274
epoch: 1 iterations: 253500 loss :0.279872
epoch: 1 iterations: 254000 loss :0.271439
epoch: 1 iterations: 254500 loss :0.0305321
epoch: 1 iterations: 255000 loss :0.193869
epoch: 1 iterations: 255500 loss :0.203908
ep

epoch: 1 iterations: 339000 loss :1.07594
epoch: 1 iterations: 339500 loss :0.0129845
epoch: 1 iterations: 340000 loss :0.0191493
epoch: 1 iterations: 340500 loss :0.107282
epoch: 1 iterations: 341000 loss :0.0737511
epoch: 1 iterations: 341500 loss :0.270722
epoch: 1 iterations: 342000 loss :0.246648
epoch: 1 iterations: 342500 loss :0.141742
epoch: 1 iterations: 343000 loss :1.26862
epoch: 1 iterations: 343500 loss :0.135067
epoch: 1 iterations: 344000 loss :0.438412
epoch: 1 iterations: 344500 loss :0.00514364
epoch: 1 iterations: 345000 loss :0.176828
epoch: 1 iterations: 345500 loss :0.00224566
epoch: 1 iterations: 346000 loss :0.00519323
epoch: 1 iterations: 346500 loss :0.317089
epoch: 1 iterations: 347000 loss :2.5802
epoch: 1 iterations: 347500 loss :0.00508428
epoch: 1 iterations: 348000 loss :0.853709
epoch: 1 iterations: 348500 loss :0.572638
epoch: 1 iterations: 349000 loss :0.315435
epoch: 1 iterations: 349500 loss :0.00916004
epoch: 1 iterations: 350000 loss :0.172714
ep

epoch: 2 iterations: 12000 loss :1.47685
epoch: 2 iterations: 12500 loss :0.596444
epoch: 2 iterations: 13000 loss :0.660301
epoch: 2 iterations: 13500 loss :0.0355341
epoch: 2 iterations: 14000 loss :0.00308657
epoch: 2 iterations: 14500 loss :0.00251293
epoch: 2 iterations: 15000 loss :0.00693846
epoch: 2 iterations: 15500 loss :0.946451
epoch: 2 iterations: 16000 loss :4.78978
epoch: 2 iterations: 16500 loss :0.0447975
epoch: 2 iterations: 17000 loss :0.0057323
epoch: 2 iterations: 17500 loss :0.00631857
epoch: 2 iterations: 18000 loss :0.105951
epoch: 2 iterations: 18500 loss :0.837906
epoch: 2 iterations: 19000 loss :0.47594
epoch: 2 iterations: 19500 loss :0.0287235
epoch: 2 iterations: 20000 loss :0.00399089
epoch: 2 iterations: 20500 loss :0.0142934
epoch: 2 iterations: 21000 loss :0.0108073
epoch: 2 iterations: 21500 loss :0.0163268
epoch: 2 iterations: 22000 loss :0.00491953
epoch: 2 iterations: 22500 loss :0.0943637
epoch: 2 iterations: 23000 loss :1.60077
epoch: 2 iteration

epoch: 2 iterations: 108500 loss :0.275783
epoch: 2 iterations: 109000 loss :1.19446
epoch: 2 iterations: 109500 loss :0.0113896
epoch: 2 iterations: 110000 loss :0.0142312
epoch: 2 iterations: 110500 loss :1.45263
epoch: 2 iterations: 111000 loss :0.0140224
epoch: 2 iterations: 111500 loss :0.061938
epoch: 2 iterations: 112000 loss :0.515417
epoch: 2 iterations: 112500 loss :0.197488
epoch: 2 iterations: 113000 loss :1.82775
epoch: 2 iterations: 113500 loss :0.323834
epoch: 2 iterations: 114000 loss :0.00341916
epoch: 2 iterations: 114500 loss :0.00462723
epoch: 2 iterations: 115000 loss :0.00517845
epoch: 2 iterations: 115500 loss :0.452395
epoch: 2 iterations: 116000 loss :0.653676
epoch: 2 iterations: 116500 loss :0.084232
epoch: 2 iterations: 117000 loss :0.0642
epoch: 2 iterations: 117500 loss :0.00518513
epoch: 2 iterations: 118000 loss :0.00812554
epoch: 2 iterations: 118500 loss :0.0039916
epoch: 2 iterations: 119000 loss :0.156024
epoch: 2 iterations: 119500 loss :0.0131322
e

epoch: 2 iterations: 203000 loss :0.00515795
epoch: 2 iterations: 203500 loss :0.00536895
epoch: 2 iterations: 204000 loss :0.00386167
epoch: 2 iterations: 204500 loss :0.231956
epoch: 2 iterations: 205000 loss :0.0384423
epoch: 2 iterations: 205500 loss :0.252031
epoch: 2 iterations: 206000 loss :1.82406
epoch: 2 iterations: 206500 loss :1.10598
epoch: 2 iterations: 207000 loss :0.216772
epoch: 2 iterations: 207500 loss :0.00383854
epoch: 2 iterations: 208000 loss :0.00898862
epoch: 2 iterations: 208500 loss :1.82906
epoch: 2 iterations: 209000 loss :0.120056
epoch: 2 iterations: 209500 loss :0.0665703
epoch: 2 iterations: 210000 loss :0.019165
epoch: 2 iterations: 210500 loss :0.00623131
epoch: 2 iterations: 211000 loss :0.356632
epoch: 2 iterations: 211500 loss :1.52988
epoch: 2 iterations: 212000 loss :0.0280887
epoch: 2 iterations: 212500 loss :0.894086
epoch: 2 iterations: 213000 loss :0.0142686
epoch: 2 iterations: 213500 loss :0.610402
epoch: 2 iterations: 214000 loss :0.001090

epoch: 2 iterations: 297500 loss :0.0274118
epoch: 2 iterations: 298000 loss :0.0580114
epoch: 2 iterations: 298500 loss :0.0285265
epoch: 2 iterations: 299000 loss :1.17474
epoch: 2 iterations: 299500 loss :0.41013
epoch: 2 iterations: 300000 loss :0.223327
epoch: 2 iterations: 300500 loss :0.174334
epoch: 2 iterations: 301000 loss :0.278386
epoch: 2 iterations: 301500 loss :0.653874
epoch: 2 iterations: 302000 loss :0.376991
epoch: 2 iterations: 302500 loss :0.00324321
epoch: 2 iterations: 303000 loss :0.607296
epoch: 2 iterations: 303500 loss :0.00214386
epoch: 2 iterations: 304000 loss :0.138776
epoch: 2 iterations: 304500 loss :0.177382
epoch: 2 iterations: 305000 loss :2.4272
epoch: 2 iterations: 305500 loss :0.0044353
epoch: 2 iterations: 306000 loss :0.0104325
epoch: 2 iterations: 306500 loss :0.0578743
epoch: 2 iterations: 307000 loss :0.0280144
epoch: 2 iterations: 307500 loss :0.0329427
epoch: 2 iterations: 308000 loss :0.383304
epoch: 2 iterations: 308500 loss :0.019309
epo

epoch: 2 iterations: 392000 loss :0.545895
epoch: 2 iterations: 392500 loss :0.904264
epoch: 2 iterations: 393000 loss :2.90424
epoch: 2 iterations: 393500 loss :0.0129838
epoch: 2 iterations: 394000 loss :0.0213578
epoch: 2 iterations: 394500 loss :0.124911
epoch: 2 iterations: 395000 loss :0.0842733
epoch: 2 iterations: 395500 loss :0.0358381
epoch: 2 iterations: 396000 loss :3.2305
epoch: 2 iterations: 396500 loss :0.00703073
epoch: 2 iterations: 397000 loss :0.0681381
epoch: 2 iterations: 397500 loss :0.0387828
epoch: 2 iterations: 398000 loss :0.00545716
epoch: 2 iterations: 398500 loss :0.0303103
epoch: 2 iterations: 399000 loss :0.334068
epoch: 2 iterations: 399500 loss :0.904169
epoch: 2 iterations: 400000 loss :0.0158924
epoch: 2 iterations: 400500 loss :0.727423
epoch: 2 iterations: 401000 loss :0.0338835
epoch: 2 iterations: 401500 loss :0.0264281
epoch: 2 iterations: 402000 loss :1.91143
epoch: 2 iterations: 402500 loss :0.00722718
epoch: 2 iterations: 403000 loss :0.250834

epoch: 3 iterations: 66000 loss :0.214729
epoch: 3 iterations: 66500 loss :0.00214863
epoch: 3 iterations: 67000 loss :0.0647309
epoch: 3 iterations: 67500 loss :0.686632
epoch: 3 iterations: 68000 loss :0.0585954
epoch: 3 iterations: 68500 loss :0.0160515
epoch: 3 iterations: 69000 loss :0.0383523
epoch: 3 iterations: 69500 loss :0.0182406
epoch: 3 iterations: 70000 loss :0.312329
epoch: 3 iterations: 70500 loss :0.0324469
epoch: 3 iterations: 71000 loss :0.0157564
epoch: 3 iterations: 71500 loss :1.06561
epoch: 3 iterations: 72000 loss :0.0109794
epoch: 3 iterations: 72500 loss :0.519239
epoch: 3 iterations: 73000 loss :0.138884
epoch: 3 iterations: 73500 loss :0.0134165
epoch: 3 iterations: 74000 loss :0.342728
epoch: 3 iterations: 74500 loss :0.0268245
epoch: 3 iterations: 75000 loss :0.0101814
epoch: 3 iterations: 75500 loss :0.0169231
epoch: 3 iterations: 76000 loss :0.0419083
epoch: 3 iterations: 76500 loss :0.00637317
epoch: 3 iterations: 77000 loss :0.135096
epoch: 3 iteration

epoch: 3 iterations: 161000 loss :0.198601
epoch: 3 iterations: 161500 loss :0.340233
epoch: 3 iterations: 162000 loss :2.04634
epoch: 3 iterations: 162500 loss :0.0962598
epoch: 3 iterations: 163000 loss :0.00335121
epoch: 3 iterations: 163500 loss :0.279992
epoch: 3 iterations: 164000 loss :0.152487
epoch: 3 iterations: 164500 loss :0.113609
epoch: 3 iterations: 165000 loss :0.0386543
epoch: 3 iterations: 165500 loss :0.041416
epoch: 3 iterations: 166000 loss :0.00666571
epoch: 3 iterations: 166500 loss :0.0090723
epoch: 3 iterations: 167000 loss :0.00423717
epoch: 3 iterations: 167500 loss :0.0213993
epoch: 3 iterations: 168000 loss :0.148523
epoch: 3 iterations: 168500 loss :0.979236
epoch: 3 iterations: 169000 loss :0.0146469
epoch: 3 iterations: 169500 loss :0.0251552
epoch: 3 iterations: 170000 loss :0.00799704
epoch: 3 iterations: 170500 loss :0.00190449
epoch: 3 iterations: 171000 loss :0.190546
epoch: 3 iterations: 171500 loss :0.00535941
epoch: 3 iterations: 172000 loss :0.0

epoch: 3 iterations: 255500 loss :0.00553608
epoch: 3 iterations: 256000 loss :0.0456144
epoch: 3 iterations: 256500 loss :0.0339497
epoch: 3 iterations: 257000 loss :0.0042181
epoch: 3 iterations: 257500 loss :0.0539941
epoch: 3 iterations: 258000 loss :1.16172
epoch: 3 iterations: 258500 loss :0.148474
epoch: 3 iterations: 259000 loss :0.267758
epoch: 3 iterations: 259500 loss :1.66739
epoch: 3 iterations: 260000 loss :0.0166364
epoch: 3 iterations: 260500 loss :0.00848889
epoch: 3 iterations: 261000 loss :0.0772114
epoch: 3 iterations: 261500 loss :0.0294722
epoch: 3 iterations: 262000 loss :0.0273914
epoch: 3 iterations: 262500 loss :0.144516
epoch: 3 iterations: 263000 loss :1.72464
epoch: 3 iterations: 263500 loss :0.0554566
epoch: 3 iterations: 264000 loss :0.00505304
epoch: 3 iterations: 264500 loss :0.46234
epoch: 3 iterations: 265000 loss :0.0117655
epoch: 3 iterations: 265500 loss :0.0077343
epoch: 3 iterations: 266000 loss :0.0400307
epoch: 3 iterations: 266500 loss :0.0030

epoch: 3 iterations: 350000 loss :0.100747
epoch: 3 iterations: 350500 loss :0.223102
epoch: 3 iterations: 351000 loss :0.0196213
epoch: 3 iterations: 351500 loss :0.0027113
epoch: 3 iterations: 352000 loss :0.687029
epoch: 3 iterations: 352500 loss :1.50127
epoch: 3 iterations: 353000 loss :0.0236592
epoch: 3 iterations: 353500 loss :0.015202
epoch: 3 iterations: 354000 loss :0.0179218
epoch: 3 iterations: 354500 loss :0.0361187
epoch: 3 iterations: 355000 loss :0.00553489
epoch: 3 iterations: 355500 loss :0.0122306
epoch: 3 iterations: 356000 loss :0.526077
epoch: 3 iterations: 356500 loss :0.00804019
epoch: 3 iterations: 357000 loss :0.00506949
epoch: 3 iterations: 357500 loss :0.381315
epoch: 3 iterations: 358000 loss :0.790631
epoch: 3 iterations: 358500 loss :0.0552144
epoch: 3 iterations: 359000 loss :0.111771
epoch: 3 iterations: 359500 loss :0.0713861
epoch: 3 iterations: 360000 loss :1.62095
epoch: 3 iterations: 360500 loss :0.00359035
epoch: 3 iterations: 361000 loss :0.0218

epoch: 4 iterations: 22500 loss :0.357495
epoch: 4 iterations: 23000 loss :0.487465
epoch: 4 iterations: 23500 loss :0.250778
epoch: 4 iterations: 24000 loss :0.49028
epoch: 4 iterations: 24500 loss :0.00225472
epoch: 4 iterations: 25000 loss :0.103962
epoch: 4 iterations: 25500 loss :0.00821543
epoch: 4 iterations: 26000 loss :0.00942302
epoch: 4 iterations: 26500 loss :0.201912
epoch: 4 iterations: 27000 loss :0.0110928
epoch: 4 iterations: 27500 loss :0.106213
epoch: 4 iterations: 28000 loss :0.118904
epoch: 4 iterations: 28500 loss :0.0113775
epoch: 4 iterations: 29000 loss :0.0825578
epoch: 4 iterations: 29500 loss :0.34706
epoch: 4 iterations: 30000 loss :0.00490522
epoch: 4 iterations: 30500 loss :0.020907
epoch: 4 iterations: 31000 loss :0.260804
epoch: 4 iterations: 31500 loss :0.0176302
epoch: 4 iterations: 32000 loss :0.0233722
epoch: 4 iterations: 32500 loss :1.53212
epoch: 4 iterations: 33000 loss :0.0629399
epoch: 4 iterations: 33500 loss :0.0556214
epoch: 4 iterations: 3

epoch: 4 iterations: 119000 loss :0.0403086
epoch: 4 iterations: 119500 loss :0.0385413
epoch: 4 iterations: 120000 loss :0.338672
epoch: 4 iterations: 120500 loss :0.178222
epoch: 4 iterations: 121000 loss :0.203394
epoch: 4 iterations: 121500 loss :1.43487
epoch: 4 iterations: 122000 loss :0.180472
epoch: 4 iterations: 122500 loss :0.00310564
epoch: 4 iterations: 123000 loss :0.0342437
epoch: 4 iterations: 123500 loss :0.0189497
epoch: 4 iterations: 124000 loss :0.152568
epoch: 4 iterations: 124500 loss :0.0957845
epoch: 4 iterations: 125000 loss :0.031104
epoch: 4 iterations: 125500 loss :0.533219
epoch: 4 iterations: 126000 loss :0.0203569
epoch: 4 iterations: 126500 loss :0.0261343
epoch: 4 iterations: 127000 loss :0.0166366
epoch: 4 iterations: 127500 loss :0.0272992
epoch: 4 iterations: 128000 loss :0.0249151
epoch: 4 iterations: 128500 loss :0.00906205
epoch: 4 iterations: 129000 loss :0.0696691
epoch: 4 iterations: 129500 loss :0.0203698
epoch: 4 iterations: 130000 loss :0.227

epoch: 4 iterations: 213500 loss :0.0187459
epoch: 4 iterations: 214000 loss :0.0462078
epoch: 4 iterations: 214500 loss :0.0120423
epoch: 4 iterations: 215000 loss :1.7633
epoch: 4 iterations: 215500 loss :0.00168371
epoch: 4 iterations: 216000 loss :0.0407816
epoch: 4 iterations: 216500 loss :0.656489
epoch: 4 iterations: 217000 loss :0.017403
epoch: 4 iterations: 217500 loss :0.00616741
epoch: 4 iterations: 218000 loss :0.0670203
epoch: 4 iterations: 218500 loss :0.750103
epoch: 4 iterations: 219000 loss :0.162828
epoch: 4 iterations: 219500 loss :0.548396
epoch: 4 iterations: 220000 loss :0.0218562
epoch: 4 iterations: 220500 loss :0.0972905
epoch: 4 iterations: 221000 loss :0.0129678
epoch: 4 iterations: 221500 loss :1.38352
epoch: 4 iterations: 222000 loss :1.2457
epoch: 4 iterations: 222500 loss :0.0275884
epoch: 4 iterations: 223000 loss :0.0618834
epoch: 4 iterations: 223500 loss :1.03795
epoch: 4 iterations: 224000 loss :0.945047
epoch: 4 iterations: 224500 loss :0.0902454
ep

epoch: 4 iterations: 308000 loss :0.2127
epoch: 4 iterations: 308500 loss :0.278189
epoch: 4 iterations: 309000 loss :0.0157906
epoch: 4 iterations: 309500 loss :0.0385289
epoch: 4 iterations: 310000 loss :0.111921
epoch: 4 iterations: 310500 loss :0.914678
epoch: 4 iterations: 311000 loss :0.189026
epoch: 4 iterations: 311500 loss :0.0116756
epoch: 4 iterations: 312000 loss :0.218103
epoch: 4 iterations: 312500 loss :0.373981
epoch: 4 iterations: 313000 loss :0.0453582
epoch: 4 iterations: 313500 loss :0.00806093
epoch: 4 iterations: 314000 loss :0.0900434
epoch: 4 iterations: 314500 loss :0.0293449
epoch: 4 iterations: 315000 loss :0.0878893
epoch: 4 iterations: 315500 loss :1.14522
epoch: 4 iterations: 316000 loss :0.505106
epoch: 4 iterations: 316500 loss :0.600962
epoch: 4 iterations: 317000 loss :0.00906348
epoch: 4 iterations: 317500 loss :0.429833
epoch: 4 iterations: 318000 loss :0.0222883
epoch: 4 iterations: 318500 loss :0.243306
epoch: 4 iterations: 319000 loss :1.45915
epo

epoch: 4 iterations: 402500 loss :0.0247331
epoch: 4 iterations: 403000 loss :0.0167214
epoch: 4 iterations: 403500 loss :0.00426006
epoch: 4 iterations: 404000 loss :3.07133
epoch: 4 iterations: 404500 loss :0.592647
epoch: 4 iterations: 405000 loss :0.323126
epoch: 4 iterations: 405500 loss :0.227919
epoch: 4 iterations: 406000 loss :0.155503
epoch: 4 iterations: 406500 loss :0.0721719
epoch: 4 iterations: 407000 loss :0.141448
epoch: 4 iterations: 407500 loss :1.05605
epoch: 4 iterations: 408000 loss :0.240753
epoch: 4 iterations: 408500 loss :0.00439405
epoch: 4 iterations: 409000 loss :1.65545
epoch: 4 iterations: 409500 loss :1.63047
epoch: 4 iterations: 410000 loss :0.0203159
epoch: 4 iterations: 410500 loss :0.0383705
epoch: 4 iterations: 411000 loss :0.378193
epoch: 4 iterations: 411500 loss :0.00504756
epoch: 4 iterations: 412000 loss :0.306167
epoch: 4 iterations: 412500 loss :0.0135134
epoch: 4 iterations: 413000 loss :0.0347745
epoch: 4 iterations: 413500 loss :0.243172
ep

epoch: 5 iterations: 76000 loss :0.0131688
epoch: 5 iterations: 76500 loss :0.0061326
epoch: 5 iterations: 77000 loss :0.0483251
epoch: 5 iterations: 77500 loss :1.08301
epoch: 5 iterations: 78000 loss :0.014442
epoch: 5 iterations: 78500 loss :0.146512
epoch: 5 iterations: 79000 loss :0.00679994
epoch: 5 iterations: 79500 loss :0.02747
epoch: 5 iterations: 80000 loss :0.00761366
epoch: 5 iterations: 80500 loss :0.00462484
epoch: 5 iterations: 81000 loss :0.0194871
epoch: 5 iterations: 81500 loss :0.00598216
epoch: 5 iterations: 82000 loss :1.34747
epoch: 5 iterations: 82500 loss :0.0380781
epoch: 5 iterations: 83000 loss :0.183595
epoch: 5 iterations: 83500 loss :0.00982738
epoch: 5 iterations: 84000 loss :0.0660408
epoch: 5 iterations: 84500 loss :0.00914288
epoch: 5 iterations: 85000 loss :0.0476023
epoch: 5 iterations: 85500 loss :0.322331
epoch: 5 iterations: 86000 loss :0.0643936
epoch: 5 iterations: 86500 loss :0.0184426
epoch: 5 iterations: 87000 loss :0.0257577
epoch: 5 iterat

epoch: 5 iterations: 171000 loss :0.260199
epoch: 5 iterations: 171500 loss :0.0229266
epoch: 5 iterations: 172000 loss :1.33314
epoch: 5 iterations: 172500 loss :0.367446
epoch: 5 iterations: 173000 loss :0.135454
epoch: 5 iterations: 173500 loss :0.00324774
epoch: 5 iterations: 174000 loss :2.97234
epoch: 5 iterations: 174500 loss :1.09614
epoch: 5 iterations: 175000 loss :0.276079
epoch: 5 iterations: 175500 loss :1.17484
epoch: 5 iterations: 176000 loss :0.981392
epoch: 5 iterations: 176500 loss :0.210265
epoch: 5 iterations: 177000 loss :0.0291125
epoch: 5 iterations: 177500 loss :0.00531697
epoch: 5 iterations: 178000 loss :0.0401801
epoch: 5 iterations: 178500 loss :0.0187472
epoch: 5 iterations: 179000 loss :0.0650955
epoch: 5 iterations: 179500 loss :0.0122161
epoch: 5 iterations: 180000 loss :0.0128713
epoch: 5 iterations: 180500 loss :0.00595617
epoch: 5 iterations: 181000 loss :2.521
epoch: 5 iterations: 181500 loss :0.0976866
epoch: 5 iterations: 182000 loss :0.0319473
epo

epoch: 5 iterations: 265500 loss :0.0461636
epoch: 5 iterations: 266000 loss :0.0276281
epoch: 5 iterations: 266500 loss :0.00269389
epoch: 5 iterations: 267000 loss :0.362507
epoch: 5 iterations: 267500 loss :0.0768119
epoch: 5 iterations: 268000 loss :0.0469639
epoch: 5 iterations: 268500 loss :0.0135272
epoch: 5 iterations: 269000 loss :0.229301
epoch: 5 iterations: 269500 loss :0.00682783
epoch: 5 iterations: 270000 loss :0.0101075
epoch: 5 iterations: 270500 loss :0.00501013
epoch: 5 iterations: 271000 loss :0.00498271
epoch: 5 iterations: 271500 loss :0.00307941
epoch: 5 iterations: 272000 loss :0.144615
epoch: 5 iterations: 272500 loss :0.158224
epoch: 5 iterations: 273000 loss :0.00465655
epoch: 5 iterations: 273500 loss :0.00193644
epoch: 5 iterations: 274000 loss :0.971715
epoch: 5 iterations: 274500 loss :0.0636797
epoch: 5 iterations: 275000 loss :0.105088
epoch: 5 iterations: 275500 loss :4.07628
epoch: 5 iterations: 276000 loss :0.00836134
epoch: 5 iterations: 276500 loss

epoch: 5 iterations: 359500 loss :0.0129461
epoch: 5 iterations: 360000 loss :0.130278
epoch: 5 iterations: 360500 loss :0.0420992
epoch: 5 iterations: 361000 loss :1.4984
epoch: 5 iterations: 361500 loss :0.0116043
epoch: 5 iterations: 362000 loss :0.00693822
epoch: 5 iterations: 362500 loss :0.542608
epoch: 5 iterations: 363000 loss :0.0191736
epoch: 5 iterations: 363500 loss :0.340897
epoch: 5 iterations: 364000 loss :0.22953
epoch: 5 iterations: 364500 loss :0.0171072
epoch: 5 iterations: 365000 loss :0.496036
epoch: 5 iterations: 365500 loss :0.00478458
epoch: 5 iterations: 366000 loss :0.0179007
epoch: 5 iterations: 366500 loss :0.060689
epoch: 5 iterations: 367000 loss :0.768262
epoch: 5 iterations: 367500 loss :1.51679
epoch: 5 iterations: 368000 loss :0.00583315
epoch: 5 iterations: 368500 loss :0.00267792
epoch: 5 iterations: 369000 loss :0.344004
epoch: 5 iterations: 369500 loss :0.0130188
epoch: 5 iterations: 370000 loss :0.0277888
epoch: 5 iterations: 370500 loss :0.014630

epoch: 6 iterations: 32500 loss :0.030228
epoch: 6 iterations: 33000 loss :0.0951475
epoch: 6 iterations: 33500 loss :0.0106952
epoch: 6 iterations: 34000 loss :0.00638485
epoch: 6 iterations: 34500 loss :0.0919416
epoch: 6 iterations: 35000 loss :1.04322
epoch: 6 iterations: 35500 loss :0.0134673
epoch: 6 iterations: 36000 loss :0.0164306
epoch: 6 iterations: 36500 loss :0.0314839
epoch: 6 iterations: 37000 loss :0.0101767
epoch: 6 iterations: 37500 loss :0.717244
epoch: 6 iterations: 38000 loss :0.913065
epoch: 6 iterations: 38500 loss :0.235774
epoch: 6 iterations: 39000 loss :0.0110204
epoch: 6 iterations: 39500 loss :2.18873
epoch: 6 iterations: 40000 loss :0.035319
epoch: 6 iterations: 40500 loss :0.174992
epoch: 6 iterations: 41000 loss :0.146519
epoch: 6 iterations: 41500 loss :0.0777155
epoch: 6 iterations: 42000 loss :0.292888
epoch: 6 iterations: 42500 loss :0.00794458
epoch: 6 iterations: 43000 loss :0.00469995
epoch: 6 iterations: 43500 loss :0.047352
epoch: 6 iterations: 

epoch: 6 iterations: 128500 loss :0.329768
epoch: 6 iterations: 129000 loss :0.180458
epoch: 6 iterations: 129500 loss :0.0371249
epoch: 6 iterations: 130000 loss :0.0909586
epoch: 6 iterations: 130500 loss :0.748683
epoch: 6 iterations: 131000 loss :0.620902
epoch: 6 iterations: 131500 loss :0.0203686
epoch: 6 iterations: 132000 loss :0.0305179
epoch: 6 iterations: 132500 loss :1.72995
epoch: 6 iterations: 133000 loss :0.0229971
epoch: 6 iterations: 133500 loss :0.17001
epoch: 6 iterations: 134000 loss :0.0754799
epoch: 6 iterations: 134500 loss :0.735038
epoch: 6 iterations: 135000 loss :0.108513
epoch: 6 iterations: 135500 loss :0.057559
epoch: 6 iterations: 136000 loss :2.74689
epoch: 6 iterations: 136500 loss :0.0111989
epoch: 6 iterations: 137000 loss :0.0123868
epoch: 6 iterations: 137500 loss :0.0236385
epoch: 6 iterations: 138000 loss :0.26782
epoch: 6 iterations: 138500 loss :0.585503
epoch: 6 iterations: 139000 loss :0.0510957
epoch: 6 iterations: 139500 loss :0.132109
epoch

epoch: 6 iterations: 222500 loss :0.00878358
epoch: 6 iterations: 223000 loss :0.05884
epoch: 6 iterations: 223500 loss :0.026826
epoch: 6 iterations: 224000 loss :0.0123696
epoch: 6 iterations: 224500 loss :0.0236762
epoch: 6 iterations: 225000 loss :0.479735
epoch: 6 iterations: 225500 loss :0.136675
epoch: 6 iterations: 226000 loss :0.0302348
epoch: 6 iterations: 226500 loss :0.137474
epoch: 6 iterations: 227000 loss :0.185183
epoch: 6 iterations: 227500 loss :0.032609
epoch: 6 iterations: 228000 loss :0.173159
epoch: 6 iterations: 228500 loss :0.0111446
epoch: 6 iterations: 229000 loss :0.0194613
epoch: 6 iterations: 229500 loss :0.0646534
epoch: 6 iterations: 230000 loss :0.0565698
epoch: 6 iterations: 230500 loss :0.0125883
epoch: 6 iterations: 231000 loss :0.904497
epoch: 6 iterations: 231500 loss :1.77442
epoch: 6 iterations: 232000 loss :0.837299
epoch: 6 iterations: 232500 loss :0.022853
epoch: 6 iterations: 233000 loss :0.0176544
epoch: 6 iterations: 233500 loss :0.005934
ep

epoch: 6 iterations: 317000 loss :0.0549983
epoch: 6 iterations: 317500 loss :0.0454775
epoch: 6 iterations: 318000 loss :0.00859952
epoch: 6 iterations: 318500 loss :0.00139761
epoch: 6 iterations: 319000 loss :0.751568
epoch: 6 iterations: 319500 loss :0.0121603
epoch: 6 iterations: 320000 loss :0.375561
epoch: 6 iterations: 320500 loss :2.14294
epoch: 6 iterations: 321000 loss :0.635602
epoch: 6 iterations: 321500 loss :0.0210073
epoch: 6 iterations: 322000 loss :3.83838
epoch: 6 iterations: 322500 loss :1.314
epoch: 6 iterations: 323000 loss :0.0899949
epoch: 6 iterations: 323500 loss :0.271159
epoch: 6 iterations: 324000 loss :0.00464153
epoch: 6 iterations: 324500 loss :0.0303848
epoch: 6 iterations: 325000 loss :0.00866008
epoch: 6 iterations: 325500 loss :0.0186234
epoch: 6 iterations: 326000 loss :0.0094676
epoch: 6 iterations: 326500 loss :0.819142
epoch: 6 iterations: 327000 loss :0.00913906
epoch: 6 iterations: 327500 loss :0.158899
epoch: 6 iterations: 328000 loss :0.01102

epoch: 6 iterations: 411500 loss :0.0674428
epoch: 6 iterations: 412000 loss :0.824412
epoch: 6 iterations: 412500 loss :0.0394828
epoch: 6 iterations: 413000 loss :0.0713903
epoch: 6 iterations: 413500 loss :0.792616
epoch: 6 iterations: 414000 loss :0.0880314
epoch: 6 iterations: 414500 loss :0.0207301
epoch: 6 iterations: 415000 loss :0.00780606
epoch: 6 iterations: 415500 loss :0.0902572
epoch: 6 iterations: 416000 loss :0.0202348
epoch: 6 iterations: 416500 loss :0.239394
epoch: 6 iterations: 417000 loss :0.224532
epoch: 6 iterations: 417500 loss :0.0390886
epoch: 6 iterations: 418000 loss :0.00777221
epoch: 6 iterations: 418500 loss :0.0211093
epoch: 6 iterations: 419000 loss :0.223428
epoch: 6 iterations: 419500 loss :0.00575852
epoch: 6 iterations: 420000 loss :0.0210526
epoch: 6 done! 
 train avg_loss:0.297902 , acc:0.874831
('now best dev acc:', 0.8402166666666666)
dev avg_loss:0.351568 train acc:0.839992
test avg_loss:0.349041 train acc:0.842105
epoch: 7 start!
epoch: 7 iter

epoch: 7 iterations: 85500 loss :0.0391266
epoch: 7 iterations: 86000 loss :0.0793432
epoch: 7 iterations: 86500 loss :0.038893
epoch: 7 iterations: 87000 loss :0.00272369
epoch: 7 iterations: 87500 loss :0.66768
epoch: 7 iterations: 88000 loss :0.0100431
epoch: 7 iterations: 88500 loss :0.0102949
epoch: 7 iterations: 89000 loss :0.688204
epoch: 7 iterations: 89500 loss :0.0155244
epoch: 7 iterations: 90000 loss :0.0300708
epoch: 7 iterations: 90500 loss :0.133303
epoch: 7 iterations: 91000 loss :0.0904403
epoch: 7 iterations: 91500 loss :0.167271
epoch: 7 iterations: 92000 loss :0.479175
epoch: 7 iterations: 92500 loss :3.11174
epoch: 7 iterations: 93000 loss :2.46485
epoch: 7 iterations: 93500 loss :0.0158803
epoch: 7 iterations: 94000 loss :0.052111
epoch: 7 iterations: 94500 loss :0.316497
epoch: 7 iterations: 95000 loss :0.00998425
epoch: 7 iterations: 95500 loss :0.011394
epoch: 7 iterations: 96000 loss :0.0462652
epoch: 7 iterations: 96500 loss :0.00380039
epoch: 7 iterations: 9

epoch: 7 iterations: 180000 loss :0.00785899
epoch: 7 iterations: 180500 loss :0.118273
epoch: 7 iterations: 181000 loss :0.00509691
epoch: 7 iterations: 181500 loss :0.00893974
epoch: 7 iterations: 182000 loss :0.0119362
epoch: 7 iterations: 182500 loss :2.08885
epoch: 7 iterations: 183000 loss :0.741407
epoch: 7 iterations: 183500 loss :3.85609
epoch: 7 iterations: 184000 loss :0.297861
epoch: 7 iterations: 184500 loss :0.016957
epoch: 7 iterations: 185000 loss :0.00378036
epoch: 7 iterations: 185500 loss :0.129437
epoch: 7 iterations: 186000 loss :0.0684719
epoch: 7 iterations: 186500 loss :0.0307927
epoch: 7 iterations: 187000 loss :0.178216
epoch: 7 iterations: 187500 loss :0.00378299
epoch: 7 iterations: 188000 loss :0.0807496
epoch: 7 iterations: 188500 loss :0.00579667
epoch: 7 iterations: 189000 loss :0.0567356
epoch: 7 iterations: 189500 loss :0.195011
epoch: 7 iterations: 190000 loss :0.0797344
epoch: 7 iterations: 190500 loss :3.2229
epoch: 7 iterations: 191000 loss :0.0229

epoch: 7 iterations: 274500 loss :0.112932
epoch: 7 iterations: 275000 loss :0.00343513
epoch: 7 iterations: 275500 loss :0.0154958
epoch: 7 iterations: 276000 loss :1.57154
epoch: 7 iterations: 276500 loss :0.0165482
epoch: 7 iterations: 277000 loss :0.249408
epoch: 7 iterations: 277500 loss :0.0317924
epoch: 7 iterations: 278000 loss :0.588874
epoch: 7 iterations: 278500 loss :0.62708
epoch: 7 iterations: 279000 loss :0.166525
epoch: 7 iterations: 279500 loss :0.304622
epoch: 7 iterations: 280000 loss :0.0165905
epoch: 7 iterations: 280500 loss :0.452507
epoch: 7 iterations: 281000 loss :0.121074
epoch: 7 iterations: 281500 loss :0.0333977
epoch: 7 iterations: 282000 loss :0.0089004
epoch: 7 iterations: 282500 loss :0.0844585
epoch: 7 iterations: 283000 loss :0.0100369
epoch: 7 iterations: 283500 loss :0.272139
epoch: 7 iterations: 284000 loss :0.0311604
epoch: 7 iterations: 284500 loss :0.436695
epoch: 7 iterations: 285000 loss :0.00815034
epoch: 7 iterations: 285500 loss :0.0169568

epoch: 7 iterations: 369000 loss :0.290129
epoch: 7 iterations: 369500 loss :0.011301
epoch: 7 iterations: 370000 loss :0.0400474
epoch: 7 iterations: 370500 loss :0.951866
epoch: 7 iterations: 371000 loss :0.0182266
epoch: 7 iterations: 371500 loss :0.0132518
epoch: 7 iterations: 372000 loss :1.587
epoch: 7 iterations: 372500 loss :0.342672
epoch: 7 iterations: 373000 loss :0.0278876
epoch: 7 iterations: 373500 loss :0.033026
epoch: 7 iterations: 374000 loss :2.21567
epoch: 7 iterations: 374500 loss :1.52069
epoch: 7 iterations: 375000 loss :0.419101
epoch: 7 iterations: 375500 loss :0.00182033
epoch: 7 iterations: 376000 loss :0.0396125
epoch: 7 iterations: 376500 loss :0.0221593
epoch: 7 iterations: 377000 loss :0.0298525
epoch: 7 iterations: 377500 loss :0.983172
epoch: 7 iterations: 378000 loss :0.994759
epoch: 7 iterations: 378500 loss :0.212318
epoch: 7 iterations: 379000 loss :0.0205963
epoch: 7 iterations: 379500 loss :0.0914761
epoch: 7 iterations: 380000 loss :0.0056448
epoc

epoch: 8 iterations: 41500 loss :0.0552522
epoch: 8 iterations: 42000 loss :3.94642
epoch: 8 iterations: 42500 loss :0.00481248
epoch: 8 iterations: 43000 loss :0.00411606
epoch: 8 iterations: 43500 loss :0.0641694
epoch: 8 iterations: 44000 loss :0.0980357
epoch: 8 iterations: 44500 loss :0.0338562
epoch: 8 iterations: 45000 loss :0.456771
epoch: 8 iterations: 45500 loss :0.0455221
epoch: 8 iterations: 46000 loss :0.0914466
epoch: 8 iterations: 46500 loss :0.0426226
epoch: 8 iterations: 47000 loss :0.00308919
epoch: 8 iterations: 47500 loss :0.00656033
epoch: 8 iterations: 48000 loss :0.0641373
epoch: 8 iterations: 48500 loss :0.956185
epoch: 8 iterations: 49000 loss :0.154078
epoch: 8 iterations: 49500 loss :0.0925506
epoch: 8 iterations: 50000 loss :0.265044
epoch: 8 iterations: 50500 loss :0.0143706
epoch: 8 iterations: 51000 loss :0.110281
epoch: 8 iterations: 51500 loss :0.874843
epoch: 8 iterations: 52000 loss :0.625019
epoch: 8 iterations: 52500 loss :0.0762287
epoch: 8 iterati

epoch: 8 iterations: 137000 loss :0.0344903
epoch: 8 iterations: 137500 loss :0.204512
epoch: 8 iterations: 138000 loss :0.00959873
epoch: 8 iterations: 138500 loss :0.0168804
epoch: 8 iterations: 139000 loss :0.00841045
epoch: 8 iterations: 139500 loss :0.0164194
epoch: 8 iterations: 140000 loss :0.0165145
epoch: 8 iterations: 140500 loss :0.140657
epoch: 8 iterations: 141000 loss :0.18754
epoch: 8 iterations: 141500 loss :0.0297904
epoch: 8 iterations: 142000 loss :0.404776
epoch: 8 iterations: 142500 loss :0.110892
epoch: 8 iterations: 143000 loss :0.00401664
epoch: 8 iterations: 143500 loss :0.425271
epoch: 8 iterations: 144000 loss :0.68483
epoch: 8 iterations: 144500 loss :0.00608063
epoch: 8 iterations: 145000 loss :0.248546
epoch: 8 iterations: 145500 loss :0.0293133
epoch: 8 iterations: 146000 loss :0.00826693
epoch: 8 iterations: 146500 loss :0.0110345
epoch: 8 iterations: 147000 loss :0.377241
epoch: 8 iterations: 147500 loss :0.00670934
epoch: 8 iterations: 148000 loss :1.3

epoch: 8 iterations: 231500 loss :0.215983
epoch: 8 iterations: 232000 loss :0.0573108
epoch: 8 iterations: 232500 loss :0.0163032
epoch: 8 iterations: 233000 loss :0.00394773
epoch: 8 iterations: 233500 loss :0.441031
epoch: 8 iterations: 234000 loss :0.20105
epoch: 8 iterations: 234500 loss :0.181868
epoch: 8 iterations: 235000 loss :0.018819
epoch: 8 iterations: 235500 loss :0.124337
epoch: 8 iterations: 236000 loss :0.0039711
epoch: 8 iterations: 236500 loss :0.133448
epoch: 8 iterations: 237000 loss :0.217267
epoch: 8 iterations: 237500 loss :0.221487
epoch: 8 iterations: 238000 loss :0.558811
epoch: 8 iterations: 238500 loss :0.0749872
epoch: 8 iterations: 239000 loss :0.0277675
epoch: 8 iterations: 239500 loss :0.28445
epoch: 8 iterations: 240000 loss :0.0538143
epoch: 8 iterations: 240500 loss :0.0247413
epoch: 8 iterations: 241000 loss :0.0435877
epoch: 8 iterations: 241500 loss :0.133728
epoch: 8 iterations: 242000 loss :0.0105281
epoch: 8 iterations: 242500 loss :0.212461
ep

epoch: 8 iterations: 325500 loss :0.0577437
epoch: 8 iterations: 326000 loss :0.0170572
epoch: 8 iterations: 326500 loss :0.136785
epoch: 8 iterations: 327000 loss :0.150394
epoch: 8 iterations: 327500 loss :0.0140314
epoch: 8 iterations: 328000 loss :0.00949526
epoch: 8 iterations: 328500 loss :1.94417
epoch: 8 iterations: 329000 loss :0.119107
epoch: 8 iterations: 329500 loss :0.101697
epoch: 8 iterations: 330000 loss :0.0137861
epoch: 8 iterations: 330500 loss :0.0204509
epoch: 8 iterations: 331000 loss :0.394201
epoch: 8 iterations: 331500 loss :2.0199
epoch: 8 iterations: 332000 loss :0.0121899
epoch: 8 iterations: 332500 loss :0.508746
epoch: 8 iterations: 333000 loss :0.00688148
epoch: 8 iterations: 333500 loss :0.104762
epoch: 8 iterations: 334000 loss :0.630656
epoch: 8 iterations: 334500 loss :0.123962
epoch: 8 iterations: 335000 loss :0.0319133
epoch: 8 iterations: 335500 loss :5.42481
epoch: 8 iterations: 336000 loss :0.0304892
epoch: 8 iterations: 336500 loss :0.0211046
ep

epoch: 8 iterations: 420000 loss :0.0229188
epoch: 8 done! 
 train avg_loss:0.289754 , acc:0.88039
('now best dev acc:', 0.8403083333333333)
dev avg_loss:0.353059 train acc:0.840325
test avg_loss:0.350936 train acc:0.842772
New Best Dev!!!
epoch: 9 start!
epoch: 9 iterations: 500 loss :0.0431995
epoch: 9 iterations: 1000 loss :0.107788
epoch: 9 iterations: 1500 loss :0.0194331
epoch: 9 iterations: 2000 loss :0.23575
epoch: 9 iterations: 2500 loss :0.0244536
epoch: 9 iterations: 3000 loss :1.68152
epoch: 9 iterations: 3500 loss :0.092678
epoch: 9 iterations: 4000 loss :0.984346
epoch: 9 iterations: 4500 loss :0.0336981
epoch: 9 iterations: 5000 loss :0.00277448
epoch: 9 iterations: 5500 loss :0.0854371
epoch: 9 iterations: 6000 loss :0.0336016
epoch: 9 iterations: 6500 loss :0.036153
epoch: 9 iterations: 7000 loss :0.0100121
epoch: 9 iterations: 7500 loss :0.130593
epoch: 9 iterations: 8000 loss :0.217212
epoch: 9 iterations: 8500 loss :0.0167887
epoch: 9 iterations: 9000 loss :1.25188


epoch: 9 iterations: 94500 loss :0.115906
epoch: 9 iterations: 95000 loss :0.023586
epoch: 9 iterations: 95500 loss :0.0276697
epoch: 9 iterations: 96000 loss :0.0327803
epoch: 9 iterations: 96500 loss :0.00645018
epoch: 9 iterations: 97000 loss :0.65621
epoch: 9 iterations: 97500 loss :0.110595
epoch: 9 iterations: 98000 loss :0.00258708
epoch: 9 iterations: 98500 loss :0.00597215
epoch: 9 iterations: 99000 loss :0.0463326
epoch: 9 iterations: 99500 loss :0.0150664
epoch: 9 iterations: 100000 loss :0.225033
epoch: 9 iterations: 100500 loss :0.828517
epoch: 9 iterations: 101000 loss :0.0862248
epoch: 9 iterations: 101500 loss :0.084537
epoch: 9 iterations: 102000 loss :0.586132
epoch: 9 iterations: 102500 loss :0.2045
epoch: 9 iterations: 103000 loss :0.107645
epoch: 9 iterations: 103500 loss :0.0145137
epoch: 9 iterations: 104000 loss :2.56849
epoch: 9 iterations: 104500 loss :0.31977
epoch: 9 iterations: 105000 loss :0.0202013
epoch: 9 iterations: 105500 loss :0.0191293
epoch: 9 iter

epoch: 9 iterations: 189000 loss :0.0160818
epoch: 9 iterations: 189500 loss :0.0152004
epoch: 9 iterations: 190000 loss :0.108395
epoch: 9 iterations: 190500 loss :0.0148518
epoch: 9 iterations: 191000 loss :0.0351363
epoch: 9 iterations: 191500 loss :0.0540979
epoch: 9 iterations: 192000 loss :0.00466847
epoch: 9 iterations: 192500 loss :0.174006
epoch: 9 iterations: 193000 loss :0.0107424
epoch: 9 iterations: 193500 loss :2.75578
epoch: 9 iterations: 194000 loss :0.125999
epoch: 9 iterations: 194500 loss :0.0140581
epoch: 9 iterations: 195000 loss :0.0115266
epoch: 9 iterations: 195500 loss :0.0539891
epoch: 9 iterations: 196000 loss :0.0195491
epoch: 9 iterations: 196500 loss :0.00812387
epoch: 9 iterations: 197000 loss :0.0178282
epoch: 9 iterations: 197500 loss :0.841733
epoch: 9 iterations: 198000 loss :0.0389783
epoch: 9 iterations: 198500 loss :0.0387076
epoch: 9 iterations: 199000 loss :0.0843949
epoch: 9 iterations: 199500 loss :0.0440202
epoch: 9 iterations: 200000 loss :0.

epoch: 9 iterations: 283500 loss :1.32704
epoch: 9 iterations: 284000 loss :2.01904
epoch: 9 iterations: 284500 loss :0.00902367
epoch: 9 iterations: 285000 loss :0.213315
epoch: 9 iterations: 285500 loss :0.0251878
epoch: 9 iterations: 286000 loss :0.0122547
epoch: 9 iterations: 286500 loss :0.08744
epoch: 9 iterations: 287000 loss :0.286412
epoch: 9 iterations: 287500 loss :0.197124
epoch: 9 iterations: 288000 loss :0.0151793
epoch: 9 iterations: 288500 loss :0.133402
epoch: 9 iterations: 289000 loss :0.0336239
epoch: 9 iterations: 289500 loss :0.0247707
epoch: 9 iterations: 290000 loss :0.00840592
epoch: 9 iterations: 290500 loss :1.32504
epoch: 9 iterations: 291000 loss :0.0565158
epoch: 9 iterations: 291500 loss :0.0357304
epoch: 9 iterations: 292000 loss :0.0158243
epoch: 9 iterations: 292500 loss :0.0150599
epoch: 9 iterations: 293000 loss :0.16694
epoch: 9 iterations: 293500 loss :1.07639
epoch: 9 iterations: 294000 loss :0.0189017
epoch: 9 iterations: 294500 loss :0.0826278
ep

epoch: 9 iterations: 378000 loss :0.173798
epoch: 9 iterations: 378500 loss :0.00722551
epoch: 9 iterations: 379000 loss :0.012939
epoch: 9 iterations: 379500 loss :0.0219018
epoch: 9 iterations: 380000 loss :0.153438
epoch: 9 iterations: 380500 loss :0.0121278
epoch: 9 iterations: 381000 loss :0.0082767
epoch: 9 iterations: 381500 loss :0.0508223
epoch: 9 iterations: 382000 loss :2.26937
epoch: 9 iterations: 382500 loss :0.0146837
epoch: 9 iterations: 383000 loss :0.0221198
epoch: 9 iterations: 383500 loss :0.099478
epoch: 9 iterations: 384000 loss :0.194988
epoch: 9 iterations: 384500 loss :0.00289178
epoch: 9 iterations: 385000 loss :0.548945
epoch: 9 iterations: 385500 loss :0.1546
epoch: 9 iterations: 386000 loss :3.80141
epoch: 9 iterations: 386500 loss :1.09168
epoch: 9 iterations: 387000 loss :0.099292
epoch: 9 iterations: 387500 loss :0.204648
epoch: 9 iterations: 388000 loss :0.11719
epoch: 9 iterations: 388500 loss :0.77066
epoch: 9 iterations: 389000 loss :0.0340918
epoch: 

epoch: 10 iterations: 50000 loss :0.474829
epoch: 10 iterations: 50500 loss :0.107949
epoch: 10 iterations: 51000 loss :0.0223815
epoch: 10 iterations: 51500 loss :0.0267934
epoch: 10 iterations: 52000 loss :0.17125
epoch: 10 iterations: 52500 loss :0.0356357
epoch: 10 iterations: 53000 loss :0.142227
epoch: 10 iterations: 53500 loss :0.465536
epoch: 10 iterations: 54000 loss :0.0236174
epoch: 10 iterations: 54500 loss :1.74303
epoch: 10 iterations: 55000 loss :0.0232972
epoch: 10 iterations: 55500 loss :0.509157
epoch: 10 iterations: 56000 loss :0.025739
epoch: 10 iterations: 56500 loss :0.00707269
epoch: 10 iterations: 57000 loss :0.0248498
epoch: 10 iterations: 57500 loss :0.290042
epoch: 10 iterations: 58000 loss :0.0119948
epoch: 10 iterations: 58500 loss :0.00788999
epoch: 10 iterations: 59000 loss :0.264376
epoch: 10 iterations: 59500 loss :0.0517236
epoch: 10 iterations: 60000 loss :0.00225544
epoch: 10 iterations: 60500 loss :0.866305
epoch: 10 iterations: 61000 loss :0.011789

epoch: 10 iterations: 143000 loss :2.1321
epoch: 10 iterations: 143500 loss :0.0738342
epoch: 10 iterations: 144000 loss :0.102335
epoch: 10 iterations: 144500 loss :0.598428
epoch: 10 iterations: 145000 loss :0.313052
epoch: 10 iterations: 145500 loss :0.678042
epoch: 10 iterations: 146000 loss :0.0280452
epoch: 10 iterations: 146500 loss :0.0358343
epoch: 10 iterations: 147000 loss :1.59971
epoch: 10 iterations: 147500 loss :0.0239002
epoch: 10 iterations: 148000 loss :0.353724
epoch: 10 iterations: 148500 loss :0.173935
epoch: 10 iterations: 149000 loss :0.207083
epoch: 10 iterations: 149500 loss :0.0260813
epoch: 10 iterations: 150000 loss :0.00782418
epoch: 10 iterations: 150500 loss :0.143972
epoch: 10 iterations: 151000 loss :0.00461149
epoch: 10 iterations: 151500 loss :1.27431
epoch: 10 iterations: 152000 loss :0.499253
epoch: 10 iterations: 152500 loss :0.0154099
epoch: 10 iterations: 153000 loss :0.0179727
epoch: 10 iterations: 153500 loss :0.236744
epoch: 10 iterations: 154

epoch: 10 iterations: 235500 loss :0.00639844
epoch: 10 iterations: 236000 loss :0.051729
epoch: 10 iterations: 236500 loss :0.070343
epoch: 10 iterations: 237000 loss :0.0179701
epoch: 10 iterations: 237500 loss :0.0863074
epoch: 10 iterations: 238000 loss :0.00340056
epoch: 10 iterations: 238500 loss :0.362398
epoch: 10 iterations: 239000 loss :0.00684738
epoch: 10 iterations: 239500 loss :2.02763
epoch: 10 iterations: 240000 loss :1.59307
epoch: 10 iterations: 240500 loss :0.0463072
epoch: 10 iterations: 241000 loss :0.0541878
epoch: 10 iterations: 241500 loss :0.594771
epoch: 10 iterations: 242000 loss :1.13666
epoch: 10 iterations: 242500 loss :0.0238162
epoch: 10 iterations: 243000 loss :0.0426906
epoch: 10 iterations: 243500 loss :0.0183942
epoch: 10 iterations: 244000 loss :0.117743
epoch: 10 iterations: 244500 loss :0.042913
epoch: 10 iterations: 245000 loss :0.223832
epoch: 10 iterations: 245500 loss :0.0201592
epoch: 10 iterations: 246000 loss :0.0065217
epoch: 10 iterations

epoch: 10 iterations: 327500 loss :0.0103498
epoch: 10 iterations: 328000 loss :0.443919
epoch: 10 iterations: 328500 loss :0.00126767
epoch: 10 iterations: 329000 loss :0.0342797
epoch: 10 iterations: 329500 loss :0.100682
epoch: 10 iterations: 330000 loss :0.0356309
epoch: 10 iterations: 330500 loss :0.0318432
epoch: 10 iterations: 331000 loss :0.605478
epoch: 10 iterations: 331500 loss :0.253998
epoch: 10 iterations: 332000 loss :0.0155737
epoch: 10 iterations: 332500 loss :0.0599471
epoch: 10 iterations: 333000 loss :0.674651
epoch: 10 iterations: 333500 loss :0.0702362
epoch: 10 iterations: 334000 loss :0.0317223
epoch: 10 iterations: 334500 loss :0.0287864
epoch: 10 iterations: 335000 loss :1.7547
epoch: 10 iterations: 335500 loss :0.140018
epoch: 10 iterations: 336000 loss :0.206912
epoch: 10 iterations: 336500 loss :0.0349816
epoch: 10 iterations: 337000 loss :0.141197
epoch: 10 iterations: 337500 loss :0.0110886
epoch: 10 iterations: 338000 loss :0.801484
epoch: 10 iterations:

epoch: 10 iterations: 419500 loss :0.0266812
epoch: 10 iterations: 420000 loss :0.0430394
epoch: 10 done! 
 train avg_loss:0.284604 , acc:0.883852
('now best dev acc:', 0.8404666666666667)
dev avg_loss:0.354878 train acc:0.8411
test avg_loss:0.355447 train acc:0.841672
New Best Dev!!!
epoch: 11 start!
epoch: 11 iterations: 500 loss :0.0278641
epoch: 11 iterations: 1000 loss :0.228679
epoch: 11 iterations: 1500 loss :0.45552
epoch: 11 iterations: 2000 loss :0.889059
epoch: 11 iterations: 2500 loss :2.01214
epoch: 11 iterations: 3000 loss :0.105323
epoch: 11 iterations: 3500 loss :0.346762
epoch: 11 iterations: 4000 loss :0.499394
epoch: 11 iterations: 4500 loss :0.299121
epoch: 11 iterations: 5000 loss :2.72257
epoch: 11 iterations: 5500 loss :1.69594
epoch: 11 iterations: 6000 loss :0.0313938
epoch: 11 iterations: 6500 loss :0.50756
epoch: 11 iterations: 7000 loss :0.0115228
epoch: 11 iterations: 7500 loss :0.00130081
epoch: 11 iterations: 8000 loss :0.00716233
epoch: 11 iterations: 85

epoch: 11 iterations: 91500 loss :0.0775665
epoch: 11 iterations: 92000 loss :0.00259542
epoch: 11 iterations: 92500 loss :0.0362643
epoch: 11 iterations: 93000 loss :0.613027
epoch: 11 iterations: 93500 loss :0.119675
epoch: 11 iterations: 94000 loss :0.358178
epoch: 11 iterations: 94500 loss :0.0180645
epoch: 11 iterations: 95000 loss :0.00370908
epoch: 11 iterations: 95500 loss :0.304189
epoch: 11 iterations: 96000 loss :0.554209
epoch: 11 iterations: 96500 loss :0.186617
epoch: 11 iterations: 97000 loss :0.362125
epoch: 11 iterations: 97500 loss :0.0086956
epoch: 11 iterations: 98000 loss :0.00921249
epoch: 11 iterations: 98500 loss :0.274575
epoch: 11 iterations: 99000 loss :0.18545
epoch: 11 iterations: 99500 loss :0.406593
epoch: 11 iterations: 100000 loss :0.00618029
epoch: 11 iterations: 100500 loss :3.04232
epoch: 11 iterations: 101000 loss :0.25145
epoch: 11 iterations: 101500 loss :0.0130646
epoch: 11 iterations: 102000 loss :0.0185707
epoch: 11 iterations: 102500 loss :0.0

epoch: 11 iterations: 184000 loss :2.31304
epoch: 11 iterations: 184500 loss :0.078817
epoch: 11 iterations: 185000 loss :3.74924
epoch: 11 iterations: 185500 loss :0.443622
epoch: 11 iterations: 186000 loss :0.332215
epoch: 11 iterations: 186500 loss :0.0171655
epoch: 11 iterations: 187000 loss :0.573897
epoch: 11 iterations: 187500 loss :0.0075376
epoch: 11 iterations: 188000 loss :0.0354193
epoch: 11 iterations: 188500 loss :0.0705998
epoch: 11 iterations: 189000 loss :0.479446
epoch: 11 iterations: 189500 loss :0.00653052
epoch: 11 iterations: 190000 loss :1.26367
epoch: 11 iterations: 190500 loss :0.00448942
epoch: 11 iterations: 191000 loss :1.98211
epoch: 11 iterations: 191500 loss :0.0190624
epoch: 11 iterations: 192000 loss :0.0130231
epoch: 11 iterations: 192500 loss :0.0871917
epoch: 11 iterations: 193000 loss :2.2405
epoch: 11 iterations: 193500 loss :0.066093
epoch: 11 iterations: 194000 loss :0.0538712
epoch: 11 iterations: 194500 loss :0.0157104
epoch: 11 iterations: 195

epoch: 11 iterations: 276000 loss :0.0567118
epoch: 11 iterations: 276500 loss :0.0340669
epoch: 11 iterations: 277000 loss :0.0151064
epoch: 11 iterations: 277500 loss :0.148961
epoch: 11 iterations: 278000 loss :0.101742
epoch: 11 iterations: 278500 loss :0.532286
epoch: 11 iterations: 279000 loss :0.0106966
epoch: 11 iterations: 279500 loss :0.0176016
epoch: 11 iterations: 280000 loss :0.145339
epoch: 11 iterations: 280500 loss :0.0450882
epoch: 11 iterations: 281000 loss :0.0406995
epoch: 11 iterations: 281500 loss :0.122608
epoch: 11 iterations: 282000 loss :0.416128
epoch: 11 iterations: 282500 loss :0.214831
epoch: 11 iterations: 283000 loss :0.364128
epoch: 11 iterations: 283500 loss :0.00453877
epoch: 11 iterations: 284000 loss :0.00831652
epoch: 11 iterations: 284500 loss :0.0052352
epoch: 11 iterations: 285000 loss :0.130604
epoch: 11 iterations: 285500 loss :0.790117
epoch: 11 iterations: 286000 loss :0.162458
epoch: 11 iterations: 286500 loss :0.270608
epoch: 11 iterations

epoch: 11 iterations: 368000 loss :0.0217434
epoch: 11 iterations: 368500 loss :0.0314345
epoch: 11 iterations: 369000 loss :0.00614333
epoch: 11 iterations: 369500 loss :0.00433564
epoch: 11 iterations: 370000 loss :0.0188702
epoch: 11 iterations: 370500 loss :0.450227
epoch: 11 iterations: 371000 loss :0.0821443
epoch: 11 iterations: 371500 loss :0.0595849
epoch: 11 iterations: 372000 loss :0.0618916
epoch: 11 iterations: 372500 loss :0.0564219
epoch: 11 iterations: 373000 loss :0.0185982
epoch: 11 iterations: 373500 loss :0.287929
epoch: 11 iterations: 374000 loss :0.400521
epoch: 11 iterations: 374500 loss :1.65586
epoch: 11 iterations: 375000 loss :0.108683
epoch: 11 iterations: 375500 loss :0.0826712
epoch: 11 iterations: 376000 loss :0.00878763
epoch: 11 iterations: 376500 loss :0.769865
epoch: 11 iterations: 377000 loss :0.0319136
epoch: 11 iterations: 377500 loss :0.0128899
epoch: 11 iterations: 378000 loss :1.54395
epoch: 11 iterations: 378500 loss :0.397362
epoch: 11 iterati

epoch: 12 iterations: 39000 loss :0.0290427
epoch: 12 iterations: 39500 loss :0.0466123
epoch: 12 iterations: 40000 loss :0.0206144
epoch: 12 iterations: 40500 loss :0.172732
epoch: 12 iterations: 41000 loss :0.0119392
epoch: 12 iterations: 41500 loss :2.5217
epoch: 12 iterations: 42000 loss :0.410755
epoch: 12 iterations: 42500 loss :3.97334
epoch: 12 iterations: 43000 loss :0.146554
epoch: 12 iterations: 43500 loss :0.0156002
epoch: 12 iterations: 44000 loss :0.0120635
epoch: 12 iterations: 44500 loss :0.0156276
epoch: 12 iterations: 45000 loss :0.0776161
epoch: 12 iterations: 45500 loss :0.0218557
epoch: 12 iterations: 46000 loss :0.37445
epoch: 12 iterations: 46500 loss :0.0405262
epoch: 12 iterations: 47000 loss :0.0206894
epoch: 12 iterations: 47500 loss :0.0161023
epoch: 12 iterations: 48000 loss :0.0228761
epoch: 12 iterations: 48500 loss :0.01807
epoch: 12 iterations: 49000 loss :0.231598
epoch: 12 iterations: 49500 loss :0.0702517
epoch: 12 iterations: 50000 loss :0.272097
ep

epoch: 12 iterations: 132500 loss :0.0342183
epoch: 12 iterations: 133000 loss :0.00419569
epoch: 12 iterations: 133500 loss :0.363579
epoch: 12 iterations: 134000 loss :0.0822572
epoch: 12 iterations: 134500 loss :0.00489473
epoch: 12 iterations: 135000 loss :0.00495911
epoch: 12 iterations: 135500 loss :0.183594
epoch: 12 iterations: 136000 loss :0.173042
epoch: 12 iterations: 136500 loss :0.0100708
epoch: 12 iterations: 137000 loss :0.00893569
epoch: 12 iterations: 137500 loss :0.00940871
epoch: 12 iterations: 138000 loss :0.0610245
epoch: 12 iterations: 138500 loss :0.0143881
epoch: 12 iterations: 139000 loss :0.888346
epoch: 12 iterations: 139500 loss :0.0605954
epoch: 12 iterations: 140000 loss :0.010082
epoch: 12 iterations: 140500 loss :0.0997064
epoch: 12 iterations: 141000 loss :0.00133204
epoch: 12 iterations: 141500 loss :0.00907207
epoch: 12 iterations: 142000 loss :0.0129526
epoch: 12 iterations: 142500 loss :0.016129
epoch: 12 iterations: 143000 loss :0.0345129
epoch: 12

epoch: 12 iterations: 224500 loss :0.0303707
epoch: 12 iterations: 225000 loss :0.00244188
epoch: 12 iterations: 225500 loss :1.77091
epoch: 12 iterations: 226000 loss :0.0683417
epoch: 12 iterations: 226500 loss :3.69933
epoch: 12 iterations: 227000 loss :0.561214
epoch: 12 iterations: 227500 loss :0.778521
epoch: 12 iterations: 228000 loss :0.00308275
epoch: 12 iterations: 228500 loss :0.012141
epoch: 12 iterations: 229000 loss :0.0062902
epoch: 12 iterations: 229500 loss :0.987738
epoch: 12 iterations: 230000 loss :0.0119627
epoch: 12 iterations: 230500 loss :0.196879
epoch: 12 iterations: 231000 loss :0.369347
epoch: 12 iterations: 231500 loss :0.0097425
epoch: 12 iterations: 232000 loss :0.00632358
epoch: 12 iterations: 232500 loss :0.0322618
epoch: 12 iterations: 233000 loss :0.0741835
epoch: 12 iterations: 233500 loss :0.0296497
epoch: 12 iterations: 234000 loss :0.0391258
epoch: 12 iterations: 234500 loss :0.0294334
epoch: 12 iterations: 235000 loss :0.0108979
epoch: 12 iterati

epoch: 12 iterations: 317000 loss :0.00345969
epoch: 12 iterations: 317500 loss :0.026758
epoch: 12 iterations: 318000 loss :0.0126225
epoch: 12 iterations: 318500 loss :0.00725794
epoch: 12 iterations: 319000 loss :0.00986171
epoch: 12 iterations: 319500 loss :0.0685148
epoch: 12 iterations: 320000 loss :0.0561409
epoch: 12 iterations: 320500 loss :0.043017
epoch: 12 iterations: 321000 loss :0.0234039
epoch: 12 iterations: 321500 loss :0.0178977
epoch: 12 iterations: 322000 loss :0.0406106
epoch: 12 iterations: 322500 loss :0.00838137
epoch: 12 iterations: 323000 loss :0.0179455
epoch: 12 iterations: 323500 loss :0.783542
epoch: 12 iterations: 324000 loss :0.253528
epoch: 12 iterations: 324500 loss :0.0626832
epoch: 12 iterations: 325000 loss :0.227144
epoch: 12 iterations: 325500 loss :0.63297
epoch: 12 iterations: 326000 loss :0.260603
epoch: 12 iterations: 326500 loss :0.0069809
epoch: 12 iterations: 327000 loss :0.173081
epoch: 12 iterations: 327500 loss :0.0592268
epoch: 12 itera

epoch: 12 iterations: 409000 loss :0.0195167
epoch: 12 iterations: 409500 loss :0.0369639
epoch: 12 iterations: 410000 loss :0.0105417
epoch: 12 iterations: 410500 loss :0.00789475
epoch: 12 iterations: 411000 loss :1.99478
epoch: 12 iterations: 411500 loss :0.00470495
epoch: 12 iterations: 412000 loss :0.0541087
epoch: 12 iterations: 412500 loss :0.0246224
epoch: 12 iterations: 413000 loss :0.00708687
epoch: 12 iterations: 413500 loss :0.87532
epoch: 12 iterations: 414000 loss :0.00325036
epoch: 12 iterations: 414500 loss :0.859772
epoch: 12 iterations: 415000 loss :0.0355334
epoch: 12 iterations: 415500 loss :0.666387
epoch: 12 iterations: 416000 loss :0.00903726
epoch: 12 iterations: 416500 loss :0.327858
epoch: 12 iterations: 417000 loss :0.00239277
epoch: 12 iterations: 417500 loss :0.0984145
epoch: 12 iterations: 418000 loss :0.0202694
epoch: 12 iterations: 418500 loss :0.0144618
epoch: 12 iterations: 419000 loss :1.26604
epoch: 12 iterations: 419500 loss :0.0419327
epoch: 12 ite

epoch: 13 iterations: 81000 loss :0.158519
epoch: 13 iterations: 81500 loss :0.00661778
epoch: 13 iterations: 82000 loss :0.0420369
epoch: 13 iterations: 82500 loss :0.302151
epoch: 13 iterations: 83000 loss :0.0433799
epoch: 13 iterations: 83500 loss :0.134712
epoch: 13 iterations: 84000 loss :0.00623155
epoch: 13 iterations: 84500 loss :0.109079
epoch: 13 iterations: 85000 loss :0.00831676
epoch: 13 iterations: 85500 loss :0.0214571
epoch: 13 iterations: 86000 loss :0.0480279
epoch: 13 iterations: 86500 loss :0.010546
epoch: 13 iterations: 87000 loss :2.53458
epoch: 13 iterations: 87500 loss :0.195346
epoch: 13 iterations: 88000 loss :0.00997496
epoch: 13 iterations: 88500 loss :0.00452971
epoch: 13 iterations: 89000 loss :0.0193018
epoch: 13 iterations: 89500 loss :0.178593
epoch: 13 iterations: 90000 loss :0.0163951
epoch: 13 iterations: 90500 loss :3.34581
epoch: 13 iterations: 91000 loss :0.143983
epoch: 13 iterations: 91500 loss :0.0370644
epoch: 13 iterations: 92000 loss :0.028

epoch: 13 iterations: 173500 loss :0.011701
epoch: 13 iterations: 174000 loss :0.122222
epoch: 13 iterations: 174500 loss :0.359441
epoch: 13 iterations: 175000 loss :0.0140159
epoch: 13 iterations: 175500 loss :0.0117128
epoch: 13 iterations: 176000 loss :0.0162821
epoch: 13 iterations: 176500 loss :0.345494
epoch: 13 iterations: 177000 loss :0.523439
epoch: 13 iterations: 177500 loss :0.262718
epoch: 13 iterations: 178000 loss :0.00920844
epoch: 13 iterations: 178500 loss :0.0492774
epoch: 13 iterations: 179000 loss :0.0707111
epoch: 13 iterations: 179500 loss :0.0414072
epoch: 13 iterations: 180000 loss :0.0573263
epoch: 13 iterations: 180500 loss :0.024389
epoch: 13 iterations: 181000 loss :1.81587
epoch: 13 iterations: 181500 loss :0.0503852
epoch: 13 iterations: 182000 loss :0.00116682
epoch: 13 iterations: 182500 loss :0.740866
epoch: 13 iterations: 183000 loss :0.016613
epoch: 13 iterations: 183500 loss :0.029357
epoch: 13 iterations: 184000 loss :0.00804782
epoch: 13 iteration

epoch: 13 iterations: 265500 loss :0.0626907
epoch: 13 iterations: 266000 loss :0.0411295
epoch: 13 iterations: 266500 loss :0.100584
epoch: 13 iterations: 267000 loss :0.23606
epoch: 13 iterations: 267500 loss :0.108451
epoch: 13 iterations: 268000 loss :0.0366409
epoch: 13 iterations: 268500 loss :0.0674565
epoch: 13 iterations: 269000 loss :0.0042572
epoch: 13 iterations: 269500 loss :0.255461
epoch: 13 iterations: 270000 loss :0.0187404
epoch: 13 iterations: 270500 loss :0.151441
epoch: 13 iterations: 271000 loss :0.10942
epoch: 13 iterations: 271500 loss :0.0220275
epoch: 13 iterations: 272000 loss :0.00465512
epoch: 13 iterations: 272500 loss :0.00734305
epoch: 13 iterations: 273000 loss :0.138224
epoch: 13 iterations: 273500 loss :0.0219533
epoch: 13 iterations: 274000 loss :0.169014
epoch: 13 iterations: 274500 loss :0.0280122
epoch: 13 iterations: 275000 loss :0.043708
epoch: 13 iterations: 275500 loss :0.674617
epoch: 13 iterations: 276000 loss :0.539614
epoch: 13 iterations:

epoch: 13 iterations: 357500 loss :0.0637664
epoch: 13 iterations: 358000 loss :0.0139287
epoch: 13 iterations: 358500 loss :0.0221199
epoch: 13 iterations: 359000 loss :1.25046
epoch: 13 iterations: 359500 loss :0.0632346
epoch: 13 iterations: 360000 loss :0.287595
epoch: 13 iterations: 360500 loss :0.342012
epoch: 13 iterations: 361000 loss :0.182094
epoch: 13 iterations: 361500 loss :0.169856
epoch: 13 iterations: 362000 loss :0.0352135
epoch: 13 iterations: 362500 loss :0.0119109
epoch: 13 iterations: 363000 loss :0.420954
epoch: 13 iterations: 363500 loss :0.0899725
epoch: 13 iterations: 364000 loss :0.0218115
epoch: 13 iterations: 364500 loss :0.023495
epoch: 13 iterations: 365000 loss :0.205744
epoch: 13 iterations: 365500 loss :0.0167413
epoch: 13 iterations: 366000 loss :0.0128391
epoch: 13 iterations: 366500 loss :0.0128461
epoch: 13 iterations: 367000 loss :1.30473
epoch: 13 iterations: 367500 loss :0.0105679
epoch: 13 iterations: 368000 loss :0.0885135
epoch: 13 iterations:

epoch: 14 iterations: 28500 loss :0.321672
epoch: 14 iterations: 29000 loss :1.01926
epoch: 14 iterations: 29500 loss :0.0120233
epoch: 14 iterations: 30000 loss :0.181829
epoch: 14 iterations: 30500 loss :0.242322
epoch: 14 iterations: 31000 loss :0.984817
epoch: 14 iterations: 31500 loss :0.0144932
epoch: 14 iterations: 32000 loss :3.03027
epoch: 14 iterations: 32500 loss :0.00522041
epoch: 14 iterations: 33000 loss :0.0201225
epoch: 14 iterations: 33500 loss :0.011642
epoch: 14 iterations: 34000 loss :0.0428172
epoch: 14 iterations: 34500 loss :0.0615299
epoch: 14 iterations: 35000 loss :0.338453
epoch: 14 iterations: 35500 loss :0.170093
epoch: 14 iterations: 36000 loss :0.0168334
epoch: 14 iterations: 36500 loss :0.0171925
epoch: 14 iterations: 37000 loss :0.722814
epoch: 14 iterations: 37500 loss :0.186433
epoch: 14 iterations: 38000 loss :0.096866
epoch: 14 iterations: 38500 loss :0.0804399
epoch: 14 iterations: 39000 loss :0.190665
epoch: 14 iterations: 39500 loss :0.00653172
e

epoch: 14 iterations: 122500 loss :0.388773
epoch: 14 iterations: 123000 loss :0.0181569
epoch: 14 iterations: 123500 loss :0.0692183
epoch: 14 iterations: 124000 loss :0.0208864
epoch: 14 iterations: 124500 loss :2.56283
epoch: 14 iterations: 125000 loss :0.00735259
epoch: 14 iterations: 125500 loss :0.0044744
epoch: 14 iterations: 126000 loss :0.304794
epoch: 14 iterations: 126500 loss :0.0642665
epoch: 14 iterations: 127000 loss :0.0230299
epoch: 14 iterations: 127500 loss :0.567821
epoch: 14 iterations: 128000 loss :0.00602984
epoch: 14 iterations: 128500 loss :0.0206842
epoch: 14 iterations: 129000 loss :0.340252
epoch: 14 iterations: 129500 loss :0.0269467
epoch: 14 iterations: 130000 loss :0.169359
epoch: 14 iterations: 130500 loss :0.720494
epoch: 14 iterations: 131000 loss :0.0036025
epoch: 14 iterations: 131500 loss :0.0885917
epoch: 14 iterations: 132000 loss :0.202992
epoch: 14 iterations: 132500 loss :0.892286
epoch: 14 iterations: 133000 loss :0.152152
epoch: 14 iteration

epoch: 14 iterations: 214500 loss :0.0802248
epoch: 14 iterations: 215000 loss :0.0133433
epoch: 14 iterations: 215500 loss :0.0446738
epoch: 14 iterations: 216000 loss :1.03884
epoch: 14 iterations: 216500 loss :0.00678897
epoch: 14 iterations: 217000 loss :1.92091
epoch: 14 iterations: 217500 loss :0.0579662
epoch: 14 iterations: 218000 loss :0.0121453
epoch: 14 iterations: 218500 loss :0.0245774
epoch: 14 iterations: 219000 loss :0.1271
epoch: 14 iterations: 219500 loss :0.444364
epoch: 14 iterations: 220000 loss :0.515998
epoch: 14 iterations: 220500 loss :4.74601
epoch: 14 iterations: 221000 loss :0.0927402
epoch: 14 iterations: 221500 loss :0.022095
epoch: 14 iterations: 222000 loss :0.107537
epoch: 14 iterations: 222500 loss :1.35284
epoch: 14 iterations: 223000 loss :0.0505632
epoch: 14 iterations: 223500 loss :0.151587
epoch: 14 iterations: 224000 loss :0.0930575
epoch: 14 iterations: 224500 loss :0.00868654
epoch: 14 iterations: 225000 loss :1.32426
epoch: 14 iterations: 2255

epoch: 14 iterations: 307000 loss :0.582353
epoch: 14 iterations: 307500 loss :1.15436
epoch: 14 iterations: 308000 loss :0.0161335
epoch: 14 iterations: 308500 loss :0.168651
epoch: 14 iterations: 309000 loss :0.0027287
epoch: 14 iterations: 309500 loss :0.0555794
epoch: 14 iterations: 310000 loss :0.147378
epoch: 14 iterations: 310500 loss :0.103315
epoch: 14 iterations: 311000 loss :0.0125706
epoch: 14 iterations: 311500 loss :0.344266
epoch: 14 iterations: 312000 loss :0.0325093
epoch: 14 iterations: 312500 loss :0.0584822
epoch: 14 iterations: 313000 loss :0.0604231
epoch: 14 iterations: 313500 loss :0.0137664
epoch: 14 iterations: 314000 loss :0.0066371
epoch: 14 iterations: 314500 loss :0.0168219
epoch: 14 iterations: 315000 loss :0.0095911
epoch: 14 iterations: 315500 loss :0.157164
epoch: 14 iterations: 316000 loss :0.47071
epoch: 14 iterations: 316500 loss :0.0151708
epoch: 14 iterations: 317000 loss :0.00699043
epoch: 14 iterations: 317500 loss :0.0170441
epoch: 14 iteration

epoch: 14 iterations: 399000 loss :0.029611
epoch: 14 iterations: 399500 loss :2.45671
epoch: 14 iterations: 400000 loss :4.17005
epoch: 14 iterations: 400500 loss :0.719223
epoch: 14 iterations: 401000 loss :0.016747
epoch: 14 iterations: 401500 loss :0.0333894
epoch: 14 iterations: 402000 loss :0.113057
epoch: 14 iterations: 402500 loss :0.671731
epoch: 14 iterations: 403000 loss :0.00891042
epoch: 14 iterations: 403500 loss :0.0965421
epoch: 14 iterations: 404000 loss :0.0216584
epoch: 14 iterations: 404500 loss :0.226402
epoch: 14 iterations: 405000 loss :0.123902
epoch: 14 iterations: 405500 loss :0.0292265
epoch: 14 iterations: 406000 loss :0.735412
epoch: 14 iterations: 406500 loss :0.0130608
epoch: 14 iterations: 407000 loss :0.422366
epoch: 14 iterations: 407500 loss :0.0174558
epoch: 14 iterations: 408000 loss :0.0123769
epoch: 14 iterations: 408500 loss :0.00794232
epoch: 14 iterations: 409000 loss :0.145273
epoch: 14 iterations: 409500 loss :0.0190519
epoch: 14 iterations: 