In [1]:
import os
import pickle
import argparse
import numpy as np
from model import Options, Seq2SeqAttn


In [2]:
# Command-line configuration for the training run.
def _build_arg_parser():
    """Create the parser that declares every training option and its default."""
    # One row per option: (flag, value type, default, help text).
    # Rows are registered in the order listed here.
    option_specs = (
        ('--data_path', str, './pre-data/',
         'the directory to the data'),
        ('--word_embeddings_path', str, './pre-data/word_embeddings.npy',
         'the directory to the pre-trained word embeddings'),
        ('--num_epochs', int, 10,
         'the number of epochs to train the data'),
        ('--batch_size', int, 1,
         'the batch size'),
        ('--learning_rate', float, 0.001,
         'the learning rate'),
        ('--beam_width', int, 256,
         'the beam width when decoding'),
        ('--word_embed_size', int, 256,
         'the size of word embeddings'),
        ('--n_hidden_units_enc', int, 256,
         'the number of hidden units of encoder'),
        ('--n_hidden_units_dec', int, 256,
         'the number of hidden units of decoder'),
        ('--attn_depth', int, 128,
         'attention depth'),
        ('--restore_path', str, './model_dailydialog_rf',
         'the path to restore the trained model'),
        ('--restore_epoch', int, 0,
         'the epoch to restore'),
        ('--save_path', str, './model_dailydialog_rf',
         'the path to save the trained model to'),
    )

    built = argparse.ArgumentParser()
    for flag, value_type, fallback, description in option_specs:
        built.add_argument(flag, type=value_type, default=fallback, help=description)
    return built


parser = _build_arg_parser()

# parse_known_args() collects unrecognised argv entries in `unknown` instead of
# aborting the way parse_args() would.
# NOTE(review): presumably needed because the notebook kernel is launched with
# its own command-line arguments -- confirm before switching to parse_args().
args, unknown = parser.parse_known_args()


In [3]:
def read_data(data_path):
    """Load the training split, the validation split and the vocabulary mapping.

    Args:
        data_path: Root directory containing a ``train`` and a ``validation``
            sub-directory plus a ``token2id.pickle`` file.

    Returns:
        A ``(train_set, valid_set, token2id)`` tuple. Each split is a dict keyed
        by ``enc_input``, ``dec_input``, ``target``, ``enc_input_len`` and
        ``dec_input_len``; every value is whatever ``np.load`` returns for the
        ``.npy`` file of the same name in that split's directory. ``token2id``
        is the object unpickled from ``token2id.pickle``.
    """
    # File stems double as dict keys; the order here is the load order.
    array_names = ('enc_input', 'dec_input', 'target',
                   'enc_input_len', 'dec_input_len')

    def load_np_files(path):
        # One array per stem, read from '<path>/<stem>.npy'.
        return {stem: np.load(os.path.join(path, stem + '.npy'))
                for stem in array_names}

    train_set, valid_set = [load_np_files(os.path.join(data_path, split))
                            for split in ('train', 'validation')]

    # pickle.load can execute arbitrary code from a crafted file, so data_path
    # should only ever point at trusted data.
    vocab_file = os.path.join(data_path, 'token2id.pickle')
    with open(vocab_file, 'rb') as file:
        token2id = pickle.load(file)

    return train_set, valid_set, token2id

In [4]:
if __name__ == '__main__':
    # Load both data splits and the vocabulary from the configured directory.
    train_set, valid_set, token2id = read_data(args.data_path)

    # The size of axis 1 of the encoder/decoder input arrays is handed to the
    # model as the maximum utterance length on each side.
    max_uttr_len_enc = train_set['enc_input'].shape[1]
    max_uttr_len_dec = train_set['dec_input'].shape[1]

    word_embeddings = np.load(args.word_embeddings_path)

    # Everything the model needs, gathered in one place: values taken from the
    # command line, values derived from the data, and the loaded embeddings.
    option_kwargs = dict(
        mode='TRAIN',
        num_epochs=args.num_epochs,
        batch_size=args.batch_size,
        learning_rate=args.learning_rate,
        beam_width=args.beam_width,
        vocab_size=len(token2id),
        max_uttr_len_enc=max_uttr_len_enc,
        max_uttr_len_dec=max_uttr_len_dec,
        go_index=token2id['<go>'],
        eos_index=token2id['<eos>'],
        word_embed_size=args.word_embed_size,
        n_hidden_units_enc=args.n_hidden_units_enc,
        n_hidden_units_dec=args.n_hidden_units_dec,
        attn_depth=args.attn_depth,
        word_embeddings=word_embeddings,
    )
    options = Options(**option_kwargs)
    model = Seq2SeqAttn(options)

    # Show the name of every entry in model.tvars.
    for var in model.tvars:
        print(var.name)

    if args.restore_epoch <= 0:
        # No checkpoint requested: initialise the variables.
        model.init_tf_vars()
    else:
        # Restore the checkpoint written for the requested epoch.
        checkpoint_name = 'model_epoch_{:03d}.ckpt'.format(args.restore_epoch)
        model.restore(os.path.join(args.restore_path, checkpoint_name))

    # NOTE(review): restore_epoch is presumably the epoch training resumes from
    # -- confirm against Seq2SeqAttn.train.
    model.train(train_set, args.save_path, args.restore_epoch, valid_set)


Building the TensorFlow graph...
embedding/word_embeddings:0
encoding/rnn/gru_cell/gates/kernel:0
encoding/rnn/gru_cell/gates/bias:0
encoding/rnn/gru_cell/candidate/kernel:0
encoding/rnn/gru_cell/candidate/bias:0
decoding/memory_layer/kernel:0
decoding/attention_v:0
decoding/my_bahdanau_attention/query_layer/kernel:0
decoding/attention_wrapper/gru_cell/gates/kernel:0
decoding/attention_wrapper/gru_cell/gates/bias:0
decoding/attention_wrapper/gru_cell/candidate/kernel:0
decoding/attention_wrapper/gru_cell/candidate/bias:0
decoding/dense/kernel:0
decoding/dense/bias:0
TensorFlow variables initialized.
Start to train the model...
Epoch 001/010, valid ppl = None, batch 0001/0508, train loss = 7.368693828582764
Epoch 001/010, valid ppl = None, batch 0002/0508, train loss = 7.304680824279785
Epoch 001/010, valid ppl = None, batch 0003/0508, train loss = 7.213321208953857
Epoch 001/010, valid ppl = None, batch 0004/0508, train loss = 7.312109470367432
Epoch 001/010, valid ppl = None, batch 00

Epoch 001/010, valid ppl = None, batch 0095/0508, train loss = 6.448348045349121
Epoch 001/010, valid ppl = None, batch 0096/0508, train loss = 4.595766544342041
Epoch 001/010, valid ppl = None, batch 0097/0508, train loss = 5.351205825805664
Epoch 001/010, valid ppl = None, batch 0098/0508, train loss = 4.946530342102051
Epoch 001/010, valid ppl = None, batch 0099/0508, train loss = 6.118973255157471
Epoch 001/010, valid ppl = None, batch 0100/0508, train loss = 4.349318027496338
Epoch 001/010, valid ppl = None, batch 0101/0508, train loss = 4.895392894744873
Epoch 001/010, valid ppl = None, batch 0102/0508, train loss = 4.385718822479248
Epoch 001/010, valid ppl = None, batch 0103/0508, train loss = 5.8848114013671875
Epoch 001/010, valid ppl = None, batch 0104/0508, train loss = 4.846677780151367
Epoch 001/010, valid ppl = None, batch 0105/0508, train loss = 5.062910556793213
Epoch 001/010, valid ppl = None, batch 0106/0508, train loss = 6.994507789611816
Epoch 001/010, valid ppl = 

Epoch 001/010, valid ppl = None, batch 0197/0508, train loss = 6.255429744720459
Epoch 001/010, valid ppl = None, batch 0198/0508, train loss = 4.75693416595459
Epoch 001/010, valid ppl = None, batch 0199/0508, train loss = 5.814449310302734
Epoch 001/010, valid ppl = None, batch 0200/0508, train loss = 6.220405578613281
Epoch 001/010, valid ppl = None, batch 0201/0508, train loss = 5.0271806716918945
Epoch 001/010, valid ppl = None, batch 0202/0508, train loss = 4.991115570068359
Epoch 001/010, valid ppl = None, batch 0203/0508, train loss = 3.6213436126708984
Epoch 001/010, valid ppl = None, batch 0204/0508, train loss = 5.293203830718994
Epoch 001/010, valid ppl = None, batch 0205/0508, train loss = 4.587733745574951
Epoch 001/010, valid ppl = None, batch 0206/0508, train loss = 5.8510942459106445
Epoch 001/010, valid ppl = None, batch 0207/0508, train loss = 4.126319408416748
Epoch 001/010, valid ppl = None, batch 0208/0508, train loss = 6.131417751312256
Epoch 001/010, valid ppl =

Epoch 001/010, valid ppl = None, batch 0299/0508, train loss = 5.151618480682373
Epoch 001/010, valid ppl = None, batch 0300/0508, train loss = 5.594198226928711
Epoch 001/010, valid ppl = None, batch 0301/0508, train loss = 5.545319557189941
Epoch 001/010, valid ppl = None, batch 0302/0508, train loss = 5.1512956619262695
Epoch 001/010, valid ppl = None, batch 0303/0508, train loss = 4.486741542816162
Epoch 001/010, valid ppl = None, batch 0304/0508, train loss = 3.954984426498413
Epoch 001/010, valid ppl = None, batch 0305/0508, train loss = 4.242379665374756
Epoch 001/010, valid ppl = None, batch 0306/0508, train loss = 5.7284369468688965
Epoch 001/010, valid ppl = None, batch 0307/0508, train loss = 5.349480628967285
Epoch 001/010, valid ppl = None, batch 0308/0508, train loss = 4.954710483551025
Epoch 001/010, valid ppl = None, batch 0309/0508, train loss = 4.60728645324707
Epoch 001/010, valid ppl = None, batch 0310/0508, train loss = 5.195657730102539
Epoch 001/010, valid ppl = 

Epoch 001/010, valid ppl = None, batch 0400/0508, train loss = 4.14119815826416
Epoch 001/010, valid ppl = None, batch 0401/0508, train loss = 5.270768642425537
Epoch 001/010, valid ppl = None, batch 0402/0508, train loss = 3.964315414428711
Epoch 001/010, valid ppl = None, batch 0403/0508, train loss = 5.687956809997559
Epoch 001/010, valid ppl = None, batch 0404/0508, train loss = 6.102665901184082
Epoch 001/010, valid ppl = None, batch 0405/0508, train loss = 5.982167720794678
Epoch 001/010, valid ppl = None, batch 0406/0508, train loss = 5.926502704620361
Epoch 001/010, valid ppl = None, batch 0407/0508, train loss = 6.625740051269531
Epoch 001/010, valid ppl = None, batch 0408/0508, train loss = 5.593047142028809
Epoch 001/010, valid ppl = None, batch 0409/0508, train loss = 5.3111090660095215
Epoch 001/010, valid ppl = None, batch 0410/0508, train loss = 3.7010936737060547
Epoch 001/010, valid ppl = None, batch 0411/0508, train loss = 6.051217079162598
Epoch 001/010, valid ppl = 

Epoch 001/010, valid ppl = None, batch 0501/0508, train loss = 3.5441014766693115
Epoch 001/010, valid ppl = None, batch 0502/0508, train loss = 5.24899959564209
Epoch 001/010, valid ppl = None, batch 0503/0508, train loss = 3.8530330657958984
Epoch 001/010, valid ppl = None, batch 0504/0508, train loss = 7.3014421463012695
Epoch 001/010, valid ppl = None, batch 0505/0508, train loss = 5.851811408996582
Epoch 001/010, valid ppl = None, batch 0506/0508, train loss = 4.716418743133545
Epoch 001/010, valid ppl = None, batch 0507/0508, train loss = 5.366741180419922
Epoch 001/010, valid ppl = None, batch 0508/0508, train loss = 5.586796283721924
Saving the trained model to ./model_dailydialog_rf/model_epoch_001.ckpt...
Epoch 002/010, valid ppl = 120.63403990420883, batch 0001/0508, train loss = 5.055620193481445
Epoch 002/010, valid ppl = 120.63403990420883, batch 0002/0508, train loss = 5.0271077156066895
Epoch 002/010, valid ppl = 120.63403990420883, batch 0003/0508, train loss = 6.32280

Epoch 002/010, valid ppl = 120.63403990420883, batch 0080/0508, train loss = 3.6766364574432373
Epoch 002/010, valid ppl = 120.63403990420883, batch 0081/0508, train loss = 4.843767166137695
Epoch 002/010, valid ppl = 120.63403990420883, batch 0082/0508, train loss = 5.293715476989746
Epoch 002/010, valid ppl = 120.63403990420883, batch 0083/0508, train loss = 2.2775020599365234
Epoch 002/010, valid ppl = 120.63403990420883, batch 0084/0508, train loss = 1.162298560142517
Epoch 002/010, valid ppl = 120.63403990420883, batch 0085/0508, train loss = 4.651834011077881
Epoch 002/010, valid ppl = 120.63403990420883, batch 0086/0508, train loss = 4.562288761138916
Epoch 002/010, valid ppl = 120.63403990420883, batch 0087/0508, train loss = 2.342717409133911
Epoch 002/010, valid ppl = 120.63403990420883, batch 0088/0508, train loss = 4.833137512207031
Epoch 002/010, valid ppl = 120.63403990420883, batch 0089/0508, train loss = 1.6449122428894043
Epoch 002/010, valid ppl = 120.63403990420883, 

Epoch 002/010, valid ppl = 120.63403990420883, batch 0167/0508, train loss = 3.859398603439331
Epoch 002/010, valid ppl = 120.63403990420883, batch 0168/0508, train loss = 4.033249378204346
Epoch 002/010, valid ppl = 120.63403990420883, batch 0169/0508, train loss = 4.934250354766846
Epoch 002/010, valid ppl = 120.63403990420883, batch 0170/0508, train loss = 3.3079440593719482
Epoch 002/010, valid ppl = 120.63403990420883, batch 0171/0508, train loss = 4.409295558929443
Epoch 002/010, valid ppl = 120.63403990420883, batch 0172/0508, train loss = 5.001101970672607
Epoch 002/010, valid ppl = 120.63403990420883, batch 0173/0508, train loss = 6.097934246063232
Epoch 002/010, valid ppl = 120.63403990420883, batch 0174/0508, train loss = 2.1621108055114746
Epoch 002/010, valid ppl = 120.63403990420883, batch 0175/0508, train loss = 3.1699090003967285
Epoch 002/010, valid ppl = 120.63403990420883, batch 0176/0508, train loss = 6.010542392730713
Epoch 002/010, valid ppl = 120.63403990420883, 

Epoch 002/010, valid ppl = 120.63403990420883, batch 0254/0508, train loss = 5.086292266845703
Epoch 002/010, valid ppl = 120.63403990420883, batch 0255/0508, train loss = 3.9232335090637207
Epoch 002/010, valid ppl = 120.63403990420883, batch 0256/0508, train loss = 4.523638725280762
Epoch 002/010, valid ppl = 120.63403990420883, batch 0257/0508, train loss = 4.758864402770996
Epoch 002/010, valid ppl = 120.63403990420883, batch 0258/0508, train loss = 3.9855287075042725
Epoch 002/010, valid ppl = 120.63403990420883, batch 0259/0508, train loss = 5.860074520111084
Epoch 002/010, valid ppl = 120.63403990420883, batch 0260/0508, train loss = 4.879950523376465
Epoch 002/010, valid ppl = 120.63403990420883, batch 0261/0508, train loss = 3.8139760494232178
Epoch 002/010, valid ppl = 120.63403990420883, batch 0262/0508, train loss = 3.826932191848755
Epoch 002/010, valid ppl = 120.63403990420883, batch 0263/0508, train loss = 4.241097927093506
Epoch 002/010, valid ppl = 120.63403990420883, 

Epoch 002/010, valid ppl = 120.63403990420883, batch 0341/0508, train loss = 4.675627708435059
Epoch 002/010, valid ppl = 120.63403990420883, batch 0342/0508, train loss = 5.199068069458008
Epoch 002/010, valid ppl = 120.63403990420883, batch 0343/0508, train loss = 2.6248772144317627
Epoch 002/010, valid ppl = 120.63403990420883, batch 0344/0508, train loss = 1.0343012809753418
Epoch 002/010, valid ppl = 120.63403990420883, batch 0345/0508, train loss = 4.994429111480713
Epoch 002/010, valid ppl = 120.63403990420883, batch 0346/0508, train loss = 4.971125602722168
Epoch 002/010, valid ppl = 120.63403990420883, batch 0347/0508, train loss = 4.0253801345825195
Epoch 002/010, valid ppl = 120.63403990420883, batch 0348/0508, train loss = 4.286047458648682
Epoch 002/010, valid ppl = 120.63403990420883, batch 0349/0508, train loss = 4.80405855178833
Epoch 002/010, valid ppl = 120.63403990420883, batch 0350/0508, train loss = 4.103457927703857
Epoch 002/010, valid ppl = 120.63403990420883, b

Epoch 002/010, valid ppl = 120.63403990420883, batch 0428/0508, train loss = 6.007573127746582
Epoch 002/010, valid ppl = 120.63403990420883, batch 0429/0508, train loss = 6.144204616546631
Epoch 002/010, valid ppl = 120.63403990420883, batch 0430/0508, train loss = 3.2251107692718506
Epoch 002/010, valid ppl = 120.63403990420883, batch 0431/0508, train loss = 5.720931053161621
Epoch 002/010, valid ppl = 120.63403990420883, batch 0432/0508, train loss = 4.343952178955078
Epoch 002/010, valid ppl = 120.63403990420883, batch 0433/0508, train loss = 5.612496852874756
Epoch 002/010, valid ppl = 120.63403990420883, batch 0434/0508, train loss = 3.6362152099609375
Epoch 002/010, valid ppl = 120.63403990420883, batch 0435/0508, train loss = 5.0498046875
Epoch 002/010, valid ppl = 120.63403990420883, batch 0436/0508, train loss = 5.326091289520264
Epoch 002/010, valid ppl = 120.63403990420883, batch 0437/0508, train loss = 2.5445871353149414
Epoch 002/010, valid ppl = 120.63403990420883, batch

Epoch 003/010, valid ppl = 118.79532458312138, batch 0006/0508, train loss = 2.4751853942871094
Epoch 003/010, valid ppl = 118.79532458312138, batch 0007/0508, train loss = 4.49712610244751
Epoch 003/010, valid ppl = 118.79532458312138, batch 0008/0508, train loss = 3.598388671875
Epoch 003/010, valid ppl = 118.79532458312138, batch 0009/0508, train loss = 4.885589599609375
Epoch 003/010, valid ppl = 118.79532458312138, batch 0010/0508, train loss = 2.8724184036254883
Epoch 003/010, valid ppl = 118.79532458312138, batch 0011/0508, train loss = 4.826246738433838
Epoch 003/010, valid ppl = 118.79532458312138, batch 0012/0508, train loss = 5.143311500549316
Epoch 003/010, valid ppl = 118.79532458312138, batch 0013/0508, train loss = 3.897350311279297
Epoch 003/010, valid ppl = 118.79532458312138, batch 0014/0508, train loss = 4.052797317504883
Epoch 003/010, valid ppl = 118.79532458312138, batch 0015/0508, train loss = 3.8896031379699707
Epoch 003/010, valid ppl = 118.79532458312138, batc

Epoch 003/010, valid ppl = 118.79532458312138, batch 0093/0508, train loss = 5.385684013366699
Epoch 003/010, valid ppl = 118.79532458312138, batch 0094/0508, train loss = 2.1794230937957764
Epoch 003/010, valid ppl = 118.79532458312138, batch 0095/0508, train loss = 3.489924669265747
Epoch 003/010, valid ppl = 118.79532458312138, batch 0096/0508, train loss = 2.3595187664031982
Epoch 003/010, valid ppl = 118.79532458312138, batch 0097/0508, train loss = 3.5139100551605225
Epoch 003/010, valid ppl = 118.79532458312138, batch 0098/0508, train loss = 3.315824031829834
Epoch 003/010, valid ppl = 118.79532458312138, batch 0099/0508, train loss = 5.327434062957764
Epoch 003/010, valid ppl = 118.79532458312138, batch 0100/0508, train loss = 3.979426622390747
Epoch 003/010, valid ppl = 118.79532458312138, batch 0101/0508, train loss = 4.483570098876953
Epoch 003/010, valid ppl = 118.79532458312138, batch 0102/0508, train loss = 4.719291687011719
Epoch 003/010, valid ppl = 118.79532458312138, 

Epoch 003/010, valid ppl = 118.79532458312138, batch 0179/0508, train loss = 4.497322082519531
Epoch 003/010, valid ppl = 118.79532458312138, batch 0180/0508, train loss = 4.798752784729004
Epoch 003/010, valid ppl = 118.79532458312138, batch 0181/0508, train loss = 3.491511106491089
Epoch 003/010, valid ppl = 118.79532458312138, batch 0182/0508, train loss = 5.051914691925049
Epoch 003/010, valid ppl = 118.79532458312138, batch 0183/0508, train loss = 4.411609172821045
Epoch 003/010, valid ppl = 118.79532458312138, batch 0184/0508, train loss = 4.210038185119629
Epoch 003/010, valid ppl = 118.79532458312138, batch 0185/0508, train loss = 2.1219465732574463
Epoch 003/010, valid ppl = 118.79532458312138, batch 0186/0508, train loss = 2.764476776123047
Epoch 003/010, valid ppl = 118.79532458312138, batch 0187/0508, train loss = 3.8516595363616943
Epoch 003/010, valid ppl = 118.79532458312138, batch 0188/0508, train loss = 4.394442558288574
Epoch 003/010, valid ppl = 118.79532458312138, b

Epoch 003/010, valid ppl = 118.79532458312138, batch 0265/0508, train loss = 2.7969906330108643
Epoch 003/010, valid ppl = 118.79532458312138, batch 0266/0508, train loss = 5.065258979797363
Epoch 003/010, valid ppl = 118.79532458312138, batch 0267/0508, train loss = 4.111340522766113
Epoch 003/010, valid ppl = 118.79532458312138, batch 0268/0508, train loss = 5.227219581604004
Epoch 003/010, valid ppl = 118.79532458312138, batch 0269/0508, train loss = 3.348900079727173
Epoch 003/010, valid ppl = 118.79532458312138, batch 0270/0508, train loss = 3.629058837890625
Epoch 003/010, valid ppl = 118.79532458312138, batch 0271/0508, train loss = 3.1602532863616943
Epoch 003/010, valid ppl = 118.79532458312138, batch 0272/0508, train loss = 4.2886762619018555
Epoch 003/010, valid ppl = 118.79532458312138, batch 0273/0508, train loss = 3.138216972351074
Epoch 003/010, valid ppl = 118.79532458312138, batch 0274/0508, train loss = 2.742966890335083
Epoch 003/010, valid ppl = 118.79532458312138, 

Epoch 003/010, valid ppl = 118.79532458312138, batch 0352/0508, train loss = 4.395349502563477
Epoch 003/010, valid ppl = 118.79532458312138, batch 0353/0508, train loss = 0.7539057731628418
Epoch 003/010, valid ppl = 118.79532458312138, batch 0354/0508, train loss = 3.2074599266052246
Epoch 003/010, valid ppl = 118.79532458312138, batch 0355/0508, train loss = 3.922900915145874
Epoch 003/010, valid ppl = 118.79532458312138, batch 0356/0508, train loss = 4.1140570640563965
Epoch 003/010, valid ppl = 118.79532458312138, batch 0357/0508, train loss = 3.765392303466797
Epoch 003/010, valid ppl = 118.79532458312138, batch 0358/0508, train loss = 3.2763116359710693
Epoch 003/010, valid ppl = 118.79532458312138, batch 0359/0508, train loss = 4.332615375518799
Epoch 003/010, valid ppl = 118.79532458312138, batch 0360/0508, train loss = 3.7007973194122314
Epoch 003/010, valid ppl = 118.79532458312138, batch 0361/0508, train loss = 4.032514572143555
Epoch 003/010, valid ppl = 118.79532458312138

Epoch 003/010, valid ppl = 118.79532458312138, batch 0438/0508, train loss = 4.733376979827881
Epoch 003/010, valid ppl = 118.79532458312138, batch 0439/0508, train loss = 4.886661052703857
Epoch 003/010, valid ppl = 118.79532458312138, batch 0440/0508, train loss = 4.345930576324463
Epoch 003/010, valid ppl = 118.79532458312138, batch 0441/0508, train loss = 5.5920233726501465
Epoch 003/010, valid ppl = 118.79532458312138, batch 0442/0508, train loss = 4.082847595214844
Epoch 003/010, valid ppl = 118.79532458312138, batch 0443/0508, train loss = 2.3654651641845703
Epoch 003/010, valid ppl = 118.79532458312138, batch 0444/0508, train loss = 4.492830753326416
Epoch 003/010, valid ppl = 118.79532458312138, batch 0445/0508, train loss = 4.360732078552246
Epoch 003/010, valid ppl = 118.79532458312138, batch 0446/0508, train loss = 3.1538820266723633
Epoch 003/010, valid ppl = 118.79532458312138, batch 0447/0508, train loss = 3.9273104667663574
Epoch 003/010, valid ppl = 118.79532458312138,

Epoch 004/010, valid ppl = 146.13936505096146, batch 0016/0508, train loss = 3.681380033493042
Epoch 004/010, valid ppl = 146.13936505096146, batch 0017/0508, train loss = 3.8828036785125732
Epoch 004/010, valid ppl = 146.13936505096146, batch 0018/0508, train loss = 4.495388984680176
Epoch 004/010, valid ppl = 146.13936505096146, batch 0019/0508, train loss = 3.6345672607421875
Epoch 004/010, valid ppl = 146.13936505096146, batch 0020/0508, train loss = 3.3565943241119385
Epoch 004/010, valid ppl = 146.13936505096146, batch 0021/0508, train loss = 3.3138186931610107
Epoch 004/010, valid ppl = 146.13936505096146, batch 0022/0508, train loss = 1.0211125612258911
Epoch 004/010, valid ppl = 146.13936505096146, batch 0023/0508, train loss = 4.179083824157715
Epoch 004/010, valid ppl = 146.13936505096146, batch 0024/0508, train loss = 4.540969371795654
Epoch 004/010, valid ppl = 146.13936505096146, batch 0025/0508, train loss = 3.329148769378662
Epoch 004/010, valid ppl = 146.13936505096146

Epoch 004/010, valid ppl = 146.13936505096146, batch 0102/0508, train loss = 3.125889778137207
Epoch 004/010, valid ppl = 146.13936505096146, batch 0103/0508, train loss = 3.7637994289398193
Epoch 004/010, valid ppl = 146.13936505096146, batch 0104/0508, train loss = 3.6057112216949463
Epoch 004/010, valid ppl = 146.13936505096146, batch 0105/0508, train loss = 3.3732376098632812
Epoch 004/010, valid ppl = 146.13936505096146, batch 0106/0508, train loss = 3.3998162746429443
Epoch 004/010, valid ppl = 146.13936505096146, batch 0107/0508, train loss = 3.697654962539673
Epoch 004/010, valid ppl = 146.13936505096146, batch 0108/0508, train loss = 4.539421081542969
Epoch 004/010, valid ppl = 146.13936505096146, batch 0109/0508, train loss = 2.6797938346862793
Epoch 004/010, valid ppl = 146.13936505096146, batch 0110/0508, train loss = 2.951159715652466
Epoch 004/010, valid ppl = 146.13936505096146, batch 0111/0508, train loss = 4.085903167724609
Epoch 004/010, valid ppl = 146.13936505096146

Epoch 004/010, valid ppl = 146.13936505096146, batch 0188/0508, train loss = 3.5639700889587402
Epoch 004/010, valid ppl = 146.13936505096146, batch 0189/0508, train loss = 3.1029586791992188
Epoch 004/010, valid ppl = 146.13936505096146, batch 0190/0508, train loss = 2.670419692993164
Epoch 004/010, valid ppl = 146.13936505096146, batch 0191/0508, train loss = 3.5982208251953125
Epoch 004/010, valid ppl = 146.13936505096146, batch 0192/0508, train loss = 3.520918130874634
Epoch 004/010, valid ppl = 146.13936505096146, batch 0193/0508, train loss = 3.4678831100463867
Epoch 004/010, valid ppl = 146.13936505096146, batch 0194/0508, train loss = 3.4721264839172363
Epoch 004/010, valid ppl = 146.13936505096146, batch 0195/0508, train loss = 3.8402833938598633
Epoch 004/010, valid ppl = 146.13936505096146, batch 0196/0508, train loss = 3.8227336406707764
Epoch 004/010, valid ppl = 146.13936505096146, batch 0197/0508, train loss = 3.357893705368042
Epoch 004/010, valid ppl = 146.139365050961

Epoch 004/010, valid ppl = 146.13936505096146, batch 0274/0508, train loss = 3.852524757385254
Epoch 004/010, valid ppl = 146.13936505096146, batch 0275/0508, train loss = 1.1667073965072632
Epoch 004/010, valid ppl = 146.13936505096146, batch 0276/0508, train loss = 4.181654453277588
Epoch 004/010, valid ppl = 146.13936505096146, batch 0277/0508, train loss = 2.5294015407562256
Epoch 004/010, valid ppl = 146.13936505096146, batch 0278/0508, train loss = 2.522768020629883
Epoch 004/010, valid ppl = 146.13936505096146, batch 0279/0508, train loss = 3.1175365447998047
Epoch 004/010, valid ppl = 146.13936505096146, batch 0280/0508, train loss = 4.103924751281738
Epoch 004/010, valid ppl = 146.13936505096146, batch 0281/0508, train loss = 4.534101486206055
Epoch 004/010, valid ppl = 146.13936505096146, batch 0282/0508, train loss = 4.180868625640869
Epoch 004/010, valid ppl = 146.13936505096146, batch 0283/0508, train loss = 4.460292816162109
Epoch 004/010, valid ppl = 146.13936505096146, 

Epoch 004/010, valid ppl = 146.13936505096146, batch 0360/0508, train loss = 3.1889970302581787
Epoch 004/010, valid ppl = 146.13936505096146, batch 0361/0508, train loss = 3.7053089141845703
Epoch 004/010, valid ppl = 146.13936505096146, batch 0362/0508, train loss = 4.074317455291748
Epoch 004/010, valid ppl = 146.13936505096146, batch 0363/0508, train loss = 3.3735010623931885
Epoch 004/010, valid ppl = 146.13936505096146, batch 0364/0508, train loss = 4.062209129333496
Epoch 004/010, valid ppl = 146.13936505096146, batch 0365/0508, train loss = 4.261528015136719
Epoch 004/010, valid ppl = 146.13936505096146, batch 0366/0508, train loss = 3.3324637413024902
Epoch 004/010, valid ppl = 146.13936505096146, batch 0367/0508, train loss = 3.1272971630096436
Epoch 004/010, valid ppl = 146.13936505096146, batch 0368/0508, train loss = 3.366006851196289
Epoch 004/010, valid ppl = 146.13936505096146, batch 0369/0508, train loss = 3.816365957260132
Epoch 004/010, valid ppl = 146.13936505096146

Epoch 004/010, valid ppl = 146.13936505096146, batch 0446/0508, train loss = 2.080489158630371
Epoch 004/010, valid ppl = 146.13936505096146, batch 0447/0508, train loss = 4.942586898803711
Epoch 004/010, valid ppl = 146.13936505096146, batch 0448/0508, train loss = 4.232222080230713
Epoch 004/010, valid ppl = 146.13936505096146, batch 0449/0508, train loss = 2.4447100162506104
Epoch 004/010, valid ppl = 146.13936505096146, batch 0450/0508, train loss = 3.2772884368896484
Epoch 004/010, valid ppl = 146.13936505096146, batch 0451/0508, train loss = 3.055135488510132
Epoch 004/010, valid ppl = 146.13936505096146, batch 0452/0508, train loss = 3.2249960899353027
Epoch 004/010, valid ppl = 146.13936505096146, batch 0453/0508, train loss = 4.096200942993164
Epoch 004/010, valid ppl = 146.13936505096146, batch 0454/0508, train loss = 2.7454817295074463
Epoch 004/010, valid ppl = 146.13936505096146, batch 0455/0508, train loss = 4.60338020324707
Epoch 004/010, valid ppl = 146.13936505096146, 

Epoch 005/010, valid ppl = 164.35373648988278, batch 0024/0508, train loss = 3.8391523361206055
Epoch 005/010, valid ppl = 164.35373648988278, batch 0025/0508, train loss = 2.623026132583618
Epoch 005/010, valid ppl = 164.35373648988278, batch 0026/0508, train loss = 2.5018107891082764
Epoch 005/010, valid ppl = 164.35373648988278, batch 0027/0508, train loss = 1.481763243675232
Epoch 005/010, valid ppl = 164.35373648988278, batch 0028/0508, train loss = 3.183420419692993
Epoch 005/010, valid ppl = 164.35373648988278, batch 0029/0508, train loss = 3.2726876735687256
Epoch 005/010, valid ppl = 164.35373648988278, batch 0030/0508, train loss = 3.1572439670562744
Epoch 005/010, valid ppl = 164.35373648988278, batch 0031/0508, train loss = 2.0359673500061035
Epoch 005/010, valid ppl = 164.35373648988278, batch 0032/0508, train loss = 2.641813278198242
Epoch 005/010, valid ppl = 164.35373648988278, batch 0033/0508, train loss = 1.7241673469543457
Epoch 005/010, valid ppl = 164.3537364898827

Epoch 005/010, valid ppl = 164.35373648988278, batch 0110/0508, train loss = 3.450714111328125
Epoch 005/010, valid ppl = 164.35373648988278, batch 0111/0508, train loss = 2.750746250152588
Epoch 005/010, valid ppl = 164.35373648988278, batch 0112/0508, train loss = 1.3294795751571655
Epoch 005/010, valid ppl = 164.35373648988278, batch 0113/0508, train loss = 1.2965396642684937
Epoch 005/010, valid ppl = 164.35373648988278, batch 0114/0508, train loss = 2.525463581085205
Epoch 005/010, valid ppl = 164.35373648988278, batch 0115/0508, train loss = 2.4376046657562256
Epoch 005/010, valid ppl = 164.35373648988278, batch 0116/0508, train loss = 2.224989175796509
Epoch 005/010, valid ppl = 164.35373648988278, batch 0117/0508, train loss = 2.3784546852111816
Epoch 005/010, valid ppl = 164.35373648988278, batch 0118/0508, train loss = 2.7657198905944824
Epoch 005/010, valid ppl = 164.35373648988278, batch 0119/0508, train loss = 3.100025177001953
Epoch 005/010, valid ppl = 164.35373648988278

Epoch 005/010, valid ppl = 164.35373648988278, batch 0196/0508, train loss = 4.664553642272949
Epoch 005/010, valid ppl = 164.35373648988278, batch 0197/0508, train loss = 3.3428468704223633
Epoch 005/010, valid ppl = 164.35373648988278, batch 0198/0508, train loss = 1.8299174308776855
Epoch 005/010, valid ppl = 164.35373648988278, batch 0199/0508, train loss = 3.158172607421875
Epoch 005/010, valid ppl = 164.35373648988278, batch 0200/0508, train loss = 1.9461861848831177
Epoch 005/010, valid ppl = 164.35373648988278, batch 0201/0508, train loss = 2.4968996047973633
Epoch 005/010, valid ppl = 164.35373648988278, batch 0202/0508, train loss = 2.524078845977783
Epoch 005/010, valid ppl = 164.35373648988278, batch 0203/0508, train loss = 2.667376756668091
Epoch 005/010, valid ppl = 164.35373648988278, batch 0204/0508, train loss = 3.6193928718566895
Epoch 005/010, valid ppl = 164.35373648988278, batch 0205/0508, train loss = 3.488497495651245
Epoch 005/010, valid ppl = 164.35373648988278

Epoch 005/010, valid ppl = 164.35373648988278, batch 0282/0508, train loss = 3.8142929077148438
Epoch 005/010, valid ppl = 164.35373648988278, batch 0283/0508, train loss = 3.0052638053894043
Epoch 005/010, valid ppl = 164.35373648988278, batch 0284/0508, train loss = 2.9776108264923096
Epoch 005/010, valid ppl = 164.35373648988278, batch 0285/0508, train loss = 1.9423919916152954
Epoch 005/010, valid ppl = 164.35373648988278, batch 0286/0508, train loss = 2.4294919967651367
Epoch 005/010, valid ppl = 164.35373648988278, batch 0287/0508, train loss = 2.8301212787628174
Epoch 005/010, valid ppl = 164.35373648988278, batch 0288/0508, train loss = 2.4345548152923584
Epoch 005/010, valid ppl = 164.35373648988278, batch 0289/0508, train loss = 3.2095937728881836
Epoch 005/010, valid ppl = 164.35373648988278, batch 0290/0508, train loss = 1.6782172918319702
Epoch 005/010, valid ppl = 164.35373648988278, batch 0291/0508, train loss = 1.4126497507095337
Epoch 005/010, valid ppl = 164.353736489

Epoch 005/010, valid ppl = 164.35373648988278, batch 0368/0508, train loss = 2.590055227279663
Epoch 005/010, valid ppl = 164.35373648988278, batch 0369/0508, train loss = 1.6160539388656616
Epoch 005/010, valid ppl = 164.35373648988278, batch 0370/0508, train loss = 1.9565191268920898
Epoch 005/010, valid ppl = 164.35373648988278, batch 0371/0508, train loss = 3.7754948139190674
Epoch 005/010, valid ppl = 164.35373648988278, batch 0372/0508, train loss = 3.322357416152954
Epoch 005/010, valid ppl = 164.35373648988278, batch 0373/0508, train loss = 2.073115348815918
Epoch 005/010, valid ppl = 164.35373648988278, batch 0374/0508, train loss = 2.232022523880005
Epoch 005/010, valid ppl = 164.35373648988278, batch 0375/0508, train loss = 2.8843345642089844
Epoch 005/010, valid ppl = 164.35373648988278, batch 0376/0508, train loss = 3.6590561866760254
Epoch 005/010, valid ppl = 164.35373648988278, batch 0377/0508, train loss = 1.89984130859375
Epoch 005/010, valid ppl = 164.35373648988278,

Epoch 005/010, valid ppl = 164.35373648988278, batch 0454/0508, train loss = 3.060737133026123
Epoch 005/010, valid ppl = 164.35373648988278, batch 0455/0508, train loss = 2.782625198364258
Epoch 005/010, valid ppl = 164.35373648988278, batch 0456/0508, train loss = 3.0626091957092285
Epoch 005/010, valid ppl = 164.35373648988278, batch 0457/0508, train loss = 3.002350330352783
Epoch 005/010, valid ppl = 164.35373648988278, batch 0458/0508, train loss = 3.2929656505584717
Epoch 005/010, valid ppl = 164.35373648988278, batch 0459/0508, train loss = 3.6159827709198
Epoch 005/010, valid ppl = 164.35373648988278, batch 0460/0508, train loss = 1.6471995115280151
Epoch 005/010, valid ppl = 164.35373648988278, batch 0461/0508, train loss = 4.196456432342529
Epoch 005/010, valid ppl = 164.35373648988278, batch 0462/0508, train loss = 2.8418893814086914
Epoch 005/010, valid ppl = 164.35373648988278, batch 0463/0508, train loss = 2.189303159713745
Epoch 005/010, valid ppl = 164.35373648988278, b

Epoch 006/010, valid ppl = 188.4198270023736, batch 0032/0508, train loss = 1.8182004690170288
Epoch 006/010, valid ppl = 188.4198270023736, batch 0033/0508, train loss = 2.648716688156128
Epoch 006/010, valid ppl = 188.4198270023736, batch 0034/0508, train loss = 2.502047061920166
Epoch 006/010, valid ppl = 188.4198270023736, batch 0035/0508, train loss = 1.9543430805206299
Epoch 006/010, valid ppl = 188.4198270023736, batch 0036/0508, train loss = 2.5873751640319824
Epoch 006/010, valid ppl = 188.4198270023736, batch 0037/0508, train loss = 1.6918805837631226
Epoch 006/010, valid ppl = 188.4198270023736, batch 0038/0508, train loss = 2.517629623413086
Epoch 006/010, valid ppl = 188.4198270023736, batch 0039/0508, train loss = 1.1584707498550415
Epoch 006/010, valid ppl = 188.4198270023736, batch 0040/0508, train loss = 2.9492499828338623
Epoch 006/010, valid ppl = 188.4198270023736, batch 0041/0508, train loss = 1.834686279296875
Epoch 006/010, valid ppl = 188.4198270023736, batch 00

Epoch 006/010, valid ppl = 188.4198270023736, batch 0119/0508, train loss = 1.05767822265625
Epoch 006/010, valid ppl = 188.4198270023736, batch 0120/0508, train loss = 2.7398579120635986
Epoch 006/010, valid ppl = 188.4198270023736, batch 0121/0508, train loss = 1.6411350965499878
Epoch 006/010, valid ppl = 188.4198270023736, batch 0122/0508, train loss = 1.7293546199798584
Epoch 006/010, valid ppl = 188.4198270023736, batch 0123/0508, train loss = 1.4816007614135742
Epoch 006/010, valid ppl = 188.4198270023736, batch 0124/0508, train loss = 1.6845076084136963
Epoch 006/010, valid ppl = 188.4198270023736, batch 0125/0508, train loss = 1.8374754190444946
Epoch 006/010, valid ppl = 188.4198270023736, batch 0126/0508, train loss = 2.0562195777893066
Epoch 006/010, valid ppl = 188.4198270023736, batch 0127/0508, train loss = 2.40556001663208
Epoch 006/010, valid ppl = 188.4198270023736, batch 0128/0508, train loss = 1.523307204246521
Epoch 006/010, valid ppl = 188.4198270023736, batch 012

Epoch 006/010, valid ppl = 188.4198270023736, batch 0206/0508, train loss = 2.0233778953552246
Epoch 006/010, valid ppl = 188.4198270023736, batch 0207/0508, train loss = 1.868370771408081
Epoch 006/010, valid ppl = 188.4198270023736, batch 0208/0508, train loss = 2.5152392387390137
Epoch 006/010, valid ppl = 188.4198270023736, batch 0209/0508, train loss = 1.0359092950820923
Epoch 006/010, valid ppl = 188.4198270023736, batch 0210/0508, train loss = 2.9402973651885986
Epoch 006/010, valid ppl = 188.4198270023736, batch 0211/0508, train loss = 1.252424716949463
Epoch 006/010, valid ppl = 188.4198270023736, batch 0212/0508, train loss = 1.5448716878890991
Epoch 006/010, valid ppl = 188.4198270023736, batch 0213/0508, train loss = 2.224208354949951
Epoch 006/010, valid ppl = 188.4198270023736, batch 0214/0508, train loss = 2.4408650398254395
Epoch 006/010, valid ppl = 188.4198270023736, batch 0215/0508, train loss = 1.6880069971084595
Epoch 006/010, valid ppl = 188.4198270023736, batch 0

Epoch 006/010, valid ppl = 188.4198270023736, batch 0293/0508, train loss = 1.0845956802368164
Epoch 006/010, valid ppl = 188.4198270023736, batch 0294/0508, train loss = 3.4231112003326416
Epoch 006/010, valid ppl = 188.4198270023736, batch 0295/0508, train loss = 2.7470319271087646
Epoch 006/010, valid ppl = 188.4198270023736, batch 0296/0508, train loss = 2.368335247039795
Epoch 006/010, valid ppl = 188.4198270023736, batch 0297/0508, train loss = 2.5882022380828857
Epoch 006/010, valid ppl = 188.4198270023736, batch 0298/0508, train loss = 1.8002818822860718
Epoch 006/010, valid ppl = 188.4198270023736, batch 0299/0508, train loss = 2.778137683868408
Epoch 006/010, valid ppl = 188.4198270023736, batch 0300/0508, train loss = 2.55627703666687
Epoch 006/010, valid ppl = 188.4198270023736, batch 0301/0508, train loss = 1.058272123336792
Epoch 006/010, valid ppl = 188.4198270023736, batch 0302/0508, train loss = 1.6015526056289673
Epoch 006/010, valid ppl = 188.4198270023736, batch 030

Epoch 006/010, valid ppl = 188.4198270023736, batch 0380/0508, train loss = 2.161344528198242
Epoch 006/010, valid ppl = 188.4198270023736, batch 0381/0508, train loss = 2.49835205078125
Epoch 006/010, valid ppl = 188.4198270023736, batch 0382/0508, train loss = 3.3038864135742188
Epoch 006/010, valid ppl = 188.4198270023736, batch 0383/0508, train loss = 2.0456418991088867
Epoch 006/010, valid ppl = 188.4198270023736, batch 0384/0508, train loss = 3.257106065750122
Epoch 006/010, valid ppl = 188.4198270023736, batch 0385/0508, train loss = 2.5505383014678955
Epoch 006/010, valid ppl = 188.4198270023736, batch 0386/0508, train loss = 2.27799916267395
Epoch 006/010, valid ppl = 188.4198270023736, batch 0387/0508, train loss = 1.893565058708191
Epoch 006/010, valid ppl = 188.4198270023736, batch 0388/0508, train loss = 2.3982274532318115
Epoch 006/010, valid ppl = 188.4198270023736, batch 0389/0508, train loss = 1.7645639181137085
Epoch 006/010, valid ppl = 188.4198270023736, batch 0390/

Epoch 006/010, valid ppl = 188.4198270023736, batch 0467/0508, train loss = 1.100098729133606
Epoch 006/010, valid ppl = 188.4198270023736, batch 0468/0508, train loss = 2.3738646507263184
Epoch 006/010, valid ppl = 188.4198270023736, batch 0469/0508, train loss = 1.3008637428283691
Epoch 006/010, valid ppl = 188.4198270023736, batch 0470/0508, train loss = 2.128192663192749
Epoch 006/010, valid ppl = 188.4198270023736, batch 0471/0508, train loss = 2.1778385639190674
Epoch 006/010, valid ppl = 188.4198270023736, batch 0472/0508, train loss = 0.9278500080108643
Epoch 006/010, valid ppl = 188.4198270023736, batch 0473/0508, train loss = 1.3806232213974
Epoch 006/010, valid ppl = 188.4198270023736, batch 0474/0508, train loss = 3.0792956352233887
Epoch 006/010, valid ppl = 188.4198270023736, batch 0475/0508, train loss = 1.7727428674697876
Epoch 006/010, valid ppl = 188.4198270023736, batch 0476/0508, train loss = 2.2742481231689453
Epoch 006/010, valid ppl = 188.4198270023736, batch 047

Epoch 007/010, valid ppl = 283.40933614803555, batch 0045/0508, train loss = 1.7063226699829102
Epoch 007/010, valid ppl = 283.40933614803555, batch 0046/0508, train loss = 1.5138051509857178
Epoch 007/010, valid ppl = 283.40933614803555, batch 0047/0508, train loss = 1.1669844388961792
Epoch 007/010, valid ppl = 283.40933614803555, batch 0048/0508, train loss = 1.5573606491088867
Epoch 007/010, valid ppl = 283.40933614803555, batch 0049/0508, train loss = 1.2669178247451782
Epoch 007/010, valid ppl = 283.40933614803555, batch 0050/0508, train loss = 0.8166859745979309
Epoch 007/010, valid ppl = 283.40933614803555, batch 0051/0508, train loss = 1.3721280097961426
Epoch 007/010, valid ppl = 283.40933614803555, batch 0052/0508, train loss = 2.0306384563446045
Epoch 007/010, valid ppl = 283.40933614803555, batch 0053/0508, train loss = 0.62822026014328
Epoch 007/010, valid ppl = 283.40933614803555, batch 0054/0508, train loss = 1.189588189125061
Epoch 007/010, valid ppl = 283.409336148035

Epoch 007/010, valid ppl = 283.40933614803555, batch 0131/0508, train loss = 0.1191595196723938
Epoch 007/010, valid ppl = 283.40933614803555, batch 0132/0508, train loss = 1.355767011642456
Epoch 007/010, valid ppl = 283.40933614803555, batch 0133/0508, train loss = 1.2559741735458374
Epoch 007/010, valid ppl = 283.40933614803555, batch 0134/0508, train loss = 1.64776611328125
Epoch 007/010, valid ppl = 283.40933614803555, batch 0135/0508, train loss = 1.0114973783493042
Epoch 007/010, valid ppl = 283.40933614803555, batch 0136/0508, train loss = 1.1687391996383667
Epoch 007/010, valid ppl = 283.40933614803555, batch 0137/0508, train loss = 0.8113706707954407
Epoch 007/010, valid ppl = 283.40933614803555, batch 0138/0508, train loss = 1.6771936416625977
Epoch 007/010, valid ppl = 283.40933614803555, batch 0139/0508, train loss = 0.823487401008606
Epoch 007/010, valid ppl = 283.40933614803555, batch 0140/0508, train loss = 2.4712018966674805
Epoch 007/010, valid ppl = 283.4093361480355

Epoch 007/010, valid ppl = 283.40933614803555, batch 0217/0508, train loss = 1.3164981603622437
Epoch 007/010, valid ppl = 283.40933614803555, batch 0218/0508, train loss = 2.3690547943115234
Epoch 007/010, valid ppl = 283.40933614803555, batch 0219/0508, train loss = 1.1896765232086182
Epoch 007/010, valid ppl = 283.40933614803555, batch 0220/0508, train loss = 1.1244431734085083
Epoch 007/010, valid ppl = 283.40933614803555, batch 0221/0508, train loss = 1.869352102279663
Epoch 007/010, valid ppl = 283.40933614803555, batch 0222/0508, train loss = 1.0195388793945312
Epoch 007/010, valid ppl = 283.40933614803555, batch 0223/0508, train loss = 1.7193472385406494
Epoch 007/010, valid ppl = 283.40933614803555, batch 0224/0508, train loss = 1.4923388957977295
Epoch 007/010, valid ppl = 283.40933614803555, batch 0225/0508, train loss = 0.9337947368621826
Epoch 007/010, valid ppl = 283.40933614803555, batch 0226/0508, train loss = 0.8973850011825562
Epoch 007/010, valid ppl = 283.4093361480

Epoch 007/010, valid ppl = 283.40933614803555, batch 0303/0508, train loss = 0.8489333391189575
Epoch 007/010, valid ppl = 283.40933614803555, batch 0304/0508, train loss = 1.1016871929168701
Epoch 007/010, valid ppl = 283.40933614803555, batch 0305/0508, train loss = 2.660069704055786
Epoch 007/010, valid ppl = 283.40933614803555, batch 0306/0508, train loss = 1.105026125907898
Epoch 007/010, valid ppl = 283.40933614803555, batch 0307/0508, train loss = 1.4095455408096313
Epoch 007/010, valid ppl = 283.40933614803555, batch 0308/0508, train loss = 1.6797548532485962
Epoch 007/010, valid ppl = 283.40933614803555, batch 0309/0508, train loss = 1.3577865362167358
Epoch 007/010, valid ppl = 283.40933614803555, batch 0310/0508, train loss = 0.8710077404975891
Epoch 007/010, valid ppl = 283.40933614803555, batch 0311/0508, train loss = 1.1521813869476318
Epoch 007/010, valid ppl = 283.40933614803555, batch 0312/0508, train loss = 1.7223962545394897
Epoch 007/010, valid ppl = 283.40933614803

Epoch 007/010, valid ppl = 283.40933614803555, batch 0389/0508, train loss = 1.035811185836792
Epoch 007/010, valid ppl = 283.40933614803555, batch 0390/0508, train loss = 1.5554190874099731
Epoch 007/010, valid ppl = 283.40933614803555, batch 0391/0508, train loss = 1.8230377435684204
Epoch 007/010, valid ppl = 283.40933614803555, batch 0392/0508, train loss = 1.9195351600646973
Epoch 007/010, valid ppl = 283.40933614803555, batch 0393/0508, train loss = 1.1673338413238525
Epoch 007/010, valid ppl = 283.40933614803555, batch 0394/0508, train loss = 0.695097804069519
Epoch 007/010, valid ppl = 283.40933614803555, batch 0395/0508, train loss = 1.77609384059906
Epoch 007/010, valid ppl = 283.40933614803555, batch 0396/0508, train loss = 0.9394238591194153
Epoch 007/010, valid ppl = 283.40933614803555, batch 0397/0508, train loss = 1.9942436218261719
Epoch 007/010, valid ppl = 283.40933614803555, batch 0398/0508, train loss = 2.4727468490600586
Epoch 007/010, valid ppl = 283.4093361480355

Epoch 007/010, valid ppl = 283.40933614803555, batch 0475/0508, train loss = 1.7716203927993774
Epoch 007/010, valid ppl = 283.40933614803555, batch 0476/0508, train loss = 1.6759707927703857
Epoch 007/010, valid ppl = 283.40933614803555, batch 0477/0508, train loss = 1.4924345016479492
Epoch 007/010, valid ppl = 283.40933614803555, batch 0478/0508, train loss = 1.6906070709228516
Epoch 007/010, valid ppl = 283.40933614803555, batch 0479/0508, train loss = 1.8460718393325806
Epoch 007/010, valid ppl = 283.40933614803555, batch 0480/0508, train loss = 1.2893099784851074
Epoch 007/010, valid ppl = 283.40933614803555, batch 0481/0508, train loss = 1.751792073249817
Epoch 007/010, valid ppl = 283.40933614803555, batch 0482/0508, train loss = 1.5401638746261597
Epoch 007/010, valid ppl = 283.40933614803555, batch 0483/0508, train loss = 0.982731819152832
Epoch 007/010, valid ppl = 283.40933614803555, batch 0484/0508, train loss = 1.8786112070083618
Epoch 007/010, valid ppl = 283.40933614803

Epoch 008/010, valid ppl = 378.08178038121724, batch 0052/0508, train loss = 1.7222436666488647
Epoch 008/010, valid ppl = 378.08178038121724, batch 0053/0508, train loss = 1.1469268798828125
Epoch 008/010, valid ppl = 378.08178038121724, batch 0054/0508, train loss = 0.5727978944778442
Epoch 008/010, valid ppl = 378.08178038121724, batch 0055/0508, train loss = 0.8788873553276062
Epoch 008/010, valid ppl = 378.08178038121724, batch 0056/0508, train loss = 0.9305581450462341
Epoch 008/010, valid ppl = 378.08178038121724, batch 0057/0508, train loss = 1.0508460998535156
Epoch 008/010, valid ppl = 378.08178038121724, batch 0058/0508, train loss = 1.1239111423492432
Epoch 008/010, valid ppl = 378.08178038121724, batch 0059/0508, train loss = 0.6597349643707275
Epoch 008/010, valid ppl = 378.08178038121724, batch 0060/0508, train loss = 0.8246777057647705
Epoch 008/010, valid ppl = 378.08178038121724, batch 0061/0508, train loss = 0.6853170990943909
Epoch 008/010, valid ppl = 378.081780381

Epoch 008/010, valid ppl = 378.08178038121724, batch 0138/0508, train loss = 1.057574987411499
Epoch 008/010, valid ppl = 378.08178038121724, batch 0139/0508, train loss = 1.3401590585708618
Epoch 008/010, valid ppl = 378.08178038121724, batch 0140/0508, train loss = 0.7692580223083496
Epoch 008/010, valid ppl = 378.08178038121724, batch 0141/0508, train loss = 0.8257307410240173
Epoch 008/010, valid ppl = 378.08178038121724, batch 0142/0508, train loss = 1.3892614841461182
Epoch 008/010, valid ppl = 378.08178038121724, batch 0143/0508, train loss = 0.9668592810630798
Epoch 008/010, valid ppl = 378.08178038121724, batch 0144/0508, train loss = 1.059254765510559
Epoch 008/010, valid ppl = 378.08178038121724, batch 0145/0508, train loss = 0.560032308101654
Epoch 008/010, valid ppl = 378.08178038121724, batch 0146/0508, train loss = 0.6733506321907043
Epoch 008/010, valid ppl = 378.08178038121724, batch 0147/0508, train loss = 0.9121650457382202
Epoch 008/010, valid ppl = 378.081780381217

Epoch 008/010, valid ppl = 378.08178038121724, batch 0224/0508, train loss = 1.2845691442489624
Epoch 008/010, valid ppl = 378.08178038121724, batch 0225/0508, train loss = 0.9332243800163269
Epoch 008/010, valid ppl = 378.08178038121724, batch 0226/0508, train loss = 0.9015741944313049
Epoch 008/010, valid ppl = 378.08178038121724, batch 0227/0508, train loss = 1.027576208114624
Epoch 008/010, valid ppl = 378.08178038121724, batch 0228/0508, train loss = 1.0105684995651245
Epoch 008/010, valid ppl = 378.08178038121724, batch 0229/0508, train loss = 0.6310265064239502
Epoch 008/010, valid ppl = 378.08178038121724, batch 0230/0508, train loss = 0.7708536982536316
Epoch 008/010, valid ppl = 378.08178038121724, batch 0231/0508, train loss = 1.1941862106323242
Epoch 008/010, valid ppl = 378.08178038121724, batch 0232/0508, train loss = 0.9075246453285217
Epoch 008/010, valid ppl = 378.08178038121724, batch 0233/0508, train loss = 0.9293981194496155
Epoch 008/010, valid ppl = 378.0817803812

Epoch 008/010, valid ppl = 378.08178038121724, batch 0310/0508, train loss = 1.3800276517868042
Epoch 008/010, valid ppl = 378.08178038121724, batch 0311/0508, train loss = 1.135654330253601
Epoch 008/010, valid ppl = 378.08178038121724, batch 0312/0508, train loss = 1.2417446374893188
Epoch 008/010, valid ppl = 378.08178038121724, batch 0313/0508, train loss = 1.4814870357513428
Epoch 008/010, valid ppl = 378.08178038121724, batch 0314/0508, train loss = 0.8313164114952087
Epoch 008/010, valid ppl = 378.08178038121724, batch 0315/0508, train loss = 1.5157583951950073
Epoch 008/010, valid ppl = 378.08178038121724, batch 0316/0508, train loss = 1.410710334777832
Epoch 008/010, valid ppl = 378.08178038121724, batch 0317/0508, train loss = 0.9368212223052979
Epoch 008/010, valid ppl = 378.08178038121724, batch 0318/0508, train loss = 1.0845465660095215
Epoch 008/010, valid ppl = 378.08178038121724, batch 0319/0508, train loss = 1.4983575344085693
Epoch 008/010, valid ppl = 378.08178038121

Epoch 008/010, valid ppl = 378.08178038121724, batch 0396/0508, train loss = 1.0305744409561157
Epoch 008/010, valid ppl = 378.08178038121724, batch 0397/0508, train loss = 1.337934136390686
Epoch 008/010, valid ppl = 378.08178038121724, batch 0398/0508, train loss = 0.5158294439315796
Epoch 008/010, valid ppl = 378.08178038121724, batch 0399/0508, train loss = 0.782346785068512
Epoch 008/010, valid ppl = 378.08178038121724, batch 0400/0508, train loss = 0.617784857749939
Epoch 008/010, valid ppl = 378.08178038121724, batch 0401/0508, train loss = 1.3535374402999878
Epoch 008/010, valid ppl = 378.08178038121724, batch 0402/0508, train loss = 0.6287065148353577
Epoch 008/010, valid ppl = 378.08178038121724, batch 0403/0508, train loss = 0.970228374004364
Epoch 008/010, valid ppl = 378.08178038121724, batch 0404/0508, train loss = 0.911562979221344
Epoch 008/010, valid ppl = 378.08178038121724, batch 0405/0508, train loss = 1.2673898935317993
Epoch 008/010, valid ppl = 378.08178038121724

Epoch 008/010, valid ppl = 378.08178038121724, batch 0482/0508, train loss = 0.8143103718757629
Epoch 008/010, valid ppl = 378.08178038121724, batch 0483/0508, train loss = 1.5674914121627808
Epoch 008/010, valid ppl = 378.08178038121724, batch 0484/0508, train loss = 0.8116915822029114
Epoch 008/010, valid ppl = 378.08178038121724, batch 0485/0508, train loss = 0.8291728496551514
Epoch 008/010, valid ppl = 378.08178038121724, batch 0486/0508, train loss = 0.8568981289863586
Epoch 008/010, valid ppl = 378.08178038121724, batch 0487/0508, train loss = 1.0174006223678589
Epoch 008/010, valid ppl = 378.08178038121724, batch 0488/0508, train loss = 1.3084909915924072
Epoch 008/010, valid ppl = 378.08178038121724, batch 0489/0508, train loss = 1.21364426612854
Epoch 008/010, valid ppl = 378.08178038121724, batch 0490/0508, train loss = 1.2776317596435547
Epoch 008/010, valid ppl = 378.08178038121724, batch 0491/0508, train loss = 1.4093767404556274
Epoch 008/010, valid ppl = 378.08178038121

Epoch 009/010, valid ppl = 477.33696172310346, batch 0059/0508, train loss = 0.8331725597381592
Epoch 009/010, valid ppl = 477.33696172310346, batch 0060/0508, train loss = 1.0612684488296509
Epoch 009/010, valid ppl = 477.33696172310346, batch 0061/0508, train loss = 0.5108868479728699
Epoch 009/010, valid ppl = 477.33696172310346, batch 0062/0508, train loss = 1.0383327007293701
Epoch 009/010, valid ppl = 477.33696172310346, batch 0063/0508, train loss = 0.6281194090843201
Epoch 009/010, valid ppl = 477.33696172310346, batch 0064/0508, train loss = 0.5545971989631653
Epoch 009/010, valid ppl = 477.33696172310346, batch 0065/0508, train loss = 0.5542466640472412
Epoch 009/010, valid ppl = 477.33696172310346, batch 0066/0508, train loss = 0.7047017812728882
Epoch 009/010, valid ppl = 477.33696172310346, batch 0067/0508, train loss = 0.6473069190979004
Epoch 009/010, valid ppl = 477.33696172310346, batch 0068/0508, train loss = 1.146588683128357
Epoch 009/010, valid ppl = 477.3369617231

Epoch 009/010, valid ppl = 477.33696172310346, batch 0145/0508, train loss = 0.4096882939338684
Epoch 009/010, valid ppl = 477.33696172310346, batch 0146/0508, train loss = 0.2792522609233856
Epoch 009/010, valid ppl = 477.33696172310346, batch 0147/0508, train loss = 0.7881758213043213
Epoch 009/010, valid ppl = 477.33696172310346, batch 0148/0508, train loss = 0.12797756493091583
Epoch 009/010, valid ppl = 477.33696172310346, batch 0149/0508, train loss = 0.42747560143470764
Epoch 009/010, valid ppl = 477.33696172310346, batch 0150/0508, train loss = 0.18713736534118652
Epoch 009/010, valid ppl = 477.33696172310346, batch 0151/0508, train loss = 0.5856350064277649
Epoch 009/010, valid ppl = 477.33696172310346, batch 0152/0508, train loss = 0.7126789689064026
Epoch 009/010, valid ppl = 477.33696172310346, batch 0153/0508, train loss = 1.0401287078857422
Epoch 009/010, valid ppl = 477.33696172310346, batch 0154/0508, train loss = 0.3715522885322571
Epoch 009/010, valid ppl = 477.336961

Epoch 009/010, valid ppl = 477.33696172310346, batch 0231/0508, train loss = 1.0509425401687622
Epoch 009/010, valid ppl = 477.33696172310346, batch 0232/0508, train loss = 0.6289296746253967
Epoch 009/010, valid ppl = 477.33696172310346, batch 0233/0508, train loss = 0.8527002930641174
Epoch 009/010, valid ppl = 477.33696172310346, batch 0234/0508, train loss = 1.0196274518966675
Epoch 009/010, valid ppl = 477.33696172310346, batch 0235/0508, train loss = 0.5034000873565674
Epoch 009/010, valid ppl = 477.33696172310346, batch 0236/0508, train loss = 0.7592297196388245
Epoch 009/010, valid ppl = 477.33696172310346, batch 0237/0508, train loss = 0.38118571043014526
Epoch 009/010, valid ppl = 477.33696172310346, batch 0238/0508, train loss = 0.46716681122779846
Epoch 009/010, valid ppl = 477.33696172310346, batch 0239/0508, train loss = 0.2379617542028427
Epoch 009/010, valid ppl = 477.33696172310346, batch 0240/0508, train loss = 0.5071734189987183
Epoch 009/010, valid ppl = 477.3369617

Epoch 009/010, valid ppl = 477.33696172310346, batch 0317/0508, train loss = 0.955003559589386
Epoch 009/010, valid ppl = 477.33696172310346, batch 0318/0508, train loss = 0.22026105225086212
Epoch 009/010, valid ppl = 477.33696172310346, batch 0319/0508, train loss = 0.3624769449234009
Epoch 009/010, valid ppl = 477.33696172310346, batch 0320/0508, train loss = 0.4236501157283783
Epoch 009/010, valid ppl = 477.33696172310346, batch 0321/0508, train loss = 0.5743915438652039
Epoch 009/010, valid ppl = 477.33696172310346, batch 0322/0508, train loss = 0.7497663497924805
Epoch 009/010, valid ppl = 477.33696172310346, batch 0323/0508, train loss = 0.1027570441365242
Epoch 009/010, valid ppl = 477.33696172310346, batch 0324/0508, train loss = 0.7674386501312256
Epoch 009/010, valid ppl = 477.33696172310346, batch 0325/0508, train loss = 0.8983690142631531
Epoch 009/010, valid ppl = 477.33696172310346, batch 0326/0508, train loss = 0.9056230187416077
Epoch 009/010, valid ppl = 477.336961723

Epoch 009/010, valid ppl = 477.33696172310346, batch 0403/0508, train loss = 0.555791437625885
Epoch 009/010, valid ppl = 477.33696172310346, batch 0404/0508, train loss = 0.3895557224750519
Epoch 009/010, valid ppl = 477.33696172310346, batch 0405/0508, train loss = 0.48300978541374207
Epoch 009/010, valid ppl = 477.33696172310346, batch 0406/0508, train loss = 1.2328858375549316
Epoch 009/010, valid ppl = 477.33696172310346, batch 0407/0508, train loss = 0.8797696232795715
Epoch 009/010, valid ppl = 477.33696172310346, batch 0408/0508, train loss = 0.8539977073669434
Epoch 009/010, valid ppl = 477.33696172310346, batch 0409/0508, train loss = 0.5979912281036377
Epoch 009/010, valid ppl = 477.33696172310346, batch 0410/0508, train loss = 0.8561280369758606
Epoch 009/010, valid ppl = 477.33696172310346, batch 0411/0508, train loss = 0.6751746535301208
Epoch 009/010, valid ppl = 477.33696172310346, batch 0412/0508, train loss = 0.6981971859931946
Epoch 009/010, valid ppl = 477.336961723

Epoch 009/010, valid ppl = 477.33696172310346, batch 0489/0508, train loss = 0.9425304532051086
Epoch 009/010, valid ppl = 477.33696172310346, batch 0490/0508, train loss = 0.4932217001914978
Epoch 009/010, valid ppl = 477.33696172310346, batch 0491/0508, train loss = 1.2670663595199585
Epoch 009/010, valid ppl = 477.33696172310346, batch 0492/0508, train loss = 0.44591596722602844
Epoch 009/010, valid ppl = 477.33696172310346, batch 0493/0508, train loss = 1.087699055671692
Epoch 009/010, valid ppl = 477.33696172310346, batch 0494/0508, train loss = 0.7341375946998596
Epoch 009/010, valid ppl = 477.33696172310346, batch 0495/0508, train loss = 0.8907814025878906
Epoch 009/010, valid ppl = 477.33696172310346, batch 0496/0508, train loss = 0.46206140518188477
Epoch 009/010, valid ppl = 477.33696172310346, batch 0497/0508, train loss = 0.927956223487854
Epoch 009/010, valid ppl = 477.33696172310346, batch 0498/0508, train loss = 0.8522728085517883
Epoch 009/010, valid ppl = 477.336961723

Epoch 010/010, valid ppl = 638.2196538599143, batch 0066/0508, train loss = 0.6375149488449097
Epoch 010/010, valid ppl = 638.2196538599143, batch 0067/0508, train loss = 0.5207785367965698
Epoch 010/010, valid ppl = 638.2196538599143, batch 0068/0508, train loss = 0.40505504608154297
Epoch 010/010, valid ppl = 638.2196538599143, batch 0069/0508, train loss = 0.35984739661216736
Epoch 010/010, valid ppl = 638.2196538599143, batch 0070/0508, train loss = 0.3999609053134918
Epoch 010/010, valid ppl = 638.2196538599143, batch 0071/0508, train loss = 0.2822491526603699
Epoch 010/010, valid ppl = 638.2196538599143, batch 0072/0508, train loss = 0.5700160264968872
Epoch 010/010, valid ppl = 638.2196538599143, batch 0073/0508, train loss = 0.4318106770515442
Epoch 010/010, valid ppl = 638.2196538599143, batch 0074/0508, train loss = 0.4614265263080597
Epoch 010/010, valid ppl = 638.2196538599143, batch 0075/0508, train loss = 0.3030475974082947
Epoch 010/010, valid ppl = 638.2196538599143, ba

Epoch 010/010, valid ppl = 638.2196538599143, batch 0153/0508, train loss = 0.6562248468399048
Epoch 010/010, valid ppl = 638.2196538599143, batch 0154/0508, train loss = 0.1974707692861557
Epoch 010/010, valid ppl = 638.2196538599143, batch 0155/0508, train loss = 0.3676471710205078
Epoch 010/010, valid ppl = 638.2196538599143, batch 0156/0508, train loss = 0.2828691601753235
Epoch 010/010, valid ppl = 638.2196538599143, batch 0157/0508, train loss = 0.3351576030254364
Epoch 010/010, valid ppl = 638.2196538599143, batch 0158/0508, train loss = 0.6287676692008972
Epoch 010/010, valid ppl = 638.2196538599143, batch 0159/0508, train loss = 0.27087610960006714
Epoch 010/010, valid ppl = 638.2196538599143, batch 0160/0508, train loss = 0.5419405698776245
Epoch 010/010, valid ppl = 638.2196538599143, batch 0161/0508, train loss = 0.7264087796211243
Epoch 010/010, valid ppl = 638.2196538599143, batch 0162/0508, train loss = 0.43770021200180054
Epoch 010/010, valid ppl = 638.2196538599143, ba

Epoch 010/010, valid ppl = 638.2196538599143, batch 0240/0508, train loss = 0.5954276323318481
Epoch 010/010, valid ppl = 638.2196538599143, batch 0241/0508, train loss = 0.4871475398540497
Epoch 010/010, valid ppl = 638.2196538599143, batch 0242/0508, train loss = 0.8544524908065796
Epoch 010/010, valid ppl = 638.2196538599143, batch 0243/0508, train loss = 0.3698592782020569
Epoch 010/010, valid ppl = 638.2196538599143, batch 0244/0508, train loss = 0.2168380320072174
Epoch 010/010, valid ppl = 638.2196538599143, batch 0245/0508, train loss = 0.23821422457695007
Epoch 010/010, valid ppl = 638.2196538599143, batch 0246/0508, train loss = 0.4200102686882019
Epoch 010/010, valid ppl = 638.2196538599143, batch 0247/0508, train loss = 0.4900507628917694
Epoch 010/010, valid ppl = 638.2196538599143, batch 0248/0508, train loss = 0.606079638004303
Epoch 010/010, valid ppl = 638.2196538599143, batch 0249/0508, train loss = 0.41456931829452515
Epoch 010/010, valid ppl = 638.2196538599143, bat

Epoch 010/010, valid ppl = 638.2196538599143, batch 0327/0508, train loss = 0.255890429019928
Epoch 010/010, valid ppl = 638.2196538599143, batch 0328/0508, train loss = 0.5624951124191284
Epoch 010/010, valid ppl = 638.2196538599143, batch 0329/0508, train loss = 0.32968488335609436
Epoch 010/010, valid ppl = 638.2196538599143, batch 0330/0508, train loss = 0.7348499894142151
Epoch 010/010, valid ppl = 638.2196538599143, batch 0331/0508, train loss = 0.5193235278129578
Epoch 010/010, valid ppl = 638.2196538599143, batch 0332/0508, train loss = 0.5973396301269531
Epoch 010/010, valid ppl = 638.2196538599143, batch 0333/0508, train loss = 0.30606335401535034
Epoch 010/010, valid ppl = 638.2196538599143, batch 0334/0508, train loss = 0.16250935196876526
Epoch 010/010, valid ppl = 638.2196538599143, batch 0335/0508, train loss = 0.596186101436615
Epoch 010/010, valid ppl = 638.2196538599143, batch 0336/0508, train loss = 0.5858466029167175
Epoch 010/010, valid ppl = 638.2196538599143, bat

Epoch 010/010, valid ppl = 638.2196538599143, batch 0414/0508, train loss = 0.4652198255062103
Epoch 010/010, valid ppl = 638.2196538599143, batch 0415/0508, train loss = 0.7774840593338013
Epoch 010/010, valid ppl = 638.2196538599143, batch 0416/0508, train loss = 0.6502383947372437
Epoch 010/010, valid ppl = 638.2196538599143, batch 0417/0508, train loss = 0.4922370910644531
Epoch 010/010, valid ppl = 638.2196538599143, batch 0418/0508, train loss = 0.8284174203872681
Epoch 010/010, valid ppl = 638.2196538599143, batch 0419/0508, train loss = 0.36350584030151367
Epoch 010/010, valid ppl = 638.2196538599143, batch 0420/0508, train loss = 0.5290470719337463
Epoch 010/010, valid ppl = 638.2196538599143, batch 0421/0508, train loss = 1.3254088163375854
Epoch 010/010, valid ppl = 638.2196538599143, batch 0422/0508, train loss = 0.4642428755760193
Epoch 010/010, valid ppl = 638.2196538599143, batch 0423/0508, train loss = 0.5373047590255737
Epoch 010/010, valid ppl = 638.2196538599143, bat

Epoch 010/010, valid ppl = 638.2196538599143, batch 0501/0508, train loss = 0.029726823791861534
Epoch 010/010, valid ppl = 638.2196538599143, batch 0502/0508, train loss = 0.5395171642303467
Epoch 010/010, valid ppl = 638.2196538599143, batch 0503/0508, train loss = 0.46807530522346497
Epoch 010/010, valid ppl = 638.2196538599143, batch 0504/0508, train loss = 0.8016194105148315
Epoch 010/010, valid ppl = 638.2196538599143, batch 0505/0508, train loss = 0.5074193477630615
Epoch 010/010, valid ppl = 638.2196538599143, batch 0506/0508, train loss = 0.5261082649230957
Epoch 010/010, valid ppl = 638.2196538599143, batch 0507/0508, train loss = 0.7749949097633362
Epoch 010/010, valid ppl = 638.2196538599143, batch 0508/0508, train loss = 0.4285781681537628
Saving the trained model to ./model_dailydialog_rf/model_epoch_010.ckpt...
Epoch 001, valid ppl = 120.63403990420883
Epoch 002, valid ppl = 118.79532458312138
Epoch 003, valid ppl = 146.13936505096146
Epoch 004, valid ppl = 164.353736489