# Import all the required libraries

In [4]:
import logging

import torch
from train import train_model

from model_classifier import QAClassifierModel
from model import QAModel
from preprocess import SquadPreprocessor, SquadPlausibleAnswersPreprocessor
import inspect
%load_ext autoreload
%autoreload 2

torch.__version__

The autoreload extension is already loaded. To reload it, use:
  %reload_ext autoreload


'1.6.0'

# Check for GPU availability

In [7]:
# Report whether CUDA is usable from this process and how many devices torch
# can see; the message text is kept exactly as before.
print(
    "Is GPU Available: {} \nNo. of GPU's availble: {}".format(
        torch.cuda.is_available(),
        torch.cuda.device_count(),
    )
)

Is GPU Available: True 
No. of GPU's availble: 1


# Set the level of logging required

In [9]:
import os
# Force synchronous CUDA kernel launches so that a failing kernel is reported
# at the call that triggered it rather than at some later, unrelated call.
# NOTE(review): presumably this has to be set before CUDA is first initialised
# in the process to take effect - confirm the cell execution order.
os.environ.update({'CUDA_LAUNCH_BLOCKING': '1'})

In [11]:
# Configure the root logger so that records of level INFO and above are
# emitted. basicConfig does nothing when the root logger already has handlers.
logging.basicConfig(level="INFO")

# Train the model

In [8]:
# Launch training of QAModel using the plausible-answers preprocessor.
# NOTE(review): the meaning of each keyword is defined in train.train_model,
# which is not visible here; the remarks below are assumptions to confirm.
train_model(
    preprocessor=SquadPlausibleAnswersPreprocessor,
    base_model=QAModel,
    frac_val_data=1.0,    # presumably the fraction of validation data to use
    frac_train_data=1.0,  # presumably the fraction of training data to use
    save_model_prefix="plausible",  # presumably the checkpoint filename prefix
    save_every=5000,      # presumably the checkpoint interval in iterations
    batch_size=8,
    n_epoch=15,
)

INFO:root:Including plausible answers: True
INFO:root:Including plausible answers: True
INFO:root:Number of impossible questions, train: 43498, val: 5930
INFO:root:Using device: cuda
  return {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}


Train: Epoch: 1, iter: 1, avg. loss: 6.27
Train: Epoch: 1, iter: 2, avg. loss: 6.34
Train: Epoch: 1, iter: 3, avg. loss: 6.16
Train: Epoch: 1, iter: 4, avg. loss: 6.12
Train: Epoch: 1, iter: 5, avg. loss: 5.96
Train: Epoch: 1, iter: 6, avg. loss: 5.87
Train: Epoch: 1, iter: 7, avg. loss: 5.73
Train: Epoch: 1, iter: 8, avg. loss: 5.65
Train: Epoch: 1, iter: 9, avg. loss: 5.54
Train: Epoch: 1, iter: 10, avg. loss: 5.37

Eval: Epoch: 1, iter: 10, avg. loss: 5.15

Train: Epoch: 1, iter: 11, avg. loss: 4.91
Train: Epoch: 1, iter: 12, avg. loss: 4.93
Train: Epoch: 1, iter: 13, avg. loss: 4.83
Train: Epoch: 1, iter: 14, avg. loss: 5.19
Train: Epoch: 1, iter: 15, avg. loss: 4.59
Train: Epoch: 1, iter: 16, avg. loss: 4.59
Train: Epoch: 1, iter: 17, avg. loss: 4.44
Train: Epoch: 1, iter: 18, avg. loss: 4.57
Train: Epoch: 1, iter: 19, avg. loss: 4.76
Train: Epoch: 1, iter: 20, avg. loss: 4.11

Eval: Epoch: 1, iter: 20, avg. loss: 4.59

Train: Epoch: 1, iter: 21, avg. loss: 4.13
Train: Epoch: 1, i

INFO:root:Saving checkpoint model to model_checkpoint/plausible_model_5000.pt



Eval: Epoch: 1, iter: 5000, avg. loss: 1.46

Train: Epoch: 1, iter: 5001, avg. loss: 1.65
Train: Epoch: 1, iter: 5002, avg. loss: 1.47
Train: Epoch: 1, iter: 5003, avg. loss: 0.91
Train: Epoch: 1, iter: 5004, avg. loss: 0.85
Train: Epoch: 1, iter: 5005, avg. loss: 1.89
Train: Epoch: 1, iter: 5006, avg. loss: 1.74
Train: Epoch: 1, iter: 5007, avg. loss: 1.14
Train: Epoch: 1, iter: 5008, avg. loss: 1.44
Train: Epoch: 1, iter: 5009, avg. loss: 1.54
Train: Epoch: 1, iter: 5010, avg. loss: 1.66

Eval: Epoch: 1, iter: 5010, avg. loss: 1.29

Train: Epoch: 1, iter: 5011, avg. loss: 1.78
Train: Epoch: 1, iter: 5012, avg. loss: 1.28
Train: Epoch: 1, iter: 5013, avg. loss: 1.18
Train: Epoch: 1, iter: 5014, avg. loss: 1.99
Train: Epoch: 1, iter: 5015, avg. loss: 0.88
Train: Epoch: 1, iter: 5016, avg. loss: 2.22
Train: Epoch: 1, iter: 5017, avg. loss: 0.68
Train: Epoch: 1, iter: 5018, avg. loss: 1.68
Train: Epoch: 1, iter: 5019, avg. loss: 1.58
Train: Epoch: 1, iter: 5020, avg. loss: 1.18

Eval: E

INFO:root:Saving checkpoint model to model_checkpoint/plausible_model_10000.pt



Eval: Epoch: 1, iter: 10000, avg. loss: 1.46

Train: Epoch: 1, iter: 10001, avg. loss: 2.45
Train: Epoch: 1, iter: 10002, avg. loss: 1.58
Train: Epoch: 1, iter: 10003, avg. loss: 1.40
Train: Epoch: 1, iter: 10004, avg. loss: 0.75
Train: Epoch: 1, iter: 10005, avg. loss: 2.36
Train: Epoch: 1, iter: 10006, avg. loss: 1.89
Train: Epoch: 1, iter: 10007, avg. loss: 2.11
Train: Epoch: 1, iter: 10008, avg. loss: 1.01
Train: Epoch: 1, iter: 10009, avg. loss: 1.33
Train: Epoch: 1, iter: 10010, avg. loss: 0.67

Eval: Epoch: 1, iter: 10010, avg. loss: 1.61

Train: Epoch: 1, iter: 10011, avg. loss: 0.81
Train: Epoch: 1, iter: 10012, avg. loss: 0.65
Train: Epoch: 1, iter: 10013, avg. loss: 1.68
Train: Epoch: 1, iter: 10014, avg. loss: 1.93
Train: Epoch: 1, iter: 10015, avg. loss: 1.59
Train: Epoch: 1, iter: 10016, avg. loss: 0.11
Train: Epoch: 1, iter: 10017, avg. loss: 0.83
Train: Epoch: 1, iter: 10018, avg. loss: 2.05
Train: Epoch: 1, iter: 10019, avg. loss: 1.90
Train: Epoch: 1, iter: 10020, av

INFO:root:Saving checkpoint model to model_checkpoint/plausible_model_15000.pt



Eval: Epoch: 1, iter: 15000, avg. loss: 1.64

Train: Epoch: 1, iter: 15001, avg. loss: 1.80
Train: Epoch: 1, iter: 15002, avg. loss: 1.41
Train: Epoch: 1, iter: 15003, avg. loss: 1.80
Train: Epoch: 1, iter: 15004, avg. loss: 0.79
Train: Epoch: 1, iter: 15005, avg. loss: 1.23
Train: Epoch: 1, iter: 15006, avg. loss: 2.17
Train: Epoch: 1, iter: 15007, avg. loss: 0.86
Train: Epoch: 1, iter: 15008, avg. loss: 0.98
Train: Epoch: 1, iter: 15009, avg. loss: 1.16
Train: Epoch: 1, iter: 15010, avg. loss: 1.54

Eval: Epoch: 1, iter: 15010, avg. loss: 1.05

Train: Epoch: 1, iter: 15011, avg. loss: 1.68
Train: Epoch: 1, iter: 15012, avg. loss: 1.13
Train: Epoch: 1, iter: 15013, avg. loss: 1.88
Train: Epoch: 1, iter: 15014, avg. loss: 1.05
Train: Epoch: 1, iter: 15015, avg. loss: 1.34
Train: Epoch: 1, iter: 15016, avg. loss: 1.94
Train: Epoch: 1, iter: 15017, avg. loss: 1.71
Train: Epoch: 1, iter: 15018, avg. loss: 1.15
Train: Epoch: 1, iter: 15019, avg. loss: 1.55
Train: Epoch: 1, iter: 15020, av

INFO:root:Saving checkpoint model to model_checkpoint/plausible_model_20000.pt



Eval: Epoch: 2, iter: 20000, avg. loss: 1.27

Train: Epoch: 2, iter: 20001, avg. loss: 1.44
Train: Epoch: 2, iter: 20002, avg. loss: 1.07
Train: Epoch: 2, iter: 20003, avg. loss: 0.49
Train: Epoch: 2, iter: 20004, avg. loss: 0.86
Train: Epoch: 2, iter: 20005, avg. loss: 0.94
Train: Epoch: 2, iter: 20006, avg. loss: 1.60
Train: Epoch: 2, iter: 20007, avg. loss: 0.96
Train: Epoch: 2, iter: 20008, avg. loss: 1.23
Train: Epoch: 2, iter: 20009, avg. loss: 1.24
Train: Epoch: 2, iter: 20010, avg. loss: 0.80

Eval: Epoch: 2, iter: 20010, avg. loss: 1.49

Train: Epoch: 2, iter: 20011, avg. loss: 1.28
Train: Epoch: 2, iter: 20012, avg. loss: 1.36
Train: Epoch: 2, iter: 20013, avg. loss: 1.05
Train: Epoch: 2, iter: 20014, avg. loss: 1.21
Train: Epoch: 2, iter: 20015, avg. loss: 0.74
Train: Epoch: 2, iter: 20016, avg. loss: 1.15
Train: Epoch: 2, iter: 20017, avg. loss: 1.28
Train: Epoch: 2, iter: 20018, avg. loss: 1.00
Train: Epoch: 2, iter: 20019, avg. loss: 2.13
Train: Epoch: 2, iter: 20020, av

INFO:root:Saving checkpoint model to model_checkpoint/plausible_model_25000.pt



Eval: Epoch: 2, iter: 25000, avg. loss: 1.59

Train: Epoch: 2, iter: 25001, avg. loss: 0.95
Train: Epoch: 2, iter: 25002, avg. loss: 0.43
Train: Epoch: 2, iter: 25003, avg. loss: 0.43
Train: Epoch: 2, iter: 25004, avg. loss: 0.84
Train: Epoch: 2, iter: 25005, avg. loss: 1.67
Train: Epoch: 2, iter: 25006, avg. loss: 2.40
Train: Epoch: 2, iter: 25007, avg. loss: 0.66
Train: Epoch: 2, iter: 25008, avg. loss: 0.67
Train: Epoch: 2, iter: 25009, avg. loss: 0.95
Train: Epoch: 2, iter: 25010, avg. loss: 1.72

Eval: Epoch: 2, iter: 25010, avg. loss: 1.45

Train: Epoch: 2, iter: 25011, avg. loss: 0.94
Train: Epoch: 2, iter: 25012, avg. loss: 1.28
Train: Epoch: 2, iter: 25013, avg. loss: 0.91
Train: Epoch: 2, iter: 25014, avg. loss: 1.51
Train: Epoch: 2, iter: 25015, avg. loss: 0.55
Train: Epoch: 2, iter: 25016, avg. loss: 0.57
Train: Epoch: 2, iter: 25017, avg. loss: 0.69
Train: Epoch: 2, iter: 25018, avg. loss: 1.16
Train: Epoch: 2, iter: 25019, avg. loss: 0.62
Train: Epoch: 2, iter: 25020, av

INFO:root:Saving checkpoint model to model_checkpoint/plausible_model_30000.pt



Eval: Epoch: 2, iter: 30000, avg. loss: 1.54

Train: Epoch: 2, iter: 30001, avg. loss: 0.95
Train: Epoch: 2, iter: 30002, avg. loss: 1.71
Train: Epoch: 2, iter: 30003, avg. loss: 0.84
Train: Epoch: 2, iter: 30004, avg. loss: 1.22
Train: Epoch: 2, iter: 30005, avg. loss: 0.56
Train: Epoch: 2, iter: 30006, avg. loss: 1.03
Train: Epoch: 2, iter: 30007, avg. loss: 0.79
Train: Epoch: 2, iter: 30008, avg. loss: 2.38
Train: Epoch: 2, iter: 30009, avg. loss: 1.02
Train: Epoch: 2, iter: 30010, avg. loss: 0.68

Eval: Epoch: 2, iter: 30010, avg. loss: 1.64

Train: Epoch: 2, iter: 30011, avg. loss: 1.14
Train: Epoch: 2, iter: 30012, avg. loss: 0.54
Train: Epoch: 2, iter: 30013, avg. loss: 0.98
Train: Epoch: 2, iter: 30014, avg. loss: 1.02
Train: Epoch: 2, iter: 30015, avg. loss: 0.96
Train: Epoch: 2, iter: 30016, avg. loss: 1.13
Train: Epoch: 2, iter: 30017, avg. loss: 1.87
Train: Epoch: 2, iter: 30018, avg. loss: 1.10
Train: Epoch: 2, iter: 30019, avg. loss: 0.98
Train: Epoch: 2, iter: 30020, av

INFO:root:Saving checkpoint model to model_checkpoint/plausible_model_35000.pt



Eval: Epoch: 3, iter: 35000, avg. loss: 1.75

Train: Epoch: 3, iter: 35001, avg. loss: 0.76
Train: Epoch: 3, iter: 35002, avg. loss: 0.64
Train: Epoch: 3, iter: 35003, avg. loss: 0.53
Train: Epoch: 3, iter: 35004, avg. loss: 1.95
Train: Epoch: 3, iter: 35005, avg. loss: 1.22
Train: Epoch: 3, iter: 35006, avg. loss: 0.42
Train: Epoch: 3, iter: 35007, avg. loss: 0.73
Train: Epoch: 3, iter: 35008, avg. loss: 1.12
Train: Epoch: 3, iter: 35009, avg. loss: 0.34
Train: Epoch: 3, iter: 35010, avg. loss: 0.81

Eval: Epoch: 3, iter: 35010, avg. loss: 1.43

Train: Epoch: 3, iter: 35011, avg. loss: 0.22
Train: Epoch: 3, iter: 35012, avg. loss: 0.49
Train: Epoch: 3, iter: 35013, avg. loss: 0.78
Train: Epoch: 3, iter: 35014, avg. loss: 0.33
Train: Epoch: 3, iter: 35015, avg. loss: 0.65
Train: Epoch: 3, iter: 35016, avg. loss: 0.71
Train: Epoch: 3, iter: 35017, avg. loss: 0.35
Train: Epoch: 3, iter: 35018, avg. loss: 0.74
Train: Epoch: 3, iter: 35019, avg. loss: 1.18
Train: Epoch: 3, iter: 35020, av

INFO:root:Saving checkpoint model to model_checkpoint/plausible_model_40000.pt



Eval: Epoch: 3, iter: 40000, avg. loss: 1.49

Train: Epoch: 3, iter: 40001, avg. loss: 0.96
Train: Epoch: 3, iter: 40002, avg. loss: 0.37
Train: Epoch: 3, iter: 40003, avg. loss: 1.62
Train: Epoch: 3, iter: 40004, avg. loss: 0.55
Train: Epoch: 3, iter: 40005, avg. loss: 0.59
Train: Epoch: 3, iter: 40006, avg. loss: 0.84
Train: Epoch: 3, iter: 40007, avg. loss: 0.27
Train: Epoch: 3, iter: 40008, avg. loss: 1.41
Train: Epoch: 3, iter: 40009, avg. loss: 0.97
Train: Epoch: 3, iter: 40010, avg. loss: 0.82

Eval: Epoch: 3, iter: 40010, avg. loss: 1.64

Train: Epoch: 3, iter: 40011, avg. loss: 0.36
Train: Epoch: 3, iter: 40012, avg. loss: 1.49
Train: Epoch: 3, iter: 40013, avg. loss: 0.90
Train: Epoch: 3, iter: 40014, avg. loss: 0.79
Train: Epoch: 3, iter: 40015, avg. loss: 0.68
Train: Epoch: 3, iter: 40016, avg. loss: 0.49
Train: Epoch: 3, iter: 40017, avg. loss: 0.73
Train: Epoch: 3, iter: 40018, avg. loss: 0.73
Train: Epoch: 3, iter: 40019, avg. loss: 0.91
Train: Epoch: 3, iter: 40020, av

INFO:root:Saving checkpoint model to model_checkpoint/plausible_model_45000.pt



Eval: Epoch: 3, iter: 45000, avg. loss: 1.15

Train: Epoch: 3, iter: 45001, avg. loss: 0.31
Train: Epoch: 3, iter: 45002, avg. loss: 0.47
Train: Epoch: 3, iter: 45003, avg. loss: 0.24
Train: Epoch: 3, iter: 45004, avg. loss: 0.59
Train: Epoch: 3, iter: 45005, avg. loss: 0.99
Train: Epoch: 3, iter: 45006, avg. loss: 0.94
Train: Epoch: 3, iter: 45007, avg. loss: 0.84
Train: Epoch: 3, iter: 45008, avg. loss: 1.12
Train: Epoch: 3, iter: 45009, avg. loss: 1.22
Train: Epoch: 3, iter: 45010, avg. loss: 0.52

Eval: Epoch: 3, iter: 45010, avg. loss: 1.21

Train: Epoch: 3, iter: 45011, avg. loss: 1.12
Train: Epoch: 3, iter: 45012, avg. loss: 1.57
Train: Epoch: 3, iter: 45013, avg. loss: 0.29
Train: Epoch: 3, iter: 45014, avg. loss: 0.75
Train: Epoch: 3, iter: 45015, avg. loss: 0.49
Train: Epoch: 3, iter: 45016, avg. loss: 1.58
Train: Epoch: 3, iter: 45017, avg. loss: 1.40
Train: Epoch: 3, iter: 45018, avg. loss: 0.97
Train: Epoch: 3, iter: 45019, avg. loss: 0.53
Train: Epoch: 3, iter: 45020, av

INFO:root:Saving checkpoint model to model_checkpoint/plausible_model_50000.pt



Eval: Epoch: 4, iter: 50000, avg. loss: 1.52

Train: Epoch: 4, iter: 50001, avg. loss: 0.34
Train: Epoch: 4, iter: 50002, avg. loss: 0.63
Train: Epoch: 4, iter: 50003, avg. loss: 0.16
Train: Epoch: 4, iter: 50004, avg. loss: 0.35
Train: Epoch: 4, iter: 50005, avg. loss: 0.47
Train: Epoch: 4, iter: 50006, avg. loss: 0.44
Train: Epoch: 4, iter: 50007, avg. loss: 0.32
Train: Epoch: 4, iter: 50008, avg. loss: 0.25
Train: Epoch: 4, iter: 50009, avg. loss: 0.82
Train: Epoch: 4, iter: 50010, avg. loss: 0.17

Eval: Epoch: 4, iter: 50010, avg. loss: 1.54

Train: Epoch: 4, iter: 50011, avg. loss: 1.68
Train: Epoch: 4, iter: 50012, avg. loss: 0.96
Train: Epoch: 4, iter: 50013, avg. loss: 1.02
Train: Epoch: 4, iter: 50014, avg. loss: 0.48
Train: Epoch: 4, iter: 50015, avg. loss: 0.58
Train: Epoch: 4, iter: 50016, avg. loss: 0.47
Train: Epoch: 4, iter: 50017, avg. loss: 0.51
Train: Epoch: 4, iter: 50018, avg. loss: 0.65
Train: Epoch: 4, iter: 50019, avg. loss: 0.74
Train: Epoch: 4, iter: 50020, av

INFO:root:Saving checkpoint model to model_checkpoint/plausible_model_55000.pt



Eval: Epoch: 4, iter: 55000, avg. loss: 1.07

Train: Epoch: 4, iter: 55001, avg. loss: 0.90
Train: Epoch: 4, iter: 55002, avg. loss: 0.24
Train: Epoch: 4, iter: 55003, avg. loss: 0.64
Train: Epoch: 4, iter: 55004, avg. loss: 0.20
Train: Epoch: 4, iter: 55005, avg. loss: 0.48
Train: Epoch: 4, iter: 55006, avg. loss: 0.97
Train: Epoch: 4, iter: 55007, avg. loss: 0.62
Train: Epoch: 4, iter: 55008, avg. loss: 0.95
Train: Epoch: 4, iter: 55009, avg. loss: 0.95
Train: Epoch: 4, iter: 55010, avg. loss: 0.36

Eval: Epoch: 4, iter: 55010, avg. loss: 1.93

Train: Epoch: 4, iter: 55011, avg. loss: 0.87
Train: Epoch: 4, iter: 55012, avg. loss: 0.71
Train: Epoch: 4, iter: 55013, avg. loss: 0.58
Train: Epoch: 4, iter: 55014, avg. loss: 0.63
Train: Epoch: 4, iter: 55015, avg. loss: 1.15
Train: Epoch: 4, iter: 55016, avg. loss: 1.24
Train: Epoch: 4, iter: 55017, avg. loss: 1.60
Train: Epoch: 4, iter: 55018, avg. loss: 0.44
Train: Epoch: 4, iter: 55019, avg. loss: 0.92
Train: Epoch: 4, iter: 55020, av

INFO:root:Saving checkpoint model to model_checkpoint/plausible_model_60000.pt



Eval: Epoch: 4, iter: 60000, avg. loss: 1.35

Train: Epoch: 4, iter: 60001, avg. loss: 0.65
Train: Epoch: 4, iter: 60002, avg. loss: 0.50
Train: Epoch: 4, iter: 60003, avg. loss: 1.11
Train: Epoch: 4, iter: 60004, avg. loss: 0.46
Train: Epoch: 4, iter: 60005, avg. loss: 0.35
Train: Epoch: 4, iter: 60006, avg. loss: 0.69
Train: Epoch: 4, iter: 60007, avg. loss: 0.46
Train: Epoch: 4, iter: 60008, avg. loss: 0.67
Train: Epoch: 4, iter: 60009, avg. loss: 1.58
Train: Epoch: 4, iter: 60010, avg. loss: 1.46

Eval: Epoch: 4, iter: 60010, avg. loss: 1.31

Train: Epoch: 4, iter: 60011, avg. loss: 0.37
Train: Epoch: 4, iter: 60012, avg. loss: 1.13
Train: Epoch: 4, iter: 60013, avg. loss: 0.18
Train: Epoch: 4, iter: 60014, avg. loss: 0.68
Train: Epoch: 4, iter: 60015, avg. loss: 0.87
Train: Epoch: 4, iter: 60016, avg. loss: 0.81
Train: Epoch: 4, iter: 60017, avg. loss: 0.68
Train: Epoch: 4, iter: 60018, avg. loss: 0.20
Train: Epoch: 4, iter: 60019, avg. loss: 0.12
Train: Epoch: 4, iter: 60020, av

INFO:root:Saving checkpoint model to model_checkpoint/plausible_model_65000.pt



Eval: Epoch: 4, iter: 65000, avg. loss: 1.98

Train: Epoch: 4, iter: 65001, avg. loss: 0.39
Train: Epoch: 4, iter: 65002, avg. loss: 0.23
Train: Epoch: 4, iter: 65003, avg. loss: 0.27
Train: Epoch: 4, iter: 65004, avg. loss: 0.60
Train: Epoch: 4, iter: 65005, avg. loss: 0.54
Train: Epoch: 4, iter: 65006, avg. loss: 0.42
Train: Epoch: 4, iter: 65007, avg. loss: 0.42
Train: Epoch: 4, iter: 65008, avg. loss: 0.39
Train: Epoch: 4, iter: 65009, avg. loss: 0.52
Train: Epoch: 4, iter: 65010, avg. loss: 0.18

Eval: Epoch: 4, iter: 65010, avg. loss: 1.09

Train: Epoch: 4, iter: 65011, avg. loss: 0.81
Train: Epoch: 4, iter: 65012, avg. loss: 0.45
Train: Epoch: 4, iter: 65013, avg. loss: 0.79
Train: Epoch: 4, iter: 65014, avg. loss: 1.15
Train: Epoch: 4, iter: 65015, avg. loss: 0.61
Train: Epoch: 4, iter: 65016, avg. loss: 2.05
Train: Epoch: 4, iter: 65017, avg. loss: 0.56
Train: Epoch: 4, iter: 65018, avg. loss: 0.55
Train: Epoch: 4, iter: 65019, avg. loss: 0.39
Train: Epoch: 4, iter: 65020, av

INFO:root:Saving checkpoint model to model_checkpoint/plausible_model_70000.pt



Eval: Epoch: 5, iter: 70000, avg. loss: 1.30

Train: Epoch: 5, iter: 70001, avg. loss: 0.17
Train: Epoch: 5, iter: 70002, avg. loss: 0.51
Train: Epoch: 5, iter: 70003, avg. loss: 0.87
Train: Epoch: 5, iter: 70004, avg. loss: 0.96
Train: Epoch: 5, iter: 70005, avg. loss: 0.35
Train: Epoch: 5, iter: 70006, avg. loss: 0.38
Train: Epoch: 5, iter: 70007, avg. loss: 0.45
Train: Epoch: 5, iter: 70008, avg. loss: 0.76
Train: Epoch: 5, iter: 70009, avg. loss: 0.53
Train: Epoch: 5, iter: 70010, avg. loss: 0.91

Eval: Epoch: 5, iter: 70010, avg. loss: 1.62

Train: Epoch: 5, iter: 70011, avg. loss: 0.41
Train: Epoch: 5, iter: 70012, avg. loss: 0.20
Train: Epoch: 5, iter: 70013, avg. loss: 0.36
Train: Epoch: 5, iter: 70014, avg. loss: 0.72
Train: Epoch: 5, iter: 70015, avg. loss: 1.12
Train: Epoch: 5, iter: 70016, avg. loss: 0.21
Train: Epoch: 5, iter: 70017, avg. loss: 0.47
Train: Epoch: 5, iter: 70018, avg. loss: 0.31
Train: Epoch: 5, iter: 70019, avg. loss: 0.04
Train: Epoch: 5, iter: 70020, av

INFO:root:Saving checkpoint model to model_checkpoint/plausible_model_75000.pt



Eval: Epoch: 5, iter: 75000, avg. loss: 1.90

Train: Epoch: 5, iter: 75001, avg. loss: 0.47
Train: Epoch: 5, iter: 75002, avg. loss: 0.42
Train: Epoch: 5, iter: 75003, avg. loss: 0.36
Train: Epoch: 5, iter: 75004, avg. loss: 0.64
Train: Epoch: 5, iter: 75005, avg. loss: 0.30
Train: Epoch: 5, iter: 75006, avg. loss: 0.39
Train: Epoch: 5, iter: 75007, avg. loss: 0.81
Train: Epoch: 5, iter: 75008, avg. loss: 0.40
Train: Epoch: 5, iter: 75009, avg. loss: 0.16
Train: Epoch: 5, iter: 75010, avg. loss: 0.58

Eval: Epoch: 5, iter: 75010, avg. loss: 1.84

Train: Epoch: 5, iter: 75011, avg. loss: 0.24
Train: Epoch: 5, iter: 75012, avg. loss: 0.64
Train: Epoch: 5, iter: 75013, avg. loss: 0.74
Train: Epoch: 5, iter: 75014, avg. loss: 0.20
Train: Epoch: 5, iter: 75015, avg. loss: 0.32
Train: Epoch: 5, iter: 75016, avg. loss: 0.16
Train: Epoch: 5, iter: 75017, avg. loss: 0.64
Train: Epoch: 5, iter: 75018, avg. loss: 0.11
Train: Epoch: 5, iter: 75019, avg. loss: 0.91
Train: Epoch: 5, iter: 75020, av

INFO:root:Saving checkpoint model to model_checkpoint/plausible_model_80000.pt



Eval: Epoch: 5, iter: 80000, avg. loss: 1.66

Train: Epoch: 5, iter: 80001, avg. loss: 0.31
Train: Epoch: 5, iter: 80002, avg. loss: 0.30
Train: Epoch: 5, iter: 80003, avg. loss: 0.45
Train: Epoch: 5, iter: 80004, avg. loss: 0.40
Train: Epoch: 5, iter: 80005, avg. loss: 0.42
Train: Epoch: 5, iter: 80006, avg. loss: 0.62
Train: Epoch: 5, iter: 80007, avg. loss: 0.80
Train: Epoch: 5, iter: 80008, avg. loss: 0.58
Train: Epoch: 5, iter: 80009, avg. loss: 0.16
Train: Epoch: 5, iter: 80010, avg. loss: 0.47

Eval: Epoch: 5, iter: 80010, avg. loss: 1.90

Train: Epoch: 5, iter: 80011, avg. loss: 0.23
Train: Epoch: 5, iter: 80012, avg. loss: 0.16
Train: Epoch: 5, iter: 80013, avg. loss: 1.24
Train: Epoch: 5, iter: 80014, avg. loss: 0.28
Train: Epoch: 5, iter: 80015, avg. loss: 0.44
Train: Epoch: 5, iter: 80016, avg. loss: 0.92
Train: Epoch: 5, iter: 80017, avg. loss: 0.68
Train: Epoch: 5, iter: 80018, avg. loss: 0.18
Train: Epoch: 5, iter: 80019, avg. loss: 0.37
Train: Epoch: 5, iter: 80020, av

INFO:root:Saving checkpoint model to model_checkpoint/plausible_model_85000.pt



Eval: Epoch: 6, iter: 85000, avg. loss: 1.78

Train: Epoch: 6, iter: 85001, avg. loss: 0.79
Train: Epoch: 6, iter: 85002, avg. loss: 0.22
Train: Epoch: 6, iter: 85003, avg. loss: 0.38
Train: Epoch: 6, iter: 85004, avg. loss: 0.90
Train: Epoch: 6, iter: 85005, avg. loss: 0.45
Train: Epoch: 6, iter: 85006, avg. loss: 0.48
Train: Epoch: 6, iter: 85007, avg. loss: 0.30
Train: Epoch: 6, iter: 85008, avg. loss: 0.02
Train: Epoch: 6, iter: 85009, avg. loss: 0.39
Train: Epoch: 6, iter: 85010, avg. loss: 0.47

Eval: Epoch: 6, iter: 85010, avg. loss: 2.08

Train: Epoch: 6, iter: 85011, avg. loss: 0.50
Train: Epoch: 6, iter: 85012, avg. loss: 1.09
Train: Epoch: 6, iter: 85013, avg. loss: 0.55
Train: Epoch: 6, iter: 85014, avg. loss: 0.53
Train: Epoch: 6, iter: 85015, avg. loss: 0.33
Train: Epoch: 6, iter: 85016, avg. loss: 0.43
Train: Epoch: 6, iter: 85017, avg. loss: 0.20
Train: Epoch: 6, iter: 85018, avg. loss: 0.28
Train: Epoch: 6, iter: 85019, avg. loss: 0.18
Train: Epoch: 6, iter: 85020, av