In [1]:
import torch
import torch.nn as nn

from sotoxic.data_helper.data_transformer import DataTransformer
from sotoxic.data_helper.data_loader import DataLoader
from sotoxic.train.trainer import PyTorchModelTrainer
from sotoxic.config import dataset_config 

  from ._conv import register_converters as _register_converters
Using TensorFlow backend.


In [2]:
# Shared sizes used by the tokeniser configuration and the embedding layer.

# Passed to DataTransformer as max_num_words and used as the row count of the
# nn.Embedding built in get_bgru_network().
VOCAB_SIZE = 100000
# Passed to DataTransformer as max_sequence_length.
MAX_SEQUENCE_LENGTH = 300
# Embedding dimension and the classifier's input_size in get_bgru_network().
# NOTE(review): presumably has to match the dimensionality of the pre-trained
# vectors loaded from 'features/crawl-300d-2M.vec' — confirm.
EMBEDDING_SIZE = 300

## Prepare training and testing data

In [3]:
# Set up the project helpers, then produce the model inputs for train and test.
print("Loading the dataset")
data_transformer = DataTransformer(
    max_num_words=VOCAB_SIZE,
    max_sequence_length=MAX_SEQUENCE_LENGTH,
    char_level=False,
)
# Kept around for the embedding-loading cell further down.
data_loader = DataLoader()
(train_sequences, training_labels, test_sequences) = data_transformer.prepare_data()

Loading the dataset
Doing preprocessing...
Preprocessed.


In [4]:
# Sanity check: display the first 20 prepared training sequences. The captured
# output shows variable-length lists of integer indices.
train_sequences[:20]

[[686,
  76,
  1,
  132,
  124,
  173,
  28,
  705,
  4324,
  9378,
  1162,
  81,
  350,
  44,
  81,
  12,
  13594,
  50,
  6507,
  15,
  59,
  2539,
  143,
  3,
  2736,
  31,
  111,
  1190,
  16065,
  2418,
  6,
  51,
  20,
  12,
  239,
  1,
  349,
  29,
  1,
  46,
  136,
  3,
  38,
  3789,
  85],
 [337,
  7768,
  42,
  2818,
  14,
  628,
  3656,
  3,
  38,
  4701,
  2584,
  22,
  90,
  46,
  929,
  3682,
  987,
  674,
  10174],
 [429,
  363,
  3,
  38,
  118,
  12,
  250,
  2,
  77,
  291,
  10,
  50,
  9,
  14,
  551,
  8,
  2391,
  496,
  478,
  99,
  6,
  568,
  2,
  39,
  314,
  132,
  364,
  4,
  28,
  46,
  42,
  183,
  2,
  440,
  58,
  34,
  1,
  2227,
  88,
  1,
  696,
  474],
 [58,
  3,
  134,
  92,
  56,
  311,
  1362,
  15,
  2063,
  3,
  5532,
  23,
  1,
  109,
  2330,
  53,
  18,
  485,
  15,
  25,
  5,
  3714,
  4,
  1310,
  4,
  9973,
  3,
  64,
  1,
  273,
  83,
  115,
  12893,
  35,
  9,
  44,
  16,
  41,
  11,
  1,
  1469,
  131,
  1245,
  2128,
  418,
  1245,
  30

In [5]:
# Read the pre-trained word vectors and build the matrix that
# get_bgru_network() copies into its embedding layer.
print("Loading the pre-trained word embedding.")
# Relative path — presumably resolved against the notebook's working directory.
embeddings_index = data_loader.load_embedding('features/crawl-300d-2M.vec')
# NOTE(review): assumed to yield a numpy array of shape
# (VOCAB_SIZE, EMBEDDING_SIZE), because get_bgru_network() passes it to
# torch.from_numpy and copies it into an nn.Embedding of that size — confirm.
embedding_matrix = data_transformer.build_embedding_matrix(embeddings_index)
print("Loaded")

Loading the pre-trained word embedding.
Total 2000000 word vectors.
Null word embeddings: 22573
Loaded


## Build model

In [6]:
# Development convenience: re-execute the model and trainer modules so edits
# made to their source files are picked up without restarting the kernel.
import importlib
import sotoxic.models.pytorch.bgru as bgru
import sotoxic.train.trainer as trn
importlib.reload(bgru)
# Names bound earlier with `from sotoxic.train.trainer import ...` are not
# rebound by a reload, which is why later cells go through `trn.` instead.
importlib.reload(trn)

<module 'sotoxic.train.trainer' from '/home/zake7749/PycharmProjects/CCP/sotoxic/train/trainer.py'>

In [7]:
def get_bgru_network(hidden_size=60):
    """Build a new BayesianGRUClassifier on top of a frozen pre-trained embedding.

    The embedding layer has VOCAB_SIZE rows of EMBEDDING_SIZE columns, is
    initialised from the module-level ``embedding_matrix`` and is excluded from
    gradient updates.

    Args:
        hidden_size: Value forwarded as ``hidden_size`` to
            ``bgru.BayesianGRUClassifier``. Defaults to 60, the value that was
            previously hard-coded, so zero-argument callers behave as before.

    Returns:
        A newly constructed ``bgru.BayesianGRUClassifier``.

    Raises:
        ValueError: If ``embedding_matrix`` does not have shape
            ``(VOCAB_SIZE, EMBEDDING_SIZE)``.
    """
    expected_shape = (VOCAB_SIZE, EMBEDDING_SIZE)
    # Tensor.copy_ broadcasts its source, so a wrongly shaped matrix such as
    # (1, EMBEDDING_SIZE) would silently fill every row with the same vector.
    # Fail loudly instead.
    if tuple(embedding_matrix.shape) != expected_shape:
        raise ValueError(
            "embedding_matrix has shape {}, expected {}".format(
                tuple(embedding_matrix.shape), expected_shape
            )
        )

    embedding = nn.Embedding(VOCAB_SIZE, EMBEDDING_SIZE)
    embedding.weight.data.copy_(torch.from_numpy(embedding_matrix))
    # Keep the pre-trained vectors fixed during training.
    embedding.weight.requires_grad = False
    return bgru.BayesianGRUClassifier(
        input_size=EMBEDDING_SIZE,
        hidden_size=hidden_size,
        embedding=embedding,
    )

## Training

In [8]:
# One trainer instance, configured once and reused for the fold training below.
# Built via the reloaded `trn` module rather than the name imported at the top.
trainer = trn.PyTorchModelTrainer(
    model_stamp="FASTTXT_BGRU_64_64",
    epoch_num=300,
    learning_rate=1e-3,
    verbose_round=40,
    shuffle_inputs=False,
    early_stopping_round=10,
)

In [None]:
# Run the fold training; get_bgru_network is handed over as the model factory.
model, best_logloss, best_auc, best_val_pred = trainer.train_folds(
    X=train_sequences,
    y=training_labels,
    fold_count=10,
    batch_size=256,
    get_model_func=get_bgru_network,
    skip_fold=0,
)

Choose the torch base model.
Training on fold 0
Epoch:1 Batch:0 Log-loss0.7120054364204407
Epoch:1 Batch:40 Log-loss0.1323106735944748
Epoch:1 Batch:80 Log-loss0.07861244678497314
Epoch:1 Batch:120 Log-loss0.050647079944610596
Epoch:1 Batch:160 Log-loss0.04874030873179436
Epoch:1 Batch:200 Log-loss0.05985138937830925
Epoch:1 Batch:240 Log-loss0.037754934281110764
Epoch:1 Batch:280 Log-loss0.050901126116514206
Epoch:1 Batch:320 Log-loss0.06970404833555222
Epoch:1 Batch:360 Log-loss0.06141173839569092
Epoch:1 Batch:400 Log-loss0.04935069754719734
Epoch:1 Batch:440 Log-loss0.0667911097407341
Epoch:1 Batch:480 Log-loss0.04504765197634697
Epoch:1 Batch:520 Log-loss0.055000707507133484
Epoch:1 Batch:560 Log-loss0.036638546735048294
Epoch average log loss:0.0793381747856204
Model has been saved as temporary_checkpoints/FASTTXT_BGRU_64_64-TEMP.pt.

In Epoch1, val_loss:0.04555952425826937, best_val_loss:0.04555952425826937, best_auc:0.976878537666061
Epoch:2 Batch:0 Log-loss0.06867814809083939


Epoch:10 Batch:0 Log-loss0.03695434331893921
Epoch:10 Batch:40 Log-loss0.04090544953942299
Epoch:10 Batch:80 Log-loss0.05570065602660179
Epoch:10 Batch:120 Log-loss0.03997639939188957
Epoch:10 Batch:160 Log-loss0.04213264212012291
Epoch:10 Batch:200 Log-loss0.03962920978665352
Epoch:10 Batch:240 Log-loss0.040476951748132706
Epoch:10 Batch:280 Log-loss0.04190034046769142
Epoch:10 Batch:320 Log-loss0.044796139001846313
Epoch:10 Batch:360 Log-loss0.03308139368891716
Epoch:10 Batch:400 Log-loss0.051052410155534744
Epoch:10 Batch:440 Log-loss0.0357748419046402
Epoch:10 Batch:480 Log-loss0.032477814704179764
Epoch:10 Batch:520 Log-loss0.05190897360444069
Epoch:10 Batch:560 Log-loss0.03744189813733101
Epoch average log loss:0.04090871061531028
Model has been saved as temporary_checkpoints/FASTTXT_BGRU_64_64-TEMP.pt.

In Epoch10, val_loss:0.03803986401146478, best_val_loss:0.03803986401146478, best_auc:0.9886834264795996
Epoch:11 Batch:0 Log-loss0.03530322387814522
Epoch:11 Batch:40 Log-loss0.

Epoch:19 Batch:80 Log-loss0.05360683426260948
Epoch:19 Batch:120 Log-loss0.05828571319580078
Epoch:19 Batch:160 Log-loss0.04043808579444885
Epoch:19 Batch:200 Log-loss0.024384962394833565
Epoch:19 Batch:240 Log-loss0.04166371375322342
Epoch:19 Batch:280 Log-loss0.05821231007575989
Epoch:19 Batch:320 Log-loss0.03888482227921486
Epoch:19 Batch:360 Log-loss0.04209063574671745
Epoch:19 Batch:400 Log-loss0.03534097224473953
Epoch:19 Batch:440 Log-loss0.02912217192351818
Epoch:19 Batch:480 Log-loss0.03045186959207058
Epoch:19 Batch:520 Log-loss0.05266507342457771
Epoch:19 Batch:560 Log-loss0.04180420935153961
Epoch average log loss:0.03868482537634139
In Epoch19, val_loss:0.03725522742800543, best_val_loss:0.03724741371682446, best_auc:0.9893603398944103
Epoch:20 Batch:0 Log-loss0.034415099769830704
Epoch:20 Batch:40 Log-loss0.03907474875450134
Epoch:20 Batch:80 Log-loss0.03349713981151581
Epoch:20 Batch:120 Log-loss0.038461823016405106
Epoch:20 Batch:160 Log-loss0.038610685616731644
Epoch:2

Epoch:28 Batch:200 Log-loss0.031570933759212494
Epoch:28 Batch:240 Log-loss0.06176721677184105
Epoch:28 Batch:280 Log-loss0.038737863302230835
Epoch:28 Batch:320 Log-loss0.04648162052035332
Epoch:28 Batch:360 Log-loss0.03659859299659729
Epoch:28 Batch:400 Log-loss0.03391778841614723
Epoch:28 Batch:440 Log-loss0.03358413279056549
Epoch:28 Batch:480 Log-loss0.03738055005669594
Epoch:28 Batch:520 Log-loss0.030275478959083557
Epoch:28 Batch:560 Log-loss0.031242234632372856
Epoch average log loss:0.037374141542906206
In Epoch28, val_loss:0.037056066856172847, best_val_loss:0.036953444690154345, best_auc:0.9895186046708294
Epoch:29 Batch:0 Log-loss0.0413806326687336
Epoch:29 Batch:40 Log-loss0.0488111674785614
Epoch:29 Batch:80 Log-loss0.03226311132311821
Epoch:29 Batch:120 Log-loss0.060494571924209595
Epoch:29 Batch:160 Log-loss0.030656667426228523
Epoch:29 Batch:200 Log-loss0.03970308601856232
Epoch:29 Batch:240 Log-loss0.03575023636221886
Epoch:29 Batch:280 Log-loss0.03034629113972187
Epo

Epoch:37 Batch:520 Log-loss0.0317780040204525
Epoch:37 Batch:560 Log-loss0.036394987255334854
Epoch average log loss:0.03683391263974564
Model has been saved as temporary_checkpoints/FASTTXT_BGRU_64_64-TEMP.pt.

In Epoch37, val_loss:0.036779424331287926, best_val_loss:0.036779424331287926, best_auc:0.9895815556650747
Epoch:38 Batch:0 Log-loss0.040687840431928635
Epoch:38 Batch:40 Log-loss0.04156241938471794
Epoch:38 Batch:80 Log-loss0.040576811879873276
Epoch:38 Batch:120 Log-loss0.031041691079735756
Epoch:38 Batch:160 Log-loss0.04214386269450188
Epoch:38 Batch:200 Log-loss0.045967068523168564
Epoch:38 Batch:240 Log-loss0.031998272985219955
Epoch:38 Batch:280 Log-loss0.03450891748070717
Epoch:38 Batch:320 Log-loss0.03579799458384514
Epoch:38 Batch:360 Log-loss0.048357706516981125
Epoch:38 Batch:400 Log-loss0.03253639116883278
Epoch:38 Batch:440 Log-loss0.035472165793180466
Epoch:38 Batch:480 Log-loss0.022564785555005074
Epoch:38 Batch:520 Log-loss0.026673145592212677
Epoch:38 Batch:560

Epoch:47 Batch:160 Log-loss0.04869798943400383
Epoch:47 Batch:200 Log-loss0.03346498683094978
Epoch:47 Batch:240 Log-loss0.03800887614488602
Epoch:47 Batch:280 Log-loss0.043155938386917114
Epoch:47 Batch:320 Log-loss0.03454754129052162
Epoch:47 Batch:360 Log-loss0.0354398675262928
Epoch:47 Batch:400 Log-loss0.035380031913518906
Epoch:47 Batch:440 Log-loss0.044184986501932144
Epoch:47 Batch:480 Log-loss0.03441204875707626
Epoch:47 Batch:520 Log-loss0.04677858576178551
Epoch:47 Batch:560 Log-loss0.03860176354646683
Epoch average log loss:0.03657726087341351
A pre-trained model at temporary_checkpoints/FASTTXT_BGRU_64_64-TEMP.pt has been loaded.

Model has been saved as checkpoints/FASTTXT_BGRU_64_640.pt.

Choose the torch base model.
Training on fold 1
Epoch:1 Batch:0 Log-loss0.6727760434150696
Epoch:1 Batch:40 Log-loss0.1336449235677719
Epoch:1 Batch:80 Log-loss0.10393470525741577
Epoch:1 Batch:120 Log-loss0.057671431452035904
Epoch:1 Batch:160 Log-loss0.06155194714665413
Epoch:1 Batch:

Epoch:9 Batch:160 Log-loss0.04311126098036766
Epoch:9 Batch:200 Log-loss0.03977668657898903
Epoch:9 Batch:240 Log-loss0.04928787052631378
Epoch:9 Batch:280 Log-loss0.04343109950423241
Epoch:9 Batch:320 Log-loss0.045554351061582565
Epoch:9 Batch:360 Log-loss0.028222650289535522
Epoch:9 Batch:400 Log-loss0.02884092926979065
Epoch:9 Batch:440 Log-loss0.04377659782767296
Epoch:9 Batch:480 Log-loss0.0330808125436306
Epoch:9 Batch:520 Log-loss0.04353070631623268
Epoch:9 Batch:560 Log-loss0.03304726257920265
Epoch average log loss:0.041231107442373675
Model has been saved as temporary_checkpoints/FASTTXT_BGRU_64_64-TEMP.pt.

In Epoch9, val_loss:0.040261446192419954, best_val_loss:0.040261446192419954, best_auc:0.9891183657826991
Epoch:10 Batch:0 Log-loss0.045131534337997437
Epoch:10 Batch:40 Log-loss0.047467898577451706
Epoch:10 Batch:80 Log-loss0.034875765442848206
Epoch:10 Batch:120 Log-loss0.04786363244056702
Epoch:10 Batch:160 Log-loss0.04445711150765419
Epoch:10 Batch:200 Log-loss0.04032

Epoch:18 Batch:160 Log-loss0.035658031702041626
Epoch:18 Batch:200 Log-loss0.04560533165931702
Epoch:18 Batch:240 Log-loss0.06093995273113251
Epoch:18 Batch:280 Log-loss0.04654531553387642
Epoch:18 Batch:320 Log-loss0.03224104270339012
Epoch:18 Batch:360 Log-loss0.04050925374031067
Epoch:18 Batch:400 Log-loss0.037411078810691833
Epoch:18 Batch:440 Log-loss0.02660735882818699
Epoch:18 Batch:480 Log-loss0.048006296157836914
Epoch:18 Batch:520 Log-loss0.03775300830602646
Epoch:18 Batch:560 Log-loss0.04408837482333183
Epoch average log loss:0.03856381814527724
Model has been saved as temporary_checkpoints/FASTTXT_BGRU_64_64-TEMP.pt.

In Epoch18, val_loss:0.038620384849044447, best_val_loss:0.038620384849044447, best_auc:0.9905910215615558
Epoch:19 Batch:0 Log-loss0.03824811056256294
Epoch:19 Batch:40 Log-loss0.016808228567242622
Epoch:19 Batch:80 Log-loss0.035543378442525864
Epoch:19 Batch:120 Log-loss0.03020019829273224
Epoch:19 Batch:160 Log-loss0.03790932148694992
Epoch:19 Batch:200 Log

Epoch:27 Batch:360 Log-loss0.03544208034873009
Epoch:27 Batch:400 Log-loss0.031754668802022934
Epoch:27 Batch:440 Log-loss0.04824363812804222
Epoch:27 Batch:480 Log-loss0.048651132732629776
Epoch:27 Batch:520 Log-loss0.024600772187113762
Epoch:27 Batch:560 Log-loss0.04342334344983101
Epoch average log loss:0.03731697032095066
In Epoch27, val_loss:0.03860016198210927, best_val_loss:0.03844808302013479, best_auc:0.990704355678504
Epoch:28 Batch:0 Log-loss0.028779620304703712
Epoch:28 Batch:40 Log-loss0.03864942863583565
Epoch:28 Batch:80 Log-loss0.03994976356625557
Epoch:28 Batch:120 Log-loss0.05983389914035797
Epoch:28 Batch:160 Log-loss0.0371534563601017
Epoch:28 Batch:200 Log-loss0.03952157124876976
Epoch:28 Batch:240 Log-loss0.023651396855711937
Epoch:28 Batch:280 Log-loss0.022818179801106453
Epoch:28 Batch:320 Log-loss0.05143021047115326
Epoch:28 Batch:360 Log-loss0.04304340109229088
Epoch:28 Batch:400 Log-loss0.04066958650946617
Epoch:28 Batch:440 Log-loss0.035157933831214905
Epoch

Epoch:37 Batch:0 Log-loss0.03646939992904663
Epoch:37 Batch:40 Log-loss0.029216179624199867
Epoch:37 Batch:80 Log-loss0.036086030304431915
Epoch:37 Batch:120 Log-loss0.03187054023146629
Epoch:37 Batch:160 Log-loss0.03597589209675789
Epoch:37 Batch:200 Log-loss0.040180642157793045
Epoch:37 Batch:240 Log-loss0.0369984395802021
Epoch:37 Batch:280 Log-loss0.032506559044122696
Epoch:37 Batch:320 Log-loss0.04712832346558571
Epoch:37 Batch:360 Log-loss0.03497335687279701
Epoch:37 Batch:400 Log-loss0.0449063815176487
Epoch:37 Batch:440 Log-loss0.0633268728852272
Epoch:37 Batch:480 Log-loss0.027778228744864464
Epoch:37 Batch:520 Log-loss0.031030038371682167
Epoch:37 Batch:560 Log-loss0.027357565239071846
Epoch average log loss:0.03663257978457425
Model has been saved as temporary_checkpoints/FASTTXT_BGRU_64_64-TEMP.pt.

In Epoch37, val_loss:0.038327332179147876, best_val_loss:0.038327332179147876, best_auc:0.9907846981884747
Epoch:38 Batch:0 Log-loss0.0414077527821064
Epoch:38 Batch:40 Log-loss

Epoch:46 Batch:360 Log-loss0.028098128736019135
Epoch:46 Batch:400 Log-loss0.02508808858692646
Epoch:46 Batch:440 Log-loss0.04062319174408913
Epoch:46 Batch:480 Log-loss0.05267810449004173
Epoch:46 Batch:520 Log-loss0.03798578307032585
Epoch:46 Batch:560 Log-loss0.04819203540682793
Epoch average log loss:0.03658836573595181
In Epoch46, val_loss:0.03837748371079889, best_val_loss:0.038327332179147876, best_auc:0.9907846981884747
Epoch:47 Batch:0 Log-loss0.04228948429226875
Epoch:47 Batch:40 Log-loss0.053644049912691116
Epoch:47 Batch:80 Log-loss0.0299371387809515
Epoch:47 Batch:120 Log-loss0.03826596960425377
Epoch:47 Batch:160 Log-loss0.04309915378689766
Epoch:47 Batch:200 Log-loss0.03421245515346527
Epoch:47 Batch:240 Log-loss0.05905935540795326
Epoch:47 Batch:280 Log-loss0.04731204733252525
Epoch:47 Batch:320 Log-loss0.04027416184544563
Epoch:47 Batch:360 Log-loss0.0433635376393795
Epoch:47 Batch:400 Log-loss0.048432428389787674
Epoch:47 Batch:440 Log-loss0.032580431550741196
Epoch:4

Epoch:8 Batch:400 Log-loss0.03662538155913353
Epoch:8 Batch:440 Log-loss0.03899862989783287
Epoch:8 Batch:480 Log-loss0.04006917029619217
Epoch:8 Batch:520 Log-loss0.0517415814101696
Epoch:8 Batch:560 Log-loss0.035872798413038254
Epoch average log loss:0.04204534596231367
Model has been saved as temporary_checkpoints/FASTTXT_BGRU_64_64-TEMP.pt.

In Epoch8, val_loss:0.03950107477793544, best_val_loss:0.03950107477793544, best_auc:0.989833465663108
Epoch:9 Batch:0 Log-loss0.0630677193403244
Epoch:9 Batch:40 Log-loss0.032331325113773346
Epoch:9 Batch:80 Log-loss0.047606054693460464
Epoch:9 Batch:120 Log-loss0.054586682468652725
Epoch:9 Batch:160 Log-loss0.047248248010873795
Epoch:9 Batch:200 Log-loss0.02666633389890194
Epoch:9 Batch:240 Log-loss0.04046201333403587
Epoch:9 Batch:280 Log-loss0.032455701380968094
Epoch:9 Batch:320 Log-loss0.03451235219836235
Epoch:9 Batch:360 Log-loss0.03911256045103073
Epoch:9 Batch:400 Log-loss0.030111514031887054
Epoch:9 Batch:440 Log-loss0.05952444672584

Epoch:17 Batch:440 Log-loss0.050244856625795364
Epoch:17 Batch:480 Log-loss0.03357003629207611
Epoch:17 Batch:520 Log-loss0.045512083917856216
Epoch:17 Batch:560 Log-loss0.037274282425642014
Epoch average log loss:0.038705564383417365
Model has been saved as temporary_checkpoints/FASTTXT_BGRU_64_64-TEMP.pt.

In Epoch17, val_loss:0.03753429972140312, best_val_loss:0.03753429972140312, best_auc:0.9907392010568472
Epoch:18 Batch:0 Log-loss0.03486906737089157
Epoch:18 Batch:40 Log-loss0.040532927960157394
Epoch:18 Batch:80 Log-loss0.037907350808382034
Epoch:18 Batch:120 Log-loss0.05321185290813446
Epoch:18 Batch:160 Log-loss0.04002360999584198
Epoch:18 Batch:200 Log-loss0.048030223697423935
Epoch:18 Batch:240 Log-loss0.03564560040831566
Epoch:18 Batch:280 Log-loss0.05232837423682213
Epoch:18 Batch:320 Log-loss0.033754441887140274
Epoch:18 Batch:360 Log-loss0.024255527183413506
Epoch:18 Batch:400 Log-loss0.03634358569979668
Epoch:18 Batch:440 Log-loss0.03060762770473957
Epoch:18 Batch:480 L

Epoch:27 Batch:0 Log-loss0.04765066131949425
Epoch:27 Batch:40 Log-loss0.030533581972122192
Epoch:27 Batch:80 Log-loss0.03516639769077301
Epoch:27 Batch:120 Log-loss0.04590623080730438
Epoch:27 Batch:160 Log-loss0.028501277789473534
Epoch:27 Batch:200 Log-loss0.02199750579893589
Epoch:27 Batch:240 Log-loss0.03329619765281677
Epoch:27 Batch:280 Log-loss0.02977646328508854
Epoch:27 Batch:320 Log-loss0.046193405985832214
Epoch:27 Batch:360 Log-loss0.0385616160929203
Epoch:27 Batch:400 Log-loss0.04397210851311684
Epoch:27 Batch:440 Log-loss0.03921296074986458
Epoch:27 Batch:480 Log-loss0.034743670374155045
Epoch:27 Batch:520 Log-loss0.03560959920287132
Epoch:27 Batch:560 Log-loss0.03977116942405701
Epoch average log loss:0.03747429199782865
In Epoch27, val_loss:0.03735585581873504, best_val_loss:0.03733554633664588, best_auc:0.990945842787065
Epoch:28 Batch:0 Log-loss0.041897520422935486
Epoch:28 Batch:40 Log-loss0.029437685385346413
Epoch:28 Batch:80 Log-loss0.04550371691584587
Epoch:28 B

Epoch:36 Batch:400 Log-loss0.025833694264292717
Epoch:36 Batch:440 Log-loss0.034409526735544205
Epoch:36 Batch:480 Log-loss0.025018826127052307
Epoch:36 Batch:520 Log-loss0.031979165971279144
Epoch:36 Batch:560 Log-loss0.03731510415673256
Epoch average log loss:0.03684867032071842
In Epoch36, val_loss:0.03731820794399781, best_val_loss:0.037304429734430704, best_auc:0.9910044825886049
Epoch:37 Batch:0 Log-loss0.041120968759059906
Epoch:37 Batch:40 Log-loss0.04017426818609238
Epoch:37 Batch:80 Log-loss0.052230436354875565
Epoch:37 Batch:120 Log-loss0.03885991871356964
Epoch:37 Batch:160 Log-loss0.02336188219487667
Epoch:37 Batch:200 Log-loss0.037928953766822815
Epoch:37 Batch:240 Log-loss0.0404653437435627
Epoch:37 Batch:280 Log-loss0.01976540870964527
Epoch:37 Batch:320 Log-loss0.0346110463142395
Epoch:37 Batch:360 Log-loss0.04622014984488487
Epoch:37 Batch:400 Log-loss0.03186018019914627
Epoch:37 Batch:440 Log-loss0.04804309830069542
Epoch:37 Batch:480 Log-loss0.03703493997454643
Epoc

Epoch:46 Batch:40 Log-loss0.04640065133571625
Epoch:46 Batch:80 Log-loss0.03536185994744301
Epoch:46 Batch:120 Log-loss0.024372020736336708
Epoch:46 Batch:160 Log-loss0.04049365594983101
Epoch:46 Batch:200 Log-loss0.03226381912827492
Epoch:46 Batch:240 Log-loss0.029100291430950165
Epoch:46 Batch:280 Log-loss0.048882756382226944
Epoch:46 Batch:320 Log-loss0.033108893781900406
Epoch:46 Batch:360 Log-loss0.03262598440051079
Epoch:46 Batch:400 Log-loss0.032616760581731796
Epoch:46 Batch:440 Log-loss0.030659863725304604
Epoch:46 Batch:480 Log-loss0.03488423302769661
Epoch:46 Batch:520 Log-loss0.02750486694276333
Epoch:46 Batch:560 Log-loss0.0325506292283535
Epoch average log loss:0.03659242326061108
In Epoch46, val_loss:0.03727975592343704, best_val_loss:0.03721452095062645, best_auc:0.9910563496841317
Epoch:47 Batch:0 Log-loss0.028656980022788048
Epoch:47 Batch:40 Log-loss0.03158046677708626
Epoch:47 Batch:80 Log-loss0.04087788984179497
Epoch:47 Batch:120 Log-loss0.0454706996679306
Epoch:4

Epoch:8 Batch:80 Log-loss0.026733243837952614
Epoch:8 Batch:120 Log-loss0.024655088782310486
Epoch:8 Batch:160 Log-loss0.0476449616253376
Epoch:8 Batch:200 Log-loss0.04001067206263542
Epoch:8 Batch:240 Log-loss0.04956318438053131
Epoch:8 Batch:280 Log-loss0.03784343972802162
Epoch:8 Batch:320 Log-loss0.05257384106516838
Epoch:8 Batch:360 Log-loss0.029924876987934113
Epoch:8 Batch:400 Log-loss0.04770452156662941
Epoch:8 Batch:440 Log-loss0.04735509678721428
Epoch:8 Batch:480 Log-loss0.045842722058296204
Epoch:8 Batch:520 Log-loss0.03182806447148323
Epoch:8 Batch:560 Log-loss0.044424816966056824
Epoch average log loss:0.04223519116640091
Model has been saved as temporary_checkpoints/FASTTXT_BGRU_64_64-TEMP.pt.

In Epoch8, val_loss:0.04113873117097322, best_val_loss:0.04113873117097322, best_auc:0.9854845190711595
Epoch:9 Batch:0 Log-loss0.04345192387700081
Epoch:9 Batch:40 Log-loss0.04898719862103462
Epoch:9 Batch:80 Log-loss0.06000930070877075
Epoch:9 Batch:120 Log-loss0.048041671514511

Epoch:17 Batch:200 Log-loss0.03365105763077736
Epoch:17 Batch:240 Log-loss0.03986181318759918
Epoch:17 Batch:280 Log-loss0.03372947871685028
Epoch:17 Batch:320 Log-loss0.04586018994450569
Epoch:17 Batch:360 Log-loss0.03453269973397255
Epoch:17 Batch:400 Log-loss0.040486890822649
Epoch:17 Batch:440 Log-loss0.037645578384399414
Epoch:17 Batch:480 Log-loss0.030009711161255836
Epoch:17 Batch:520 Log-loss0.040392402559518814
Epoch:17 Batch:560 Log-loss0.03294892609119415
Epoch average log loss:0.03877530910540372
Model has been saved as temporary_checkpoints/FASTTXT_BGRU_64_64-TEMP.pt.

In Epoch17, val_loss:0.03991126317927755, best_val_loss:0.03991126317927755, best_auc:0.9880556862096544
Epoch:18 Batch:0 Log-loss0.040074821561574936
Epoch:18 Batch:40 Log-loss0.040846195071935654
Epoch:18 Batch:80 Log-loss0.037810105830430984
Epoch:18 Batch:120 Log-loss0.0367041677236557
Epoch:18 Batch:160 Log-loss0.040505167096853256
Epoch:18 Batch:200 Log-loss0.034350231289863586
Epoch:18 Batch:240 Log-l

Epoch:26 Batch:280 Log-loss0.0324312224984169
Epoch:26 Batch:320 Log-loss0.043237343430519104
Epoch:26 Batch:360 Log-loss0.048127006739377975
Epoch:26 Batch:400 Log-loss0.02048318274319172
Epoch:26 Batch:440 Log-loss0.03484311327338219
Epoch:26 Batch:480 Log-loss0.04101413115859032
Epoch:26 Batch:520 Log-loss0.03416096046566963
Epoch:26 Batch:560 Log-loss0.032723695039749146
Epoch average log loss:0.03758471753015848
In Epoch26, val_loss:0.03973707576121572, best_val_loss:0.03960626397149949, best_auc:0.9882408352973778
Epoch:27 Batch:0 Log-loss0.05371787026524544
Epoch:27 Batch:40 Log-loss0.04236404970288277
Epoch:27 Batch:80 Log-loss0.05403284355998039
Epoch:27 Batch:120 Log-loss0.024500088766217232
Epoch:27 Batch:160 Log-loss0.042078617960214615
Epoch:27 Batch:200 Log-loss0.033170174807310104
Epoch:27 Batch:240 Log-loss0.0327983982861042
Epoch:27 Batch:280 Log-loss0.04499615356326103
Epoch:27 Batch:320 Log-loss0.04755761846899986
Epoch:27 Batch:360 Log-loss0.04892247915267944
Epoch:

In Epoch35, val_loss:0.039657340306191564, best_val_loss:0.039578173508909895, best_auc:0.9883901954473616
Epoch:36 Batch:0 Log-loss0.028388721868395805
Epoch:36 Batch:40 Log-loss0.027466779574751854
Epoch:36 Batch:80 Log-loss0.02881482057273388
Epoch:36 Batch:120 Log-loss0.037767112255096436
Epoch:36 Batch:160 Log-loss0.028785988688468933
Epoch:36 Batch:200 Log-loss0.033389244228601456
Epoch:36 Batch:240 Log-loss0.022862069308757782
Epoch:36 Batch:280 Log-loss0.02861057035624981
Epoch:36 Batch:320 Log-loss0.03138485178351402
Epoch:36 Batch:360 Log-loss0.03939642012119293
Epoch:36 Batch:400 Log-loss0.026068901643157005
Epoch:36 Batch:440 Log-loss0.0366431325674057
Epoch:36 Batch:480 Log-loss0.02163195051252842
Epoch:36 Batch:520 Log-loss0.02748493105173111
Epoch:36 Batch:560 Log-loss0.04909767210483551
Epoch average log loss:0.036708988179452715
In Epoch36, val_loss:0.03967144006626593, best_val_loss:0.039578173508909895, best_auc:0.9883901954473616
Epoch:37 Batch:0 Log-loss0.036945242

Epoch:45 Batch:200 Log-loss0.037846554070711136
Epoch:45 Batch:240 Log-loss0.04242054000496864
Epoch:45 Batch:280 Log-loss0.05488096550107002
Epoch:45 Batch:320 Log-loss0.026418335735797882
Epoch:45 Batch:360 Log-loss0.03647127375006676
Epoch:45 Batch:400 Log-loss0.0363917276263237
Epoch:45 Batch:440 Log-loss0.03109787404537201
Epoch:45 Batch:480 Log-loss0.036177489906549454
Epoch:45 Batch:520 Log-loss0.033712368458509445
Epoch:45 Batch:560 Log-loss0.030969778075814247
Epoch average log loss:0.0364347140737144
In Epoch45, val_loss:0.03958566948339255, best_val_loss:0.039563648721861154, best_auc:0.988465415625026
Epoch:46 Batch:0 Log-loss0.03161366656422615
Epoch:46 Batch:40 Log-loss0.04283595085144043
Epoch:46 Batch:80 Log-loss0.041522856801748276
Epoch:46 Batch:120 Log-loss0.043729234486818314
Epoch:46 Batch:160 Log-loss0.02303955890238285
Epoch:46 Batch:200 Log-loss0.03180466964840889
Epoch:46 Batch:240 Log-loss0.040012892335653305
Epoch:46 Batch:280 Log-loss0.05044377222657204
Epoc

In Epoch54, val_loss:0.039624828676775324, best_val_loss:0.03956095000325142, best_auc:0.9884330467037216
Epoch:55 Batch:0 Log-loss0.034983109682798386
Epoch:55 Batch:40 Log-loss0.043533142656087875
Epoch:55 Batch:80 Log-loss0.035091809928417206
Epoch:55 Batch:120 Log-loss0.05586490035057068
Epoch:55 Batch:160 Log-loss0.034371551126241684
Epoch:55 Batch:200 Log-loss0.020768629387021065
Epoch:55 Batch:240 Log-loss0.044510677456855774
Epoch:55 Batch:280 Log-loss0.046813011169433594
Epoch:55 Batch:320 Log-loss0.03270531818270683
Epoch:55 Batch:360 Log-loss0.04032721370458603
Epoch:55 Batch:400 Log-loss0.04183114692568779
Epoch:55 Batch:440 Log-loss0.028339119628071785
Epoch:55 Batch:480 Log-loss0.040713679045438766
Epoch:55 Batch:520 Log-loss0.03994131460785866
Epoch:55 Batch:560 Log-loss0.03601524233818054
Epoch average log loss:0.0363054969580844
In Epoch55, val_loss:0.039604770953555024, best_val_loss:0.03956095000325142, best_auc:0.9884330467037216
Epoch:56 Batch:0 Log-loss0.034731213

Epoch:7 Batch:0 Log-loss0.03548818454146385
Epoch:7 Batch:40 Log-loss0.052665531635284424
Epoch:7 Batch:80 Log-loss0.03596782684326172
Epoch:7 Batch:120 Log-loss0.04696022346615791
Epoch:7 Batch:160 Log-loss0.03771286457777023
Epoch:7 Batch:200 Log-loss0.059957217425107956
Epoch:7 Batch:240 Log-loss0.048102304339408875
Epoch:7 Batch:280 Log-loss0.044488389045000076
Epoch:7 Batch:320 Log-loss0.03202056512236595
Epoch:7 Batch:360 Log-loss0.04730924963951111
Epoch:7 Batch:400 Log-loss0.04715922102332115
Epoch:7 Batch:440 Log-loss0.03295135498046875
Epoch:7 Batch:480 Log-loss0.03756494075059891
Epoch:7 Batch:520 Log-loss0.04242478311061859
Epoch:7 Batch:560 Log-loss0.0506175272166729
Epoch average log loss:0.04220668766980192
Model has been saved as temporary_checkpoints/FASTTXT_BGRU_64_64-TEMP.pt.

In Epoch7, val_loss:0.03953565719962627, best_val_loss:0.03953565719962627, best_auc:0.9887815929665466
Epoch:8 Batch:0 Log-loss0.035534877330064774
Epoch:8 Batch:40 Log-loss0.02707836776971817

Epoch:16 Batch:120 Log-loss0.02847808413207531
Epoch:16 Batch:160 Log-loss0.04073413088917732
Epoch:16 Batch:200 Log-loss0.04970342293381691
Epoch:16 Batch:240 Log-loss0.03921099379658699
Epoch:16 Batch:280 Log-loss0.02875444106757641
Epoch:16 Batch:320 Log-loss0.023150764405727386
Epoch:16 Batch:360 Log-loss0.03523242846131325
Epoch:16 Batch:400 Log-loss0.03908280283212662
Epoch:16 Batch:440 Log-loss0.03343937173485756
Epoch:16 Batch:480 Log-loss0.03022467903792858
Epoch:16 Batch:520 Log-loss0.05012531206011772
Epoch:16 Batch:560 Log-loss0.03380236029624939
Epoch average log loss:0.03903021079687668
In Epoch16, val_loss:0.03828643841673148, best_val_loss:0.03810529382589412, best_auc:0.9903077410517865
Epoch:17 Batch:0 Log-loss0.035158198326826096
Epoch:17 Batch:40 Log-loss0.03788575902581215
Epoch:17 Batch:80 Log-loss0.041078221052885056
Epoch:17 Batch:120 Log-loss0.03147970512509346
Epoch:17 Batch:160 Log-loss0.03534971550107002
Epoch:17 Batch:200 Log-loss0.05309704318642616
Epoch:1

Epoch:25 Batch:240 Log-loss0.042076244950294495
Epoch:25 Batch:280 Log-loss0.04033327102661133
Epoch:25 Batch:320 Log-loss0.042131200432777405
Epoch:25 Batch:360 Log-loss0.0439172089099884
Epoch:25 Batch:400 Log-loss0.04719462990760803
Epoch:25 Batch:440 Log-loss0.035465557128190994
Epoch:25 Batch:480 Log-loss0.040575526654720306
Epoch:25 Batch:520 Log-loss0.03884885460138321
Epoch:25 Batch:560 Log-loss0.035009708255529404
Epoch average log loss:0.03756963840153601
In Epoch25, val_loss:0.03762516986694113, best_val_loss:0.03758535380011604, best_auc:0.9906366406253445
Epoch:26 Batch:0 Log-loss0.04991983249783516
Epoch:26 Batch:40 Log-loss0.04616701975464821
Epoch:26 Batch:80 Log-loss0.04436659440398216
Epoch:26 Batch:120 Log-loss0.03783582150936127
Epoch:26 Batch:160 Log-loss0.03593594953417778
Epoch:26 Batch:200 Log-loss0.047565627843141556
Epoch:26 Batch:240 Log-loss0.04818875715136528
Epoch:26 Batch:280 Log-loss0.033925384283065796
Epoch:26 Batch:320 Log-loss0.0288123469799757
Epoch

Epoch:34 Batch:520 Log-loss0.047328025102615356
Epoch:34 Batch:560 Log-loss0.04677702486515045
Epoch average log loss:0.036833271231236205
In Epoch34, val_loss:0.037629429597550834, best_val_loss:0.03752064762243834, best_auc:0.9907191334804722
Epoch:35 Batch:0 Log-loss0.03654155880212784
Epoch:35 Batch:40 Log-loss0.03824657201766968
Epoch:35 Batch:80 Log-loss0.042992692440748215
Epoch:35 Batch:120 Log-loss0.03254116326570511
Epoch:35 Batch:160 Log-loss0.0536394827067852
Epoch:35 Batch:200 Log-loss0.027161823585629463
Epoch:35 Batch:240 Log-loss0.04223228618502617
Epoch:35 Batch:280 Log-loss0.035007674247026443
Epoch:35 Batch:320 Log-loss0.050888512283563614
Epoch:35 Batch:360 Log-loss0.028673483058810234
Epoch:35 Batch:400 Log-loss0.03539141267538071
Epoch:35 Batch:440 Log-loss0.053066834807395935
Epoch:35 Batch:480 Log-loss0.028763746842741966
Epoch:35 Batch:520 Log-loss0.02728216163814068
Epoch:35 Batch:560 Log-loss0.02542814053595066
Epoch average log loss:0.03684140107527908
Model

Epoch:44 Batch:120 Log-loss0.050662193447351456
Epoch:44 Batch:160 Log-loss0.02383950911462307
Epoch:44 Batch:200 Log-loss0.03868343308568001
Epoch:44 Batch:240 Log-loss0.04093961417675018
Epoch:44 Batch:280 Log-loss0.03775416314601898
Epoch:44 Batch:320 Log-loss0.0525713674724102
Epoch:44 Batch:360 Log-loss0.03795639052987099
Epoch:44 Batch:400 Log-loss0.04328681901097298
Epoch:44 Batch:440 Log-loss0.05027790740132332
Epoch:44 Batch:480 Log-loss0.042690690606832504
Epoch:44 Batch:520 Log-loss0.027824893593788147
Epoch:44 Batch:560 Log-loss0.02921321429312229
Epoch average log loss:0.0367065680180011
Model has been saved as temporary_checkpoints/FASTTXT_BGRU_64_64-TEMP.pt.

In Epoch44, val_loss:0.037426348052701425, best_val_loss:0.037426348052701425, best_auc:0.9907144276621792
Epoch:45 Batch:0 Log-loss0.029776304960250854
Epoch:45 Batch:40 Log-loss0.03824174776673317
Epoch:45 Batch:80 Log-loss0.025960206985473633
Epoch:45 Batch:120 Log-loss0.03196068853139877
Epoch:45 Batch:160 Log-l

Epoch:53 Batch:480 Log-loss0.03595719859004021
Epoch:53 Batch:520 Log-loss0.0469401516020298
Epoch:53 Batch:560 Log-loss0.04815412685275078
Epoch average log loss:0.036312858983209094
In Epoch53, val_loss:0.03748325602208597, best_val_loss:0.037426348052701425, best_auc:0.9907144276621792
Epoch:54 Batch:0 Log-loss0.039839792996644974
Epoch:54 Batch:40 Log-loss0.050849948078393936
Epoch:54 Batch:80 Log-loss0.04053773358464241
Epoch:54 Batch:120 Log-loss0.042080312967300415
Epoch:54 Batch:160 Log-loss0.034418996423482895
Epoch:54 Batch:200 Log-loss0.03692706301808357
Epoch:54 Batch:240 Log-loss0.02783624641597271
Epoch:54 Batch:280 Log-loss0.041737109422683716
Epoch:54 Batch:320 Log-loss0.0345863401889801
Epoch:54 Batch:360 Log-loss0.02867191843688488
Epoch:54 Batch:400 Log-loss0.032103750854730606
Epoch:54 Batch:440 Log-loss0.042101431638002396
Epoch:54 Batch:480 Log-loss0.03534375876188278
Epoch:54 Batch:520 Log-loss0.027273863554000854
Epoch:54 Batch:560 Log-loss0.03870425745844841
Ep

Epoch:8 Batch:520 Log-loss0.03923605754971504
Epoch:8 Batch:560 Log-loss0.02341325767338276
Epoch average log loss:0.042146239898699735
Model has been saved as temporary_checkpoints/FASTTXT_BGRU_64_64-TEMP.pt.

In Epoch8, val_loss:0.03792250036242368, best_val_loss:0.03792250036242368, best_auc:0.9891503180111494
Epoch:9 Batch:0 Log-loss0.04385707154870033
Epoch:9 Batch:40 Log-loss0.03290438652038574
Epoch:9 Batch:80 Log-loss0.04584120586514473
Epoch:9 Batch:120 Log-loss0.04214106500148773
Epoch:9 Batch:160 Log-loss0.032752957195043564
Epoch:9 Batch:200 Log-loss0.03788946568965912
Epoch:9 Batch:240 Log-loss0.04010153189301491
Epoch:9 Batch:280 Log-loss0.03367197886109352
Epoch:9 Batch:320 Log-loss0.03964441269636154
Epoch:9 Batch:360 Log-loss0.04141067713499069
Epoch:9 Batch:400 Log-loss0.03334914147853851
Epoch:9 Batch:440 Log-loss0.034839730709791183
Epoch:9 Batch:480 Log-loss0.04178367182612419
Epoch:9 Batch:520 Log-loss0.04252682253718376
Epoch:9 Batch:560 Log-loss0.031889401376247

Epoch:17 Batch:480 Log-loss0.03868662193417549
Epoch:17 Batch:520 Log-loss0.043887943029403687
Epoch:17 Batch:560 Log-loss0.034761834889650345
Epoch average log loss:0.03907029921122428
In Epoch17, val_loss:0.03674639646263186, best_val_loss:0.03670715160384994, best_auc:0.9907649454506751
Epoch:18 Batch:0 Log-loss0.03137710317969322
Epoch:18 Batch:40 Log-loss0.03229707479476929
Epoch:18 Batch:80 Log-loss0.03881513699889183
Epoch:18 Batch:120 Log-loss0.03610445186495781
Epoch:18 Batch:160 Log-loss0.03558258339762688
Epoch:18 Batch:200 Log-loss0.03684235364198685
Epoch:18 Batch:240 Log-loss0.05346217751502991
Epoch:18 Batch:280 Log-loss0.045369382947683334
Epoch:18 Batch:320 Log-loss0.034988466650247574
Epoch:18 Batch:360 Log-loss0.045316021889448166
Epoch:18 Batch:400 Log-loss0.044925857335329056
Epoch:18 Batch:440 Log-loss0.03924776241183281
Epoch:18 Batch:480 Log-loss0.04326817765831947
Epoch:18 Batch:520 Log-loss0.03963537514209747
Epoch:18 Batch:560 Log-loss0.03409786522388458
Epoc

Epoch:27 Batch:0 Log-loss0.032058022916316986
Epoch:27 Batch:40 Log-loss0.037677913904190063
Epoch:27 Batch:80 Log-loss0.031161850318312645
Epoch:27 Batch:120 Log-loss0.02310800738632679
Epoch:27 Batch:160 Log-loss0.028846995905041695
Epoch:27 Batch:200 Log-loss0.03471627086400986
Epoch:27 Batch:240 Log-loss0.04245747625827789
Epoch:27 Batch:280 Log-loss0.03251992538571358
Epoch:27 Batch:320 Log-loss0.030567854642868042
Epoch:27 Batch:360 Log-loss0.04350472614169121
Epoch:27 Batch:400 Log-loss0.046614814549684525
Epoch:27 Batch:440 Log-loss0.04512598738074303
Epoch:27 Batch:480 Log-loss0.04219217598438263
Epoch:27 Batch:520 Log-loss0.030640453100204468
Epoch:27 Batch:560 Log-loss0.03488735482096672
Epoch average log loss:0.03753504768080477
Model has been saved as temporary_checkpoints/FASTTXT_BGRU_64_64-TEMP.pt.

In Epoch27, val_loss:0.03633666397599476, best_val_loss:0.03633666397599476, best_auc:0.991000214625914
Epoch:28 Batch:0 Log-loss0.03391767665743828
Epoch:28 Batch:40 Log-los

Epoch:36 Batch:400 Log-loss0.04799996316432953
Epoch:36 Batch:440 Log-loss0.03632586821913719
Epoch:36 Batch:480 Log-loss0.032197196036577225
Epoch:36 Batch:520 Log-loss0.0477294959127903
Epoch:36 Batch:560 Log-loss0.044385313987731934
Epoch average log loss:0.037027884367853404
In Epoch36, val_loss:0.036511069997664805, best_val_loss:0.03633666397599476, best_auc:0.991000214625914
Epoch:37 Batch:0 Log-loss0.033630046993494034
Epoch:37 Batch:40 Log-loss0.04341144487261772
Epoch:37 Batch:80 Log-loss0.043827518820762634
Epoch:37 Batch:120 Log-loss0.03235602378845215
Epoch:37 Batch:160 Log-loss0.029233241453766823
Epoch:37 Batch:200 Log-loss0.05922232195734978
Epoch:37 Batch:240 Log-loss0.040833912789821625
Epoch:37 Batch:280 Log-loss0.03064712882041931
Epoch:37 Batch:320 Log-loss0.03206590563058853
Epoch:37 Batch:360 Log-loss0.0380646176636219
Epoch:37 Batch:400 Log-loss0.03685888275504112
Epoch:37 Batch:440 Log-loss0.0318370945751667
Epoch:37 Batch:480 Log-loss0.03119787573814392
Epoch:

Epoch:8 Batch:440 Log-loss0.026999376714229584
Epoch:8 Batch:480 Log-loss0.04400629922747612
Epoch:8 Batch:520 Log-loss0.03930778056383133
Epoch:8 Batch:560 Log-loss0.059055302292108536
Epoch average log loss:0.04195517084694334
Model has been saved as temporary_checkpoints/FASTTXT_BGRU_64_64-TEMP.pt.

In Epoch8, val_loss:0.038943949354370344, best_val_loss:0.038943949354370344, best_auc:0.9869054354742267
Epoch:9 Batch:0 Log-loss0.04157564416527748
Epoch:9 Batch:40 Log-loss0.042970944195985794
Epoch:9 Batch:80 Log-loss0.04248839244246483
Epoch:9 Batch:120 Log-loss0.04621853306889534
Epoch:9 Batch:160 Log-loss0.035649366676807404
Epoch:9 Batch:200 Log-loss0.03273468837141991
Epoch:9 Batch:240 Log-loss0.045425593852996826
Epoch:9 Batch:280 Log-loss0.05068336799740791
Epoch:9 Batch:320 Log-loss0.044638875871896744
Epoch:9 Batch:360 Log-loss0.04561986029148102
Epoch:9 Batch:400 Log-loss0.036621466279029846
Epoch:9 Batch:440 Log-loss0.04304751753807068
Epoch:9 Batch:480 Log-loss0.047916159

In Epoch17, val_loss:0.03804959634552036, best_val_loss:0.038025336946415605, best_auc:0.9889229674990642
Epoch:18 Batch:0 Log-loss0.05093863606452942
Epoch:18 Batch:40 Log-loss0.03569447249174118
Epoch:18 Batch:80 Log-loss0.030999116599559784
Epoch:18 Batch:120 Log-loss0.043984126299619675
Epoch:18 Batch:160 Log-loss0.04073851928114891
Epoch:18 Batch:200 Log-loss0.0501139871776104
Epoch:18 Batch:240 Log-loss0.04075596109032631
Epoch:18 Batch:280 Log-loss0.045665789395570755
Epoch:18 Batch:320 Log-loss0.043532561510801315
Epoch:18 Batch:360 Log-loss0.03232383355498314
Epoch:18 Batch:400 Log-loss0.02937909960746765
Epoch:18 Batch:440 Log-loss0.030361143872141838
Epoch:18 Batch:480 Log-loss0.06526514887809753
Epoch:18 Batch:520 Log-loss0.04856736585497856
Epoch:18 Batch:560 Log-loss0.04805982857942581
Epoch average log loss:0.038626848886321695
In Epoch18, val_loss:0.03809442507545027, best_val_loss:0.038025336946415605, best_auc:0.9889229674990642
Epoch:19 Batch:0 Log-loss0.035694349557

Epoch:27 Batch:240 Log-loss0.03731074556708336
Epoch:27 Batch:280 Log-loss0.03224267438054085
Epoch:27 Batch:320 Log-loss0.019776832312345505
Epoch:27 Batch:360 Log-loss0.047354597598314285
Epoch:27 Batch:400 Log-loss0.022550620138645172
Epoch:27 Batch:440 Log-loss0.032220106571912766
Epoch:27 Batch:480 Log-loss0.03721199184656143
Epoch:27 Batch:520 Log-loss0.042260248214006424
Epoch:27 Batch:560 Log-loss0.02921636588871479
Epoch average log loss:0.03739128584108715
Model has been saved as temporary_checkpoints/FASTTXT_BGRU_64_64-TEMP.pt.

In Epoch27, val_loss:0.037555375900341165, best_val_loss:0.037555375900341165, best_auc:0.9894698424386442
Epoch:28 Batch:0 Log-loss0.03778574988245964
Epoch:28 Batch:40 Log-loss0.03254866227507591
Epoch:28 Batch:80 Log-loss0.04492509365081787
Epoch:28 Batch:120 Log-loss0.03577310964465141
Epoch:28 Batch:160 Log-loss0.03733382001519203
Epoch:28 Batch:200 Log-loss0.0500914566218853
Epoch:28 Batch:240 Log-loss0.024008147418498993
Epoch:28 Batch:280 Log

Epoch:36 Batch:560 Log-loss0.043779853731393814
Epoch average log loss:0.03689869058850621
In Epoch36, val_loss:0.037692696456019144, best_val_loss:0.03753689442131411, best_auc:0.9894980425088349
Epoch:37 Batch:0 Log-loss0.033113252371549606
Epoch:37 Batch:40 Log-loss0.0506560243666172
Epoch:37 Batch:80 Log-loss0.032049696892499924
Epoch:37 Batch:120 Log-loss0.0572362057864666
Epoch:37 Batch:160 Log-loss0.039986517280340195
Epoch:37 Batch:200 Log-loss0.03667522221803665
Epoch:37 Batch:240 Log-loss0.029182152822613716
Epoch:37 Batch:280 Log-loss0.03598419204354286
Epoch:37 Batch:320 Log-loss0.04507964849472046
Epoch:37 Batch:360 Log-loss0.029649024829268456
Epoch:37 Batch:400 Log-loss0.03400484099984169
Epoch:37 Batch:440 Log-loss0.03319002315402031
Epoch:37 Batch:480 Log-loss0.03851920738816261
Epoch:37 Batch:520 Log-loss0.042954761534929276
Epoch:37 Batch:560 Log-loss0.05137614160776138
Epoch average log loss:0.036965755850542334
In Epoch37, val_loss:0.037767706182749584, best_val_lo

Epoch:2 Batch:160 Log-loss0.051143571734428406
Epoch:2 Batch:200 Log-loss0.04185109958052635
Epoch:2 Batch:240 Log-loss0.038973793387413025
Epoch:2 Batch:280 Log-loss0.046875178813934326
Epoch:2 Batch:320 Log-loss0.0638737753033638
Epoch:2 Batch:360 Log-loss0.04933242127299309
Epoch:2 Batch:400 Log-loss0.045571219176054
Epoch:2 Batch:440 Log-loss0.056573331356048584
Epoch:2 Batch:480 Log-loss0.03366239741444588
Epoch:2 Batch:520 Log-loss0.05586392804980278
Epoch:2 Batch:560 Log-loss0.05873476713895798
Epoch average log loss:0.04966696346444743
Model has been saved as temporary_checkpoints/FASTTXT_BGRU_64_64-TEMP.pt.

In Epoch2, val_loss:0.04754312649880641, best_val_loss:0.04754312649880641, best_auc:0.9785247130291529
Epoch:3 Batch:0 Log-loss0.03936924785375595
Epoch:3 Batch:40 Log-loss0.03871582821011543
Epoch:3 Batch:80 Log-loss0.03771987184882164
Epoch:3 Batch:120 Log-loss0.04217385873198509
Epoch:3 Batch:160 Log-loss0.05575795844197273
Epoch:3 Batch:200 Log-loss0.05685500428080559

Epoch:11 Batch:160 Log-loss0.03412267565727234
Epoch:11 Batch:200 Log-loss0.039331838488578796
Epoch:11 Batch:240 Log-loss0.04977966845035553
Epoch:11 Batch:280 Log-loss0.04404750093817711
Epoch:11 Batch:320 Log-loss0.03475538268685341
Epoch:11 Batch:360 Log-loss0.041808854788541794
Epoch:11 Batch:400 Log-loss0.03803091496229172
Epoch:11 Batch:440 Log-loss0.039786387234926224
Epoch:11 Batch:480 Log-loss0.04521549865603447
Epoch:11 Batch:520 Log-loss0.04675464704632759
Epoch:11 Batch:560 Log-loss0.03984994441270828
Epoch average log loss:0.04075316271212484
Model has been saved as temporary_checkpoints/FASTTXT_BGRU_64_64-TEMP.pt.

In Epoch11, val_loss:0.040111199292105215, best_val_loss:0.040111199292105215, best_auc:0.9874906535293957
Epoch:12 Batch:0 Log-loss0.02083994261920452
Epoch:12 Batch:40 Log-loss0.03963178023695946
Epoch:12 Batch:80 Log-loss0.02447463758289814
Epoch:12 Batch:120 Log-loss0.05673886463046074
Epoch:12 Batch:160 Log-loss0.03424261882901192
Epoch:12 Batch:200 Log-l

Epoch:20 Batch:240 Log-loss0.03927800431847572
Epoch:20 Batch:280 Log-loss0.04753885045647621
Epoch:20 Batch:320 Log-loss0.02503562718629837
Epoch:20 Batch:360 Log-loss0.028513098135590553
Epoch:20 Batch:400 Log-loss0.050185661762952805
Epoch:20 Batch:440 Log-loss0.029106413945555687
Epoch:20 Batch:480 Log-loss0.04420166090130806
Epoch:20 Batch:520 Log-loss0.044173773378133774
Epoch:20 Batch:560 Log-loss0.031179916113615036
Epoch average log loss:0.03824161816654461
Model has been saved as temporary_checkpoints/FASTTXT_BGRU_64_64-TEMP.pt.

In Epoch20, val_loss:0.039440354297872064, best_val_loss:0.039440354297872064, best_auc:0.9885961692987003
Epoch:21 Batch:0 Log-loss0.04731267690658569
Epoch:21 Batch:40 Log-loss0.021234488114714622
Epoch:21 Batch:80 Log-loss0.035927463322877884
Epoch:21 Batch:120 Log-loss0.03808920457959175
Epoch:21 Batch:160 Log-loss0.04243460297584534
Epoch:21 Batch:200 Log-loss0.04232342168688774
Epoch:21 Batch:240 Log-loss0.032635707408189774
Epoch:21 Batch:280 

Epoch:29 Batch:480 Log-loss0.04226592183113098
Epoch:29 Batch:520 Log-loss0.0438595749437809
Epoch:29 Batch:560 Log-loss0.04386654496192932
Epoch average log loss:0.037408116340105026
In Epoch29, val_loss:0.039461284095747166, best_val_loss:0.03918212631970267, best_auc:0.9887729979000054
Epoch:30 Batch:0 Log-loss0.050351519137620926
Epoch:30 Batch:40 Log-loss0.043535325676202774
Epoch:30 Batch:80 Log-loss0.030129151418805122
Epoch:30 Batch:120 Log-loss0.04064665734767914
Epoch:30 Batch:160 Log-loss0.03896826133131981
Epoch:30 Batch:200 Log-loss0.03554191812872887
Epoch:30 Batch:240 Log-loss0.020142018795013428
Epoch:30 Batch:280 Log-loss0.028736582025885582
Epoch:30 Batch:320 Log-loss0.03584105893969536
Epoch:30 Batch:360 Log-loss0.0378265306353569
Epoch:30 Batch:400 Log-loss0.04393140971660614
Epoch:30 Batch:440 Log-loss0.039167147129774094
Epoch:30 Batch:480 Log-loss0.02146512269973755
Epoch:30 Batch:520 Log-loss0.03640872612595558
Epoch:30 Batch:560 Log-loss0.03652501478791237
Epoc

Epoch:4 Batch:0 Log-loss0.04857441410422325
Epoch:4 Batch:40 Log-loss0.0388202890753746
Epoch:4 Batch:80 Log-loss0.034085892140865326
Epoch:4 Batch:120 Log-loss0.058511149138212204
Epoch:4 Batch:160 Log-loss0.046584855765104294
Epoch:4 Batch:200 Log-loss0.04567112401127815
Epoch:4 Batch:240 Log-loss0.04985649883747101
Epoch:4 Batch:280 Log-loss0.04126705601811409
Epoch:4 Batch:320 Log-loss0.04631468281149864
Epoch:4 Batch:360 Log-loss0.07630687206983566
Epoch:4 Batch:400 Log-loss0.04593697190284729
Epoch:4 Batch:440 Log-loss0.05655166879296303
Epoch:4 Batch:480 Log-loss0.04430748149752617
Epoch:4 Batch:520 Log-loss0.04134054854512215
Epoch:4 Batch:560 Log-loss0.044468868523836136
Epoch average log loss:0.04551009874724384
Model has been saved as temporary_checkpoints/FASTTXT_BGRU_64_64-TEMP.pt.

In Epoch4, val_loss:0.040792865033664825, best_val_loss:0.040792865033664825, best_auc:0.9865633028123061
Epoch:5 Batch:0 Log-loss0.03637802228331566
Epoch:5 Batch:40 Log-loss0.0539213418960571

Epoch:13 Batch:240 Log-loss0.03666029870510101
Epoch:13 Batch:280 Log-loss0.03794027492403984
Epoch:13 Batch:320 Log-loss0.03209575638175011
Epoch:13 Batch:360 Log-loss0.027211545035243034
Epoch:13 Batch:400 Log-loss0.039986204355955124
Epoch:13 Batch:440 Log-loss0.032385874539613724
Epoch:13 Batch:480 Log-loss0.042384516447782516
Epoch:13 Batch:520 Log-loss0.03023792989552021
Epoch:13 Batch:560 Log-loss0.04209998995065689
Epoch average log loss:0.04007272729317524
In Epoch13, val_loss:0.03827162573478809, best_val_loss:0.03809650519363438, best_auc:0.9883203300539964
Epoch:14 Batch:0 Log-loss0.05613327398896217
Epoch:14 Batch:40 Log-loss0.02607407234609127
Epoch:14 Batch:80 Log-loss0.037494733929634094
Epoch:14 Batch:120 Log-loss0.04086542874574661
Epoch:14 Batch:160 Log-loss0.042488064616918564
Epoch:14 Batch:200 Log-loss0.033579111099243164
Epoch:14 Batch:240 Log-loss0.04034866392612457
Epoch:14 Batch:280 Log-loss0.03760915622115135
Epoch:14 Batch:320 Log-loss0.04818230867385864
Epo

Epoch:22 Batch:480 Log-loss0.04583213850855827
Epoch:22 Batch:520 Log-loss0.023703603073954582
Epoch:22 Batch:560 Log-loss0.03026270680129528
Epoch average log loss:0.03812316501113985
In Epoch22, val_loss:0.037584361195042916, best_val_loss:0.03750593372882481, best_auc:0.9889360910311962
Epoch:23 Batch:0 Log-loss0.037214744836091995
Epoch:23 Batch:40 Log-loss0.04588218033313751
Epoch:23 Batch:80 Log-loss0.04655660688877106
Epoch:23 Batch:120 Log-loss0.03538404032588005
Epoch:23 Batch:160 Log-loss0.043606821447610855
Epoch:23 Batch:200 Log-loss0.028064822778105736
Epoch:23 Batch:240 Log-loss0.029773995280265808
Epoch:23 Batch:280 Log-loss0.05827256664633751
Epoch:23 Batch:320 Log-loss0.042706605046987534
Epoch:23 Batch:360 Log-loss0.04082326963543892
Epoch:23 Batch:400 Log-loss0.03643850237131119
Epoch:23 Batch:440 Log-loss0.04934261739253998
Epoch:23 Batch:480 Log-loss0.029192691668868065
Epoch:23 Batch:520 Log-loss0.042013172060251236
Epoch:23 Batch:560 Log-loss0.03500572219491005
E

Epoch:32 Batch:0 Log-loss0.02555924467742443
Epoch:32 Batch:40 Log-loss0.043173015117645264
Epoch:32 Batch:80 Log-loss0.03214317187666893
Epoch:32 Batch:120 Log-loss0.04182949289679527
Epoch:32 Batch:160 Log-loss0.048973049968481064
Epoch:32 Batch:200 Log-loss0.027037186548113823
Epoch:32 Batch:240 Log-loss0.03429853543639183
Epoch:32 Batch:280 Log-loss0.04188264533877373
Epoch:32 Batch:320 Log-loss0.027212508022785187
Epoch:32 Batch:360 Log-loss0.05423672869801521
Epoch:32 Batch:400 Log-loss0.026018239557743073
Epoch:32 Batch:440 Log-loss0.03591928258538246
Epoch:32 Batch:480 Log-loss0.029280902817845345
Epoch:32 Batch:520 Log-loss0.03492751345038414
Epoch:32 Batch:560 Log-loss0.04193948954343796
Epoch average log loss:0.03728586017553295
In Epoch32, val_loss:0.03737022754721287, best_val_loss:0.037280518824741884, best_auc:0.9891612523457282
Epoch:33 Batch:0 Log-loss0.054315660148859024
Epoch:33 Batch:40 Log-loss0.04033203795552254
Epoch:33 Batch:80 Log-loss0.030183130875229836
Epoch

Epoch:41 Batch:240 Log-loss0.04956863448023796
Epoch:41 Batch:280 Log-loss0.028649361804127693
Epoch:41 Batch:320 Log-loss0.041014574468135834
Epoch:41 Batch:360 Log-loss0.030673174187541008
Epoch:41 Batch:400 Log-loss0.0355849415063858
Epoch:41 Batch:440 Log-loss0.026770837604999542
Epoch:41 Batch:480 Log-loss0.029718542471528053
Epoch:41 Batch:520 Log-loss0.03486945107579231
Epoch:41 Batch:560 Log-loss0.04453378543257713
Epoch average log loss:0.036813383070485935
In Epoch41, val_loss:0.03725409934025623, best_val_loss:0.037187047823038145, best_auc:0.9889335917214264
Epoch:42 Batch:0 Log-loss0.032268550246953964
Epoch:42 Batch:40 Log-loss0.03819175437092781
Epoch:42 Batch:80 Log-loss0.026156602427363396
Epoch:42 Batch:120 Log-loss0.035541970282793045
Epoch:42 Batch:160 Log-loss0.037008222192525864
Epoch:42 Batch:200 Log-loss0.03382289037108421
Epoch:42 Batch:240 Log-loss0.049914002418518066
Epoch:42 Batch:280 Log-loss0.04340128228068352
Epoch:42 Batch:320 Log-loss0.03338106349110603

## Make predictions

In [None]:
import numpy as np
from sklearn.metrics import roc_auc_score

# Join the per-fold arrays held in `best_val_pred` along axis 0 (the default
# axis of np.concatenate) and score the result against `training_labels`.
# NOTE(review): presumably these are out-of-fold predictions stored in the same
# row order as `training_labels` — confirm against the training loop.
train_fold_preditcions = np.concatenate(best_val_pred)
training_auc = roc_auc_score(y_true=training_labels, y_score=train_fold_preditcions)
print("Training AUC", training_auc)

In [None]:
import pandas as pd
# Locations of the train/test CSV files, relative to the working directory.
path = "Dataset/"
TRAIN_DATA_FILE = "{}train.csv".format(path)
TEST_DATA_FILE = "{}test.csv".format(path)

# Read both files (test first, then train) into DataFrames; the later cells
# take the "id" column from each of them.
test_df, train_df = (
    pd.read_csv(csv_file) for csv_file in (TEST_DATA_FILE, TRAIN_DATA_FILE)
)

In [None]:
# Column order of the prediction frames written by the cells below.
CLASSES = ["toxic", "severe_toxic", "obscene", "threat", "insult", "identity_hate"]
submit_path_prefix = "results/bgru/Fasttext-BGRU-" + str(MAX_SEQUENCE_LENGTH)

print("Predicting testing results...")
# Collect one prediction array per fold model.
# NOTE(review): `new_models` and its `predict(..., batch_size, verbose)` signature
# are defined outside this cell — confirm they refer to the models trained above.
test_predicts_list = [
    model.predict(test_sequences, batch_size=256, verbose=1)
    for model in new_models
]
if not test_predicts_list:
    # Fail with a clear message instead of an IndexError further down.
    raise ValueError("new_models is empty: there are no fold predictions to average")

# Element-wise average over the folds. dtype=np.float64 keeps the average in
# double precision even if the models return float32 arrays.
test_predicts_mean = np.mean(test_predicts_list, axis=0, dtype=np.float64)

# Final frame: "id" first, followed by one score column per entry of CLASSES.
# A 1-D id array is enough for a single column, so no reshape is needed.
test_ids = test_df["id"].values
test_predicts = pd.DataFrame(data=test_predicts_mean, columns=CLASSES)
test_predicts.insert(0, "id", test_ids)


In [None]:
import os

# Embed `best_logloss` and `best_auc` in the file name so that outputs of
# different runs can be told apart.
# NOTE(review): "{:4f}" only sets a minimum field width of 4 (six decimals are
# still printed); "{:.4f}" may have been intended. Left unchanged so that the
# generated file names stay the same.
submit_path = submit_path_prefix + "-L{:4f}-A{:4f}.csv".format(best_logloss, best_auc)

# DataFrame.to_csv does not create missing directories, so make sure the
# target directory exists before writing.
submit_dir = os.path.dirname(submit_path)
if submit_dir:
    os.makedirs(submit_dir, exist_ok=True)
test_predicts.to_csv(submit_path, index=False)

In [None]:
import os

print("Predicting training results...")

# Build the training-set prediction frame: "id" first, followed by one score
# column per entry of CLASSES. A 1-D id array is enough for a single column.
# NOTE(review): assumes the rows of `train_fold_preditcions` are in the same
# order as the rows of `train_df` — confirm against how the folds were split.
train_ids = train_df["id"].values
train_predicts = pd.DataFrame(data=train_fold_preditcions, columns=CLASSES)
train_predicts.insert(0, "id", train_ids)

# NOTE(review): "{:4f}" only sets a minimum field width of 4 (six decimals are
# still printed); "{:.4f}" may have been intended. Left unchanged so that the
# generated file names stay the same.
submit_path = submit_path_prefix + "-Train-L{:4f}-A{:4f}.csv".format(best_logloss, best_auc)

# DataFrame.to_csv does not create missing directories, so make sure the
# target directory exists before writing.
submit_dir = os.path.dirname(submit_path)
if submit_dir:
    os.makedirs(submit_dir, exist_ok=True)
train_predicts.to_csv(submit_path, index=False)