In [1]:
import torch
import torch.nn as nn

from sotoxic.data_helper.data_transformer import DataTransformer
from sotoxic.data_helper.data_loader import DataLoader
from sotoxic.train.trainer import PyTorchModelTrainer
from sotoxic.config import dataset_config 

  from ._conv import register_converters as _register_converters
Using TensorFlow backend.


In [2]:
# Vocabulary cap: passed to DataTransformer as `max_num_words` and used as the
# number of rows of the nn.Embedding built in the model cell.
VOCAB_SIZE = 100000
# Passed to DataTransformer as `max_sequence_length`.
MAX_SEQUENCE_LENGTH = 300
# Embedding width: second dimension of the nn.Embedding and the classifier's
# `input_size`; the vectors file loaded below is 'crawl-300d-2M.vec'.
EMBEDDING_SIZE = 300

## Prepare training and testing data

In [3]:
print("Loading the dataset")

# Word-level transformer (char_level=False) configured from the constants cell.
data_transformer = DataTransformer(
    max_num_words=VOCAB_SIZE,
    max_sequence_length=MAX_SEQUENCE_LENGTH,
    char_level=False,
)

# Created here but first used by the embedding-loading cell further down.
data_loader = DataLoader()

# prepare_data() hands back three objects: training inputs, training labels
# and test inputs, in that order.
(train_sequences,
 training_labels,
 test_sequences) = data_transformer.prepare_data()

Loading the dataset
Doing preprocessing...
Preprocessed.


In [4]:
# Display the first 20 prepared training sequences as a sanity check.
# NOTE(review): the entries look like variable-length lists of integer token
# ids — confirm against DataTransformer; a smaller slice would keep the output short.
train_sequences[:20]

[[686,
  76,
  1,
  132,
  124,
  173,
  28,
  705,
  4323,
  9377,
  1162,
  81,
  350,
  44,
  81,
  12,
  13593,
  50,
  6506,
  15,
  59,
  2539,
  143,
  3,
  2736,
  31,
  111,
  1190,
  16064,
  2418,
  6,
  51,
  20,
  12,
  239,
  1,
  349,
  29,
  1,
  46,
  136,
  3,
  38,
  3789,
  85],
 [337,
  7767,
  42,
  2818,
  14,
  628,
  3656,
  3,
  38,
  4700,
  2584,
  22,
  90,
  46,
  929,
  3682,
  987,
  674,
  10173],
 [429,
  363,
  3,
  38,
  118,
  12,
  250,
  2,
  77,
  291,
  10,
  50,
  9,
  14,
  551,
  8,
  2391,
  496,
  478,
  99,
  6,
  568,
  2,
  39,
  314,
  132,
  364,
  4,
  28,
  46,
  42,
  183,
  2,
  440,
  58,
  34,
  1,
  2227,
  88,
  1,
  696,
  474],
 [58,
  3,
  134,
  92,
  55,
  311,
  1363,
  15,
  2063,
  3,
  5531,
  23,
  1,
  109,
  2330,
  53,
  18,
  485,
  15,
  25,
  5,
  3714,
  4,
  1310,
  4,
  9972,
  3,
  64,
  1,
  273,
  83,
  115,
  12892,
  35,
  9,
  44,
  16,
  41,
  11,
  1,
  1470,
  131,
  1245,
  2128,
  418,
  1245,
  30

In [5]:
# Load the pre-trained word vectors, then build `embedding_matrix`, which the
# model factory below copies into the weights of its nn.Embedding layer.
print("Loading the pre-trained word embedding.")
# Relative path — presumably resolved against the notebook's working directory.
embeddings_index = data_loader.load_embedding('features/crawl-300d-2M.vec')
embedding_matrix = data_transformer.build_embedding_matrix(embeddings_index)
print("Loaded")

Loading the pre-trained word embedding.
Total 2000000 word vectors.
Null word embeddings: 22573
Loaded


## Build model

In [38]:
# Development helper: re-import the model and trainer modules so that edits
# made to their source files are picked up without restarting the kernel.
import importlib
import sotoxic.models.pytorch.rhn as rhn
import sotoxic.train.trainer as trn
importlib.reload(rhn)
# The cells below build the trainer through `trn` (the reloaded module) rather
# than through the `PyTorchModelTrainer` name imported in the first cell.
importlib.reload(trn)

<module 'sotoxic.train.trainer' from '/home/zake7749/PycharmProjects/CCP/sotoxic/train/trainer.py'>

In [39]:
def get_recurrent_higway_classifier(hidden_size=60, recurrence_length=2, recurrent_dropout=0.25):
    """Build a recurrent-highway classifier on top of frozen pre-trained embeddings.

    The function is handed to ``trainer.train_folds`` as ``get_model_func``.
    Called without arguments it builds exactly the same model as before; the
    keyword parameters only exist so the architecture can be tuned without
    editing the function body.

    Reads the notebook globals ``VOCAB_SIZE``, ``EMBEDDING_SIZE``,
    ``embedding_matrix`` and the ``rhn`` module.

    Args:
        hidden_size: forwarded as ``hidden_size`` to the classifier.
        recurrence_length: forwarded as ``recurrence_length`` to the classifier.
        recurrent_dropout: forwarded as ``recurrent_dropout`` to the classifier.

    Returns:
        A new ``rhn.RecurrentHighwayClassifier`` instance.
    """
    embedding = nn.Embedding(VOCAB_SIZE, EMBEDDING_SIZE)
    # Replace the random initialisation with the pre-trained vectors.
    embedding.weight.data.copy_(torch.from_numpy(embedding_matrix))
    # Freeze the embedding so the optimizer does not update the pre-trained vectors.
    embedding.weight.requires_grad = False
    return rhn.RecurrentHighwayClassifier(
        input_size=EMBEDDING_SIZE,
        hidden_size=hidden_size,
        embedding=embedding,
        recurrence_length=recurrence_length,
        recurrent_dropout=recurrent_dropout)


## Training

In [40]:
# Trainer configuration, built through the reloaded `trn` module.
# NOTE(review): the stamp says "64_64" while the model factory uses
# hidden_size=60 — confirm the checkpoint name is intentional.
# NOTE(review): shuffle_inputs=False — confirm training without shuffling is intended.
trainer = trn.PyTorchModelTrainer(
    model_stamp="FASTTEXT_RHN_64_64",
    epoch_num=300,
    learning_rate=1e-3,
    verbose_round=80,
    shuffle_inputs=False,
    early_stopping_round=12,
)

In [9]:
# 10-fold training; a fresh model is obtained per fold from the factory function.
# NOTE(review): the recorded output below comes from execution In [9], i.e.
# before the reload/model/trainer cells were last re-run (In [38]-In [40]);
# re-run the notebook top to bottom to confirm the logs match the current code.
(models,
 best_logloss,
 best_auc,
 best_val_pred) = trainer.train_folds(
    X=train_sequences,
    y=training_labels,
    fold_count=10,
    batch_size=256,
    get_model_func=get_recurrent_higway_classifier,
)

Choose the torch base model.
Training on fold 0
Epoch:1 Batch:0 Log-loss0.6764200329780579
Epoch:1 Batch:80 Log-loss0.09407692402601242
Epoch:1 Batch:160 Log-loss0.09060367941856384
Epoch:1 Batch:240 Log-loss0.0713363066315651
Epoch:1 Batch:320 Log-loss0.055740322917699814
Epoch:1 Batch:400 Log-loss0.0804063081741333
Epoch:1 Batch:480 Log-loss0.0346609428524971
Epoch:1 Batch:560 Log-loss0.07526189088821411
Epoch average log loss:0.084349685122392
Model has been saved as temporary_checkpoints/FASTTEXT_RHN_64_64-TEMP.pt.

In Epoch1, val_loss:0.04926930949574479, best_val_loss:0.04926930949574479, best_auc:0.9753638758367783
Epoch:2 Batch:0 Log-loss0.047581274062395096
Epoch:2 Batch:80 Log-loss0.03739865869283676
Epoch:2 Batch:160 Log-loss0.02832009084522724
Epoch:2 Batch:240 Log-loss0.059971634298563004
Epoch:2 Batch:320 Log-loss0.05598978325724602
Epoch:2 Batch:400 Log-loss0.05800679326057434
Epoch:2 Batch:480 Log-loss0.052891626954078674
Epoch:2 Batch:560 Log-loss0.035993900150060654
E

Epoch:15 Batch:320 Log-loss0.030456768348813057
Epoch:15 Batch:400 Log-loss0.0304322000592947
Epoch:15 Batch:480 Log-loss0.04947105050086975
Epoch:15 Batch:560 Log-loss0.03121676668524742
Epoch average log loss:0.03985342569981835
Model has been saved as temporary_checkpoints/FASTTEXT_RHN_64_64-TEMP.pt.

In Epoch15, val_loss:0.03766852826388454, best_val_loss:0.03766852826388454, best_auc:0.990284062556752
Epoch:16 Batch:0 Log-loss0.03523236885666847
Epoch:16 Batch:80 Log-loss0.04171955958008766
Epoch:16 Batch:160 Log-loss0.03461119160056114
Epoch:16 Batch:240 Log-loss0.048311617225408554
Epoch:16 Batch:320 Log-loss0.038581714034080505
Epoch:16 Batch:400 Log-loss0.031511932611465454
Epoch:16 Batch:480 Log-loss0.03388978913426399
Epoch:16 Batch:560 Log-loss0.04285668209195137
Epoch average log loss:0.039643369408856544
Model has been saved as temporary_checkpoints/FASTTEXT_RHN_64_64-TEMP.pt.

In Epoch16, val_loss:0.03758368035311024, best_val_loss:0.03758368035311024, best_auc:0.9901440

Epoch:30 Batch:400 Log-loss0.03785456344485283
Epoch:30 Batch:480 Log-loss0.04306377097964287
Epoch:30 Batch:560 Log-loss0.03783402219414711
Epoch average log loss:0.037760935231511084
Model has been saved as temporary_checkpoints/FASTTEXT_RHN_64_64-TEMP.pt.

In Epoch30, val_loss:0.03717460307236107, best_val_loss:0.03717460307236107, best_auc:0.9905650709821402
Epoch:31 Batch:0 Log-loss0.03407754749059677
Epoch:31 Batch:80 Log-loss0.03229319304227829
Epoch:31 Batch:160 Log-loss0.04111488163471222
Epoch:31 Batch:240 Log-loss0.03453874588012695
Epoch:31 Batch:320 Log-loss0.04419414699077606
Epoch:31 Batch:400 Log-loss0.022545315325260162
Epoch:31 Batch:480 Log-loss0.0527334101498127
Epoch:31 Batch:560 Log-loss0.03118349239230156
Epoch average log loss:0.0374804664968646
Model has been saved as temporary_checkpoints/FASTTEXT_RHN_64_64-TEMP.pt.

In Epoch31, val_loss:0.037053314777036495, best_val_loss:0.037053314777036495, best_auc:0.9905358257982354
Epoch:32 Batch:0 Log-loss0.03002392314

Epoch:2 Batch:480 Log-loss0.06170211359858513
Epoch:2 Batch:560 Log-loss0.056031085550785065
Epoch average log loss:0.05337644493473428
In Epoch2, val_loss:0.05235306843447438, best_val_loss:0.05111843037142374, best_auc:0.9728146245265809
Epoch:3 Batch:0 Log-loss0.05006115138530731
Epoch:3 Batch:80 Log-loss0.05657699704170227
Epoch:3 Batch:160 Log-loss0.04490293189883232
Epoch:3 Batch:240 Log-loss0.03619351238012314
Epoch:3 Batch:320 Log-loss0.07174747437238693
Epoch:3 Batch:400 Log-loss0.04430321231484413
Epoch:3 Batch:480 Log-loss0.05191109701991081
Epoch:3 Batch:560 Log-loss0.041987329721450806
Epoch average log loss:0.05025121001194098
Model has been saved as temporary_checkpoints/FASTTEXT_RHN_64_64-TEMP.pt.

In Epoch3, val_loss:0.04729695975633182, best_val_loss:0.04729695975633182, best_auc:0.977834065065673
Epoch:4 Batch:0 Log-loss0.07252666354179382
Epoch:4 Batch:80 Log-loss0.04659726843237877
Epoch:4 Batch:160 Log-loss0.06561022251844406
Epoch:4 Batch:240 Log-loss0.0350778400

Epoch:16 Batch:560 Log-loss0.04825394228100777
Epoch average log loss:0.04019081565950598
In Epoch16, val_loss:0.04001604260462636, best_val_loss:0.03981916391784723, best_auc:0.9897247756156066
Epoch:17 Batch:0 Log-loss0.030554376542568207
Epoch:17 Batch:80 Log-loss0.040036942809820175
Epoch:17 Batch:160 Log-loss0.03191262483596802
Epoch:17 Batch:240 Log-loss0.04790053144097328
Epoch:17 Batch:320 Log-loss0.05502623692154884
Epoch:17 Batch:400 Log-loss0.0524011105298996
Epoch:17 Batch:480 Log-loss0.044097576290369034
Epoch:17 Batch:560 Log-loss0.04616418480873108
Epoch average log loss:0.03987186909985862
In Epoch17, val_loss:0.0402473788965836, best_val_loss:0.03981916391784723, best_auc:0.9897247756156066
Epoch:18 Batch:0 Log-loss0.039020586758852005
Epoch:18 Batch:80 Log-loss0.035747867077589035
Epoch:18 Batch:160 Log-loss0.04417452588677406
Epoch:18 Batch:240 Log-loss0.04101055860519409
Epoch:18 Batch:320 Log-loss0.03627045452594757
Epoch:18 Batch:400 Log-loss0.03318973258137703
Ep

Epoch:31 Batch:240 Log-loss0.033379945904016495
Epoch:31 Batch:320 Log-loss0.036133430898189545
Epoch:31 Batch:400 Log-loss0.03633055090904236
Epoch:31 Batch:480 Log-loss0.029332110658288002
Epoch:31 Batch:560 Log-loss0.04237540066242218
Epoch average log loss:0.038091836912956624
In Epoch31, val_loss:0.03933979842168355, best_val_loss:0.03920176149522164, best_auc:0.9902525662097995
Epoch:32 Batch:0 Log-loss0.04068051278591156
Epoch:32 Batch:80 Log-loss0.029142724350094795
Epoch:32 Batch:160 Log-loss0.03255143389105797
Epoch:32 Batch:240 Log-loss0.03811360150575638
Epoch:32 Batch:320 Log-loss0.04262396693229675
Epoch:32 Batch:400 Log-loss0.04448455199599266
Epoch:32 Batch:480 Log-loss0.03675564005970955
Epoch:32 Batch:560 Log-loss0.04667548090219498
Epoch average log loss:0.03785014832392335
In Epoch32, val_loss:0.039418808711276454, best_val_loss:0.03920176149522164, best_auc:0.9902525662097995
Epoch:33 Batch:0 Log-loss0.03888056427240372
Epoch:33 Batch:80 Log-loss0.03820540383458137

In Epoch46, val_loss:0.03925254646954041, best_val_loss:0.03909190979720897, best_auc:0.9903393737793028
Epoch:47 Batch:0 Log-loss0.042367175221443176
Epoch:47 Batch:80 Log-loss0.026822848245501518
Epoch:47 Batch:160 Log-loss0.048959504812955856
Epoch:47 Batch:240 Log-loss0.04415258765220642
Epoch:47 Batch:320 Log-loss0.03561440482735634
Epoch:47 Batch:400 Log-loss0.028074493631720543
Epoch:47 Batch:480 Log-loss0.04009208455681801
Epoch:47 Batch:560 Log-loss0.031041815876960754
Epoch average log loss:0.0375291524820828
A pre-trained model at temporary_checkpoints/FASTTEXT_RHN_64_64-TEMP.pt has been loaded.

Model has been saved as checkpoints/FASTTEXT_RHN_64_641.pt.

Choose the torch base model.
Training on fold 2
Epoch:1 Batch:0 Log-loss0.6674628853797913
Epoch:1 Batch:80 Log-loss0.13349492847919464
Epoch:1 Batch:160 Log-loss0.085947185754776
Epoch:1 Batch:240 Log-loss0.0798916444182396
Epoch:1 Batch:320 Log-loss0.0926297977566719
Epoch:1 Batch:400 Log-loss0.06787348538637161
Epoch:1 

Epoch:14 Batch:80 Log-loss0.04302411153912544
Epoch:14 Batch:160 Log-loss0.0454287976026535
Epoch:14 Batch:240 Log-loss0.036822326481342316
Epoch:14 Batch:320 Log-loss0.04764799773693085
Epoch:14 Batch:400 Log-loss0.041338857263326645
Epoch:14 Batch:480 Log-loss0.0558943934738636
Epoch:14 Batch:560 Log-loss0.04525012522935867
Epoch average log loss:0.04535711080700691
Model has been saved as temporary_checkpoints/FASTTEXT_RHN_64_64-TEMP.pt.

In Epoch14, val_loss:0.04180933231121664, best_val_loss:0.04180933231121664, best_auc:0.9873879664320498
Epoch:15 Batch:0 Log-loss0.0514286570250988
Epoch:15 Batch:80 Log-loss0.05611097440123558
Epoch:15 Batch:160 Log-loss0.03017943538725376
Epoch:15 Batch:240 Log-loss0.05530748888850212
Epoch:15 Batch:320 Log-loss0.03709632530808449
Epoch:15 Batch:400 Log-loss0.03576720133423805
Epoch:15 Batch:480 Log-loss0.036006804555654526
Epoch:15 Batch:560 Log-loss0.04189033806324005
Epoch average log loss:0.04461571832653135
Model has been saved as temporary

Epoch:28 Batch:320 Log-loss0.03656997159123421
Epoch:28 Batch:400 Log-loss0.04381921514868736
Epoch:28 Batch:480 Log-loss0.03894702345132828
Epoch:28 Batch:560 Log-loss0.04251810535788536
Epoch average log loss:0.0414368053366031
Model has been saved as temporary_checkpoints/FASTTEXT_RHN_64_64-TEMP.pt.

In Epoch28, val_loss:0.03920685232542534, best_val_loss:0.03920685232542534, best_auc:0.9903751770621172
Epoch:29 Batch:0 Log-loss0.04486597701907158
Epoch:29 Batch:80 Log-loss0.04063516482710838
Epoch:29 Batch:160 Log-loss0.05469881370663643
Epoch:29 Batch:240 Log-loss0.041476618498563766
Epoch:29 Batch:320 Log-loss0.044276732951402664
Epoch:29 Batch:400 Log-loss0.03186545521020889
Epoch:29 Batch:480 Log-loss0.042694564908742905
Epoch:29 Batch:560 Log-loss0.035684920847415924
Epoch average log loss:0.04128334309040968
In Epoch29, val_loss:0.039228665459441744, best_val_loss:0.03920685232542534, best_auc:0.9903751770621172
Epoch:30 Batch:0 Log-loss0.055004749447107315
Epoch:30 Batch:80 

In Epoch42, val_loss:0.03858395984099385, best_val_loss:0.038502631441594805, best_auc:0.9907638151250046
Epoch:43 Batch:0 Log-loss0.04289352893829346
Epoch:43 Batch:80 Log-loss0.03482220694422722
Epoch:43 Batch:160 Log-loss0.028714537620544434
Epoch:43 Batch:240 Log-loss0.0372578464448452
Epoch:43 Batch:320 Log-loss0.042857956141233444
Epoch:43 Batch:400 Log-loss0.03794160485267639
Epoch:43 Batch:480 Log-loss0.037178099155426025
Epoch:43 Batch:560 Log-loss0.02656126394867897
Epoch average log loss:0.04009668595224087
In Epoch43, val_loss:0.038540649454517684, best_val_loss:0.038502631441594805, best_auc:0.9907638151250046
Epoch:44 Batch:0 Log-loss0.04633226990699768
Epoch:44 Batch:80 Log-loss0.061987098306417465
Epoch:44 Batch:160 Log-loss0.04715224727988243
Epoch:44 Batch:240 Log-loss0.05227178335189819
Epoch:44 Batch:320 Log-loss0.027004098519682884
Epoch:44 Batch:400 Log-loss0.029736021533608437
Epoch:44 Batch:480 Log-loss0.04029693827033043
Epoch:44 Batch:560 Log-loss0.04200386628

Epoch:57 Batch:560 Log-loss0.038082998245954514
Epoch average log loss:0.04002621650496232
In Epoch57, val_loss:0.038357738991957685, best_val_loss:0.03828459900954433, best_auc:0.9908638921770435
Epoch:58 Batch:0 Log-loss0.054733142256736755
Epoch:58 Batch:80 Log-loss0.05223669111728668
Epoch:58 Batch:160 Log-loss0.03271069377660751
Epoch:58 Batch:240 Log-loss0.04749557003378868
Epoch:58 Batch:320 Log-loss0.032637711614370346
Epoch:58 Batch:400 Log-loss0.033266108483076096
Epoch:58 Batch:480 Log-loss0.03806423768401146
Epoch:58 Batch:560 Log-loss0.046329859644174576
Epoch average log loss:0.039877284609247
In Epoch58, val_loss:0.03837416896985276, best_val_loss:0.03828459900954433, best_auc:0.9908638921770435
Epoch:59 Batch:0 Log-loss0.036391668021678925
Epoch:59 Batch:80 Log-loss0.0391409732401371
Epoch:59 Batch:160 Log-loss0.043105658143758774
Epoch:59 Batch:240 Log-loss0.03191642090678215
Epoch:59 Batch:320 Log-loss0.030474543571472168
Epoch:59 Batch:400 Log-loss0.0457703173160553


Epoch:73 Batch:0 Log-loss0.037563033401966095
Epoch:73 Batch:80 Log-loss0.022351861000061035
Epoch:73 Batch:160 Log-loss0.033470846712589264
Epoch:73 Batch:240 Log-loss0.04191089794039726
Epoch:73 Batch:320 Log-loss0.031777553260326385
Epoch:73 Batch:400 Log-loss0.03203774616122246
Epoch:73 Batch:480 Log-loss0.055559661239385605
Epoch:73 Batch:560 Log-loss0.04367543011903763
Epoch average log loss:0.039636465038971176
In Epoch73, val_loss:0.03829174023995011, best_val_loss:0.03825401620105184, best_auc:0.9908820199505582
Epoch:74 Batch:0 Log-loss0.03933379799127579
Epoch:74 Batch:80 Log-loss0.041197191923856735
Epoch:74 Batch:160 Log-loss0.03193904459476471
Epoch:74 Batch:240 Log-loss0.03898513689637184
Epoch:74 Batch:320 Log-loss0.028872095048427582
Epoch:74 Batch:400 Log-loss0.04453450068831444
Epoch:74 Batch:480 Log-loss0.05351494252681732
Epoch:74 Batch:560 Log-loss0.03863035514950752
Epoch average log loss:0.03952039785550109
In Epoch74, val_loss:0.03829385247031482, best_val_loss

Epoch:9 Batch:560 Log-loss0.039844170212745667
Epoch average log loss:0.042132799769751726
Model has been saved as temporary_checkpoints/FASTTEXT_RHN_64_64-TEMP.pt.

In Epoch9, val_loss:0.0425120992683235, best_val_loss:0.0425120992683235, best_auc:0.985032869551759
Epoch:10 Batch:0 Log-loss0.04476436972618103
Epoch:10 Batch:80 Log-loss0.05466615781188011
Epoch:10 Batch:160 Log-loss0.050803884863853455
Epoch:10 Batch:240 Log-loss0.047501251101493835
Epoch:10 Batch:320 Log-loss0.037773046642541885
Epoch:10 Batch:400 Log-loss0.039184629917144775
Epoch:10 Batch:480 Log-loss0.04436181113123894
Epoch:10 Batch:560 Log-loss0.036837633699178696
Epoch average log loss:0.04175305679839637
Model has been saved as temporary_checkpoints/FASTTEXT_RHN_64_64-TEMP.pt.

In Epoch10, val_loss:0.04176219172849749, best_val_loss:0.04176219172849749, best_auc:0.985760322660381
Epoch:11 Batch:0 Log-loss0.04284526780247688
Epoch:11 Batch:80 Log-loss0.037643738090991974
Epoch:11 Batch:160 Log-loss0.029082747176

Epoch:24 Batch:0 Log-loss0.033515941351652145
Epoch:24 Batch:80 Log-loss0.0496051125228405
Epoch:24 Batch:160 Log-loss0.047146961092948914
Epoch:24 Batch:240 Log-loss0.036767419427633286
Epoch:24 Batch:320 Log-loss0.036778468638658524
Epoch:24 Batch:400 Log-loss0.03485209867358208
Epoch:24 Batch:480 Log-loss0.030108099803328514
Epoch:24 Batch:560 Log-loss0.04030716419219971
Epoch average log loss:0.0380753274208733
In Epoch24, val_loss:0.04083952330894639, best_val_loss:0.04071669930716485, best_auc:0.9880413748118803
Epoch:25 Batch:0 Log-loss0.03944004327058792
Epoch:25 Batch:80 Log-loss0.03436566889286041
Epoch:25 Batch:160 Log-loss0.04776051640510559
Epoch:25 Batch:240 Log-loss0.030198633670806885
Epoch:25 Batch:320 Log-loss0.05548122897744179
Epoch:25 Batch:400 Log-loss0.059334516525268555
Epoch:25 Batch:480 Log-loss0.046979594975709915
Epoch:25 Batch:560 Log-loss0.04621219262480736
Epoch average log loss:0.03798107707906248
In Epoch25, val_loss:0.040817666684670274, best_val_loss:

Epoch:39 Batch:240 Log-loss0.05300792679190636
Epoch:39 Batch:320 Log-loss0.05596470460295677
Epoch:39 Batch:400 Log-loss0.035542842000722885
Epoch:39 Batch:480 Log-loss0.04786532744765282
Epoch:39 Batch:560 Log-loss0.04455173388123512
Epoch average log loss:0.037376002039361214
In Epoch39, val_loss:0.04056011578414893, best_val_loss:0.040408434608041964, best_auc:0.9882946492066981
Epoch:40 Batch:0 Log-loss0.03857572376728058
Epoch:40 Batch:80 Log-loss0.02615060657262802
Epoch:40 Batch:160 Log-loss0.04137798771262169
Epoch:40 Batch:240 Log-loss0.032091740518808365
Epoch:40 Batch:320 Log-loss0.030469827353954315
Epoch:40 Batch:400 Log-loss0.03673144057393074
Epoch:40 Batch:480 Log-loss0.034315325319767
Epoch:40 Batch:560 Log-loss0.03398074209690094
Epoch average log loss:0.037060772055493935
In Epoch40, val_loss:0.04067558193905147, best_val_loss:0.040408434608041964, best_auc:0.9882946492066981
Epoch:41 Batch:0 Log-loss0.039796385914087296
Epoch:41 Batch:80 Log-loss0.02937209606170654

Epoch:7 Batch:0 Log-loss0.03617720678448677
Epoch:7 Batch:80 Log-loss0.0496673546731472
Epoch:7 Batch:160 Log-loss0.06015283986926079
Epoch:7 Batch:240 Log-loss0.04327564314007759
Epoch:7 Batch:320 Log-loss0.04168299213051796
Epoch:7 Batch:400 Log-loss0.04615413025021553
Epoch:7 Batch:480 Log-loss0.039308320730924606
Epoch:7 Batch:560 Log-loss0.042627155780792236
Epoch average log loss:0.04410304794686713
Model has been saved as temporary_checkpoints/FASTTEXT_RHN_64_64-TEMP.pt.

In Epoch7, val_loss:0.04101343677215864, best_val_loss:0.04101343677215864, best_auc:0.9874742174329275
Epoch:8 Batch:0 Log-loss0.04478418454527855
Epoch:8 Batch:80 Log-loss0.04880278930068016
Epoch:8 Batch:160 Log-loss0.05242016911506653
Epoch:8 Batch:240 Log-loss0.05851307138800621
Epoch:8 Batch:320 Log-loss0.03206633776426315
Epoch:8 Batch:400 Log-loss0.053046245127916336
Epoch:8 Batch:480 Log-loss0.028051307424902916
Epoch:8 Batch:560 Log-loss0.03844509646296501
Epoch average log loss:0.04357143050458814
Mo

Epoch:21 Batch:320 Log-loss0.040978554636240005
Epoch:21 Batch:400 Log-loss0.03788148984313011
Epoch:21 Batch:480 Log-loss0.032204631716012955
Epoch:21 Batch:560 Log-loss0.03286150097846985
Epoch average log loss:0.03903895652121199
In Epoch21, val_loss:0.03843523730654874, best_val_loss:0.0381959077538959, best_auc:0.9903443259157444
Epoch:22 Batch:0 Log-loss0.03506571426987648
Epoch:22 Batch:80 Log-loss0.05018548667430878
Epoch:22 Batch:160 Log-loss0.03942006826400757
Epoch:22 Batch:240 Log-loss0.04464910551905632
Epoch:22 Batch:320 Log-loss0.04036559537053108
Epoch:22 Batch:400 Log-loss0.04386816918849945
Epoch:22 Batch:480 Log-loss0.046606164425611496
Epoch:22 Batch:560 Log-loss0.036583662033081055
Epoch average log loss:0.038848533517947155
In Epoch22, val_loss:0.0381985090815911, best_val_loss:0.0381959077538959, best_auc:0.9903443259157444
Epoch:23 Batch:0 Log-loss0.03290756791830063
Epoch:23 Batch:80 Log-loss0.044387731701135635
Epoch:23 Batch:160 Log-loss0.03148932754993439
Ep

Epoch:36 Batch:160 Log-loss0.03890731930732727
Epoch:36 Batch:240 Log-loss0.03552400320768356
Epoch:36 Batch:320 Log-loss0.03394286334514618
Epoch:36 Batch:400 Log-loss0.022011829540133476
Epoch:36 Batch:480 Log-loss0.045127809047698975
Epoch:36 Batch:560 Log-loss0.02589309588074684
Epoch average log loss:0.03747035656955892
In Epoch36, val_loss:0.03781317906858436, best_val_loss:0.03777586024194641, best_auc:0.9906090771063606
Epoch:37 Batch:0 Log-loss0.04708505794405937
Epoch:37 Batch:80 Log-loss0.030802428722381592
Epoch:37 Batch:160 Log-loss0.0350959375500679
Epoch:37 Batch:240 Log-loss0.044335246086120605
Epoch:37 Batch:320 Log-loss0.03193534538149834
Epoch:37 Batch:400 Log-loss0.020494287833571434
Epoch:37 Batch:480 Log-loss0.041236624121665955
Epoch:37 Batch:560 Log-loss0.03416894003748894
Epoch average log loss:0.03766748538639929
In Epoch37, val_loss:0.03782403675826664, best_val_loss:0.03777586024194641, best_auc:0.9906090771063606
Epoch:38 Batch:0 Log-loss0.03709869459271431

In Epoch51, val_loss:0.037810737664454815, best_val_loss:0.03776315267642132, best_auc:0.9905577007216221
Epoch:52 Batch:0 Log-loss0.05458724871277809
Epoch:52 Batch:80 Log-loss0.042988378554582596
Epoch:52 Batch:160 Log-loss0.029215507209300995
Epoch:52 Batch:240 Log-loss0.052889157086610794
Epoch:52 Batch:320 Log-loss0.03583129867911339
Epoch:52 Batch:400 Log-loss0.03762909024953842
Epoch:52 Batch:480 Log-loss0.030087999999523163
Epoch:52 Batch:560 Log-loss0.03810743987560272
Epoch average log loss:0.03720860525832644
In Epoch52, val_loss:0.037854331273436966, best_val_loss:0.03776315267642132, best_auc:0.9905577007216221
Epoch:53 Batch:0 Log-loss0.03282177075743675
Epoch:53 Batch:80 Log-loss0.04228833690285683
Epoch:53 Batch:160 Log-loss0.029869534075260162
Epoch:53 Batch:240 Log-loss0.024082409217953682
Epoch:53 Batch:320 Log-loss0.04089953750371933
Epoch:53 Batch:400 Log-loss0.03663834556937218
Epoch:53 Batch:480 Log-loss0.046171512454748154
Epoch:53 Batch:560 Log-loss0.0307076405

Epoch:13 Batch:0 Log-loss0.032253239303827286
Epoch:13 Batch:80 Log-loss0.03070041351020336
Epoch:13 Batch:160 Log-loss0.04723528027534485
Epoch:13 Batch:240 Log-loss0.034450117498636246
Epoch:13 Batch:320 Log-loss0.04955190420150757
Epoch:13 Batch:400 Log-loss0.04607824608683586
Epoch:13 Batch:480 Log-loss0.04090959578752518
Epoch:13 Batch:560 Log-loss0.02864951826632023
Epoch average log loss:0.040770111472478936
Model has been saved as temporary_checkpoints/FASTTEXT_RHN_64_64-TEMP.pt.

In Epoch13, val_loss:0.038168949273072544, best_val_loss:0.038168949273072544, best_auc:0.9899251698559312
Epoch:14 Batch:0 Log-loss0.025691932067275047
Epoch:14 Batch:80 Log-loss0.058148279786109924
Epoch:14 Batch:160 Log-loss0.04040117934346199
Epoch:14 Batch:240 Log-loss0.02992095984518528
Epoch:14 Batch:320 Log-loss0.051131755113601685
Epoch:14 Batch:400 Log-loss0.02711285836994648
Epoch:14 Batch:480 Log-loss0.05289420112967491
Epoch:14 Batch:560 Log-loss0.03132263198494911
Epoch average log loss:

Epoch:27 Batch:480 Log-loss0.02275513857603073
Epoch:27 Batch:560 Log-loss0.04262002184987068
Epoch average log loss:0.03845697439475251
In Epoch27, val_loss:0.03756883108218751, best_val_loss:0.03733111265470762, best_auc:0.9905904578762067
Epoch:28 Batch:0 Log-loss0.03924019634723663
Epoch:28 Batch:80 Log-loss0.05011703446507454
Epoch:28 Batch:160 Log-loss0.03766028210520744
Epoch:28 Batch:240 Log-loss0.04296092689037323
Epoch:28 Batch:320 Log-loss0.04188014194369316
Epoch:28 Batch:400 Log-loss0.028997043147683144
Epoch:28 Batch:480 Log-loss0.0510292649269104
Epoch:28 Batch:560 Log-loss0.03416885435581207
Epoch average log loss:0.03827250435881849
In Epoch28, val_loss:0.03758677445342735, best_val_loss:0.03733111265470762, best_auc:0.9905904578762067
Epoch:29 Batch:0 Log-loss0.04772840812802315
Epoch:29 Batch:80 Log-loss0.02682955376803875
Epoch:29 Batch:160 Log-loss0.02664805017411709
Epoch:29 Batch:240 Log-loss0.03521977365016937
Epoch:29 Batch:320 Log-loss0.040229927748441696
Epoc

Epoch:43 Batch:80 Log-loss0.037961434572935104
Epoch:43 Batch:160 Log-loss0.03483762592077255
Epoch:43 Batch:240 Log-loss0.03351212292909622
Epoch:43 Batch:320 Log-loss0.04093945398926735
Epoch:43 Batch:400 Log-loss0.049768637865781784
Epoch:43 Batch:480 Log-loss0.040084417909383774
Epoch:43 Batch:560 Log-loss0.0402580127120018
Epoch average log loss:0.03759565534003611
A pre-trained model at temporary_checkpoints/FASTTEXT_RHN_64_64-TEMP.pt has been loaded.

Model has been saved as checkpoints/FASTTEXT_RHN_64_645.pt.

Choose the torch base model.
Training on fold 6
Epoch:1 Batch:0 Log-loss0.6927940845489502
Epoch:1 Batch:80 Log-loss0.0726037472486496
Epoch:1 Batch:160 Log-loss0.04304327443242073
Epoch:1 Batch:240 Log-loss0.05778472125530243
Epoch:1 Batch:320 Log-loss0.07424319535493851
Epoch:1 Batch:400 Log-loss0.06802014261484146
Epoch:1 Batch:480 Log-loss0.03602615371346474
Epoch:1 Batch:560 Log-loss0.04634514078497887
Epoch average log loss:0.08527183783839323
Model has been saved a

Epoch:14 Batch:320 Log-loss0.031884316354990005
Epoch:14 Batch:400 Log-loss0.029345927760004997
Epoch:14 Batch:480 Log-loss0.06262467056512833
Epoch:14 Batch:560 Log-loss0.03380608186125755
Epoch average log loss:0.04019845632636654
Model has been saved as temporary_checkpoints/FASTTEXT_RHN_64_64-TEMP.pt.

In Epoch14, val_loss:0.03851778102079172, best_val_loss:0.03851778102079172, best_auc:0.9893188794910439
Epoch:15 Batch:0 Log-loss0.03941350802779198
Epoch:15 Batch:80 Log-loss0.033235590904951096
Epoch:15 Batch:160 Log-loss0.047063782811164856
Epoch:15 Batch:240 Log-loss0.045274555683135986
Epoch:15 Batch:320 Log-loss0.03511225804686546
Epoch:15 Batch:400 Log-loss0.03512350097298622
Epoch:15 Batch:480 Log-loss0.0358218215405941
Epoch:15 Batch:560 Log-loss0.042068224400281906
Epoch average log loss:0.03985174111356693
Model has been saved as temporary_checkpoints/FASTTEXT_RHN_64_64-TEMP.pt.

In Epoch15, val_loss:0.038195228366395835, best_val_loss:0.038195228366395835, best_auc:0.989

Epoch:29 Batch:0 Log-loss0.04242418333888054
Epoch:29 Batch:80 Log-loss0.032052576541900635
Epoch:29 Batch:160 Log-loss0.04607522115111351
Epoch:29 Batch:240 Log-loss0.03211600333452225
Epoch:29 Batch:320 Log-loss0.06305466592311859
Epoch:29 Batch:400 Log-loss0.05832577124238014
Epoch:29 Batch:480 Log-loss0.02574724145233631
Epoch:29 Batch:560 Log-loss0.03929305821657181
Epoch average log loss:0.03798205828892865
In Epoch29, val_loss:0.03786773756981707, best_val_loss:0.037820321437183176, best_auc:0.9899850017057168
Epoch:30 Batch:0 Log-loss0.02591921202838421
Epoch:30 Batch:80 Log-loss0.033962465822696686
Epoch:30 Batch:160 Log-loss0.033928029239177704
Epoch:30 Batch:240 Log-loss0.035718392580747604
Epoch:30 Batch:320 Log-loss0.04978758096694946
Epoch:30 Batch:400 Log-loss0.034477606415748596
Epoch:30 Batch:480 Log-loss0.027941538020968437
Epoch:30 Batch:560 Log-loss0.027523469179868698
Epoch average log loss:0.03782896599067109
In Epoch30, val_loss:0.03794131476745904, best_val_loss

Epoch:5 Batch:0 Log-loss0.04819232597947121
Epoch:5 Batch:80 Log-loss0.046335697174072266
Epoch:5 Batch:160 Log-loss0.03540770336985588
Epoch:5 Batch:240 Log-loss0.054816752672195435
Epoch:5 Batch:320 Log-loss0.05290122330188751
Epoch:5 Batch:400 Log-loss0.05128878355026245
Epoch:5 Batch:480 Log-loss0.04393814876675606
Epoch:5 Batch:560 Log-loss0.0402793250977993
Epoch average log loss:0.044765238457226325
Model has been saved as temporary_checkpoints/FASTTEXT_RHN_64_64-TEMP.pt.

In Epoch5, val_loss:0.0425990939515009, best_val_loss:0.0425990939515009, best_auc:0.9835963027268328
Epoch:6 Batch:0 Log-loss0.043334852904081345
Epoch:6 Batch:80 Log-loss0.04659324884414673
Epoch:6 Batch:160 Log-loss0.04048130288720131
Epoch:6 Batch:240 Log-loss0.033043477684259415
Epoch:6 Batch:320 Log-loss0.055700402706861496
Epoch:6 Batch:400 Log-loss0.04544730857014656
Epoch:6 Batch:480 Log-loss0.03856174275279045
Epoch:6 Batch:560 Log-loss0.03481787443161011
Epoch average log loss:0.043945174624345135
M

Epoch:19 Batch:400 Log-loss0.03831661120057106
Epoch:19 Batch:480 Log-loss0.032637886703014374
Epoch:19 Batch:560 Log-loss0.034789133816957474
Epoch average log loss:0.039025595993734896
Model has been saved as temporary_checkpoints/FASTTEXT_RHN_64_64-TEMP.pt.

In Epoch19, val_loss:0.04006720200186018, best_val_loss:0.04006720200186018, best_auc:0.9880115490992544
Epoch:20 Batch:0 Log-loss0.03694509342312813
Epoch:20 Batch:80 Log-loss0.03268841654062271
Epoch:20 Batch:160 Log-loss0.04011614993214607
Epoch:20 Batch:240 Log-loss0.04694761708378792
Epoch:20 Batch:320 Log-loss0.03771110624074936
Epoch:20 Batch:400 Log-loss0.0586770661175251
Epoch:20 Batch:480 Log-loss0.034826524555683136
Epoch:20 Batch:560 Log-loss0.03439858555793762
Epoch average log loss:0.03901751371366637
Model has been saved as temporary_checkpoints/FASTTEXT_RHN_64_64-TEMP.pt.

In Epoch20, val_loss:0.03997707306546649, best_val_loss:0.03997707306546649, best_auc:0.9880455643533805
Epoch:21 Batch:0 Log-loss0.0348148681

Epoch:34 Batch:240 Log-loss0.039723414927721024
Epoch:34 Batch:320 Log-loss0.04476425051689148
Epoch:34 Batch:400 Log-loss0.029548151418566704
Epoch:34 Batch:480 Log-loss0.032862577587366104
Epoch:34 Batch:560 Log-loss0.034602243453264236
Epoch average log loss:0.037255329251222845
In Epoch34, val_loss:0.03994183416685969, best_val_loss:0.039679786274804695, best_auc:0.9883647863109658
Epoch:35 Batch:0 Log-loss0.0524764321744442
Epoch:35 Batch:80 Log-loss0.035855259746313095
Epoch:35 Batch:160 Log-loss0.03219010308384895
Epoch:35 Batch:240 Log-loss0.023379230871796608
Epoch:35 Batch:320 Log-loss0.03696596249938011
Epoch:35 Batch:400 Log-loss0.027117548510432243
Epoch:35 Batch:480 Log-loss0.03594191372394562
Epoch:35 Batch:560 Log-loss0.04457966983318329
Epoch average log loss:0.037166668667591045
In Epoch35, val_loss:0.03995155345286712, best_val_loss:0.039679786274804695, best_auc:0.9883647863109658
Epoch:36 Batch:0 Log-loss0.033967748284339905
Epoch:36 Batch:80 Log-loss0.042463283985

Epoch:6 Batch:80 Log-loss0.03814166039228439
Epoch:6 Batch:160 Log-loss0.056268360465765
Epoch:6 Batch:240 Log-loss0.047410447150468826
Epoch:6 Batch:320 Log-loss0.055771712213754654
Epoch:6 Batch:400 Log-loss0.03949829563498497
Epoch:6 Batch:480 Log-loss0.030791571363806725
Epoch:6 Batch:560 Log-loss0.03229568898677826
Epoch average log loss:0.044981272565200923
Model has been saved as temporary_checkpoints/FASTTEXT_RHN_64_64-TEMP.pt.

In Epoch6, val_loss:0.04155889092983551, best_val_loss:0.04155889092983551, best_auc:0.9859867698818442
Epoch:7 Batch:0 Log-loss0.044706087559461594
Epoch:7 Batch:80 Log-loss0.04482072964310646
Epoch:7 Batch:160 Log-loss0.03476889804005623
Epoch:7 Batch:240 Log-loss0.05308767780661583
Epoch:7 Batch:320 Log-loss0.04733544960618019
Epoch:7 Batch:400 Log-loss0.04073473438620567
Epoch:7 Batch:480 Log-loss0.048633888363838196
Epoch:7 Batch:560 Log-loss0.044384364038705826
Epoch average log loss:0.044326877001939075
Model has been saved as temporary_checkpoin

Epoch:20 Batch:480 Log-loss0.0327741764485836
Epoch:20 Batch:560 Log-loss0.04017656296491623
Epoch average log loss:0.0390448432748339
In Epoch20, val_loss:0.03795222403640442, best_val_loss:0.037926237694796805, best_auc:0.9897850123345697
Epoch:21 Batch:0 Log-loss0.03814211115241051
Epoch:21 Batch:80 Log-loss0.035382095724344254
Epoch:21 Batch:160 Log-loss0.033323440700769424
Epoch:21 Batch:240 Log-loss0.052605804055929184
Epoch:21 Batch:320 Log-loss0.03816227987408638
Epoch:21 Batch:400 Log-loss0.039860185235738754
Epoch:21 Batch:480 Log-loss0.044858891516923904
Epoch:21 Batch:560 Log-loss0.042281363159418106
Epoch average log loss:0.039070909121073784
Model has been saved as temporary_checkpoints/FASTTEXT_RHN_64_64-TEMP.pt.

In Epoch21, val_loss:0.03791436877659677, best_val_loss:0.03791436877659677, best_auc:0.989891544404899
Epoch:22 Batch:0 Log-loss0.029027186334133148
Epoch:22 Batch:80 Log-loss0.044422123581171036
Epoch:22 Batch:160 Log-loss0.035015057772397995
Epoch:22 Batch:2

In Epoch35, val_loss:0.037855840185442184, best_val_loss:0.037684062535458564, best_auc:0.9900457880117605
Epoch:36 Batch:0 Log-loss0.05497657135128975
Epoch:36 Batch:80 Log-loss0.0437898151576519
Epoch:36 Batch:160 Log-loss0.04222365841269493
Epoch:36 Batch:240 Log-loss0.03186464682221413
Epoch:36 Batch:320 Log-loss0.03034449927508831
Epoch:36 Batch:400 Log-loss0.05314840003848076
Epoch:36 Batch:480 Log-loss0.04296601936221123
Epoch:36 Batch:560 Log-loss0.030323464423418045
Epoch average log loss:0.037688776014173135
In Epoch36, val_loss:0.03795074429561351, best_val_loss:0.037684062535458564, best_auc:0.9900457880117605
Epoch:37 Batch:0 Log-loss0.039890535175800323
Epoch:37 Batch:80 Log-loss0.03803515061736107
Epoch:37 Batch:160 Log-loss0.05736413225531578
Epoch:37 Batch:240 Log-loss0.03706048056483269
Epoch:37 Batch:320 Log-loss0.03357957676053047
Epoch:37 Batch:400 Log-loss0.03536348044872284
Epoch:37 Batch:480 Log-loss0.028796495869755745
Epoch:37 Batch:560 Log-loss0.0314621403813

Epoch:10 Batch:160 Log-loss0.04282389581203461
Epoch:10 Batch:240 Log-loss0.031121863052248955
Epoch:10 Batch:320 Log-loss0.05522811785340309
Epoch:10 Batch:400 Log-loss0.041295621544122696
Epoch:10 Batch:480 Log-loss0.037460751831531525
Epoch:10 Batch:560 Log-loss0.04177011176943779
Epoch average log loss:0.041290296713954636
Model has been saved as temporary_checkpoints/FASTTEXT_RHN_64_64-TEMP.pt.

In Epoch10, val_loss:0.04146477673379654, best_val_loss:0.04146477673379654, best_auc:0.9879854702331209
Epoch:11 Batch:0 Log-loss0.03828712925314903
Epoch:11 Batch:80 Log-loss0.029279427602887154
Epoch:11 Batch:160 Log-loss0.03931937366724014
Epoch:11 Batch:240 Log-loss0.03444394841790199
Epoch:11 Batch:320 Log-loss0.051808979362249374
Epoch:11 Batch:400 Log-loss0.040487103164196014
Epoch:11 Batch:480 Log-loss0.05333732068538666
Epoch:11 Batch:560 Log-loss0.038853392004966736
Epoch average log loss:0.040830884674297914
Model has been saved as temporary_checkpoints/FASTTEXT_RHN_64_64-TEMP.

Epoch:24 Batch:480 Log-loss0.0466466061770916
Epoch:24 Batch:560 Log-loss0.03535909950733185
Epoch average log loss:0.038148098016556886
Model has been saved as temporary_checkpoints/FASTTEXT_RHN_64_64-TEMP.pt.

In Epoch24, val_loss:0.04016188253774589, best_val_loss:0.04016188253774589, best_auc:0.9893363387932773
Epoch:25 Batch:0 Log-loss0.03850245103240013
Epoch:25 Batch:80 Log-loss0.04465041682124138
Epoch:25 Batch:160 Log-loss0.040072001516819
Epoch:25 Batch:240 Log-loss0.028470242395997047
Epoch:25 Batch:320 Log-loss0.04116030037403107
Epoch:25 Batch:400 Log-loss0.026606528088450432
Epoch:25 Batch:480 Log-loss0.038054484874010086
Epoch:25 Batch:560 Log-loss0.0354715920984745
Epoch average log loss:0.037899431631168615
In Epoch25, val_loss:0.040314034142484294, best_val_loss:0.04016188253774589, best_auc:0.9893363387932773
Epoch:26 Batch:0 Log-loss0.032303087413311005
Epoch:26 Batch:80 Log-loss0.026805786415934563
Epoch:26 Batch:160 Log-loss0.04925544187426567
Epoch:26 Batch:240 L

Model has been saved as checkpoints/FASTTEXT_RHN_64_649.pt.



In [41]:
# Keep training: pass the already-built `models` to the trainer as `old_models`
# and call keep_train_folds with fold_count=10 and batch_size=256.
new_models, best_logloss, best_auc, best_val_pred = trainer.keep_train_folds(
    X=train_sequences,
    y=training_labels,
    fold_count=10,
    batch_size=256,
    old_models=models,
)

Training on fold 0
Epoch:1 Batch:0 Log-loss0.036531466990709305
Epoch:1 Batch:80 Log-loss0.03582215681672096
Epoch:1 Batch:160 Log-loss0.029018335044384003
Epoch:1 Batch:240 Log-loss0.036196328699588776
Epoch:1 Batch:320 Log-loss0.03609498217701912
Epoch:1 Batch:400 Log-loss0.0301118865609169
Epoch:1 Batch:480 Log-loss0.028371067717671394
Epoch:1 Batch:560 Log-loss0.02657708339393139
Epoch average log loss:0.03519969365359949
Model has been saved as temporary_checkpoints/FASTTEXT_RHN_64_64-TEMP.pt.

In Epoch1, val_loss:0.037408311027521235, best_val_loss:0.037408311027521235, best_auc:0.9905914533781136
Epoch:2 Batch:0 Log-loss0.03476415202021599
Epoch:2 Batch:80 Log-loss0.0448206402361393
Epoch:2 Batch:160 Log-loss0.03184705600142479
Epoch:2 Batch:240 Log-loss0.02453266829252243
Epoch:2 Batch:320 Log-loss0.031927693635225296
Epoch:2 Batch:400 Log-loss0.04199408367276192
Epoch:2 Batch:480 Log-loss0.031146720051765442
Epoch:2 Batch:560 Log-loss0.038211703300476074
Epoch average log loss

Epoch:16 Batch:320 Log-loss0.030546551570296288
Epoch:16 Batch:400 Log-loss0.02839331515133381
Epoch:16 Batch:480 Log-loss0.034630145877599716
Epoch:16 Batch:560 Log-loss0.041434042155742645
Epoch average log loss:0.03535553821296032
In Epoch16, val_loss:0.03739511261529497, best_val_loss:0.03706135061191495, best_auc:0.9906306823656061
Epoch:17 Batch:0 Log-loss0.030000939965248108
Epoch:17 Batch:80 Log-loss0.04034572094678879
Epoch:17 Batch:160 Log-loss0.0307935681194067
Epoch:17 Batch:240 Log-loss0.029938489198684692
Epoch:17 Batch:320 Log-loss0.029702000319957733
Epoch:17 Batch:400 Log-loss0.02555868774652481
Epoch:17 Batch:480 Log-loss0.028783852234482765
Epoch:17 Batch:560 Log-loss0.03363228216767311
Epoch average log loss:0.035218066278113316
In Epoch17, val_loss:0.03736124952589379, best_val_loss:0.03706135061191495, best_auc:0.9906306823656061
Epoch:18 Batch:0 Log-loss0.028585178777575493
Epoch:18 Batch:80 Log-loss0.03286898508667946
Epoch:18 Batch:160 Log-loss0.039684984833002

Epoch:10 Batch:0 Log-loss0.03167102858424187
Epoch:10 Batch:80 Log-loss0.03980262205004692
Epoch:10 Batch:160 Log-loss0.03291260078549385
Epoch:10 Batch:240 Log-loss0.039584625512361526
Epoch:10 Batch:320 Log-loss0.0318765826523304
Epoch:10 Batch:400 Log-loss0.034126050770282745
Epoch:10 Batch:480 Log-loss0.035141151398420334
Epoch:10 Batch:560 Log-loss0.03821359574794769
Epoch average log loss:0.036590098466591114
Model has been saved as temporary_checkpoints/FASTTEXT_RHN_64_64-TEMP.pt.

In Epoch10, val_loss:0.03897156411771602, best_val_loss:0.03897156411771602, best_auc:0.9904688482991184
Epoch:11 Batch:0 Log-loss0.03022613376379013
Epoch:11 Batch:80 Log-loss0.02622983418405056
Epoch:11 Batch:160 Log-loss0.048999711871147156
Epoch:11 Batch:240 Log-loss0.026382675394415855
Epoch:11 Batch:320 Log-loss0.03980107977986336
Epoch:11 Batch:400 Log-loss0.03398565948009491
Epoch:11 Batch:480 Log-loss0.03103755973279476
Epoch:11 Batch:560 Log-loss0.03763815760612488
Epoch average log loss:0.0

Epoch:3 Batch:240 Log-loss0.032005272805690765
Epoch:3 Batch:320 Log-loss0.0390213280916214
Epoch:3 Batch:400 Log-loss0.03865356370806694
Epoch:3 Batch:480 Log-loss0.0460469089448452
Epoch:3 Batch:560 Log-loss0.02496490813791752
Epoch average log loss:0.039944548555649814
Model has been saved as temporary_checkpoints/FASTTEXT_RHN_64_64-TEMP.pt.

In Epoch3, val_loss:0.03834335084060546, best_val_loss:0.03834335084060546, best_auc:0.990730663749567
Epoch:4 Batch:0 Log-loss0.03521014377474785
Epoch:4 Batch:80 Log-loss0.048332978039979935
Epoch:4 Batch:160 Log-loss0.051618512719869614
Epoch:4 Batch:240 Log-loss0.033066276460886
Epoch:4 Batch:320 Log-loss0.04460427537560463
Epoch:4 Batch:400 Log-loss0.03888536989688873
Epoch:4 Batch:480 Log-loss0.032224517315626144
Epoch:4 Batch:560 Log-loss0.0522904247045517
Epoch average log loss:0.039509261949985684
Model has been saved as temporary_checkpoints/FASTTEXT_RHN_64_64-TEMP.pt.

In Epoch4, val_loss:0.0379504426149232, best_val_loss:0.037950442

Epoch:18 Batch:240 Log-loss0.030680930241942406
Epoch:18 Batch:320 Log-loss0.042495403438806534
Epoch:18 Batch:400 Log-loss0.04091886058449745
Epoch:18 Batch:480 Log-loss0.03740249201655388
Epoch:18 Batch:560 Log-loss0.049633562564849854
Epoch average log loss:0.036289786494203974
In Epoch18, val_loss:0.03763787818940871, best_val_loss:0.03755628232418578, best_auc:0.991321868146562
Epoch:19 Batch:0 Log-loss0.04028857871890068
Epoch:19 Batch:80 Log-loss0.029782412573695183
Epoch:19 Batch:160 Log-loss0.0276960376650095
Epoch:19 Batch:240 Log-loss0.0395294725894928
Epoch:19 Batch:320 Log-loss0.062283992767333984
Epoch:19 Batch:400 Log-loss0.04187283292412758
Epoch:19 Batch:480 Log-loss0.03349567577242851
Epoch:19 Batch:560 Log-loss0.05303627625107765
Epoch average log loss:0.036181867871034355
In Epoch19, val_loss:0.037795202638426784, best_val_loss:0.03755628232418578, best_auc:0.991321868146562
Epoch:20 Batch:0 Log-loss0.04225537180900574
Epoch:20 Batch:80 Log-loss0.034826185554265976


Model has been saved as temporary_checkpoints/FASTTEXT_RHN_64_64-TEMP.pt.

In Epoch9, val_loss:0.04031868534488856, best_val_loss:0.04031868534488856, best_auc:0.988507101980355
Epoch:10 Batch:0 Log-loss0.037676919251680374
Epoch:10 Batch:80 Log-loss0.026269955560564995
Epoch:10 Batch:160 Log-loss0.032758038491010666
Epoch:10 Batch:240 Log-loss0.03625533729791641
Epoch:10 Batch:320 Log-loss0.03885022923350334
Epoch:10 Batch:400 Log-loss0.03763432055711746
Epoch:10 Batch:480 Log-loss0.03844169154763222
Epoch:10 Batch:560 Log-loss0.029993753880262375
Epoch average log loss:0.03610843778920493
In Epoch10, val_loss:0.0408912177192061, best_val_loss:0.04031868534488856, best_auc:0.988507101980355
Epoch:11 Batch:0 Log-loss0.04773542657494545
Epoch:11 Batch:80 Log-loss0.03310179337859154
Epoch:11 Batch:160 Log-loss0.040052250027656555
Epoch:11 Batch:240 Log-loss0.030351713299751282
Epoch:11 Batch:320 Log-loss0.056189220398664474
Epoch:11 Batch:400 Log-loss0.024402394890785217
Epoch:11 Batch:4

Epoch:4 Batch:80 Log-loss0.037233926355838776
Epoch:4 Batch:160 Log-loss0.044129639863967896
Epoch:4 Batch:240 Log-loss0.05626616254448891
Epoch:4 Batch:320 Log-loss0.03646199777722359
Epoch:4 Batch:400 Log-loss0.0284369308501482
Epoch:4 Batch:480 Log-loss0.041317906230688095
Epoch:4 Batch:560 Log-loss0.032546672970056534
Epoch average log loss:0.03771523407527379
In Epoch4, val_loss:0.03833784164551411, best_val_loss:0.037972753504137126, best_auc:0.9901462779772943
Epoch:5 Batch:0 Log-loss0.03403029963374138
Epoch:5 Batch:80 Log-loss0.03243027999997139
Epoch:5 Batch:160 Log-loss0.035253364592790604
Epoch:5 Batch:240 Log-loss0.036598023027181625
Epoch:5 Batch:320 Log-loss0.04244200512766838
Epoch:5 Batch:400 Log-loss0.04261108115315437
Epoch:5 Batch:480 Log-loss0.032846126705408096
Epoch:5 Batch:560 Log-loss0.04084589332342148
Epoch average log loss:0.03758782513073779
In Epoch5, val_loss:0.03798649841787571, best_val_loss:0.037972753504137126, best_auc:0.9901462779772943
Epoch:6 Batc

  loss = -(transformed_labels * np.log(y_pred)).sum(axis=1)
  loss = -(transformed_labels * np.log(y_pred)).sum(axis=1)


In Epoch10, val_loss:nan, best_val_loss:0.03788784150779539, best_auc:0.990084701347369
Epoch:11 Batch:0 Log-loss0.04602649435400963
Epoch:11 Batch:80 Log-loss0.03017587773501873
Epoch:11 Batch:160 Log-loss0.03831406682729721
Epoch:11 Batch:240 Log-loss0.04492254555225372
Epoch:11 Batch:320 Log-loss0.0332631878554821
Epoch:11 Batch:400 Log-loss0.03734120354056358
Epoch:11 Batch:480 Log-loss0.034766972064971924
Epoch:11 Batch:560 Log-loss0.04941846802830696
Epoch average log loss:0.036114837320721044
In Epoch11, val_loss:nan, best_val_loss:0.03788784150779539, best_auc:0.990084701347369
Epoch:12 Batch:0 Log-loss0.044260889291763306
Epoch:12 Batch:80 Log-loss0.04089733585715294
Epoch:12 Batch:160 Log-loss0.04165925458073616
Epoch:12 Batch:240 Log-loss0.043058544397354126
Epoch:12 Batch:320 Log-loss0.042819809168577194
Epoch:12 Batch:400 Log-loss0.04282712936401367
Epoch:12 Batch:480 Log-loss0.03803418204188347
Epoch:12 Batch:560 Log-loss0.03983001410961151
Epoch average log loss:0.036019

Epoch:5 Batch:400 Log-loss0.030093243345618248
Epoch:5 Batch:480 Log-loss0.018039489164948463
Epoch:5 Batch:560 Log-loss0.04151514172554016
Epoch average log loss:0.03797521377314946
In Epoch5, val_loss:0.03819615840981692, best_val_loss:0.03775466213959252, best_auc:0.99036589680514
Epoch:6 Batch:0 Log-loss0.02336401306092739
Epoch:6 Batch:80 Log-loss0.04573683440685272
Epoch:6 Batch:160 Log-loss0.04076691344380379
Epoch:6 Batch:240 Log-loss0.04391122981905937
Epoch:6 Batch:320 Log-loss0.044730644673109055
Epoch:6 Batch:400 Log-loss0.0320717953145504
Epoch:6 Batch:480 Log-loss0.037110552191734314
Epoch:6 Batch:560 Log-loss0.028581203892827034
Epoch average log loss:0.03761226306004184
In Epoch6, val_loss:0.038166955782558146, best_val_loss:0.03775466213959252, best_auc:0.99036589680514
Epoch:7 Batch:0 Log-loss0.03393092006444931
Epoch:7 Batch:80 Log-loss0.033407505601644516
Epoch:7 Batch:160 Log-loss0.049434076994657516
Epoch:7 Batch:240 Log-loss0.02716623991727829
Epoch:7 Batch:320 L

Epoch:1 Batch:0 Log-loss0.05207217112183571
Epoch:1 Batch:80 Log-loss0.03845914080739021
Epoch:1 Batch:160 Log-loss0.035605866461992264
Epoch:1 Batch:240 Log-loss0.04167464002966881
Epoch:1 Batch:320 Log-loss0.052951741963624954
Epoch:1 Batch:400 Log-loss0.03308295086026192
Epoch:1 Batch:480 Log-loss0.02545510232448578
Epoch:1 Batch:560 Log-loss0.026346463710069656
Epoch average log loss:0.03555475313748632
Model has been saved as temporary_checkpoints/FASTTEXT_RHN_64_64-TEMP.pt.

In Epoch1, val_loss:0.03954641780618133, best_val_loss:0.03954641780618133, best_auc:0.9896234366979048
Epoch:2 Batch:0 Log-loss0.04751436412334442
Epoch:2 Batch:80 Log-loss0.030747773125767708
Epoch:2 Batch:160 Log-loss0.027692407369613647
Epoch:2 Batch:240 Log-loss0.03106490522623062
Epoch:2 Batch:320 Log-loss0.03448696807026863
Epoch:2 Batch:400 Log-loss0.03421015664935112
Epoch:2 Batch:480 Log-loss0.033812977373600006
Epoch:2 Batch:560 Log-loss0.04125376418232918
Epoch average log loss:0.03916513882910034

Epoch:16 Batch:240 Log-loss0.03371323272585869
Epoch:16 Batch:320 Log-loss0.04443761706352234
Epoch:16 Batch:400 Log-loss0.02794976532459259
Epoch:16 Batch:480 Log-loss0.028991661965847015
Epoch:16 Batch:560 Log-loss0.022236615419387817
Epoch average log loss:0.035471910278179815
In Epoch16, val_loss:0.038446196350147344, best_val_loss:0.03782607360579734, best_auc:0.9902244769918855
Epoch:17 Batch:0 Log-loss0.03249521926045418
Epoch:17 Batch:80 Log-loss0.03803713619709015
Epoch:17 Batch:160 Log-loss0.03942335024476051
Epoch:17 Batch:240 Log-loss0.04239571467041969
Epoch:17 Batch:320 Log-loss0.04388946667313576
Epoch:17 Batch:400 Log-loss0.028058985248208046
Epoch:17 Batch:480 Log-loss0.041725043207407
Epoch:17 Batch:560 Log-loss0.04402457922697067
Epoch average log loss:0.03555354495931949
In Epoch17, val_loss:0.038251327148832816, best_val_loss:0.03782607360579734, best_auc:0.9902244769918855
Epoch:18 Batch:0 Log-loss0.0230376198887825
Epoch:18 Batch:80 Log-loss0.029103966429829597
E

Epoch:8 Batch:560 Log-loss0.018029995262622833
Epoch average log loss:0.03682059693216745
In Epoch8, val_loss:0.040302184031095596, best_val_loss:0.03970959235260172, best_auc:0.9884084612497316
Epoch:9 Batch:0 Log-loss0.033474210649728775
Epoch:9 Batch:80 Log-loss0.02909381128847599
Epoch:9 Batch:160 Log-loss0.02780190296471119
Epoch:9 Batch:240 Log-loss0.027900410816073418
Epoch:9 Batch:320 Log-loss0.035261120647192
Epoch:9 Batch:400 Log-loss0.034019362181425095
Epoch:9 Batch:480 Log-loss0.029447287321090698
Epoch:9 Batch:560 Log-loss0.04000287875533104
Epoch average log loss:0.03633360559553174
In Epoch9, val_loss:0.0400507137951366, best_val_loss:0.03970959235260172, best_auc:0.9884084612497316
Epoch:10 Batch:0 Log-loss0.031076958402991295
Epoch:10 Batch:80 Log-loss0.0312681682407856
Epoch:10 Batch:160 Log-loss0.04380783438682556
Epoch:10 Batch:240 Log-loss0.032192766666412354
Epoch:10 Batch:320 Log-loss0.04843224585056305
Epoch:10 Batch:400 Log-loss0.04303550347685814
Epoch:10 Bat

Epoch:9 Batch:0 Log-loss0.035227056592702866
Epoch:9 Batch:80 Log-loss0.03321220353245735
Epoch:9 Batch:160 Log-loss0.040791433304548264
Epoch:9 Batch:240 Log-loss0.03755727782845497
Epoch:9 Batch:320 Log-loss0.02223108522593975
Epoch:9 Batch:400 Log-loss0.036377791315317154
Epoch:9 Batch:480 Log-loss0.035230815410614014
Epoch:9 Batch:560 Log-loss0.040438611060380936
Epoch average log loss:0.036815993665784065
In Epoch9, val_loss:0.03840831145742161, best_val_loss:0.03751126514220742, best_auc:0.9898700414891296
Epoch:10 Batch:0 Log-loss0.03399014472961426
Epoch:10 Batch:80 Log-loss0.018776964396238327
Epoch:10 Batch:160 Log-loss0.05743438005447388
Epoch:10 Batch:240 Log-loss0.03840179368853569
Epoch:10 Batch:320 Log-loss0.03482433781027794
Epoch:10 Batch:400 Log-loss0.03970171883702278
Epoch:10 Batch:480 Log-loss0.029150905087590218
Epoch:10 Batch:560 Log-loss0.03424927219748497
Epoch average log loss:0.03674386511224189
In Epoch10, val_loss:0.03830415780585586, best_val_loss:0.037511

Epoch:7 Batch:80 Log-loss0.04403877258300781
Epoch:7 Batch:160 Log-loss0.04668818414211273
Epoch:7 Batch:240 Log-loss0.0374080166220665
Epoch:7 Batch:320 Log-loss0.02633543312549591
Epoch:7 Batch:400 Log-loss0.04821203649044037
Epoch:7 Batch:480 Log-loss0.037637703120708466
Epoch:7 Batch:560 Log-loss0.042374834418296814
Epoch average log loss:0.036936644611081905
In Epoch7, val_loss:0.04104022416694721, best_val_loss:0.04034946693479865, best_auc:0.9893968306623105
Epoch:8 Batch:0 Log-loss0.032038066536188126
Epoch:8 Batch:80 Log-loss0.03901800885796547
Epoch:8 Batch:160 Log-loss0.04085184633731842
Epoch:8 Batch:240 Log-loss0.041280340403318405
Epoch:8 Batch:320 Log-loss0.03356344252824783
Epoch:8 Batch:400 Log-loss0.02586238831281662
Epoch:8 Batch:480 Log-loss0.02725793607532978
Epoch:8 Batch:560 Log-loss0.03114374913275242
Epoch average log loss:0.03686091272559549
In Epoch8, val_loss:0.04097913077627538, best_val_loss:0.04034946693479865, best_auc:0.9893968306623105
Epoch:9 Batch:0 

Epoch:22 Batch:480 Log-loss0.028182735666632652
Epoch:22 Batch:560 Log-loss0.0524577759206295
Epoch average log loss:0.03471323919116653
In Epoch22, val_loss:0.04071607518488194, best_val_loss:0.04012715772403915, best_auc:0.9895871182630483
Epoch:23 Batch:0 Log-loss0.039027612656354904
Epoch:23 Batch:80 Log-loss0.02714204601943493
Epoch:23 Batch:160 Log-loss0.04840656742453575
Epoch:23 Batch:240 Log-loss0.027546949684619904
Epoch:23 Batch:320 Log-loss0.025439567863941193
Epoch:23 Batch:400 Log-loss0.024166835471987724
Epoch:23 Batch:480 Log-loss0.044597651809453964
Epoch:23 Batch:560 Log-loss0.028611093759536743
Epoch average log loss:0.03460068312540118
A pre-trained model at temporary_checkpoints/FASTTEXT_RHN_64_64-TEMP.pt has been loaded.

Model has been saved as checkpoints/FASTTEXT_RHN_64_649.pt.



In [45]:
# Display the log-loss value that the keep_train_folds call returned alongside the models
# (presumably aggregated over the folds — confirm in PyTorchModelTrainer).
best_logloss

0.038431989078936295

## Make predictions

In [49]:
import numpy as np
from sklearn.metrics import roc_auc_score

# Stack the entries of best_val_pred along the first axis and score the result
# against the training labels.
# NOTE(review): assumes the stacked rows line up with training_labels — confirm fold ordering.
train_fold_preditcions = np.concatenate(best_val_pred)
training_auc = roc_auc_score(y_true=training_labels, y_score=train_fold_preditcions)
print("Training AUC", training_auc)

Training AUC 0.9898540098272272


In [51]:
import pandas as pd
# Locations of the train/test CSV files, relative to the working directory.
path = 'Dataset/'
TRAIN_DATA_FILE = '{}train.csv'.format(path)
TEST_DATA_FILE = '{}test.csv'.format(path)

# Read both files into DataFrames; later cells take the "id" column from them.
train_df = pd.read_csv(TRAIN_DATA_FILE)
test_df = pd.read_csv(TEST_DATA_FILE)

In [53]:
# Label columns of the submission, in output order.
CLASSES = ["toxic", "severe_toxic", "obscene", "threat", "insult", "identity_hate"]
# Common prefix for every result file written by the cells below.
submit_path_prefix = "results/rhn/Fasttext-tunedRHN-" + str(MAX_SEQUENCE_LENGTH)

print("Predicting testing results...")
# Collect one prediction array per fold model.
test_predicts_list = []
for model in new_models:
    fold_predicts = model.predict(test_sequences, batch_size=256, verbose=1)
    test_predicts_list.append(fold_predicts)

# Fail with a clear message instead of an IndexError when there is nothing to average.
if not test_predicts_list:
    raise ValueError("new_models is empty: no fold predictions to average")

# Element-wise mean over the folds; accumulate in float64 regardless of the
# dtype the models return.
mean_test_predicts = np.mean(test_predicts_list, axis=0, dtype=np.float64)

# NOTE(review): assumes test_df rows are in the same order as test_sequences — confirm.
test_ids = test_df["id"].values

# Final frame: "id" first, then one column per class. pandas raises ValueError
# if the number of ids does not match the number of prediction rows.
test_predicts = pd.DataFrame(data=mean_test_predicts, columns=CLASSES)
test_predicts.insert(0, "id", test_ids)

Predicting testing results...


NameError: name 'val_loss' is not defined

In [54]:
# Tag the file name with best_logloss and best_auc, then write the test predictions as CSV.
# NOTE(review): "{:4f}" sets a minimum field width of 4 (six decimals are still printed),
# not four decimal places; "{:.4f}" may have been intended — confirm before changing,
# since it would alter the output file names.
metrics_suffix = "-L{:4f}-A{:4f}.csv".format(best_logloss, best_auc)
submit_path = submit_path_prefix + metrics_suffix
test_predicts.to_csv(submit_path, index=False)

In [56]:
print("Predicting training results...")

# Take the ids from the training CSV as an (n, 1) column.
train_ids = train_df["id"].values.reshape((-1, 1))

# Wrap the stacked fold predictions in a frame with "id" first, then the class columns.
# NOTE(review): assumes rows of train_fold_preditcions follow train_df order — confirm.
output_columns = ["id"] + CLASSES
train_predicts = pd.DataFrame(data=train_fold_preditcions, columns=CLASSES)
train_predicts["id"] = train_ids
train_predicts = train_predicts[output_columns]

# Same naming scheme as the test submission, with a "-Train" marker.
train_metrics_suffix = "-Train-L{:4f}-A{:4f}.csv".format(best_logloss, best_auc)
submit_path = submit_path_prefix + train_metrics_suffix
train_predicts.to_csv(submit_path, index=False)

Predicting training results...
