In [1]:
import os
import pickle
import numpy as np
import time

from gensim.models import Word2Vec
from keras.callbacks import Callback, EarlyStopping
from sklearn.metrics import log_loss, roc_auc_score, accuracy_score, hamming_loss, f1_score
from skopt import gp_minimize
from skopt.space import Real, Integer, Categorical

from models import get_rnn_model
from cm import multilabel_confusion_matrix
from data_process import get_embedding_matrix, data_generator, get_all_notes_labels, get_features, get_targets, get_gold_label_targets

# Customized Evaluation for keras model
class CustomEvaluation(Callback):
    """Keras callback that prints extra validation metrics at the end of epochs.

    Every ``interval`` epochs the model predicts each validation sample with
    ``predict_on_batch``; the concatenated predictions are scored against the
    concatenated targets and ROC-AUC, log-loss, Hamming loss, subset accuracy
    and micro F1 are printed. Nothing is written back to ``logs``.

    Args:
        validation_data: two-item iterable ``(X_val, y_val)``. Both items are
            iterated / concatenated sample by sample. The empty default is
            kept for interface compatibility but cannot be unpacked, so a
            real pair has to be supplied.
        interval: metrics are computed when ``epoch % interval == 0``.
    """

    def __init__(self, validation_data=(), interval=1):
        # Name this class (not Callback) in super() so that
        # Callback.__init__ itself runs and sets up the base-class state.
        super(CustomEvaluation, self).__init__()

        self.interval = interval
        self.X_val, self.y_val = list(validation_data)

    def on_epoch_end(self, epoch, logs=None):
        """Compute and print the additional validation metrics for ``epoch``.

        ``logs`` is accepted for Keras API compatibility and is not used.
        """
        if epoch % self.interval != 0:
            return

        # Samples are predicted one at a time, then flattened into one array
        # so the sklearn metrics see a single target/prediction pair.
        y_pred = np.concatenate(
            [np.squeeze(self.model.predict_on_batch(x)) for x in self.X_val]
        )
        y_val = np.concatenate(self.y_val)
        # Threshold probabilities at 0.5 for the metrics that need hard labels.
        y_pred_ham = y_pred > 0.5

        roc = roc_auc_score(y_val, y_pred, average='micro')
        loss = log_loss(y_val, y_pred)
        ham = hamming_loss(y_val, y_pred_ham)
        sub = accuracy_score(y_val, y_pred_ham)
        f1 = f1_score(y_val, y_pred_ham, average='micro')
        print("Adiitional val metrics: - ROC-AUC: %.6f - Log-Loss: %.6f - Hamming-Loss: %.6f - Subset-Accuracy: %.6f - F1-Score: %.6f" % (roc, loss, ham, sub, f1))
            
def model_train(param, 
                notes_train, 
                labels_train, 
                up_notes_train, 
                up_labels_train, 
                gold_labels_train, 
                notes_test, 
                labels_test, 
                gold_labels_test,
                results_file,
                verbose=1):
    """Train one RNN configuration and return its micro-averaged gold-label F1.

    Steps: optionally upsample the training notes, fit Word2Vec on the
    train + test notes, build the model returned by ``get_rnn_model``, train
    it with early stopping on ``val_loss`` (the test set doubles as the
    validation set), predict the test notes one at a time, score the
    predictions against the gold labels and append a summary line to
    ``results_file``.

    Args:
        param: dict with keys 'up', 'window_size', 'embed_size', 'latent_dim',
            'dropout_rate', 'epochs' and 'category'. 'embed_size' is
            multiplied by 10 and 'latent_dim' by 64 before use.
        notes_train: training notes; paired element-wise with
            ``up_notes_train``.
        labels_train: training labels; paired element-wise with
            ``up_labels_train``.
        up_notes_train: per-note content that is repeated ``up`` times and
            appended to the matching entry of ``notes_train``.
        up_labels_train: label counterpart of ``up_notes_train``.
        gold_labels_train: gold labels of the training notes.
        notes_test: held-out notes used for validation and final prediction.
        labels_test: labels of ``notes_test``.
        gold_labels_test: gold labels of ``notes_test``.
        results_file: path of the text file the run summary is appended to.
        verbose: 0 silences this function's progress messages and the Keras
            progress output; 2 additionally prints confusion matrices and
            per-class F1 scores. The data helpers are always called with
            ``verbose=1``.

    Returns:
        The micro-averaged F1 score computed on the gold labels.
    """
    
    print('*'*80)
    print("Parameters (note: embed_size*10, latent_dim*64):\n", param)
    print('*'*80)
    
    start_time = time.time()
    
    # assign parameters
    up = int(param['up'])
    window_size = int(param['window_size'])
    embed_size = int(param['embed_size'] * 10)
    latent_dim = int(param['latent_dim'] * 64)
    dropout_rate = param['dropout_rate']
    # Cast like the other integer hyper-parameters: the optimizer may hand
    # over a numpy integer rather than a plain int.
    epochs = int(param['epochs'])
    category = param['category']
    max_features = 60000 #param['max_features']
    train_embed = True #param['train_embed']
    model_type = 'CuDNNLSTM' #param['model_type']
    
    # upsampling
    if up > 0:
        if verbose != 0: print('upsampling for %d times...' % (up))
        notes_train = [note + up * up_note for note, up_note in zip(notes_train, up_notes_train)]
        labels_train = [label + up * up_label for label, up_label in zip(labels_train, up_labels_train)]
    notes = notes_train + notes_test
    gold_labels = gold_labels_train + gold_labels_test
    
    # prepare features
    X_train_seq, X_test_seq, word_index = get_features(max_features, notes_train, notes_test, verbose=1)
    nb_words = min(max_features, len(word_index))

    # prepare embedding matrix
    # Bound up front so the get_rnn_model call below never hits an unbound
    # local if train_embed is switched off.
    # NOTE(review): confirm get_rnn_model accepts embedding_matrix=None.
    embedding_matrix = None
    if train_embed:
        if verbose != 0: print('preparing pretrained embedding matrix ...')
        # Word2Vec is fitted on train + test notes together.
        w2v = Word2Vec(notes, size=embed_size, window=window_size, min_count=1, workers=4)
        embedding_index = dict(zip(w2v.wv.index2word, w2v.wv.vectors))
        embedding_matrix = get_embedding_matrix(embedding_index=embedding_index, 
                                                word_index=word_index, 
                                                max_features=max_features, 
                                                embed_size=embed_size)
        
    # prepare targets
    Y_train, Y_test, mlb, num_labels = get_targets(labels_train, labels_test, category, verbose=1)  

    # get rnn model
    model = get_rnn_model(nb_words=nb_words, 
                          num_labels=num_labels, 
                          embed_size=embed_size, 
                          latent_dim=latent_dim, 
                          model_type=model_type, 
                          embedding_matrix=embedding_matrix, 
                          dropout=dropout_rate, 
                          train_embed=train_embed)
    if verbose != 0: 
        print('model summary:')
        # summary() prints the table itself and returns None, so it is not
        # wrapped in print().
        model.summary()
    
    # model compiling
    model.compile(loss='binary_crossentropy',
                  optimizer='adam',
                  metrics=['accuracy'])

    # model training
    if verbose != 0: print('\ntraining model ...')
    custevl = CustomEvaluation(validation_data=(X_test_seq, Y_test), interval=1)
    earlystop = EarlyStopping(monitor='val_loss', min_delta=0.0005, patience=2, verbose=0, mode='auto')
    train_gen = data_generator(X_train_seq, Y_train)
    test_gen = data_generator(X_test_seq, Y_test)
    v = 1 if verbose != 0 else 0  
    # One generator step per sample for both training and validation.
    model.fit_generator(train_gen,
                        steps_per_epoch=len(Y_train),
                        epochs=epochs,
                        validation_data=test_gen,
                        validation_steps=len(Y_test),
                        callbacks=[custevl, earlystop],
                        verbose=v)

    # prediction of test data
    if verbose != 0: print('predicting test data ...')
    Y_pred = []
    for x in X_test_seq:
        # Each note is fed as its own batch of size 1.
        x = np.array(x).reshape((1,-1))
        y_pred = np.squeeze(model.predict_on_batch(x))
        Y_pred.append(y_pred)
    Y_pred_concat = np.concatenate(Y_pred)
    Y_val = np.concatenate(Y_test)

    # confusion matrix 
    if verbose == 2: 
        cm = multilabel_confusion_matrix(Y_val, np.where(Y_pred_concat > 0.5, 1, 0))
        for i, j in zip(cm, mlb.classes_):
            print(j+':\n', i,'\n')

    # prepare gold label targets
    Y_gold_test, Y_gold_pred, gmlb = get_gold_label_targets(Y_pred, gold_labels, gold_labels_test, mlb, category=category, verbose=1) 

    # f1 scores for gold label
    f1 = f1_score(Y_gold_test, Y_gold_pred, average='micro')
    print('\nF1 Scores for global labels:\nALL (average="micro"):', f1)
    
    # confusion matrix for gold label
    if verbose == 2: 
        gcm = multilabel_confusion_matrix(np.concatenate(Y_gold_test), np.concatenate(Y_gold_pred))
        for i, j in zip(gcm, gmlb.classes_):
            print(j+':\n', i,'\n')
    
    # f1 score list
    if verbose == 2: 
        f1_all = f1_score(Y_gold_test, Y_gold_pred, average=None)
        for i, j in zip(f1_all, gmlb.classes_):
            print(j+': '+str(i))
    
    print('\n')
    
    elapsed_time = time.time() - start_time
    
    # save results (appended, so successive runs accumulate in one file)
    with open(results_file,"a") as f:
        f.write("Parameters (note: embed_size*10, ltent_dim*64):\n" + str(param))
        f.write('\nF1 Scores for global labels(average="micro"): %.3f; Running time: %.1f\n' % (f1, elapsed_time))
          
    return f1

def bayes_opt(space):
    """Objective for ``gp_minimize``: negated gold-label micro F1 of one run.

    ``space`` holds the sampled hyper-parameter values in this order:

        0. up            - times of upsampling for the training data
        1. window_size   - window size for word2vec
        2. embed_size    - embedding length (scaled by 10 in model_train)
        3. latent_dim    - hidden layer dimension (scaled by 64 in model_train)
        4. dropout_rate  - rate of the dropout layers
        5. epochs        - number of training epochs
        6. category      - label category passed through to the data helpers

    max_features, train_embed and model_type are not searched; they are
    fixed inside ``model_train``.

    The data sets are read from the module-level globals that the
    ``__main__`` section populates. The F1 score is negated because the
    optimizer minimizes.
    """
    # One results file per calendar day; model_train appends to it.
    today = time.strftime("%Y%m%d")
    results_file = "opt_results_" + today + ".txt"

    names = ('up',
             'window_size',
             'embed_size',
             'latent_dim',
             'dropout_rate',
             'epochs',
             'category')
    # Positional lookup keeps the key order identical to the search space.
    param = {name: space[idx] for idx, name in enumerate(names)}

    score = model_train(param,
                        notes_train,
                        labels_train,
                        up_notes_train,
                        up_labels_train,
                        gold_labels_train,
                        notes_test,
                        labels_test,
                        gold_labels_test,
                        results_file=results_file)

    return -score

if __name__ == "__main__":

    # Load the eight data sets, in a fixed order, from the local pickle cache
    # when it exists; otherwise parse the raw corpus and write the cache.
    if os.path.exists('loaded_data.dat'):

        # NOTE: unpickling can execute arbitrary code; only use a cache file
        # that this script wrote itself.
        with open('loaded_data.dat', 'rb') as cache:
            (notes_train,
             labels_train,
             up_notes_train,
             up_labels_train,
             gold_labels_train,
             notes_test,
             labels_test,
             gold_labels_test) = [pickle.load(cache) for _ in range(8)]

    else:

        train_set_1 = get_all_notes_labels('/host_home/data/i2b2/2014/training/training-RiskFactors-Complete-Set1')
        train_set_2 = get_all_notes_labels('/host_home/data/i2b2/2014/training/training-RiskFactors-Complete-Set2')

        # Concatenate the two training sets field by field.
        (notes_train,
         labels_train,
         up_notes_train,
         up_labels_train,
         gold_labels_train) = [part_1 + part_2 for part_1, part_2 in zip(train_set_1, train_set_2)]

        # The upsampling fields of the test set are not used.
        notes_test, labels_test, _1, _2, gold_labels_test = get_all_notes_labels('/host_home/data/i2b2/2014/testing/testing-RiskFactors-Complete')

        with open('loaded_data.dat', 'wb') as cache:
            for item in (notes_train,
                         labels_train,
                         up_notes_train,
                         up_labels_train,
                         gold_labels_train,
                         notes_test,
                         labels_test,
                         gold_labels_test):
                pickle.dump(item, cache)

    # Search space; the order must match the positional lookup in bayes_opt.
    # max_features, train_embed and model_type are fixed inside model_train
    # and therefore not part of the space.
    space = [
        Integer(5, 15, name='up'),
        Integer(3, 5, name='window_size'),
        Integer(3, 5, name='embed_size'),
        Integer(3, 5, name='latent_dim'),
        Real(0, 0.5, name='dropout_rate'),
        Integer(20, 21, name='epochs'),
        Categorical([None], name='category'),
    ]

    # Initial point handed to the optimizer, in the same order as `space`.
    x0 = [12, 3, 4, 5, 0.0, 21, None]

    # Run the Gaussian-process optimization over bayes_opt.
    res = gp_minimize(bayes_opt, space, x0=x0, n_calls=100, verbose=True)

    # Append the optimizer result to a per-day summary file.
    res_file = "res_final_" + time.strftime("%Y%m%d") + ".txt"
    with open(res_file, "a") as out:
        out.write('opt by keras:\n%s\n' % str(res))

    # python command: python heart_no_pad_opt_comparison.py > heart_no_pad_opt_comparison.log

Using TensorFlow backend.


Iteration No: 1 started. Evaluating function at provided point.
********************************************************************************
Parameters (note: embed_size*10, latent_dim*64):
 {'up': 12, 'window_size': 3, 'embed_size': 4, 'latent_dim': 5, 'dropout_rate': 0.0, 'epochs': 21, 'category': None}
********************************************************************************
upsampling for 12 times...
preparing features ...
preparing pretrained embedding matrix ...
preparing targets ...
Instructions for updating:
Colocations handled automatically by placer.
model summary:
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_1 (InputLayer)         (None, None)              0         
_________________________________________________________________
embedding_1 (Embedding)      (None, None, 40)          1799360   
_________________________________________________________________
bidirection

Epoch 1/20
Adiitional val metrics: - ROC-AUC: 0.954813 - Log-Loss: 3.535779 - Hamming-Loss: 0.006480 - Subset-Accuracy: 0.715960 - F1-Score: 0.711552
Epoch 2/20
Adiitional val metrics: - ROC-AUC: 0.976983 - Log-Loss: 2.744638 - Hamming-Loss: 0.003494 - Subset-Accuracy: 0.859679 - F1-Score: 0.842283
Epoch 3/20
Adiitional val metrics: - ROC-AUC: 0.981350 - Log-Loss: 2.379633 - Hamming-Loss: 0.002667 - Subset-Accuracy: 0.878473 - F1-Score: 0.876607
Epoch 4/20
Adiitional val metrics: - ROC-AUC: 0.984865 - Log-Loss: 1.975803 - Hamming-Loss: 0.001771 - Subset-Accuracy: 0.914141 - F1-Score: 0.916760
Epoch 5/20
Adiitional val metrics: - ROC-AUC: 0.986753 - Log-Loss: 1.683818 - Hamming-Loss: 0.001596 - Subset-Accuracy: 0.919977 - F1-Score: 0.924518
Epoch 6/20
Adiitional val metrics: - ROC-AUC: 0.987870 - Log-Loss: 1.490647 - Hamming-Loss: 0.001545 - Subset-Accuracy: 0.912721 - F1-Score: 0.926199
predicting test data ...
preparing gold label targets ...

F1 Scores for global labels:
ALL (average

preparing gold label targets ...

F1 Scores for global labels:
ALL (average="micro"): 0.856867655557696


Iteration No: 5 ended. Evaluation done at random point.
Time taken: 819.6338
Function value obtained: -0.8569
Current minimum: -0.8604
Iteration No: 6 started. Evaluating function at random point.
********************************************************************************
Parameters (note: embed_size*10, latent_dim*64):
 {'up': 8, 'window_size': 5, 'embed_size': 5, 'latent_dim': 5, 'dropout_rate': 0.10659010649839881, 'epochs': 20, 'category': None}
********************************************************************************
upsampling for 8 times...
preparing features ...
preparing pretrained embedding matrix ...
preparing targets ...
model summary:
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_6 (InputLayer)         (None, None)              0         
____________________________


training model ...
Epoch 1/21
Adiitional val metrics: - ROC-AUC: 0.948507 - Log-Loss: 3.326665 - Hamming-Loss: 0.008001 - Subset-Accuracy: 0.713171 - F1-Score: 0.669169
Epoch 2/21
Adiitional val metrics: - ROC-AUC: 0.972960 - Log-Loss: 2.790543 - Hamming-Loss: 0.004192 - Subset-Accuracy: 0.817709 - F1-Score: 0.812076
Epoch 3/21
Adiitional val metrics: - ROC-AUC: 0.978937 - Log-Loss: 2.386070 - Hamming-Loss: 0.002500 - Subset-Accuracy: 0.867367 - F1-Score: 0.883140
Epoch 4/21
Adiitional val metrics: - ROC-AUC: 0.982819 - Log-Loss: 2.018572 - Hamming-Loss: 0.001931 - Subset-Accuracy: 0.893861 - F1-Score: 0.908684
Epoch 5/21
Adiitional val metrics: - ROC-AUC: 0.983866 - Log-Loss: 1.756954 - Hamming-Loss: 0.001800 - Subset-Accuracy: 0.897164 - F1-Score: 0.914051
Epoch 6/21
Adiitional val metrics: - ROC-AUC: 0.984746 - Log-Loss: 1.571315 - Hamming-Loss: 0.001851 - Subset-Accuracy: 0.886015 - F1-Score: 0.910700
predicting test data ...
preparing gold label targets ...

F1 Scores for global 

Adiitional val metrics: - ROC-AUC: 0.985786 - Log-Loss: 1.725317 - Hamming-Loss: 0.001777 - Subset-Accuracy: 0.896143 - F1-Score: 0.914938
predicting test data ...
preparing gold label targets ...

F1 Scores for global labels:
ALL (average="micro"): 0.8607235521613551


Iteration No: 10 ended. Evaluation done at random point.
Time taken: 903.7609
Function value obtained: -0.8607
Current minimum: -0.8641
Iteration No: 11 started. Evaluating function at random point.
********************************************************************************
Parameters (note: embed_size*10, latent_dim*64):
 {'up': 14, 'window_size': 4, 'embed_size': 4, 'latent_dim': 3, 'dropout_rate': 0.38301930260317163, 'epochs': 21, 'category': None}
********************************************************************************
upsampling for 14 times...
preparing features ...
preparing pretrained embedding matrix ...
preparing targets ...
model summary:
_________________________________________________________

Epoch 1/20
Adiitional val metrics: - ROC-AUC: 0.958605 - Log-Loss: 3.421662 - Hamming-Loss: 0.005131 - Subset-Accuracy: 0.717213 - F1-Score: 0.752189
Epoch 2/20
Adiitional val metrics: - ROC-AUC: 0.973122 - Log-Loss: 2.864074 - Hamming-Loss: 0.003263 - Subset-Accuracy: 0.819544 - F1-Score: 0.843912
Epoch 3/20
Adiitional val metrics: - ROC-AUC: 0.981247 - Log-Loss: 2.409223 - Hamming-Loss: 0.002080 - Subset-Accuracy: 0.884746 - F1-Score: 0.901047
Epoch 4/20
Adiitional val metrics: - ROC-AUC: 0.985048 - Log-Loss: 2.101984 - Hamming-Loss: 0.001805 - Subset-Accuracy: 0.899761 - F1-Score: 0.914161
Epoch 5/20
Adiitional val metrics: - ROC-AUC: 0.987051 - Log-Loss: 1.788272 - Hamming-Loss: 0.001770 - Subset-Accuracy: 0.899748 - F1-Score: 0.915654
Epoch 6/20
Adiitional val metrics: - ROC-AUC: 0.988591 - Log-Loss: 1.545659 - Hamming-Loss: 0.001751 - Subset-Accuracy: 0.904614 - F1-Score: 0.916787
predicting test data ...
preparing gold label targets ...

F1 Scores for global labels:
ALL (average

Adiitional val metrics: - ROC-AUC: 0.988095 - Log-Loss: 1.492730 - Hamming-Loss: 0.001373 - Subset-Accuracy: 0.928743 - F1-Score: 0.935190
Epoch 6/21
Adiitional val metrics: - ROC-AUC: 0.989156 - Log-Loss: 1.301494 - Hamming-Loss: 0.001379 - Subset-Accuracy: 0.930613 - F1-Score: 0.934942
predicting test data ...
preparing gold label targets ...

F1 Scores for global labels:
ALL (average="micro"): 0.872770853307766


Iteration No: 15 ended. Search finished for the next optimal point.
Time taken: 810.2242
Function value obtained: -0.8728
Current minimum: -0.8728
Iteration No: 16 started. Searching for the next optimal point.
********************************************************************************
Parameters (note: embed_size*10, latent_dim*64):
 {'up': 15, 'window_size': 5, 'embed_size': 5, 'latent_dim': 5, 'dropout_rate': 0.47762711040042366, 'epochs': 21, 'category': None}
********************************************************************************
upsampling for 15 times..

Epoch 1/20
Adiitional val metrics: - ROC-AUC: 0.974837 - Log-Loss: 3.267247 - Hamming-Loss: 0.001761 - Subset-Accuracy: 0.921936 - F1-Score: 0.916429
Epoch 2/20
Adiitional val metrics: - ROC-AUC: 0.980988 - Log-Loss: 2.481163 - Hamming-Loss: 0.001461 - Subset-Accuracy: 0.937727 - F1-Score: 0.931386
Epoch 3/20
Adiitional val metrics: - ROC-AUC: 0.983854 - Log-Loss: 2.069423 - Hamming-Loss: 0.001368 - Subset-Accuracy: 0.942327 - F1-Score: 0.935823
Epoch 4/20
Adiitional val metrics: - ROC-AUC: 0.985411 - Log-Loss: 1.804658 - Hamming-Loss: 0.001221 - Subset-Accuracy: 0.944569 - F1-Score: 0.942574
Epoch 5/20
Adiitional val metrics: - ROC-AUC: 0.986217 - Log-Loss: 1.627235 - Hamming-Loss: 0.001188 - Subset-Accuracy: 0.944971 - F1-Score: 0.944119
predicting test data ...
preparing gold label targets ...

F1 Scores for global labels:
ALL (average="micro"): 0.8566938713438436


Iteration No: 18 ended. Search finished for the next optimal point.
Time taken: 681.0954
Function value obtained: -0.8

preparing pretrained embedding matrix ...
preparing targets ...
model summary:
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_21 (InputLayer)        (None, None)              0         
_________________________________________________________________
embedding_21 (Embedding)     (None, None, 50)          2249200   
_________________________________________________________________
bidirectional_21 (Bidirectio (None, None, 384)         374784    
_________________________________________________________________
spatial_dropout1d_21 (Spatia (None, None, 384)         0         
_________________________________________________________________
dense_41 (Dense)             (None, None, 300)         115500    
_________________________________________________________________
dense_42 (Dense)             (None, None, 97)          29197     
Total params: 2,768,681
Trainable params: 2,768,681
Non-trainab

Adiitional val metrics: - ROC-AUC: 0.985648 - Log-Loss: 1.727742 - Hamming-Loss: 0.002006 - Subset-Accuracy: 0.884093 - F1-Score: 0.904003
predicting test data ...
preparing gold label targets ...

F1 Scores for global labels:
ALL (average="micro"): 0.8575842136735101


Iteration No: 23 ended. Search finished for the next optimal point.
Time taken: 1223.2852
Function value obtained: -0.8576
Current minimum: -0.8762
Iteration No: 24 started. Searching for the next optimal point.
********************************************************************************
Parameters (note: embed_size*10, latent_dim*64):
 {'up': 15, 'window_size': 3, 'embed_size': 5, 'latent_dim': 5, 'dropout_rate': 0.014653484995026837, 'epochs': 21, 'category': None}
********************************************************************************
upsampling for 15 times...
preparing features ...
preparing pretrained embedding matrix ...
preparing targets ...
model summary:
___________________________________________

Epoch 1/21
Adiitional val metrics: - ROC-AUC: 0.954218 - Log-Loss: 3.436125 - Hamming-Loss: 0.006667 - Subset-Accuracy: 0.706475 - F1-Score: 0.694388
Epoch 2/21
Adiitional val metrics: - ROC-AUC: 0.972014 - Log-Loss: 2.872298 - Hamming-Loss: 0.003669 - Subset-Accuracy: 0.819798 - F1-Score: 0.827496
Epoch 3/21
Adiitional val metrics: - ROC-AUC: 0.979893 - Log-Loss: 2.385076 - Hamming-Loss: 0.002565 - Subset-Accuracy: 0.874580 - F1-Score: 0.879574
Epoch 4/21
Adiitional val metrics: - ROC-AUC: 0.983924 - Log-Loss: 2.039147 - Hamming-Loss: 0.002224 - Subset-Accuracy: 0.872395 - F1-Score: 0.895326
Epoch 5/21
Adiitional val metrics: - ROC-AUC: 0.986229 - Log-Loss: 1.760109 - Hamming-Loss: 0.002064 - Subset-Accuracy: 0.876250 - F1-Score: 0.901824
predicting test data ...
preparing gold label targets ...

F1 Scores for global labels:
ALL (average="micro"): 0.8604784688995215


Iteration No: 26 ended. Search finished for the next optimal point.
Time taken: 1225.5209
Function value obtained: -0.

Adiitional val metrics: - ROC-AUC: 0.986810 - Log-Loss: 1.681946 - Hamming-Loss: 0.001777 - Subset-Accuracy: 0.888173 - F1-Score: 0.913872
predicting test data ...
preparing gold label targets ...

F1 Scores for global labels:
ALL (average="micro"): 0.8634392334846194


Iteration No: 28 ended. Search finished for the next optimal point.
Time taken: 503.4587
Function value obtained: -0.8634
Current minimum: -0.8762
Iteration No: 29 started. Searching for the next optimal point.
********************************************************************************
Parameters (note: embed_size*10, latent_dim*64):
 {'up': 15, 'window_size': 3, 'embed_size': 5, 'latent_dim': 5, 'dropout_rate': 0.018122400865408343, 'epochs': 20, 'category': None}
********************************************************************************
upsampling for 15 times...
preparing features ...
preparing pretrained embedding matrix ...
preparing targets ...
model summary:
____________________________________________

Epoch 1/21
Adiitional val metrics: - ROC-AUC: 0.974840 - Log-Loss: 2.939554 - Hamming-Loss: 0.001994 - Subset-Accuracy: 0.882505 - F1-Score: 0.903034
Epoch 2/21
Adiitional val metrics: - ROC-AUC: 0.981852 - Log-Loss: 2.314166 - Hamming-Loss: 0.001661 - Subset-Accuracy: 0.917577 - F1-Score: 0.921213
Epoch 3/21
Adiitional val metrics: - ROC-AUC: 0.984684 - Log-Loss: 1.950201 - Hamming-Loss: 0.001415 - Subset-Accuracy: 0.930737 - F1-Score: 0.933057
Epoch 4/21
Adiitional val metrics: - ROC-AUC: 0.986433 - Log-Loss: 1.741403 - Hamming-Loss: 0.001447 - Subset-Accuracy: 0.923246 - F1-Score: 0.931136
Epoch 5/21
Adiitional val metrics: - ROC-AUC: 0.987323 - Log-Loss: 1.602317 - Hamming-Loss: 0.001674 - Subset-Accuracy: 0.895639 - F1-Score: 0.918995
Epoch 6/21
Adiitional val metrics: - ROC-AUC: 0.987642 - Log-Loss: 1.496594 - Hamming-Loss: 0.001666 - Subset-Accuracy: 0.896188 - F1-Score: 0.919650
predicting test data ...
preparing gold label targets ...

F1 Scores for global labels:
ALL (average

Adiitional val metrics: - ROC-AUC: 0.987764 - Log-Loss: 1.565766 - Hamming-Loss: 0.001465 - Subset-Accuracy: 0.919806 - F1-Score: 0.930345
predicting test data ...
preparing gold label targets ...

F1 Scores for global labels:
ALL (average="micro"): 0.8620487804878048


Iteration No: 33 ended. Search finished for the next optimal point.
Time taken: 514.3058
Function value obtained: -0.8620
Current minimum: -0.8762
Iteration No: 34 started. Searching for the next optimal point.
********************************************************************************
Parameters (note: embed_size*10, latent_dim*64):
 {'up': 15, 'window_size': 5, 'embed_size': 5, 'latent_dim': 3, 'dropout_rate': 0.0, 'epochs': 21, 'category': None}
********************************************************************************
upsampling for 15 times...
preparing features ...
preparing pretrained embedding matrix ...
preparing targets ...
model summary:
_____________________________________________________________

Epoch 1/21
Adiitional val metrics: - ROC-AUC: 0.961255 - Log-Loss: 3.346919 - Hamming-Loss: 0.005229 - Subset-Accuracy: 0.740038 - F1-Score: 0.755456
Epoch 2/21
Adiitional val metrics: - ROC-AUC: 0.978879 - Log-Loss: 2.704393 - Hamming-Loss: 0.002553 - Subset-Accuracy: 0.877674 - F1-Score: 0.882321
Epoch 3/21
Adiitional val metrics: - ROC-AUC: 0.982059 - Log-Loss: 2.282866 - Hamming-Loss: 0.001897 - Subset-Accuracy: 0.899716 - F1-Score: 0.910719
Epoch 4/21
Adiitional val metrics: - ROC-AUC: 0.984744 - Log-Loss: 1.951064 - Hamming-Loss: 0.001663 - Subset-Accuracy: 0.911950 - F1-Score: 0.921570
Epoch 5/21
Adiitional val metrics: - ROC-AUC: 0.986105 - Log-Loss: 1.706265 - Hamming-Loss: 0.001593 - Subset-Accuracy: 0.914661 - F1-Score: 0.924646
predicting test data ...
preparing gold label targets ...

F1 Scores for global labels:
ALL (average="micro"): 0.8618890325051464


Iteration No: 36 ended. Search finished for the next optimal point.
Time taken: 1235.7347
Function value obtained: -0.



preparing pretrained embedding matrix ...
preparing targets ...
model summary:
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_37 (InputLayer)        (None, None)              0         
_________________________________________________________________
embedding_37 (Embedding)     (None, None, 50)          2249200   
_________________________________________________________________
bidirectional_37 (Bidirectio (None, None, 640)         952320    
_________________________________________________________________
spatial_dropout1d_37 (Spatia (None, None, 640)         0         
_________________________________________________________________
dense_73 (Dense)             (None, None, 300)         192300    
_________________________________________________________________
dense_74 (Dense)             (None, None, 97)          29197     
Total params: 3,423,017
Trainable params: 3,423,017
Non-trainab

Adiitional val metrics: - ROC-AUC: 0.981064 - Log-Loss: 2.507731 - Hamming-Loss: 0.001522 - Subset-Accuracy: 0.927247 - F1-Score: 0.928027
Epoch 3/21
Adiitional val metrics: - ROC-AUC: 0.984755 - Log-Loss: 2.077492 - Hamming-Loss: 0.001367 - Subset-Accuracy: 0.934437 - F1-Score: 0.935564
Epoch 4/21
Adiitional val metrics: - ROC-AUC: 0.986747 - Log-Loss: 1.742924 - Hamming-Loss: 0.001321 - Subset-Accuracy: 0.936599 - F1-Score: 0.937701
Epoch 5/21
Adiitional val metrics: - ROC-AUC: 0.988451 - Log-Loss: 1.496919 - Hamming-Loss: 0.001281 - Subset-Accuracy: 0.938247 - F1-Score: 0.939875
Epoch 6/21
Adiitional val metrics: - ROC-AUC: 0.989041 - Log-Loss: 1.280814 - Hamming-Loss: 0.001233 - Subset-Accuracy: 0.939350 - F1-Score: 0.941905
predicting test data ...
preparing gold label targets ...

F1 Scores for global labels:
ALL (average="micro"): 0.876617441916398


Iteration No: 39 ended. Search finished for the next optimal point.
Time taken: 843.4599
Function value obtained: -0.8766
Current 

preparing pretrained embedding matrix ...
preparing targets ...
model summary:
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_42 (InputLayer)        (None, None)              0         
_________________________________________________________________
embedding_42 (Embedding)     (None, None, 50)          2249200   
_________________________________________________________________
bidirectional_42 (Bidirectio (None, None, 640)         952320    
_________________________________________________________________
spatial_dropout1d_42 (Spatia (None, None, 640)         0         
_________________________________________________________________
dense_83 (Dense)             (None, None, 300)         192300    
_________________________________________________________________
dense_84 (Dense)             (None, None, 97)          29197     
Total params: 3,423,017
Trainable params: 3,423,017
Non-trainab

Epoch 1/20
Adiitional val metrics: - ROC-AUC: 0.977529 - Log-Loss: 3.002732 - Hamming-Loss: 0.001504 - Subset-Accuracy: 0.920678 - F1-Score: 0.927719
Epoch 2/20
Adiitional val metrics: - ROC-AUC: 0.983812 - Log-Loss: 2.285873 - Hamming-Loss: 0.001313 - Subset-Accuracy: 0.936272 - F1-Score: 0.937706
Epoch 3/20
Adiitional val metrics: - ROC-AUC: 0.986807 - Log-Loss: 1.932423 - Hamming-Loss: 0.001264 - Subset-Accuracy: 0.940210 - F1-Score: 0.940320
Epoch 4/20
Adiitional val metrics: - ROC-AUC: 0.988148 - Log-Loss: 1.713594 - Hamming-Loss: 0.001274 - Subset-Accuracy: 0.937911 - F1-Score: 0.939877
Epoch 5/20
Adiitional val metrics: - ROC-AUC: 0.989084 - Log-Loss: 1.518739 - Hamming-Loss: 0.001298 - Subset-Accuracy: 0.937664 - F1-Score: 0.938860
Epoch 6/20
Adiitional val metrics: - ROC-AUC: 0.989824 - Log-Loss: 1.369678 - Hamming-Loss: 0.001373 - Subset-Accuracy: 0.931774 - F1-Score: 0.935194
predicting test data ...
preparing gold label targets ...

F1 Scores for global labels:
ALL (average

Adiitional val metrics: - ROC-AUC: 0.987572 - Log-Loss: 1.559589 - Hamming-Loss: 0.001422 - Subset-Accuracy: 0.929443 - F1-Score: 0.932965
predicting test data ...
preparing gold label targets ...

F1 Scores for global labels:
ALL (average="micro"): 0.8600597609561753


Iteration No: 46 ended. Search finished for the next optimal point.
Time taken: 607.8691
Function value obtained: -0.8601
Current minimum: -0.8799
Iteration No: 47 started. Searching for the next optimal point.
********************************************************************************
Parameters (note: embed_size*10, latent_dim*64):
 {'up': 5, 'window_size': 3, 'embed_size': 5, 'latent_dim': 4, 'dropout_rate': 0.4657671206128833, 'epochs': 20, 'category': None}
********************************************************************************
upsampling for 5 times...
preparing features ...
preparing pretrained embedding matrix ...
preparing targets ...
model summary:
________________________________________________



preparing pretrained embedding matrix ...
preparing targets ...
model summary:
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_49 (InputLayer)        (None, None)              0         
_________________________________________________________________
embedding_49 (Embedding)     (None, None, 50)          2249200   
_________________________________________________________________
bidirectional_49 (Bidirectio (None, None, 640)         952320    
_________________________________________________________________
spatial_dropout1d_49 (Spatia (None, None, 640)         0         
_________________________________________________________________
dense_97 (Dense)             (None, None, 300)         192300    
_________________________________________________________________
dense_98 (Dense)             (None, None, 97)          29197     
Total params: 3,423,017
Trainable params: 3,423,017
Non-trainab

Adiitional val metrics: - ROC-AUC: 0.971392 - Log-Loss: 2.710454 - Hamming-Loss: 0.003474 - Subset-Accuracy: 0.855555 - F1-Score: 0.841530
Epoch 3/20
Adiitional val metrics: - ROC-AUC: 0.978284 - Log-Loss: 2.279292 - Hamming-Loss: 0.002754 - Subset-Accuracy: 0.874190 - F1-Score: 0.872931
Epoch 4/20
Adiitional val metrics: - ROC-AUC: 0.982306 - Log-Loss: 1.931163 - Hamming-Loss: 0.002104 - Subset-Accuracy: 0.888839 - F1-Score: 0.900609
Epoch 5/20
Adiitional val metrics: - ROC-AUC: 0.984484 - Log-Loss: 1.630466 - Hamming-Loss: 0.001783 - Subset-Accuracy: 0.905321 - F1-Score: 0.915553
predicting test data ...
preparing gold label targets ...

F1 Scores for global labels:
ALL (average="micro"): 0.8530077778871714


Iteration No: 51 ended. Search finished for the next optimal point.
Time taken: 1257.5906
Function value obtained: -0.8530
Current minimum: -0.8799
Iteration No: 52 started. Searching for the next optimal point.
*******************************************************************

preparing pretrained embedding matrix ...
preparing targets ...
model summary:
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_54 (InputLayer)        (None, None)              0         
_________________________________________________________________
embedding_54 (Embedding)     (None, None, 50)          2249200   
_________________________________________________________________
bidirectional_54 (Bidirectio (None, None, 384)         374784    
_________________________________________________________________
spatial_dropout1d_54 (Spatia (None, None, 384)         0         
_________________________________________________________________
dense_107 (Dense)            (None, None, 300)         115500    
_________________________________________________________________
dense_108 (Dense)            (None, None, 97)          29197     
Total params: 2,768,681
Trainable params: 2,768,681
Non-trainab

Epoch 1/20
Adiitional val metrics: - ROC-AUC: 0.954370 - Log-Loss: 3.623340 - Hamming-Loss: 0.005998 - Subset-Accuracy: 0.707699 - F1-Score: 0.716245
Epoch 2/20
Adiitional val metrics: - ROC-AUC: 0.971203 - Log-Loss: 2.901950 - Hamming-Loss: 0.003845 - Subset-Accuracy: 0.817706 - F1-Score: 0.820155
Epoch 3/20
Adiitional val metrics: - ROC-AUC: 0.978388 - Log-Loss: 2.453560 - Hamming-Loss: 0.002576 - Subset-Accuracy: 0.852921 - F1-Score: 0.876111
Epoch 4/20
Adiitional val metrics: - ROC-AUC: 0.983453 - Log-Loss: 2.118095 - Hamming-Loss: 0.002149 - Subset-Accuracy: 0.872782 - F1-Score: 0.896723
Epoch 5/20
Adiitional val metrics: - ROC-AUC: 0.986313 - Log-Loss: 1.815599 - Hamming-Loss: 0.001836 - Subset-Accuracy: 0.892764 - F1-Score: 0.911757
Epoch 6/20
Adiitional val metrics: - ROC-AUC: 0.988140 - Log-Loss: 1.553886 - Hamming-Loss: 0.001766 - Subset-Accuracy: 0.898990 - F1-Score: 0.915670
Epoch 7/20
Adiitional val metrics: - ROC-AUC: 0.989370 - Log-Loss: 1.424715 - Hamming-Loss: 0.001785

Adiitional val metrics: - ROC-AUC: 0.986810 - Log-Loss: 1.867489 - Hamming-Loss: 0.001516 - Subset-Accuracy: 0.917898 - F1-Score: 0.927975
Epoch 5/20
Adiitional val metrics: - ROC-AUC: 0.987547 - Log-Loss: 1.610566 - Hamming-Loss: 0.001496 - Subset-Accuracy: 0.919724 - F1-Score: 0.928936
predicting test data ...
preparing gold label targets ...

F1 Scores for global labels:
ALL (average="micro"): 0.8646961456609127


Iteration No: 58 ended. Search finished for the next optimal point.
Time taken: 947.9565
Function value obtained: -0.8647
Current minimum: -0.8799
Iteration No: 59 started. Searching for the next optimal point.
********************************************************************************
Parameters (note: embed_size*10, latent_dim*64):
 {'up': 5, 'window_size': 3, 'embed_size': 5, 'latent_dim': 5, 'dropout_rate': 0.0, 'epochs': 20, 'category': None}
********************************************************************************
upsampling for 5 times...
preparing featu



preparing pretrained embedding matrix ...
preparing targets ...
model summary:
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_59 (InputLayer)        (None, None)              0         
_________________________________________________________________
embedding_59 (Embedding)     (None, None, 50)          2249200   
_________________________________________________________________
bidirectional_59 (Bidirectio (None, None, 640)         952320    
_________________________________________________________________
spatial_dropout1d_59 (Spatia (None, None, 640)         0         
_________________________________________________________________
dense_117 (Dense)            (None, None, 300)         192300    
_________________________________________________________________
dense_118 (Dense)            (None, None, 97)          29197     
Total params: 3,423,017
Trainable params: 3,423,017
Non-trainab

Epoch 1/21
Adiitional val metrics: - ROC-AUC: 0.973139 - Log-Loss: 3.086089 - Hamming-Loss: 0.001858 - Subset-Accuracy: 0.887616 - F1-Score: 0.909202
Epoch 2/21
Adiitional val metrics: - ROC-AUC: 0.982752 - Log-Loss: 2.336039 - Hamming-Loss: 0.001303 - Subset-Accuracy: 0.939347 - F1-Score: 0.938497
Epoch 3/21
Adiitional val metrics: - ROC-AUC: 0.986726 - Log-Loss: 1.983829 - Hamming-Loss: 0.001303 - Subset-Accuracy: 0.941176 - F1-Score: 0.938753
Epoch 4/21
Adiitional val metrics: - ROC-AUC: 0.988187 - Log-Loss: 1.659175 - Hamming-Loss: 0.001306 - Subset-Accuracy: 0.937905 - F1-Score: 0.938411
Epoch 5/21
Adiitional val metrics: - ROC-AUC: 0.988933 - Log-Loss: 1.538962 - Hamming-Loss: 0.001392 - Subset-Accuracy: 0.927763 - F1-Score: 0.934034
Epoch 6/21
Adiitional val metrics: - ROC-AUC: 0.990027 - Log-Loss: 1.333924 - Hamming-Loss: 0.001319 - Subset-Accuracy: 0.935635 - F1-Score: 0.937864
predicting test data ...
preparing gold label targets ...

F1 Scores for global labels:
ALL (average

Adiitional val metrics: - ROC-AUC: 0.989019 - Log-Loss: 1.598276 - Hamming-Loss: 0.001317 - Subset-Accuracy: 0.932915 - F1-Score: 0.937574
predicting test data ...
preparing gold label targets ...

F1 Scores for global labels:
ALL (average="micro"): 0.8517698025894747


Iteration No: 63 ended. Search finished for the next optimal point.
Time taken: 558.2252
Function value obtained: -0.8518
Current minimum: -0.8799
Iteration No: 64 started. Searching for the next optimal point.
********************************************************************************
Parameters (note: embed_size*10, latent_dim*64):
 {'up': 5, 'window_size': 3, 'embed_size': 5, 'latent_dim': 5, 'dropout_rate': 0.0, 'epochs': 20, 'category': None}
********************************************************************************
upsampling for 5 times...
preparing features ...




preparing pretrained embedding matrix ...
preparing targets ...
model summary:
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_64 (InputLayer)        (None, None)              0         
_________________________________________________________________
embedding_64 (Embedding)     (None, None, 50)          2249200   
_________________________________________________________________
bidirectional_64 (Bidirectio (None, None, 640)         952320    
_________________________________________________________________
spatial_dropout1d_64 (Spatia (None, None, 640)         0         
_________________________________________________________________
dense_127 (Dense)            (None, None, 300)         192300    
_________________________________________________________________
dense_128 (Dense)            (None, None, 97)          29197     
Total params: 3,423,017
Trainable params: 3,423,017
Non-trainab

Adiitional val metrics: - ROC-AUC: 0.972321 - Log-Loss: 3.134548 - Hamming-Loss: 0.002170 - Subset-Accuracy: 0.867377 - F1-Score: 0.893507
Epoch 2/20
Adiitional val metrics: - ROC-AUC: 0.982663 - Log-Loss: 2.345861 - Hamming-Loss: 0.001400 - Subset-Accuracy: 0.936164 - F1-Score: 0.933967
Epoch 3/20
Adiitional val metrics: - ROC-AUC: 0.986461 - Log-Loss: 1.894087 - Hamming-Loss: 0.001203 - Subset-Accuracy: 0.943383 - F1-Score: 0.943375
Epoch 4/20
Adiitional val metrics: - ROC-AUC: 0.987903 - Log-Loss: 1.648128 - Hamming-Loss: 0.001249 - Subset-Accuracy: 0.939921 - F1-Score: 0.941288
Epoch 5/20
Adiitional val metrics: - ROC-AUC: 0.988736 - Log-Loss: 1.358313 - Hamming-Loss: 0.001202 - Subset-Accuracy: 0.942638 - F1-Score: 0.943458
Epoch 6/20
Adiitional val metrics: - ROC-AUC: 0.989749 - Log-Loss: 1.245969 - Hamming-Loss: 0.001282 - Subset-Accuracy: 0.938057 - F1-Score: 0.939891
predicting test data ...
preparing gold label targets ...

F1 Scores for global labels:
ALL (average="micro"): 

preparing gold label targets ...

F1 Scores for global labels:
ALL (average="micro"): 0.8590741100953123


Iteration No: 68 ended. Search finished for the next optimal point.
Time taken: 583.2892
Function value obtained: -0.8591
Current minimum: -0.8799
Iteration No: 69 started. Searching for the next optimal point.
********************************************************************************
Parameters (note: embed_size*10, latent_dim*64):
 {'up': 15, 'window_size': 3, 'embed_size': 3, 'latent_dim': 5, 'dropout_rate': 0.0118057655213229, 'epochs': 20, 'category': None}
********************************************************************************
upsampling for 15 times...
preparing features ...
preparing pretrained embedding matrix ...
preparing targets ...
model summary:
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_69 (InputLayer)        (None, None)              0         
____________



preparing pretrained embedding matrix ...
preparing targets ...
model summary:
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_70 (InputLayer)        (None, None)              0         
_________________________________________________________________
embedding_70 (Embedding)     (None, None, 50)          2249200   
_________________________________________________________________
bidirectional_70 (Bidirectio (None, None, 640)         952320    
_________________________________________________________________
spatial_dropout1d_70 (Spatia (None, None, 640)         0         
_________________________________________________________________
dense_139 (Dense)            (None, None, 300)         192300    
_________________________________________________________________
dense_140 (Dense)            (None, None, 97)          29197     
Total params: 3,423,017
Trainable params: 3,423,017
Non-trainab



preparing pretrained embedding matrix ...
preparing targets ...
model summary:
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_72 (InputLayer)        (None, None)              0         
_________________________________________________________________
embedding_72 (Embedding)     (None, None, 50)          2249200   
_________________________________________________________________
bidirectional_72 (Bidirectio (None, None, 640)         952320    
_________________________________________________________________
spatial_dropout1d_72 (Spatia (None, None, 640)         0         
_________________________________________________________________
dense_143 (Dense)            (None, None, 300)         192300    
_________________________________________________________________
dense_144 (Dense)            (None, None, 97)          29197     
Total params: 3,423,017
Trainable params: 3,423,017
Non-trainab



preparing pretrained embedding matrix ...
preparing targets ...
model summary:
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_73 (InputLayer)        (None, None)              0         
_________________________________________________________________
embedding_73 (Embedding)     (None, None, 50)          2249200   
_________________________________________________________________
bidirectional_73 (Bidirectio (None, None, 640)         952320    
_________________________________________________________________
spatial_dropout1d_73 (Spatia (None, None, 640)         0         
_________________________________________________________________
dense_145 (Dense)            (None, None, 300)         192300    
_________________________________________________________________
dense_146 (Dense)            (None, None, 97)          29197     
Total params: 3,423,017
Trainable params: 3,423,017
Non-trainab

Epoch 1/21
Adiitional val metrics: - ROC-AUC: 0.962134 - Log-Loss: 3.455731 - Hamming-Loss: 0.004119 - Subset-Accuracy: 0.717983 - F1-Score: 0.787522
Epoch 2/21
Adiitional val metrics: - ROC-AUC: 0.978471 - Log-Loss: 2.813006 - Hamming-Loss: 0.002109 - Subset-Accuracy: 0.888852 - F1-Score: 0.899550
Epoch 3/21
Adiitional val metrics: - ROC-AUC: 0.983005 - Log-Loss: 2.395660 - Hamming-Loss: 0.001656 - Subset-Accuracy: 0.913329 - F1-Score: 0.921397
Epoch 4/21
Adiitional val metrics: - ROC-AUC: 0.985920 - Log-Loss: 2.037358 - Hamming-Loss: 0.001538 - Subset-Accuracy: 0.912809 - F1-Score: 0.927367
Epoch 5/21
Adiitional val metrics: - ROC-AUC: 0.987125 - Log-Loss: 1.820534 - Hamming-Loss: 0.001547 - Subset-Accuracy: 0.911582 - F1-Score: 0.927051
predicting test data ...
preparing gold label targets ...

F1 Scores for global labels:
ALL (average="micro"): 0.8624963403923099


Iteration No: 75 ended. Search finished for the next optimal point.
Time taken: 1030.5669
Function value obtained: -0.



preparing pretrained embedding matrix ...
preparing targets ...
model summary:
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_78 (InputLayer)        (None, None)              0         
_________________________________________________________________
embedding_78 (Embedding)     (None, None, 50)          2249200   
_________________________________________________________________
bidirectional_78 (Bidirectio (None, None, 640)         952320    
_________________________________________________________________
spatial_dropout1d_78 (Spatia (None, None, 640)         0         
_________________________________________________________________
dense_155 (Dense)            (None, None, 300)         192300    
_________________________________________________________________
dense_156 (Dense)            (None, None, 97)          29197     
Total params: 3,423,017
Trainable params: 3,423,017
Non-trainab



preparing pretrained embedding matrix ...
preparing targets ...
model summary:
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_79 (InputLayer)        (None, None)              0         
_________________________________________________________________
embedding_79 (Embedding)     (None, None, 50)          2249200   
_________________________________________________________________
bidirectional_79 (Bidirectio (None, None, 640)         952320    
_________________________________________________________________
spatial_dropout1d_79 (Spatia (None, None, 640)         0         
_________________________________________________________________
dense_157 (Dense)            (None, None, 300)         192300    
_________________________________________________________________
dense_158 (Dense)            (None, None, 97)          29197     
Total params: 3,423,017
Trainable params: 3,423,017
Non-trainab

Epoch 1/20
Adiitional val metrics: - ROC-AUC: 0.969029 - Log-Loss: 3.185371 - Hamming-Loss: 0.005280 - Subset-Accuracy: 0.803158 - F1-Score: 0.768826
Epoch 2/20
Adiitional val metrics: - ROC-AUC: 0.978438 - Log-Loss: 2.640267 - Hamming-Loss: 0.002738 - Subset-Accuracy: 0.874589 - F1-Score: 0.874241
Epoch 3/20
Adiitional val metrics: - ROC-AUC: 0.982658 - Log-Loss: 2.265519 - Hamming-Loss: 0.001909 - Subset-Accuracy: 0.904770 - F1-Score: 0.910189
Epoch 4/20
Adiitional val metrics: - ROC-AUC: 0.985367 - Log-Loss: 1.967778 - Hamming-Loss: 0.001772 - Subset-Accuracy: 0.906624 - F1-Score: 0.915966
Epoch 5/20
Adiitional val metrics: - ROC-AUC: 0.986570 - Log-Loss: 1.721964 - Hamming-Loss: 0.001629 - Subset-Accuracy: 0.913298 - F1-Score: 0.922784
predicting test data ...
preparing gold label targets ...

F1 Scores for global labels:
ALL (average="micro"): 0.8585164835164835


Iteration No: 81 ended. Search finished for the next optimal point.
Time taken: 1046.7669
Function value obtained: -0.



preparing pretrained embedding matrix ...
preparing targets ...
model summary:
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_83 (InputLayer)        (None, None)              0         
_________________________________________________________________
embedding_83 (Embedding)     (None, None, 50)          2249200   
_________________________________________________________________
bidirectional_83 (Bidirectio (None, None, 384)         374784    
_________________________________________________________________
spatial_dropout1d_83 (Spatia (None, None, 384)         0         
_________________________________________________________________
dense_165 (Dense)            (None, None, 300)         115500    
_________________________________________________________________
dense_166 (Dense)            (None, None, 97)          29197     
Total params: 2,768,681
Trainable params: 2,768,681
Non-trainab



preparing pretrained embedding matrix ...
preparing targets ...
model summary:
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_85 (InputLayer)        (None, None)              0         
_________________________________________________________________
embedding_85 (Embedding)     (None, None, 50)          2249200   
_________________________________________________________________
bidirectional_85 (Bidirectio (None, None, 640)         952320    
_________________________________________________________________
spatial_dropout1d_85 (Spatia (None, None, 640)         0         
_________________________________________________________________
dense_169 (Dense)            (None, None, 300)         192300    
_________________________________________________________________
dense_170 (Dense)            (None, None, 97)          29197     
Total params: 3,423,017
Trainable params: 3,423,017
Non-trainab



preparing pretrained embedding matrix ...
preparing targets ...
model summary:
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_86 (InputLayer)        (None, None)              0         
_________________________________________________________________
embedding_86 (Embedding)     (None, None, 50)          2249200   
_________________________________________________________________
bidirectional_86 (Bidirectio (None, None, 640)         952320    
_________________________________________________________________
spatial_dropout1d_86 (Spatia (None, None, 640)         0         
_________________________________________________________________
dense_171 (Dense)            (None, None, 300)         192300    
_________________________________________________________________
dense_172 (Dense)            (None, None, 97)          29197     
Total params: 3,423,017
Trainable params: 3,423,017
Non-trainab



preparing pretrained embedding matrix ...
preparing targets ...
model summary:
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_87 (InputLayer)        (None, None)              0         
_________________________________________________________________
embedding_87 (Embedding)     (None, None, 50)          2249200   
_________________________________________________________________
bidirectional_87 (Bidirectio (None, None, 640)         952320    
_________________________________________________________________
spatial_dropout1d_87 (Spatia (None, None, 640)         0         
_________________________________________________________________
dense_173 (Dense)            (None, None, 300)         192300    
_________________________________________________________________
dense_174 (Dense)            (None, None, 97)          29197     
Total params: 3,423,017
Trainable params: 3,423,017
Non-trainab



preparing pretrained embedding matrix ...
preparing targets ...
model summary:
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_88 (InputLayer)        (None, None)              0         
_________________________________________________________________
embedding_88 (Embedding)     (None, None, 50)          2249200   
_________________________________________________________________
bidirectional_88 (Bidirectio (None, None, 640)         952320    
_________________________________________________________________
spatial_dropout1d_88 (Spatia (None, None, 640)         0         
_________________________________________________________________
dense_175 (Dense)            (None, None, 300)         192300    
_________________________________________________________________
dense_176 (Dense)            (None, None, 97)          29197     
Total params: 3,423,017
Trainable params: 3,423,017
Non-trainab



preparing pretrained embedding matrix ...
preparing targets ...
model summary:
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_89 (InputLayer)        (None, None)              0         
_________________________________________________________________
embedding_89 (Embedding)     (None, None, 50)          2249200   
_________________________________________________________________
bidirectional_89 (Bidirectio (None, None, 640)         952320    
_________________________________________________________________
spatial_dropout1d_89 (Spatia (None, None, 640)         0         
_________________________________________________________________
dense_177 (Dense)            (None, None, 300)         192300    
_________________________________________________________________
dense_178 (Dense)            (None, None, 97)          29197     
Total params: 3,423,017
Trainable params: 3,423,017
Non-trainab



preparing pretrained embedding matrix ...
preparing targets ...
model summary:
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_91 (InputLayer)        (None, None)              0         
_________________________________________________________________
embedding_91 (Embedding)     (None, None, 50)          2249200   
_________________________________________________________________
bidirectional_91 (Bidirectio (None, None, 640)         952320    
_________________________________________________________________
spatial_dropout1d_91 (Spatia (None, None, 640)         0         
_________________________________________________________________
dense_181 (Dense)            (None, None, 300)         192300    
_________________________________________________________________
dense_182 (Dense)            (None, None, 97)          29197     
Total params: 3,423,017
Trainable params: 3,423,017
Non-trainab



preparing pretrained embedding matrix ...
preparing targets ...
model summary:
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_93 (InputLayer)        (None, None)              0         
_________________________________________________________________
embedding_93 (Embedding)     (None, None, 50)          2249200   
_________________________________________________________________
bidirectional_93 (Bidirectio (None, None, 640)         952320    
_________________________________________________________________
spatial_dropout1d_93 (Spatia (None, None, 640)         0         
_________________________________________________________________
dense_185 (Dense)            (None, None, 300)         192300    
_________________________________________________________________
dense_186 (Dense)            (None, None, 97)          29197     
Total params: 3,423,017
Trainable params: 3,423,017
Non-trainab



preparing pretrained embedding matrix ...
preparing targets ...
model summary:
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_95 (InputLayer)        (None, None)              0         
_________________________________________________________________
embedding_95 (Embedding)     (None, None, 50)          2249200   
_________________________________________________________________
bidirectional_95 (Bidirectio (None, None, 640)         952320    
_________________________________________________________________
spatial_dropout1d_95 (Spatia (None, None, 640)         0         
_________________________________________________________________
dense_189 (Dense)            (None, None, 300)         192300    
_________________________________________________________________
dense_190 (Dense)            (None, None, 97)          29197     
Total params: 3,423,017
Trainable params: 3,423,017
Non-trainab

Epoch 1/20
Adiitional val metrics: - ROC-AUC: 0.975795 - Log-Loss: 3.159631 - Hamming-Loss: 0.001592 - Subset-Accuracy: 0.913019 - F1-Score: 0.923345
Epoch 2/20
Adiitional val metrics: - ROC-AUC: 0.981485 - Log-Loss: 2.423840 - Hamming-Loss: 0.001534 - Subset-Accuracy: 0.921841 - F1-Score: 0.927247
Epoch 3/20
Adiitional val metrics: - ROC-AUC: 0.984700 - Log-Loss: 1.990146 - Hamming-Loss: 0.001377 - Subset-Accuracy: 0.933945 - F1-Score: 0.935026
Epoch 4/20
Adiitional val metrics: - ROC-AUC: 0.986549 - Log-Loss: 1.719195 - Hamming-Loss: 0.001247 - Subset-Accuracy: 0.940951 - F1-Score: 0.941126
Epoch 5/20
Adiitional val metrics: - ROC-AUC: 0.987477 - Log-Loss: 1.513113 - Hamming-Loss: 0.001276 - Subset-Accuracy: 0.939201 - F1-Score: 0.939765
predicting test data ...
preparing gold label targets ...

F1 Scores for global labels:
ALL (average="micro"): 0.852524222335543


Iteration No: 97 ended. Search finished for the next optimal point.
Time taken: 678.9616
Function value obtained: -0.85



preparing pretrained embedding matrix ...
preparing targets ...
model summary:
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_99 (InputLayer)        (None, None)              0         
_________________________________________________________________
embedding_99 (Embedding)     (None, None, 50)          2249200   
_________________________________________________________________
bidirectional_99 (Bidirectio (None, None, 640)         952320    
_________________________________________________________________
spatial_dropout1d_99 (Spatia (None, None, 640)         0         
_________________________________________________________________
dense_197 (Dense)            (None, None, 300)         192300    
_________________________________________________________________
dense_198 (Dense)            (None, None, 97)          29197     
Total params: 3,423,017
Trainable params: 3,423,017
Non-trainab