In [4]:
import fastText
import math
import linecache
import numpy as np 
from numpy import random
from random import sample
from keras.models import Sequential, Model
from keras.callbacks import ModelCheckpoint
from keras.layers import *
from keras import *
from keras.utils import to_categorical
from keras.preprocessing.sequence import pad_sequences
from keras.initializers import RandomUniform
import re
from sklearn.metrics import f1_score, recall_score, precision_score, accuracy_score

# from attention_utils import get_activations, get_data_recurrent


  from ._conv import register_converters as _register_converters
Using TensorFlow backend.


In [5]:
%env CUDA_DEVICE_ORDER=PCI_BUS_ID
%env CUDA_VISIBLE_DEVICES=2

env: CUDA_DEVICE_ORDER=PCI_BUS_ID
env: CUDA_VISIBLE_DEVICES=2


In [6]:
ft = fastText.load_model("/home/jindal/notebooks/fastText/wiki.de.bin")

nb_embedding_dims = ft.get_dimension()
nb_sequence_length = 75

In [7]:
def twitter_tokenizer(textline):
    textLine = re.sub(r'http\S+', 'URL', textline)
    textline = re.sub('@[\w_]+', 'USER_MENTION', textline)
    textline = re.sub('\|LBR\|', '', textline)
    textline = re.sub('\.\.\.+', '...', textline)
    textline = re.sub('!!+', '!!', textline)
    textline = re.sub('\?\?+', '??', textline)
    words = re.compile('[\U00010000-\U0010ffff]|[\w-]+|[^ \w\U00010000-\U0010ffff]+', re.UNICODE).findall(textline.strip())
    words = [w.strip() for w in words if w.strip() != '']
    # print(words)
    return(words)

In [8]:
word_vectors_ft = {}
def process_features(textline, nb_sequence_length, nb_embedding_dims, tokenize=True):
    if not tokenize:
        words = textline.split()
    else:
        words = twitter_tokenizer(textline)
    features_ft = np.zeros((nb_sequence_length, nb_embedding_dims))
    features_idx = np.zeros(nb_sequence_length)
    max_words = min(len(words), nb_sequence_length)
    idx = nb_sequence_length - len(words[:max_words])
    for w in words[:max_words]:
        if w in word_vectors_ft:
            wv = word_vectors_ft[w]
        else:
            wv = ft.get_word_vector(w.lower())
            word_vectors_ft[w] = wv
        features_ft[idx] = wv
        
        idx = idx + 1
    return features_ft

In [9]:
def sequential_generator(filename, 
                         batch_size, 
                         labels2Idx:'dict to make output labels',
                         check:'to check if all lines in file are of same length.To check enter the len of line after splitting it by tabs' = None,
                         tokenize:'specify if using twitter tokenzor to preprocess lines'=False, 
                        ):    
    
    f = open(filename)
    n_labels = len(labels2Idx)
    while True:
        batch_features_ft = np.zeros((batch_size, nb_sequence_length, nb_embedding_dims))
#         print(type(labels2Idx))
        batch_labels = np.zeros((batch_size, len(labels2Idx)))
        for i in range(batch_size):
            line = f.readline()
            if ("" == line):
                f.seek(0)
                line = f.readline()
            data = line.strip().split('\t')
            if check:
                if len(data)!=check:
                    i-=1
                    continue
            batch_features_ft[i] = process_features(data[0], nb_sequence_length, nb_embedding_dims, tokenize= tokenize)
            if len(labels2Idx)==2:
                batch_labels[i] = to_categorical(0 if data[1] == 'OTHER' else 1, n_labels)
            else:
                batch_labels[i] = to_categorical(labels2Idx[data[1]], n_labels)
        yield ([batch_features_ft], batch_labels)

In [10]:
def train_dev_sentences(filetrain,filedev, check:'to check if lines of file are all same lenght after separating by tab'):
    labels2Idx = {}
    train_lines = [line.strip().split("\t") for line in open(filetrain) if len(line.strip().split('\t'))==check]
    dev_lines = [line.strip().split("\t") for line in open(filedev) if len(line.strip().split('\t'))==check]

    train_sentences = [x[0] for x in train_lines]
    for dataset in [train_lines, dev_lines]:
        for line in dataset:
            label = line[1]
            if label not in labels2Idx.keys():
                labels2Idx[label]= len(labels2Idx)
                
#     train_labels = [0 if x[1] == "OTHER" else 1 for x in train_lines]
    train_labels = [labels2Idx[x[1]] for x in train_lines]
    dev_sentences = [x[0] for x in dev_lines]
#     dev_labels = [0 if x[1] == "OTHER" else 1 for x in dev_lines]
    dev_labels = [labels2Idx[x[1]] for x in dev_lines]
    return (train_sentences, train_labels, dev_sentences, dev_labels, labels2Idx)


In [11]:
file_train = '/home/jindal/notebooks/jindal/NER/language_model/million_post_corpus_train.csv'
file_dev = '/home/jindal/notebooks/jindal/NER/language_model/million_post_corpus_dev.csv'
train_sentences, train_labels, dev_sentences, dev_labels, labels2Id = train_dev_sentences(filetrain=file_train,filedev=file_dev, check=2)

In [13]:
dev_labels[:10]

[1, 0, 0, 1, 0, 0, 0, 0, 0, 1]

In [105]:
dev_sentences[0]

'Dann diskutiere es doch mit dir selbst.'

In [14]:
n_labels =2

In [15]:
def compile_model(no_labels:'total labels for classification'):
    model_input_embedding = Input(shape = (nb_sequence_length, nb_embedding_dims))
    lstm_block = Bidirectional(LSTM(100, dropout = 0.5, return_sequences=True))(model_input_embedding)
    lstm_block = LeakyReLU()(lstm_block)

    filter_sizes = (3, 4, 5)
    conv_blocks = []
    for sz in filter_sizes:
        conv = Conv1D(
            filters = 200,
            kernel_size = sz,
            padding = 'valid',
            strides = 1
        )(lstm_block)
        conv = LeakyReLU()(conv)
        conv = GlobalMaxPooling1D()(conv)
        conv = Dropout(0.5)(conv)
        conv_blocks.append(conv)
    model_concatenated = concatenate([conv_blocks[0], conv_blocks[1], conv_blocks[2]])
    # model_concatenated = Dropout(0.8)(model_concatenated)
    model_concatenated = Dense(100)(model_concatenated)
    model_concatenated = LeakyReLU()(model_concatenated)
    model_output = Dense(no_labels, activation = "softmax")(model_concatenated)
    new_model = Model(model_input_embedding, model_output)
    new_model.compile(loss='categorical_crossentropy', optimizer='nadam', metrics = ['accuracy'])
#     new_model.summary()
    return new_model

In [18]:
def test_model(generator, 
               train_sentences, 
               devLabels, 
               number_of_tests,
               number_of_epochs,
               filename_to_log, 
               labels_earlier:'number of original labels if loading a pretrained model',
               filename_to_save_weigths,
               batch_size, 
               train_file:'filepath for traininig',
               f1_measure:'binary/macro etc', 
               pos_label:'only if binary f1',
               labels2Idx,
               load_model_weights=False,
               model_weights_file:'give filepath as str'=None, 
               tokenize=True,
               nb_sequence_length = nb_sequence_length,
               nb_embedding_dims= nb_embedding_dims, 
               check_for_generator=None,
                ):
    
#     f = open(filename_to_log,"w")
    
    max_f1=0
    max_p=0
    max_r=0
    max_a=0
    total_f1=0
    total_prec=0
    total_acc=0
    total_recall=0
    
    for test_number in range(number_of_tests):
        print("Test %d/%d" %(test_number+1, number_of_tests))
        model = compile_model(labels_earlier)

        # transfer learning
        if load_model_weights and model_weights_file:
                model.load_weights(model_weights_file)

        samples_per_epoch = len(train_sentences)
        epochs = number_of_epochs
        batch_size = batch_size
        steps_per_epoch = math.ceil(samples_per_epoch / batch_size)
        checkpoint = ModelCheckpoint(filename_to_save_weigths, monitor='val_acc',save_best_only = True, 
                                     save_weights_only = True)

        for epoch in range(epochs):
            print("Epoch: %d" %(epoch+1))
            model.fit_generator(
                generator(filename = train_file, batch_size = batch_size, check = check_for_generator, 
                          labels2Idx= labels2Idx,tokenize= tokenize), 
                steps_per_epoch= steps_per_epoch, epochs=1,
                validation_data = generator(filename ='/home/jindal/notebooks/jindal/NER/language_model/million_post_corpus_dev.csv', 
                                            batch_size = batch_size, check = check_for_generator, 
                                           labels2Idx = labels2Idx, tokenize = tokenize),
                validation_steps = math.ceil(len(dev_labels) / batch_size),
                callbacks = [checkpoint]
            )

#             testset_features = np.zeros((len(dev_sentences), nb_sequence_length, nb_embedding_dims))
#             for i in range(len(dev_sentences)):
#                 testset_features[i] = process_features(dev_sentences[i], nb_sequence_length, nb_embedding_dims)
#             results = model.predict(testset_features)


# #             idx2Label = {0 : "OTHER", 1 : "OFFENSIVE"}
#             predLabels = results.argmax(axis=-1)
#             devLabels = devLabels
#             f1 = f1_score(devLabels, predLabels, average=f1_measure, pos_label=pos_label) # offensive is the major class. So other is minor
#             r = recall_score(devLabels, predLabels, average=f1_measure, pos_label=pos_label)
#             p = precision_score(devLabels, predLabels, average=f1_measure, pos_label=pos_label)
#             a = accuracy_score(devLabels, predLabels)
#             if max_f1 < f1:
#                 print("model saved. F1 is %f" %(f1))
#                 model.save(filename_to_save_weigths)
#                 max_f1 = f1
#                 max_p = p
#                 max_r = r
#                 max_a = a
#             text = "prec: "+ str(p)+" rec: "+str(r) +" f1: "+str(f1) +" acc: "+str(a)+" \n"
#             print("Test-Data: Prec: %.3f, Rec: %.3f, F1: %.3f, Acc: %.3f" % (p, r, f1, a))
#         to_write= "prec: "+ str(max_p)+" rec: "+str(max_r) +" f1: "+str(max_f1) +" acc: "+str(max_a)+" \n"
#         print(to_write)
#         f.write(to_write)
#         total_f1+=max_f1
#         total_prec+=max_p
#         total_acc+=max_a
#         total_recall+=max_r    
#         print("*****************************************************************************")
#     final_text = "avg_prec: " +str(total_prec/number_of_tests)+" total_rec: "+str(total_recall/number_of_tests) +" total_f1: "+str(total_f1/number_of_tests) +" total_acc: "+str(total_acc/number_of_tests)+" \n"
#     print(final_text)
#     f.write(final_text)
#     f.close()




In [19]:
print(dev_sentences[1])

Nationalistisches Geseiere.


In [111]:
generator = sequential_generator
train_sentences = train_sentences
devLabels = dev_labels
number_of_tests = 1
number_of_epochs = 10
millionpostcorpus_pretraining_log = '/home/jindal/notebooks/jindal/NER/language_model/results_pretraining_millionpostcorpus.txt' 
millionpostcorpus_pretraining_save_weigths='/home/jindal/notebooks/jindal/NER/language_model/model_pretrained_millionpostcorpus.h5'
batch_size=32
millionpostcorpus_train_file='/home/jindal/notebooks/jindal/NER/language_model/million_post_corpus_train.csv'
tokenize = True
labels2Idx = labels2Id
f1_measure='binary'
pos_label=1
load_model_weights=False
# model_weights_file:'give filepath as str'=None, 
nb_sequence_length = nb_sequence_length
nb_embedding_dims= nb_embedding_dims
check_for_generator=2



In [112]:
test_model(generator=generator, 
           train_sentences=train_sentences, 
           devLabels=devLabels, 
           number_of_tests= number_of_tests,
           number_of_epochs=number_of_epochs, 
           filename_to_log=millionpostcorpus_pretraining_log, 
           labels_earlier = len(labels2Idx),
           filename_to_save_weigths=millionpostcorpus_pretraining_save_weigths,
           batch_size=batch_size,
           train_file=millionpostcorpus_train_file, 
           f1_measure=f1_measure, 
           pos_label=pos_label, 
           load_model_weights=load_model_weights,
           tokenize = tokenize,
           nb_sequence_length=nb_sequence_length, 
           nb_embedding_dims=nb_embedding_dims, 
           check_for_generator= check_for_generator)

Test 1/3
Epoch: 1
Epoch 1/1


  'precision', 'predicted', average, warn_for)
  'precision', 'predicted', average, warn_for)


Test-Data: Prec: 0.000, Rec: 0.000, F1: 0.000, Acc: 0.831
Epoch: 2
Epoch 1/1
Test-Data: Prec: 0.000, Rec: 0.000, F1: 0.000, Acc: 0.829
Epoch: 3
Epoch 1/1
model saved. F1 is 0.019802
Test-Data: Prec: 0.333, Rec: 0.010, F1: 0.020, Acc: 0.829
Epoch: 4
Epoch 1/1
Test-Data: Prec: 0.100, Rec: 0.010, F1: 0.019, Acc: 0.817
Epoch: 5
Epoch 1/1
model saved. F1 is 0.117647
Test-Data: Prec: 0.333, Rec: 0.071, F1: 0.118, Acc: 0.819
Epoch: 6
Epoch 1/1
Test-Data: Prec: 0.174, Rec: 0.082, F1: 0.111, Acc: 0.779
Epoch: 7
Epoch 1/1
model saved. F1 is 0.317073
Test-Data: Prec: 0.264, Rec: 0.398, F1: 0.317, Acc: 0.710
Epoch: 8
Epoch 1/1
Test-Data: Prec: 0.281, Rec: 0.276, F1: 0.278, Acc: 0.758
Epoch: 9
Epoch 1/1
Test-Data: Prec: 0.292, Rec: 0.214, F1: 0.247, Acc: 0.779
Epoch: 10
Epoch 1/1
Test-Data: Prec: 0.258, Rec: 0.235, F1: 0.246, Acc: 0.756
Epoch: 11
Epoch 1/1
Test-Data: Prec: 0.290, Rec: 0.276, F1: 0.283, Acc: 0.763
Epoch: 12
Epoch 1/1
Test-Data: Prec: 0.280, Rec: 0.235, F1: 0.256, Acc: 0.769
Epoch: 1

Epoch: 1
Epoch 1/1
Test-Data: Prec: 0.000, Rec: 0.000, F1: 0.000, Acc: 0.831
Epoch: 2
Epoch 1/1
Test-Data: Prec: 0.000, Rec: 0.000, F1: 0.000, Acc: 0.827
Epoch: 3
Epoch 1/1
Test-Data: Prec: 0.182, Rec: 0.020, F1: 0.037, Acc: 0.819
Epoch: 4
Epoch 1/1
Test-Data: Prec: 0.143, Rec: 0.020, F1: 0.036, Acc: 0.813
Epoch: 5
Epoch 1/1
Test-Data: Prec: 0.261, Rec: 0.061, F1: 0.099, Acc: 0.812
Epoch: 6
Epoch 1/1
Test-Data: Prec: 0.233, Rec: 0.071, F1: 0.109, Acc: 0.803
Epoch: 7
Epoch 1/1
Test-Data: Prec: 0.246, Rec: 0.306, F1: 0.273, Acc: 0.724
Epoch: 8
Epoch 1/1
Test-Data: Prec: 0.292, Rec: 0.143, F1: 0.192, Acc: 0.796
Epoch: 9
Epoch 1/1
Test-Data: Prec: 0.270, Rec: 0.245, F1: 0.257, Acc: 0.760
Epoch: 10
Epoch 1/1
Test-Data: Prec: 0.265, Rec: 0.133, F1: 0.177, Acc: 0.791
Epoch: 11
Epoch 1/1
Test-Data: Prec: 0.333, Rec: 0.133, F1: 0.190, Acc: 0.808
Epoch: 12
Epoch 1/1
Test-Data: Prec: 0.282, Rec: 0.112, F1: 0.161, Acc: 0.801
Epoch: 13
Epoch 1/1
Test-Data: Prec: 0.244, Rec: 0.102, F1: 0.144, Acc: 0

Epoch: 1
Epoch 1/1
Test-Data: Prec: 0.000, Rec: 0.000, F1: 0.000, Acc: 0.831
Epoch: 2
Epoch 1/1
Test-Data: Prec: 0.000, Rec: 0.000, F1: 0.000, Acc: 0.831
Epoch: 3
Epoch 1/1
Test-Data: Prec: 0.500, Rec: 0.010, F1: 0.020, Acc: 0.831
Epoch: 4
Epoch 1/1
Test-Data: Prec: 0.333, Rec: 0.020, F1: 0.038, Acc: 0.827
Epoch: 5
Epoch 1/1
Test-Data: Prec: 0.156, Rec: 0.051, F1: 0.077, Acc: 0.793
Epoch: 6
Epoch 1/1
Test-Data: Prec: 0.253, Rec: 0.224, F1: 0.238, Acc: 0.756
Epoch: 7
Epoch 1/1
Test-Data: Prec: 0.211, Rec: 0.163, F1: 0.184, Acc: 0.755
Epoch: 8
Epoch 1/1
Test-Data: Prec: 0.225, Rec: 0.235, F1: 0.230, Acc: 0.734
Epoch: 9
Epoch 1/1
Test-Data: Prec: 0.261, Rec: 0.184, F1: 0.216, Acc: 0.774
Epoch: 10
Epoch 1/1
Test-Data: Prec: 0.250, Rec: 0.173, F1: 0.205, Acc: 0.772
Epoch: 11
Epoch 1/1
Test-Data: Prec: 0.227, Rec: 0.153, F1: 0.183, Acc: 0.769
Epoch: 12
Epoch 1/1
Test-Data: Prec: 0.237, Rec: 0.143, F1: 0.178, Acc: 0.777
Epoch: 13
Epoch 1/1
Test-Data: Prec: 0.250, Rec: 0.102, F1: 0.145, Acc: 0

TypeError: bad operand type for unary +: 'str'

# Transfer learning now

In [113]:
n_labels =2

In [114]:
train_sentences, train_labels, dev_sentences, dev_labels = train_dev_sentences(filetrain='/home/gwiedemann/notebooks/OffLang/sample_train.txt',
                   filedev='/home/gwiedemann/notebooks/OffLang/sample_dev.txt', check=3)

In [115]:
print(len(train_sentences))
print(dev_labels[:20])

4200
[1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 0, 0, 1]


In [116]:
dev_sentences[0]

'@FilmElf_yt Diese ganzen leute die du angesprochen hast sind untermenschen ja aber das alte Deutschland und deutsche volk waren ehrenwerte leute und ein stolzes Land'

In [117]:
generator = sequential_generator
train_sentences = train_sentences
devLabels = dev_labels
number_of_tests = 5
number_of_epochs = 50
millionpostcorpus_tl_log = '/home/jindal/notebooks/jindal/NER/language_model/results_tl_millionpostcorpus.txt' 
millionpostcorpus_tl_save_weigths='/home/jindal/notebooks/jindal/NER/language_model/classification_model_tl_millionpostcorpus.h5'
batch_size=32
offlang_train_file='/home/gwiedemann/notebooks/OffLang/sample_train.txt'
f1_measure='binary'
pos_label=1
load_model_weights=True
model_weights_file = '/home/jindal/notebooks/jindal/NER/language_model/model_pretrained_millionpostcorpus.h5'
nb_sequence_length = nb_sequence_length
nb_embedding_dims= nb_embedding_dims
check_for_generator=3

In [118]:
test_model(generator=generator, train_sentences=train_sentences, devLabels=devLabels, number_of_tests= number_of_tests,
          number_of_epochs=number_of_epochs, filename_to_log=millionpostcorpus_tl_log, filename_to_save_weigths=millionpostcorpus_tl_save_weigths,
          batch_size=batch_size,train_file=offlang_train_file, f1_measure=f1_measure, pos_label=pos_label, load_model_weights=load_model_weights,
          model_weights_file = model_weights_file, nb_sequence_length=nb_sequence_length, nb_embedding_dims=nb_embedding_dims, check_for_generator= check_for_generator)

Test 1/5
Epoch: 1
Epoch 1/1
model saved. F1 is 0.539683
Test-Data: Prec: 0.684, Rec: 0.446, F1: 0.540, Acc: 0.749
Epoch: 2
Epoch 1/1
model saved. F1 is 0.640816
Test-Data: Prec: 0.704, Rec: 0.588, F1: 0.641, Acc: 0.782
Epoch: 3
Epoch 1/1
Test-Data: Prec: 0.713, Rec: 0.539, F1: 0.614, Acc: 0.776
Epoch: 4
Epoch 1/1
model saved. F1 is 0.662698
Test-Data: Prec: 0.705, Rec: 0.625, F1: 0.663, Acc: 0.790
Epoch: 5
Epoch 1/1
model saved. F1 is 0.684825
Test-Data: Prec: 0.713, Rec: 0.659, F1: 0.685, Acc: 0.800
Epoch: 6
Epoch 1/1
Test-Data: Prec: 0.684, Rec: 0.625, F1: 0.654, Acc: 0.781
Epoch: 7
Epoch 1/1
Test-Data: Prec: 0.700, Rec: 0.610, F1: 0.652, Acc: 0.785
Epoch: 8
Epoch 1/1
Test-Data: Prec: 0.709, Rec: 0.648, F1: 0.677, Acc: 0.796
Epoch: 9
Epoch 1/1
Test-Data: Prec: 0.701, Rec: 0.659, F1: 0.680, Acc: 0.795
Epoch: 10
Epoch 1/1
Test-Data: Prec: 0.687, Rec: 0.640, F1: 0.663, Acc: 0.785
Epoch: 11
Epoch 1/1
Test-Data: Prec: 0.672, Rec: 0.682, F1: 0.677, Acc: 0.785
Epoch: 12
Epoch 1/1
model save

Test-Data: Prec: 0.681, Rec: 0.712, F1: 0.696, Acc: 0.795
Epoch: 49
Epoch 1/1
Test-Data: Prec: 0.711, Rec: 0.655, F1: 0.682, Acc: 0.798
Epoch: 50
Epoch 1/1
Test-Data: Prec: 0.705, Rec: 0.697, F1: 0.701, Acc: 0.803
*****************************************************************************
Test 3/5
Epoch: 1
Epoch 1/1
Test-Data: Prec: 0.728, Rec: 0.442, F1: 0.550, Acc: 0.761
Epoch: 2
Epoch 1/1
Test-Data: Prec: 0.729, Rec: 0.573, F1: 0.642, Acc: 0.788
Epoch: 3
Epoch 1/1
Test-Data: Prec: 0.715, Rec: 0.592, F1: 0.648, Acc: 0.787
Epoch: 4
Epoch 1/1
Test-Data: Prec: 0.720, Rec: 0.693, F1: 0.706, Acc: 0.809
Epoch: 5
Epoch 1/1
Test-Data: Prec: 0.697, Rec: 0.682, F1: 0.689, Acc: 0.797
Epoch: 6
Epoch 1/1
Test-Data: Prec: 0.676, Rec: 0.727, F1: 0.700, Acc: 0.795
Epoch: 7
Epoch 1/1
Test-Data: Prec: 0.701, Rec: 0.640, F1: 0.669, Acc: 0.791
Epoch: 8
Epoch 1/1
Test-Data: Prec: 0.678, Rec: 0.685, F1: 0.682, Acc: 0.788
Epoch: 9
Epoch 1/1
Test-Data: Prec: 0.669, Rec: 0.682, F1: 0.675, Acc: 0.783
Epoch:

Test-Data: Prec: 0.721, Rec: 0.659, F1: 0.689, Acc: 0.803
Epoch: 47
Epoch 1/1
Test-Data: Prec: 0.688, Rec: 0.727, F1: 0.707, Acc: 0.801
Epoch: 48
Epoch 1/1
Test-Data: Prec: 0.745, Rec: 0.644, F1: 0.691, Acc: 0.809
Epoch: 49
Epoch 1/1
Test-Data: Prec: 0.730, Rec: 0.689, F1: 0.709, Acc: 0.813
Epoch: 50
Epoch 1/1
Test-Data: Prec: 0.700, Rec: 0.708, F1: 0.704, Acc: 0.803
*****************************************************************************
Test 5/5
Epoch: 1
Epoch 1/1
Test-Data: Prec: 0.718, Rec: 0.457, F1: 0.558, Acc: 0.761
Epoch: 2
Epoch 1/1
Test-Data: Prec: 0.710, Rec: 0.588, F1: 0.643, Acc: 0.785
Epoch: 3
Epoch 1/1
Test-Data: Prec: 0.736, Rec: 0.584, F1: 0.651, Acc: 0.793
Epoch: 4
Epoch 1/1
Test-Data: Prec: 0.704, Rec: 0.667, F1: 0.685, Acc: 0.797
Epoch: 5
Epoch 1/1
Test-Data: Prec: 0.734, Rec: 0.588, F1: 0.653, Acc: 0.793
Epoch: 6
Epoch 1/1
Test-Data: Prec: 0.720, Rec: 0.693, F1: 0.706, Acc: 0.809
Epoch: 7
Epoch 1/1
Test-Data: Prec: 0.707, Rec: 0.678, F1: 0.692, Acc: 0.801
Epoc

TypeError: bad operand type for unary +: 'str'

# gradual_unfreezing

In [20]:
train_sentences, train_labels, dev_sentences, dev_labels, labels2Idx = train_dev_sentences(filetrain='/home/gwiedemann/notebooks/OffLang/sample_train.txt',
                   filedev='/home/gwiedemann/notebooks/OffLang/sample_dev.txt', check=3)

In [21]:
print(dev_sentences[0])
print(len(dev_sentences))
print(len(dev_labels))

@FilmElf_yt Diese ganzen leute die du angesprochen hast sind untermenschen ja aber das alte Deutschland und deutsche volk waren ehrenwerte leute und ein stolzes Land
808
808


In [35]:
def test_model_tl_unfreezing(generator, 
               train_sentences, 
               devLabels, 
               number_of_tests,
               number_of_epochs,
               filename_to_log, 
               labels2Idx,
               filename_to_save_weigths,
               batch_size, 
               unfreezing_strategy: 'list containing a tuple of indices to unfreeze at each step',
               train_file:'filepath for traininig',
               f1_measure:'binary/macro etc', 
               pos_label:'only if binary f1',
               load_model_weights=False,
               model_weights_file:'give filepath as str'=None, 
               tokenize=True,
               nb_sequence_length = nb_sequence_length,
               nb_embedding_dims= nb_embedding_dims, 
               check_for_generator=None):
    
    f = open(filename_to_log, 'w', encoding='utf-8')
    f.close()
    
   
    total_f1=0
    total_prec=0
    total_acc=0
    total_recall=0
    
    for test_number in range(number_of_tests):
        print("Test %d/%d" %(test_number+1, number_of_tests))
        model = compile_model(2)

        # transfer learning
        if load_model_weights and model_weights_file:
                model.load_weights(model_weights_file)
                print("removing top layer")
                model.layers.pop()
                output = Dense(2, activation = 'softmax')(model.layers[-1].output)
                final_model = Model(inputs=model.input, outputs=[output])

        samples_per_epoch = len(train_sentences)
        epochs = number_of_epochs
        batch_size = batch_size
        steps_per_epoch = math.ceil(samples_per_epoch / batch_size)
#         checkpoint = ModelCheckpoint(filename_to_save_weigths, monitor='val_acc',save_best_only = True, 
#                                      save_weights_only = True)


        max_f1=0
        max_p=0
        max_r=0
        max_a=0
        
        # load pretrained weights
        # model.compile
        # save tmp weights
        # iterate over layers
        #    load tmp weights
        #    iterate over epochs
        #        unfreeze top frozen layer
        #        save best model as tmp weights
        
        
        final_model.save(filename_to_save_weigths)
        
        # layers_to_unfreeze = [18, 16, 3, 1]
        
        for ulayer in unfreezing_strategy:
            print("unfreezing " + final_model.layers[ulayer[0]].name)
            print("---------------------------------------")
            final_model.load_weights(filename_to_save_weigths)            
            for i, layer in enumerate(final_model.layers):
                
                # TF strategy: gradual unfreezing
                #if i >= ulayer:
                #    layer.trainable = True
                #else:
                #    layer.trainable = False
                # 
                ## TF strategy: single
                
                if i >= ulayer[1] and i <= ulayer[0]:
                    layer.trainable = True
                else:
                    layer.trainable = False
                    
                print(str(i) + ' ' + layer.name + ' ' + str(layer.trainable))
            final_model.compile(loss='categorical_crossentropy', optimizer='nadam', metrics=['accuracy'])
        
            for epoch in range(epochs):
                print("Epoch: %d/%d" %(epoch+1, epochs))
                final_model.fit_generator(
                    generator(filename = train_file, batch_size = batch_size, check = check_for_generator, 
                              labels2Idx= labels2Idx,tokenize= tokenize), 
                    steps_per_epoch= steps_per_epoch, epochs=1
                )

                testset_features = np.zeros((len(dev_sentences), nb_sequence_length, nb_embedding_dims))
                for i in range(len(dev_sentences)):
                    testset_features[i] = process_features(dev_sentences[i], nb_sequence_length, nb_embedding_dims)
                results = final_model.predict(testset_features)

                predLabels = results.argmax(axis=-1)
                devLabels = devLabels
                f1 = f1_score(devLabels, predLabels, average=f1_measure, pos_label=pos_label) # offensive is the major class. So other is minor
                r = recall_score(devLabels, predLabels, average=f1_measure, pos_label=pos_label)
                p = precision_score(devLabels, predLabels, average=f1_measure, pos_label=pos_label)
                a = accuracy_score(devLabels, predLabels)
                if max_f1 < f1:
                    print("model saved. F1 is %f" %(f1))
                    final_model.save(filename_to_save_weigths)
                    max_f1 = f1
                    max_p = p
                    max_r = r
                    max_a = a
                text = "prec: "+ str(p)+" rec: "+str(r) +" f1: "+str(f1) +" acc: "+str(a)+" \n"
                print("Test-Data: Prec: %.3f, Rec: %.3f, F1: %.3f, Acc: %.3f" % (p, r, f1, a))
        to_write= "prec: "+ str(max_p)+" rec: "+str(max_r) +" f1: "+str(max_f1) +" acc: "+str(max_a)+" \n"
        print(to_write)
        with open(filename_to_log,'a') as f:
            f.write(to_write)
        total_f1+=max_f1
        total_prec+=max_p
        total_acc+=max_a
        total_recall+=max_r    
        print("*****************************************************************************")
    final_text = "avg_prec: " +str(total_prec/number_of_tests)+" total_rec: "+str(total_recall/number_of_tests) +" total_f1: "+str(total_f1/number_of_tests) +" total_acc: "+str(total_acc/number_of_tests)+" \n"
    print(final_text)
    with open(filename_to_log,'a') as f:
        f.write(final_text)
#     f.close()

In [41]:
# list of tuples. Every tuple contains range of layers which need to be unfrozen. Rest all are frozen
single_unfreeze_bottom_up = [(18, 18), (17, 16), (15, 3), (2, 1), (18,1)] 
single_unfreeze_top_down = [(18, 18),   (2, 1),(15, 3), (17, 16), (18,1)]
all_unfreeze = [(18,1)]
gradual_unfreezing = [(18,18), (18,16), (18,3), (18,1)]

# strings =['suf_bu', 'suf_td','all_unfreeze','gradual_unfreeze']
strings=['gradual_unfreeze']
# unfreeze_strategy = [single_unfreeze_bottom_up, single_unfreeze_top_down, all_unfreeze, gradual_unfreezing]
unfreeze_strategy = [gradual_unfreezing]

In [None]:
for i in range(len(strings)):
    string = strings[i]
    print("approach: %s" %(string))


    generator = sequential_generator
    train_sentences = train_sentences
    devLabels = dev_labels
    number_of_tests = 5
    number_of_epochs = 50
    labels2Id = labels2Idx
    millionpostcorpus_tl_log = '/home/jindal/notebooks/jindal/NER/language_model/results_tl_millionpostcorpus_' +string+'.txt' 
    print("log file: %s" %(millionpostcorpus_tl_log))

    millionpostcorpus_tl_save_weigths='/home/jindal/notebooks/jindal/NER/language_model/classification_model_tl_millionpostcorpus_'+string+'.h5'
    print("save weights file: %s" %(millionpostcorpus_tl_save_weigths))
    batch_size=32
    millionpostcorpus_tl_train_file='/home/gwiedemann/notebooks/OffLang/sample_train.txt'
    f1_measure='binary'
    pos_label=1
    strategy = unfreeze_strategy[i]
    print(strategy)
    load_model_weights=True
    model_weights_file = '/home/jindal/notebooks/jindal/NER/language_model/model_pretrained_millionpostcorpus.h5'
    nb_sequence_length = nb_sequence_length
    nb_embedding_dims= nb_embedding_dims
    check_for_generator=3

    test_model_tl_unfreezing(generator=generator, 
               train_sentences=train_sentences, 
               devLabels=devLabels, 
               number_of_tests= number_of_tests,
               number_of_epochs=number_of_epochs, 
               filename_to_log=millionpostcorpus_tl_log, 
               labels2Idx = labels2Id,
               filename_to_save_weigths=millionpostcorpus_tl_save_weigths,
               batch_size=batch_size,
               unfreezing_strategy = strategy,       
               train_file=millionpostcorpus_tl_train_file, 
               f1_measure=f1_measure, 
               pos_label=pos_label, 
               load_model_weights=load_model_weights,
               model_weights_file = model_weights_file, 
               nb_sequence_length=nb_sequence_length, 
               nb_embedding_dims=nb_embedding_dims, 
               check_for_generator= check_for_generator)

approach: gradual_unfreeze
log file: /home/jindal/notebooks/jindal/NER/language_model/results_tl_millionpostcorpus_gradual_unfreeze.txt
save weights file: /home/jindal/notebooks/jindal/NER/language_model/classification_model_tl_millionpostcorpus_gradual_unfreeze.h5
[(18, 18), (18, 16), (18, 3), (18, 1)]
Test 1/5
removing top layer
unfreezing dense_84
---------------------------------------
0 input_28 False
1 bidirectional_28 False
2 leaky_re_lu_136 False
3 conv1d_82 False
4 conv1d_83 False
5 conv1d_84 False
6 leaky_re_lu_137 False
7 leaky_re_lu_138 False
8 leaky_re_lu_139 False
9 global_max_pooling1d_82 False
10 global_max_pooling1d_83 False
11 global_max_pooling1d_84 False
12 dropout_82 False
13 dropout_83 False
14 dropout_84 False
15 concatenate_28 False
16 dense_82 False
17 leaky_re_lu_140 False
18 dense_84 True
Epoch: 1/50
Epoch 1/1
model saved. F1 is 0.261838
Test-Data: Prec: 0.511, Rec: 0.176, F1: 0.262, Acc: 0.672
Epoch: 2/50
Epoch 1/1
Test-Data: Prec: 0.412, Rec: 0.052, F1: 0.0

Test-Data: Prec: 0.583, Rec: 0.105, F1: 0.178, Acc: 0.679
Epoch: 46/50
Epoch 1/1
Test-Data: Prec: 0.585, Rec: 0.206, F1: 0.305, Acc: 0.689
Epoch: 47/50
Epoch 1/1
Test-Data: Prec: 0.582, Rec: 0.120, F1: 0.199, Acc: 0.681
Epoch: 48/50
Epoch 1/1
Test-Data: Prec: 0.554, Rec: 0.116, F1: 0.192, Acc: 0.677
Epoch: 49/50
Epoch 1/1
Test-Data: Prec: 0.575, Rec: 0.157, F1: 0.247, Acc: 0.683
Epoch: 50/50
Epoch 1/1
Test-Data: Prec: 0.578, Rec: 0.097, F1: 0.167, Acc: 0.678
unfreezing dense_84
---------------------------------------
0 input_28 False
1 bidirectional_28 False
2 leaky_re_lu_136 False
3 conv1d_82 False
4 conv1d_83 False
5 conv1d_84 False
6 leaky_re_lu_137 False
7 leaky_re_lu_138 False
8 leaky_re_lu_139 False
9 global_max_pooling1d_82 False
10 global_max_pooling1d_83 False
11 global_max_pooling1d_84 False
12 dropout_82 False
13 dropout_83 False
14 dropout_84 False
15 concatenate_28 False
16 dense_82 True
17 leaky_re_lu_140 True
18 dense_84 True
Epoch: 1/50
Epoch 1/1
Test-Data: Prec: 0.683,

Test-Data: Prec: 0.681, Rec: 0.303, F1: 0.420, Acc: 0.723
Epoch: 41/50
Epoch 1/1
Test-Data: Prec: 0.713, Rec: 0.251, F1: 0.371, Acc: 0.719
Epoch: 42/50
Epoch 1/1
Test-Data: Prec: 0.661, Rec: 0.315, F1: 0.426, Acc: 0.720
Epoch: 43/50
Epoch 1/1
Test-Data: Prec: 0.678, Rec: 0.300, F1: 0.416, Acc: 0.722
Epoch: 44/50
Epoch 1/1
Test-Data: Prec: 0.670, Rec: 0.273, F1: 0.388, Acc: 0.715
Epoch: 45/50
Epoch 1/1
Test-Data: Prec: 0.705, Rec: 0.251, F1: 0.370, Acc: 0.718
Epoch: 46/50
Epoch 1/1
model saved. F1 is 0.442786
Test-Data: Prec: 0.659, Rec: 0.333, F1: 0.443, Acc: 0.723
Epoch: 47/50
Epoch 1/1
Test-Data: Prec: 0.688, Rec: 0.247, F1: 0.364, Acc: 0.714
Epoch: 48/50
Epoch 1/1
Test-Data: Prec: 0.669, Rec: 0.311, F1: 0.425, Acc: 0.722
Epoch: 49/50
Epoch 1/1
Test-Data: Prec: 0.647, Rec: 0.322, F1: 0.430, Acc: 0.718
Epoch: 50/50
Epoch 1/1
Test-Data: Prec: 0.673, Rec: 0.270, F1: 0.385, Acc: 0.715
unfreezing dense_84
---------------------------------------
0 input_28 False
1 bidirectional_28 False
2 

model saved. F1 is 0.630952
Test-Data: Prec: 0.671, Rec: 0.596, F1: 0.631, Acc: 0.770
Epoch: 36/50
Epoch 1/1
Test-Data: Prec: 0.697, Rec: 0.517, F1: 0.594, Acc: 0.766
Epoch: 37/50
Epoch 1/1
Test-Data: Prec: 0.705, Rec: 0.457, F1: 0.555, Acc: 0.757
Epoch: 38/50
Epoch 1/1
Test-Data: Prec: 0.697, Rec: 0.491, F1: 0.576, Acc: 0.761
Epoch: 39/50
Epoch 1/1
Test-Data: Prec: 0.679, Rec: 0.532, F1: 0.597, Acc: 0.762
Epoch: 40/50
Epoch 1/1
Test-Data: Prec: 0.718, Rec: 0.468, F1: 0.567, Acc: 0.764
Epoch: 41/50
Epoch 1/1
Test-Data: Prec: 0.704, Rec: 0.569, F1: 0.629, Acc: 0.778
Epoch: 42/50
Epoch 1/1
Test-Data: Prec: 0.683, Rec: 0.566, F1: 0.619, Acc: 0.770
Epoch: 43/50
Epoch 1/1
Test-Data: Prec: 0.694, Rec: 0.509, F1: 0.587, Acc: 0.764
Epoch: 44/50
Epoch 1/1
Test-Data: Prec: 0.721, Rec: 0.494, F1: 0.587, Acc: 0.770
Epoch: 45/50
Epoch 1/1
Test-Data: Prec: 0.688, Rec: 0.577, F1: 0.627, Acc: 0.774
Epoch: 46/50
Epoch 1/1
Test-Data: Prec: 0.701, Rec: 0.509, F1: 0.590, Acc: 0.766
Epoch: 47/50
Epoch 1/1


Test-Data: Prec: 0.726, Rec: 0.607, F1: 0.661, Acc: 0.795
Epoch: 31/50
Epoch 1/1
model saved. F1 is 0.698011
Test-Data: Prec: 0.675, Rec: 0.723, F1: 0.698, Acc: 0.793
Epoch: 32/50
Epoch 1/1
Test-Data: Prec: 0.685, Rec: 0.637, F1: 0.660, Acc: 0.783
Epoch: 33/50
Epoch 1/1
Test-Data: Prec: 0.700, Rec: 0.674, F1: 0.687, Acc: 0.797
Epoch: 34/50
Epoch 1/1
Test-Data: Prec: 0.746, Rec: 0.517, F1: 0.611, Acc: 0.782
Epoch: 35/50
Epoch 1/1
Test-Data: Prec: 0.732, Rec: 0.584, F1: 0.650, Acc: 0.792
Epoch: 40/50
Epoch 1/1
Test-Data: Prec: 0.734, Rec: 0.569, F1: 0.641, Acc: 0.790
Epoch: 41/50
Epoch 1/1
Test-Data: Prec: 0.727, Rec: 0.569, F1: 0.639, Acc: 0.787
Epoch: 42/50
Epoch 1/1
Test-Data: Prec: 0.697, Rec: 0.629, F1: 0.661, Acc: 0.787
Epoch: 43/50
Epoch 1/1
Test-Data: Prec: 0.715, Rec: 0.573, F1: 0.636, Acc: 0.783
Epoch: 44/50
Epoch 1/1
Test-Data: Prec: 0.751, Rec: 0.509, F1: 0.607, Acc: 0.782
Epoch: 45/50
Epoch 1/1
Test-Data: Prec: 0.715, Rec: 0.554, F1: 0.624, Acc: 0.780
Epoch: 46/50
Epoch 1/1


Test-Data: Prec: 0.554, Rec: 0.191, F1: 0.284, Acc: 0.682
Epoch: 28/50
Epoch 1/1
Test-Data: Prec: 0.562, Rec: 0.154, F1: 0.241, Acc: 0.681
Epoch: 29/50
Epoch 1/1
Test-Data: Prec: 0.536, Rec: 0.112, F1: 0.186, Acc: 0.675
Epoch: 30/50
Epoch 1/1
Test-Data: Prec: 0.591, Rec: 0.195, F1: 0.293, Acc: 0.689
Epoch: 31/50
Epoch 1/1
Test-Data: Prec: 0.567, Rec: 0.127, F1: 0.208, Acc: 0.679
Epoch: 32/50
Epoch 1/1
Test-Data: Prec: 0.525, Rec: 0.116, F1: 0.190, Acc: 0.673
Epoch: 33/50
Epoch 1/1
Test-Data: Prec: 0.569, Rec: 0.124, F1: 0.203, Acc: 0.679
Epoch: 34/50
Epoch 1/1
Test-Data: Prec: 0.587, Rec: 0.139, F1: 0.224, Acc: 0.683
Epoch: 35/50
Epoch 1/1
model saved. F1 is 0.313514
Test-Data: Prec: 0.563, Rec: 0.217, F1: 0.314, Acc: 0.686
Epoch: 36/50
Epoch 1/1
Test-Data: Prec: 0.600, Rec: 0.101, F1: 0.173, Acc: 0.681
Epoch: 37/50
Epoch 1/1
Test-Data: Prec: 0.545, Rec: 0.135, F1: 0.216, Acc: 0.677
Epoch: 38/50
Epoch 1/1
Test-Data: Prec: 0.548, Rec: 0.150, F1: 0.235, Acc: 0.678
Epoch: 39/50
Epoch 1/1


Test-Data: Prec: 0.681, Rec: 0.240, F1: 0.355, Acc: 0.712
Epoch: 23/50
Epoch 1/1
Test-Data: Prec: 0.667, Rec: 0.202, F1: 0.310, Acc: 0.703
Epoch: 24/50
Epoch 1/1
Test-Data: Prec: 0.667, Rec: 0.232, F1: 0.344, Acc: 0.708
Epoch: 25/50
Epoch 1/1
Test-Data: Prec: 0.654, Rec: 0.199, F1: 0.305, Acc: 0.700
Epoch: 26/50
Epoch 1/1
Test-Data: Prec: 0.663, Rec: 0.236, F1: 0.348, Acc: 0.708
Epoch: 27/50
Epoch 1/1
Test-Data: Prec: 0.651, Rec: 0.266, F1: 0.378, Acc: 0.710
Epoch: 28/50
Epoch 1/1
Test-Data: Prec: 0.671, Rec: 0.199, F1: 0.306, Acc: 0.703
Epoch: 29/50
Epoch 1/1
Test-Data: Prec: 0.682, Rec: 0.273, F1: 0.390, Acc: 0.718
Epoch: 30/50
Epoch 1/1
Test-Data: Prec: 0.657, Rec: 0.243, F1: 0.355, Acc: 0.708
Epoch: 31/50
Epoch 1/1
Test-Data: Prec: 0.684, Rec: 0.251, F1: 0.367, Acc: 0.714
Epoch: 32/50
Epoch 1/1
Test-Data: Prec: 0.696, Rec: 0.240, F1: 0.357, Acc: 0.714
Epoch: 33/50
Epoch 1/1
Test-Data: Prec: 0.696, Rec: 0.240, F1: 0.357, Acc: 0.714
Epoch: 34/50
Epoch 1/1
Test-Data: Prec: 0.697, Rec:

Test-Data: Prec: 0.683, Rec: 0.581, F1: 0.628, Acc: 0.772
Epoch: 18/50
Epoch 1/1
Test-Data: Prec: 0.694, Rec: 0.483, F1: 0.570, Acc: 0.759
Epoch: 19/50
Epoch 1/1
Test-Data: Prec: 0.672, Rec: 0.453, F1: 0.541, Acc: 0.746
Epoch: 20/50
Epoch 1/1
Test-Data: Prec: 0.670, Rec: 0.539, F1: 0.598, Acc: 0.760
Epoch: 21/50
Epoch 1/1
Test-Data: Prec: 0.673, Rec: 0.517, F1: 0.585, Acc: 0.757
Epoch: 22/50
Epoch 1/1
Test-Data: Prec: 0.667, Rec: 0.524, F1: 0.587, Acc: 0.756
Epoch: 23/50
Epoch 1/1
Test-Data: Prec: 0.682, Rec: 0.562, F1: 0.616, Acc: 0.769
Epoch: 24/50
Epoch 1/1
Test-Data: Prec: 0.665, Rec: 0.498, F1: 0.570, Acc: 0.751
Epoch: 25/50
Epoch 1/1
Test-Data: Prec: 0.679, Rec: 0.554, F1: 0.610, Acc: 0.766
Epoch: 26/50
Epoch 1/1
Test-Data: Prec: 0.677, Rec: 0.509, F1: 0.581, Acc: 0.757
Epoch: 27/50
Epoch 1/1
Test-Data: Prec: 0.700, Rec: 0.532, F1: 0.604, Acc: 0.770
Epoch: 28/50
Epoch 1/1
Test-Data: Prec: 0.696, Rec: 0.498, F1: 0.581, Acc: 0.762
Epoch: 29/50
Epoch 1/1
Test-Data: Prec: 0.711, Rec:

Test-Data: Prec: 0.683, Rec: 0.685, F1: 0.684, Acc: 0.791
Epoch: 13/50
Epoch 1/1
Test-Data: Prec: 0.711, Rec: 0.637, F1: 0.672, Acc: 0.795
Epoch: 14/50
Epoch 1/1
Test-Data: Prec: 0.698, Rec: 0.633, F1: 0.664, Acc: 0.788
Epoch: 15/50
Epoch 1/1
Test-Data: Prec: 0.680, Rec: 0.715, F1: 0.697, Acc: 0.795
Epoch: 16/50
Epoch 1/1
Test-Data: Prec: 0.718, Rec: 0.715, F1: 0.717, Acc: 0.813
Epoch: 17/50
Epoch 1/1
Test-Data: Prec: 0.726, Rec: 0.596, F1: 0.654, Acc: 0.792
Epoch: 18/50
Epoch 1/1
Test-Data: Prec: 0.657, Rec: 0.753, F1: 0.702, Acc: 0.788
Epoch: 19/50
Epoch 1/1
Test-Data: Prec: 0.669, Rec: 0.764, F1: 0.713, Acc: 0.797
Epoch: 20/50
Epoch 1/1
Test-Data: Prec: 0.687, Rec: 0.708, F1: 0.697, Acc: 0.797
Epoch: 21/50
Epoch 1/1
Test-Data: Prec: 0.655, Rec: 0.727, F1: 0.689, Acc: 0.783
Epoch: 22/50
Epoch 1/1
Test-Data: Prec: 0.700, Rec: 0.674, F1: 0.687, Acc: 0.797
Epoch: 23/50
Epoch 1/1
Test-Data: Prec: 0.682, Rec: 0.659, F1: 0.670, Acc: 0.786
Epoch: 24/50
Epoch 1/1
Test-Data: Prec: 0.677, Rec:

Test-Data: Prec: 0.571, Rec: 0.060, F1: 0.108, Acc: 0.675
Epoch: 8/50
Epoch 1/1
Test-Data: Prec: 0.488, Rec: 0.079, F1: 0.135, Acc: 0.668
Epoch: 9/50
Epoch 1/1
Test-Data: Prec: 0.556, Rec: 0.075, F1: 0.132, Acc: 0.675
Epoch: 10/50
Epoch 1/1
Test-Data: Prec: 0.564, Rec: 0.116, F1: 0.193, Acc: 0.678
Epoch: 11/50
Epoch 1/1
Test-Data: Prec: 0.551, Rec: 0.101, F1: 0.171, Acc: 0.676
Epoch: 12/50
Epoch 1/1
Test-Data: Prec: 0.532, Rec: 0.124, F1: 0.201, Acc: 0.675
Epoch: 13/50
Epoch 1/1
Test-Data: Prec: 0.542, Rec: 0.120, F1: 0.196, Acc: 0.676
Epoch: 14/50
Epoch 1/1
model saved. F1 is 0.212766
Test-Data: Prec: 0.565, Rec: 0.131, F1: 0.213, Acc: 0.679
Epoch: 15/50
Epoch 1/1
Test-Data: Prec: 0.541, Rec: 0.124, F1: 0.201, Acc: 0.676
Epoch: 16/50
Epoch 1/1
model saved. F1 is 0.250000
Test-Data: Prec: 0.558, Rec: 0.161, F1: 0.250, Acc: 0.681
Epoch: 17/50
Epoch 1/1
Test-Data: Prec: 0.595, Rec: 0.094, F1: 0.162, Acc: 0.679
Epoch: 18/50
Epoch 1/1
Test-Data: Prec: 0.577, Rec: 0.112, F1: 0.188, Acc: 0.6

Test-Data: Prec: 0.658, Rec: 0.180, F1: 0.282, Acc: 0.698
Epoch: 3/50
Epoch 1/1
model saved. F1 is 0.293948
Test-Data: Prec: 0.637, Rec: 0.191, F1: 0.294, Acc: 0.697
Epoch: 4/50
Epoch 1/1
Test-Data: Prec: 0.667, Rec: 0.180, F1: 0.283, Acc: 0.699
Epoch: 5/50
Epoch 1/1
model saved. F1 is 0.347826
Test-Data: Prec: 0.634, Rec: 0.240, F1: 0.348, Acc: 0.703
Epoch: 6/50
Epoch 1/1
Test-Data: Prec: 0.696, Rec: 0.180, F1: 0.286, Acc: 0.703
Epoch: 7/50
Epoch 1/1
Test-Data: Prec: 0.643, Rec: 0.236, F1: 0.345, Acc: 0.704
Epoch: 8/50
Epoch 1/1
model saved. F1 is 0.371968
Test-Data: Prec: 0.663, Rec: 0.258, F1: 0.372, Acc: 0.712
Epoch: 9/50
Epoch 1/1
Test-Data: Prec: 0.671, Rec: 0.199, F1: 0.306, Acc: 0.703
Epoch: 10/50
Epoch 1/1
Test-Data: Prec: 0.667, Rec: 0.210, F1: 0.319, Acc: 0.704
Epoch: 11/50
Epoch 1/1
Test-Data: Prec: 0.659, Rec: 0.202, F1: 0.309, Acc: 0.702
Epoch: 12/50
Epoch 1/1
Test-Data: Prec: 0.647, Rec: 0.165, F1: 0.263, Acc: 0.694
Epoch: 13/50
Epoch 1/1
model saved. F1 is 0.397906
Test

model saved. F1 is 0.459658
Test-Data: Prec: 0.662, Rec: 0.352, F1: 0.460, Acc: 0.726
unfreezing dense_90
---------------------------------------
0 input_30 False
1 bidirectional_30 False
2 leaky_re_lu_146 False
3 conv1d_88 True
4 conv1d_89 True
5 conv1d_90 True
6 leaky_re_lu_147 True
7 leaky_re_lu_148 True
8 leaky_re_lu_149 True
9 global_max_pooling1d_88 True
10 global_max_pooling1d_89 True
11 global_max_pooling1d_90 True
12 dropout_88 True
13 dropout_89 True
14 dropout_90 True
15 concatenate_30 True
16 dense_88 True
17 leaky_re_lu_150 True
18 dense_90 True
Epoch: 1/50
Epoch 1/1
Test-Data: Prec: 0.690, Rec: 0.225, F1: 0.339, Acc: 0.710
Epoch: 2/50
Epoch 1/1
Test-Data: Prec: 0.664, Rec: 0.318, F1: 0.430, Acc: 0.722
Epoch: 3/50
Epoch 1/1
Test-Data: Prec: 0.683, Rec: 0.322, F1: 0.438, Acc: 0.726
Epoch: 4/50
Epoch 1/1
model saved. F1 is 0.488038
Test-Data: Prec: 0.675, Rec: 0.382, F1: 0.488, Acc: 0.735
Epoch: 5/50
Epoch 1/1
Test-Data: Prec: 0.705, Rec: 0.367, F1: 0.483, Acc: 0.740
Epoch: 

Test-Data: Prec: 0.708, Rec: 0.446, F1: 0.547, Acc: 0.756
Epoch: 46/50
Epoch 1/1
Test-Data: Prec: 0.671, Rec: 0.558, F1: 0.609, Acc: 0.764
Epoch: 47/50
Epoch 1/1
Test-Data: Prec: 0.656, Rec: 0.513, F1: 0.576, Acc: 0.750
Epoch: 48/50
Epoch 1/1
Test-Data: Prec: 0.683, Rec: 0.532, F1: 0.598, Acc: 0.764
Epoch: 49/50
Epoch 1/1
Test-Data: Prec: 0.665, Rec: 0.521, F1: 0.584, Acc: 0.755
Epoch: 50/50
Epoch 1/1
Test-Data: Prec: 0.676, Rec: 0.532, F1: 0.595, Acc: 0.761
unfreezing dense_90
---------------------------------------
0 input_30 False
1 bidirectional_30 True
2 leaky_re_lu_146 True
3 conv1d_88 True
4 conv1d_89 True
5 conv1d_90 True
6 leaky_re_lu_147 True
7 leaky_re_lu_148 True
8 leaky_re_lu_149 True
9 global_max_pooling1d_88 True
10 global_max_pooling1d_89 True
11 global_max_pooling1d_90 True
12 dropout_88 True
13 dropout_89 True
14 dropout_90 True
15 concatenate_30 True
16 dense_88 True
17 leaky_re_lu_150 True
18 dense_90 True
Epoch: 1/50
Epoch 1/1
Test-Data: Prec: 0.704, Rec: 0.517, F1

Test-Data: Prec: 0.708, Rec: 0.599, F1: 0.649, Acc: 0.786
Epoch: 41/50
Epoch 1/1
Test-Data: Prec: 0.730, Rec: 0.577, F1: 0.644, Acc: 0.790
Epoch: 42/50
Epoch 1/1
Test-Data: Prec: 0.717, Rec: 0.625, F1: 0.668, Acc: 0.795
Epoch: 43/50
Epoch 1/1
Test-Data: Prec: 0.762, Rec: 0.577, F1: 0.657, Acc: 0.801
Epoch: 44/50
Epoch 1/1
Test-Data: Prec: 0.710, Rec: 0.678, F1: 0.693, Acc: 0.802
Epoch: 45/50
Epoch 1/1
 30/132 [=====>........................] - ETA: 22s - loss: 0.0351 - acc: 0.9875