In [1]:
# libraries
import keras
import numpy as np
import pandas as pd
import seaborn as sns
import matplotlib.pylab as plt
from sklearn.model_selection import train_test_split
from sklearn.utils import resample

In [2]:
# read csv
df = pd.read_csv('../input/dhanvarsha/Interview_round_dataset.csv') 

In [3]:
# check dataframe
df.head()

Unnamed: 0,Sr_No,Feature_1,Feature_2,Feature_3,Feature_4,Feature_5,Feature_6,Feature_7,Feature_8,Feature_9,...,Feature_21,Feature_22,Feature_23,Feature_24,Feature_25,Feature_26,Feature_27,Feature_28,Feature_29,Target_flag
0,26791,-1.101444,0.780847,-0.150606,0.044194,2.779388,3.826857,0.505011,0.448779,0.42835,...,-0.318102,-0.110152,-0.045112,1.008263,0.237554,-0.296286,0.072267,-0.072137,20.13,0
1,91547,0.905274,0.080784,1.547836,2.570243,-0.10063,2.017006,-0.840341,0.709949,-0.016073,...,0.064652,0.504713,0.201644,-0.61886,-0.043392,0.062233,0.117348,0.026562,6.08,0
2,281304,2.021258,0.153611,-1.710915,1.198175,0.602164,-0.6523,0.488583,-0.218795,0.048074,...,0.069765,0.385032,-0.0425,-0.405255,0.455746,-0.484028,-0.021226,-0.077854,1.99,0
3,83873,1.191927,-0.039543,0.537142,0.697681,-0.402698,-0.052089,-0.224193,0.045363,0.317585,...,-0.069138,0.024003,-0.133153,0.087927,0.580386,0.411193,-0.015511,0.000913,12.31,0
4,252334,0.121001,1.015667,-0.404468,-0.539553,0.988905,-0.84864,0.959057,-0.120624,-0.08233,...,-0.337542,-0.819971,0.094267,0.566302,-0.407398,0.112873,0.22301,0.085447,1.79,0


In [4]:
# check shape of dataframe
df.shape

(227198, 31)

In [5]:
# check columns of dataframe
df.columns

Index(['Sr_No', 'Feature_1', 'Feature_2', 'Feature_3', 'Feature_4',
       'Feature_5', 'Feature_6', 'Feature_7', 'Feature_8', 'Feature_9',
       'Feature_10', 'Feature_11', 'Feature_12', 'Feature_13', 'Feature_14',
       'Feature_15', 'Feature_16', 'Feature_17', 'Feature_18', 'Feature_19',
       'Feature_20', 'Feature_21', 'Feature_22', 'Feature_23', 'Feature_24',
       'Feature_25', 'Feature_26', 'Feature_27', 'Feature_28', 'Feature_29',
       'Target_flag'],
      dtype='object')

In [6]:
# check info of dataframe
df.info()

<class 'pandas.core.frame.DataFrame'>
RangeIndex: 227198 entries, 0 to 227197
Data columns (total 31 columns):
 #   Column       Non-Null Count   Dtype  
---  ------       --------------   -----  
 0   Sr_No        227198 non-null  int64  
 1   Feature_1    227198 non-null  float64
 2   Feature_2    227198 non-null  float64
 3   Feature_3    227198 non-null  float64
 4   Feature_4    227198 non-null  float64
 5   Feature_5    227198 non-null  float64
 6   Feature_6    227198 non-null  float64
 7   Feature_7    227198 non-null  float64
 8   Feature_8    227198 non-null  float64
 9   Feature_9    227198 non-null  float64
 10  Feature_10   227198 non-null  float64
 11  Feature_11   227198 non-null  float64
 12  Feature_12   227198 non-null  float64
 13  Feature_13   227198 non-null  float64
 14  Feature_14   227198 non-null  float64
 15  Feature_15   227198 non-null  float64
 16  Feature_16   227198 non-null  float64
 17  Feature_17   227198 non-null  float64
 18  Feature_18   227198 non-

In [7]:
# check number of unique values in each column
df.nunique(axis=0)

Sr_No          227198
Feature_1      220792
Feature_2      220792
Feature_3      220792
Feature_4      220794
Feature_5      220794
Feature_6      220790
Feature_7      220791
Feature_8      220784
Feature_9      220793
Feature_10     220785
Feature_11     220787
Feature_12     220791
Feature_13     220795
Feature_14     220792
Feature_15     220791
Feature_16     220785
Feature_17     220785
Feature_18     220792
Feature_19     220790
Feature_20     220778
Feature_21     220768
Feature_22     220787
Feature_23     220770
Feature_24     220789
Feature_25     220785
Feature_26     220786
Feature_27     220756
Feature_28     220721
Feature_29      29283
Target_flag         2
dtype: int64

In [8]:
# check target variable distribution
df['Target_flag'].value_counts()

0    226806
1       392
Name: Target_flag, dtype: int64

As seen from this cell, the dataset is highly imbalanced. While working on an imbalanced dataset accuracy is not an appropriate measure to evaluate model performance. For eg: A classifier which achieves an accuracy of 98 % with an event rate of 2 % is not accurate, if it classifies all instances as the majority class. And eliminates the 2 % minority class observations as noise.

# Baseline Model

We start by creating a base model.

In [9]:
# seperate the features and target variables
labels = df.columns[1:30]
X = df[labels]
y = df['Target_flag']

# create train-test split with stratify  
X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.1, random_state=7, stratify=y)

In [10]:
# check shape of created train-test split
print(X_train.shape)
print(y_train.shape)
print(X_test.shape)
print(y_test.shape)

(204478, 29)
(204478,)
(22720, 29)
(22720,)


In [11]:
# define the different metrics we will be using
metrics = [
      keras.metrics.TruePositives(name='tp'),
      keras.metrics.FalsePositives(name='fp'),
      keras.metrics.TrueNegatives(name='tn'),
      keras.metrics.FalseNegatives(name='fn'),
      keras.metrics.BinaryAccuracy(name='accuracy'),
      keras.metrics.Precision(name='precision'),
      keras.metrics.Recall(name='recall'),
      keras.metrics.AUC(name='auc'),
]

# define batch size
batch_size = 2048

In general, you should strive for a small batch size (e.g. 32). Our case is a bit specific, we have highly imbalanced data, so we’ll give a fair chance to each batch before the weights are updated.

In [12]:
# define our model
def build_model(train_data, metrics=metrics):
    
    model = keras.Sequential([
    keras.layers.Dense(units=29,activation='relu',input_shape=(train_data.shape[-1],)),
    keras.layers.BatchNormalization(),
    keras.layers.Dropout(0.25),
    keras.layers.Dense(units=29,activation='relu'),
    keras.layers.BatchNormalization(),
    keras.layers.Dropout(0.25),
    keras.layers.Dense(units=29,activation='relu'),
    keras.layers.BatchNormalization(),
    keras.layers.Dropout(0.25),
    keras.layers.Dense(units=1, activation='sigmoid'),
    ])
    
    # compile our model
    model.compile(
    optimizer=keras.optimizers.Adam(lr=0.001),
    loss=keras.losses.BinaryCrossentropy(),
    metrics=metrics
    )

    return model

In [13]:
# training the model
model = build_model(X_train)
history = model.fit(
    X_train,
    y_train,
    batch_size=batch_size,
    epochs=20,
    validation_split=0.05,
    shuffle=True,
    verbose=1
)

Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20


In [14]:
# model summary
model.summary()

Model: "sequential"
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
dense (Dense)                (None, 29)                870       
_________________________________________________________________
batch_normalization (BatchNo (None, 29)                116       
_________________________________________________________________
dropout (Dropout)            (None, 29)                0         
_________________________________________________________________
dense_1 (Dense)              (None, 29)                870       
_________________________________________________________________
batch_normalization_1 (Batch (None, 29)                116       
_________________________________________________________________
dropout_1 (Dropout)          (None, 29)                0         
_________________________________________________________________
dense_2 (Dense)              (None, 29)                8

In [15]:
# evaluate model performance on unseen data
model.evaluate(X_test, y_test, batch_size=batch_size)



[0.00541849248111248,
 23.0,
 2.0,
 22679.0,
 16.0,
 0.9992077350616455,
 0.9200000166893005,
 0.5897436141967773,
 0.9225940704345703]

After trying a lot of combinations of different hyperparameters, the model performance is not that great in terms of different metrics. Let's explore weighted model next.

# Weighted Model

We have more examples of negative class compared to the positive class. Let’s force our model to pay attention to the underrepresented class. We can do that by passing weights for each class.

In [16]:
# get count of positive and negative class
negative_class, positive_class = np.bincount(df.Target_flag)
print("Count of Negative Instance, Positive Instance :", negative_class, positive_class)

# get number of total examples
total_count = len(df.Target_flag)
print("Total Examples :", total_count)

# set weight for majority class
weight_negative = (1 / negative_class) * (total_count) / 2.0
print("Weight for Majority Class :", weight_negative)

# set weight for minority class
weight_positive = (1 / positive_class) * (total_count) / 2.0
print("Weight for Minority Class :", weight_positive)

class_weights = {0: weight_negative, 1: weight_positive}

Count of Negative Instance, Positive Instance : 226806 392
Total Examples : 227198
Weight for Majority Class : 0.5008641746691005
Weight for Minority Class : 289.79336734693874


In [17]:
# training the model
model = build_model(X_train, metrics=metrics)

history = model.fit(
    X_train,
    y_train,
    batch_size=batch_size,
    epochs=20,
    validation_split=0.05,
    shuffle=True,
    verbose=1,
    class_weight=class_weights
)

Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20


In [18]:
# evaluate model performance on unseen data
model.evaluate(X_test, y_test, batch_size=batch_size)



[0.06097414717078209,
 33.0,
 155.0,
 22526.0,
 6.0,
 0.9929137229919434,
 0.17553190886974335,
 0.8461538553237915,
 0.9877967834472656]

After trying a lot of combinations of different hyperparameters,although there has been considerable improvement in other metrics, the precision of the model is found to be extremely low.

# Oversample Minority Class

Over-Sampling increases the number of instances in the minority class by randomly replicating them in order to present a higher representation of the minority class in the sample.

In [19]:
# seperate the features and target variables
labels = df.columns[1:30]
X = df[labels]
y = df['Target_flag']

# create train-test split with stratify  
X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.1, random_state=7, stratify=y)
X = pd.concat([X_train, y_train], axis=1)

# seperate the majority and minority classes
negative_class = X[X.Target_flag == 0]
positive_class = X[X.Target_flag == 1]

In [20]:
# length of minority class
print("Length of Minority Class :", len(positive_class))

Length of Minority Class : 353


In [21]:
# upsampling minority class
positive_upsampled = resample(positive_class,
                          replace=True,
                          n_samples=len(negative_class),
                          random_state=7)

In [22]:
# length of upsampled  minority class
print("Length of Upsampled Minority Class :", len(positive_upsampled))

Length of Upsampled Minority Class : 204125


In [23]:
# combine negative class and upsampled positive class
oversampled_data = pd.concat([negative_class, positive_upsampled], axis=0)

In [24]:
# check new data
oversampled_data

Unnamed: 0,Feature_1,Feature_2,Feature_3,Feature_4,Feature_5,Feature_6,Feature_7,Feature_8,Feature_9,Feature_10,...,Feature_21,Feature_22,Feature_23,Feature_24,Feature_25,Feature_26,Feature_27,Feature_28,Feature_29,Target_flag
22186,-0.923124,-0.341242,-1.207207,-4.585854,1.033464,-0.348103,0.375391,0.476410,0.010088,-1.615664,...,0.020497,0.595268,0.014555,-0.349121,-0.284302,-0.950774,0.396593,0.132040,31.20,0
221886,-2.012659,-0.195138,2.002589,-0.536759,-0.299436,-0.102073,-1.214421,-2.373126,0.437249,-1.480027,...,-1.480635,0.423519,0.985501,0.661672,0.037246,0.817614,0.332701,0.000969,30.00,0
56887,0.676771,-1.350408,0.694895,0.221955,-1.175833,0.639744,-0.620011,0.383131,1.168366,-0.395008,...,-0.046101,-0.499162,-0.139720,-0.263602,-0.064527,0.954492,-0.077430,0.036478,251.99,0
62117,-0.639618,0.560891,1.487671,-1.534404,-0.569355,0.239651,-0.416560,0.714844,0.676186,-1.638879,...,0.173382,0.632067,-0.177002,-0.258803,0.065025,-0.695940,0.014810,-0.036132,1.00,0
9214,-1.407331,1.607340,0.464506,-0.334922,0.087982,-0.851665,0.467961,0.574703,-0.767013,-1.337393,...,-0.139035,-0.583866,-0.338291,-0.097976,0.748038,-0.338749,-0.331576,-0.099529,1.00,0
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
164077,0.364377,1.443523,-2.220907,2.036985,-1.237055,-1.728161,-2.058582,0.358895,-1.393306,-3.505790,...,0.402730,-0.132129,-0.032977,0.460861,0.560404,0.409366,0.539668,0.296918,0.76,1
200118,-1.548788,1.808698,-0.953509,2.213085,-2.015728,-0.913457,-2.356013,1.197169,-1.678374,-3.538650,...,0.855138,0.774745,0.059037,0.343200,-0.468938,-0.278338,0.625922,0.395573,76.94,1
125611,-2.740483,3.658095,-4.110636,5.340242,-2.666775,-0.092782,-4.388699,-0.280133,-2.821895,-4.466284,...,2.417495,-0.097712,0.382155,-0.154757,-0.403956,0.277895,0.830062,0.218690,112.33,1
72212,-3.975939,-1.244939,-3.707414,4.544772,4.050676,-3.407679,-5.063118,1.007042,-3.190158,-4.250717,...,1.059737,-0.037395,0.348707,-0.162929,0.410531,-0.123612,0.877424,0.667568,8.30,1


In [25]:
# seperate the features and target variables
labels = oversampled_data.columns[:30]
X = oversampled_data[labels]
y = oversampled_data['Target_flag']

# create train-test split with stratify
X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.1, random_state=7, stratify=y)

In [26]:
# check shape of created train-test split
print(X_train.shape)
print(X_test.shape)
print(y_train.shape)
print(y_test.shape)

(367425, 30)
(40825, 30)
(367425,)
(40825,)


In [27]:
# training the model
model = build_model(X_train, metrics=metrics)

history = model.fit(
    X_train,
    y_train,
    batch_size=batch_size,
    epochs=20,
    validation_split=0.05,
    shuffle=True,
    verbose=1
)

Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20


In [28]:
# evaluate model performance on unseen data
model.evaluate(X_test, y_test, batch_size=batch_size)



[1.8236469259136356e-05, 20413.0, 0.0, 20412.0, 0.0, 1.0, 1.0, 1.0, 1.0]

We can see considerable improvements now in our model performance. But oversampling increases the likelihood of overfitting since it replicates the minority class events.

# Undersample Majority Class

Undersampling aims to balance class distribution by randomly eliminating majority class examples. This is done until the majority and minority class instances are balanced out.
We’ll remove samples from the majority class and balance the data this way.

In [29]:
# seperate the features and target variables
labels = df.columns[1:30]
X = df[labels]
y = df['Target_flag']


# create train-test split with stratify  
X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.1, random_state=7, stratify=y)
X = pd.concat([X_train, y_train], axis=1)

# seperate the majority and minority classes
negative_class = X[X.Target_flag == 0]
positive_class = X[X.Target_flag == 1]

In [30]:
# length of majority class
print("Length of Majority Class :", len(negative_class))

Length of Majority Class : 204125


In [31]:
# downsampling majority class
negative_downsampled = resample(negative_class,
                          replace=False,
                          n_samples=len(positive_class),
                          random_state=7)

In [32]:
# length of downsampled majority class
print("Length of Downsampled Majority Class :", len(negative_downsampled))

Length of Downsampled Majority Class : 353


In [33]:
# combine negative dowsampled class and positive class
undersampled_data = pd.concat([negative_downsampled, positive_class], axis=0)

In [34]:
# check new data
undersampled_data

Unnamed: 0,Feature_1,Feature_2,Feature_3,Feature_4,Feature_5,Feature_6,Feature_7,Feature_8,Feature_9,Feature_10,...,Feature_21,Feature_22,Feature_23,Feature_24,Feature_25,Feature_26,Feature_27,Feature_28,Feature_29,Target_flag
193797,1.906400,-0.573265,-1.009407,0.792257,-0.198142,-0.067769,-0.192298,0.030639,1.420956,-0.131447,...,-0.365444,-0.867700,0.272260,0.590118,-0.178745,0.074378,-0.050384,-0.045986,58.68,0
143015,1.031841,-0.480074,1.284097,0.551383,-1.234127,-0.180908,-0.823551,0.095998,2.307650,-0.679066,...,-0.001148,0.236531,0.007198,0.420524,0.016228,1.075350,-0.064337,0.018270,73.80,0
44633,1.208691,-0.224328,0.318862,-0.317760,-0.630465,-0.565430,-0.305962,0.096606,0.182844,0.001888,...,0.077888,0.180560,0.029645,0.283920,0.117552,1.455968,-0.110750,-0.019538,4.99,0
135008,2.017787,-0.933999,-0.125465,-1.514940,-1.165311,-0.303344,-1.153623,0.077438,2.591155,-1.016055,...,0.241294,0.968823,0.185530,0.723452,-0.284142,-0.210828,0.067739,-0.020727,14.72,0
172548,-0.817895,-0.621163,2.106390,-1.394239,-0.621589,2.778371,0.006265,0.554697,-0.574781,0.058164,...,0.180020,0.918703,0.010010,-1.331956,-0.318719,-0.168814,-0.031983,-0.182348,176.50,0
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
52630,-0.419820,-1.155978,-2.092516,2.786750,0.736297,-0.167292,1.600027,-0.117427,-0.796954,-0.133950,...,0.480640,0.533517,1.284645,0.516131,-0.602941,-0.305024,-0.021363,0.129096,451.27,1
123402,-1.125092,3.682876,-6.556168,4.016731,-0.425571,-2.031210,-2.650137,1.131249,-2.946890,-4.816401,...,1.185580,1.348156,-0.053686,0.284122,-1.174469,-0.087832,0.718790,0.676216,0.76,1
181339,-0.443794,1.271395,1.206178,0.790371,0.418935,-0.848376,0.917691,-0.235511,-0.285692,-0.867900,...,0.119279,0.513479,-0.264243,0.443311,0.029516,-0.335141,-0.188815,-0.123391,5.09,1
165973,-5.488032,3.329561,-5.996296,3.601720,-2.023926,-1.737393,-4.396859,0.228394,-1.675884,-3.991785,...,1.719631,0.343209,0.133584,0.833340,-0.839776,0.502010,-1.937473,1.521218,0.01,1


In [35]:
# seperate the features and target variables
labels = undersampled_data.columns[:30]
X = undersampled_data[labels]
y = undersampled_data['Target_flag']

# create train-test split with stratify
X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.1, random_state=7, stratify=y)

In [36]:
# check shape of created train-test split
print(X_train.shape)
print(X_test.shape)
print(y_train.shape)
print(y_test.shape)

(635, 30)
(71, 30)
(635,)
(71,)


In [37]:
# training the model
model = build_model(X_train, metrics=metrics)

history = model.fit(
    X_train,
    y_train,
    batch_size=batch_size,
    epochs=400,
    validation_split=0.05,
    shuffle=True,
    verbose=1
)

Epoch 1/400
Epoch 2/400
Epoch 3/400
Epoch 4/400
Epoch 5/400
Epoch 6/400
Epoch 7/400
Epoch 8/400
Epoch 9/400
Epoch 10/400
Epoch 11/400
Epoch 12/400
Epoch 13/400
Epoch 14/400
Epoch 15/400
Epoch 16/400
Epoch 17/400
Epoch 18/400
Epoch 19/400
Epoch 20/400
Epoch 21/400
Epoch 22/400


Epoch 23/400
Epoch 24/400
Epoch 25/400
Epoch 26/400
Epoch 27/400
Epoch 28/400
Epoch 29/400
Epoch 30/400
Epoch 31/400
Epoch 32/400
Epoch 33/400
Epoch 34/400
Epoch 35/400
Epoch 36/400
Epoch 37/400
Epoch 38/400
Epoch 39/400
Epoch 40/400
Epoch 41/400
Epoch 42/400
Epoch 43/400


Epoch 44/400
Epoch 45/400
Epoch 46/400
Epoch 47/400
Epoch 48/400
Epoch 49/400
Epoch 50/400
Epoch 51/400
Epoch 52/400
Epoch 53/400
Epoch 54/400
Epoch 55/400
Epoch 56/400
Epoch 57/400
Epoch 58/400
Epoch 59/400
Epoch 60/400
Epoch 61/400
Epoch 62/400
Epoch 63/400
Epoch 64/400


Epoch 65/400
Epoch 66/400
Epoch 67/400
Epoch 68/400
Epoch 69/400
Epoch 70/400
Epoch 71/400
Epoch 72/400
Epoch 73/400
Epoch 74/400
Epoch 75/400
Epoch 76/400
Epoch 77/400
Epoch 78/400
Epoch 79/400
Epoch 80/400
Epoch 81/400
Epoch 82/400
Epoch 83/400
Epoch 84/400
Epoch 85/400


Epoch 86/400
Epoch 87/400
Epoch 88/400
Epoch 89/400
Epoch 90/400
Epoch 91/400
Epoch 92/400
Epoch 93/400
Epoch 94/400
Epoch 95/400
Epoch 96/400
Epoch 97/400
Epoch 98/400
Epoch 99/400
Epoch 100/400
Epoch 101/400
Epoch 102/400
Epoch 103/400
Epoch 104/400
Epoch 105/400
Epoch 106/400


Epoch 107/400
Epoch 108/400
Epoch 109/400
Epoch 110/400
Epoch 111/400
Epoch 112/400
Epoch 113/400
Epoch 114/400
Epoch 115/400
Epoch 116/400
Epoch 117/400
Epoch 118/400
Epoch 119/400
Epoch 120/400
Epoch 121/400
Epoch 122/400
Epoch 123/400
Epoch 124/400
Epoch 125/400
Epoch 126/400
Epoch 127/400


Epoch 128/400
Epoch 129/400
Epoch 130/400
Epoch 131/400
Epoch 132/400
Epoch 133/400
Epoch 134/400
Epoch 135/400
Epoch 136/400
Epoch 137/400
Epoch 138/400
Epoch 139/400
Epoch 140/400
Epoch 141/400
Epoch 142/400
Epoch 143/400
Epoch 144/400
Epoch 145/400
Epoch 146/400
Epoch 147/400
Epoch 148/400


Epoch 149/400
Epoch 150/400
Epoch 151/400
Epoch 152/400
Epoch 153/400
Epoch 154/400
Epoch 155/400
Epoch 156/400
Epoch 157/400
Epoch 158/400
Epoch 159/400
Epoch 160/400
Epoch 161/400
Epoch 162/400
Epoch 163/400
Epoch 164/400
Epoch 165/400
Epoch 166/400
Epoch 167/400
Epoch 168/400
Epoch 169/400


Epoch 170/400
Epoch 171/400
Epoch 172/400
Epoch 173/400
Epoch 174/400
Epoch 175/400
Epoch 176/400
Epoch 177/400
Epoch 178/400
Epoch 179/400
Epoch 180/400
Epoch 181/400
Epoch 182/400
Epoch 183/400
Epoch 184/400
Epoch 185/400
Epoch 186/400
Epoch 187/400
Epoch 188/400
Epoch 189/400


Epoch 190/400
Epoch 191/400
Epoch 192/400
Epoch 193/400
Epoch 194/400
Epoch 195/400
Epoch 196/400
Epoch 197/400
Epoch 198/400
Epoch 199/400
Epoch 200/400
Epoch 201/400
Epoch 202/400
Epoch 203/400
Epoch 204/400
Epoch 205/400
Epoch 206/400
Epoch 207/400
Epoch 208/400
Epoch 209/400
Epoch 210/400
Epoch 211/400


Epoch 212/400
Epoch 213/400
Epoch 214/400
Epoch 215/400
Epoch 216/400
Epoch 217/400
Epoch 218/400
Epoch 219/400
Epoch 220/400
Epoch 221/400
Epoch 222/400
Epoch 223/400
Epoch 224/400
Epoch 225/400
Epoch 226/400
Epoch 227/400
Epoch 228/400
Epoch 229/400
Epoch 230/400
Epoch 231/400
Epoch 232/400


Epoch 233/400
Epoch 234/400
Epoch 235/400
Epoch 236/400
Epoch 237/400
Epoch 238/400
Epoch 239/400
Epoch 240/400
Epoch 241/400
Epoch 242/400
Epoch 243/400
Epoch 244/400
Epoch 245/400
Epoch 246/400
Epoch 247/400
Epoch 248/400
Epoch 249/400
Epoch 250/400
Epoch 251/400
Epoch 252/400
Epoch 253/400


Epoch 254/400
Epoch 255/400
Epoch 256/400
Epoch 257/400
Epoch 258/400
Epoch 259/400
Epoch 260/400
Epoch 261/400
Epoch 262/400
Epoch 263/400
Epoch 264/400
Epoch 265/400
Epoch 266/400
Epoch 267/400
Epoch 268/400
Epoch 269/400
Epoch 270/400
Epoch 271/400
Epoch 272/400
Epoch 273/400
Epoch 274/400


Epoch 275/400
Epoch 276/400
Epoch 277/400
Epoch 278/400
Epoch 279/400
Epoch 280/400
Epoch 281/400
Epoch 282/400
Epoch 283/400
Epoch 284/400
Epoch 285/400
Epoch 286/400
Epoch 287/400
Epoch 288/400
Epoch 289/400
Epoch 290/400
Epoch 291/400
Epoch 292/400
Epoch 293/400
Epoch 294/400
Epoch 295/400


Epoch 296/400
Epoch 297/400
Epoch 298/400
Epoch 299/400
Epoch 300/400
Epoch 301/400
Epoch 302/400
Epoch 303/400
Epoch 304/400
Epoch 305/400
Epoch 306/400
Epoch 307/400
Epoch 308/400
Epoch 309/400
Epoch 310/400
Epoch 311/400
Epoch 312/400
Epoch 313/400
Epoch 314/400
Epoch 315/400
Epoch 316/400


Epoch 317/400
Epoch 318/400
Epoch 319/400
Epoch 320/400
Epoch 321/400
Epoch 322/400
Epoch 323/400
Epoch 324/400
Epoch 325/400
Epoch 326/400
Epoch 327/400
Epoch 328/400
Epoch 329/400
Epoch 330/400
Epoch 331/400
Epoch 332/400
Epoch 333/400
Epoch 334/400
Epoch 335/400
Epoch 336/400
Epoch 337/400


Epoch 338/400
Epoch 339/400
Epoch 340/400
Epoch 341/400
Epoch 342/400
Epoch 343/400
Epoch 344/400
Epoch 345/400
Epoch 346/400
Epoch 347/400
Epoch 348/400
Epoch 349/400
Epoch 350/400
Epoch 351/400
Epoch 352/400
Epoch 353/400
Epoch 354/400
Epoch 355/400
Epoch 356/400
Epoch 357/400
Epoch 358/400


Epoch 359/400
Epoch 360/400
Epoch 361/400
Epoch 362/400
Epoch 363/400
Epoch 364/400
Epoch 365/400
Epoch 366/400
Epoch 367/400
Epoch 368/400
Epoch 369/400
Epoch 370/400
Epoch 371/400
Epoch 372/400
Epoch 373/400
Epoch 374/400
Epoch 375/400
Epoch 376/400
Epoch 377/400
Epoch 378/400
Epoch 379/400


Epoch 380/400
Epoch 381/400
Epoch 382/400
Epoch 383/400
Epoch 384/400
Epoch 385/400
Epoch 386/400
Epoch 387/400
Epoch 388/400
Epoch 389/400
Epoch 390/400
Epoch 391/400
Epoch 392/400
Epoch 393/400
Epoch 394/400
Epoch 395/400
Epoch 396/400
Epoch 397/400
Epoch 398/400
Epoch 399/400
Epoch 400/400




In [38]:
# evaluate model performance on unseen data
model.evaluate(X_test, y_test, batch_size=batch_size)



[0.161886066198349,
 32.0,
 1.0,
 34.0,
 4.0,
 0.9295774698257446,
 0.9696969985961914,
 0.8888888955116272,
 0.982539713382721]

We finally achieve good results across all metrics. We save the weights of this model into .h5 file 

In [39]:
# save the model weights to .h5 file
model.save_weights('trained_weights_400eps_tauc0.98.h5')

In [40]:
# save model
model.save('trained_model_object.h5')