# Neural Network Implementation

In [None]:
import numpy as np
import pandas as pd

import warnings
warnings.filterwarnings('ignore')

import lightgbm

from sklearn.externals import joblib
from sklearn.model_selection import StratifiedKFold
from sklearn.preprocessing import MinMaxScaler, LabelBinarizer, Imputer
from sklearn.utils import class_weight
#from category_encoders.hashing import HashingEncoder
from keras.layers import BatchNormalization, Dropout, Flatten, Dense
from keras.models import Sequential
from keras.layers import LeakyReLU
from keras.optimizers import Adam

from IPython.display import display

from utils import *

In [None]:
pd.set_option('display.max_columns', 500)
pd.set_option('display.max_rows', 500)
%load_ext autoreload
%autoreload 2
%matplotlib inline

## Load Data

In [None]:
# Read the training CSV and report its (rows, columns) shape.
train = pd.read_csv(filepath_or_buffer='input/train.csv')
print(train.shape)

In [None]:
# Read the test CSV and report its (rows, columns) shape.
test = pd.read_csv(filepath_or_buffer='input/test.csv')
print(test.shape)

## Preprocessing

Removing service columns (the `SK_ID_CURR` identifier and the `TARGET` label)

In [None]:
# Number of training rows; presumably used later to split the combined frame again — TODO confirm.
train_size = len(train)
# Keep the label as a one-column DataFrame, separate from the remaining columns.
targets = train.loc[:, ['TARGET']]
# Remove the identifier and the label from `train` in place.
train.drop(['SK_ID_CURR', 'TARGET'], axis=1, inplace=True)

In [None]:
# Hold on to the identifiers, then rebind `test` to a frame without that column.
test_ids = test.loc[:, 'SK_ID_CURR']
test = test.drop('SK_ID_CURR', axis=1)

In [None]:
# Stack the train rows on top of the test rows so the cells below preprocess both together.
# The original row labels are kept, so index values repeat between the two parts.
data = pd.concat(objs=[train, test], axis=0)

Removing columns with too many missing values

In [None]:
# Neither helper is defined in this notebook; presumably both come from the star-import of `utils`.
# Presumably: per-column missing-value statistics, then the labels of the columns to discard — TODO confirm.
missing_vals = compute_missing_values(data)
to_remove = idx_of_missing_values(missing_vals)
# Drop the selected columns from `data` in place.
data.drop(to_remove, axis=1, inplace=True)

Categorical Features

In [None]:
# One-hot encode the object/category-typed columns; other columns pass through unchanged.
data = pd.get_dummies(data=data)

Numerical Features Imputation

In [None]:
# Names of every float64 column; these are the columns imputed and scaled in the following cells.
numerical = list(data.select_dtypes(include='float64').columns)

In [None]:
# Fill missing values with the column median, so the fill value is not that sensitive to outliers.
# NOTE(review): `Imputer` was removed from scikit-learn in 0.22; `sklearn.impute.SimpleImputer`
# is its replacement if the environment is ever upgraded.
imputer = Imputer(strategy='median')
# Fit and transform only the numerical slice, so the result has exactly as many columns as
# the slice being assigned to. Transforming the whole frame returns one column per input
# column, which no longer matches `data[numerical]` once non-float columns are present.
data[numerical] = imputer.fit_transform(data[numerical])

Features Normalization

In [None]:
# Rescale every numerical column with a min-max scaler (default settings).
scaler = MinMaxScaler()
# Learn the per-column minimum and maximum, then apply the scaling to the same columns.
scaler.fit(data[numerical])
data[numerical] = scaler.transform(data[numerical])

Computing class weights

In [None]:
# `targets` is a one-column DataFrame; flatten it to a 1-D label array, since
# compute_class_weight works on 1-D labels rather than on a DataFrame.
target_values = np.asarray(targets).ravel()
# 'balanced' weights each class inversely to its frequency in the labels.
# `classes` and `y` are passed by keyword: recent scikit-learn releases no longer accept
# them positionally, and the keyword names are also valid on older releases.
class_weights = class_weight.compute_class_weight(
    'balanced', classes=np.unique(target_values), y=target_values
)
# Key each weight by its position in the sorted unique labels.
# Assumes the labels are exactly 0..k-1 so that position == class label — TODO confirm.
class_weights = dict(enumerate(class_weights))
class_weights

## Model

In [None]:
# Size the input layer from the preprocessed feature matrix. `train` still has the raw
# columns (before sparse columns were dropped and categoricals one-hot encoded), so its
# width does not describe what the network would actually be fed.
n_features = data.shape[1]

model = Sequential()

# First hidden block: the only one that has to declare the input shape.
model.add(Dense(512, input_shape=(n_features,)))
model.add(BatchNormalization())
model.add(LeakyReLU())

# Four more identical hidden blocks: Dense(512) -> BatchNormalization -> LeakyReLU.
for _block in range(4):
    model.add(Dense(512))
    model.add(BatchNormalization())
    model.add(LeakyReLU())

# Single sigmoid unit for the output.
model.add(Dense(1, activation='sigmoid'))
model.summary()

In [None]:
# Adam with a 1e-3 learning rate; binary cross-entropy loss, with accuracy reported as a metric.
optimizer = Adam(lr=1e-3)
model.compile(
    optimizer=optimizer,
    loss='binary_crossentropy',
    metrics=['accuracy'],
)

In [None]:
# TODO: train the model; pass the weights by keyword, e.g. model.fit(X, y, class_weight=class_weights)