In [18]:
import numpy as np
import pandas as pd
import os

from keras.models import Sequential
from keras.layers import Dense
from keras.wrappers.scikit_learn import KerasClassifier

from sklearn.model_selection import KFold
from sklearn.model_selection import cross_val_score
from sklearn.model_selection import StratifiedKFold

from sklearn.preprocessing import LabelEncoder
from sklearn.preprocessing import StandardScaler

from sklearn.pipeline import Pipeline

In [2]:
# Fixed seed: applied to NumPy's global RNG here and reused further down as
# the random_state of the StratifiedKFold splitters.
seed = 7
np.random.seed(seed)

In [4]:
# Read the header-less sonar CSV into a raw array, then split it column-wise:
# every column but the last is cast to float as a feature, and the last
# column is kept untouched as the label (it is label-encoded later on).
dataframe = pd.read_csv('sonar.csv', header=None)
dataset = dataframe.values
X, Y = dataset[:, :-1].astype(float), dataset[:, -1]

In [5]:
# Fit the label encoder on Y and convert Y to integer class codes in one step;
# `encoder` stays available (fitted) for later use.
encoder = LabelEncoder()
encoded_y = encoder.fit_transform(Y)

In [9]:
def create_baseline():
    """Build and compile the baseline network.

    Architecture: one hidden Dense layer of 60 ReLU units fed by 60 inputs,
    followed by a single sigmoid output unit. Both layers use the 'normal'
    weight initialiser.

    Returns:
        The Sequential model, compiled with binary cross-entropy loss, the
        Adam optimizer and accuracy as the reported metric.
    """
    hidden_layer = Dense(60, input_dim=60, init='normal', activation='relu')
    output_layer = Dense(1, init='normal', activation='sigmoid')
    network = Sequential([hidden_layer, output_layer])
    network.compile(
        loss='binary_crossentropy',
        optimizer='adam',
        metrics=['accuracy'],
    )
    return network

In [12]:
# Wrap the baseline model builder in the scikit-learn classifier adapter.
# NOTE(review): `nb_epoch` is the Keras 1 argument name; Keras 2 renamed it to
# `epochs` -- confirm against the installed Keras version.
estimator = KerasClassifier(build_fn=create_baseline, nb_epoch=100, batch_size=5, verbose=0)

# The scaler is a pipeline step, so it is fitted together with the classifier
# on whatever data cross_val_score hands to the pipeline.
estimators = [
    ('Scaler', StandardScaler()),
    ('mlp', estimator)
]
pipeline = Pipeline(estimators)

# 10 shuffled, stratified folds; the fixed seed keeps the splits repeatable.
kfold = StratifiedKFold(n_splits=10, shuffle=True, random_state=seed)
results = cross_val_score(pipeline, X, encoded_y, cv=kfold)
# Mean and standard deviation of the per-fold scores. Formatting through %s
# keeps the "mean std" output while being valid on both Python 2 and
# Python 3 (the bare print statement is a SyntaxError on Python 3).
print('%s %s' % (results.mean(), results.std()))

0.850649358842 0.0589354606026


In [13]:
# Rationale: by using a smaller network we force the network to perform rigid
# feature extraction. This will help us understand the importance of the
# features in the data.
def create_smaller():
    """Build and compile the reduced-width network.

    Architecture: one hidden Dense layer of 30 ReLU units fed by 60 inputs,
    followed by a single sigmoid output unit. Both layers use the 'normal'
    weight initialiser.

    Returns:
        The Sequential model, compiled with binary cross-entropy loss, the
        Adam optimizer and accuracy as the reported metric.
    """
    hidden_layer = Dense(30, input_dim=60, init='normal', activation='relu')
    output_layer = Dense(1, init='normal', activation='sigmoid')
    network = Sequential([hidden_layer, output_layer])
    network.compile(
        loss='binary_crossentropy',
        optimizer='adam',
        metrics=['accuracy'],
    )
    return network

In [14]:
# Wrap the smaller model builder in the scikit-learn classifier adapter.
# NOTE(review): `nb_epoch` is the Keras 1 argument name; Keras 2 renamed it to
# `epochs` -- confirm against the installed Keras version.
estimator = KerasClassifier(build_fn=create_smaller, nb_epoch=100, batch_size=5, verbose=0)

# The scaler is a pipeline step, so it is fitted together with the classifier
# on whatever data cross_val_score hands to the pipeline.
estimators = [
    ('Scaler', StandardScaler()),
    ('mlp', estimator)
]
pipeline = Pipeline(estimators)

# 10 shuffled, stratified folds; the fixed seed keeps the splits repeatable.
kfold = StratifiedKFold(n_splits=10, shuffle=True, random_state=seed)
results = cross_val_score(pipeline, X, encoded_y, cv=kfold)
# Mean and standard deviation of the per-fold scores. Formatting through %s
# keeps the "mean std" output while being valid on both Python 2 and
# Python 3 (the bare print statement is a SyntaxError on Python 3).
print('%s %s' % (results.mean(), results.std()))

0.860194813528 0.055167246433


In [21]:
def create_larger():
    """Build and compile the two-hidden-layer network.

    Architecture: two hidden Dense layers of 30 ReLU units each (the first
    fed by 60 inputs), followed by a single sigmoid output unit. All layers
    use the 'normal' weight initialiser.

    NOTE(review): the first hidden layer has 30 units, fewer than the
    baseline's 60, so "larger" appears to refer to depth only -- confirm
    this is intended.

    Returns:
        The Sequential model, compiled with binary cross-entropy loss, the
        Adam optimizer and accuracy as the reported metric.
    """
    first_hidden = Dense(30, input_dim=60, init='normal', activation='relu')
    second_hidden = Dense(30, init='normal', activation='relu')
    output_layer = Dense(1, init='normal', activation='sigmoid')
    network = Sequential([first_hidden, second_hidden, output_layer])
    network.compile(
        loss='binary_crossentropy',
        optimizer='adam',
        metrics=['accuracy'],
    )
    return network

In [22]:
# Wrap the two-hidden-layer model builder in the scikit-learn classifier adapter.
# NOTE(review): `nb_epoch` is the Keras 1 argument name; Keras 2 renamed it to
# `epochs` -- confirm against the installed Keras version.
estimator = KerasClassifier(build_fn=create_larger, nb_epoch=100, batch_size=5, verbose=0)

# The scaler is a pipeline step, so it is fitted together with the classifier
# on whatever data cross_val_score hands to the pipeline.
estimators = [
    ('Scaler', StandardScaler()),
    ('mlp', estimator)
]
pipeline = Pipeline(estimators)

# 10 shuffled, stratified folds; the fixed seed keeps the splits repeatable.
kfold = StratifiedKFold(n_splits=10, shuffle=True, random_state=seed)
results = cross_val_score(pipeline, X, encoded_y, cv=kfold)
# Mean and standard deviation of the per-fold scores. Formatting through %s
# keeps the "mean std" output while being valid on both Python 2 and
# Python 3 (the bare print statement is a SyntaxError on Python 3).
print('%s %s' % (results.mean(), results.std()))
# Spoken completion notice through the `say` shell command (presumably the
# macOS text-to-speech tool -- confirm the target platform). Kept as the
# cell's last expression, so its exit status is what the cell displays.
os.system('say "training complete"')

0.85543290834 0.0606926889009


0

In [20]:
# Second evaluation of the `create_smaller` network, using the same pipeline
# and fold settings as the other evaluation cells.
# NOTE(review): `nb_epoch` is the Keras 1 argument name; Keras 2 renamed it to
# `epochs` -- confirm against the installed Keras version.
estimator = KerasClassifier(build_fn=create_smaller, nb_epoch=100, batch_size=5, verbose=0)

# The scaler is a pipeline step, so it is fitted together with the classifier
# on whatever data cross_val_score hands to the pipeline.
estimators = [
    ('Scaler', StandardScaler()),
    ('mlp', estimator)
]
pipeline = Pipeline(estimators)

# 10 shuffled, stratified folds; the fixed seed keeps the splits repeatable.
kfold = StratifiedKFold(n_splits=10, shuffle=True, random_state=seed)
results = cross_val_score(pipeline, X, encoded_y, cv=kfold)
# Mean and standard deviation of the per-fold scores. Formatting through %s
# keeps the "mean std" output while being valid on both Python 2 and
# Python 3 (the bare print statement is a SyntaxError on Python 3).
print('%s %s' % (results.mean(), results.std()))
# Spoken completion notice through the `say` shell command (presumably the
# macOS text-to-speech tool -- confirm the target platform). Kept as the
# cell's last expression, so its exit status is what the cell displays.
os.system('say "training complete"')

0.860194813528 0.055167246433


0