# Classification with scikit-learn

Deep-learning classification on the __Pima Indians Diabetes dataset__

1) Perform classification using the scikit-learn library:
- <font color=red>KerasClassifier</font>
- <font color=red>k-fold cross validation</font>

In [1]:
import numpy
from tensorflow import keras
from tensorflow.keras.models import Sequential
from tensorflow.keras.layers import Dense
from tensorflow.keras.wrappers.scikit_learn import KerasClassifier
from sklearn.model_selection import cross_val_score
from sklearn.model_selection import StratifiedKFold

In [2]:
def create_model():
    """Build and compile the fully connected binary classifier.

    The network takes 8 input features and stacks three dense layers
    (12 and 8 ReLU units, then a single sigmoid unit). It is compiled with
    binary cross-entropy loss, the Adam optimizer and accuracy as metric.

    Returns:
        The compiled ``Sequential`` model.
    """
    network = Sequential([
        Dense(12, input_dim=8, activation='relu'),
        Dense(8, activation='relu'),
        Dense(1, activation='sigmoid'),
    ])
    network.compile(
        loss='binary_crossentropy',
        optimizer='adam',
        metrics=['accuracy'],
    )
    return network

In [3]:
# Read the comma-separated diabetes table into a 2-D numeric array.
dataset = numpy.loadtxt('Data/pima-indians-diabetes.csv', delimiter=',')

# The first eight columns are the model inputs; the ninth column is the target.
X, y = dataset[:, :8], dataset[:, 8]

In [4]:
# Expose the Keras network through the scikit-learn estimator interface;
# create_model is the factory the wrapper uses to construct the network.
model = KerasClassifier(
    build_fn=create_model,
    epochs=150,
    batch_size=10,
    verbose=0,
)

In [5]:
# Evaluate the wrapped model with 10-fold stratified cross-validation.
# The shuffle is seeded so the fold assignment is identical on every run;
# without random_state the reported mean depends on an arbitrary split.
# NOTE: network training itself is not seeded in this notebook, so the score
# can still vary somewhat between runs.
kfold = StratifiedKFold(n_splits=10, shuffle=True, random_state=7)
results = cross_val_score(model, X, y, cv=kfold)

# Mean of the per-fold scores.
print(results.mean())

0.7174982964992523


2) Perform classification using the scikit-learn library:
- <font color=red>KerasClassifier</font> _wraps the Keras model so it can be used as a scikit-learn estimator_
- <font color=red>k-fold cross validation</font> _to evaluate on multiple train/validation splits_
- <font color=red>GridSearchCV</font> _to search over combinations of hyperparameters_

In [6]:
import numpy
from tensorflow import keras
from tensorflow.keras import models, layers
from tensorflow.keras.wrappers.scikit_learn import KerasClassifier
from sklearn.model_selection import StratifiedKFold
from sklearn.model_selection import cross_val_score
from sklearn.model_selection import GridSearchCV

In [7]:
def create_model(optimizer='rmsprop', init='glorot_uniform'):
    """Build and compile the binary classifier for a given optimizer/initializer.

    The network takes 8 input features and stacks three dense layers
    (12 and 8 ReLU units, then a single sigmoid unit).

    Args:
        optimizer: Optimizer identifier forwarded to ``model.compile``.
        init: Kernel-initializer identifier applied to every dense layer.

    Returns:
        The compiled ``Sequential`` model.
    """
    model = models.Sequential()
    # `init` must be handed to each layer; otherwise the argument is ignored
    # and every value tried for it would build the same network.
    model.add(layers.Dense(12, input_dim=8, kernel_initializer=init, activation='relu'))
    model.add(layers.Dense(8, kernel_initializer=init, activation='relu'))
    model.add(layers.Dense(1, kernel_initializer=init, activation='sigmoid'))

    model.compile(loss='binary_crossentropy', optimizer=optimizer, metrics=['accuracy'])
    return model

In [8]:
# Read the comma-separated diabetes table into a 2-D numeric array.
dataset = numpy.loadtxt('Data/pima-indians-diabetes.csv', delimiter=',')

# The first eight columns are the model inputs; the ninth column is the target.
X, y = dataset[:, :8], dataset[:, 8]

In [9]:
# Expose the Keras network through the scikit-learn estimator interface.
# No epoch count is fixed here; epochs (and batch_size) are among the
# parameters listed in the grid-search parameter grid further down.
model = KerasClassifier(
    build_fn=create_model,
    batch_size=10,
    verbose=0,
)

In [10]:
# Search space: each list holds the candidate values for one hyperparameter.
# Values handed to create_model (optimizer / init arguments).
optimizers, inits = ['rmsprop', 'adam'], ['glorot_uniform', 'normal', 'uniform']
# Values for the training settings (epochs / batch_size).
epochs, batches = [50, 100, 150], [5, 10, 20]

In [11]:
# Map each tunable parameter name to its list of candidate values.
param_grid = {
    'optimizer': optimizers,
    'epochs': epochs,
    'batch_size': batches,
    'init': inits,
}

# Score every combination in the grid using 3-fold cross-validation.
grid = GridSearchCV(estimator=model, param_grid=param_grid, cv=3)
grid_result = grid.fit(X, y)

In [12]:
# Report the best mean cross-validated score and the parameters that produced it.
best_summary = (grid_result.best_score_, grid_result.best_params_)
print("Best: %f using %s" % best_summary)

Best: 0.735677 using {'batch_size': 5, 'epochs': 150, 'init': 'glorot_uniform', 'optimizer': 'adam'}


In [13]:
# Pull the per-candidate mean score, score spread and parameter dict
# out of the grid-search results table.
cv_results = grid_result.cv_results_
means, stds, params = (
    cv_results[key]
    for key in ('mean_test_score', 'std_test_score', 'params')
)

In [14]:
# One line per candidate: mean test score, its standard deviation, parameters.
for row in zip(means, stds, params):
    print("%f (%f) with: %r" % row)

0.690104 (0.015073) with: {'batch_size': 5, 'epochs': 50, 'init': 'glorot_uniform', 'optimizer': 'rmsprop'}
0.705729 (0.012890) with: {'batch_size': 5, 'epochs': 50, 'init': 'glorot_uniform', 'optimizer': 'adam'}
0.671875 (0.029232) with: {'batch_size': 5, 'epochs': 50, 'init': 'normal', 'optimizer': 'rmsprop'}
0.684896 (0.030647) with: {'batch_size': 5, 'epochs': 50, 'init': 'normal', 'optimizer': 'adam'}
0.707031 (0.026107) with: {'batch_size': 5, 'epochs': 50, 'init': 'uniform', 'optimizer': 'rmsprop'}
0.653646 (0.014731) with: {'batch_size': 5, 'epochs': 50, 'init': 'uniform', 'optimizer': 'adam'}
0.713542 (0.025780) with: {'batch_size': 5, 'epochs': 100, 'init': 'glorot_uniform', 'optimizer': 'rmsprop'}
0.710938 (0.033299) with: {'batch_size': 5, 'epochs': 100, 'init': 'glorot_uniform', 'optimizer': 'adam'}
0.707031 (0.012758) with: {'batch_size': 5, 'epochs': 100, 'init': 'normal', 'optimizer': 'rmsprop'}
0.695312 (0.061516) with: {'batch_size': 5, 'epochs': 100, 'init': 'normal'