# GridSearch CrossValidation

In [1]:
import numpy
from sklearn.model_selection import GridSearchCV
from keras.models import Sequential
from keras.layers import Dense
from keras.wrappers.scikit_learn import KerasClassifier

Using TensorFlow backend.


In [2]:
# fix random seed for reproducibility
seed = 7
numpy.random.seed(seed)

# load dataset

In [3]:
dataset = numpy.loadtxt("data/pima-indians-diabetes.data.csv", delimiter=",")
# split into input (X) and output (Y) variables
X = dataset[:,0:8]
Y = dataset[:,8]

# create sklearn adapted model

In [4]:
#Function to create model, required for KerasClassifier
def create_model(optimizer):
    # create model
    
    model = Sequential()
    model.add(Dense(12, input_dim=8, activation='relu'))
    model.add(Dense(1, activation='sigmoid'))
    # Compile model
    model.compile(loss='binary_crossentropy', optimizer=optimizer, metrics=['accuracy'])
    return model

# tune batch size and epochs

### create model

In [5]:
model = KerasClassifier(build_fn=create_model, optimizer='adam', verbose=0)

### define grid search parameters

In [6]:
batch_size = [10, 20, 40, 60, 80, 100]
epochs = [10, 50, 100]
param_grid = dict(batch_size=batch_size, nb_epoch=epochs)

### define grid search

In [7]:
grid = GridSearchCV(estimator=model, param_grid=param_grid, n_jobs=-1)

### Fit the model

In [8]:
%%time
grid_result = grid.fit(X, Y)

CPU times: user 17.8 s, sys: 10.8 s, total: 28.6 s
Wall time: 56.3 s


### summarize results

In [9]:
print("Best: %f using %s" % (grid_result.best_score_, grid_result.best_params_))
means = grid_result.cv_results_['mean_test_score']
stds = grid_result.cv_results_['std_test_score']
params = grid_result.cv_results_['params']
for mean, stdev, param in zip(means, stds, params):
    print("%f (%f) with: %r" % (mean, stdev, param))

Best: 0.699219 using {'nb_epoch': 100, 'batch_size': 10}
0.660156 (0.022097) with: {'nb_epoch': 10, 'batch_size': 10}
0.679688 (0.017758) with: {'nb_epoch': 50, 'batch_size': 10}
0.699219 (0.013902) with: {'nb_epoch': 100, 'batch_size': 10}
0.658854 (0.026748) with: {'nb_epoch': 10, 'batch_size': 20}
0.626302 (0.045592) with: {'nb_epoch': 50, 'batch_size': 20}
0.680990 (0.024150) with: {'nb_epoch': 100, 'batch_size': 20}
0.658854 (0.038318) with: {'nb_epoch': 10, 'batch_size': 40}
0.425781 (0.132736) with: {'nb_epoch': 50, 'batch_size': 40}
0.591146 (0.147314) with: {'nb_epoch': 100, 'batch_size': 40}
0.572917 (0.134575) with: {'nb_epoch': 10, 'batch_size': 60}
0.634115 (0.029635) with: {'nb_epoch': 50, 'batch_size': 60}
0.666667 (0.031948) with: {'nb_epoch': 100, 'batch_size': 60}
0.600260 (0.052634) with: {'nb_epoch': 10, 'batch_size': 80}
0.597656 (0.024910) with: {'nb_epoch': 50, 'batch_size': 80}
0.569010 (0.131671) with: {'nb_epoch': 100, 'batch_size': 80}
0.575521 (0.136303) wit

# Tune the Training Optimization Algorithm

### create model

In [14]:
model = KerasClassifier(build_fn=create_model, nb_epoch=20, batch_size=10, verbose=1)

### define grid search parameters

In [15]:
optimizer = ['SGD', 'RMSprop', 'Adagrad', 'Adadelta', 'Adam', 'Adamax', 'Nadam']
param_grid = dict(optimizer=optimizer)

### define grid search

In [16]:
grid = GridSearchCV(estimator=model, param_grid=param_grid, n_jobs=1)

### Fit the model

In [17]:
%%time
grid_result = grid.fit(X, Y)

Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
 10/512 [..............................] - ETA: 0sEpoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
 10/512 [..............................] - ETA: 0sEpoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
 10/512 [..............................] - ETA: 0sEpoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/2

### summarize results

In [18]:
print("Best: %f using %s" % (grid_result.best_score_, grid_result.best_params_))
means = grid_result.cv_results_['mean_test_score']
stds = grid_result.cv_results_['std_test_score']
params = grid_result.cv_results_['params']
for mean, stdev, param in zip(means, stds, params):
    print("%f (%f) with: %r" % (mean, stdev, param))

Best: 0.658854 using {'optimizer': 'SGD'}
0.658854 (0.014382) with: {'optimizer': 'SGD'}
0.606771 (0.096442) with: {'optimizer': 'RMSprop'}
0.522135 (0.128939) with: {'optimizer': 'Adagrad'}
0.652344 (0.032369) with: {'optimizer': 'Adadelta'}
0.645833 (0.021236) with: {'optimizer': 'Adam'}
0.651042 (0.024774) with: {'optimizer': 'Adamax'}
0.631510 (0.033804) with: {'optimizer': 'Nadam'}
