# Lesson 9.03 Deep Learning Optimization (Solution Code)

## Import Libraries

In [1]:
import numpy
import pandas as pd
from sklearn.model_selection import GridSearchCV
from keras.models import Sequential
from keras.layers import Dense
import warnings
warnings.filterwarnings('ignore')
from keras.wrappers.scikit_learn import KerasClassifier

## Load Data

In [2]:
# training data
# outcome value = 1 means diabetic while Outcome value = 0 means non-diabetic
data = pd.read_csv('diabetes.csv')
data.head()

Unnamed: 0,Pregnancies,Glucose,BloodPressure,SkinThickness,Insulin,BMI,DiabetesPedigreeFunction,Age,Outcome
0,6,148,72,35,0,33.6,0.627,50,1
1,1,85,66,29,0,26.6,0.351,31,0
2,8,183,64,0,0,23.3,0.672,32,1
3,1,89,66,23,94,28.1,0.167,21,0
4,0,137,40,35,168,43.1,2.288,33,1


In [3]:
# split into predictors and response
X = data.iloc[:,0:8] #predictors
y = data.iloc[:,8] #target

## Create Model

In [4]:
# function to create model for KerasClassifier
def create_model():
    #define model
    model = Sequential() # keras sequential model
    model.add(Dense(12, input_dim=8, activation='relu')) # input layer contains 8 Independent Variables
    model.add(Dense(1, activation='sigmoid')) # binary classification use sigmoid
    # more info on which activation function to use at machinelearningmastery.com/choose-an-activation-function-for-deep-learning/
    
    # compile model
    # use binary_crossentropy as loss function for binary classification problems
    # on the other hand use categorical_crossentropy as loss function for multi-classification problems
    # use adam optimizer as default
    model.compile(loss='binary_crossentropy', optimizer='adam', metrics=['accuracy'])
    return model

In [5]:
# create model
model = KerasClassifier(build_fn=create_model)

## Optimizing Batch and Epoch

In [6]:
# determine grid search parameters

# The batch size defines the number of samples that will be propagated through the network.
# More info at https://stats.stackexchange.com/questions/153531/what-is-batch-size-in-neural-network
batchSize = [10, 20, 40, 60, 80, 100]

# An epoch is an iteration over the entire x and y data provided.
# More info at https://www.tensorflow.org/api_docs/python/tf/keras/Sequential
epochs = [10, 30, 50]

In [7]:
# store parameters and values in a dictionary
parameter_grid = dict(batch_size=batchSize, epochs=epochs)

# n_jobs = -1 means use all resources / processors avaiable in CPU
grid = GridSearchCV(estimator=model, param_grid=parameter_grid, n_jobs=-1)
grid_result = grid.fit(X, y)

Epoch 1/50
Epoch 2/50
Epoch 3/50
Epoch 4/50
Epoch 5/50
Epoch 6/50
Epoch 7/50
Epoch 8/50
Epoch 9/50
Epoch 10/50
Epoch 11/50
Epoch 12/50
Epoch 13/50
Epoch 14/50
Epoch 15/50
Epoch 16/50
Epoch 17/50
Epoch 18/50
Epoch 19/50
Epoch 20/50
Epoch 21/50
Epoch 22/50
Epoch 23/50
Epoch 24/50
Epoch 25/50
Epoch 26/50
Epoch 27/50
Epoch 28/50
Epoch 29/50
Epoch 30/50
Epoch 31/50
Epoch 32/50
Epoch 33/50
Epoch 34/50
Epoch 35/50
Epoch 36/50
Epoch 37/50
Epoch 38/50
Epoch 39/50
Epoch 40/50
Epoch 41/50
Epoch 42/50
Epoch 43/50
Epoch 44/50
Epoch 45/50
Epoch 46/50
Epoch 47/50
Epoch 48/50
Epoch 49/50
Epoch 50/50


In [8]:
# summarize accuracy results for best set of parameter values
print('Best: %f using %s' % (grid_result.best_score_, grid_result.best_params_))

Best: 0.694075 using {'batch_size': 10, 'epochs': 50}


## Tuning Optimizer Function
Find the best optimizer that fits the model

In [9]:
# create an updated function to tune optimizer 
def create_model(optimizer):
    #define model
    model = Sequential() # keras sequential model
    model.add(Dense(12, input_dim=8, activation='relu')) # input layer contains 8 Independent Variables
    model.add(Dense(1, activation='sigmoid')) # binary classification use sigmoid
    # more info on which activation function to use at machinelearningmastery.com/choose-an-activation-function-for-deep-learning/
    
    # compile model
    # use binary_crossentropy as loss function for binary classification problems
    # on the other hand use categorical_crossentropy as loss function for multi-classification problems
    model.compile(loss='binary_crossentropy', optimizer=optimizer, metrics=['accuracy'])
    return model

In [10]:
# create model using updated function and best param values for epochs and batch_size as found above
model = KerasClassifier(build_fn=create_model, epochs=50, batch_size=10)

In [11]:
# define grid search parameters
optimizer = ['adam', 'SGD']
parameter_grid = dict(optimizer=optimizer)

In [12]:
# n_jobs = -1 means use all resources / processors avaiable in CPU
grid = GridSearchCV(estimator=model, param_grid=parameter_grid, n_jobs=-1)
grid_result = grid.fit(X, y)

Epoch 1/50
Epoch 2/50
Epoch 3/50
Epoch 4/50
Epoch 5/50
Epoch 6/50
Epoch 7/50
Epoch 8/50
Epoch 9/50
Epoch 10/50
Epoch 11/50
Epoch 12/50
Epoch 13/50
Epoch 14/50
Epoch 15/50
Epoch 16/50
Epoch 17/50
Epoch 18/50
Epoch 19/50
Epoch 20/50
Epoch 21/50
Epoch 22/50
Epoch 23/50
Epoch 24/50
Epoch 25/50
Epoch 26/50
Epoch 27/50
Epoch 28/50
Epoch 29/50
Epoch 30/50
Epoch 31/50
Epoch 32/50
Epoch 33/50
Epoch 34/50
Epoch 35/50
Epoch 36/50
Epoch 37/50
Epoch 38/50
Epoch 39/50
Epoch 40/50
Epoch 41/50
Epoch 42/50
Epoch 43/50
Epoch 44/50
Epoch 45/50
Epoch 46/50
Epoch 47/50
Epoch 48/50
Epoch 49/50
Epoch 50/50


In [13]:
# summarize accuracy results for best set of parameter values
print('Best: %f using %s' % (grid_result.best_score_, grid_result.best_params_))

Best: 0.699279 using {'optimizer': 'adam'}
