# Keras - Neural Network Introduction

## 1. Multilayer Perceptron

### 1.1 Basic

In [35]:
import numpy
import pandas as pd

In [1]:
# Create your first MLP in Keras
from keras.models import Sequential
from keras.layers import Dense

Using TensorFlow backend.


In [2]:
# Seed NumPy's global random generator so repeated runs start from the same state
numpy.random.seed(seed=7)

In [3]:
# Read the comma-separated Pima Indians diabetes file into a NumPy array
dataset = numpy.loadtxt(fname="pima-indians-diabetes.csv", delimiter=",")

In [4]:
import pandas as pd
# Show the first five rows of the raw array as a table
pd.DataFrame(data=dataset).head(n=5)

Unnamed: 0,0,1,2,3,4,5,6,7,8
0,6.0,148.0,72.0,35.0,0.0,33.6,0.627,50.0,1.0
1,1.0,85.0,66.0,29.0,0.0,26.6,0.351,31.0,0.0
2,8.0,183.0,64.0,0.0,0.0,23.3,0.672,32.0,1.0
3,1.0,89.0,66.0,23.0,94.0,28.1,0.167,21.0,0.0
4,0.0,137.0,40.0,35.0,168.0,43.1,2.288,33.0,1.0


In [5]:
# Columns 0-7 are the model inputs (X); column 8 is the target (Y)
X, Y = dataset[:, :8], dataset[:, 8]

#### Create model

In [6]:
# Stack three fully connected layers: 8 inputs -> 12 -> 8 -> 1 sigmoid output
model = Sequential([
    Dense(12, input_dim=8, activation='relu'),
    Dense(8, activation='relu'),
    Dense(1, activation='sigmoid'),
])
model.summary()

_________________________________________________________________
Layer (type)                 Output Shape              Param #   
dense_1 (Dense)              (None, 12)                108       
_________________________________________________________________
dense_2 (Dense)              (None, 8)                 104       
_________________________________________________________________
dense_3 (Dense)              (None, 1)                 9         
Total params: 221
Trainable params: 221
Non-trainable params: 0
_________________________________________________________________


#### Compile model

In [7]:
# Binary cross-entropy loss, Adam optimizer, and accuracy reported as the metric
model.compile(optimizer='adam', loss='binary_crossentropy', metrics=['accuracy'])


##### Fit the model

In [8]:
# Train on the full dataset: 10 passes over the data in mini-batches of 10 rows
model.fit(
    X,
    Y,
    epochs=10,
    batch_size=10,
)

Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10


<keras.callbacks.History at 0x118bb0ac8>

##### Evaluate the model

In [9]:
# Score the trained network on the same rows it was fitted on and
# report the second metric (accuracy) as a percentage
scores = model.evaluate(X, Y)
print(
    "\n%s: %.2f%%"
    % (model.metrics_names[1], scores[1]*100)
)

 32/768 [>.............................] - ETA: 0s
acc: 70.83%


------

### 1.2  Add validation split

In [10]:
# Start from a freshly initialised network: the `model` left over from
# section 1.1 has already been trained on every row of X, so the rows held
# out by validation_split would not be unseen data and the reported
# validation metrics would be optimistic.
model = Sequential()
model.add(Dense(12, input_dim=8, activation='relu'))
model.add(Dense(8, activation='relu'))
model.add(Dense(1, activation='sigmoid'))
model.compile(loss='binary_crossentropy',
              optimizer='adam',
              metrics=['accuracy'])

# Let Keras hold out 33% of the rows as validation data during training
model.fit(X, Y, validation_split=0.33, epochs=10, batch_size=10)

Train on 514 samples, validate on 254 samples
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10


<keras.callbacks.History at 0x118cfa470>

------

### 1.3.  Use a Manual Verification Dataset

In [11]:
from sklearn.model_selection import train_test_split

In [12]:
seed = 7
numpy.random.seed(seed)
# Reserve 33% of the rows for validation; the remaining 67% are used for training
X_train, X_test, y_train, y_test = train_test_split(
    X,
    Y,
    test_size=0.33,
    random_state=seed,
)

##### Fit the model

In [13]:
# Build a new, untrained network before fitting: earlier cells fit `model`
# on the full X, which contains the X_test rows, so reusing it here would
# validate on data the network has already seen.
model = Sequential()
model.add(Dense(12, input_dim=8, activation='relu'))
model.add(Dense(8, activation='relu'))
model.add(Dense(1, activation='sigmoid'))
model.compile(loss='binary_crossentropy',
              optimizer='adam',
              metrics=['accuracy'])

# Train on the 67% split and validate on the explicitly held-out 33%
model.fit(X_train, y_train, validation_data=(X_test, y_test), epochs=10, batch_size=10)

Train on 514 samples, validate on 254 samples
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10


<keras.callbacks.History at 0x11aaf0978>

### 1.4.  Manual k-Fold Cross-Validation

In [14]:
from sklearn.model_selection import StratifiedKFold

In [15]:
# Ten shuffled, class-stratified folds; `seed` makes the shuffling repeatable
kfold = StratifiedKFold(
    n_splits=10,
    shuffle=True,
    random_state=seed,
)

##### Build Model

In [18]:
# Accuracy (in percent) of the model trained for each fold
cvscores = []
for train, test in kfold.split(X, Y):
    # Build a brand-new network for every fold so no weights carry over
    model = Sequential()
    model.add(Dense(12, input_dim=8, activation='relu'))
    model.add(Dense(8, activation='relu'))
    model.add(Dense(1, activation='sigmoid'))

    # Compile model
    model.compile(loss='binary_crossentropy',
                  optimizer='adam',
                  metrics=['accuracy'])

    # Fit on this fold's training rows only
    model.fit(X[train], Y[train], epochs=10, batch_size=10, verbose=0)

    # Evaluate on the held-out rows; index 1 is the metric named by
    # model.metrics_names[1]
    scores = model.evaluate(X[test], Y[test], verbose=0)
    print((model.metrics_names[1], scores[1]*100))
    # Recorded as its own statement (previously hidden inside a throwaway
    # `print(...), append(...)` tuple expression)
    cvscores.append(scores[1] * 100)

('acc', 68.831169140803354)
('acc', 63.636363945998156)
('acc', 35.064935529386844)
('acc', 59.740260127302889)
('acc', 62.337662724705488)
('acc', 70.129870594321915)
('acc', 58.441558906010215)
('acc', 64.93506516729083)
('acc', 61.842105576866544)
('acc', 64.473684524234969)


In [19]:
# Mean and standard deviation of the per-fold accuracies
print(
    "%.2f%% (+/- %.2f%%)"
    % (numpy.mean(cvscores), numpy.std(cvscores))
)

60.94% (+/- 9.29%)


------

### 1.5. Use Keras Models With Scikit-Learn

In [20]:
from keras.wrappers.scikit_learn import KerasClassifier

In [21]:
from sklearn.model_selection import StratifiedKFold
from sklearn.model_selection import cross_val_score

In [22]:
def create_model():
    """Build and compile the three-layer binary classifier.

    The network takes 8 inputs and stacks Dense(12, relu), Dense(8, relu)
    and a single sigmoid output unit. It is compiled with binary
    cross-entropy loss, the Adam optimizer and the accuracy metric.

    Returns:
        The compiled ``Sequential`` model.
    """
    network = Sequential([
        Dense(12, input_dim=8, activation='relu'),
        Dense(8, activation='relu'),
        Dense(1, activation='sigmoid'),
    ])
    network.compile(optimizer='adam',
                    loss='binary_crossentropy',
                    metrics=['accuracy'])
    return network

In [23]:
# Re-seed NumPy so this section is repeatable on its own
seed = 7
numpy.random.seed(seed)
# Load the Pima Indians data and separate the 8 input columns from the target
dataset = numpy.loadtxt("pima-indians-diabetes.csv", delimiter=",")
X, Y = dataset[:, :8], dataset[:, 8]

In [25]:
# Wrap the Keras builder so scikit-learn can treat it as a classifier
model = KerasClassifier(
    build_fn=create_model,
    epochs=10,
    batch_size=10,
    verbose=0,
)

# Score it with shuffled, stratified 10-fold cross-validation
kfold = StratifiedKFold(n_splits=10, shuffle=True, random_state=seed)
results = cross_val_score(model, X, Y, cv=kfold)

print(results.mean())

0.5952494916


--------

### 1.6 Grid Search Deep Learning Model Parameters

In [30]:
from keras.wrappers.scikit_learn import KerasClassifier
from sklearn.model_selection import GridSearchCV

In [31]:
def create_model(optimizer='rmsprop', init='glorot_uniform'):
    """Build and compile the binary classifier with tunable settings.

    Args:
        optimizer: Optimizer passed to ``compile``.
        init: Kernel initializer applied to every Dense layer.

    Returns:
        The compiled ``Sequential`` model (8 inputs -> 12 -> 8 -> 1 sigmoid),
        using binary cross-entropy loss and the accuracy metric.
    """
    network = Sequential([
        Dense(12, input_dim=8, kernel_initializer=init, activation='relu'),
        Dense(8, kernel_initializer=init, activation='relu'),
        Dense(1, kernel_initializer=init, activation='sigmoid'),
    ])
    network.compile(optimizer=optimizer,
                    loss='binary_crossentropy',
                    metrics=['accuracy'])
    return network

In [32]:
# Re-seed NumPy so this section is repeatable on its own
seed = 7
numpy.random.seed(seed)
# Load the Pima Indians data and separate the 8 input columns from the target
dataset = numpy.loadtxt("pima-indians-diabetes.csv", delimiter=",")
X, Y = dataset[:, :8], dataset[:, 8]

In [33]:
# Wrap the builder; epochs and batch size are left for the grid search to supply
model = KerasClassifier(
    build_fn=create_model,
    verbose=0,
)

In [None]:
# Candidate values for each setting explored by the grid search:
# optimizer, weight initializer, number of epochs and batch size
optimizers = ['rmsprop', 'adam']
inits = ['glorot_uniform', 'normal', 'uniform']
epochs = [5, 10, 15]
batches = [5, 10, 20]

param_grid = {
    'optimizer': optimizers,
    'epochs': epochs,
    'batch_size': batches,
    'init': inits,
}

# Fit one model per parameter combination and cross-validation split
grid = GridSearchCV(estimator=model, param_grid=param_grid)
grid_result = grid.fit(X, Y)

In [None]:
# Report the best score/parameter combination found by the grid search
print("Best: %f using %s" % (grid_result.best_score_, grid_result.best_params_))

# Then list the mean and standard deviation of the test score for every
# parameter combination that was tried
means = grid_result.cv_results_['mean_test_score']
stds = grid_result.cv_results_['std_test_score']
params = grid_result.cv_results_['params']
for mean, stdev, param in zip(means, stds, params):
    # The loop body must be indented; left at column 0 it is an IndentationError
    print("%f (%f) with: %r" % (mean, stdev, param))

---------

## 2. Multi class classifier

----------

### 2.1 Classification Of Flower Species

In [36]:
# Multiclass Classification with the Iris Flowers Dataset
from keras.wrappers.scikit_learn import KerasClassifier
from keras.utils import np_utils

In [37]:
from sklearn.model_selection import cross_val_score
from sklearn.model_selection import KFold
from sklearn.preprocessing import LabelEncoder
from sklearn.pipeline import Pipeline

In [40]:
# Seed NumPy so this section is repeatable
seed = 7
numpy.random.seed(seed)

# Read the header-less iris file: columns 0-3 are measurements, column 4 the label
dataframe = pd.read_csv("iris.csv", header=None)
dataset = dataframe.values
X = dataset[:, :4].astype(float)
Y = dataset[:, 4]

# Map the labels to integer codes ...
encoder = LabelEncoder()
encoded_Y = encoder.fit(Y).transform(Y)
# ... and expand the codes into one-hot rows for the softmax output
dummy_y = np_utils.to_categorical(encoded_Y)


In [41]:
def baseline_model():
    """Build and compile the baseline three-class classifier.

    The network takes 4 inputs, has one hidden Dense(8, relu) layer and a
    3-unit softmax output. It is compiled with categorical cross-entropy
    loss, the Adam optimizer and the accuracy metric.

    Returns:
        The compiled ``Sequential`` model.
    """
    network = Sequential([
        Dense(8, input_dim=4, activation='relu'),
        Dense(3, activation='softmax'),
    ])
    network.compile(optimizer='adam',
                    loss='categorical_crossentropy',
                    metrics=['accuracy'])
    return network


In [44]:
# Wrap the baseline network for scikit-learn and score it with shuffled 10-fold CV
estimator = KerasClassifier(build_fn=baseline_model, epochs=10, batch_size=5, verbose=0)
kfold = KFold(n_splits=10, shuffle=True, random_state=seed)
results = cross_val_score(estimator, X, dummy_y, cv=kfold)

In [45]:
# Mean and standard deviation of the fold scores, as percentages
print(
    "Accuracy: %.2f%% (%.2f%%)"
    % (results.mean()*100, results.std()*100)
)

Accuracy: 58.00% (27.01%)


---------

### 2.2 Binary Classification Of Sonar Returns

-------

In [46]:
# Binary Classification with Sonar Dataset: Baseline
from sklearn.preprocessing import LabelEncoder
from sklearn.preprocessing import StandardScaler
from sklearn.pipeline import Pipeline

In [47]:
# Seed NumPy so this section is repeatable
seed = 7
numpy.random.seed(seed)

# Read the header-less sonar file: columns 0-59 are inputs, column 60 the label
dataframe = pd.read_csv("sonar.csv", header=None)
dataset = dataframe.values
X = dataset[:, :60].astype(float)
Y = dataset[:, 60]

# Convert the labels to integer class codes
encoder = LabelEncoder()
encoded_Y = encoder.fit(Y).transform(Y)

##### Baseline model

In [48]:
def create_baseline():
    """Build and compile the baseline sonar classifier.

    The network takes 60 inputs, has one hidden Dense(60, relu) layer and
    a single sigmoid output, all with the 'normal' kernel initializer. It
    is compiled with binary cross-entropy, Adam and the accuracy metric.

    Returns:
        The compiled ``Sequential`` model.
    """
    network = Sequential([
        Dense(60, input_dim=60, kernel_initializer='normal', activation='relu'),
        Dense(1, kernel_initializer='normal', activation='sigmoid'),
    ])
    network.compile(optimizer='adam',
                    loss='binary_crossentropy',
                    metrics=['accuracy'])
    return network

##### Evaluate

In [51]:
# evaluate model with standardized dataset
from keras.wrappers.scikit_learn import KerasClassifier
from sklearn.model_selection import StratifiedKFold

In [49]:
# scikit-learn wrapper around the baseline network
estimator = KerasClassifier(
    build_fn=create_baseline,
    epochs=10,
    batch_size=5,
    verbose=0,
)
# Shuffled, stratified 10-fold splitter
kfold = StratifiedKFold(
    n_splits=10,
    shuffle=True,
    random_state=seed,
)

##### Result

In [52]:
from sklearn.model_selection import cross_val_score

In [50]:
# Cross-validate the baseline on the raw (unscaled) inputs
results = cross_val_score(estimator, X, encoded_Y, cv=kfold)
print(
    "Baseline: %.2f%% (%.2f%%)"
    % (results.mean()*100, results.std()*100)
)

Baseline: 76.37% (7.75%)


##### Improve Performance With Data Preparation Pipeline

In [55]:
from sklearn.pipeline import Pipeline
from sklearn.preprocessing import StandardScaler

In [53]:
# Chain a StandardScaler in front of the baseline network so the scaler is
# applied inside the pipeline that cross_val_score evaluates
estimators = [
    ('standardize', StandardScaler()),
    ('mlp', KerasClassifier(build_fn=create_baseline,
                            epochs=10,
                            batch_size=5,
                            verbose=0)),
]
pipeline = Pipeline(estimators)

kfold = StratifiedKFold(n_splits=10, shuffle=True, random_state=seed)
results = cross_val_score(pipeline, X, encoded_Y, cv=kfold)

In [54]:
# Mean and standard deviation of the fold scores, as percentages
print(
    "Standardized: %.2f%% (%.2f%%)"
    % (results.mean()*100, results.std()*100)
)

Standardized: 83.68% (3.66%)


##### Evaluate a Smaller Network

In [56]:
from sklearn.preprocessing import StandardScaler
from sklearn.pipeline import Pipeline

In [57]:
def create_smaller():
    """Build and compile a sonar classifier with a narrower hidden layer.

    The network takes 60 inputs, has one hidden Dense(30, relu) layer and
    a single sigmoid output, all with the 'normal' kernel initializer. It
    is compiled with binary cross-entropy, Adam and the accuracy metric.

    Returns:
        The compiled ``Sequential`` model.
    """
    network = Sequential([
        Dense(30, input_dim=60, kernel_initializer='normal', activation='relu'),
        Dense(1, kernel_initializer='normal', activation='sigmoid'),
    ])
    network.compile(optimizer='adam',
                    loss='binary_crossentropy',
                    metrics=['accuracy'])
    return network

In [58]:
# Standardize the inputs, then train the smaller network, inside one pipeline
estimators = [
    ('standardize', StandardScaler()),
    ('mlp', KerasClassifier(build_fn=create_smaller,
                            epochs=10,
                            batch_size=5,
                            verbose=0)),
]
pipeline = Pipeline(estimators)

kfold = StratifiedKFold(n_splits=10, shuffle=True, random_state=seed)
results = cross_val_score(pipeline, X, encoded_Y, cv=kfold)

In [60]:
# Mean and standard deviation of the fold scores, as percentages
print(
    "Smaller: %.2f%% (%.2f%%)"
    % (results.mean()*100, results.std()*100)
)

Smaller: 82.18% (4.44%)


##### Evaluate a Larger Network

In [59]:
from sklearn.preprocessing import StandardScaler
from sklearn.pipeline import Pipeline

In [61]:
def create_larger():
    """Build and compile a sonar classifier with an extra hidden layer.

    The network takes 60 inputs and stacks Dense(60, relu), Dense(30, relu)
    and a single sigmoid output, all with the 'normal' kernel initializer.
    It is compiled with binary cross-entropy, Adam and the accuracy metric.

    Returns:
        The compiled ``Sequential`` model.
    """
    network = Sequential([
        Dense(60, input_dim=60, kernel_initializer='normal', activation='relu'),
        Dense(30, kernel_initializer='normal', activation='relu'),
        Dense(1, kernel_initializer='normal', activation='sigmoid'),
    ])
    network.compile(optimizer='adam',
                    loss='binary_crossentropy',
                    metrics=['accuracy'])
    return network

In [62]:
# Standardize the inputs, then train the larger network, inside one pipeline
estimators = [
    ('standardize', StandardScaler()),
    ('mlp', KerasClassifier(build_fn=create_larger,
                            epochs=10,
                            batch_size=5,
                            verbose=0)),
]
pipeline = Pipeline(estimators)

kfold = StratifiedKFold(n_splits=10, shuffle=True, random_state=seed)
results = cross_val_score(pipeline, X, encoded_Y, cv=kfold)

In [63]:
# Mean and standard deviation of the fold scores, as percentages
print(
    "Larger: %.2f%% (%.2f%%)"
    % (results.mean()*100, results.std()*100)
)

Larger: 82.18% (4.91%)


-------

### 2.3 Regression of Boston House Prices

##### Baseline Model

In [64]:
import numpy
from pandas import read_csv
from keras.models import Sequential
from keras.layers import Dense
from keras.wrappers.scikit_learn import KerasRegressor
from sklearn.model_selection import cross_val_score
from sklearn.model_selection import KFold
from sklearn.preprocessing import StandardScaler
from sklearn.pipeline import Pipeline

In [65]:
# Load the header-less, whitespace-separated housing file.
# sep=r"\s+" is the regex equivalent of delim_whitespace=True, which newer
# pandas releases deprecate.
dataframe = read_csv("housing.csv", sep=r"\s+", header=None)
dataset = dataframe.values
# Columns 0-12 are the inputs (X); column 13 is the regression target (Y)
X = dataset[:,0:13]
Y = dataset[:,13]

In [66]:
def baseline_model():
    """Build and compile the baseline regression network.

    The network takes 13 inputs, has one hidden Dense(13, relu) layer and
    a single output unit with no activation, both with the 'normal' kernel
    initializer. It is compiled with mean squared error loss and Adam.

    Returns:
        The compiled ``Sequential`` model.
    """
    network = Sequential([
        Dense(13, input_dim=13, kernel_initializer='normal', activation='relu'),
        Dense(1, kernel_initializer='normal'),
    ])
    network.compile(optimizer='adam', loss='mean_squared_error')
    return network

In [67]:
# fix random seed for reproducibility
seed = 7
numpy.random.seed(seed)

# Wrap the baseline network as a scikit-learn regressor
estimator = KerasRegressor(build_fn=baseline_model,
                           epochs=10,
                           batch_size=5,
                           verbose=0)

# Ten consecutive (unshuffled) folds. random_state is deliberately omitted:
# it has no effect without shuffle=True, and recent scikit-learn releases
# raise a ValueError when it is passed that way.
kfold = KFold(n_splits=10)

results = cross_val_score(estimator, X, Y, cv=kfold)

print("Baseline: %.2f (%.2f) MSE" % (results.mean(), results.std()))

Baseline: 57.86 (42.34) MSE


##### Lift Performance By Standardizing The Dataset

In [70]:
# Put a StandardScaler in front of the baseline regressor in a single pipeline
estimators = [
    ('standardize', StandardScaler()),
    ('mlp', KerasRegressor(build_fn=baseline_model,
                           epochs=10,
                           batch_size=5,
                           verbose=0)),
]
pipeline = Pipeline(estimators)

In [71]:
# Ten consecutive (unshuffled) folds. random_state is deliberately omitted:
# it has no effect without shuffle=True, and recent scikit-learn releases
# raise a ValueError when it is passed that way.
kfold = KFold(n_splits=10)
results = cross_val_score(pipeline, X, Y, cv=kfold)
print("Standardized: %.2f (%.2f) MSE" % (results.mean(), results.std()))

Standardized: 53.87 (43.56) MSE


##### Evaluate a Deeper Network Topology

In [72]:
def larger_model():
    """Build and compile a deeper regression network.

    The network takes 13 inputs and stacks Dense(13, relu), Dense(6, relu)
    and a single output unit with no activation, all with the 'normal'
    kernel initializer. It is compiled with mean squared error loss and Adam.

    Returns:
        The compiled ``Sequential`` model.
    """
    network = Sequential([
        Dense(13, input_dim=13, kernel_initializer='normal', activation='relu'),
        Dense(6, kernel_initializer='normal', activation='relu'),
        Dense(1, kernel_initializer='normal'),
    ])
    network.compile(optimizer='adam', loss='mean_squared_error')
    return network

In [73]:
# Standardize the inputs, then train the deeper network for 50 epochs
estimators = []
estimators.append(('standardize', StandardScaler()))

estimators.append(('mlp',
                   KerasRegressor(build_fn=larger_model,
                                  epochs=50,
                                  batch_size=5,
                                  verbose=0)))

pipeline = Pipeline(estimators)
# Ten consecutive (unshuffled) folds. random_state is deliberately omitted:
# it has no effect without shuffle=True, and recent scikit-learn releases
# raise a ValueError when it is passed that way.
kfold = KFold(n_splits=10)
results = cross_val_score(pipeline, X, Y, cv=kfold)
print("Larger: %.2f (%.2f) MSE" % (results.mean(), results.std()))

Larger: 22.60 (25.40) MSE


##### Evaluate a Wider Network Topology

In [76]:
def wider_model():
    """Build and compile a regression network with a wider hidden layer.

    The network takes 13 inputs, has one hidden Dense(20, relu) layer and
    a single output unit with no activation, both with the 'normal' kernel
    initializer. It is compiled with mean squared error loss and Adam.

    Returns:
        The compiled ``Sequential`` model.
    """
    network = Sequential([
        Dense(20, input_dim=13, kernel_initializer='normal', activation='relu'),
        Dense(1, kernel_initializer='normal'),
    ])
    network.compile(optimizer='adam', loss='mean_squared_error')
    return network

In [75]:
# fix random seed for reproducibility
seed = 7
numpy.random.seed(seed)

# Standardize the inputs, then train the wider network for 100 epochs
estimators = []
estimators.append(('standardize', StandardScaler()))

estimators.append(('mlp', KerasRegressor(build_fn=wider_model,
                                         epochs=100,
                                         batch_size=5,
                                         verbose=0)))

pipeline = Pipeline(estimators)

# Ten consecutive (unshuffled) folds. random_state is deliberately omitted:
# it has no effect without shuffle=True, and recent scikit-learn releases
# raise a ValueError when it is passed that way.
kfold = KFold(n_splits=10)

results = cross_val_score(pipeline, X, Y, cv=kfold)

print("Wider: %.2f (%.2f) MSE" % (results.mean(), results.std()))


Wider: 22.40 (29.37) MSE


------------