# 1. Develop a Baseline Neural Network Model

In [2]:
import numpy as np
import pandas as pd
from keras.models import Sequential
from keras.layers import Dense
from keras.wrappers.scikit_learn import KerasRegressor
from sklearn.model_selection import cross_val_score
from sklearn.model_selection import KFold
from sklearn.preprocessing import StandardScaler
from sklearn.pipeline import Pipeline

In [3]:
# Load the whitespace-delimited, header-less housing table.
# sep=r'\s+' is the documented equivalent of the deprecated delim_whitespace=True.
dataframe = pd.read_csv('housing.csv', sep=r'\s+', header=None)
dataset = dataframe.values

# Split into inputs (first 13 columns) and the regression target (column index 13).
X = dataset[:, 0:13]
Y = dataset[:, 13]

In [4]:
# define base model
def baseline_model():
    """Build and compile the baseline regression network.

    Topology: 13 inputs -> Dense(13, relu) -> Dense(1) with no explicit
    activation on the output layer. Compiled with mean-squared-error loss
    and the Adam optimizer.

    Returns:
        The compiled Keras ``Sequential`` model.
    """
    net = Sequential([
        Dense(13, input_dim=13, activation='relu'),
        Dense(1),
    ])
    net.compile(optimizer='adam', loss='mean_squared_error')
    return net

In [5]:
# Fix NumPy's global random seed; the same value is reused as the KFold random_state.
# NOTE(review): this seeds NumPy only -- the Keras backend may keep its own RNG, so
# runs may still differ slightly; confirm if exact reproducibility is required.
seed = 7
np.random.seed(seed=seed)

In [6]:
# Baseline estimator on the raw (unstandardized) inputs: wrap the network builder
# in the scikit-learn compatible KerasRegressor so it can be cross-validated.
estimator = KerasRegressor(
    build_fn=baseline_model,
    epochs=100,
    batch_size=5,
    verbose=0,
)

In [7]:
# 10-fold cross-validation (shuffled, seeded) of the baseline estimator on raw inputs.
kfold = KFold(n_splits=10, shuffle=True, random_state=seed)
results = cross_val_score(estimator, X, Y, cv=kfold)
# NOTE(review): the recorded score is negative, which suggests the wrapper reports
# negated MSE (higher is better) -- confirm against the installed Keras version.
print("Baseline: %.2f (%.2f) MSE" % (np.mean(results), np.std(results)))

Baseline: -32.86 (9.52) MSE


# 2. Lift Performance By Standardizing The Dataset

In [8]:
# evaluate model with standardized dataset
estimators = []
estimators.append(('standardize',StandardScaler()))
estimators.append(('mlp',KerasRegressor(build_fn=baseline_model,epochs=50,batch_size=5,verbose=0)))
pipeline = Pipeline(estimators)
kfold = KFold(n_splits=10,shuffle=True,random_state=seed)
results = cross_val_score(pipeline,X,Y,cv=kfold)
print("Baseline: %.2f (%.2f) MSE"%(results.mean(),results.std()))

Baseline: -19.06 (10.54) MSE


# 3. Tune The Neural Network Topology

## 3.1 Evaluate Deeper Network Topology
* 13 inputs -> [13->6] -> 1 output

In [11]:
# define the model
def larger_model():
    """Build and compile the deeper regression network.

    Topology: 13 inputs -> Dense(13, relu) -> Dense(6, relu) -> Dense(1) with
    no explicit activation on the output layer. Compiled with
    mean-squared-error loss and the Adam optimizer.

    Returns:
        The compiled Keras ``Sequential`` model.
    """
    layers = [
        Dense(13, input_dim=13, activation='relu'),
        Dense(6, activation='relu'),
        Dense(1),
    ]
    net = Sequential()
    for layer in layers:
        net.add(layer)
    net.compile(optimizer='adam', loss='mean_squared_error')
    return net

# Cross-validate the deeper network on standardized inputs; the scaler is a
# Pipeline step so it is fitted as part of the estimator on each training split.
estimators = [
    ('standardize', StandardScaler()),
    ('mlp', KerasRegressor(build_fn=larger_model, epochs=50, batch_size=5, verbose=0)),
]
pipeline = Pipeline(estimators)
kfold = KFold(n_splits=10, shuffle=True, random_state=seed)
results = cross_val_score(pipeline, X, Y, cv=kfold)
# Label corrected: these scores belong to the deeper model, not the baseline.
print("Larger: %.2f (%.2f) MSE" % (results.mean(), results.std()))


Baseline: -14.43 (8.74) MSE


## 3.2 Evaluate a Wider Network Topology
* 13 inputs -> [20] -> 1 output

In [12]:
# define the model
def wider_model():
    """Build and compile the wider regression network.

    Topology: 13 inputs -> Dense(20, relu) -> Dense(1) with no explicit
    activation on the output layer. Compiled with mean-squared-error loss
    and the Adam optimizer.

    Returns:
        The compiled Keras ``Sequential`` model.
    """
    hidden = Dense(20, input_dim=13, activation='relu')
    output = Dense(1)
    net = Sequential([hidden, output])
    net.compile(optimizer='adam', loss='mean_squared_error')
    return net

# Cross-validate the wider network on standardized inputs; the scaler is a
# Pipeline step so it is fitted as part of the estimator on each training split.
estimators = [
    ('standardize', StandardScaler()),
    ('mlp', KerasRegressor(build_fn=wider_model, epochs=50, batch_size=5, verbose=0)),
]
pipeline = Pipeline(estimators)
kfold = KFold(n_splits=10, shuffle=True, random_state=seed)
results = cross_val_score(pipeline, X, Y, cv=kfold)
# Label corrected: these scores belong to the wider model, not the baseline.
print("Wider: %.2f (%.2f) MSE" % (results.mean(), results.std()))


Baseline: -15.14 (8.56) MSE


# Summary
* Used the Keras deep learning library to model a regression problem: a baseline network, the effect of standardizing the inputs, and deeper versus wider network topologies.