<a href="https://colab.research.google.com/github/okanbuyuktepe/Deep-learning-Exercises/blob/master/boston_house_price.ipynb" target="_parent"><img src="https://colab.research.google.com/assets/colab-badge.svg" alt="Open In Colab"/></a>

In [16]:
import numpy
from pandas import read_csv
from keras.models import Sequential
from keras.layers import Dense
from keras.wrappers.scikit_learn import KerasRegressor
from sklearn.model_selection import cross_val_score, KFold
from sklearn.preprocessing import StandardScaler
from sklearn.pipeline import Pipeline

In [17]:
# Load the housing data: a headerless, whitespace-separated text file that
# parses into 14 numeric columns (see the info() summary printed below).
url = 'https://raw.githubusercontent.com/jbrownlee/Datasets/master/housing.data'
# sep=r'\s+' splits on runs of whitespace; it is the documented replacement for
# the deprecated delim_whitespace=True flag and parses the file identically.
dataframe = read_csv(url, sep=r'\s+', header=None)
# Plain NumPy array view of the frame, used for positional slicing later on.
dataset = dataframe.values
dataframe.info()

<class 'pandas.core.frame.DataFrame'>
RangeIndex: 506 entries, 0 to 505
Data columns (total 14 columns):
 #   Column  Non-Null Count  Dtype  
---  ------  --------------  -----  
 0   0       506 non-null    float64
 1   1       506 non-null    float64
 2   2       506 non-null    float64
 3   3       506 non-null    int64  
 4   4       506 non-null    float64
 5   5       506 non-null    float64
 6   6       506 non-null    float64
 7   7       506 non-null    float64
 8   8       506 non-null    int64  
 9   9       506 non-null    float64
 10  10      506 non-null    float64
 11  11      506 non-null    float64
 12  12      506 non-null    float64
 13  13      506 non-null    float64
dtypes: float64(12), int64(2)
memory usage: 55.5 KB


In [18]:
# Columns 0..12 are the model inputs; column 13 is the regression target.
X, Y = dataset[:, :13], dataset[:, 13]

In [19]:
# Baseline network factory (handed to KerasRegressor as build_fn)
def baseline_model():
  """Build and compile the baseline regression network.

  Architecture: 13 inputs -> Dense(13, relu) -> Dense(1) with no output
  activation. Both layers use the 'normal' kernel initializer. The model
  is compiled with mean-squared-error loss and the Adam optimizer.

  Returns:
    The compiled Sequential model.
  """
  net = Sequential()
  hidden = Dense(units=13, input_dim=13, kernel_initializer='normal', activation='relu')
  net.add(hidden)
  # Single output unit without an activation, as in the original definition.
  output = Dense(units=1, kernel_initializer='normal')
  net.add(output)
  net.compile(optimizer='adam', loss='mean_squared_error')
  return net

In [20]:
# Fix the seed of NumPy's global random generator so reruns are repeatable.
# NOTE(review): only NumPy is seeded here; whether the Keras backend draws its
# initial weights from this generator is not visible in this notebook - confirm.
seed = 7
numpy.random.seed(seed)

In [21]:
# Wrap the baseline network factory as a scikit-learn style regressor so it can
# be passed to cross_val_score. Training settings: 100 epochs, mini-batches of
# 5 samples, no progress output.
estimator = KerasRegressor(
    build_fn=baseline_model,
    epochs=100,
    batch_size=5,
    verbose=0,
)

In [22]:
# 10-fold cross-validation of the baseline estimator on the raw inputs.
# KFold does not shuffle by default, so the folds are contiguous and fully
# deterministic. random_state is deliberately not passed: it only has an effect
# together with shuffle=True, and scikit-learn >= 0.24 raises ValueError when it
# is set while shuffle is False.
kfold = KFold(n_splits=10)
results = cross_val_score(estimator, X, Y, cv=kfold)
# The recorded scores are negative; presumably the wrapper reports the negated
# loss so that "greater is better" - read the magnitude as the MSE.
print('Baseline: %.2f (%.2f) MSE' % (results.mean(), results.std()))



Baseline: -38.11 (36.66) MSE


In [23]:
# Regression Example With Boston Dataset : Standardized
# The scaler and the network are chained in one Pipeline so that, inside
# cross_val_score, the scaler is fitted on each training split only.
estimators = [
    ('standardize', StandardScaler()),
    ('mpl', KerasRegressor(build_fn=baseline_model, epochs=50, batch_size=5, verbose=0)),
]
pipeline = Pipeline(estimators)
# Unshuffled, deterministic 10-fold split. random_state is omitted because it
# only applies with shuffle=True and scikit-learn >= 0.24 raises ValueError
# when it is supplied while shuffle is False.
kfold = KFold(n_splits=10)
results = cross_val_score(pipeline, X, Y, cv=kfold)
print('Standardized: %.2f (%.2f) MSE' % (results.mean(), results.std()))



Standardized: -28.90 (26.41) MSE


In [24]:
# Regression Example With Boston Dataset: Standardized and larger
def larger_model():
  """Build and compile the deeper variant of the regression network.

  Architecture: 13 inputs -> Dense(13, relu) -> Dense(6, relu) -> Dense(1)
  with no output activation. Every layer uses the 'normal' kernel
  initializer. The model is compiled with mean-squared-error loss and the
  Adam optimizer.

  Returns:
    The compiled Sequential model.
  """
  net = Sequential()
  first_hidden = Dense(units=13, input_dim=13, kernel_initializer='normal', activation='relu')
  net.add(first_hidden)
  # Extra hidden layer that distinguishes this network from the baseline.
  second_hidden = Dense(units=6, kernel_initializer='normal', activation='relu')
  net.add(second_hidden)
  output = Dense(units=1, kernel_initializer='normal')
  net.add(output)
  net.compile(optimizer='adam', loss='mean_squared_error')
  return net

# Cross-validate the deeper network on standardized inputs. Scaling lives in
# the Pipeline so it is re-fitted on the training part of every fold.
estimators = [
    ('standardize', StandardScaler()),
    ('mpl', KerasRegressor(build_fn=larger_model, epochs=50, batch_size=5, verbose=0)),
]
pipeline = Pipeline(estimators)
# Unshuffled, deterministic 10-fold split. random_state is omitted because it
# only applies with shuffle=True and scikit-learn >= 0.24 raises ValueError
# when it is supplied while shuffle is False.
kfold = KFold(n_splits=10)
results = cross_val_score(pipeline, X, Y, cv=kfold)
# The label text is kept as in the original run so the output stays comparable.
print('Standardized: %.2f (%.2f) MSE' % (results.mean(), results.std()))



Standardized: -23.22 (26.31) MSE


In [25]:
# Regression Example With Boston Dataset: Standardized and Wider
def wider_model():
  """Build and compile the wider variant of the regression network.

  Architecture: 13 inputs -> Dense(20, relu) -> Dense(1) with no output
  activation. Both layers use the 'normal' kernel initializer. The model
  is compiled with mean-squared-error loss and the Adam optimizer.

  Returns:
    The compiled Sequential model.
  """
  net = Sequential()
  # 20 hidden units instead of the baseline's 13.
  hidden = Dense(units=20, input_dim=13, kernel_initializer='normal', activation='relu')
  net.add(hidden)
  output = Dense(units=1, kernel_initializer='normal')
  net.add(output)
  net.compile(optimizer='adam', loss='mean_squared_error')
  return net

# Cross-validate the wider network on standardized inputs. Scaling lives in
# the Pipeline so it is re-fitted on the training part of every fold.
estimators = [
    ('standardize', StandardScaler()),
    ('mpl', KerasRegressor(build_fn=wider_model, epochs=50, batch_size=5, verbose=0)),
]
pipeline = Pipeline(estimators)
# Unshuffled, deterministic 10-fold split. random_state is omitted because it
# only applies with shuffle=True and scikit-learn >= 0.24 raises ValueError
# when it is supplied while shuffle is False.
kfold = KFold(n_splits=10)
results = cross_val_score(pipeline, X, Y, cv=kfold)
# The label text is kept as in the original run so the output stays comparable.
print('Standardized: %.2f (%.2f) MSE' % (results.mean(), results.std()))



Standardized: -25.02 (26.04) MSE
