# Loading the data

In [1]:
from keras.datasets import boston_housing

# load_data() is unpacked into two (features, targets) pairs:
# a training split and a test split.
(train_data, train_targets), (test_data, test_targets) = boston_housing.load_data()

Using TensorFlow backend.


In [2]:
# Inspect the first training sample (one row of raw feature values).
train_data[0]

array([   1.23247,    0.     ,    8.14   ,    0.     ,    0.538  ,
          6.142  ,   91.7    ,    3.9769 ,    4.     ,  307.     ,
         21.     ,  396.9    ,   18.72   ])

In [3]:
# Dimensions of the training feature array.
train_data.shape

(404, 13)

In [4]:
# Dimensions of the test feature array.
test_data.shape

(102, 13)

In [5]:
# Target value paired with the first training sample.
train_targets[0]

15.199999999999999

# Data preparation

In [6]:
# Feature-wise standardization: center each column, then divide it by its
# standard deviation. Every operation below modifies the arrays in place.
# NOTE: because of the in-place updates, re-running this cell applies the
# transformation again to the already-normalized arrays.
mean = train_data.mean(axis=0)
train_data -= mean
# Taken after the centering step above, i.e. the std of the centered data.
std = train_data.std(axis=0)
train_data /= std

# The test set is shifted and scaled with the statistics computed from the
# training data; nothing is computed from test_data itself.
test_data -= mean
test_data /= std

# Network

In [9]:
from keras import models, layers
import numpy as np

In [8]:
def build_model():
    """Create and compile a small densely-connected regression network.

    The network is a stack of two layers: a 64-unit ReLU hidden layer and a
    single-unit output layer with no activation specified. The input width
    is read from the global ``train_data`` (its number of columns).

    The model is compiled with the ``rmsprop`` optimizer, ``mse`` loss and
    ``mae`` as an additional metric.

    Returns:
        A newly constructed, compiled ``Sequential`` model.
    """
    n_features = train_data.shape[1]
    network = models.Sequential([
        layers.Dense(64, activation='relu', input_shape=(n_features,)),
        layers.Dense(1),
    ])
    network.compile(optimizer='rmsprop', loss='mse', metrics=['mae'])
    return network

# K-fold validation

In [10]:
# K-fold cross-validation: each of the k contiguous folds is held out once
# for validation while a freshly built model is trained on the other rows.
k = 4
num_val_sample = len(train_data) // k
all_scores = []

for i in range(k):
    print('processing fold # %d.' % i)

    # Row range [fold_start, fold_stop) held out for validation in this fold.
    fold_start = i * num_val_sample
    fold_stop = fold_start + num_val_sample

    val_data = train_data[fold_start:fold_stop]
    val_target = train_targets[fold_start:fold_stop]

    # Training split: every row before and after the held-out range.
    partial_train_data = np.concatenate(
        (train_data[:fold_start], train_data[fold_stop:]), axis=0)
    partial_train_target = np.concatenate(
        (train_targets[:fold_start], train_targets[fold_stop:]), axis=0)

    # A new model per fold, so nothing learned on one fold carries over.
    model = build_model()
    model.fit(partial_train_data, partial_train_target,
              epochs=100, batch_size=1, verbose=0)

    # evaluate() yields the loss followed by the compiled metric; only the
    # metric value is recorded for this fold.
    val_mse, val_mae = model.evaluate(val_data, val_target, verbose=0)
    all_scores.append(val_mae)

processing fold # 0.
processing fold # 1.
processing fold # 2.
processing fold # 3.


In [11]:
# Validation MAE recorded for each fold, in fold order.
all_scores

[1.8711768613003268,
 2.3156409594092038,
 2.6260822421253316,
 2.3034281388367757]

In [12]:
# Average of the per-fold validation MAE values.
np.mean(all_scores)

2.2790820504179092