In [9]:
import numpy
import pandas
from keras.callbacks import History 

from keras.models import Sequential
from keras.layers import Dense
from keras.wrappers.scikit_learn import KerasClassifier
from sklearn.model_selection import cross_val_score
from sklearn.preprocessing import LabelEncoder
from sklearn.model_selection import StratifiedKFold
from sklearn.preprocessing import StandardScaler
from sklearn.pipeline import Pipeline

In [10]:
seed = 7
numpy.random.seed(seed)


In [11]:
# load dataset
dataframe = pandas.read_csv("sonar.csv", header=None)
dataset = dataframe.values
# split into input (X) and output (Y) variables
X = dataset[:,0:60].astype(float)
Y = dataset[:,60]


In [12]:

from sklearn import preprocessing
encoder = preprocessing.LabelEncoder()
encoder.fit(Y)
encoded_Y = encoder.transform(Y)

In [13]:
for key, value in enumerate(encoder.classes_):
    print(value, "=",key)

M = 0
R = 1


In [14]:
# MLP for Pima Indians Dataset with 10-fold cross validation via sklearn
from keras.models import Sequential
from keras.layers import Dense
from keras.wrappers.scikit_learn import KerasClassifier
from sklearn.model_selection import StratifiedKFold
from sklearn.model_selection import cross_val_score
import numpy

# Function to create model, required for KerasClassifier
def create_baseline():
	# create model
    model = Sequential()
    model.add(Dense(60, input_dim=60, kernel_initializer='normal',activation='relu'))
    model.add(Dense(1, kernel_initializer='normal',activation='sigmoid'))
	# Compile model
    model.compile(loss='binary_crossentropy', optimizer='adam', metrics=['accuracy'])
    return model


In [15]:
# evaluate model with standardized dataset
estimator = KerasClassifier(build_fn=create_baseline, epochs=100, batch_size=5, verbose=0)
kfold = StratifiedKFold(n_splits=10, shuffle=True, random_state=seed)
results = cross_val_score(estimator, X, encoded_Y, cv=kfold)
print("Results: %.2f%% (%.2f%%)" % (results.mean()*100, results.std()*100))

Results: 80.75% (4.94%)


In [16]:
# evaluate baseline model with standardized dataset
numpy.random.seed(seed)
estimators = []
estimators.append(('standardize', StandardScaler()))
estimators.append(('mlp', KerasClassifier(build_fn=create_baseline, epochs=100, batch_size=5, verbose=0)))
pipeline = Pipeline(estimators)
kfold = StratifiedKFold(n_splits=10, shuffle=True, random_state=seed)
results = cross_val_score(pipeline, X, encoded_Y, cv=kfold)
print("Standardized: %.2f%% (%.2f%%)" % (results.mean()*100, results.std()*100))

Standardized: 84.63% (7.65%)


In [17]:
# evaluate baseline model with standardized dataset
numpy.random.seed(seed)
estimators = []
estimators.append(('standardize', StandardScaler()))
estimators.append(('mlp', KerasClassifier(build_fn=create_baseline, epochs=100, batch_size=5, verbose=0)))
pipeline = Pipeline(estimators)
kfold = StratifiedKFold(n_splits=10, shuffle=True, random_state=seed)
results = cross_val_score(pipeline, X, encoded_Y, cv=kfold)
print("Standardized: %.2f%% (%.2f%%)" % (results.mean()*100, results.std()*100))


Standardized: 84.63% (7.65%)


In [18]:
# smaller model
def create_smaller():
    # create model
    model = Sequential()
    model.add(Dense(30, input_dim=60, kernel_initializer='normal' ,activation='relu'))
    model.add(Dense(1,kernel_initializer='normal', activation='sigmoid'))
    # Compile model
    model.compile(loss='binary_crossentropy', optimizer='adam', metrics=['accuracy'])
    return model

estimators = []
estimators.append(('standardize', StandardScaler()))
estimators.append(('mlp', KerasClassifier(build_fn=create_smaller, epochs=100, batch_size=5, verbose=0)))
pipeline = Pipeline(estimators)
kfold = StratifiedKFold(n_splits=10, shuffle=True, random_state=seed)
results = cross_val_score(pipeline, X, encoded_Y, cv=kfold)
print("Smaller: %.2f%% (%.2f%%)" % (results.mean()*100, results.std()*100))



Smaller: 85.04% (7.38%)


In [19]:
# smaller model
def create_larger():
    # create model
    model = Sequential()
    model.add(Dense(60, input_dim=60, kernel_initializer='normal' ,activation='relu'))
    model.add(Dense(30,  kernel_initializer='normal' ,activation='relu'))
    model.add(Dense(1,kernel_initializer='normal', activation='sigmoid'))
    # Compile model
    history=model.compile(loss='binary_crossentropy', optimizer='adam', metrics=['accuracy'])
    
    return model


estimators = []
estimators.append(('standardize', StandardScaler()))
estimators.append(('mlp', KerasClassifier(build_fn=create_larger, epochs=100, batch_size=5, verbose=0)))
pipeline = Pipeline(estimators)
kfold = StratifiedKFold(n_splits=10, shuffle=True, random_state=seed)
results = cross_val_score(pipeline, X, encoded_Y, cv=kfold)
print("larger: %.2f%% (%.2f%%)" % (results.mean()*100, results.std()*100))

larger: 83.61% (7.57%)


In [20]:
# smaller model
def create_larger():
    # create model
    model = Sequential()
    model.add(Dense(60, input_dim=60, kernel_initializer='normal' ,activation='relu'))
    model.add(Dense(30,  kernel_initializer='normal' ,activation='relu'))
    model.add(Dense(1,kernel_initializer='normal', activation='sigmoid'))
    # Compile model
    history=model.compile(loss='binary_crossentropy', optimizer='adam', metrics=['accuracy'])
    
    return model


estimators = []
estimators.append(('standardize', StandardScaler()))
estimators.append(('mlp', KerasClassifier(build_fn=create_larger, epochs=100, batch_size=5, verbose=0)))
pipeline = Pipeline(estimators)
kfold = StratifiedKFold(n_splits=10, shuffle=True, random_state=seed)
results = cross_val_score(pipeline, X, encoded_Y, cv=kfold)
print("larger: %.2f%% (%.2f%%)" % (results.mean()*100, results.std()*100))

larger: 84.59% (8.03%)


# Step 5:Step 5: Really Scaling up: developing a model that overfits

In [21]:
# smaller model
def checking_overfiting():
    # create model
    model = Sequential()
    model.add(Dense(100, input_dim=60, kernel_initializer='normal' ,activation='relu'))
    model.add(Dense(70,  kernel_initializer='normal' ,activation='relu'))
    model.add(Dense(1,kernel_initializer='normal', activation='sigmoid'))
    # Compile model
    model.compile(loss='binary_crossentropy', optimizer='adam', metrics=['accuracy'])
    
    return model


estimators = []
estimators.append(('standardize', StandardScaler()))
estimators.append(('mlp', KerasClassifier(build_fn=checking_overfiting, epochs=60, batch_size=50, verbose=0)))
pipeline = Pipeline(estimators)
kfold = StratifiedKFold(n_splits=60, shuffle=True, random_state=seed)
results = cross_val_score(pipeline, X, encoded_Y, cv=kfold)
print("Result: %.2f%% (%.2f%%)" % (results.mean()*100, results.std()*100))

Result: 87.78% (19.69%)


# Tuning the Model

In [22]:
def tunning_the_model():
    # create model
    model = Sequential()
    model.add(Dense(70, input_dim=60, kernel_initializer='normal' ,activation='relu'))
#     



    model.add(Dense(1,kernel_initializer='normal', activation='sigmoid'))
    # Compile model
    history=model.compile(loss='binary_crossentropy', optimizer='adam', metrics=['accuracy'])
    
    return model


estimators = []
estimators.append(('standardize', StandardScaler()))
estimators.append(('mlp', KerasClassifier(build_fn=tunning_the_model, epochs=100, batch_size=5, verbose=0)))
pipeline = Pipeline(estimators)
kfold = StratifiedKFold(n_splits=10, shuffle=True, random_state=seed)
results = cross_val_score(pipeline, X, encoded_Y, cv=kfold)
print("Result: %.2f%% (%.2f%%)" % (results.mean()*100, results.std()*100))

Result: 84.09% (6.21%)


# Rewriting the code using the Keras Functional API

In [23]:
from keras.layers import Input, Dense
from keras.models import Model

# This returns a tensor
inputs = Input(shape=(60,))

# a layer instance is callable on a tensor, and returns a tensor
x = Dense(70, activation='relu')(inputs)
predictions = Dense(1, activation='sigmoid')(x)

# This creates a model that includes
# the Input layer and two Dense layers
model = Model(inputs=inputs, outputs=predictions)
model.compile(optimizer='adam',
              loss='binary_crossentropy',
              metrics=['accuracy'])
history=model.fit(X, encoded_Y,epochs=100, batch_size=5, verbose=False)
# print(model.summary())

history_dict = history.history
history_dict.keys()
acc_values = history_dict['acc']
print("Result: %.2f%% (%.2f%%)" % (numpy.mean(acc_values)*100, numpy.std(acc_values)*100))






Result: 87.89% (6.86%)


In [1]:
import tensorflow as tf
import keras
class MyModel(tf.keras.Model):
    
        def __init__(self):
            super(MyModel, self).__init__()
            self.dense1= Dense(70, activation='relu')
            self.dense2 = Dense(1, activation='sigmoid')

        def call(self, inputs):
            x = self.dense1(inputs)
            return self.dense2(x)
                        
                    
model = MyModel()
model.compile(loss='categorical_crossentropy', optimizer='adam',   metrics=['accuracy'])
history=model.fit(X,encoded_Y, epochs=100,batch_size=50,verbose=False)
history_dict = history.history
history_dict.keys()
acc_values = history_dict['acc']
print("Result: %.2f%% (%.2f%%)" % (numpy.mean(acc_values)*100, numpy.std(acc_values)*100))



Using TensorFlow backend.


NameError: name 'Dense' is not defined

In [25]:
from keras import models
from keras import layers
def build_model():
    # create model
    model = Sequential()
    model.add(Dense(100, input_dim=60, kernel_initializer='normal' ,activation='relu'))
    model.add(Dense(70,  kernel_initializer='normal' ,activation='relu'))
    model.add(Dense(1,kernel_initializer='normal', activation='sigmoid'))
    # Compile model
    model.compile(loss='binary_crossentropy', optimizer='adam', metrics=['accuracy'])
    
    return model
k=10
num_val_samples = len(X) // k
num_epochs = 100
all_scores = []

for i in range(k):
    print('processing fold #', i)
    val_data = X[i * num_val_samples: (i + 1) * num_val_samples]
    val_targets = encoded_Y[i * num_val_samples: (i + 1) * num_val_samples]
#     print(val_data,val_targets)
    partial_train_data =numpy.concatenate([X[:i * num_val_samples],X[(i + 1) * num_val_samples:]],axis=0)
    partial_train_targets =numpy.concatenate([encoded_Y[:i * num_val_samples],encoded_Y[(i + 1) * num_val_samples:]],axis=0)
    model = build_model()
    model.fit(partial_train_data, partial_train_targets,epochs=num_epochs, batch_size=5, verbose=0)
    val_mse, val_mae = model.evaluate(val_data, val_targets, verbose=0)
    all_scores.append(val_mae)

processing fold # 0
processing fold # 1
processing fold # 2
processing fold # 3
processing fold # 4
processing fold # 5
processing fold # 6
processing fold # 7
processing fold # 8
processing fold # 9


In [26]:
print("Result: %.2f%% (%.2f%%)" % (numpy.mean(all_scores)*100, numpy.std(all_scores)*100))


Result: 61.50% (19.88%)


# After Preparing the data

In [27]:
# Data Normalizing
mean=X.mean(axis=0)
X-=mean
std=X.std(axis=0)
X/=std



In [29]:
from keras import models
from keras import layers
def build_model():
    # create model
    model = Sequential()
    model.add(Dense(100, input_dim=60, kernel_initializer='normal' ,activation='relu'))
    model.add(Dense(70,  kernel_initializer='normal' ,activation='relu'))
    model.add(Dense(1,kernel_initializer='normal', activation='sigmoid'))
    # Compile model
    model.compile(loss='binary_crossentropy', optimizer='adam', metrics=['accuracy'])
    
    return model
k=10
num_val_samples = len(X) // k
num_epochs = 100
all_scores = []

for i in range(k):
    print('processing fold #', i)
    val_data = X[i * num_val_samples: (i + 1) * num_val_samples]
    val_targets = encoded_Y[i * num_val_samples: (i + 1) * num_val_samples]
#     print(val_data,val_targets)
    partial_train_data =numpy.concatenate([X[:i * num_val_samples],X[(i + 1) * num_val_samples:]],axis=0)
    partial_train_targets =numpy.concatenate([encoded_Y[:i * num_val_samples],encoded_Y[(i + 1) * num_val_samples:]],axis=0)
    model = build_model()
    model.fit(partial_train_data, partial_train_targets,epochs=num_epochs, batch_size=5, verbose=0)
    val_mse, val_mae = model.evaluate(val_data, val_targets, verbose=0)
    all_scores.append(val_mae)
print("Result: %.2f%% (%.2f%%)" % (numpy.mean(all_scores)*100, numpy.std(all_scores)*100))


processing fold # 0
processing fold # 1
processing fold # 2
processing fold # 3
processing fold # 4
processing fold # 5
processing fold # 6
processing fold # 7
processing fold # 8
processing fold # 9
Result: 64.00% (20.95%)
