In [48]:
import numpy
from pandas import read_csv
from keras.models import Sequential
from keras.layers import Dense
from keras.wrappers.scikit_learn import KerasClassifier
from sklearn.model_selection import cross_val_score
from sklearn.preprocessing import LabelEncoder
from sklearn.model_selection import StratifiedKFold
from sklearn.preprocessing import StandardScaler
from sklearn.pipeline import Pipeline


In [49]:
# fix random seed for reproducibility
# NOTE(review): only NumPy's global RNG is seeded here. If the Keras backend
# draws from its own random generator, results may still vary between runs;
# confirm whether the backend needs to be seeded separately.
seed = 7
numpy.random.seed(seed)

##### Loading Dataset

In [50]:
# load dataset
# The file location defaults to the original path but can be overridden with
# the SONAR_DATA_PATH environment variable, so the notebook is not tied to a
# single machine's directory layout.
import os

data_path = os.environ.get("SONAR_DATA_PATH", "/home/hasan/DATA SET/sonar.all-data")
# header=None: the first line of the file is read as data, not as column names.
dataframe = read_csv(data_path, header=None)
# Work with the underlying array of values for positional column slicing.
dataset = dataframe.values

In [51]:
# Report the dataset dimensions. They are read from ``shape`` rather than by
# indexing the first row, so the column count does not depend on row 0 existing.
print('length of the dataset is ', dataset.shape[0])
print('Number of column of the dataset is :', dataset.shape[1])

length of the dataset is  208
Number of column of the dataset is : 61


##### Splitting dataset

In [52]:
# Separate features from the target: the first 60 columns become the float
# input matrix X, and column 60 is kept as the class-label vector Y.
X = dataset[:, :60].astype(float)
Y = dataset[:, 60]

##### Encoding Dataset

In [53]:
# encode class values as integers
# Fit a LabelEncoder on the raw class labels in Y; the transform itself is
# applied in a later cell.
encoder = LabelEncoder()
# Left as the cell's last expression, so the notebook displays the fitted encoder.
encoder.fit(Y)

LabelEncoder()

In [54]:
# Convert the class labels in Y to integer codes with the fitted encoder.
encoded_Y = encoder.transform(Y)

##### Model

In [55]:
def create_network():
    """Build and compile the baseline binary classifier.

    The model is a fully connected stack: a 60-unit ReLU hidden layer that
    takes 60 input features, followed by a single sigmoid output unit. It is
    compiled with binary cross-entropy loss, the Adam optimizer, and accuracy
    as the reported metric.

    Returns:
        The compiled ``Sequential`` model.
    """
    network = Sequential()

    # Layers are added in order: hidden layer first, output unit last.
    layer_stack = (
        Dense(60, input_dim=60, kernel_initializer='normal', activation='relu'),
        Dense(1, kernel_initializer='normal', activation='sigmoid'),
    )
    for layer in layer_stack:
        network.add(layer)

    compile_options = {
        'loss': 'binary_crossentropy',
        'optimizer': 'adam',
        'metrics': ['accuracy'],
    }
    network.compile(**compile_options)
    return network

##### keras classifier

In [56]:
# Wrap the Keras model builder as a scikit-learn classifier so it can be
# cross-validated. This baseline has no standardization step; the estimator
# is used on its own rather than inside a pipeline.
estimator = KerasClassifier(
    build_fn=create_network,
    epochs=100,
    batch_size=5,
    verbose=0,
)

##### KFold

In [57]:
# 10-fold stratified cross-validation; shuffling uses the fixed seed as random_state.
kfold = StratifiedKFold(n_splits=10, shuffle=True, random_state=seed)

##### cross_val_score

In [58]:
# Score the bare estimator on every cross-validation split, then report the
# mean and standard deviation of those scores as percentages.
results = cross_val_score(estimator, X, encoded_Y, cv=kfold)
print(
    "Baseline: %.2f%% (%.2f%%)"
    % (results.mean() * 100, results.std() * 100)
)

  This is separate from the ipykernel package so we can avoid doing imports until
  after removing the cwd from sys.path.


Baseline: 80.75% (7.40%)


# Same Project: Improving Performance with Data Preparation

In [24]:
import numpy
from pandas import read_csv
from keras.models import Sequential
from keras.layers import Dense
from keras.wrappers.scikit_learn import KerasClassifier
from sklearn.model_selection import cross_val_score
from sklearn.preprocessing import LabelEncoder
from sklearn.model_selection import StratifiedKFold
from sklearn.preprocessing import StandardScaler
from sklearn.pipeline import Pipeline


In [25]:
# fix random seed for reproducibility
# NOTE(review): only NumPy's global RNG is seeded here. If the Keras backend
# draws from its own random generator, results may still vary between runs;
# confirm whether the backend needs to be seeded separately.
seed = 7
numpy.random.seed(seed)

##### Reading dataset

In [26]:
# load dataset
# The file location defaults to the original path but can be overridden with
# the SONAR_DATA_PATH environment variable, so the notebook is not tied to a
# single machine's directory layout.
import os

data_path = os.environ.get("SONAR_DATA_PATH", "/home/hasan/DATA SET/sonar.all-data")
# header=None: the first line of the file is read as data, not as column names.
dataframe = read_csv(data_path, header=None)
# Work with the underlying array of values for positional column slicing.
dataset = dataframe.values

##### Dividing dataset

In [27]:
# Separate features from the target: the first 60 columns become the float
# input matrix X, and column 60 is kept as the class-label vector Y.
X = dataset[:, :60].astype(float)
Y = dataset[:, 60]

##### Encoder

In [28]:
# Turn the class labels into integer codes: the encoder is fitted on Y and
# applied to it in a single step.
encoder = LabelEncoder()
encoded_Y = encoder.fit_transform(Y)

##### Model

In [29]:
def create_baseline():
    """Build and compile the baseline binary classifier.

    The model is a fully connected stack: a 60-unit ReLU hidden layer that
    takes 60 input features, followed by a single sigmoid output unit. It is
    compiled with binary cross-entropy loss, the Adam optimizer, and accuracy
    as the reported metric.

    Returns:
        The compiled ``Sequential`` model.
    """
    network = Sequential()

    # Hidden layer: as many units as there are input features.
    hidden = Dense(60, input_dim=60, kernel_initializer='normal', activation='relu')
    network.add(hidden)

    # Output layer: one sigmoid unit for the two-class decision.
    output = Dense(1, kernel_initializer='normal', activation='sigmoid')
    network.add(output)

    network.compile(
        loss='binary_crossentropy',
        optimizer='adam',
        metrics=['accuracy'],
    )
    return network


##### standardizing dataset

In [30]:
# Start the list of pipeline steps with the feature-standardization step; the
# classifier step is added to this list afterwards.
estimators = [('standardize', StandardScaler())]


##### keras classifier

In [31]:
# Add the Keras classifier as the final pipeline step and build the pipeline.
# Any 'mlp' step left over from a previous run of this cell is dropped first,
# so re-running the cell does not pile up duplicate step names (which would
# make the pipeline invalid).
estimators = [step for step in estimators if step[0] != 'mlp']
estimators.append(
    ('mlp', KerasClassifier(build_fn=create_baseline, epochs=100, batch_size=5, verbose=0))
)
pipeline = Pipeline(estimators)

##### K-Fold

In [32]:
# 10-fold stratified cross-validation; shuffling uses the fixed seed as random_state.
kfold = StratifiedKFold(n_splits=10, shuffle=True, random_state=seed)


##### cross_val_score

In [33]:
# Score the standardize + classifier pipeline on every cross-validation split,
# then report the mean and standard deviation of those scores as percentages.
results = cross_val_score(pipeline, X, encoded_Y, cv=kfold)
print(
    "Standardized: %.2f%% (%.2f%%)"
    % (results.mean() * 100, results.std() * 100)
)


Standardized: 83.66% (3.10%)


# Evaluate with a Larger Network

In [34]:
import numpy
from pandas import read_csv
from keras.models import Sequential
from keras.layers import Dense
from keras.wrappers.scikit_learn import KerasClassifier
from sklearn.model_selection import cross_val_score
from sklearn.preprocessing import LabelEncoder
from sklearn.model_selection import StratifiedKFold
from sklearn.preprocessing import StandardScaler
from sklearn.pipeline import Pipeline


In [35]:
# fix random seed for reproducibility
# NOTE(review): only NumPy's global RNG is seeded here. If the Keras backend
# draws from its own random generator, results may still vary between runs;
# confirm whether the backend needs to be seeded separately.
seed = 7
numpy.random.seed(seed)

##### Reading dataset

In [36]:
# load dataset
# The file location defaults to the original path but can be overridden with
# the SONAR_DATA_PATH environment variable, so the notebook is not tied to a
# single machine's directory layout.
import os

data_path = os.environ.get("SONAR_DATA_PATH", "/home/hasan/DATA SET/sonar.all-data")
# header=None: the first line of the file is read as data, not as column names.
dataframe = read_csv(data_path, header=None)
# Work with the underlying array of values for positional column slicing.
dataset = dataframe.values

##### dividing dataset

In [37]:
# Separate features from the target: the first 60 columns become the float
# input matrix X, and column 60 is kept as the class-label vector Y.
X = dataset[:, :60].astype(float)
Y = dataset[:, 60]

##### Encoder

In [38]:
# Turn the class labels into integer codes: the encoder is fitted on Y and
# applied to it in a single step.
encoder = LabelEncoder()
encoded_Y = encoder.fit_transform(Y)

##### Model

In [39]:
def create_baseline():
    """Build and compile the larger binary classifier.

    The model is a fully connected stack: a 60-unit ReLU layer that takes 60
    input features, a 30-unit ReLU layer, and a single sigmoid output unit.
    It is compiled with binary cross-entropy loss, the Adam optimizer, and
    accuracy as the reported metric.

    NOTE(review): this reuses the name of the two-layer builder defined
    earlier in the notebook, so whichever definition ran last is the one in
    effect. Consider giving this one a distinct name.

    Returns:
        The compiled ``Sequential`` model.
    """
    network = Sequential()

    # Layers are added in order, narrowing 60 -> 30 -> 1.
    layer_stack = (
        Dense(60, input_dim=60, kernel_initializer='normal', activation='relu'),
        Dense(30, kernel_initializer='normal', activation='relu'),
        Dense(1, kernel_initializer='normal', activation='sigmoid'),
    )
    for layer in layer_stack:
        network.add(layer)

    network.compile(
        loss='binary_crossentropy',
        optimizer='adam',
        metrics=['accuracy'],
    )
    return network


##### Standardizing the dataset

In [40]:
# Start the list of pipeline steps with the feature-standardization step; the
# classifier step is added to this list afterwards.
estimators = [('standardize', StandardScaler())]


##### keras classifier

In [41]:
# Add the Keras classifier as the final pipeline step and build the pipeline.
# Any 'mlp' step left over from a previous run of this cell is dropped first,
# so re-running the cell does not pile up duplicate step names (which would
# make the pipeline invalid).
estimators = [step for step in estimators if step[0] != 'mlp']
estimators.append(
    ('mlp', KerasClassifier(build_fn=create_baseline, epochs=100, batch_size=5, verbose=0))
)
pipeline = Pipeline(estimators)

##### K-Fold

In [42]:
# 10-fold stratified cross-validation; shuffling uses the fixed seed as random_state.
kfold = StratifiedKFold(n_splits=10, shuffle=True, random_state=seed)

##### cross_val_score

In [43]:
# Score the standardize + classifier pipeline on every cross-validation split,
# then report the mean and standard deviation of those scores as percentages.
results = cross_val_score(pipeline, X, encoded_Y, cv=kfold)
print(
    "Standardized: %.2f%% (%.2f%%)"
    % (results.mean() * 100, results.std() * 100)
)


Standardized: 85.52% (4.43%)
