In [1]:
import pandas as pd
from tensorflow import keras
import keras_tuner
from tensorflow.keras import layers
from kerastuner.tuners import RandomSearch

  from kerastuner.tuners import RandomSearch


In [2]:
df = pd.read_csv('diabetes.csv')

In [3]:
df.head()

Unnamed: 0,Pregnancies,Glucose,BloodPressure,SkinThickness,Insulin,BMI,DiabetesPedigreeFunction,Age,Outcome
0,6,148,72,35,0,33.6,0.627,50,1
1,1,85,66,29,0,26.6,0.351,31,0
2,8,183,64,0,0,23.3,0.672,32,1
3,1,89,66,23,94,28.1,0.167,21,0
4,0,137,40,35,168,43.1,2.288,33,1


In [4]:
X=df.iloc[:,:-1] ## independent features
y=df.iloc[:,-1] ## dependent features

# Hyperparameters
### 1.How many number of hidden layers we should have?
### 2.How many number of neurons we should have in hidden layers? 
### 3.Learning Rate

In [6]:
def build_model(hp):
    model = keras.Sequential()
    for i in range(hp.Int('num_layers', 2, 20)):
        model.add(layers.Dense(units=hp.Int('units_' + str(i),
                                            min_value=32,
                                            max_value=512,
                                            step=32),
                                            activation='relu'))
    model.add(layers.Dense(1, activation='linear'))
    model.compile(
        optimizer=keras.optimizers.Adam(hp.Choice('learning_rate', [1e-2, 1e-3, 1e-4])),
        loss='mean_absolute_error',
        metrics=['mean_absolute_error'])
    return model

In [7]:
tuner = RandomSearch(
    build_model,
    objective='val_mean_absolute_error',
    max_trials=5,
    executions_per_trial=3,
    directory='project',
    project_name='Air Quality Index')

In [8]:
tuner.search_space_summary()

Search space summary
Default search space size: 4
num_layers (Int)
{'default': None, 'conditions': [], 'min_value': 2, 'max_value': 20, 'step': 1, 'sampling': 'linear'}
units_0 (Int)
{'default': None, 'conditions': [], 'min_value': 32, 'max_value': 512, 'step': 32, 'sampling': 'linear'}
units_1 (Int)
{'default': None, 'conditions': [], 'min_value': 32, 'max_value': 512, 'step': 32, 'sampling': 'linear'}
learning_rate (Choice)
{'default': 0.01, 'conditions': [], 'values': [0.01, 0.001, 0.0001], 'ordered': True}


In [9]:
from sklearn.model_selection import train_test_split
X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.3, random_state=0)

In [10]:
tuner.search(X_train, y_train,
             epochs=5,
             validation_data=(X_test, y_test))

Trial 5 Complete [00h 00m 30s]
val_mean_absolute_error: 0.3213128050168355

Best val_mean_absolute_error So Far: 0.31615586082140607
Total elapsed time: 00h 02m 04s
INFO:tensorflow:Oracle triggered exit


In [11]:
tuner.results_summary()

Results summary
Results in project\Air Quality Index
Showing 10 best trials
Objective(name="val_mean_absolute_error", direction="min")

Trial 2 summary
Hyperparameters:
num_layers: 18
units_0: 160
units_1: 448
learning_rate: 0.001
units_2: 384
units_3: 224
units_4: 64
units_5: 160
units_6: 32
units_7: 448
units_8: 288
units_9: 32
units_10: 32
units_11: 32
units_12: 32
units_13: 32
units_14: 32
units_15: 32
units_16: 32
units_17: 32
Score: 0.31615586082140607

Trial 1 summary
Hyperparameters:
num_layers: 9
units_0: 512
units_1: 64
learning_rate: 0.01
units_2: 96
units_3: 192
units_4: 512
units_5: 128
units_6: 32
units_7: 32
units_8: 32
Score: 0.32109561562538147

Trial 4 summary
Hyperparameters:
num_layers: 15
units_0: 320
units_1: 32
learning_rate: 0.01
units_2: 96
units_3: 128
units_4: 448
units_5: 352
units_6: 64
units_7: 96
units_8: 352
units_9: 64
units_10: 480
units_11: 320
units_12: 448
units_13: 384
units_14: 416
units_15: 320
units_16: 192
units_17: 384
Score: 0.321312805016835