### Keras Tuner - Deciding the Number of Hidden Layers and Neurons in a Neural Network

In [3]:
import pandas as pd
from keras_tuner.tuners import RandomSearch
from sklearn.model_selection import train_test_split
from tensorflow import keras
from tensorflow.keras import layers

In [10]:
# Read Real_Combine.csv and keep only the rows that have no missing values.
df = pd.read_csv('Real_Combine.csv').dropna()
# Preview the first rows, then the (rows, columns) shape of the cleaned frame.
print(df.head(), df.shape, sep='\n')

      T    TM   Tm     SLP     H   VV    V    VM      PM 2.5
1   7.4   9.8  4.8  1017.6  93.0  0.5  4.3   9.4  219.720833
3   7.8  12.7  4.4  1018.5  87.0  0.6  4.4  11.1  182.187500
5   6.7  13.4  2.4  1019.4  82.0  0.6  4.8  11.1  154.037500
7   8.6  15.5  3.3  1018.7  72.0  0.8  8.1  20.6  223.208333
9  12.4  20.9  4.4  1017.3  61.0  1.3  8.7  22.2  200.645833
(1092, 9)


In [7]:
# Independent features are every column but the last; the dependent feature
# (target) is the last column.
X, y = df.iloc[:, :-1], df.iloc[:, -1]

### Hyperparameters
1. How many hidden layers should the network have?
2. How many neurons should each hidden layer have?
3. Which learning rate should we use?

In [13]:
def build_model(hp):
    """Assemble and compile a fully connected regression network for one trial.

    Hyperparameters requested from ``hp``:
      * ``num_layer``     - number of hidden Dense layers, between 2 and 20.
      * ``units_<i>``     - width of hidden layer ``i``, 32 to 512 in steps of 32.
      * ``learning_rate`` - Adam learning rate, one of 1e-2, 1e-3 or 1e-4.

    Args:
        hp: Hyperparameter container providing ``Int`` and ``Choice``.

    Returns:
        The compiled ``keras.Sequential`` model, using mean absolute error
        as both the loss and the reported metric.
    """
    network = keras.Sequential()

    # Stack the hidden layers; each one gets its own tunable width.
    depth = hp.Int('num_layer', 2, 20)
    for layer_idx in range(depth):
        width = hp.Int(f'units_{layer_idx}', min_value=32, max_value=512, step=32)
        network.add(layers.Dense(units=width, activation='relu'))

    # Single linear output unit: the model predicts one continuous value.
    network.add(layers.Dense(1, activation='linear'))

    step_size = hp.Choice('learning_rate', [1e-2, 1e-3, 1e-4])
    network.compile(
        optimizer=keras.optimizers.Adam(step_size),
        loss='mean_absolute_error',
        metrics=['mean_absolute_error'],
    )
    return network

In [14]:
# Random-search tuner: samples hyperparameter sets for build_model and ranks
# them by validation mean absolute error.
# NOTE(review): per the Keras Tuner docs an existing project with the same
# directory/project_name is reloaded unless overwrite=True is passed - confirm
# that resuming earlier trials is intended here.
tuner = RandomSearch(
    build_model,
    objective='val_mean_absolute_error',
    max_trials=5,            # hyperparameter combinations to evaluate
    executions_per_trial=3,  # models trained per combination
    seed=0,                  # pin the sampled combinations so fresh runs are comparable
    directory='project',
    project_name='Air Quality Index')

In [15]:
# Print the hyperparameters the tuner has registered so far, with their ranges.
tuner.search_space_summary()

Search space summary
Default search space size: 4
num_layer (Int)
{'default': None, 'conditions': [], 'min_value': 2, 'max_value': 20, 'step': 1, 'sampling': None}
units_0 (Int)
{'default': None, 'conditions': [], 'min_value': 32, 'max_value': 512, 'step': 32, 'sampling': None}
units_1 (Int)
{'default': None, 'conditions': [], 'min_value': 32, 'max_value': 512, 'step': 32, 'sampling': None}
learning_rate (Choice)
{'default': 0.01, 'conditions': [], 'values': [0.01, 0.001, 0.0001], 'ordered': True}


In [16]:
# Hold out 30% of the rows; random_state pins the shuffle so the split is repeatable.
X_train, X_test, y_train, y_test = train_test_split(
    X, y, test_size=0.3, random_state=0)

In [18]:
# Run the search: every trial trains for 5 epochs on the training split and is
# scored on (X_test, y_test) via the tuner's val_mean_absolute_error objective.
# NOTE(review): the held-out split therefore drives hyperparameter selection,
# so it cannot also serve as an unbiased final test set - consider carving out
# a separate validation split.
tuner.search(X_train, y_train, epochs=5, validation_data=(X_test, y_test))

Trial 6 Complete [00h 00m 11s]
val_mean_absolute_error: 48.30751927693685

Best val_mean_absolute_error So Far: 48.30751927693685
Total elapsed time: 00h 01m 25s
INFO:tensorflow:Oracle triggered exit


In [20]:
# Print the recorded trials with their hyperparameters and objective scores.
tuner.results_summary()

Results summary
Results in project\Air Quality Index
Showing 10 best trials
Objective(name='val_mean_absolute_error', direction='min')
Trial summary
Hyperparameters:
num_layer: 6
units_0: 256
units_1: 480
learning_rate: 0.01
units_2: 224
units_3: 32
units_4: 128
units_5: 480
units_6: 128
units_7: 384
units_8: 384
units_9: 480
units_10: 96
units_11: 384
units_12: 288
units_13: 64
units_14: 160
units_15: 384
units_16: 448
units_17: 128
Score: 48.30751927693685
Trial summary
Hyperparameters:
num_layer: 10
units_0: 416
units_1: 224
learning_rate: 0.001
units_2: 32
units_3: 32
units_4: 32
units_5: 32
units_6: 32
units_7: 32
units_8: 32
units_9: 32
Score: 64.04886881510417
Trial summary
Hyperparameters:
num_layer: 10
units_0: 288
units_1: 288
learning_rate: 0.0001
units_2: 256
units_3: 128
units_4: 192
units_5: 448
units_6: 512
units_7: 416
units_8: 384
units_9: 384
Score: 64.28427505493164
Trial summary
Hyperparameters:
num_layer: 5
units_0: 352
units_1: 224
learning_rate: 0.0001
units_2: 1