In [None]:
import pandas as pd
from tensorflow import keras
from tensorflow.keras import layers
from keras_tuner.tuners import RandomSearch

In [None]:
# Load the air-quality table; the path is relative to the notebook's working directory.
dataset = pd.read_csv('Real_Combine.csv')

In [None]:
# Preview the first rows to check which columns were loaded.
dataset.head()

Unnamed: 0,T,TM,Tm,SLP,H,VV,V,VM,PM 2.5
0,7.4,9.8,4.8,1017.6,93.0,0.5,4.3,9.4,219.720833
1,7.8,12.7,4.4,1018.5,87.0,0.6,4.4,11.1,182.1875
2,6.7,13.4,2.4,1019.4,82.0,0.6,4.8,11.1,154.0375
3,8.6,15.5,3.3,1018.7,72.0,0.8,8.1,20.6,223.208333
4,12.4,20.9,4.4,1017.3,61.0,1.3,8.7,22.2,200.645833


In [None]:
# Every trial recorded in this notebook scored `nan`. Missing values in the data are the
# likely cause (TODO confirm with `dataset.isnull().sum()`), so keep only complete rows.
dataset_clean = dataset.dropna()

# Predictors: every column except the last. 'Unnamed: 0' only repeats the row number
# (0, 1, 2, ... in the preview), so it is excluded; errors='ignore' keeps this cell
# working if the CSV is ever re-exported without that column.
x = dataset_clean.iloc[:, :-1].drop(columns=['Unnamed: 0'], errors='ignore')

# Target: the last column ('PM 2.5' in the preview).
y = dataset_clean.iloc[:, -1]

### Hyperparameters
1. How many hidden layers are needed
2. How many neurons each hidden layer needs
3. What the learning rate should be

In [None]:
def build_model(hp):
    """Assemble and compile a dense regression network from tuner-chosen values.

    Hyperparameters requested from ``hp``, in this order:

    * ``num_layers``    -- number of hidden layers, an integer between 2 and 20
      (``hp.Int`` tries different integer values from a range).
    * ``units_<i>``     -- width of hidden layer ``i``, between 32 and 512 in
      steps of 32 (``hp.Int``).
    * ``learning_rate`` -- value handed to Adam, one of 1e-2, 1e-3 or 1e-4
      (``hp.Choice`` selects one of the listed options).

    Args:
        hp: hyperparameter object supplied by the tuner; only its ``Int`` and
            ``Choice`` methods are used here.

    Returns:
        The compiled ``keras.Sequential`` model: ReLU hidden layers followed by
        a single linear output unit, with mean absolute error as both the loss
        and the reported metric.
    """
    network = keras.Sequential()

    depth = hp.Int('num_layers', 2, 20)
    for layer_index in range(depth):
        width = hp.Int('units_' + str(layer_index),
                       min_value=32,
                       max_value=512,
                       step=32)
        network.add(layers.Dense(units=width, activation='relu'))

    # One linear unit: the network outputs a single continuous value.
    network.add(layers.Dense(1, activation='linear'))

    step_size = hp.Choice('learning_rate', [1e-2, 1e-3, 1e-4])
    network.compile(
        optimizer=keras.optimizers.Adam(step_size),
        loss='mean_absolute_error',
        metrics=['mean_absolute_error'],
    )
    return network

In [None]:
# Random search over the hyperparameters declared in build_model, minimising the
# validation mean absolute error.
# NOTE(review): KerasTuner reloads results already saved under directory/project_name;
# pass overwrite=True if a re-run should start a fresh search instead.
tuner = RandomSearch(
    build_model,
    objective='val_mean_absolute_error',
    max_trials=5,            # number of hyperparameter combinations to try
    executions_per_trial=3,  # models built and fitted for each combination
    seed=42,                 # fixed so the sampled combinations are repeatable
    directory='DeepLearning',
    project_name='Air Quality Index')

In [None]:
# Print the hyperparameters registered so far together with their ranges/choices.
tuner.search_space_summary()

Search space summary
Default search space size: 4
num_layers (Int)
{'default': None, 'conditions': [], 'min_value': 2, 'max_value': 20, 'step': 1, 'sampling': None}
units_0 (Int)
{'default': None, 'conditions': [], 'min_value': 32, 'max_value': 512, 'step': 32, 'sampling': None}
units_1 (Int)
{'default': None, 'conditions': [], 'min_value': 32, 'max_value': 512, 'step': 32, 'sampling': None}
learning_rate (Choice)
{'default': 0.01, 'conditions': [], 'values': [0.01, 0.001, 0.0001], 'ordered': True}


In [None]:
from sklearn.model_selection import train_test_split

# Hold out 30% of the rows; random_state pins the shuffle so the split is repeatable.
X_train, X_test, y_train, y_test = train_test_split(
    x,
    y,
    test_size=0.3,
    random_state=0,
)

In [None]:
# Run the search: each candidate model is fitted on the training split for 5 epochs.
# NOTE(review): the test split is passed as validation_data, so hyperparameters are
# selected on it and no untouched hold-out remains -- consider a separate validation split.
tuner.search(X_train, y_train, epochs=5, validation_data=(X_test, y_test))


Search: Running Trial #1

Hyperparameter    |Value             |Best Value So Far 
num_layers        |10                |?                 
units_0           |128               |?                 
units_1           |480               |?                 
learning_rate     |0.01              |?                 

Epoch 1/5
Epoch 2/5
Epoch 3/5
Epoch 4/5
Epoch 5/5
Epoch 1/5
Epoch 2/5
Epoch 3/5
Epoch 4/5
Epoch 5/5
Epoch 1/5
Epoch 2/5
Epoch 3/5
Epoch 4/5
Epoch 5/5
[2K[2KTrial 1 Complete [00h 00m 05s]
val_mean_absolute_error: nan

Best val_mean_absolute_error So Far: nan
Total elapsed time: 00h 00m 05s

Search: Running Trial #2

Hyperparameter    |Value             |Best Value So Far 
num_layers        |2                 |10                
units_0           |416               |128               
units_1           |480               |480               
learning_rate     |0.0001            |0.01              
units_2           |480               |32                
units_3           |288  

  return np.nanmin(values)
  return np.nanmin(values)
  return np.nanmin(values)
  return np.nanmin(values)
  return np.nanmin(values)


In [None]:
# Print the best trials with their hyperparameters and objective score.
tuner.results_summary()

Results summary
Results in DeepLearning/Air Quality Index
Showing 10 best trials
Objective(name='val_mean_absolute_error', direction='min')
Trial summary
Hyperparameters:
num_layers: 10
units_0: 128
units_1: 480
learning_rate: 0.01
units_2: 32
units_3: 32
units_4: 32
units_5: 32
units_6: 32
units_7: 32
units_8: 32
units_9: 32
Score: nan
Trial summary
Hyperparameters:
num_layers: 2
units_0: 416
units_1: 480
learning_rate: 0.0001
units_2: 480
units_3: 288
units_4: 320
units_5: 256
units_6: 448
units_7: 416
units_8: 32
units_9: 480
Score: nan
Trial summary
Hyperparameters:
num_layers: 13
units_0: 64
units_1: 416
learning_rate: 0.0001
units_2: 160
units_3: 128
units_4: 384
units_5: 160
units_6: 352
units_7: 448
units_8: 512
units_9: 352
units_10: 32
units_11: 32
units_12: 32
Score: nan
Trial summary
Hyperparameters:
num_layers: 8
units_0: 64
units_1: 288
learning_rate: 0.01
units_2: 96
units_3: 288
units_4: 128
units_5: 64
units_6: 448
units_7: 224
units_8: 160
units_9: 224
units_10: 288
u