In [1]:
import numpy as np
import pandas as pd

from sklearn.model_selection import train_test_split
from sklearn.preprocessing import StandardScaler
from sklearn.metrics import accuracy_score

import tensorflow as tf
from tensorflow import keras
from keras.models import Sequential
from keras.layers import Dense

import keras_tuner as kt

In [2]:
df = pd.read_csv("D:/Intern/DataSets/Pima-Indians-Diabetes.csv")

In [3]:
df.shape

(768, 9)

In [4]:
df.head()

Unnamed: 0,Pregnancies,Glucose,BloodPressure,SkinThickness,Insulin,BMI,DiabetesPedigreeFunction,Age,Outcome
0,6,148,72,35,0,33.6,0.627,50,1
1,1,85,66,29,0,26.6,0.351,31,0
2,8,183,64,0,0,23.3,0.672,32,1
3,1,89,66,23,94,28.1,0.167,21,0
4,0,137,40,35,168,43.1,2.288,33,1


In [5]:
df.corr()['Outcome']

Pregnancies                 0.221898
Glucose                     0.466581
BloodPressure               0.065068
SkinThickness               0.074752
Insulin                     0.130548
BMI                         0.292695
DiabetesPedigreeFunction    0.173844
Age                         0.238356
Outcome                     1.000000
Name: Outcome, dtype: float64

In [6]:
X = df.drop('Outcome', axis=1)
y = df['Outcome']

In [7]:
X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.2, random_state=42)

In [8]:
scaler = StandardScaler()
X_train = scaler.fit_transform(X_train)
X_test = scaler.transform(X_test)

In [9]:
model = Sequential()
model.add(Dense(32, activation='relu', input_shape=(8,)))
model.add(Dense(1, activation='sigmoid'))


model.compile(optimizer='adam', loss='binary_crossentropy', metrics=['accuracy'])

  super().__init__(activity_regularizer=activity_regularizer, **kwargs)


In [10]:
model.fit(X_train, y_train, epochs=10, batch_size=32, validation_data=(X_test, y_test))

Epoch 1/10
[1m20/20[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m1s[0m 12ms/step - accuracy: 0.6596 - loss: 0.6133 - val_accuracy: 0.7078 - val_loss: 0.6041
Epoch 2/10
[1m20/20[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m0s[0m 5ms/step - accuracy: 0.7182 - loss: 0.5716 - val_accuracy: 0.7013 - val_loss: 0.5810
Epoch 3/10
[1m20/20[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m0s[0m 4ms/step - accuracy: 0.7524 - loss: 0.5425 - val_accuracy: 0.6948 - val_loss: 0.5630
Epoch 4/10
[1m20/20[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m0s[0m 5ms/step - accuracy: 0.7541 - loss: 0.5219 - val_accuracy: 0.7078 - val_loss: 0.5491
Epoch 5/10
[1m20/20[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m0s[0m 9ms/step - accuracy: 0.7687 - loss: 0.5056 - val_accuracy: 0.7143 - val_loss: 0.5407
Epoch 6/10
[1m20/20[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m0s[0m 6ms/step - accuracy: 0.7687 - loss: 0.4932 - val_accuracy: 0.7338 - val_loss: 0.5332
Epoch 7/10
[1m20/20[0m [32m━━━━━━━━━

<keras.src.callbacks.history.History at 0x1d1a0c4f6e0>

In [11]:
loss, acc = model.evaluate(X_test, y_test)
print(f"Loss: {loss:.4f}, Accuracy: {acc:.4f}")

[1m5/5[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m0s[0m 5ms/step - accuracy: 0.7468 - loss: 0.5167 
Loss: 0.5167, Accuracy: 0.7468


In [12]:
def build_model(hp):
    model = Sequential()
    
    units = hp.Int('units', min_value=8, max_value=128, step=8)
    activation = hp.Choice('activation', values = ['relu', 'tanh'])
    model.add(Dense(units=units, activation=activation, input_shape=(8,)))
    model.add(Dense(1, activation='sigmoid'))
    
    optimizer = hp.Choice('optimizer', values = ['adam', 'sgd', 'rmsprop', 'adadelta'])
    model.compile(optimizer=optimizer, loss='binary_crossentropy', metrics=['accuracy'])
    
    return model

In [13]:
tuner = kt.RandomSearch(build_model, objective='val_accuracy', max_trials=5, directory='my_dir', project_name='Keras_Tuner_Pima-Diabetes')

In [14]:
tuner.search(X_train, y_train, epochs=5, validation_data=(X_test, y_test))

Trial 5 Complete [00h 00m 01s]
val_accuracy: 0.7337662577629089

Best val_accuracy So Far: 0.7597402334213257
Total elapsed time: 00h 00m 08s


In [15]:
tuner.get_best_hyperparameters()[0].values

{'units': 88, 'activation': 'tanh', 'optimizer': 'sgd'}

In [17]:
model = tuner.get_best_models(num_models=1)[0]
model.fit(X_train, y_train, epochs=20, initial_epoch=6, batch_size=32, validation_data=(X_test, y_test))

Epoch 7/20
[1m20/20[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m0s[0m 11ms/step - accuracy: 0.7362 - loss: 0.6088 - val_accuracy: 0.7403 - val_loss: 0.5878
Epoch 8/20
[1m20/20[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m0s[0m 4ms/step - accuracy: 0.7443 - loss: 0.5800 - val_accuracy: 0.7468 - val_loss: 0.5656
Epoch 9/20
[1m20/20[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m0s[0m 4ms/step - accuracy: 0.7557 - loss: 0.5587 - val_accuracy: 0.7208 - val_loss: 0.5507
Epoch 10/20
[1m20/20[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m0s[0m 4ms/step - accuracy: 0.7541 - loss: 0.5421 - val_accuracy: 0.7143 - val_loss: 0.5399
Epoch 11/20
[1m20/20[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m0s[0m 4ms/step - accuracy: 0.7557 - loss: 0.5295 - val_accuracy: 0.7208 - val_loss: 0.5305
Epoch 12/20
[1m20/20[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m0s[0m 4ms/step - accuracy: 0.7622 - loss: 0.5193 - val_accuracy: 0.7273 - val_loss: 0.5238
Epoch 13/20
[1m20/20[0m [32m━━━━━

<keras.src.callbacks.history.History at 0x1d1a62ec860>

In [19]:
loss, acc = model.evaluate(X_test, y_test)
print(f"Loss: {loss:.4f}, Accuracy: {acc:.4f}")

[1m5/5[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m0s[0m 5ms/step - accuracy: 0.7532 - loss: 0.4983 
Loss: 0.4983, Accuracy: 0.7532
