In [1]:
import numpy as np
import pandas as pd

In [2]:
df = pd.read_csv('diabetes.csv')
df.head()

Unnamed: 0,Pregnancies,Glucose,BloodPressure,SkinThickness,Insulin,BMI,DiabetesPedigreeFunction,Age,Outcome
0,6,148,72,35,0,33.6,0.627,50,1
1,1,85,66,29,0,26.6,0.351,31,0
2,8,183,64,0,0,23.3,0.672,32,1
3,1,89,66,23,94,28.1,0.167,21,0
4,0,137,40,35,168,43.1,2.288,33,1


In [4]:
df.corr()['Outcome'].sort_values(ascending=False)

Outcome                     1.000000
Glucose                     0.466581
BMI                         0.292695
Age                         0.238356
Pregnancies                 0.221898
DiabetesPedigreeFunction    0.173844
Insulin                     0.130548
SkinThickness               0.074752
BloodPressure               0.065068
Name: Outcome, dtype: float64

In [5]:
X = df.iloc[:, :-1].values
y = df.iloc[:, -1].values

In [6]:
from sklearn.preprocessing import StandardScaler
scaler = StandardScaler()

In [7]:
X = scaler.fit_transform(X)

In [9]:
X

array([[ 0.63994726,  0.84832379,  0.14964075, ...,  0.20401277,
         0.46849198,  1.4259954 ],
       [-0.84488505, -1.12339636, -0.16054575, ..., -0.68442195,
        -0.36506078, -0.19067191],
       [ 1.23388019,  1.94372388, -0.26394125, ..., -1.10325546,
         0.60439732, -0.10558415],
       ...,
       [ 0.3429808 ,  0.00330087,  0.14964075, ..., -0.73518964,
        -0.68519336, -0.27575966],
       [-0.84488505,  0.1597866 , -0.47073225, ..., -0.24020459,
        -0.37110101,  1.17073215],
       [-0.84488505, -0.8730192 ,  0.04624525, ..., -0.20212881,
        -0.47378505, -0.87137393]])

In [10]:
from sklearn.model_selection import train_test_split
X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.2, random_state=1)

In [11]:
import tensorflow as tf
from tensorflow import keras
from keras import Sequential
from keras.layers import Dense

In [12]:
model = Sequential()
model.add(Dense(32, activation='relu', input_dim=8))
model.add(Dense(1, activation='sigmoid'))

model.compile(optimizer='adam', loss='binary_crossentropy', metrics=['accuracy'])

  super().__init__(activity_regularizer=activity_regularizer, **kwargs)


In [14]:
model.fit(X_train, y_train, batch_size=32, epochs=100, validation_data=(X_test, y_test))

Epoch 1/100


[1m20/20[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m0s[0m 7ms/step - accuracy: 0.7853 - loss: 0.4909 - val_accuracy: 0.8117 - val_loss: 0.4708
Epoch 2/100
[1m20/20[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m0s[0m 3ms/step - accuracy: 0.7973 - loss: 0.4735 - val_accuracy: 0.7987 - val_loss: 0.4655
Epoch 3/100
[1m20/20[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m0s[0m 3ms/step - accuracy: 0.7454 - loss: 0.4899 - val_accuracy: 0.8117 - val_loss: 0.4612
Epoch 4/100
[1m20/20[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m0s[0m 3ms/step - accuracy: 0.7682 - loss: 0.4946 - val_accuracy: 0.8052 - val_loss: 0.4582
Epoch 5/100
[1m20/20[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m0s[0m 3ms/step - accuracy: 0.7719 - loss: 0.4994 - val_accuracy: 0.8052 - val_loss: 0.4554
Epoch 6/100
[1m20/20[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m0s[0m 3ms/step - accuracy: 0.7896 - loss: 0.4643 - val_accuracy: 0.8052 - val_loss: 0.4527
Epoch 7/100
[1m20/20[0m [32m━━━━━━━━━━━━━━━

<keras.src.callbacks.history.History at 0x16b1daddc10>

In [None]:
# Hyperparameter tuning
import keras_tuner as kt

In [19]:
# defining function for keras tuner
def build_model(hp):
    model = Sequential()
    model.add(Dense(32, activation='relu', input_dim=8))
    model.add(Dense(1, activation='sigmoid'))

    optimizer = hp.Choice('optimizer', values = ['adam', 'sgd', 'rmsprop']) # choice of optimizer in keras tuner

    model.compile(optimizer=optimizer, loss='binary_crossentropy', metrics=['accuracy'])

    return model

In [20]:
# tuner object
tuner = kt.RandomSearch(build_model, objective='val_accuracy', max_trials=5) # RandomSearch method used in keras tuner for hyperparameter tuning

# tuner search
tuner.search(X_train, y_train, epochs=5, validation_data=(X_test, y_test)) # search method used to search for best hyperparameters

Trial 3 Complete [00h 00m 02s]
val_accuracy: 0.7727272510528564

Best val_accuracy So Far: 0.7727272510528564
Total elapsed time: 00h 00m 05s


In [23]:
# get best hyperparameters
best_hps = tuner.get_best_hyperparameters()[0] # get_best_hyperparameters method used to get best hyperparameters
best_hps.values

{'optimizer': 'adam'}

In [24]:
# get best model
model = tuner.hypermodel.build(best_hps) # build method used to build best model

  super().__init__(activity_regularizer=activity_regularizer, **kwargs)


In [25]:
model.summary()

In [26]:
# fit best model
model.fit(X_train, y_train, batch_size=32, epochs=100, initial_epoch=6, validation_data=(X_test, y_test))

Epoch 7/100
[1m20/20[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m1s[0m 8ms/step - accuracy: 0.6142 - loss: 0.6549 - val_accuracy: 0.7078 - val_loss: 0.6069
Epoch 8/100
[1m20/20[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m0s[0m 3ms/step - accuracy: 0.6406 - loss: 0.6087 - val_accuracy: 0.7468 - val_loss: 0.5659
Epoch 9/100
[1m20/20[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m0s[0m 3ms/step - accuracy: 0.6854 - loss: 0.5780 - val_accuracy: 0.7597 - val_loss: 0.5368
Epoch 10/100
[1m20/20[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m0s[0m 3ms/step - accuracy: 0.7182 - loss: 0.5519 - val_accuracy: 0.7727 - val_loss: 0.5151
Epoch 11/100
[1m20/20[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m0s[0m 3ms/step - accuracy: 0.7380 - loss: 0.5182 - val_accuracy: 0.7727 - val_loss: 0.4990
Epoch 12/100
[1m20/20[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m0s[0m 3ms/step - accuracy: 0.7251 - loss: 0.5354 - val_accuracy: 0.7857 - val_loss: 0.4882
Epoch 13/100
[1m20/20[0m [32

<keras.src.callbacks.history.History at 0x16b21ad5610>

In [32]:
# neuron tuning
def build_model(hp):
    model = Sequential()
    
    units = hp.Int('units',min_value=8, max_value=128, step=8) # Int method used to define range of neurons
    model.add(Dense(units, activation='relu', input_dim=8))
    model.add(Dense(1, activation='sigmoid'))

    model.compile(optimizer='adam', loss='binary_crossentropy', metrics=['accuracy'])

    return model


In [33]:
# tuner object
tuner = kt.RandomSearch(build_model, objective='val_accuracy', max_trials=5)

Reloading Tuner from .\untitled_project\tuner0.json


In [35]:
# tuner search
tuner.search(X_train, y_train, epochs=5, directory='my_dir', project_name='intro_to_kt', validation_data=(X_test, y_test))