In [14]:
import pandas as pd
from sklearn.preprocessing import StandardScaler, LabelEncoder
from sklearn.model_selection import train_test_split
from collections import Counter
from sklearn.compose import ColumnTransformer
from tensorflow.keras.models import Sequential
from tensorflow.keras.layers import Dense, InputLayer
from sklearn.metrics import classification_report
from tensorflow.keras.utils import to_categorical
import numpy as np
import tensorflow

# Design the model

In [16]:
#design the model
def design_model(x):
  """Build and compile the heart-failure classifier.

  The network is a Sequential model named "Heart_Failure_Prediction" with
  an input layer as wide as the feature matrix, one hidden Dense layer of
  12 ReLU units, and a 2-unit softmax output layer.

  Args:
    x: feature matrix; only ``x.shape[1]`` (the number of feature columns)
      is read, to size the input layer.

  Returns:
    The model, compiled with categorical cross-entropy loss, the Adam
    optimizer and accuracy as the tracked metric.
  """
  n_features = x.shape[1]

  network = Sequential(name="Heart_Failure_Prediction")

  # input layer: one unit per feature column
  network.add(InputLayer(input_shape=(n_features,)))

  # single hidden layer
  network.add(Dense(12, activation='relu'))

  # output layer: softmax over the two classes
  network.add(Dense(2, activation='softmax'))

  # Adam optimizer; the loss expects one-hot encoded labels
  network.compile(
    loss='categorical_crossentropy',
    optimizer='adam',
    metrics=['accuracy'],
  )
  return network

# Load and Observe Data

In [3]:
#load dataset
data = pd.read_csv('heart_failure.csv')

# Observe the columns and their datatypes.
# DataFrame.info() writes its report to stdout itself and returns None, so it
# is called directly: wrapping it in print() emits an extra "None" line.
data.info()
 

<class 'pandas.core.frame.DataFrame'>
RangeIndex: 299 entries, 0 to 298
Data columns (total 15 columns):
Unnamed: 0                  299 non-null int64
age                         299 non-null float64
anaemia                     299 non-null object
creatinine_phosphokinase    299 non-null int64
diabetes                    299 non-null object
ejection_fraction           299 non-null int64
high_blood_pressure         299 non-null object
platelets                   299 non-null float64
serum_creatinine            299 non-null float64
serum_sodium                299 non-null int64
sex                         299 non-null object
smoking                     299 non-null object
time                        299 non-null int64
DEATH_EVENT                 299 non-null int64
death_event                 299 non-null object
dtypes: float64(3), int64(6), object(6)
memory usage: 35.1+ KB
None


In [4]:
#show the class distribution
# tally how many rows carry each value of the 'death_event' label column
class_counts = Counter(data['death_event'])
class_counts

Counter({'yes': 96, 'no': 203})

In [6]:
#extract the label column (the string-valued 'death_event' target) from the data
y = data['death_event']

#extract the feature columns from the data
# 'Unnamed: 0' and the integer 'DEATH_EVENT' column are deliberately not
# selected here; only the twelve columns listed below are used as model inputs
x = data[['age','anaemia','creatinine_phosphokinase','diabetes','ejection_fraction','high_blood_pressure','platelets','serum_creatinine','serum_sodium','sex','smoking','time']]

# Data Preprocessing

In [9]:
# convert categorical features to numerical using one-hot encoding;
# the object-typed columns (anaemia, diabetes, high_blood_pressure, sex, smoking)
# are replaced by indicator columns, the numeric columns are left unchanged
x = pd.get_dummies(x)

In [10]:
#split dataset into training and testing datasets
# 30% of the rows are held out for testing; random_state pins the shuffle
X_train, X_test, Y_train, Y_test = train_test_split(
    x,
    y,
    test_size=0.3,
    random_state=20,
)

#standardize
# only these numeric columns are scaled; every other column (the one-hot
# indicators) is passed through untouched
numeric_columns = [
    'age',
    'creatinine_phosphokinase',
    'ejection_fraction',
    'platelets',
    'serum_creatinine',
    'serum_sodium',
    'time',
]
scaling_step = ('standardize', StandardScaler(), numeric_columns)
ct = ColumnTransformer([scaling_step], remainder='passthrough')

# the scaler is fitted on the training split only and then re-used as-is on
# the test split
X_train = ct.fit_transform(X_train)
X_test = ct.transform(X_test)


# Prepare labels for classification

In [15]:
#encode the labels into integers
# the encoder is fitted on the training labels and re-used for the test labels
le = LabelEncoder()
train_label_ids = le.fit_transform(Y_train.astype(str))
test_label_ids = le.transform(Y_test.astype(str))

#convert the integer encoded labels into binary vectors
# one-hot form is what the model's categorical_crossentropy loss consumes
Y_train = to_categorical(train_label_ids, dtype='int64')
Y_test = to_categorical(test_label_ids, dtype='int64')

# Train and evaluate the model

In [17]:
#invoke the function for our model design
# X_train is passed only so that design_model can read its column count and
# size the input layer accordingly.
# NOTE(review): no random seed is set in the visible cells, so the initial
# weights - and therefore the reported metrics - presumably vary between runs;
# confirm whether reproducibility is required.
model = design_model(X_train)

In [19]:
#train and evaluate the model
model.fit(X_train, Y_train, epochs=100, batch_size=16, verbose=1)

# evaluate on the held-out split; the two returned values are unpacked as the
# loss and the accuracy metric
loss, acc = model.evaluate(X_test, Y_test, verbose=0)

# generate classification report
# predictions and one-hot labels are both collapsed back to class indices
y_estimate = np.argmax(model.predict(X_test), axis=1)
y_true = np.argmax(Y_test, axis=1)

# summary() prints the layer table itself and returns None, so it is called
# directly: wrapping it in print() emits an extra "None" line after the table
model.summary()

print('Accuracy: ', acc)

print(classification_report(y_true, y_estimate))


Epoch 1/100
Epoch 2/100
Epoch 3/100
Epoch 4/100
Epoch 5/100
Epoch 6/100
Epoch 7/100
Epoch 8/100
Epoch 9/100
Epoch 10/100
Epoch 11/100
Epoch 12/100
Epoch 13/100
Epoch 14/100
Epoch 15/100
Epoch 16/100
Epoch 17/100
Epoch 18/100
Epoch 19/100
Epoch 20/100
Epoch 21/100
Epoch 22/100
Epoch 23/100
Epoch 24/100
Epoch 25/100
Epoch 26/100
Epoch 27/100
Epoch 28/100
Epoch 29/100
Epoch 30/100
Epoch 31/100
Epoch 32/100
Epoch 33/100
Epoch 34/100
Epoch 35/100
Epoch 36/100
Epoch 37/100
Epoch 38/100
Epoch 39/100
Epoch 40/100
Epoch 41/100
Epoch 42/100
Epoch 43/100
Epoch 44/100
Epoch 45/100
Epoch 46/100
Epoch 47/100
Epoch 48/100
Epoch 49/100
Epoch 50/100
Epoch 51/100
Epoch 52/100
Epoch 53/100
Epoch 54/100
Epoch 55/100
Epoch 56/100
Epoch 57/100
Epoch 58/100
Epoch 59/100
Epoch 60/100
Epoch 61/100
Epoch 62/100
Epoch 63/100
Epoch 64/100
Epoch 65/100
Epoch 66/100
Epoch 67/100
Epoch 68/100
Epoch 69/100
Epoch 70/100
Epoch 71/100
Epoch 72/100
Epoch 73/100
Epoch 74/100
Epoch 75/100
Epoch 76/100
Epoch 77/100
Epoch 78/100
Epoch 79/100
Epoch 80/100
Epoch 81/100
Epoch 82/100
Epoch 83/100
Epoch 84/100
Epoch 85/100
Epoch 86/100
Epoch 87/100
Epoch 88/100
Epoch 89/100
Epoch 90/100
Epoch 91/100
Epoch 92/100
Epoch 93/100
Epoch 94/100
Epoch 95/100
Epoch 96/100
Epoch 97/100
Epoch 98/100
Epoch 99/100
Epoch 100/100
Model: "Heart_Failure_Prediction"
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
dense (Dense)                (None, 12)                216       
_________________________________________________________________
dense_1 (Dense)              (None, 2)                 26        
Total params: 242
Trainable params: 242
Non-trainable params: 0
_________________________________________________________________
None
Accuracy:  0.7555555701255798
              precision    recall  f1-score   support

           0       0.80      0.85      0.83        62
           1       0.62      0.54      0.58        28

    accuracy                           0.76        90
   macro avg      