# MI_FCHD - Neural Network

In [1]:
# Set the seed value for the notebook so the results are reproducible
from numpy.random import seed
seed(49)

In [2]:
# Dependencies
import numpy as np
import pandas as pd
import tensorflow
tensorflow.keras.__version__

'2.4.0'

In [3]:
df = pd.read_csv("Resources/MI_final_data.csv")
df.head()

Unnamed: 0,RANDID,SEX,TOTCHOL,AGE,SYSBP,DIABP,CURSMOKE,CIGPDAY,BMI,DIABETES,...,PREVMI,PREVSTRK,PREVHYP,TIME,PERIOD,DEATH,HOSPMI,MI_FCHD,TIMEMI,TIMEMIFC
0,2448,1,195.0,39,106.0,70.0,0,0.0,26.97,0,...,0,0,0,0,1,0,1,1,6438,6438
1,6238,2,250.0,46,121.0,81.0,0,0.0,28.73,0,...,0,0,0,0,1,0,0,0,8766,8766
2,9428,1,245.0,48,127.5,80.0,1,20.0,25.34,0,...,0,0,0,0,1,0,0,0,8766,8766
3,10552,2,225.0,61,150.0,95.0,1,30.0,28.58,0,...,0,0,1,0,1,1,0,0,2956,2956
4,11252,2,285.0,46,130.0,84.0,1,23.0,23.1,0,...,0,0,0,0,1,0,0,0,8766,8766


## Data Preprocessing

In [4]:
mi_fchd_df = df.set_index('RANDID')
#Remove columns not involved in analysis
mi_fchd_df = mi_fchd_df[['SEX', 'TOTCHOL', 'AGE', 'SYSBP', 'DIABP', 'CURSMOKE',
       'CIGPDAY', 'BMI', 'DIABETES', 'BPMEDS', 'HEARTRTE', 'GLUCOSE',
       'PREVCHD', 'PREVAP', 'PREVSTRK', 'PREVHYP', 'MI_FCHD']]
mi_fchd_df.head()

Unnamed: 0_level_0,SEX,TOTCHOL,AGE,SYSBP,DIABP,CURSMOKE,CIGPDAY,BMI,DIABETES,BPMEDS,HEARTRTE,GLUCOSE,PREVCHD,PREVAP,PREVSTRK,PREVHYP,MI_FCHD
RANDID,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1
2448,1,195.0,39,106.0,70.0,0,0.0,26.97,0,0.0,80.0,77.0,0,0,0,0,1
6238,2,250.0,46,121.0,81.0,0,0.0,28.73,0,0.0,95.0,76.0,0,0,0,0,0
9428,1,245.0,48,127.5,80.0,1,20.0,25.34,0,0.0,75.0,70.0,0,0,0,0,0
10552,2,225.0,61,150.0,95.0,1,30.0,28.58,0,0.0,65.0,103.0,0,0,0,1,0
11252,2,285.0,46,130.0,84.0,1,23.0,23.1,0,0.0,85.0,85.0,0,0,0,0,0


In [5]:
X = mi_fchd_df.drop("MI_FCHD", axis=1)
y = mi_fchd_df["MI_FCHD"]
target_names = ["negative", "positive"]
print(X.shape, y.shape)

(3847, 16) (3847,)


In [6]:
from sklearn.model_selection import train_test_split
from sklearn.preprocessing import LabelEncoder, MinMaxScaler
from tensorflow.keras.utils import to_categorical

X_train, X_test, y_train, y_test = train_test_split(X, y, random_state=1)
X_scaler = MinMaxScaler().fit(X_train)
X_train_scaled = X_scaler.transform(X_train)
X_test_scaled = X_scaler.transform(X_test)


# Step 1: Label-encode data set
label_encoder = LabelEncoder()
label_encoder.fit(y_train)
encoded_y_train = label_encoder.transform(y_train)
encoded_y_test = label_encoder.transform(y_test)

# Step 2: Convert encoded labels to one-hot-encoding
y_train_categorical = to_categorical(encoded_y_train)
y_test_categorical = to_categorical(encoded_y_test)

## Create neural net model

In [7]:
from tensorflow.keras.models import Sequential
from tensorflow.keras.layers import Dense

# Create a Neural Network model here
model = Sequential()
model.add(Dense(units=100, activation='relu', input_dim=16))
model.add(Dense(units=2, activation='softmax'))

In [8]:
model.summary()

Model: "sequential"
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
dense (Dense)                (None, 100)               1700      
_________________________________________________________________
dense_1 (Dense)              (None, 2)                 202       
Total params: 1,902
Trainable params: 1,902
Non-trainable params: 0
_________________________________________________________________


In [9]:
# Compile the model
model.compile(optimizer='adam',
              loss='categorical_crossentropy',
              metrics=['accuracy'])

# Fit the model to the training data
model.fit(
    X_train_scaled,
    y_train_categorical,
    epochs=100,
    shuffle=True,
    verbose=2,
    batch_size = 1
)

Epoch 1/100
2885/2885 - 1s - loss: 0.4105 - accuracy: 0.8423
Epoch 2/100
2885/2885 - 1s - loss: 0.3911 - accuracy: 0.8482
Epoch 3/100
2885/2885 - 1s - loss: 0.3832 - accuracy: 0.8447
Epoch 4/100
2885/2885 - 1s - loss: 0.3815 - accuracy: 0.8496
Epoch 5/100
2885/2885 - 1s - loss: 0.3786 - accuracy: 0.8492
Epoch 6/100
2885/2885 - 1s - loss: 0.3770 - accuracy: 0.8475
Epoch 7/100
2885/2885 - 1s - loss: 0.3755 - accuracy: 0.8485
Epoch 8/100
2885/2885 - 1s - loss: 0.3721 - accuracy: 0.8492
Epoch 9/100
2885/2885 - 1s - loss: 0.3742 - accuracy: 0.8489
Epoch 10/100
2885/2885 - 1s - loss: 0.3716 - accuracy: 0.8489
Epoch 11/100
2885/2885 - 1s - loss: 0.3728 - accuracy: 0.8506
Epoch 12/100
2885/2885 - 1s - loss: 0.3718 - accuracy: 0.8482
Epoch 13/100
2885/2885 - 1s - loss: 0.3696 - accuracy: 0.8523
Epoch 14/100
2885/2885 - 1s - loss: 0.3681 - accuracy: 0.8520
Epoch 15/100
2885/2885 - 1s - loss: 0.3685 - accuracy: 0.8492
Epoch 16/100
2885/2885 - 1s - loss: 0.3677 - accuracy: 0.8534
Epoch 17/100
2885

<tensorflow.python.keras.callbacks.History at 0x260c81e7c88>

In [10]:
model_loss, model_accuracy = model.evaluate(
    X_test_scaled, y_test_categorical, verbose=2, batch_size=1)
print(
    f"Normal Neural Network - Loss: {model_loss}, Accuracy: {model_accuracy}")

962/962 - 0s - loss: 0.4610 - accuracy: 0.8337
Normal Neural Network - Loss: 0.4609621465206146, Accuracy: 0.8336798548698425


## Deep Learning Model

In [16]:
# Create a deep learning model with an extra hidden layer of 6 nodes called `deep_model`
deep_model = Sequential()
deep_model.add(Dense(units=100, activation='relu', input_dim=16))
deep_model.add(Dense(units=20, activation='relu'))
deep_model.add(Dense(units=2, activation='softmax'))

In [17]:
deep_model.summary()

Model: "sequential_2"
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
dense_5 (Dense)              (None, 100)               1700      
_________________________________________________________________
dense_6 (Dense)              (None, 20)                2020      
_________________________________________________________________
dense_7 (Dense)              (None, 2)                 42        
Total params: 3,762
Trainable params: 3,762
Non-trainable params: 0
_________________________________________________________________


In [18]:
# Compile and fit the deep_model
deep_model.compile(optimizer='adam',
                   loss='categorical_crossentropy',
                   metrics=['accuracy'])

deep_model.fit(
    X_train_scaled,
    y_train_categorical,
    epochs=100,
    shuffle=True,
    verbose=2,
    batch_size=1
)

Epoch 1/100
2885/2885 - 1s - loss: 0.4160 - accuracy: 0.8454
Epoch 2/100
2885/2885 - 1s - loss: 0.3916 - accuracy: 0.8454
Epoch 3/100
2885/2885 - 1s - loss: 0.3851 - accuracy: 0.8464
Epoch 4/100
2885/2885 - 1s - loss: 0.3797 - accuracy: 0.8464
Epoch 5/100
2885/2885 - 1s - loss: 0.3805 - accuracy: 0.8475
Epoch 6/100
2885/2885 - 1s - loss: 0.3769 - accuracy: 0.8461
Epoch 7/100
2885/2885 - 1s - loss: 0.3760 - accuracy: 0.8478
Epoch 8/100
2885/2885 - 1s - loss: 0.3731 - accuracy: 0.8485
Epoch 9/100
2885/2885 - 1s - loss: 0.3720 - accuracy: 0.8492
Epoch 10/100
2885/2885 - 1s - loss: 0.3711 - accuracy: 0.8496
Epoch 11/100
2885/2885 - 1s - loss: 0.3674 - accuracy: 0.8506
Epoch 12/100
2885/2885 - 1s - loss: 0.3718 - accuracy: 0.8492
Epoch 13/100
2885/2885 - 1s - loss: 0.3678 - accuracy: 0.8516
Epoch 14/100
2885/2885 - 1s - loss: 0.3689 - accuracy: 0.8489
Epoch 15/100
2885/2885 - 1s - loss: 0.3664 - accuracy: 0.8503
Epoch 16/100
2885/2885 - 1s - loss: 0.3683 - accuracy: 0.8510
Epoch 17/100
2885

<tensorflow.python.keras.callbacks.History at 0x260c9b38358>

In [19]:
model_loss, model_accuracy = deep_model.evaluate(
    X_test_scaled, y_test_categorical, verbose=2, batch_size=1)
print(f"Deep Neural Network - Loss: {model_loss}, Accuracy: {model_accuracy}")

962/962 - 0s - loss: 0.6488 - accuracy: 0.8316
Deep Neural Network - Loss: 0.6487565040588379, Accuracy: 0.8316008448600769
