# CVD - Neural Network

In [1]:
# Set the seed value for the notebook so the results are reproducible.
# Seeding NumPy alone is not sufficient here: the Keras layers built later
# in the notebook take their random initial weights from TensorFlow's own
# generator, so that (and Python's built-in generator) is seeded as well.
import random

import tensorflow
from numpy.random import seed

random.seed(49)
seed(49)
tensorflow.random.set_seed(49)

In [2]:
# Dependencies
import numpy as np
import pandas as pd
import tensorflow
# Last expression of the cell: displays the Keras version bundled with
# TensorFlow so the environment is recorded next to the results.
tensorflow.keras.__version__

'2.4.0'

In [3]:
# Read the CSV export into a DataFrame and preview its first five rows
df = pd.read_csv(filepath_or_buffer="Resources/cvd_period1_data.csv")
df.head(n=5)

Unnamed: 0,RANDID,SEX,TOTCHOL,AGE,SYSBP,DIABP,CURSMOKE,CIGPDAY,BMI,DIABETES,BPMEDS,HEARTRTE,GLUCOSE,PREVAP,PREVHYP,DEATH,CVD
0,2448,1,195.0,39,106.0,70.0,0,0.0,26.97,0,0.0,80.0,77.0,0,0,0,1
1,6238,2,250.0,46,121.0,81.0,0,0.0,28.73,0,0.0,95.0,76.0,0,0,0,0
2,9428,1,245.0,48,127.5,80.0,1,20.0,25.34,0,0.0,75.0,70.0,0,0,0,0
3,10552,2,225.0,61,150.0,95.0,1,30.0,28.58,0,0.0,65.0,103.0,0,1,1,1
4,11252,2,285.0,46,130.0,84.0,1,23.0,23.1,0,0.0,85.0,85.0,0,0,0,0


## Data Preprocessing

In [4]:
# Index the records by RANDID, then keep only the columns involved in the
# analysis: the predictor columns followed by the CVD target.
cvd_df = df.set_index('RANDID').loc[:, [
    'SEX', 'TOTCHOL', 'AGE', 'SYSBP', 'DIABP', 'CURSMOKE', 'CIGPDAY',
    'BMI', 'DIABETES', 'BPMEDS', 'HEARTRTE', 'GLUCOSE', 'PREVAP', 'PREVHYP',
    'CVD',
]]
cvd_df.head()

Unnamed: 0_level_0,SEX,TOTCHOL,AGE,SYSBP,DIABP,CURSMOKE,CIGPDAY,BMI,DIABETES,BPMEDS,HEARTRTE,GLUCOSE,PREVAP,PREVHYP,CVD
RANDID,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1
2448,1,195.0,39,106.0,70.0,0,0.0,26.97,0,0.0,80.0,77.0,0,0,1
6238,2,250.0,46,121.0,81.0,0,0.0,28.73,0,0.0,95.0,76.0,0,0,0
9428,1,245.0,48,127.5,80.0,1,20.0,25.34,0,0.0,75.0,70.0,0,0,0
10552,2,225.0,61,150.0,95.0,1,30.0,28.58,0,0.0,65.0,103.0,0,1,1
11252,2,285.0,46,130.0,84.0,1,23.0,23.1,0,0.0,85.0,85.0,0,0,0


In [6]:
# Separate the CVD target column from the remaining feature columns and
# report the shape of each.
y = cvd_df["CVD"]
X = cvd_df.drop(columns=["CVD"])
print(X.shape, y.shape)

(3730, 14) (3730,)


In [7]:
from sklearn.model_selection import train_test_split
from sklearn.preprocessing import LabelEncoder, MinMaxScaler
from tensorflow.keras.utils import to_categorical

# Hold out a test partition (scikit-learn's default split size); the fixed
# random_state keeps the same rows in each partition on every run.
X_train, X_test, y_train, y_test = train_test_split(X, y, random_state=1)

# Fit the min-max scaler on the training features only, then apply that same
# fitted scaling to both partitions.
X_scaler = MinMaxScaler()
X_scaler.fit(X_train)
X_train_scaled = X_scaler.transform(X_train)
X_test_scaled = X_scaler.transform(X_test)

# Step 1: Label-encode the targets, with the encoder fitted on the training labels
label_encoder = LabelEncoder().fit(y_train)
encoded_y_train = label_encoder.transform(y_train)
encoded_y_test = label_encoder.transform(y_test)

# Step 2: Expand the encoded labels into one-hot vectors
y_train_categorical = to_categorical(encoded_y_train)
y_test_categorical = to_categorical(encoded_y_test)

## Create neural net model

In [8]:
from tensorflow.keras.models import Sequential
from tensorflow.keras.layers import Dense

# Baseline network: 14 inputs -> one 100-unit ReLU hidden layer -> 2-unit
# softmax output, matching the two-column one-hot labels.
model = Sequential([
    Dense(units=100, activation='relu', input_dim=14),
    Dense(units=2, activation='softmax'),
])

In [9]:
# Print the layer-by-layer architecture and parameter counts of the baseline model
model.summary()

Model: "sequential"
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
dense (Dense)                (None, 100)               1500      
_________________________________________________________________
dense_1 (Dense)              (None, 2)                 202       
Total params: 1,702
Trainable params: 1,702
Non-trainable params: 0
_________________________________________________________________


In [10]:
# Configure training: Adam optimizer, categorical cross-entropy against the
# one-hot labels, and accuracy reported alongside the loss.
model.compile(
    loss='categorical_crossentropy',
    optimizer='adam',
    metrics=['accuracy'],
)

# Train on the scaled training features for 100 epochs with one sample per
# batch and shuffling enabled; verbose=2 logs one line per epoch.
model.fit(
    x=X_train_scaled,
    y=y_train_categorical,
    batch_size=1,
    epochs=100,
    verbose=2,
    shuffle=True,
)

Epoch 1/100
2797/2797 - 1s - loss: 0.5253 - accuracy: 0.7562
Epoch 2/100
2797/2797 - 1s - loss: 0.5052 - accuracy: 0.7622
Epoch 3/100
2797/2797 - 1s - loss: 0.4989 - accuracy: 0.7655
Epoch 4/100
2797/2797 - 1s - loss: 0.4964 - accuracy: 0.7630
Epoch 5/100
2797/2797 - 1s - loss: 0.4966 - accuracy: 0.7630
Epoch 6/100
2797/2797 - 1s - loss: 0.4926 - accuracy: 0.7640
Epoch 7/100
2797/2797 - 1s - loss: 0.4933 - accuracy: 0.7594
Epoch 8/100
2797/2797 - 1s - loss: 0.4931 - accuracy: 0.7587
Epoch 9/100
2797/2797 - 1s - loss: 0.4917 - accuracy: 0.7673
Epoch 10/100
2797/2797 - 1s - loss: 0.4903 - accuracy: 0.7619
Epoch 11/100
2797/2797 - 1s - loss: 0.4898 - accuracy: 0.7665
Epoch 12/100
2797/2797 - 1s - loss: 0.4892 - accuracy: 0.7601
Epoch 13/100
2797/2797 - 1s - loss: 0.4881 - accuracy: 0.7615
Epoch 14/100
2797/2797 - 1s - loss: 0.4896 - accuracy: 0.7622
Epoch 15/100
2797/2797 - 1s - loss: 0.4901 - accuracy: 0.7676
Epoch 16/100
2797/2797 - 1s - loss: 0.4870 - accuracy: 0.7619
Epoch 17/100
2797

<tensorflow.python.keras.callbacks.History at 0x232ffc572b0>

In [11]:
# Score the baseline network on the held-out test partition. With the single
# 'accuracy' metric compiled in, evaluate() yields the loss and the accuracy.
model_loss, model_accuracy = model.evaluate(
    x=X_test_scaled,
    y=y_test_categorical,
    batch_size=1,
    verbose=2,
)
print(f"Normal Neural Network - Loss: {model_loss}, Accuracy: {model_accuracy}")

933/933 - 0s - loss: 0.4948 - accuracy: 0.7771
Normal Neural Network - Loss: 0.49480628967285156, Accuracy: 0.777063250541687


## Deep Learning Model

In [12]:
# Create a deep learning model called `deep_model`: the same 14-input,
# 100-unit ReLU first layer and 2-unit softmax output as the baseline, with
# an extra hidden layer of 20 ReLU nodes in between.
deep_model = Sequential([
    Dense(units=100, activation='relu', input_dim=14),
    Dense(units=20, activation='relu'),
    Dense(units=2, activation='softmax'),
])

In [13]:
# Print the layer-by-layer architecture and parameter counts of the deeper model
deep_model.summary()

Model: "sequential_1"
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
dense_2 (Dense)              (None, 100)               1500      
_________________________________________________________________
dense_3 (Dense)              (None, 20)                2020      
_________________________________________________________________
dense_4 (Dense)              (None, 2)                 42        
Total params: 3,562
Trainable params: 3,562
Non-trainable params: 0
_________________________________________________________________


In [14]:
# Compile and fit the deep_model
deep_model.compile(optimizer='adam',
                   loss='categorical_crossentropy',
                   metrics=['accuracy'])

deep_model.fit(
    X_train_scaled,
    y_train_categorical,
    epochs=100,
    shuffle=True,
    verbose=2,
    batch_size=1
)

Epoch 1/100
2797/2797 - 2s - loss: 0.5234 - accuracy: 0.7562
Epoch 2/100
2797/2797 - 1s - loss: 0.5083 - accuracy: 0.7580
Epoch 3/100
2797/2797 - 2s - loss: 0.5009 - accuracy: 0.7633
Epoch 4/100
2797/2797 - 2s - loss: 0.5005 - accuracy: 0.7608
Epoch 5/100
2797/2797 - 3s - loss: 0.4942 - accuracy: 0.7615
Epoch 6/100
2797/2797 - 3s - loss: 0.4952 - accuracy: 0.7633
Epoch 7/100
2797/2797 - 3s - loss: 0.4939 - accuracy: 0.7630
Epoch 8/100
2797/2797 - 3s - loss: 0.4938 - accuracy: 0.7612
Epoch 9/100
2797/2797 - 2s - loss: 0.4911 - accuracy: 0.7594
Epoch 10/100
2797/2797 - 2s - loss: 0.4925 - accuracy: 0.7630
Epoch 11/100
2797/2797 - 2s - loss: 0.4910 - accuracy: 0.7615
Epoch 12/100
2797/2797 - 2s - loss: 0.4891 - accuracy: 0.7640
Epoch 13/100
2797/2797 - 2s - loss: 0.4902 - accuracy: 0.7630
Epoch 14/100
2797/2797 - 2s - loss: 0.4899 - accuracy: 0.7651
Epoch 15/100
2797/2797 - 2s - loss: 0.4887 - accuracy: 0.7608
Epoch 16/100
2797/2797 - 2s - loss: 0.4885 - accuracy: 0.7615
Epoch 17/100
2797

<tensorflow.python.keras.callbacks.History at 0x2328114a860>

In [15]:
# Score the deep network on the held-out test partition.
# NOTE: this rebinds model_loss / model_accuracy, replacing the baseline
# model's values stored under the same names.
model_loss, model_accuracy = deep_model.evaluate(
    x=X_test_scaled,
    y=y_test_categorical,
    batch_size=1,
    verbose=2,
)
print(f"Deep Neural Network - Loss: {model_loss}, Accuracy: {model_accuracy}")

933/933 - 0s - loss: 0.5527 - accuracy: 0.7663
Deep Neural Network - Loss: 0.5526836514472961, Accuracy: 0.7663451433181763
