In [115]:
import time
import numpy as np
import h5py
import matplotlib.pyplot as plt
import scipy
from PIL import Image
from scipy import ndimage
from dnn_app_utils_v4 import *
from sklearn.model_selection import train_test_split

In [117]:
data = np.load('heart_convert.npy')
data.shape

(918, 12)

In [102]:
X = data[:, :11]
Y = data[:, 11]

In [103]:
X_train,X_test,y_train,y_test = train_test_split(X,Y,test_size=0.2,stratify=Y,random_state=123)
Y_train = np.expand_dims(y_train,axis=1)
Y_test = np.expand_dims(y_test,axis=1)
X_train, X_test, Y_train, Y_test = X_train.T, X_test.T, Y_train.T, Y_test.T

In [104]:
print("Training X: ",X_train.shape)
print("Training Y: ",Y_train.shape)
print("Testing X: ",X_test.shape)
print("Testing Y: ",Y_test.shape)

Training X:  (11, 734)
Training Y:  (1, 734)
Testing X:  (11, 184)
Testing Y:  (1, 184)


In [110]:
def init_parameters(layers_dims):
    np.random.seed(3)
    L = len(layers_dims)
    parameters = {}
    for l in range(1,L):
        parameters["W" + str(l)] = np.random.randn(layers_dims[l],layers_dims[l-1])*np.sqrt(2/layers_dims[l-1])
        parameters["b" + str(l)] = np.zeros((layers_dims[l],1))
    return parameters
def sigmoid(Z):
    A = 1/(1+np.exp(-Z))
    return A,Z
def relu(Z):
    A = np.maximum(0,Z)
    return A,Z
def calc_ffw(W,A_prev,b,activation):
    if activation == "sigmoid":
        Z = np.dot(W,A_prev) + b
        A,Z = sigmoid(Z)
    else:
        Z = np.dot(W,A_prev) + b
        A,Z = relu(Z)
    linear_cache = (A_prev,W,b)
    activation_cache = Z
    cache = (linear_cache, activation_cache)
    return A,cache
def L_model_forward(X,parameters):
    L = len(parameters)//2
    caches = []
    A = X
    for l in range(1,L):
        A_prev = A
        A,cache = calc_ffw(parameters["W"+str(l)],A_prev,parameters["b"+str(l)],"relu")
        caches.append(cache)
    AL,cache = calc_ffw(parameters["W"+str(L)],A,parameters["b"+str(L)],"sigmoid")
    caches.append(cache)
    return AL, caches
def compute_cost(AL,Y,parameters,lamb):
    m = AL.shape[1]
    cross_entropy_cost = -1./m*(np.dot(Y,np.log(AL).T) + np.dot((1-Y),np.log(1-AL).T))
    sum_W = 0
    for l in range(1,len(parameters)//2+1):
        sum_W += np.sum(np.square(parameters["W"+str(l)]))
    L2_regularization_cost =  sum_W* 1./m * lamb/2
    cost = np.squeeze(cross_entropy_cost + L2_regularization_cost)  
    return cost
def sigmoid_grad(dA,Z):
    A,Z = sigmoid(Z)
    dZ = dA*A*(1-A)
    return dZ
def relu_grad(dA,Z):
    A,Z = relu(Z)
    dZ = np.multiply(dA, np.int64(A > 0))
    return dZ
def linear_backward(dZ,cache,lamb):
    A_prev, W, b = cache
    m = A_prev.shape[1] 
    dW = 1./m*np.dot(dZ,A_prev.T) + lamb/m*W
    db = 1./m*np.sum(dZ,axis=1,keepdims=True)
    dA_prev = np.dot(W.T,dZ)
    return dA_prev,dW,db
def linear_activation_backward(dA,cache,activation,lamb):
    linear_cache, activation_cache = cache
    if activation == "relu":
        dZ = relu_grad(dA,activation_cache)
        dA_prev,dW,db = linear_backward(dZ,linear_cache,lamb)
    elif activation == "sigmoid":
        dZ = sigmoid_grad(dA,activation_cache)
        dA_prev,dW,db = linear_backward(dZ,linear_cache,lamb)
    return dA_prev,dW,db
def L_model_backward(AL, Y, caches,lamb):
    grads = {}
    L = len(caches)
    Y = Y.reshape(AL.shape)
    dAL = np.divide(AL - Y, np.multiply(AL, 1 - AL))

    current_cache = caches[-1]
    grads["dA" + str(L-1)], grads["dW" + str(L)], grads["db" + str(L)] = linear_activation_backward(dAL,current_cache, activation = "sigmoid",lamb=lamb)

    for l in reversed(range(L-1)):
        current_cache = caches[l]
        dA_prev_temp, dW_temp, db_temp = linear_activation_backward(grads["dA" + str(l + 1)],  current_cache, activation = "relu", lamb=lamb)
        grads["dA" + str(l)] = dA_prev_temp
        grads["dW" + str(l + 1)] = dW_temp
        grads["db" + str(l + 1)] = db_temp
    return grads
def update_parameters(parameters, grads, lr):
    L = len(parameters)//2
    for l in range(L):
        parameters["W" + str(l+1)] = parameters["W" + str(l+1)]-lr*grads["dW" + str(l+1)]
        parameters["b" + str(l+1)] = parameters["b" + str(l+1)]-lr*grads["db" + str(l+1)]
    return parameters
def predict(X,Y,parameters):
    AL,cache =  L_model_forward(X,parameters)
    return np.round(AL)


In [111]:
def model(X,Y,X_test,y_test,num_iterations, learning_rate, lamb,print_cost=False):
    np.random.seed(3)
    input_size = X.shape[0]
    layer_dims = []
    layer_dims.append(input_size)
    layer_dims.append(16)
    #layer_dims.append(8)
    layer_dims.append(4)
    layer_dims.append(1)
    parameters = init_parameters(layer_dims)
    #return parameters
    costs = []
    for i in range(num_iterations):
        AL, caches = L_model_forward(X,parameters)
        cost = compute_cost(AL, Y,parameters,lamb=lamb)
        costs.append(cost)
        grads = L_model_backward(AL,Y,caches,lamb=lamb)
        parameters = update_parameters(parameters,grads,learning_rate)
        if print_cost and i % 1000 == 0:
            print ("Cost after iteration %i: %f" %(i, cost))
    Y_train_pred = predict(X,Y,parameters)
    Y_test_pred = predict(X_test,y_test,parameters)
    print("train accuracy: {} %".format(100 - np.mean(np.abs(Y_train_pred - Y)) * 100))
    print("test accuracy: {} %".format(100 - np.mean(np.abs(Y_test_pred - y_test)) * 100))
    return parameters,costs

In [112]:
input_size = X_train.shape[0]
input_size
print(Y_train.shape[1])

734


In [113]:

parameters,costs = model(X_train,Y_train,X_test,Y_test,15000,0.01,0.9,True)

  cross_entropy_cost = -1./m*(np.dot(Y,np.log(AL).T) + np.dot((1-Y),np.log(1-AL).T))
  dAL = np.divide(AL - Y, np.multiply(AL, 1 - AL))
  dAL = np.divide(AL - Y, np.multiply(AL, 1 - AL))
  dZ = dA*A*(1-A)


Cost after iteration 0: nan
Cost after iteration 1000: nan
Cost after iteration 2000: nan
Cost after iteration 3000: nan
Cost after iteration 4000: nan
Cost after iteration 5000: nan
Cost after iteration 6000: nan
Cost after iteration 7000: nan
Cost after iteration 8000: nan
Cost after iteration 9000: nan
Cost after iteration 10000: nan
Cost after iteration 11000: nan
Cost after iteration 12000: nan
Cost after iteration 13000: nan
Cost after iteration 14000: nan
train accuracy: nan %
test accuracy: nan %


In [77]:
pred_train = predict(train_x, train_y, parameters)

NameError: name 'train_x' is not defined

In [None]:
pred_test = predict(test_x, test_y, parameters)