Neural Networks

In [1]:
import numpy as np
import matplotlib.pyplot as plt
import pandas as pd
from sklearn.metrics import confusion_matrix
from sklearn.neural_network import MLPClassifier
from numpy import random
from sklearn.model_selection import StratifiedKFold
from sklearn import preprocessing
from numpy import matlib
import qgrid
from sklearn.model_selection import train_test_split
from sklearn.metrics import roc_curve, roc_auc_score
from imblearn.metrics import geometric_mean_score
from sklearn.metrics import f1_score
from sklearn.metrics import plot_confusion_matrix

In [2]:
df = pd.read_excel('../data/CTG.xls', sheet_name='Raw Data', header=0, skiprows=[1])
data = df.to_numpy()
# Features matrix
X = data[:,0:22]
Y = data[:,23]

In [3]:
X_train, X_test, y_train, y_test = train_test_split(X, Y, random_state=0, stratify=Y, shuffle=True)

In [4]:
def redes_neuronales(neuronas, capas_ocultas):
    capas = capas_ocultas*(neuronas,)    
        
    Folds = 4
    random.seed(19680801)
    f1 = np.zeros(Folds)
    auc_fpr = np.zeros(Folds)
    gmean = np.zeros(Folds)

    skf = StratifiedKFold(n_splits=Folds)
    j = 0
    for train, test in skf.split(X, Y):
        Xtrain = X[train,:]
        Ytrain = Y[train]
        Xtest = X[test,:]
        Ytest = Y[test]
        
        #Se normalizan los datos
        media = np.mean(Xtrain)
        desvia = np.std(Xtrain)
        Xtrain = preprocessing.scale(Xtrain)
        Xtest = (Xtest - np.matlib.repmat(media, Xtest.shape[0], 1))/np.matlib.repmat(desvia, Xtest.shape[0], 1)
        
        #Llamado a la función para crear y entrenar el modelo usando los datos de entrenamiento
        mlp = MLPClassifier(hidden_layer_sizes=capas,activation = 'relu',max_iter=1000)
        mlp.fit(Xtrain,Ytrain)
        
        #Validación con las muestras de entrenamiento
        Ytrain_pred = mlp.predict(Xtrain)

        #Validación con las muestras de test    
        Yest = mlp.predict(Xtest)
        Y_pred =mlp.predict_proba(Xtest)
        #Evaluamos las predicciones del modelo con los datos de test
        auc_fpr[j] = roc_auc_score(Ytest, Y_pred, multi_class="ovr", average="weighted")
        gmean[j] =  geometric_mean_score(y_true = Ytest, y_pred=Yest, average="weighted")
        f1[j] = f1_score(y_true = Ytest, y_pred=Yest, average = "weighted")
        j += 1
    print("Modelo entrenado con " + str(neuronas) + " neuronas y con " + str(capas_ocultas) + " capas ocultas" + str(capas))
    return str(np.mean(f1)), str(np.std(f1)), str(np.mean(auc_fpr)), str(np.std(auc_fpr)), str(np.mean(gmean)), str(np.std(gmean))

In [5]:


df_types = pd.DataFrame({
    'N. de capas ocultas' : pd.Series([1,1,1,1,1,
                                       2,2,2,2,2,
                                       3,3,3,3,3,
                                       4,4,4,4,4,
                                       5,5,5,5,5]),
    
    'Neuronas por capa' : pd.Series([10,30,50,70,90,
                                    10,30,50,70,90,
                                    10,30,50,70,90,
                                    10,30,50,70,90,
                                    10,30,50,70,90])})
    df_types["F1_Score"] = ""
    df_types["IC F1"]= ""
    df_types["AUC"]= ""
    df_types["Gmean"]= ""
    df_types["IC Gmean"]= ""
df_types.set_index(['N. de capas ocultas','Neuronas por capa'], inplace=True)


In [6]:
for cap,neu in df_types.index:
    f1, stdf1, auc, stdAuc, gmean, stdgmean =redes_neuronales(neuronas=neu,capas_ocultas=cap)
    df_types["F1_Score"][cap,neu] = str(f1) 
    df_types["IC F1"][cap,neu] = str(stdf1)
    df_types["AUC"][cap,neu]= str(auc)
    df_types["Gmean"][cap,neu] = str(gmean)
    df_types["IC Gmean"][cap,neu] = str(stdgmean)
df_types



Modelo entrenado con 10 neuronas y con 1 capas ocultas(10,)


KeyError: 'F1_Score'

In [None]:
model = MLPClassifier(hidden_layer_sizes=(10,10),activation = 'relu',max_iter=500)

In [None]:
skf = StratifiedKFold(n_splits=4)
for train, test in skf.split(X, Y):
    Xtrain = X[train,:]
    Ytrain = Y[train]
    Xtest = X[test,:]
    Ytest = Y[test]

    #Se normalizan los datos
    media = np.mean(Xtrain)
    desvia = np.std(Xtrain)
    Xtrain = preprocessing.scale(Xtrain)
    Xtest = (Xtest - np.matlib.repmat(media, Xtest.shape[0], 1))/np.matlib.repmat(desvia, Xtest.shape[0], 1)
  

In [None]:
model.fit(Xtrain,Ytrain)

In [None]:
plot_confusion_matrix(model,X=Xtest, y_true=Ytest,normalize='true')