In [34]:
# Target variable Y: 0 = the client does not fall into arrears, 1 = the client falls into arrears.

In [35]:
import random

import numpy as np
import pandas as pd
import tensorflow as tf
from sklearn.model_selection import train_test_split
from sklearn.preprocessing import StandardScaler
from tensorflow.keras.layers import Dense, SimpleRNN
from tensorflow.keras.models import Sequential
from tensorflow.keras.optimizers import Adam
from tensorflow.keras.regularizers import l2

In [36]:
# Dense feed-forward classifier: load the data, split and scale it, train the
# network and report validation / test accuracy.

# Seed every random source used below. Without this, weight initialisation and
# batch shuffling change on each execution and the printed metrics cannot be
# reproduced (only the train/test split was seeded before).
SEED = 42
random.seed(SEED)
np.random.seed(SEED)
tf.random.set_seed(SEED)

# Load the raw data file.
df = pd.read_csv('dataset.csv')

# Drop the row labelled 0 before the numeric conversion.
# NOTE(review): the original author describes this row as a leftover header
# row -- confirm against dataset.csv.
data = df.drop(0)

# Cast every column to float.
data = data.astype(float)

# Features are every column except the first and the last; the target is "Y".
# NOTE(review): this assumes "Y" is the last column and that the first column
# is not a feature -- confirm, otherwise the target could leak into X.
X = data.iloc[:, 1:-1].values
Y = data["Y"].values

# Hold out 20 % of the rows as the test set.
X_train, X_test, Y_train, Y_test = train_test_split(
    X, Y, test_size=0.2, random_state=SEED
)

# Standardise the features; the scaler is fitted on the training rows only and
# then applied unchanged to the test rows.
scaler = StandardScaler()
X_train = scaler.fit_transform(X_train)
X_test = scaler.transform(X_test)

# Build the network: five L2-regularised ReLU layers and a sigmoid output for
# the binary target. The input width is declared with an explicit Input object
# rather than the legacy `input_dim=` argument on the first Dense layer.
n_features = X_train.shape[1]
model = Sequential([
    tf.keras.Input(shape=(n_features,)),
    Dense(128, activation='relu', kernel_regularizer=l2(0.01)),
    Dense(256, activation='relu', kernel_regularizer=l2(0.01)),
    Dense(128, activation='relu', kernel_regularizer=l2(0.01)),
    Dense(64, activation='relu', kernel_regularizer=l2(0.01)),
    Dense(32, activation='relu', kernel_regularizer=l2(0.01)),
    Dense(1, activation='sigmoid'),
])

# Compile the model.
model.compile(
    loss='binary_crossentropy',
    optimizer=Adam(learning_rate=0.001),
    metrics=['accuracy'],
)

# Train, keeping 20 % of the training rows aside for validation.
history = model.fit(
    X_train,
    Y_train,
    epochs=100,
    batch_size=128,
    validation_split=0.2,
    verbose=2,
)

# Highest validation accuracy reached in any epoch.
best_accuracy = max(history.history['val_accuracy'])
print(f'Mejor Accuracy en Validación: {best_accuracy:.4f}')

# Evaluate on the held-out test set. No checkpoint/early-stopping callback is
# used, so this scores the weights from the last epoch, which is not
# necessarily the epoch that produced the best validation accuracy above.
loss, accuracy = model.evaluate(X_test, Y_test)
print(f'Loss: {loss}, Accuracy: {accuracy}')

Epoch 1/100
150/150 - 3s - loss: 2.0788 - accuracy: 0.7876 - val_loss: 0.7072 - val_accuracy: 0.8035 - 3s/epoch - 21ms/step
Epoch 2/100
150/150 - 1s - loss: 0.5675 - accuracy: 0.8126 - val_loss: 0.5144 - val_accuracy: 0.8148 - 687ms/epoch - 5ms/step
Epoch 3/100
150/150 - 1s - loss: 0.5007 - accuracy: 0.8150 - val_loss: 0.4977 - val_accuracy: 0.8150 - 678ms/epoch - 5ms/step
Epoch 4/100
150/150 - 1s - loss: 0.4927 - accuracy: 0.8159 - val_loss: 0.4928 - val_accuracy: 0.8179 - 683ms/epoch - 5ms/step
Epoch 5/100
150/150 - 1s - loss: 0.4890 - accuracy: 0.8166 - val_loss: 0.4927 - val_accuracy: 0.8152 - 719ms/epoch - 5ms/step
Epoch 6/100
150/150 - 1s - loss: 0.4870 - accuracy: 0.8160 - val_loss: 0.4956 - val_accuracy: 0.8037 - 756ms/epoch - 5ms/step
Epoch 7/100
150/150 - 1s - loss: 0.4855 - accuracy: 0.8165 - val_loss: 0.4926 - val_accuracy: 0.8138 - 724ms/epoch - 5ms/step
Epoch 8/100
150/150 - 1s - loss: 0.4838 - accuracy: 0.8176 - val_loss: 0.4915 - val_accuracy: 0.8167 - 712ms/epoch - 5ms

In [39]:
# Second experiment: same data preparation, but the first layer is a SimpleRNN.
# Reuses `df`, which was loaded by the previous cell.

# Seed every random source again so this cell gives the same result regardless
# of how many models were trained before it in the same kernel.
SEED = 42
random.seed(SEED)
np.random.seed(SEED)
tf.random.set_seed(SEED)

# Drop the row labelled 0 before the numeric conversion.
# NOTE(review): the original author describes this row as a leftover header
# row -- confirm against dataset.csv.
data = df.drop(0)

# Cast every column to float.
data = data.astype(float)

# Features are every column except the first and the last; the target is "Y".
# NOTE(review): this assumes "Y" is the last column and that the first column
# is not a feature -- confirm, otherwise the target could leak into X.
X = data.iloc[:, 1:-1].values
Y = data["Y"].values

# Hold out 20 % of the rows as the test set.
X_train, X_test, Y_train, Y_test = train_test_split(
    X, Y, test_size=0.2, random_state=SEED
)

# Standardise the features; the scaler is fitted on the training rows only and
# then applied unchanged to the test rows.
scaler = StandardScaler()
X_train = scaler.fit_transform(X_train)
X_test = scaler.transform(X_test)

# Reshape to the 3-D layout the recurrent layer expects:
# (samples, time steps, features). Each row becomes a sequence of length 1
# because the data are independent feature vectors, not sequences.
n_features = X_train.shape[1]
X_train_rnn = X_train.reshape(X_train.shape[0], 1, n_features)
X_test_rnn = X_test.reshape(X_test.shape[0], 1, n_features)

# Build the network: an L2-regularised SimpleRNN followed by dense layers and
# a sigmoid output. The input shape is declared with an explicit Input object
# rather than the legacy `input_shape=` argument on the first layer.
# NOTE(review): with a single time step there is no sequence for the
# recurrence to act on, so this layer is expected to behave much like a Dense
# layer -- confirm whether an RNN is really intended here.
model = Sequential([
    tf.keras.Input(shape=(1, n_features)),
    SimpleRNN(128, activation='relu', kernel_regularizer=l2(0.01)),
    Dense(128, activation='relu', kernel_regularizer=l2(0.01)),
    Dense(64, activation='relu', kernel_regularizer=l2(0.01)),
    Dense(32, activation='relu', kernel_regularizer=l2(0.01)),
    Dense(1, activation='sigmoid'),
])

# Compile the model.
model.compile(
    loss='binary_crossentropy',
    optimizer=Adam(learning_rate=0.001),
    metrics=['accuracy'],
)

# Train, keeping 20 % of the training rows aside for validation.
history = model.fit(
    X_train_rnn,
    Y_train,
    epochs=100,
    batch_size=128,
    validation_split=0.2,
    verbose=2,
)

# Highest validation accuracy reached in any epoch.
best_accuracy = max(history.history['val_accuracy'])
print(f'Mejor Accuracy en Validación: {best_accuracy:.4f}')

# Evaluate on the held-out test set. No checkpoint/early-stopping callback is
# used, so this scores the weights from the last epoch, which is not
# necessarily the epoch that produced the best validation accuracy above.
loss, accuracy = model.evaluate(X_test_rnn, Y_test)
print(f'Loss: {loss}, Accuracy: {accuracy}')

Epoch 1/100
150/150 - 9s - loss: 1.6882 - accuracy: 0.7837 - val_loss: 0.7477 - val_accuracy: 0.8144 - 9s/epoch - 57ms/step
Epoch 2/100
150/150 - 2s - loss: 0.5843 - accuracy: 0.8115 - val_loss: 0.5172 - val_accuracy: 0.8104 - 2s/epoch - 10ms/step
Epoch 3/100
150/150 - 2s - loss: 0.4984 - accuracy: 0.8153 - val_loss: 0.4940 - val_accuracy: 0.8112 - 2s/epoch - 11ms/step
Epoch 4/100
150/150 - 2s - loss: 0.4865 - accuracy: 0.8144 - val_loss: 0.4932 - val_accuracy: 0.8154 - 2s/epoch - 10ms/step
Epoch 5/100
150/150 - 2s - loss: 0.4827 - accuracy: 0.8161 - val_loss: 0.4848 - val_accuracy: 0.8092 - 2s/epoch - 11ms/step
Epoch 6/100
150/150 - 2s - loss: 0.4798 - accuracy: 0.8166 - val_loss: 0.4847 - val_accuracy: 0.8156 - 2s/epoch - 11ms/step
Epoch 7/100
150/150 - 2s - loss: 0.4777 - accuracy: 0.8169 - val_loss: 0.4808 - val_accuracy: 0.8140 - 2s/epoch - 11ms/step
Epoch 8/100
150/150 - 2s - loss: 0.4763 - accuracy: 0.8174 - val_loss: 0.4879 - val_accuracy: 0.8177 - 2s/epoch - 11ms/step
Epoch 9/