In [None]:
# Import the necessary libraries
import numpy as np                              # For numerical computations
import pandas as pd                             # For handling datasets
from sklearn.model_selection import train_test_split # For splitting data into training and testing sets
from sklearn.feature_extraction.text import CountVectorizer # For converting text to numerical features
import scipy.sparse                             # For working with sparse matrices
from keras.models import Sequential             # For creating a neural network model
from keras.layers import Dense                  # For adding layers to the neural network
from sklearn.metrics import classification_report



# Load the dataset
dataset = pd.read_csv('fraud_email_.csv')

# Replace NaN values with empty strings (CountVectorizer cannot tokenize NaN)
dataset = dataset.fillna('')
X = dataset['Text'].values                       # Raw e-mail text
y = dataset['Class'].values                      # Target variable (label)

# Split the RAW text into training and testing sets (80% / 20%).
# - Shuffling (the default) avoids a biased test set when the CSV is ordered
#   by class; a plain positional slice would not.
# - stratify=y keeps the class ratio identical in both partitions.
# - random_state makes the split reproducible between runs.
text_train, text_test, y_train, y_test = train_test_split(
    X, y, test_size=0.2, random_state=42, stratify=y
)

# Kept for compatibility with code that reads these sizes later on
n_samples = len(X)
n_train = len(text_train)

# Convert the text to numerical features using a bag-of-words representation.
# The vocabulary is learned from the training texts only, so nothing about the
# test set leaks into the features; test texts are merely transformed.
vectorizer = CountVectorizer()
X_train = vectorizer.fit_transform(text_train)
X_test = vectorizer.transform(text_test)

# Sort the column indices of the sparse matrices in place before handing
# them to Keras
X_train.sort_indices()
X_test.sort_indices()


# Create the neural network model: two hidden ReLU layers and a sigmoid output
# for binary classification
model = Sequential()
model.add(Dense(units=16, activation='relu', input_dim=X_train.shape[1]))
model.add(Dense(units=8, activation='relu'))
model.add(Dense(units=1, activation='sigmoid'))
model.compile(optimizer='adam', loss='binary_crossentropy', metrics=['accuracy'])

# Train the model; the held-out set is passed as validation data only to
# monitor performance after each epoch
model.fit(X_train, y_train, batch_size=32, epochs=100, validation_data=(X_test, y_test))

# Test the model and get the classification report.
# predict() returns probabilities with shape (n, 1); threshold at 0.5 and
# flatten to a 1-D integer label vector, which is what the metrics expect.
y_pred = (model.predict(X_test) > 0.5).astype(int).ravel()
print(classification_report(y_test, y_pred))

# Evaluate the model with a confusion matrix
from sklearn.metrics import confusion_matrix
cm = confusion_matrix(y_test, y_pred)
print(cm)


Epoch 1/100
Epoch 2/100
Epoch 3/100
Epoch 4/100
Epoch 5/100
Epoch 6/100
Epoch 7/100
Epoch 8/100
Epoch 9/100
Epoch 10/100
Epoch 11/100
Epoch 12/100
Epoch 13/100
Epoch 14/100
Epoch 15/100
Epoch 16/100
Epoch 17/100
Epoch 18/100
Epoch 19/100
Epoch 20/100
Epoch 21/100
Epoch 22/100
Epoch 23/100
Epoch 24/100
Epoch 25/100
Epoch 26/100
Epoch 27/100
Epoch 28/100
Epoch 29/100
Epoch 30/100
Epoch 31/100
Epoch 32/100
Epoch 33/100
Epoch 34/100
Epoch 35/100
Epoch 36/100
Epoch 37/100
Epoch 38/100
Epoch 39/100
Epoch 40/100
Epoch 41/100
Epoch 42/100
Epoch 43/100
Epoch 44/100
Epoch 45/100
Epoch 46/100
Epoch 47/100
Epoch 48/100
Epoch 49/100
Epoch 50/100
Epoch 51/100
Epoch 52/100
Epoch 53/100
Epoch 54/100
Epoch 55/100
Epoch 56/100
Epoch 57/100
Epoch 58/100
Epoch 59/100
Epoch 60/100
Epoch 61/100
Epoch 62/100
Epoch 63/100
Epoch 64/100
Epoch 65/100
Epoch 66/100
Epoch 67/100
Epoch 68/100
Epoch 69/100
Epoch 70/100
Epoch 71/100
Epoch 72/100
Epoch 73/100
Epoch 74/100
Epoch 75/100
Epoch 76/100
Epoch 77/100
Epoch 78