In [1]:
import numpy as np
from sklearn.metrics import accuracy_score, confusion_matrix

In [2]:
def sigmoid(x):
    """Logistic function ``1 / (1 + exp(-x))``, evaluated without overflow.

    The textbook formula calls ``exp(-x)``, which overflows (and makes NumPy
    emit a RuntimeWarning) once ``x`` drops below roughly -709. Here the
    exponential is only ever taken of a non-positive number, so it stays in
    ``(0, 1]`` for every finite input.

    Parameters
    ----------
    x : scalar or array-like of numbers
        Pre-activation value(s).

    Returns
    -------
    NumPy scalar or ndarray
        Element-wise sigmoid of ``x``; a scalar input gives a scalar result,
        an array input gives an array of the same shape.
    """
    x = np.asarray(x)
    # exp(-|x|) is at most 1, so neither expression below can overflow.
    decay = np.exp(-np.abs(x))
    # x >= 0:  1 / (1 + e^-x)
    # x <  0:  e^x / (1 + e^x)   (the same function, rearranged)
    result = np.where(x >= 0, 1 / (1 + decay), decay / (1 + decay))
    # Indexing with an empty tuple unwraps a 0-d array into a NumPy scalar
    # and leaves arrays of any other rank as they are.
    return result[()]

def sigmoid_derivative(x):
    """Return ``x * (1 - x)``: the sigmoid's slope written in terms of its output.

    Note that ``x`` is expected to be a value the sigmoid has *already
    produced* (an activation), not the raw pre-activation input. For
    ``s = sigmoid(z)`` the derivative with respect to ``z`` is ``s * (1 - s)``,
    which is exactly what this computes when given ``s``.

    Works element-wise on NumPy arrays as well as on plain numbers.
    """
    activation = x
    complement = 1 - activation
    return activation * complement

class MLP:
    """Multi-layer perceptron with one hidden layer and sigmoid activations.

    Training is plain full-batch gradient descent: every epoch runs one
    forward pass over all samples followed by one weight update.

    Parameters
    ----------
    input_size : int
        Number of input features per sample.
    hidden_size : int
        Number of units in the hidden layer.
    output_size : int
        Number of output units.
    lr : float, default 0.1
        Learning rate applied to every weight and bias update.
    epochs : int, default 10000
        Number of full passes over the data performed by :meth:`train`.
    seed : int or None, default None
        Seed for the weight initialisation. ``None`` draws from NumPy's
        global random state (so ``np.random.seed`` still controls it); an
        integer gives this instance its own generator and therefore the same
        initial weights on every construction.
    """

    def __init__(self, input_size, hidden_size, output_size, lr=0.1, epochs=10000, seed=None):
        self.input_size = input_size
        self.hidden_size = hidden_size
        self.output_size = output_size
        self.lr = lr
        self.epochs = epochs

        # The ``np.random`` module and a RandomState instance both expose
        # ``randn``, so either can act as the source of the initial weights.
        rng = np.random if seed is None else np.random.RandomState(seed)

        # Weights start as standard-normal draws, biases start at zero.
        # Biases are kept as (1, n) rows so they broadcast over the batch axis.
        self.weights_input_hidden = rng.randn(self.input_size, self.hidden_size)
        self.bias_hidden = np.zeros((1, self.hidden_size))
        self.weights_hidden_output = rng.randn(self.hidden_size, self.output_size)
        self.bias_output = np.zeros((1, self.output_size))

    def forward(self, X):
        """Run the network on ``X`` and return the output activations.

        ``X`` is a batch of shape ``(n_samples, input_size)``. The
        intermediate values are stored on the instance because
        :meth:`backward` reads ``self.hidden_output``.

        Returns an array of shape ``(n_samples, output_size)``.
        """
        self.hidden_input = np.dot(X, self.weights_input_hidden) + self.bias_hidden
        self.hidden_output = sigmoid(self.hidden_input)
        self.final_input = np.dot(self.hidden_output, self.weights_hidden_output) + self.bias_output
        self.final_output = sigmoid(self.final_input)
        return self.final_output

    def backward(self, X, y, output):
        """Apply one gradient-descent update for the batch ``(X, y)``.

        Must be called right after :meth:`forward` on the same ``X``, since it
        relies on the ``self.hidden_output`` cached by that call.

        Parameters
        ----------
        X : array-like, shape (n_samples, input_size)
            Inputs that produced ``output``.
        y : array-like, shape (n_samples, output_size)
            Targets. A flat ``(n_samples,)`` vector is also accepted when the
            network has a single output unit.
        output : ndarray, shape (n_samples, output_size)
            Value returned by ``forward(X)``.
        """
        X = np.asarray(X)
        y = np.asarray(y)
        if y.ndim == 1 and self.output_size == 1:
            # A flat label vector would broadcast against the (n, 1) output
            # into an (n, n) matrix; make it a column so the subtraction is
            # element-wise.
            y = y.reshape(-1, 1)

        # ``error`` is (target - prediction), so the deltas below point in the
        # direction that reduces the squared error; that is why the updates
        # use ``+=``.
        error = y - output
        output_gradient = error * sigmoid_derivative(output)
        # Propagate the output deltas back through the weights as they were
        # during the forward pass (i.e. before they are updated below).
        hidden_error = output_gradient.dot(self.weights_hidden_output.T)
        hidden_gradient = hidden_error * sigmoid_derivative(self.hidden_output)

        # Update weights and biases (contributions are summed over the batch)
        self.weights_hidden_output += self.hidden_output.T.dot(output_gradient) * self.lr
        self.bias_output += np.sum(output_gradient, axis=0, keepdims=True) * self.lr
        self.weights_input_hidden += X.T.dot(hidden_gradient) * self.lr
        self.bias_hidden += np.sum(hidden_gradient, axis=0, keepdims=True) * self.lr

    def train(self, X, y):
        """Fit the network to ``(X, y)`` by running ``self.epochs`` full-batch updates.

        Modifies the weights and biases in place and returns ``None``.
        """
        for _ in range(self.epochs):
            output = self.forward(X)
            self.backward(X, y, output)

    def predict(self, X):
        """Return the network output for ``X`` rounded to the nearest integer.

        Because the output layer is a sigmoid, the result is an array of
        ``0.`` / ``1.`` floats with shape ``(n_samples, output_size)``.
        """
        return np.round(self.forward(X))

In [3]:
# XOR truth table: one row per input pair, labels kept as a column vector
X = np.array([[0, 0], [0, 1], [1, 0], [1, 1]])
# Label = first input XOR second input; list-indexing keeps the result 2-D (4, 1)
y = X[:, [0]] ^ X[:, [1]]

In [4]:
# Train the MLP for XOR
# Seed NumPy's global RNG first: MLP draws its initial weights from it, so
# without a fixed seed every Restart & Run All starts from different weights
# and may end up with a different trained network.
np.random.seed(42)
mlp = MLP(input_size=2, hidden_size=4, output_size=1, lr=0.1, epochs=10000)
mlp.train(X, y)

In [5]:
# Hard 0/1 predictions of the trained network on the four XOR inputs
predictions = mlp.predict(X)
print("Predictions for XOR:", predictions, sep="\n")

Predictions for XOR:
[[0.]
 [1.]
 [1.]
 [0.]]


In [6]:
# Evaluation metrics: compare the predictions with the true XOR labels.
# Note these are the same four points the network was trained on.
accuracy = accuracy_score(y, predictions)
conf_matrix = confusion_matrix(y, predictions)
print(f"Accuracy: {accuracy}")
print(f"Confusion Matrix:\n {conf_matrix}")

Accuracy: 1.0
Confusion Matrix:
 [[2 0]
 [0 2]]
