In [1]:
import numpy as np

In [2]:
class MLP:
    def __init__(self, input_size, hidden_size, output_size):
        self.input_size = input_size
        self.hidden_size = hidden_size
        self.output_size = output_size

        # Initialize weights with random values
        self.W1 = np.random.randn(input_size, hidden_size)
        self.W2 = np.random.randn(hidden_size, output_size)

    def sigmoid(self, x):
        return 1 / (1 + np.exp(-x))

    def sigmoid_derivative(self, x):
        return x * (1 - x)

    def forward(self, X):
        self.hidden_layer = self.sigmoid(np.dot(X, self.W1))
        self.output_layer = self.sigmoid(np.dot(self.hidden_layer, self.W2))

    def backward(self, X, y, learning_rate):
        # Calculate the gradients
        output_error = y - self.output_layer
        output_delta = output_error * self.sigmoid_derivative(self.output_layer)
        hidden_error = output_delta.dot(self.W2.T)
        hidden_delta = hidden_error * self.sigmoid_derivative(self.hidden_layer)

        # Update the weights
        self.W2 -= self.hidden_layer.T.dot(output_delta) * learning_rate
        self.W1 -= X.T.dot(hidden_delta) * learning_rate

    def train(self, X, y, epochs=1000, learning_rate=0.01):
        for epoch in range(epochs):
            self.forward(X)
            self.backward(X, y, learning_rate)

    def predict(self, X):
        self.forward(X)
        return self.output_layer

In [3]:
# Training data
X = np.array([[0, 0], [0, 1], [1, 0], [1, 1]])
y = np.array([[0], [1], [1], [0]])

# Create an MLP object
mlp = MLP(input_size=2, hidden_size=4, output_size=1)

# Train the MLP
mlp.train(X, y, epochs=10000, learning_rate=0.1)

# Test the MLP
predictions = mlp.predict(X)
print(predictions)

[[1.71869322e-03]
 [1.76776254e-04]
 [2.29958558e-04]
 [3.84399413e-05]]
