In [1]:
import numpy as np

class NeuralNetwork:
    """Two-layer fully connected network with sigmoid activations.

    The network maps ``input_size`` features through one hidden layer of
    ``hidden_size`` sigmoid units to ``output_size`` sigmoid outputs and is
    trained with full-batch gradient descent.

    Attributes:
        W1, b1: Weights ``(input_size, hidden_size)`` and biases
            ``(1, hidden_size)`` of the hidden layer.
        W2, b2: Weights ``(hidden_size, output_size)`` and biases
            ``(1, output_size)`` of the output layer.
        z1, a1, z2, a2: Pre-activations and activations cached by the most
            recent call to :meth:`forward`; :meth:`backward` reads them.
    """

    def __init__(self, input_size, hidden_size, output_size, seed=None):
        """Create the network with random-normal weights and zero biases.

        Args:
            input_size: Number of input features.
            hidden_size: Number of hidden units.
            output_size: Number of output units.
            seed: Optional seed for reproducible weights. When ``None`` the
                weights are drawn from NumPy's global random state.
        """
        self.input_size = input_size
        self.hidden_size = hidden_size
        self.output_size = output_size
        # Without a seed keep drawing from the global generator so callers
        # that rely on np.random.seed() see exactly the same weights as before.
        rng = np.random if seed is None else np.random.RandomState(seed)
        self.W1 = rng.randn(input_size, hidden_size)
        self.b1 = np.zeros((1, hidden_size))
        self.W2 = rng.randn(hidden_size, output_size)
        self.b2 = np.zeros((1, output_size))

    def sigmoid(self, x):
        """Return the logistic function ``1 / (1 + exp(-x))`` element-wise."""
        # 1 / (1 + exp(-x)) == exp(-log(1 + exp(-x))). logaddexp evaluates the
        # log term without forming exp(-x) on its own, so large negative
        # inputs no longer overflow.
        return np.exp(-np.logaddexp(0.0, -x))

    def sigmoid_derivative(self, x):
        """Return the sigmoid derivative given the sigmoid *output*.

        Args:
            x: Values that are already sigmoid activations (e.g. ``self.a1``),
                not pre-activations.
        """
        return x * (1 - x)

    def forward(self, X):
        """Run a forward pass and cache the intermediate values.

        Args:
            X: Input array whose last dimension is ``input_size``.

        Returns:
            The output-layer activations ``self.a2``.
        """
        self.z1 = np.dot(X, self.W1) + self.b1
        self.a1 = self.sigmoid(self.z1)
        self.z2 = np.dot(self.a1, self.W2) + self.b2
        self.a2 = self.sigmoid(self.z2)
        return self.a2

    def backward(self, X, y, learning_rate):
        """Apply one gradient-descent step using the cached forward pass.

        :meth:`forward` must have been called on the same ``X`` beforehand.

        Args:
            X: Inputs that produced the cached activations.
            y: Targets with the same shape as ``self.a2``.
            learning_rate: Step size applied to every parameter.
        """
        m = X.shape[0]
        # NOTE: a2 - y is the gradient of binary cross-entropy with respect to
        # z2 for a sigmoid output; the MSE printed by train() is only a
        # monitoring metric, not the objective these gradients descend.
        dz2 = self.a2 - y
        dW2 = (1 / m) * np.dot(self.a1.T, dz2)
        db2 = (1 / m) * np.sum(dz2, axis=0, keepdims=True)
        # All gradients are computed before any parameter is modified, so dz1
        # uses the pre-update W2.
        dz1 = np.dot(dz2, self.W2.T) * self.sigmoid_derivative(self.a1)
        dW1 = (1 / m) * np.dot(X.T, dz1)
        db1 = (1 / m) * np.sum(dz1, axis=0, keepdims=True)

        self.W2 -= learning_rate * dW2
        self.b2 -= learning_rate * db2
        self.W1 -= learning_rate * dW1
        self.b1 -= learning_rate * db1

    def train(self, X, y, epochs, learning_rate):
        """Train on the full batch for ``epochs`` iterations.

        Every 100 epochs the mean squared error between ``y`` and the
        predictions made *before* that epoch's update is printed.

        Args:
            X: Training inputs.
            y: Training targets.
            epochs: Number of forward/backward iterations.
            learning_rate: Step size passed to :meth:`backward`.
        """
        for epoch in range(epochs):
            output = self.forward(X)
            self.backward(X, y, learning_rate)
            if epoch % 100 == 0:
                loss = np.mean(np.square(y - output))
                print(f'Epoch {epoch}, Loss: {loss}')

# Example usage: fit the network to the XOR truth table.
input_size, hidden_size, output_size = 2, 3, 1

# Every combination of two binary inputs, one pair per row.
X = np.array([[a, b] for a in (0, 1) for b in (0, 1)])
# XOR target for each row, shaped as a column to match the network output.
y = np.array([0, 1, 1, 0]).reshape(-1, 1)

model = NeuralNetwork(
    input_size=input_size,
    hidden_size=hidden_size,
    output_size=output_size,
)
model.train(X, y, learning_rate=0.1, epochs=1500)

# Evaluate on the same four input pairs the model was trained on.
print("\nTest the trained model:")
test_data = X.copy()
print("Input data:", test_data)
print("Predicted output:", model.forward(test_data))

Epoch 0, Loss: 0.2545923725233581
Epoch 100, Loss: 0.2513353259988125
Epoch 200, Loss: 0.2497902952055434
Epoch 300, Loss: 0.24843068796227058
Epoch 400, Loss: 0.24702675729589813
Epoch 500, Loss: 0.24539106828033425
Epoch 600, Loss: 0.24336039915032132
Epoch 700, Loss: 0.24079439066676886
Epoch 800, Loss: 0.2375795853998242
Epoch 900, Loss: 0.23363080277235287
Epoch 1000, Loss: 0.2288934154279842
Epoch 1100, Loss: 0.22335518200092613
Epoch 1200, Loss: 0.21706724465399435
Epoch 1300, Loss: 0.21016275467416973
Epoch 1400, Loss: 0.2028585531349319

Test the trained model:
Input data: [[0 0]
 [0 1]
 [1 0]
 [1 1]]
Predicted output: [[0.29574046]
 [0.45594846]
 [0.68195916]
 [0.54508688]]
