# In [1]:
import numpy as np


class ANN:
    """Feed-forward network with one hidden layer and sigmoid activations.

    Both layers use the logistic sigmoid.  Training is full-batch: each call
    to ``backward`` adds ``learning_rate`` times the error signal summed over
    every row of the batch (the updates use ``np.dot`` / ``np.sum`` over the
    sample axis, not a mean).

    Attributes set by ``__init__``:
        weights_input_hidden: array of shape (input_size, hidden_size).
        weights_hidden_output: array of shape (hidden_size, output_size).
        bias_hidden: array of shape (1, hidden_size), initialised to zeros.
        bias_output: array of shape (1, output_size), initialised to zeros.

    Attributes set by ``forward`` (and read by ``backward``):
        hidden_activation, hidden_output, output_activation, predicted_output.
    """

    def __init__(self, input_size, hidden_size, output_size, seed=None):
        """Create the layers with standard-normal weights and zero biases.

        Args:
            input_size: number of input features.
            hidden_size: number of hidden units.
            output_size: number of output units.
            seed: optional seed (anything ``np.random.default_rng`` accepts)
                for reproducible weights.  When ``None`` the weights are
                drawn from NumPy's global RNG via ``np.random.randn``, so
                code that calls ``np.random.seed`` beforehand keeps working.
        """
        self.input_size = input_size
        self.hidden_size = hidden_size
        self.output_size = output_size

        # Initialize random weights & biases
        if seed is None:
            self.weights_input_hidden = np.random.randn(input_size, hidden_size)
            self.weights_hidden_output = np.random.randn(hidden_size, output_size)
        else:
            rng = np.random.default_rng(seed)
            self.weights_input_hidden = rng.standard_normal((input_size, hidden_size))
            self.weights_hidden_output = rng.standard_normal((hidden_size, output_size))

        self.bias_hidden = np.zeros((1, self.hidden_size))
        self.bias_output = np.zeros((1, self.output_size))

    @staticmethod
    def _as_batch(x):
        """Return ``x`` as a 2-D float array; a 1-D sample becomes one row."""
        return np.atleast_2d(np.asarray(x, dtype=float))

    def _as_targets(self, y):
        """Return ``y`` as a float array aligned with ``predicted_output``.

        A target array with the same number of elements as the predictions
        but a different shape (typically a flat ``(n,)`` vector against
        ``(n, 1)`` predictions) is reshaped to the prediction shape.  Without
        this, ``y - predicted_output`` would broadcast to an ``(n, n)``
        matrix and training would silently optimise the wrong quantity.
        Any other shape is left untouched and follows normal broadcasting.
        """
        y = np.asarray(y, dtype=float)
        expected = self.predicted_output.shape
        if y.shape != expected and y.size == self.predicted_output.size:
            y = y.reshape(expected)
        return y

    def sigmoid(self, x):
        """Return the logistic sigmoid ``1 / (1 + exp(-x))`` element-wise.

        Only ``exp`` of a non-positive number is ever evaluated, so large
        negative inputs do not overflow the way ``np.exp(-x)`` would.
        """
        x = np.asarray(x, dtype=float)
        decay = np.exp(-np.abs(x))  # always in (0, 1]
        return np.where(x >= 0, 1.0 / (1.0 + decay), decay / (1.0 + decay))

    def sigmoid_derivative(self, x):
        """Return the sigmoid derivative given the sigmoid's *output*.

        ``x`` must already be ``sigmoid(z)``, not the pre-activation ``z``;
        the derivative is then ``x * (1 - x)``.
        """
        return x * (1 - x)

    def forward(self, x):
        """Forward propagation.

        Args:
            x: input of shape (n_samples, input_size), or a single 1-D
                sample of length ``input_size``.

        Returns:
            The network output, shape (n_samples, output_size).  The
            intermediate values are stored on ``self`` for ``backward``.
        """
        x = self._as_batch(x)

        self.hidden_activation = np.dot(x, self.weights_input_hidden) + self.bias_hidden
        self.hidden_output = self.sigmoid(self.hidden_activation)

        self.output_activation = (
            np.dot(self.hidden_output, self.weights_hidden_output) + self.bias_output
        )
        self.predicted_output = self.sigmoid(self.output_activation)

        return self.predicted_output

    def backward(self, x, y, learning_rate):
        """Backpropagation: update weights and biases in place.

        Uses the activations cached by the most recent ``forward`` call, so
        ``forward(x)`` must have been called with the same ``x`` first.

        Args:
            x: the inputs passed to ``forward`` (2-D batch or 1-D sample).
            y: targets; see ``_as_targets`` for accepted shapes.
            learning_rate: step size multiplying each update.
        """
        x = self._as_batch(x)
        y = self._as_targets(y)

        # Error is (target - prediction), so the updates below are *added*.
        output_error = y - self.predicted_output
        output_delta = output_error * self.sigmoid_derivative(self.predicted_output)

        # Propagate the output delta back through the (pre-update) weights.
        hidden_error = np.dot(output_delta, self.weights_hidden_output.T)
        hidden_delta = hidden_error * self.sigmoid_derivative(self.hidden_output)

        # Update weights & biases
        self.weights_hidden_output += (
            np.dot(self.hidden_output.T, output_delta) * learning_rate
        )
        self.bias_output += np.sum(output_delta, axis=0, keepdims=True) * learning_rate

        self.weights_input_hidden += np.dot(x.T, hidden_delta) * learning_rate
        self.bias_hidden += np.sum(hidden_delta, axis=0, keepdims=True) * learning_rate

    def train(self, x, y, epochs, learning_rate, log_every=500):
        """Train the neural network with full-batch updates.

        Args:
            x: training inputs.
            y: training targets.
            epochs: number of forward/backward passes over the whole batch.
            learning_rate: step size passed to ``backward``.
            log_every: print the loss every this many epochs (starting at
                epoch 0).  ``0`` or ``None`` disables printing.

        Returns:
            A list with one mean-squared-error value per epoch, each computed
            from that epoch's forward pass (i.e. before its weight update).
        """
        x = self._as_batch(x)
        history = []
        for epoch in range(epochs):
            predicted = self.forward(x)
            self.backward(x, y, learning_rate)
            loss = np.mean(np.square(self._as_targets(y) - predicted))
            history.append(float(loss))
            if log_every and epoch % log_every == 0:
                print(f"Epoch {epoch}, Loss: {loss}")
        return history


if __name__ == "__main__":
    # XOR truth table: every pair of binary inputs, and the exclusive-or of
    # the two input columns as a single-column target.
    X = np.array([[a, b] for a in (0, 1) for b in (0, 1)])
    Y = X[:, [0]] ^ X[:, [1]]

    # 2 inputs -> 4 hidden units -> 1 output.
    obj = ANN(2, 4, 1)
    obj.train(x=X, y=Y, epochs=5000, learning_rate=0.1)

    # Run the trained network on the same four inputs and show the result.
    predictions = obj.forward(X)
    print("Predictions after training:", predictions, sep="\n")
    

# Sample output from one run (weights are randomly initialised, so the exact
# numbers differ between runs):
#
# Epoch 0, Loss: 0.2689827010069694
# Epoch 500, Loss: 0.24121328867942893
# Epoch 1000, Loss: 0.20994179947168076
# Epoch 1500, Loss: 0.14153450379563173
# Epoch 2000, Loss: 0.06831827042311621
# Epoch 2500, Loss: 0.03302080593432051
# Epoch 3000, Loss: 0.019202436561050917
# Epoch 3500, Loss: 0.012856844871216072
# Epoch 4000, Loss: 0.00942693042796883
# Epoch 4500, Loss: 0.007341010383033843
# Predictions after training:
# [[0.04565815]
#  [0.91398919]
#  [0.92851314]
#  [0.0961927 ]]
