In [5]:
import numpy as np

# Sigmoid Activation Function
def sigmoid(x):
    """Return the logistic sigmoid ``1 / (1 + exp(-x))`` of *x*, element-wise.

    The value is evaluated as ``exp(-logaddexp(0, -x))``. This is the same
    function algebraically, but it never exponentiates a large positive
    number, so large-magnitude negative inputs give 0.0 without triggering
    an overflow in ``np.exp``.

    Args:
        x: Real scalar or NumPy array.

    Returns:
        NumPy float scalar or array with the same shape as *x*.
    """
    # logaddexp(0, -x) == log(1 + exp(-x)), computed without overflow.
    return np.exp(-np.logaddexp(0, -x))

# Derivative of the sigmoid, written in terms of the sigmoid's OUTPUT (pass s = sigmoid(z), not z)
def sigmoid_derivative(x):
    """Return ``x * (1 - x)``, element-wise.

    This equals the derivative of the logistic sigmoid when *x* is already
    the sigmoid's output (``x = sigmoid(z)``), which is how the callers in
    this file use it. Passing the pre-activation ``z`` does not give the
    derivative.

    Args:
        x: Scalar or NumPy array of sigmoid activations.

    Returns:
        Value with the same shape as *x*.
    """
    complement = 1 - x
    return x * complement

# Neural Network Class Definition
class NeuralNetwork:
    """Fully connected network: input -> sigmoid hidden layer -> sigmoid output.

    Training is full-batch: every call to ``backward`` uses all rows of the
    data passed in, and the parameter updates follow the gradient of the
    summed squared error between targets and outputs.
    """

    def __init__(self, input_size, hidden_size, output_size, seed=None):
        """Store the layer sizes and draw initial parameters from N(0, 1).

        Args:
            input_size: Number of input features per sample.
            hidden_size: Number of units in the hidden layer.
            output_size: Number of output units.
            seed: Optional seed. When given, parameters are drawn from a
                private ``np.random.RandomState(seed)`` so that construction
                is reproducible and does not touch the global RNG. When
                ``None`` (default), the global ``np.random`` state is used.
        """
        self.input_size = input_size
        self.hidden_size = hidden_size
        self.output_size = output_size

        # Both objects expose ``randn``; the draw order below is unchanged
        # regardless of which one is used.
        rng = np.random if seed is None else np.random.RandomState(seed)
        self.weights_input_hidden = rng.randn(self.input_size, self.hidden_size)
        self.bias_hidden = rng.randn(1, self.hidden_size)
        self.weights_hidden_output = rng.randn(self.hidden_size, self.output_size)
        self.bias_output = rng.randn(1, self.output_size)

    def _as_target_matrix(self, y):
        """Return *y* as an array, reshaping flat targets to a column.

        With a single output unit, a 1-D target vector of length n would
        broadcast against the (n, 1) predictions into an (n, n) matrix rather
        than an element-wise error, so it is reshaped to (n, 1) here. Other
        shapes are returned unchanged.
        """
        y = np.asarray(y)
        if y.ndim == 1 and self.output_size == 1:
            y = y.reshape(-1, 1)
        return y

    def forward(self, X):
        """Run a forward pass and cache every intermediate on ``self``.

        Args:
            X: Array whose rows are samples and whose columns are the
                ``input_size`` features.

        Returns:
            The output-layer activations (also stored as
            ``self.output_layer_output``).
        """
        self.input_layer = X
        self.hidden_layer_input = np.dot(self.input_layer, self.weights_input_hidden) + self.bias_hidden
        self.hidden_layer_output = sigmoid(self.hidden_layer_input)
        self.output_layer_input = np.dot(self.hidden_layer_output, self.weights_hidden_output) + self.bias_output
        self.output_layer_output = sigmoid(self.output_layer_input)
        return self.output_layer_output

    def backward(self, X, y, learning_rate):
        """Update all weights and biases in place from the cached activations.

        ``forward(X)`` must have been called first, because this method reads
        ``self.hidden_layer_output`` and ``self.output_layer_output``.

        Args:
            X: The inputs that were given to the preceding ``forward`` call.
            y: Targets matching the output activations; a flat vector is
                accepted when the network has one output unit.
            learning_rate: Step size multiplying each update.
        """
        y = self._as_target_matrix(y)

        error_output = y - self.output_layer_output
        # sigmoid_derivative is given activations (sigmoid outputs), not pre-activations.
        output_layer_delta = error_output * sigmoid_derivative(self.output_layer_output)
        # The hidden error is propagated through the output weights BEFORE
        # those weights are modified below.
        error_hidden = output_layer_delta.dot(self.weights_hidden_output.T)
        hidden_layer_delta = error_hidden * sigmoid_derivative(self.hidden_layer_output)

        # error is (target - output), so adding the products moves the
        # parameters in the direction that reduces the squared error.
        self.weights_hidden_output += self.hidden_layer_output.T.dot(output_layer_delta) * learning_rate
        self.bias_output += np.sum(output_layer_delta, axis=0, keepdims=True) * learning_rate
        self.weights_input_hidden += X.T.dot(hidden_layer_delta) * learning_rate
        self.bias_hidden += np.sum(hidden_layer_delta, axis=0, keepdims=True) * learning_rate

    def train(self, X, y, epochs, learning_rate, log_every=1000):
        """Run ``epochs`` forward/backward passes over the full data set.

        Args:
            X: Training inputs, one sample per row.
            y: Training targets; a flat vector is accepted when the network
                has one output unit.
            epochs: Number of full-batch updates to perform.
            learning_rate: Step size passed to ``backward``.
            log_every: Print the mean squared error every this many epochs
                (starting at epoch 0). A falsy value (``0`` or ``None``)
                disables printing. Defaults to 1000.
        """
        y = self._as_target_matrix(y)
        for epoch in range(epochs):
            self.forward(X)
            self.backward(X, y, learning_rate)
            if log_every and epoch % log_every == 0:
                # Uses the outputs cached by this epoch's forward pass, i.e.
                # the loss from before the update that was just applied.
                loss = np.mean(np.square(y - self.output_layer_output))
                print(f"Epoch {epoch} - Loss: {loss}")

# Main Program
if __name__ == "__main__":
    # Training inputs: six samples with two binary features each.
    # NOTE(review): the input [1, 1] occurs twice with different targets
    # (0 in row 4, 1 in row 5). Confirm this is intended; the two rows
    # cannot both be fit by any function of the input.
    X = np.array([
        [0, 0],
        [0, 1],
        [1, 0],
        [1, 1],
        [1, 1],
        [1, 0],
    ])
    # Expected output for each row of X (one column: a single output unit).
    y = np.array([
        [0],
        [1],
        [1],
        [0],
        [1],
        [1],
    ])

    # 2 inputs -> 4 hidden units -> 1 output.
    nn = NeuralNetwork(input_size=2, hidden_size=4, output_size=1)
    nn.train(X, y, epochs=10000, learning_rate=0.1)

    # Show what the trained network outputs for the training inputs.
    print("\nPredictions after training:")
    print(nn.forward(X))


Epoch 0 - Loss: 0.32691252657291936
Epoch 1000 - Loss: 0.16160738720391163
Epoch 2000 - Loss: 0.10605310998506579
Epoch 3000 - Loss: 0.09051322699918364
Epoch 4000 - Loss: 0.0868866482917001
Epoch 5000 - Loss: 0.08556849945826706
Epoch 6000 - Loss: 0.08492660177763396
Epoch 7000 - Loss: 0.08455624317721773
Epoch 8000 - Loss: 0.0843183880737144
Epoch 9000 - Loss: 0.0841540467562049

Predictions after training:
[[0.03626058]
 [0.96193559]
 [0.97333694]
 [0.5031994 ]
 [0.5031994 ]
 [0.97333694]]
