In [None]:
import numpy as np

class NeuralNetwork:
    """Single-hidden-layer, fully connected network with sigmoid activations.

    Weights are drawn from a standard normal distribution and biases start
    at zero.  Training is full-batch gradient descent on the squared error
    between the targets and the network output.

    Attributes set by ``feedforward`` (and consumed by ``backward``):
        z1, a1: hidden-layer pre-activation and activation.
        output_z, output: output-layer pre-activation and activation.
    """

    def __init__(self, input_size, hidden_size, output_size):
        """Create the network and randomly initialise its parameters.

        Args:
            input_size: Number of input features per sample.
            hidden_size: Number of units in the hidden layer.
            output_size: Number of output units.
        """
        self.input_size = input_size
        self.hidden_size = hidden_size
        self.output_size = output_size

        # Weight matrices are laid out (fan_in, fan_out) so that a batch of
        # row-vector samples can be propagated with ``np.dot(batch, weights)``.
        self.weight_input_hidden = np.random.randn(self.input_size, self.hidden_size)
        self.weights_hidden_output = np.random.randn(self.hidden_size, self.output_size)

        # Biases are row vectors so they broadcast over the batch dimension.
        self.b1 = np.zeros((1, self.hidden_size))
        self.b2 = np.zeros((1, self.output_size))

    def sigmoid(self, x):
        """Return the element-wise logistic function ``1 / (1 + exp(-x))``."""
        return 1 / (1 + np.exp(-x))

    def sigmoid_derivative(self, x):
        """Return the sigmoid derivative given the sigmoid *output* ``x``.

        Note that ``x`` must already be an activation (``sigmoid(z)``), not
        the pre-activation ``z``: the identity used is s'(z) = s(z) * (1 - s(z)).
        """
        return x * (1 - x)

    def feedforward(self, X):
        """Propagate ``X`` through the network and return the output layer.

        The intermediate values and the final output are cached on the
        instance so that ``backward`` can be called right afterwards.

        Args:
            X: Array whose last dimension equals ``input_size``.

        Returns:
            The output-layer activations for ``X``.
        """
        # Input to hidden
        self.z1 = np.dot(X, self.weight_input_hidden) + self.b1
        self.a1 = self.sigmoid(self.z1)

        # Hidden to output
        self.output_z = np.dot(self.a1, self.weights_hidden_output) + self.b2
        # Cache the result: ``backward`` reads ``self.output`` and would
        # otherwise fail unless the caller went through ``train``.
        self.output = self.sigmoid(self.output_z)

        return self.output

    def backward(self, X, y, learning_rate):
        """Apply one gradient-descent update using the cached forward pass.

        ``feedforward(X)`` must have been called with the same ``X`` first,
        since this method relies on the cached ``a1`` and ``output``.

        Args:
            X: The inputs used for the preceding forward pass.
            y: Target values, broadcastable against the network output.
            learning_rate: Step size applied to every parameter update.
        """
        # Output error; the sign (target minus prediction) is why the
        # parameter updates below are additive.
        output_error = y - self.output
        output_delta = output_error * self.sigmoid_derivative(self.output)

        # Hidden error is computed with the output weights as they were
        # during the forward pass, i.e. before they are updated below.
        hidden_error = np.dot(output_delta, self.weights_hidden_output.T)
        hidden_delta = hidden_error * self.sigmoid_derivative(self.a1)

        # Update weights and biases (gradients are summed over the batch).
        self.weights_hidden_output += np.dot(self.a1.T, output_delta) * learning_rate
        self.b2 += np.sum(output_delta, axis=0, keepdims=True) * learning_rate
        self.weight_input_hidden += np.dot(X.T, hidden_delta) * learning_rate
        self.b1 += np.sum(hidden_delta, axis=0, keepdims=True) * learning_rate

    def train(self, X, y, epochs, learning_rate, log_every=4000):
        """Run ``epochs`` full-batch updates, periodically printing the loss.

        Args:
            X: Training inputs.
            y: Training targets.
            epochs: Number of forward/backward passes to perform.
            learning_rate: Step size passed to ``backward``.
            log_every: Print the mean squared error every this many epochs
                (starting at epoch 0).  A falsy value (``0`` or ``None``)
                disables logging.
        """
        for epoch in range(epochs):
            self.feedforward(X)
            self.backward(X, y, learning_rate)
            if log_every and epoch % log_every == 0:
                # The reported loss uses the output computed before this
                # epoch's parameter update.
                loss = np.mean(np.square(y - self.output))
                print(f"Epoch {epoch}, Loss: {loss}")

# XOR truth table: each row of `x` is one (a, b) input pair and the matching
# row of `y` is a XOR b, kept as a column vector to line up with the
# network's single output unit.
x = np.array(
    [
        [0, 0],
        [0, 1],
        [1, 0],
        [1, 1],
    ]
)
y = x[:, :1] ^ x[:, 1:]

# Network shape: 2 inputs -> 4 hidden neurons -> 1 output.
nn = NeuralNetwork(input_size=2, hidden_size=4, output_size=1)

# Fit the network on the four XOR samples.
nn.train(x, y, epochs=10_000, learning_rate=0.1)

# Evaluate the trained network on the same four samples and show the result.
output = nn.feedforward(x)
print("Prediction after training:", output, sep="\n")


Epoch 0, Loss: 0.26368457097071646
Epoch 4000, Loss: 0.006932700515262648
Epoch 8000, Loss: 0.00236217383863496
Prediction after training:
[[0.03835544]
 [0.95402286]
 [0.95966184]
 [0.04206602]]
