In [13]:
import numpy as np
import matplotlib.pyplot as plt


In [2]:
class NeuralNetwork:
    def __init__(self, input_size, hidden_size, output_size):
        self.input_size = input_size
        self.hidden_size = hidden_size
        self.output_size = output_size

        # Initialize weights and biases for the hidden and output layers
        self.weights_input_hidden = np.random.randn(self.input_size, self.hidden_size)
        self.bias_hidden = np.zeros((1, self.hidden_size))
        self.weights_hidden_output = np.random.randn(self.hidden_size, self.output_size)
        self.bias_output = np.zeros((1, self.output_size))

    def sigmoid(self, x):
        return 1 / (1 + np.exp(-x))

    def sigmoid_derivative(self, x):
        return x * (1 - x)

    def forward(self, X):
        # Perform the forward pass
        hidden_input = np.dot(X, self.weights_input_hidden) + self.bias_hidden
        hidden_output = self.sigmoid(hidden_input)

        output_input = np.dot(hidden_output, self.weights_hidden_output) + self.bias_output
        predicted_output = self.sigmoid(output_input)

        return predicted_output, hidden_output

    def train(self, X, y, epochs, learning_rate):
        for epoch in range(epochs):
            # Perform forward propagation
            predicted_output, hidden_output = self.forward(X)

            # Calculate the error
            error = y - predicted_output

            # Backpropagation
            output_delta = error * self.sigmoid_derivative(predicted_output)
            hidden_error = output_delta.dot(self.weights_hidden_output.T)
            hidden_delta = hidden_error * self.sigmoid_derivative(hidden_output)

            # Update weights and biases using gradient descent
            self.weights_hidden_output += hidden_output.T.dot(output_delta) * learning_rate
            self.bias_output += np.sum(output_delta) * learning_rate
            self.weights_input_hidden += X.T.dot(hidden_delta) * learning_rate
            self.bias_hidden += np.sum(hidden_delta) * learning_rate

            # Print the error every 1000 epochs
            if epoch % 1000 == 0:
                print(f"Error after epoch {epoch}: {np.mean(np.abs(error)):.4f}")

    def predict(self, X):
        # Perform a forward pass and return the predicted output
        predicted_output, _ = self.forward(X)
        return predicted_output


In [10]:
# Create a dataset for XOR problem
X = np.array([[0, 0], [0, 1], [1, 0], [1, 1]])
y = np.array([[0], [1], [1], [0]])
print(X)
print(y)

# Initialize and train the neural network
input_size = 2
hidden_size = 4
output_size = 1
epochs = 10000
learning_rate = 0.1


[[0 0]
 [0 1]
 [1 0]
 [1 1]]
[[0]
 [1]
 [1]
 [0]]


In [11]:
model = NeuralNetwork(input_size, hidden_size, output_size)
model.train(X, y, epochs, learning_rate)

# Predictions after training
predictions = model.predict(X)
print("Predictions after training:")
print(predictions)

Error after epoch 0: 0.5001
Error after epoch 1000: 0.4403
Error after epoch 2000: 0.2643
Error after epoch 3000: 0.1528
Error after epoch 4000: 0.1112
Error after epoch 5000: 0.0900
Error after epoch 6000: 0.0770
Error after epoch 7000: 0.0681
Error after epoch 8000: 0.0615
Error after epoch 9000: 0.0565
Predictions after training:
[[0.04574975]
 [0.95073778]
 [0.94335528]
 [0.05801924]]
