In [1]:
import numpy as np

# Sigmoid activation function
def sigmoid(x):
    """Return the logistic sigmoid ``1 / (1 + exp(-x))`` of ``x``, element-wise.

    The value is computed in a numerically stable form: only ``exp(-|x|)``
    is ever evaluated, so large-magnitude negative inputs do not overflow
    ``np.exp`` (and raise a RuntimeWarning) as the direct formula does.

    Args:
        x: Real-valued scalar or array-like.

    Returns:
        A NumPy scalar for scalar input, otherwise an array with the same
        shape as ``x``. Non-floating inputs (e.g. ints) are promoted to
        float64; floating inputs keep their dtype.
    """
    x = np.asarray(x)
    if not np.issubdtype(x.dtype, np.floating):
        x = x.astype(float)
    # exp(-|x|) lies in (0, 1], so it can never overflow.
    decay = np.exp(-np.abs(x))
    # x >= 0: 1 / (1 + e^-x);  x < 0: e^x / (1 + e^x) -- algebraically equal.
    numerator = np.where(x >= 0, np.ones_like(decay), decay)
    # [()] unwraps a 0-d result to a scalar and leaves n-d arrays untouched.
    return (numerator / (1.0 + decay))[()]

# Derivative of the sigmoid, written in terms of the sigmoid's output
def sigmoid_derivative(x):
    """Return ``x * (1 - x)``.

    This is the sigmoid's slope when ``x`` is already a sigmoid *output*
    (an activation value), not the raw pre-activation input.
    """
    complement = 1 - x
    return x * complement

# Define the neural network class
class NeuralNetwork:
    """Fully connected network with one hidden layer and sigmoid activations.

    Parameters live on the instance as ``weights_input_hidden``,
    ``bias_input_hidden``, ``weights_hidden_output`` and
    ``bias_hidden_output``. ``forward`` stores its activations on the
    instance and ``backward`` reads them back.
    """

    def __init__(self, input_size, hidden_size, output_size):
        """Draw every weight and bias uniformly from [0, 1)."""
        # The draw order below is fixed so results under a seeded global
        # NumPy RNG stay reproducible.
        draw = np.random.rand
        self.weights_input_hidden = draw(input_size, hidden_size)
        self.bias_input_hidden = draw(1, hidden_size)
        self.weights_hidden_output = draw(hidden_size, output_size)
        self.bias_hidden_output = draw(1, output_size)

    def forward(self, X):
        """Run a forward pass on ``X`` and return the output activations.

        The hidden and output activations are kept on ``self.hidden_output``
        and ``self.output`` for a subsequent ``backward`` call.
        """
        hidden_pre = np.dot(X, self.weights_input_hidden) + self.bias_input_hidden
        self.hidden_output = sigmoid(hidden_pre)

        output_pre = (
            np.dot(self.hidden_output, self.weights_hidden_output)
            + self.bias_hidden_output
        )
        self.output = sigmoid(output_pre)
        return self.output

    def backward(self, X, y, learning_rate):
        """Update all weights and biases in place from one backward pass.

        Reads the activations stored by the most recent ``forward`` call, so
        it is expected to follow ``forward`` on the same ``X``.

        Args:
            X: Inputs that produced the stored activations.
            y: Target outputs matching ``self.output``.
            learning_rate: Scale applied to every parameter update.
        """
        hidden_act = self.hidden_output
        out_act = self.output

        # Output layer: target-minus-prediction error scaled by the slope.
        delta_out = (y - out_act) * sigmoid_derivative(out_act)

        # Hidden layer: push the output delta back through the hidden->output
        # weights as they are *before* this step's update.
        delta_hidden = (
            np.dot(delta_out, self.weights_hidden_output.T)
            * sigmoid_derivative(hidden_act)
        )

        # Per-parameter update directions (bias terms sum over the batch axis).
        step_w_out = np.dot(hidden_act.T, delta_out)
        step_b_out = np.sum(delta_out, axis=0, keepdims=True)
        step_w_hidden = np.dot(X.T, delta_hidden)
        step_b_hidden = np.sum(delta_hidden, axis=0, keepdims=True)

        # Apply the updates in place.
        self.weights_hidden_output += learning_rate * step_w_out
        self.bias_hidden_output += learning_rate * step_b_out
        self.weights_input_hidden += learning_rate * step_w_hidden
        self.bias_input_hidden += learning_rate * step_b_hidden

# Example usage
# Network dimensions: 2 inputs -> 3 hidden units -> 1 output
input_size, hidden_size, output_size = 2, 3, 1

# Build the network
nn = NeuralNetwork(input_size, hidden_size, output_size)

# Training data: the four rows of the XOR truth table
X = np.array([
    [0, 0],
    [0, 1],
    [1, 0],
    [1, 1],
])
y = np.array([[0], [1], [1], [0]])

# Training hyperparameters
epochs, learning_rate = 10000, 0.1

# Full-batch training; report the mean squared error every 1000 epochs.
# The reported loss uses the predictions made before that epoch's update.
for epoch in range(epochs):
    output = nn.forward(X)
    nn.backward(X, y, learning_rate)
    if epoch % 1000:
        continue
    loss = np.square(y - output).mean()
    print(f"Epoch: {epoch}, Loss: {loss}")

# Evaluate the trained model on the same four input patterns
test_input = np.array([[0, 0], [0, 1], [1, 0], [1, 1]])
predicted_output = nn.forward(test_input)
print("Predicted Output:", predicted_output, sep="\n")


Epoch: 0, Loss: 0.38312474638549565
Epoch: 1000, Loss: 0.24472988171413584
Epoch: 2000, Loss: 0.21544664992514562
Epoch: 3000, Loss: 0.16941738605472628
Epoch: 4000, Loss: 0.08440864062796452
Epoch: 5000, Loss: 0.023868155613454206
Epoch: 6000, Loss: 0.011126683513587548
Epoch: 7000, Loss: 0.006849816702091066
Epoch: 8000, Loss: 0.004838505672081184
Epoch: 9000, Loss: 0.0036989784943961476
Predicted Output:
[[0.05620277]
 [0.94987237]
 [0.94532324]
 [0.05690739]]
