In [1]:
import numpy as np

class SimpleNeuralNetwork:
    def __init__(self, input_size, hidden_size, output_size, learning_rate=0.1):
        # Initialize weights
        self.learning_rate = learning_rate
        self.W1 = np.random.rand(input_size, hidden_size)
        self.b1 = np.zeros((1, hidden_size))
        self.W2 = np.random.rand(hidden_size, output_size)
        self.b2 = np.zeros((1, output_size))

    def sigmoid(self, x):
        return 1 / (1 + np.exp(-x))

    def sigmoid_derivative(self, x):
        return x * (1 - x)

    def forward(self, X):
        self.z1 = np.dot(X, self.W1) + self.b1
        self.a1 = self.sigmoid(self.z1)
        self.z2 = np.dot(self.a1, self.W2) + self.b2
        self.a2 = self.sigmoid(self.z2)
        return self.a2

    def backward(self, X, y, output):
        output_error = y - output
        output_delta = output_error * self.sigmoid_derivative(output)

        hidden_error = output_delta.dot(self.W2.T)
        hidden_delta = hidden_error * self.sigmoid_derivative(self.a1)

        self.W2 += self.a1.T.dot(output_delta) * self.learning_rate
        self.b2 += np.sum(output_delta, axis=0, keepdims=True) * self.learning_rate
        self.W1 += X.T.dot(hidden_delta) * self.learning_rate
        self.b1 += np.sum(hidden_delta, axis=0, keepdims=True) * self.learning_rate

    def train(self, X, y, epochs=10000):
        for epoch in range(epochs):
            output = self.forward(X)
            self.backward(X, y, output)
            if (epoch+1) % 1000 == 0:
                loss = np.mean(np.square(y - output))
                print(f"Epoch {epoch+1}/{epochs}, Loss: {loss:.6f}")

    def predict(self, X):
        output = self.forward(X)
        return output

if __name__ == "__main__":
    # XOR problem
    X = np.array([[0,0],
                  [0,1],
                  [1,0],
                  [1,1]])
    y = np.array([[0],
                  [1],
                  [1],
                  [0]])

    nn = SimpleNeuralNetwork(input_size=2, hidden_size=2, output_size=1, learning_rate=0.5)
    nn.train(X, y, epochs=10000)

    print("Predictions after training:")
    for x in X:
        print(f"Input: {x} -> Predicted Output: {nn.predict(x.reshape(1, -1))}")


Epoch 1000/10000, Loss: 0.190672
Epoch 2000/10000, Loss: 0.171687
Epoch 3000/10000, Loss: 0.169167
Epoch 4000/10000, Loss: 0.168245
Epoch 5000/10000, Loss: 0.167774
Epoch 6000/10000, Loss: 0.167486
Epoch 7000/10000, Loss: 0.167283
Epoch 8000/10000, Loss: 0.167116
Epoch 9000/10000, Loss: 0.166938
Epoch 10000/10000, Loss: 0.166608
Predictions after training:
Input: [0 0] -> Predicted Output: [[0.02304941]]
Input: [0 1] -> Predicted Output: [[0.66554338]]
Input: [1 0] -> Predicted Output: [[0.6655475]]
Input: [1 1] -> Predicted Output: [[0.66496543]]
