In [1]:
import numpy as np

class XORNetwork:
    """Two-layer sigmoid network trained with full-batch gradient descent.

    Architecture: 2 inputs -> ``hidden_size`` sigmoid units -> 1 sigmoid
    output. The weight updates in :meth:`backward` are gradient-descent steps
    on the summed squared error ``0.5 * sum((y - output) ** 2)``.

    Attributes set by ``__init__``:
        W1, b1: hidden-layer weights ``(2, hidden_size)`` and biases
            ``(hidden_size,)``.
        W2, b2: output-layer weights ``(hidden_size, 1)`` and bias ``(1,)``.

    Attributes set by ``forward`` (and read by ``backward``):
        z1, a1: hidden pre-activations and activations.
        z2, a2: output pre-activation and activation.
    """

    def __init__(self, hidden_size=2, seed=None):
        """Draw all parameters from a standard normal distribution.

        Args:
            hidden_size: Number of hidden units. Defaults to 2, the original
                fixed architecture.
            seed: Optional seed for reproducible initialisation. When
                ``None`` the global ``np.random`` state is used, so an
                earlier ``np.random.seed(...)`` call is still honoured.

        Raises:
            ValueError: If ``hidden_size`` is smaller than 1.
        """
        if hidden_size < 1:
            raise ValueError("hidden_size must be a positive integer")

        # Both the np.random module and RandomState expose ``randn``; the draw
        # order (W1, b1, W2, b2) is kept so seeded global state gives the same
        # parameters as before.
        rng = np.random if seed is None else np.random.RandomState(seed)
        self.W1 = rng.randn(2, hidden_size)
        self.b1 = rng.randn(hidden_size)
        self.W2 = rng.randn(hidden_size, 1)
        self.b2 = rng.randn(1)

    def sigmoid(self, x):
        """Return the logistic function ``1 / (1 + exp(-x))`` element-wise.

        The argument is clipped to [-500, 500] before exponentiation so that
        extreme pre-activations cannot overflow ``np.exp``; inside that range
        the result is unchanged.
        """
        return 1.0 / (1.0 + np.exp(-np.clip(x, -500.0, 500.0)))

    def sigmoid_derivative(self, x):
        """Return the sigmoid slope given the sigmoid *output* ``x``.

        Note that ``x`` is the activation ``sigmoid(z)``, not the
        pre-activation ``z``: the derivative is ``a * (1 - a)``.
        """
        return x * (1 - x)

    def forward(self, X):
        """Run a forward pass and cache the intermediate values.

        Args:
            X: Array-like of input rows with 2 features each.

        Returns:
            The output activations ``a2``.
        """
        X = np.asarray(X, dtype=float)
        self.z1 = np.dot(X, self.W1) + self.b1
        self.a1 = self.sigmoid(self.z1)
        self.z2 = np.dot(self.a1, self.W2) + self.b2
        self.a2 = self.sigmoid(self.z2)
        return self.a2

    def backward(self, X, y, output, learning_rate):
        """Apply one gradient-descent update to all parameters in place.

        Uses ``self.a1`` cached by the most recent :meth:`forward` call, so
        ``output`` must come from a forward pass on the same ``X``.

        Args:
            X: Array-like of input rows used for the forward pass.
            y: Targets; reshaped to ``output``'s shape so a flat label vector
                cannot silently broadcast into an (n, n) error matrix.
            output: Network output for ``X``.
            learning_rate: Step size applied to every parameter update.

        Raises:
            ValueError: If ``y`` cannot be reshaped to ``output``'s shape.
        """
        X = np.asarray(X, dtype=float)
        output = np.asarray(output, dtype=float)
        y = np.asarray(y, dtype=float).reshape(output.shape)

        output_error = y - output
        output_delta = output_error * self.sigmoid_derivative(output)

        # Back-propagate through W2 *before* W2 is updated below.
        hidden_error = output_delta.dot(self.W2.T)
        hidden_delta = hidden_error * self.sigmoid_derivative(self.a1)

        # error = y - output, so "+=" moves downhill on the squared error.
        self.W1 += learning_rate * X.T.dot(hidden_delta)
        self.b1 += learning_rate * np.sum(hidden_delta, axis=0)
        self.W2 += learning_rate * self.a1.T.dot(output_delta)
        self.b2 += learning_rate * np.sum(output_delta, axis=0)

    def train(self, X, y, epochs, learning_rate=0.1, log_every=1000):
        """Train on the full batch for ``epochs`` iterations.

        Args:
            X: Array-like of input rows.
            y: Targets, either a column ``(n, 1)`` or a flat ``(n,)`` vector.
            epochs: Number of forward/backward passes.
            learning_rate: Step size passed to :meth:`backward`.
            log_every: Print the mean absolute error every this many epochs;
                ``0`` or ``None`` disables printing.
        """
        X = np.asarray(X, dtype=float)
        # Normalise labels to one column per output unit up front.
        y = np.asarray(y, dtype=float).reshape(-1, self.W2.shape[1])

        for i in range(epochs):
            output = self.forward(X)
            self.backward(X, y, output, learning_rate)
            if log_every and i % log_every == 0:
                # Reported error is for the output computed before this
                # epoch's parameter update.
                loss = np.mean(np.abs(y - output))
                print(f"Epoch {i}: Error = {loss:.4f}")

    def predict(self, X):
        """Return the network output for ``X`` (a plain forward pass)."""
        return self.forward(X)

# XOR truth table: enumerate every pair of binary inputs, then derive each
# label as the exclusive-or of that row's two columns.
X = np.array([[a, b] for a in (0, 1) for b in (0, 1)])
y = X[:, :1] ^ X[:, 1:]

# Fit a fresh network on the four samples and evaluate it on the same inputs.
xor_nn = XORNetwork()
xor_nn.train(X, y, learning_rate=0.1, epochs=10000)
predictions = xor_nn.predict(X)

# Show the raw sigmoid outputs, then the same outputs thresholded at 0.5.
print("Raw predictions:\n", predictions)
print("Binary predictions:\n", np.greater(predictions, 0.5).astype(int))


Epoch 0: Error = 0.4978
Epoch 1000: Error = 0.4481
Epoch 2000: Error = 0.3627
Epoch 3000: Error = 0.3229
Epoch 4000: Error = 0.3049
Epoch 5000: Error = 0.2949
Epoch 6000: Error = 0.2885
Epoch 7000: Error = 0.2841
Epoch 8000: Error = 0.2807
Epoch 9000: Error = 0.2781
Raw predictions:
 [[0.04511763]
 [0.94704773]
 [0.4968917 ]
 [0.50295181]]
Binary predictions:
 [[0]
 [1]
 [0]
 [1]]
