# Backpropagation

In [None]:
import numpy as np
import time

class backpropagation:
    """Feed-forward network with one sigmoid hidden layer, trained by backprop.

    The network computes ``a2 = sigmoid(sigmoid(x @ W1 + b1) @ W2 + b2)`` and
    is trained with plain gradient descent on the squared error
    ``0.5 * (y - a2) ** 2``. Gradients are summed (not averaged) over the
    batch dimension.

    Attributes:
        W1, b1: Hidden-layer weights ``(input_size, hidden_size)`` and bias
            ``(1, hidden_size)``.
        W2, b2: Output-layer weights ``(hidden_size, output_size)`` and bias
            ``(1, output_size)``.
        z1, a1, z2, a2: Pre-activations and activations cached by the most
            recent ``forward`` call.
        loss: Element-wise squared error from the most recent ``backward``.
        a1_delta, a2_delta: Error terms from the most recent ``backward``.
    """

    def __init__(self, input_size, hidden_size, output_size, learning_rate):
        """Store the layer sizes and initialise the parameters.

        Args:
            input_size: Number of input features.
            hidden_size: Number of hidden units.
            output_size: Number of output units.
            learning_rate: Step size applied to every parameter update.
        """
        self.input_size = input_size
        self.hidden_size = hidden_size
        self.output_size = output_size
        self.learning_rate = learning_rate

        # Weights are drawn from a standard normal via NumPy's global RNG
        # (seed with np.random.seed for reproducibility); biases start at 0.
        self.W1 = np.random.randn(self.input_size, self.hidden_size)
        self.b1 = np.zeros((1, self.hidden_size))
        self.W2 = np.random.randn(self.hidden_size, self.output_size)
        self.b2 = np.zeros((1, self.output_size))

    @staticmethod
    def _as_batch(x):
        """Return *x* as a 2-D float array (a 1-D sample becomes one row)."""
        return np.atleast_2d(np.asarray(x, dtype=float))

    def sigmoid(self, x):
        """Return the logistic function ``1 / (1 + exp(-x))`` element-wise.

        Only ``exp(-|x|)`` is evaluated, so large-magnitude inputs cannot
        overflow; the ``x >= 0`` branch is the textbook expression.
        """
        x = np.asarray(x, dtype=float)
        decay = np.exp(-np.abs(x))  # always in (0, 1]
        return np.where(x >= 0, 1.0 / (1.0 + decay), decay / (1.0 + decay))

    def sigmoid_derivative(self, x):
        """Return the sigmoid's derivative given the sigmoid *output* ``x``.

        Note that ``x`` must already be ``sigmoid(z)``, not the
        pre-activation ``z``: the derivative is expressed as ``s * (1 - s)``.
        """
        return x * (1 - x)

    def forward(self, x):
        """Run a forward pass and cache the intermediate values.

        Args:
            x: Array-like of shape ``(batch, input_size)``; a single 1-D
                sample of length ``input_size`` is treated as a batch of one.

        Returns:
            The output activations ``a2`` with shape ``(batch, output_size)``.
        """
        x = self._as_batch(x)
        self.z1 = np.dot(x, self.W1) + self.b1
        self.a1 = self.sigmoid(self.z1)
        self.z2 = np.dot(self.a1, self.W2) + self.b2
        self.a2 = self.sigmoid(self.z2)
        return self.a2

    def backward(self, x, y):
        """Apply one gradient-descent update using the cached forward pass.

        ``forward`` must have been called with the same ``x`` beforehand,
        because this method reads the cached ``a1`` and ``a2``.

        Args:
            x: The inputs given to the preceding ``forward`` call.
            y: Targets. A 1-D array-like whose size equals the number of
                outputs is reshaped to match ``a2``; any other shape is
                broadcast against ``a2`` as-is.
        """
        x = self._as_batch(x)
        y = np.asarray(y, dtype=float)
        if y.ndim == 1 and y.size == self.a2.size:
            # Without this, (n,) targets against (n, 1) outputs would
            # broadcast to an (n, n) error matrix.
            y = y.reshape(self.a2.shape)

        error = y - self.a2
        self.loss = 0.5 * np.power(error, 2)

        # Both deltas are computed before any weight is modified, so the
        # hidden-layer delta uses the pre-update W2.
        self.a2_delta = error * self.sigmoid_derivative(self.a2)
        self.a1_delta = (
            self.a2_delta.dot(self.W2.T) * self.sigmoid_derivative(self.a1)
        )

        # The deltas are built from (y - a2), i.e. the negative gradient of
        # the loss, hence "+=" performs descent.
        self.W1 += x.T.dot(self.a1_delta) * self.learning_rate
        self.b1 += (
            np.sum(self.a1_delta, axis=0, keepdims=True) * self.learning_rate
        )
        self.W2 += self.a1.T.dot(self.a2_delta) * self.learning_rate
        self.b2 += (
            np.sum(self.a2_delta, axis=0, keepdims=True) * self.learning_rate
        )

    def train(self, x, y):
        """Run one forward/backward step on ``(x, y)``.

        Returns:
            The mean squared-error loss (as a float) measured before the
            parameters were updated.
        """
        self.forward(x)
        self.backward(x, y)
        return float(np.mean(self.loss))

    def predict(self, x):
        """Return the network output for ``x`` (same as ``forward``)."""
        return self.forward(x)