# Building a basic neural network from scratch

In [1]:
import numpy as np

In [5]:
def sigmoid(x):
    """Return the logistic function 1 / (1 + e^(-x)) of *x*.

    Works element-wise on NumPy arrays and also accepts plain scalars.
    """
    decay = np.exp(-x)
    return 1 / (1 + decay)

def sigmoid_derivative(x):
    """Return ``x * (1 - x)``, the sigmoid slope expressed via its output.

    NOTE: *x* is expected to be a value that has already been passed through
    ``sigmoid`` (an activation), not the raw pre-activation input.
    """
    complement = 1 - x
    return x * complement

def mean_squared_error(ytrue, ypred):
    """Return the mean of the squared differences between targets and predictions."""
    residual = ytrue - ypred
    squared = residual ** 2
    return np.mean(squared)

class BasicNeuralNetwork:
    """Two-layer fully connected network with sigmoid activations.

    The network maps ``input_size`` features through one hidden layer of
    ``hidden_size`` sigmoid units to ``output_size`` sigmoid outputs and is
    trained with full-batch gradient updates on the error ``y - output``.
    """

    def __init__(self, input_size, hidden_size, output_size):
        """Allocate weights and biases, each drawn with ``np.random.rand``.

        Args:
            input_size: Number of input features.
            hidden_size: Number of hidden units.
            output_size: Number of output units.
        """
        # Draw order is kept fixed so results under a given np.random seed
        # are reproducible.
        self.weights_input_hidden = np.random.rand(input_size, hidden_size)
        self.weights_hidden_output = np.random.rand(hidden_size, output_size)
        self.bias_hidden = np.random.rand(1, hidden_size)
        self.bias_output = np.random.rand(1, output_size)

    # forward pass
    def forward(self, x):
        """Run a forward pass and return the output-layer activations.

        Args:
            x: Input array whose last axis has length ``input_size``
                (e.g. shape ``(n_samples, input_size)``).

        Returns:
            The sigmoid activations of the output layer.  Intermediate values
            are cached on the instance (``hidden_input``, ``hidden_output``,
            ``output_input``, ``output``) because ``backward`` reads
            ``hidden_output``.
        """
        self.hidden_input = np.dot(x, self.weights_input_hidden) + self.bias_hidden
        self.hidden_output = sigmoid(self.hidden_input)
        self.output_input = np.dot(self.hidden_output, self.weights_hidden_output) + self.bias_output
        self.output = sigmoid(self.output_input)

        return self.output

    # backward pass
    def backward(self, x, y, output, learning_rate):
        """Back-propagate the error and update all weights and biases in place.

        Must be called after ``forward`` on the same ``x`` because it relies
        on the cached ``self.hidden_output``.

        Args:
            x: The 2-D input batch that produced ``output``.
            y: Target values, broadcast-compatible with ``output``.
            output: Activations returned by ``forward(x)``.
            learning_rate: Step size applied to every update.
        """
        # The error is (target - prediction), so the deltas are *added* to
        # the parameters below to move the prediction toward the target.
        output_error = y - output
        output_delta = output_error * sigmoid_derivative(output)
        # Hidden-layer error is computed with the pre-update output weights.
        hidden_error = output_delta.dot(self.weights_hidden_output.T)
        hidden_delta = hidden_error * sigmoid_derivative(self.hidden_output)

        self.weights_hidden_output += np.dot(self.hidden_output.T, output_delta) * learning_rate
        self.bias_output += np.sum(output_delta, axis=0, keepdims=True) * learning_rate
        self.weights_input_hidden += np.dot(x.T, hidden_delta) * learning_rate
        self.bias_hidden += np.sum(hidden_delta, axis=0, keepdims=True) * learning_rate

    # train the model
    def train(self, x, y, epochs, learning_rate, log_every=100):
        """Train on the full batch ``(x, y)`` for ``epochs`` iterations.

        Args:
            x: 2-D input batch.
            y: Target values matching the network output.
            epochs: Number of forward/backward iterations to run.
            learning_rate: Step size passed to ``backward``.
            log_every: Print the loss whenever ``epoch % log_every == 0``.
                Defaults to 100 (the previous fixed interval); pass ``0`` or
                ``None`` to disable logging.
        """
        for epoch in range(epochs):
            output = self.forward(x)
            self.backward(x, y, output, learning_rate)
            # The reported loss is for the prediction made *before* this
            # epoch's weight update.
            if log_every and epoch % log_every == 0:
                print(f'Epoch {epoch}, Loss: {mean_squared_error(y, output)}')



In [20]:
# XOR dataset: every 2-bit input paired with its exclusive-or target

x = np.array([[0, 0], [0, 1], [1, 0], [1, 1]])
y = np.array([[0], [1], [1], [0]])

nn = BasicNeuralNetwork(2, 2, 1)
nn.train(x, y, 10000, 0.1)

print("\ntest the trained neural network:")
for sample, target in zip(x, y):
    # Feed the complete 2-feature sample.  Passing only its first element
    # would broadcast a scalar against the (2, 2) weight matrix and return a
    # (2, 1) array instead of a single prediction for this input.
    output_value = nn.forward(sample)
    round_output = np.where(output_value < 0.5, 0, 1)
    print(f'Input: {sample} \npredicted output: {output_value} \nround-off output: {round_output} \nActual output: {target}')
    print('---------------------------')

Epoch 0, Loss: 0.35606955903668114
Epoch 100, Loss: 0.24992632072605808
Epoch 200, Loss: 0.24985668597160893
Epoch 300, Loss: 0.24979202555794666
Epoch 400, Loss: 0.24972153304416167
Epoch 500, Loss: 0.24964296454212415
Epoch 600, Loss: 0.24955376832331322
Epoch 700, Loss: 0.24945096712049358
Epoch 800, Loss: 0.24933102096715065
Epoch 900, Loss: 0.24918966289173522
Epoch 1000, Loss: 0.24902169893281031
Epoch 1100, Loss: 0.2488207625359602
Epoch 1200, Loss: 0.2485790116063753
Epoch 1300, Loss: 0.24828675429389918
Epoch 1400, Loss: 0.2479319869794125
Epoch 1500, Loss: 0.24749982510040106
Epoch 1600, Loss: 0.24697180521966683
Epoch 1700, Loss: 0.2463250376028425
Epoch 1800, Loss: 0.2455311988490228
Epoch 1900, Loss: 0.24455538776057562
Epoch 2000, Loss: 0.2433549516564448
Epoch 2100, Loss: 0.24187856926981627
Epoch 2200, Loss: 0.24006620548245883
Epoch 2300, Loss: 0.23785105350947489
Epoch 2400, Loss: 0.23516511006101937
Epoch 2500, Loss: 0.23195006020289255
Epoch 2600, Loss: 0.2281736674