In [None]:
import numpy as np

In [None]:
class NeuralNetwork:
  """Fully connected network with one hidden layer and sigmoid activations.

  Data flows input -> hidden -> output; both layers apply the sigmoid.
  Training is full-batch gradient descent on the squared error, performed by
  alternating `feed_forward` and `back_propagation`.

  Attributes:
    input_size: number of input features.
    hidden_size: number of neurons in the hidden layer.
    output_size: number of neurons in the output layer.
    weights_input_hidden: array of shape (input_size, hidden_size).
    weights_hidden_output: array of shape (hidden_size, output_size).
    bias_hidden: array of shape (1, hidden_size).
    bias_output: array of shape (1, output_size).
  """

  def __init__(self, input_size, hidden_size, output_size):
    """Store the layer sizes and create the initial parameters.

    Args:
      input_size: number of input features.
      hidden_size: number of neurons in the hidden layer.
      output_size: number of neurons in the output layer.
    """
    self.input_size = input_size
    self.hidden_size = hidden_size
    self.output_size = output_size

    # Weights are drawn from a standard normal distribution using NumPy's
    # global RNG, so call np.random.seed(...) beforehand for reproducible runs.
    self.weights_input_hidden = np.random.randn(self.input_size, self.hidden_size)
    self.weights_hidden_output = np.random.randn(self.hidden_size, self.output_size)

    # Biases start at zero.
    self.bias_hidden = np.zeros((1, self.hidden_size))
    self.bias_output = np.zeros((1, self.output_size))

  def sigmoid(self, x):
    """Return the element-wise logistic function 1 / (1 + exp(-x))."""
    return 1 / (1 + np.exp(-x))

  def sigmoid_derivative(self, x):
    """Return the sigmoid's derivative given the sigmoid *output*.

    `x` must already be an activation s = sigmoid(z), not the pre-activation
    z; the derivative with respect to z is then s * (1 - s).
    """
    return x * (1 - x)

  def feed_forward(self, X):
    """Run a forward pass and cache the intermediate activations.

    Args:
      X: input array whose last axis has length `input_size`
        (e.g. shape (n_samples, input_size)).

    Returns:
      The output-layer activations; also stored as `self.predicted_output`.
      `self.hidden_output` is cached as well because `back_propagation`
      reads both.
    """
    # Input layer to hidden layer
    self.hidden_activation = np.dot(X, self.weights_input_hidden) + self.bias_hidden
    self.hidden_output = self.sigmoid(self.hidden_activation)

    # Hidden layer to output layer
    self.output_activation = np.dot(self.hidden_output, self.weights_hidden_output) + self.bias_output
    self.predicted_output = self.sigmoid(self.output_activation)

    return self.predicted_output

  def back_propagation(self, X, y, learning_rate):
    """Apply one gradient step using the activations cached by `feed_forward`.

    `feed_forward(X)` must have been called with the same `X` immediately
    before, since this method reads `self.predicted_output` and
    `self.hidden_output`.

    Args:
      X: the 2-D input batch that was fed forward.
      y: target array, broadcastable against the predictions.
      learning_rate: step size applied to every parameter update.
    """
    # The error is (target - prediction), so the updates below are *added*.
    output_error = y - self.predicted_output
    output_delta = output_error * self.sigmoid_derivative(self.predicted_output)

    # Propagate the output delta back through the (not yet updated) output weights.
    hidden_error = np.dot(output_delta, self.weights_hidden_output.T)
    # hidden_delta indicates how much the hidden layer's output contributed to the output error.
    hidden_delta = hidden_error * self.sigmoid_derivative(self.hidden_output)

    # Update weights and biases; bias updates sum the deltas over the batch axis.
    self.weights_hidden_output += learning_rate * np.dot(self.hidden_output.T, output_delta)
    self.bias_output += learning_rate * np.sum(output_delta, axis=0, keepdims=True)

    self.weights_input_hidden += learning_rate * np.dot(X.T, hidden_delta)
    self.bias_hidden += learning_rate * np.sum(hidden_delta, axis=0, keepdims=True)

  def train_network(self, X, y, epochs, learning_rate, log_interval=4000):
    """Train with full-batch gradient descent for `epochs` iterations.

    Every epoch performs one forward pass followed by one parameter update.

    Args:
      X: 2-D input batch.
      y: target array matching the network output.
      epochs: number of forward/backward iterations; 0 leaves the network
        untouched.
      learning_rate: step size passed to `back_propagation`.
      log_interval: print the mean squared error every `log_interval` epochs
        (starting with epoch 0). Pass 0 or None to disable logging.
    """
    for epoch in range(epochs):
      output = self.feed_forward(X)
      # The update must happen inside the loop: one weight update per epoch.
      self.back_propagation(X, y, learning_rate)
      if log_interval and epoch % log_interval == 0:
        # Loss of the predictions made *before* this epoch's update.
        loss = np.mean(np.square(y - output))
        print(f"Epoch: {epoch}, Loss: {loss}")

In [None]:
# XOR truth table: every combination of two binary inputs, one row per sample.
X = np.array([[a, b] for a in (0, 1) for b in (0, 1)])
# The target is 1 exactly when the two inputs differ.
y = np.array([[a ^ b] for a, b in X.tolist()])

In [None]:
# Seed NumPy's global RNG before building the network: NeuralNetwork draws its
# initial weights with np.random.randn, so without a seed the results differ
# on every Restart & Run All.
np.random.seed(42)

nn = NeuralNetwork(input_size=2, hidden_size=4, output_size=1)
nn.train_network(X, y, epochs=10000, learning_rate=0.1)

# Test the trained model
output = nn.feed_forward(X)
print("Predictions after training: ")
print(output)

Predictions after training: 
[[0.29673854]
 [0.31986019]
 [0.34953992]
 [0.36480139]]
