In [9]:
# Example that uses the Neuron class to implement a simple neural network with 1 hidden layer (2 neurons)
# and the output layer with 1 neuron
import numpy as np
from ipynb.fs.full.Neuron_class import Neuron


In [12]:
class DummyNeuralNetwork:
    def __init__(self):
        weights = np.array([0, 1])
        bias = 0
        
        self.hidden_1 = Neuron(weights, bias)
        self.hidden_2 = Neuron(weights, bias)
        self.output   = Neuron(weights, bias)
        
    def feedforward(self, x):
        out_hidden_1 = self.hidden_1.feedforward(x)
        out_hidden_2 = self.hidden_2.feedforward(x)
        out_network = self.output.feedforward(np.array([out_hidden_1, out_hidden_2]))
        
        return out_network

In [13]:
network = DummyNeuralNetwork()
x = np.array([2, 3])
print(network.feedforward(x)) 

0.7216325609518421


In [19]:

def sigmoid(x):
    return 1/(1 + np.exp(-x))

def derivative_sigmoid(x):
    return sigmoid(x) * (1 - sigmoid(x))

def mse_loss(y_true, y_predicted):
    return ((y_true - y_predicted) **2).mean()

class MyNeuralNetwork:
    def __init__(self):
        
        self.w1 = np.random.normal()
        self.w2 = np.random.normal()
        self.w3 = np.random.normal()
        self.w4 = np.random.normal()
        self.w5 = np.random.normal()
        self.w6 = np.random.normal()
        
        self.b1 = np.random.normal()
        self.b2 = np.random.normal()
        self.b3 = np.random.normal()
        
    def feedforward(self,x):
        output_h1 = sigmoid((self.w1 * x[0] + self.w2 * x[1]) + self.b1)
        output_h2 = sigmoid((self.w3 * x[0] + self.w4 * x[1]) + self.b2)
        output = sigmoid((self.w5 * output_h1 + self.w6 * output_h2) + self.b3)
        
        return output
    
    def train(self, data, true_labels):
        learning_rate = 0.1
        epochs = 1000
        
        for epoch in range(epochs):
            for x, y_true in zip(data, true_labels):
                
                sum_h1 = x[0] * self.w1 + x[1] * self.w2 + self.b1
                output_h1 = sigmoid(sum_h1)
                
                sum_h2 = x[0] * self.w3 + x[1] * self.w4 + self.b2
                output_h2 = sigmoid(sum_h2)
                
                sum_out = output_h1 * self.w5 + output_h2 * self.w6 + self.b3
                y_predicted = sigmoid(sum_out)
                
                
                # Backpropagation -> using partial derivatives
                d_L_d_y_pred = -2 * (y_true - y_predicted)
                
                #output node
                d_y_pred_d_w5 = output_h1 * derivative_sigmoid(sum_out)
                d_y_pred_d_w6 = output_h2 * derivative_sigmoid(sum_out)
                d_y_pred_d_b3 = derivative_sigmoid(sum_out)
                
                d_y_pred_d_h1 = self.w5 * derivative_sigmoid(sum_out)
                d_y_pred_d_h2 = self.w6 * derivative_sigmoid(sum_out)

                #hidden 1 node
                d_h1_d_w1 = x[0] * derivative_sigmoid(output_h1)
                d_h1_d_w2 = x[1] * derivative_sigmoid(output_h1)
                d_h1_d_b1 = derivative_sigmoid(output_h1)
                
                #hidden 2 node
                d_h2_d_w3 = x[0] * derivative_sigmoid(output_h2)
                d_h2_d_w4 = x[1] * derivative_sigmoid(output_h2)
                d_h2_d_b2 = derivative_sigmoid(output_h2)
                
                
                #update weights and biases
                self.w1 -= learning_rate * d_L_d_y_pred * d_y_pred_d_h1 * d_h1_d_w1
                self.w2 -= learning_rate * d_L_d_y_pred * d_y_pred_d_h1 * d_h1_d_w2
                self.b1 -= learning_rate * d_L_d_y_pred * d_y_pred_d_h1 * d_h1_d_b1
                
                self.w3 -= learning_rate * d_L_d_y_pred * d_y_pred_d_h2 * d_h2_d_w3
                self.w4 -= learning_rate * d_L_d_y_pred * d_y_pred_d_h2 * d_h2_d_w4
                self.b2 -= learning_rate * d_L_d_y_pred * d_y_pred_d_h2 * d_h2_d_b2
                
                self.w5 -= learning_rate * d_L_d_y_pred * d_y_pred_d_w5
                self.w6 -= learning_rate * d_L_d_y_pred * d_y_pred_d_w6
                self.b3 -= learning_rate * d_L_d_y_pred * d_y_pred_d_b3
                
                if epoch % 10 == 0:
                    y_preds = np.apply_along_axis(self.feedforward, 1, data)
                    loss = mse_loss(true_labels, y_preds)
                    print("Epoch %d loss: %.3f" % (epoch, loss))

In [20]:
# Define dataset
data = np.array([
  [-2, -1],  # Alice
  [25, 6],   # Bob
  [17, 4],   # Charlie
  [-15, -6], # Diana
])
all_y_trues = np.array([
  1, # Alice
  0, # Bob
  0, # Charlie
  1, # Diana
])

# Train our neural network!
network = MyNeuralNetwork()
network.train(data, all_y_trues)

Epoch 0 loss: 0.453
Epoch 0 loss: 0.373
Epoch 0 loss: 0.358
Epoch 0 loss: 0.321
Epoch 10 loss: 0.065
Epoch 10 loss: 0.065
Epoch 10 loss: 0.065
Epoch 10 loss: 0.063
Epoch 20 loss: 0.039
Epoch 20 loss: 0.039
Epoch 20 loss: 0.039
Epoch 20 loss: 0.039
Epoch 30 loss: 0.030
Epoch 30 loss: 0.030
Epoch 30 loss: 0.030
Epoch 30 loss: 0.030
Epoch 40 loss: 0.025
Epoch 40 loss: 0.025
Epoch 40 loss: 0.025
Epoch 40 loss: 0.025
Epoch 50 loss: 0.022
Epoch 50 loss: 0.022
Epoch 50 loss: 0.022
Epoch 50 loss: 0.021
Epoch 60 loss: 0.019
Epoch 60 loss: 0.019
Epoch 60 loss: 0.019
Epoch 60 loss: 0.019
Epoch 70 loss: 0.017
Epoch 70 loss: 0.017
Epoch 70 loss: 0.017
Epoch 70 loss: 0.017
Epoch 80 loss: 0.015
Epoch 80 loss: 0.015
Epoch 80 loss: 0.015
Epoch 80 loss: 0.015
Epoch 90 loss: 0.014
Epoch 90 loss: 0.014
Epoch 90 loss: 0.014
Epoch 90 loss: 0.014
Epoch 100 loss: 0.013
Epoch 100 loss: 0.013
Epoch 100 loss: 0.013
Epoch 100 loss: 0.013
Epoch 110 loss: 0.012
Epoch 110 loss: 0.012
Epoch 110 loss: 0.012
Epoch 110 

  return 1/(1 + np.exp(-x))


In [21]:
emily = np.array([-7, -3]) # 128 pounds, 63 inches
frank = np.array([20, 2])  # 155 pounds, 68 inches
print("Emily: %.3f" % network.feedforward(emily)) # 0.951 - F
print("Frank: %.3f" % network.feedforward(frank)) # 0.039 - M

Emily: 0.963
Frank: 0.037


  return 1/(1 + np.exp(-x))
