## initialize_network function

In [19]:
# -*- coding:utf-8 -*-

from random import seed
from random import random

def initialize_network(n_inputs, n_hidden, n_outputs):
    network= list()
    hidden_layer = [{'weights': [random() for i in range(n_inputs + 1)]} for i in range(n_hidden)]
    network.append(hidden_layer)

    output_layer = [{'weights': [random() for i in range(n_hidden +1)]} for i in range(n_outputs)]
    network.append(output_layer)

    return network

seed(1)
network = initialize_network(2, 1, 2)
for layer in network:
    print(layer)



[{'weights': [0.13436424411240122, 0.8474337369372327, 0.763774618976614]}]
[{'weights': [0.2550690257394217, 0.49543508709194095]}, {'weights': [0.4494910647887381, 0.651592972722763]}]


akj: k = kth neuron of previous layer, 
     j = jth neuron of current layer  
                    b00                    a00                   a10  
[{'weights': [0.13436424411240122, 0.8474337369372327, 0.763774618976614]}]  
                     b00                    a00                                 b01                    a01  
[{'weights': [0.2550690257394217, 0.49543508709194095]}, {'weights': [0.4494910647887381, 0.651592972722763]}]

## activate function

In [20]:
from math import exp

# Calculate neuron activation for an input
# weights : weight corresponding to neurons of previous layer
# inputs  : output of neurons of previous layer 
def activate(weights, inputs, verbose=False):
    
    activation = weights[-1] # the last weight is bias
    
    # len(inputs) - 1 = we don't count bias in
    for i in range(len(inputs) - 1):
        if verbose:
            print("activation:{}".format(activation))
            print("weight[{}]: {} * inputs[{}] = {}".format(i, weights[i], i, inputs[i]))
        activation += weights[i] * inputs[i]
    
    if verbose:
        print("cur activation: {}".format(activation))
        
    return activation


## transfer function

In [21]:
# Transfer neruon activation
def transfer(activation):
    return 1.0 / (1.0 + exp(-activation))


## forward_propagate function

In [22]:
# Forward propagate input to a network output
def forward_propagate(network, row, verbose=False):
    inputs = row
    for layer in network:
        new_inputs = []
        if verbose:
            print("layer: {}".format(layer))
        
        for neuron in layer:
            if verbose:
                print("neuron: {}".format(neuron))
                
            activation = activate(neuron['weights'], inputs)
            neuron['output'] = transfer(activation)
            new_inputs.append(neuron['output'])
        inputs = new_inputs
    return inputs


In [23]:
# row = input 
# the last element of row is bias
row = [1, 0, None]
output = forward_propagate(network, row)

In [24]:
print(output)

[0.6213859615555266, 0.6573693455986976]


## transfer_derivative function

In [25]:
# Calculate the derivative of an neuron output
# y = 1/ (1 + exp(-z)))
def transfer_derivative(output):
    return output * (1.0 - output)


## backward_propagate_error function : Calculate Backpropagate error and store in neurons

In [26]:
# Backpropagate error and store in neurons

'''
for each neuron of output layer
    error = (expected - output) * transfer_derivative(output of output layer)

for each neuron of hidden layer
    error_kj = (weight_kj * error_j) * transfer_derivative(output_kj)
    
    假設目前在 "h" layer 的第 "k" 個 neuron
    output_kj_h   = "h"   layer 的第 "k" 個 neuron 輸出到下一個 "h+1" layer 的第 "j" 個 neuron
    weight_kj_h   = "h"   layer 的第 "k" 個 neuron 到下一個    "h+1" layer 的第 "j" 個 neuron 的 weigth
    error_j_h+1   = "h+1" layer 的第 "j" 個 neuron 的 error
                
                以 output layer(第 L 個 layer) 前一個 hidden layer(L-1) 而言
                "L-1" layer 的第 "j" 個 neuron 的 backpropagate error
                error_j = (expected - output_Lj) * transfer_derivative(output_j_L)

    error_k = sum(error_kj), j = 1 ~ n
'''

def backward_propagate_error(network, expected):
    for i in reversed(range(len(network))):
        layer = network[i]
        errors = list()
        if i != len(network)-1:
            #
            # Hidden layer
            #
            # the error of neuron of hidden layer = weight * 後一個 layer 的 error
            for j in range(len(layer)):
                error = 0.0
                for neuron in network[i + 1]:
                    # neuron['delta] = back propagation error
                    # 對於目前的 layer 的這個 neuron (假設為 k) 的 backpropagation error
                    # 就是將 k 到下一個 layer 的每一個 neuron 的 weight 都乘上該 neuron(下一個 layer) 的 backpropagation error
                    # 累加起來之後再乘上 transfer_derivative(k_output)
                    error += (neuron['weights'][j] * neuron['delta'])
                errors.append(error)
        else:
            #
            # The final layer = output layer
            #
            # the backpropagation error of output layer = (Real_Y - Predict_Y) * transfer_derivative(Predict_Y)
            for j in range(len(layer)):
                neuron = layer[j]
                errors.append(expected[j] - neuron['output'])
        
        # 將每個 neuron 的 error 存在 "delta"
        for j in range(len(layer)):
            neuron = layer[j]
            neuron['delta'] = errors[j] * transfer_derivative(neuron['output'])


In [27]:
expected = [0, 1]
backward_propagate_error(network, expected)
for layer in network:
    print(layer)

[{'output': 0.7105668883115941, 'weights': [0.13436424411240122, 0.8474337369372327, 0.763774618976614], 'delta': -0.0005348048046610517}]
[{'output': 0.6213859615555266, 'weights': [0.2550690257394217, 0.49543508709194095], 'delta': -0.14619064683582808}, {'output': 0.6573693455986976, 'weights': [0.4494910647887381, 0.651592972722763], 'delta': 0.0771723774346327}]


## update_weights function

In [28]:
# Update network weights with error

'''
w = w + learning_rate * backpropagation_error * input
'''

def update_weights(network, row, l_rate):
    for i in range(len(network)):
        inputs = row
        if i != 0:
            # 前一個 layer 的 output 等於目前 layer 的 input
            inputs = [neuron['output'] for neuron in network[i - 1]]
        
        # update weight of all neuron of current layer
        for neuron in network[i]:
            # 目前的設定是 每個 neuron 的最後一個 wieght 是 bias
            for j in range(len(inputs) - 1):
                neuron['weights'][j] += l_rate * neuron['delta'] * inputs[j]
            neuron['weights'][-1] += l_rate * neuron['delta']


## train_network Fuction : Put it all together

In [29]:
# Train a network for a fixed number of epochs
def train_network(network, train, l_rate, n_epoch, n_outputs):
    for epoch in range(n_epoch):
        sum_error = 0
        # a complete forward_propagate, backward_propagate process
        for row in train:
            outputs = forward_propagate(network, row)
            # initialize an zero-value vector has same length with n_outputs
            # expected 用來存每個 layer
            expected = [0 for i in range(n_outputs)]
            # bias = 1
            expected[row[-1]] = 1
            sum_error += sum([(expected[i] - outputs[i])**2 for i in range(len(expected))])
            backward_propagate_error(network, expected)
            update_weights(network, row, l_rate)
        
        print(">epoch=%d, lrate=%.3f, error=%.3f" % (epoch, l_rate, sum_error))


## example for training network

In [37]:
# Test training backprop algorithm
seed(1)
dataset = [[2.7810836,2.550537003,0],
           [1.465489372,2.362125076,0],
           [3.396561688,4.400293529,0],
           [1.38807019,1.850220317,0],
           [3.06407232,3.005305973,0],
           [7.627531214,2.759262235,1],
           [5.332441248,2.088626775,1],
           [6.922596716,1.77106367,1],
           [8.675418651,-0.242068655,1],
           [7.673756466,3.508563011,1] 
          ]
# dataset = [x1, x2, y], 所以 input 的個數為 2
n_inputs = len(dataset[0]) - 1
# set() : 取得不重覆的 element
# row[-1] = the last element of row = y, y 只有 (0, 1)
n_outputs = len(set([row[-1] for row in dataset]))
print("n_outputs: {}".format(set([row[-1] for row in dataset])))
      
network = initialize_network(n_inputs, 2, n_outputs)
train_network(network, dataset, 0.5, 20, n_outputs)

for layer in network:
    print(layer)


n_outputs: set([0, 1])
>epoch=0, lrate=0.500, error=5.421
>epoch=1, lrate=0.500, error=5.222
>epoch=2, lrate=0.500, error=5.096
>epoch=3, lrate=0.500, error=4.813
>epoch=4, lrate=0.500, error=4.409
>epoch=5, lrate=0.500, error=4.095
>epoch=6, lrate=0.500, error=3.782
>epoch=7, lrate=0.500, error=3.478
>epoch=8, lrate=0.500, error=3.192
>epoch=9, lrate=0.500, error=2.926
>epoch=10, lrate=0.500, error=2.682
>epoch=11, lrate=0.500, error=2.460
>epoch=12, lrate=0.500, error=2.258
>epoch=13, lrate=0.500, error=2.076
>epoch=14, lrate=0.500, error=1.913
>epoch=15, lrate=0.500, error=1.766
>epoch=16, lrate=0.500, error=1.634
>epoch=17, lrate=0.500, error=1.516
>epoch=18, lrate=0.500, error=1.410
>epoch=19, lrate=0.500, error=1.315
[{'output': 0.025670375645295517, 'weights': [-1.482313569067226, 1.8308790073202204, 1.078381922048799], 'delta': -0.00654781981492048}, {'output': 0.9693210809965882, 'weights': [0.23244990332399884, 0.3621998343835864, 0.40289821191094327], 'delta': 0.000123078825

## predict function

In [39]:
# Make a prediction with a network
def predict(network, row):
    outputs = forward_propagate(network, row)
    return outputs.index(max(outputs))



## Example for prediction

In [40]:
for row in dataset:
	prediction = predict(network, row)
	print('Expected=%d, Got=%d' % (row[-1], prediction))

Expected=0, Got=0
Expected=0, Got=0
Expected=0, Got=0
Expected=0, Got=0
Expected=0, Got=0
Expected=1, Got=1
Expected=1, Got=1
Expected=1, Got=1
Expected=1, Got=1
Expected=1, Got=1
