# ANMOL GUPTA 20BCB0135
# Slot : L11+L12
# Q1 BackPropagation Neural Network from Scratch

In [1]:
# Initialize a network
def initialize_network(n_inputs, n_hidden, n_outputs):
    network = list()
    hidden_layer = [{'weights':[random() for i in range(n_inputs + 1)]} for i in range(n_hidden)]
    network.append(hidden_layer)
    output_layer = [{'weights':[random() for i in range(n_hidden + 1)]} for i in range(n_outputs)]
    network.append(output_layer)
    return network

In [2]:
# Calculate neuron activation for an input
def activate(weights, inputs):
    activation = weights[-1]
    for i in range(len(weights)-1):
        activation += weights[i] * inputs[i]
    return activation

In [13]:
# Transfer neuron activation
from math import exp
def transfer(activation):
    return 1.0 / (1.0 + exp(-activation))

In [4]:
# Forward propagate input to a network output
def forward_propagate(network, row):
    inputs = row
    for layer in network:
        new_inputs = []
        for neuron in layer:
            activation = activate(neuron['weights'], inputs)
            neuron['output'] = transfer(activation)
            new_inputs.append(neuron['output'])
        inputs = new_inputs
    return inputs

In [5]:
# Calculate the derivative of an neuron output
def transfer_derivative(output):
    return output * (1.0 - output)

In [6]:
# Backpropagate error and store in neurons
def backward_propagate_error(network, expected):
    for i in reversed(range(len(network))):
        layer = network[i]
        errors = list()
        if i != len(network)-1:
            for j in range(len(layer)):
                error = 0.0
                for neuron in network[i + 1]:
                    error += (neuron['weights'][j] * neuron['delta'])
                errors.append(error)
        else:
            for j in range(len(layer)):
                neuron = layer[j]
                errors.append(neuron['output'] - expected[j])
        for j in range(len(layer)):
            neuron = layer[j]
            neuron['delta'] = errors[j] * transfer_derivative(neuron['output'])

In [7]:
# Update network weights with error
def update_weights(network, row, l_rate):
    for i in range(len(network)):
        inputs = row[:-1]
        if i != 0:
            inputs = [neuron['output'] for neuron in network[i - 1]]
        for neuron in network[i]:
            for j in range(len(inputs)):
                neuron['weights'][j] -= l_rate * neuron['delta'] * inputs[j]
            neuron['weights'][-1] -= l_rate * neuron['delta']

In [8]:
# Train a network for a fixed number of epochs
def train_network(network, train, l_rate, n_epoch, n_outputs):
    for epoch in range(n_epoch):
        sum_error = 0
        for row in train:
            outputs = forward_propagate(network, row)
            expected = [0 for i in range(n_outputs)]
            expected[row[-1]] = 1
            sum_error += sum([(expected[i]-outputs[i])**2 for i in range(len(expected))])
            backward_propagate_error(network, expected)
            update_weights(network, row, l_rate)
            print('>epoch=%d, lrate=%.3f, error=%.3f' % (epoch, l_rate, sum_error))

In [14]:
# Test training backprop algorithm
from random import random
from random import seed
seed(1)
dataset = [[2.7810836,2.550537003,0],
    [1.465489372,2.362125076,0],
    [3.396561688,4.400293529,0],
    [1.38807019,1.850220317,0],
    [3.06407232,3.005305973,0],
    [7.627531214,2.759262235,1],
    [5.332441248,2.088626775,1],
    [6.922596716,1.77106367,1],
    [8.675418651,-0.242068655,1],
    [7.673756466,3.508563011,1]]
n_inputs = len(dataset[0]) - 1
n_outputs = len(set([row[-1] for row in dataset]))
network = initialize_network(n_inputs, 2, n_outputs)
train_network(network, dataset, 0.5, 20, n_outputs)
for layer in network:
    print(layer)

>epoch=0, lrate=0.500, error=0.502
>epoch=0, lrate=0.500, error=0.964
>epoch=0, lrate=0.500, error=1.379
>epoch=0, lrate=0.500, error=1.763
>epoch=0, lrate=0.500, error=2.105
>epoch=0, lrate=0.500, error=2.919
>epoch=0, lrate=0.500, error=3.643
>epoch=0, lrate=0.500, error=4.303
>epoch=0, lrate=0.500, error=4.893
>epoch=0, lrate=0.500, error=5.411
>epoch=1, lrate=0.500, error=0.552
>epoch=1, lrate=0.500, error=1.056
>epoch=1, lrate=0.500, error=1.521
>epoch=1, lrate=0.500, error=1.941
>epoch=1, lrate=0.500, error=2.327
>epoch=1, lrate=0.500, error=3.021
>epoch=1, lrate=0.500, error=3.629
>epoch=1, lrate=0.500, error=4.160
>epoch=1, lrate=0.500, error=4.621
>epoch=1, lrate=0.500, error=5.049
>epoch=2, lrate=0.500, error=0.569
>epoch=2, lrate=0.500, error=1.077
>epoch=2, lrate=0.500, error=1.568
>epoch=2, lrate=0.500, error=1.995
>epoch=2, lrate=0.500, error=2.405
>epoch=2, lrate=0.500, error=2.994
>epoch=2, lrate=0.500, error=3.544
>epoch=2, lrate=0.500, error=4.026
>epoch=2, lrate=0.50

In [15]:
# Make a prediction with a network
def predict(network, row):
    outputs = forward_propagate(network, row)
    return outputs.index(max(outputs))

In [17]:
# Taking weights from the output above
network = [[{'weights': [-0.9344296833915354, 5.415265006528539, 2.119276792401685]}, {'weights': [-0.5318170193096409, 1.0495810605392335, 0.5702868778548295]}],
    [{'weights': [2.1016548017199077, 1.3278343588003103, -0.7153299338834901]}, {'weights': [-1.8562634078543176, -0.1503175676074742, 0.6396233936354067]}]]
for row in dataset:
    prediction = predict(network, row)
    print('Expected=%d, Got=%d' % (row[-1], prediction))

Expected=0, Got=0
Expected=0, Got=0
Expected=0, Got=1
Expected=0, Got=0
Expected=0, Got=1
Expected=1, Got=1
Expected=1, Got=1
Expected=1, Got=1
Expected=1, Got=1
Expected=1, Got=1
