# DOST Summer School

A Python implementation of the Backpropagation algorithm is given below. This implementation is not optimized and therefore not very efficient. But it was coded in order to be easily understood by the reader.

Use the Boolean OR, AND and XOR dataset as the input. 

Run the program by testing the three different boolean functions.

In [31]:
from math import exp
from random import seed
from random import random

# Initialize a network
def initialize_network(n_inputs, n_hidden, n_outputs):
	network = list()
	hidden_layer = [{'weights':[random() for i in range(n_inputs + 1)]} for i in range(n_hidden)]
	network.append(hidden_layer)
	output_layer = [{'weights':[random() for i in range(n_hidden + 1)]} for i in range(n_outputs)]
	network.append(output_layer)
	return network

# Calculate neuron activation for an input
def activate(weights, inputs):
	activation = weights[-1]
	for i in range(len(weights)-1):
		activation += weights[i] * inputs[i]
	return activation

# Transfer neuron activation
def transfer(activation):
	return 1.0 / (1.0 + exp(-activation))

# Forward propagate input to a network output
def forward_propagate(network, row):
	inputs = row
	for layer in network:
		new_inputs = []
		for neuron in layer:
			activation = activate(neuron['weights'], inputs)
			neuron['output'] = transfer(activation)
			new_inputs.append(neuron['output'])
		inputs = new_inputs
	return inputs

# Calculate the derivative of an neuron output
def transfer_derivative(output):
	return output * (1.0 - output)

# Backpropagate error and store in neurons
def backward_propagate_error(network, expected):
	for i in reversed(range(len(network))):
		layer = network[i]
		errors = list()
		if i != len(network)-1:
			for j in range(len(layer)):
				error = 0.0
				for neuron in network[i + 1]:
					error += (neuron['weights'][j] * neuron['delta'])
				errors.append(error)
		else:
			for j in range(len(layer)):
				neuron = layer[j]
				errors.append(expected[j] - neuron['output'])
		for j in range(len(layer)):
			neuron = layer[j]
			neuron['delta'] = errors[j] * transfer_derivative(neuron['output'])

# Update network weights with error
def update_weights(network, row, l_rate):
	for i in range(len(network)):
		inputs = row[:-1]
		if i != 0:
			inputs = [neuron['output'] for neuron in network[i - 1]]
		for neuron in network[i]:
			for j in range(len(inputs)):
				neuron['weights'][j] += l_rate * neuron['delta'] * inputs[j]
			neuron['weights'][-1] += l_rate * neuron['delta']

# Train a network for a fixed number of epochs
def train_network(network, train, l_rate, n_epoch, n_outputs):
	for epoch in range(n_epoch):
		sum_error = 0
		for row in train:
			outputs = forward_propagate(network, row)
			expected = [0 for i in range(n_outputs)]
			expected[row[-1]] = 1
			sum_error += sum([(expected[i]-outputs[i])**2 for i in range(len(expected))])
			backward_propagate_error(network, expected)
			update_weights(network, row, l_rate)
		print('>epoch=%d, lrate=%.3f, error=%.3f' % (epoch, l_rate, sum_error))

# Taining backprop algorithm
seed(1)

# OR dataset
#dataset = [[0,0,0],[0,1,1],[1,0,1],[1,1,0]]

# AND dataset
dataset = [[0,0,0],[0,1,0],[1,0,0],[1,1,1]]

# XOR dataset
dataset = [[0,0,0],[0,1,0],[1,0,0],[1,1,1]]


n_inputs = len(dataset[0]) - 1
n_outputs = len(set([row[-1] for row in dataset]))
network = initialize_network(n_inputs, 2, n_outputs)
train_network(network, dataset, 0.2, 10, n_outputs)

for layer in network:
    for ctr in range(0,(len(layer))):
        if(ctr==0):
            print("[[{'weights': ",layer[ctr]['weights'],"},")
        elif(ctr < (len(layer)-1)):
            print("{'weights': ",layer[ctr]['weights'],"},")
        else:
            print("{'weights': ",layer[ctr]['weights'],"}]]")

	#print(layer)

>epoch=0, lrate=0.200, error=2.447
>epoch=1, lrate=0.200, error=2.335
>epoch=2, lrate=0.200, error=2.227
>epoch=3, lrate=0.200, error=2.127
>epoch=4, lrate=0.200, error=2.038
>epoch=5, lrate=0.200, error=1.960
>epoch=6, lrate=0.200, error=1.895
>epoch=7, lrate=0.200, error=1.840
>epoch=8, lrate=0.200, error=1.795
>epoch=9, lrate=0.200, error=1.758
[[{'weights':  [0.12965772334007, 0.8328291113135146, 0.7992416732718532] },
{'weights':  [0.21663295302524663, 0.4554170305160552, 0.3654547561932233] }]]
[[{'weights':  [0.6316266616949571, 0.7709016231914724, 0.1081355435556114] },
{'weights':  [-0.40168941745294573, 0.4581583685980768, -0.1758807206839592] }]]


Below is the code for testing. Just copy the output weights and assign it to network.

In [32]:
from math import exp

# Calculate neuron activation for an input
def activate(weights, inputs):
	activation = weights[-1]
	for i in range(len(weights)-1):
		activation += weights[i] * inputs[i]
	return activation

# Transfer neuron activation
def transfer(activation):
	return 1.0 / (1.0 + exp(-activation))

# Forward propagate input to a network output
def forward_propagate(network, row):
	inputs = row
	for layer in network:
		new_inputs = []
		for neuron in layer:
			activation = activate(neuron['weights'], inputs)
			neuron['output'] = transfer(activation)
			new_inputs.append(neuron['output'])
		inputs = new_inputs
	return inputs

# Make a prediction with a network
def predict(network, row):
	outputs = forward_propagate(network, row)
	return outputs.index(max(outputs))

# Test making predictions with the network
# AND dataset
dataset = [[0,0,0],[0,1,0],[1,0,0],[1,1,1]]


# Assign to network the output weights from the training program: 
network=[[{'weights':  [0.12965772334007, 0.8328291113135146, 0.7992416732718532] },
{'weights':  [0.21663295302524663, 0.4554170305160552, 0.3654547561932233] }]]
[[{'weights':  [0.6316266616949571, 0.7709016231914724, 0.1081355435556114] },
{'weights':  [-0.40168941745294573, 0.4581583685980768, -0.1758807206839592] }]]
ghts': [-7.740341833598472, -1.2763941018119498, 3.60478086932667]}]]
  
for row in dataset:
	prediction = predict(network, row)
	print('Expected=%d, Got=%d' % (row[-1], prediction))

SyntaxError: EOL while scanning string literal (<ipython-input-32-d15a6914321f>, line 41)

# Challenge: Animals Dataset
Now use the "animals.csv" as a dataset. Perform necessary preprocessing of the dataset. Divide the dataset for training and testing. You have to tweak the parameters of the algorithm such as the number of neurons in the hidden layer, learning rate and the number of epochs to run in order to get the accuracy as high as possible.

# Result: 100% accuracy

In [75]:
import pandas as pd
from sklearn.neural_network import MLPClassifier
from sklearn.model_selection import train_test_split
from sklearn.metrics import classification_report
from sklearn import metrics

SEED = 0

animals = pd.read_csv('animals.csv')
y = animals['class']
X = animals.drop('class', 1)
X.drop('sample', 1, inplace=True)

X_train, X_test, y_train, y_test = train_test_split(X, y, random_state=SEED)

best_combo = 0
best_accuracy = 0
best_clf = None

LAYER_SIZE_TESTS = []
MAX = 20

for x in range(1, MAX):
    for y in range(1, MAX):
        LAYER_SIZE_TESTS.append((y, x))

for x, y in LAYER_SIZE_TESTS:
    clf = MLPClassifier(solver='lbfgs', alpha=1e-5, hidden_layer_sizes=(x, y), random_state=SEED)
    clf.fit(X_train, y_train)
    y_pred_class = clf.predict(X_test)
    acc = metrics.accuracy_score(y_test, y_pred_class)
    
    if acc > best_accuracy:
        best_accuracy = acc
        best_combo = ((x, y), acc)
        best_clf = clf
        
print('Hidden layer size of {0} gives an accuracy of {1}!'.format(*best_combo))

Hidden layer size of (8, 14) gives an accuracy of 1.0!


In [57]:
best_combo[2]

1.0