# S.I Adams - 3838305
# CSC311 - Back-Propagation Assignment
# Task 3

In [None]:
# Imports
import numpy as np 
      
# Training inputs: one example per row, one feature per column [X1, X2, X3].
X = np.array(
    [
        [0, 0, 1],
        [0, 1, 1],
        [1, 0, 1],
        [1, 1, 1],
    ],
    dtype=float,
)
# Expected output for each training example (one row per example).
y = np.array([[0], [1], [1], [0]], dtype=float)

# Class definition
class NN:
    """Small fully connected network with one hidden layer of 4 sigmoid units.

    The network maps ``x`` (one example per row) to a single sigmoid output
    per example and is trained with full-batch gradient steps on the squared
    error against ``y``.
    """

    def __init__(self, x, y):
        """Store the training data and draw random initial weights.

        x: 2-D array of inputs, one row per example.
        y: 2-D array of expected outputs, one row per example.
        """
        self.x = x
        self.w1 = np.random.rand(self.x.shape[1], 4)  # input -> hidden weights
        self.w2 = np.random.rand(4, 1)  # hidden -> output weights
        self.y = y
        self.output = np.zeros(y.shape)

    def sigmoid(self, z):
        """Return the logistic activation 1 / (1 + e^-z), element-wise."""
        return 1 / (1 + np.exp(-z))

    def sigmoid_derivative(self, z):
        """Return the sigmoid slope given ``z`` = an already-activated value.

        Note that ``z`` is the sigmoid *output*, not the pre-activation, which
        is why the derivative reduces to ``z * (1 - z)``.
        """
        return z * (1 - z)

    def feedforward(self):
        """Propagate ``self.x`` through both layers and return the prediction.

        The activations are kept in ``self.layer1`` and ``self.layer2`` because
        ``backprop`` needs the hidden activations.
        """
        # The helpers are methods, so they must be reached through ``self``.
        self.layer1 = self.sigmoid(np.dot(self.x, self.w1))
        self.layer2 = self.sigmoid(np.dot(self.layer1, self.w2))
        return self.layer2

    def back_propagate_error(self):
        """Return the mean squared error of a fresh forward pass.

        Uses the targets stored on the instance rather than a module-level
        ``y`` so the class does not depend on global state.
        """
        return np.mean(np.square(self.y - self.feedforward()))

    def backprop(self):
        """Update both weight matrices from the last forward pass.

        Expects ``self.output`` and ``self.layer1`` to hold the results of the
        most recent ``feedforward`` call (``train`` takes care of that).
        """
        # Error signal at the output layer (factor 2 from the squared error).
        output_delta = 2 * (self.y - self.output) * self.sigmoid_derivative(self.output)
        # Error signal pushed back to the hidden layer; computed with the
        # current w2, i.e. before w2 itself is updated below.
        hidden_delta = np.dot(output_delta, np.transpose(self.w2)) * self.sigmoid_derivative(self.layer1)
        self.w1 += np.dot(np.transpose(self.x), hidden_delta)
        self.w2 += np.dot(np.transpose(self.layer1), output_delta)

    def train(self, X, y):
        """Run one training iteration (forward pass, then weight update).

        X, y: training inputs and targets. They replace the data stored on the
        instance; passing ``None`` for either keeps the stored value.
        """
        if X is not None:
            self.x = X
        if y is not None:
            self.y = y
        self.output = self.feedforward()
        self.backprop()

# Build the network and run 1000 training iterations, reporting the current
# prediction and error before every 100th weight update.
NN1 = NN(X, y)
for i in range(1000):
    if not i % 100:
        print("Actual Output: \n", str(y))
        print("Predicted Output: \n", str(NN1.feedforward()))
        print("Error value: \n", str(NN1.back_propagate_error()))
        print("\n")

    NN1.train(X, y)


#--------------------------------------------------------------------------------------------------------------------------------------------
# Weights:
# Neural network training is about finding the weights that minimize prediction error. Training usually starts from a set of randomly generated weights.
# The weights associated with neuron connections must be updated after each forward pass of data through the network.
# The error represents the difference between the actual (expected) output and the predicted output.
# This error is needed at each neuron to make weight adjustments, so once it has been calculated it is propagated backward through the network.
# It is then used to update the weights in an attempt to correctly map arbitrary inputs to outputs.
# Gradient descent is used to determine optimal weights more efficiently by acting as a guide when searching for the cost function's optimal value.
# Stochastic gradient descent samples the data randomly and uses a single selected example for each error backpropagation (and weight update).
# Weight = weight + learning rate * error * input
# Here "error" is the neuron's delta, i.e. the change signal needed for the weight update.

# Update network weights with error
# takes in 3 args, network, row and learning rate
def update_weights(network, row, l_rate):
	"""Adjust every neuron's weights in place using its stored delta.

	network: list of layers, each a list of neuron dicts holding 'weights'
		(bias last), 'delta' and 'output'.
	row: training row; its last element is excluded from the inputs.
	l_rate: learning rate that scales each update.
	"""
	for layer_index, layer in enumerate(network):
		if layer_index == 0:
			# The first layer is fed by the row itself, minus its last column.
			inputs = row[:-1]
		else:
			# Later layers are fed by the previous layer's outputs.
			inputs = [neuron['output'] for neuron in network[layer_index - 1]]
		for neuron in layer:
			step = l_rate * neuron['delta']
			weights = neuron['weights']
			for j, value in enumerate(inputs):
				weights[j] += step * value
			# The final weight is the bias, whose input is implicitly 1.
			weights[-1] += step

In [None]:
#!usr/bin/python3
import random
from sklearn.cluster import KMeans as kmeans
import numpy as np
import matplotlib.pyplot as plot

# Number of rows written to data.txt.
DATAPOINTS = 20
studentno = int(input('Please enter your student number: ')) # my student number is 3838305

# Each feature column is drawn from a generator re-seeded with a different
# number of trailing digits of the student number.
feature_columns = []
for modulus in (10000, 1000, 100, 10, 100000):
    random.seed(studentno % modulus)
    feature_columns.append([random.randint(0, studentno) for _ in range(DATAPOINTS)])
col1, col2, col3, col4, col5 = feature_columns

# Class label column: cycles through 0, 1, 2.
col6 = [i % 3 for i in range(0, DATAPOINTS)]

# Write one comma-separated row per data point; the context manager closes the
# file even if a write fails.
with open('data.txt', mode='w') as sdata:
    for values in zip(col1, col2, col3, col4, col5, col6):
        print(", ".join(str(value) for value in values), file=sdata)

# Task 4

In [19]:
# Backprop on the Seeds Dataset
from random import seed
from random import randrange
from random import random
from csv import reader
from math import exp

# Load a CSV file
def load_csv(filename):
	"""Read a CSV file and return its rows as lists of strings.

	Rows that the CSV reader yields as empty (e.g. blank lines) are skipped.
	"""
	with open(filename, 'r') as handle:
		return [record for record in reader(handle) if record]

# Convert string column to float
def str_column_to_float(dataset, column):
	"""Replace, in place, the string at ``column`` of every row with a float.

	Surrounding whitespace is stripped before conversion.
	"""
	for record in dataset:
		text = record[column]
		record[column] = float(text.strip())

# Convert string column to integer
def str_column_to_int(dataset, column):
	"""Encode the class values in ``column`` as integers, in place.

	Ids are assigned in order of first appearance in the dataset, so the
	mapping is the same on every run (iterating a set of strings is not).

	Returns the lookup dict mapping each original value to its integer id.
	"""
	lookup = dict()
	for row in dataset:
		# len(lookup) is evaluated before insertion, giving ids 0, 1, 2, ...
		lookup.setdefault(row[column], len(lookup))
	for row in dataset:
		row[column] = lookup[row[column]]
	return lookup

# Find the min and max values for each column
def dataset_minmax(dataset):
	"""Return ``[min, max]`` for every column of ``dataset``.

	The result has one two-element list per column, in column order; an empty
	dataset yields an empty list.
	"""
	# zip(*dataset) transposes the rows into columns.
	return [[min(column), max(column)] for column in zip(*dataset)]

# Rescale dataset columns to the range 0-1
def normalize_dataset(dataset, minmax):
	"""Rescale, in place, every column except the last to the range 0-1.

	dataset: list of rows; the last element of each row is left untouched.
	minmax: per-column ``[min, max]`` pairs, indexed like the row columns.

	A column whose min and max are equal carries no information and would
	divide by zero, so its values are set to 0.0.
	"""
	for row in dataset:
		for i in range(len(row)-1):
			low = minmax[i][0]
			span = minmax[i][1] - low
			row[i] = (row[i] - low) / span if span else 0.0

# Split a dataset into k folds
def cross_validation_split(dataset, n_folds):
	"""Randomly partition ``dataset`` into ``n_folds`` equally sized folds.

	Rows are drawn without replacement from a copy, so ``dataset`` itself is
	not modified. Each fold holds ``int(len(dataset) / n_folds)`` rows; any
	leftover rows are not assigned to a fold.
	"""
	pool = list(dataset)
	fold_size = int(len(dataset) / n_folds)
	folds = []
	for _ in range(n_folds):
		# Pop a random remaining row until this fold is full.
		folds.append([pool.pop(randrange(len(pool))) for _ in range(fold_size)])
	return folds

# Calculate accuracy percentage
def accuracy_metric(actual, predicted):
	"""Return the percentage of positions where ``predicted`` equals ``actual``."""
	total = len(actual)
	hits = sum(1 for i in range(total) if actual[i] == predicted[i])
	return hits / float(total) * 100.0

# Evaluate an algorithm using a cross validation split
def evaluate_algorithm(dataset, algorithm, n_folds, *args):
	"""Score ``algorithm`` with k-fold cross validation.

	Each fold is held out once as the test set while the remaining folds are
	merged into the training set. ``algorithm(train_set, test_set, *args)``
	must return one prediction per test row.

	Returns a list with the accuracy percentage of every fold.
	"""
	folds = cross_validation_split(dataset, n_folds)
	scores = []
	for held_out in folds:
		others = list(folds)
		others.remove(held_out)
		train_set = [row for fold in others for row in fold]
		test_set = []
		for row in held_out:
			# Copy the row and blank its label so the algorithm cannot see it.
			masked = list(row)
			masked[-1] = None
			test_set.append(masked)
		predicted = algorithm(train_set, test_set, *args)
		actual = [row[-1] for row in held_out]
		scores.append(accuracy_metric(actual, predicted))
	return scores

# Calculate neuron activation for an input
def activate(weights, inputs):
	"""Return the weighted sum of ``inputs`` plus the bias.

	The last entry of ``weights`` is the bias; every other weight is paired
	with the input at the same index. Extra inputs are ignored.
	"""
	total = weights[-1]
	for index, weight in enumerate(weights[:-1]):
		total += weight * inputs[index]
	return total

# Transfer neuron activation
def transfer(activation):
	"""Return the sigmoid of ``activation``, i.e. 1 / (1 + e^-activation).

	Very negative activations make ``exp(-activation)`` exceed the float
	range; in that case the sigmoid's limit, 0.0, is returned instead of
	letting OverflowError escape.
	"""
	try:
		return 1.0 / (1.0 + exp(-activation))
	except OverflowError:
		return 0.0

# Forward propagate input to a network output
def forward_propagate(network, row):
	"""Feed ``row`` through every layer and return the last layer's outputs.

	Each neuron's result is also stored under its 'output' key, where the
	backpropagation step reads it.
	"""
	signal = row
	for layer in network:
		layer_outputs = []
		for neuron in layer:
			neuron['output'] = transfer(activate(neuron['weights'], signal))
			layer_outputs.append(neuron['output'])
		# This layer's outputs are the next layer's inputs.
		signal = layer_outputs
	return signal

# Calculate the derivative of an neuron output
def transfer_derivative(output):
	"""Return the sigmoid slope given a neuron's (already activated) output."""
	return (1.0 - output) * output

# Backpropagate error and store in neurons
def backward_propagate_error(network, expected):
	"""Compute and store the 'delta' of every neuron, last layer first.

	network: list of layers whose neurons already hold an 'output' value.
	expected: target value for each neuron of the last layer.
	"""
	last = len(network) - 1
	for i in range(last, -1, -1):
		layer = network[i]
		if i == last:
			# Output layer: error is the gap between target and output.
			errors = [expected[j] - neuron['output'] for j, neuron in enumerate(layer)]
		else:
			# Hidden layer: error is the delta of each downstream neuron,
			# weighted by the connection from neuron j to it.
			downstream = network[i + 1]
			errors = []
			for j in range(len(layer)):
				error = 0.0
				for neuron in downstream:
					error += neuron['weights'][j] * neuron['delta']
				errors.append(error)
		for j, neuron in enumerate(layer):
			neuron['delta'] = errors[j] * transfer_derivative(neuron['output'])

# Update network weights with error
# takes in 3 args, network, row and learning rate
def update_weights(network, row, l_rate):
	"""Apply one weight update to every neuron, in place.

	Each weight moves by ``l_rate * delta * input``; the bias (last weight)
	moves by ``l_rate * delta``.

	network: list of layers of neuron dicts with 'weights', 'delta', 'output'.
	row: training row whose last element is not used as an input.
	l_rate: learning rate.
	"""
	for depth, layer in enumerate(network):
		if depth == 0:
			# Inputs to the first layer: every value of the row but the last.
			inputs = row[:-1]
		else:
			# Inputs to deeper layers: outputs of the layer before.
			inputs = [neuron['output'] for neuron in network[depth - 1]]
		for neuron in layer:
			scaled_delta = l_rate * neuron['delta']
			weights = neuron['weights']
			for j, signal in enumerate(inputs):
				weights[j] += scaled_delta * signal
			weights[-1] += scaled_delta

# Train a network for a fixed number of epochs
def train_network(network, train, l_rate, n_epoch, n_outputs):
	"""Train ``network`` in place for ``n_epoch`` passes over ``train``.

	The weights are updated after every single row. The last element of each
	row is used as the index of the output neuron whose target is 1.
	"""
	for _ in range(n_epoch):
		for row in train:
			# Called for its side effect: it stores each neuron's 'output'.
			forward_propagate(network, row)
			# One-hot target vector for this row's class.
			expected = [0] * n_outputs
			expected[row[-1]] = 1
			backward_propagate_error(network, expected)
			update_weights(network, row, l_rate)

# Initialize a network
def initialize_network(n_inputs, n_hidden, n_outputs):
	"""Build a network with one hidden layer and one output layer.

	Every neuron is a dict with a 'weights' list of random values: one weight
	per incoming connection plus one extra for the bias.
	"""
	def make_layer(n_neurons, n_weights):
		return [{'weights': [random() for _ in range(n_weights)]} for _ in range(n_neurons)]

	# The hidden layer is drawn first, then the output layer.
	hidden_layer = make_layer(n_hidden, n_inputs + 1)
	output_layer = make_layer(n_outputs, n_hidden + 1)
	return [hidden_layer, output_layer]

# Make a prediction with a network
def predict(network, row):
	"""Return the index of the output neuron with the largest activation."""
	outputs = forward_propagate(network, row)
	strongest = max(outputs)
	return outputs.index(strongest)

# Backpropagation Algorithm With Stochastic Gradient Descent
def back_propagation(train, test, l_rate, n_epoch, n_hidden):
	"""Train a fresh network on ``train`` and return predictions for ``test``.

	The input count is the row length minus one, and the output count is the
	number of distinct last-column values found in ``train``.
	"""
	n_inputs = len(train[0]) - 1
	n_outputs = len({row[-1] for row in train})
	network = initialize_network(n_inputs, n_hidden, n_outputs)
	train_network(network, train, l_rate, n_epoch, n_outputs)
	return [predict(network, row) for row in test]

# Test Backprop on Seeds dataset
# Fixed seed so the fold split and initial weights are reproducible.
seed(1)
# load and prepare data
filename = 'data.txt'
dataset = load_csv(filename)
# every column except the last holds a numeric feature
for i in range(len(dataset[0])-1):
	str_column_to_float(dataset, i)
# convert class column to integers
str_column_to_int(dataset, len(dataset[0])-1)
# normalize input variables
minmax = dataset_minmax(dataset)
normalize_dataset(dataset, minmax)
# evaluate algorithm
n_folds = 5
l_rate = 0.3
n_epoch = 500
n_hidden = 5
scores = evaluate_algorithm(dataset, back_propagation, n_folds, l_rate, n_epoch, n_hidden)
# The context manager closes the scores file even if the write fails.
with open('back-prop-scores.txt', mode = 'w') as sdata:
	print('Scores: %s' % scores, file =sdata)
print('Scores: %s' % scores)
print('Mean Accuracy: %.3f%%' % (sum(scores)/float(len(scores))))

Scores: [25.0, 0.0, 25.0, 25.0, 50.0]
Mean Accuracy: 25.000%
