In [39]:
# Imports

import random
import numpy as np
from sklearn.datasets import load_iris
import pandas as pd
import sklearn.model_selection
from sklearn.preprocessing import StandardScaler

In [2]:
# Declare constants: network architecture passed to MLP(...) below

NUM_INPUT_NODES = 4    # one input node per feature column of the Iris data
NUM_OUTPUT_NODES = 3   # one output node per class label (0, 1, 2)
NUM_HIDDEN_NODES = 10  # nodes in each hidden layer
NUM_HIDDEN_LAYERS = 1  # number of hidden layers between input and output

In [3]:
class Node:
    """One unit of the network.

    Stores the ``weight`` and ``bias`` it was constructed with, plus an
    ``activation`` value that starts at 0 and is overwritten during a
    forward pass.
    """
    def __init__(self, weight, bias):
        self.weight, self.bias = weight, bias
        # No input has been propagated yet.
        self.activation = 0

In [50]:
def relu(x):
    """Rectified linear unit: element-wise ``max(0, x)``.

    Accepts a scalar or anything numpy can broadcast against 0.
    """
    floor = 0
    rectified = np.maximum(floor, x)
    return rectified

In [51]:
def softmax(logits):
    """Turn logits into values that sum to 1 along axis 0.

    The global maximum of ``logits`` is subtracted before exponentiating so
    that ``np.exp`` does not overflow on large inputs; the shift cancels out
    in the ratio.
    """
    shifted = logits - np.max(logits)
    numerators = np.exp(shifted)
    denominator = np.sum(numerators, axis=0)
    return numerators / denominator

In [64]:
class MLP:
    """A minimal multilayer perceptron built from ``Node`` objects.

    ``self.nodes`` is a list of layers, each a list of ``Node``:
    index 0 is the input layer, the last entry is the output layer, and
    everything in between is a hidden layer.

    Note: every node carries a single weight that is applied to *all* of its
    incoming activations, so a node's pre-activation is
    ``weight * sum(previous layer activations) + bias``.
    """

    def __init__(self, n_in, n_out, n_hidden, hidden_layers):
        """Build the network.

        Args:
            n_in: number of input nodes.
            n_out: number of output nodes.
            n_hidden: number of nodes in each hidden layer.
            hidden_layers: number of hidden layers.
        """
        self.n_hidden_layers = hidden_layers
        self.nodes = []
        self.create(n_in, n_out, n_hidden, hidden_layers)

    @staticmethod
    def _random_layer(size):
        """Return ``size`` nodes with weight and bias each drawn from U(0, 0.01)."""
        return [
            Node(random.uniform(0.0, 0.01), random.uniform(0.0, 0.01))
            for _ in range(size)
        ]

    def create(self, n_in, n_out, n_hidden, hidden_layers):
        """(Re)build ``self.nodes`` from scratch.

        Input nodes get weight 0 and bias 0 (they only hold the input values);
        hidden and output nodes are randomly initialised.
        """
        layers = [[Node(0, 0) for _ in range(n_in)]]
        layers.extend(self._random_layer(n_hidden) for _ in range(hidden_layers))
        layers.append(self._random_layer(n_out))
        # Keep the layer count in sync if create() is called again directly.
        self.n_hidden_layers = hidden_layers
        self.nodes = layers

    def forward_pass(self, X_row):
        """Propagate one sample through the network.

        Input activations are set from ``X_row``, hidden layers use ReLU, and
        the output layer applies softmax across all output nodes. Every
        node's ``activation`` is updated in place.

        Args:
            X_row: sequence of input values, one per input node.

        Returns:
            numpy array with one softmax probability per output node.

        Raises:
            ValueError: if ``X_row`` does not have one value per input node.
        """
        input_layer = self.nodes[0]
        if len(X_row) != len(input_layer):
            raise ValueError(
                "expected %d input values, got %d" % (len(input_layer), len(X_row))
            )
        for node, value in zip(input_layer, X_row):
            node.activation = value

        # Walk every hidden layer. Slicing the layer list (rather than
        # range(1, n_hidden_layers)) guarantees the last hidden layer is
        # evaluated too.
        previous = input_layer
        for layer in self.nodes[1:-1]:
            # A node's single weight multiplies every incoming activation, so
            # the sum over the previous layer is shared by the whole layer.
            incoming = sum(node.activation for node in previous)
            for node in layer:
                node.activation = relu(node.weight * incoming + node.bias)
            previous = layer

        # Softmax must see all output logits at once; applied to a single
        # scalar it always returns 1.0.
        output_layer = self.nodes[-1]
        incoming = sum(node.activation for node in previous)
        logits = np.array(
            [node.weight * incoming + node.bias for node in output_layer]
        )
        probabilities = softmax(logits)
        for node, probability in zip(output_layer, probabilities):
            node.activation = probability
        return probabilities

In [65]:
# Create MLP

# Seed the stdlib RNG that draws the initial weights and biases so the network
# is identical on every Restart & Run All.
random.seed(42)
mlp = MLP(NUM_INPUT_NODES, NUM_OUTPUT_NODES, NUM_HIDDEN_NODES, NUM_HIDDEN_LAYERS)

In [66]:
# Load the Iris dataset bundled with scikit-learn (features in .data, labels in .target)
iris = load_iris()

In [67]:
iris

{'data': array([[5.1, 3.5, 1.4, 0.2],
        [4.9, 3. , 1.4, 0.2],
        [4.7, 3.2, 1.3, 0.2],
        [4.6, 3.1, 1.5, 0.2],
        [5. , 3.6, 1.4, 0.2],
        [5.4, 3.9, 1.7, 0.4],
        [4.6, 3.4, 1.4, 0.3],
        [5. , 3.4, 1.5, 0.2],
        [4.4, 2.9, 1.4, 0.2],
        [4.9, 3.1, 1.5, 0.1],
        [5.4, 3.7, 1.5, 0.2],
        [4.8, 3.4, 1.6, 0.2],
        [4.8, 3. , 1.4, 0.1],
        [4.3, 3. , 1.1, 0.1],
        [5.8, 4. , 1.2, 0.2],
        [5.7, 4.4, 1.5, 0.4],
        [5.4, 3.9, 1.3, 0.4],
        [5.1, 3.5, 1.4, 0.3],
        [5.7, 3.8, 1.7, 0.3],
        [5.1, 3.8, 1.5, 0.3],
        [5.4, 3.4, 1.7, 0.2],
        [5.1, 3.7, 1.5, 0.4],
        [4.6, 3.6, 1. , 0.2],
        [5.1, 3.3, 1.7, 0.5],
        [4.8, 3.4, 1.9, 0.2],
        [5. , 3. , 1.6, 0.2],
        [5. , 3.4, 1.6, 0.4],
        [5.2, 3.5, 1.5, 0.2],
        [5.2, 3.4, 1.4, 0.2],
        [4.7, 3.2, 1.6, 0.2],
        [4.8, 3.1, 1.6, 0.2],
        [5.4, 3.4, 1.5, 0.4],
        [5.2, 4.1, 1.5, 0.1],
  

In [68]:
X = iris.data

# Normalize the data: standardize each feature column with StandardScaler.
# NOTE(review): the scaler is fit on the full dataset before the train/test
# split further down, so test-set statistics leak into the training features.
# Consider splitting first and fitting the scaler on the training rows only.

scaler = StandardScaler()
X = scaler.fit_transform(X)

In [69]:
# Integer class labels (0, 1, 2), one per row of X
y = iris.target

In [70]:
X

array([[-9.00681170e-01,  1.01900435e+00, -1.34022653e+00,
        -1.31544430e+00],
       [-1.14301691e+00, -1.31979479e-01, -1.34022653e+00,
        -1.31544430e+00],
       [-1.38535265e+00,  3.28414053e-01, -1.39706395e+00,
        -1.31544430e+00],
       [-1.50652052e+00,  9.82172869e-02, -1.28338910e+00,
        -1.31544430e+00],
       [-1.02184904e+00,  1.24920112e+00, -1.34022653e+00,
        -1.31544430e+00],
       [-5.37177559e-01,  1.93979142e+00, -1.16971425e+00,
        -1.05217993e+00],
       [-1.50652052e+00,  7.88807586e-01, -1.34022653e+00,
        -1.18381211e+00],
       [-1.02184904e+00,  7.88807586e-01, -1.28338910e+00,
        -1.31544430e+00],
       [-1.74885626e+00, -3.62176246e-01, -1.34022653e+00,
        -1.31544430e+00],
       [-1.14301691e+00,  9.82172869e-02, -1.28338910e+00,
        -1.44707648e+00],
       [-5.37177559e-01,  1.47939788e+00, -1.28338910e+00,
        -1.31544430e+00],
       [-1.26418478e+00,  7.88807586e-01, -1.22655167e+00,
      

In [71]:
y

array([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
       0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
       0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
       1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
       1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
       2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
       2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2])

In [72]:
# Hold out roughly a third of the 150 samples for testing. scikit-learn rounds
# the test count up (ceil(0.33 * 150) = 50), so the resulting 100 / 50 split is
# expected. random_state pins the shuffle so the split is reproducible.
X_train, X_test, y_train, y_test = sklearn.model_selection.train_test_split(
    X, y, test_size=0.33, random_state=42
)

In [73]:
X_train.shape

(100, 4)

In [74]:
X_test.shape

(50, 4)

In [75]:
mlp.forward_pass(X_train[0])

In [76]:
mlp.nodes

[[<__main__.Node at 0x208ea10c8d0>,
  <__main__.Node at 0x208e9ed1ad0>,
  <__main__.Node at 0x208e9ed2590>,
  <__main__.Node at 0x208e9ed3050>],
 [<__main__.Node at 0x208e7568bd0>,
  <__main__.Node at 0x208e966db50>,
  <__main__.Node at 0x208e8b32f90>,
  <__main__.Node at 0x208e8b33390>,
  <__main__.Node at 0x208e8b31110>,
  <__main__.Node at 0x208e8b32590>,
  <__main__.Node at 0x208e8b31b10>,
  <__main__.Node at 0x208e8b32f50>,
  <__main__.Node at 0x208e8b33150>,
  <__main__.Node at 0x208e8b32090>],
 [<__main__.Node at 0x208e8b32e10>,
  <__main__.Node at 0x208e8b30d50>,
  <__main__.Node at 0x208e9f64a50>]]

In [49]:
X_train[0]

array([-1.38535265,  0.32841405, -1.22655167, -1.3154443 ])

# Next Steps

* One-hot encode the targets
* Implement an error (loss) function
* Use that error function to implement backpropagation