In [1]:
%matplotlib inline

from __future__ import absolute_import, print_function, unicode_literals, division
from sklearn.datasets import fetch_mldata
import matplotlib.pyplot as plt
import numpy as np
import pandas as pd
import itertools
import random as rand
import copy

In [2]:
def mat_dbg(x):
    """Debug helper: print the shape of ``x``, then ``x`` itself.

    ``x`` must expose a ``.shape`` attribute (e.g. a NumPy array).
    Returns None.
    """
    dims = x.shape
    print(dims, ": \n", x)

In [280]:
class MLP(object):
    """
    A layer of logistic-sigmoid units trained one data point at a time.

    NOTE: Matrix operations are modified from the RBM file.
    In particular, an input of n data points with dimension d is
    represented as a d-by-n matrix (one data point per column).

    Parameters
    ----------
    data : 2-D array, shape (d + 1, n)
        Row 0 holds the target value of every data point; the remaining
        d rows hold the features.
    num_hidden : int
        Number of sigmoid units, i.e. columns of the weight matrix.
    learn_rate : float
        Factor applied to every weight update.

    Raises
    ------
    ValueError
        If ``data`` is not two-dimensional.

    Notes
    -----
    Every unit outputs ``1 / (1 + exp(-x))``, which lies strictly between
    0 and 1, so a target outside that interval can never be matched exactly.
    """
    def __init__(self, data, num_hidden, learn_rate):
        data = np.asarray(data)
        if data.ndim != 2:
            raise ValueError(
                "data must be a 2-D array with targets in row 0 and one "
                "data point per column, got %d dimension(s)" % data.ndim)

        # First row are the target values
        self.targets = data[0]
        self.num_data = data.shape[1]
        self.num_visible = data.shape[0] - 1
        self.num_hidden = num_hidden
        self.learn_rate = learn_rate

        # Small random initial weights in [0, 0.1); the extra row is the
        # bias weight that pairs with the constant row added to the data.
        self.weights = np.random.rand(self.num_visible + 1, self.num_hidden)/10
        # Prepend a row of ones so the bias is learned like any other weight.
        self.data = np.insert(data[1:, :], 0, 1, axis=0)

    def _sigmoid(self, x):
        """Logistic sigmoid, applied element-wise."""
        return 1.0/(1.0+np.exp(-x))

    def _activated(self, mat):
        """
        Return the unit activations for the columns of ``mat``.

        ``mat`` has one (bias-augmented) data point per column; the result
        has one row per unit and one column per data point.
        """
        return self._sigmoid(np.dot(self.weights.T, mat))

    def _gradient(self, mat):
        """
        Element-wise ``a - a*a`` of ``mat``, i.e. the derivative of the
        logistic sigmoid expressed through its output ``a``.

        Returns a new array; ``mat`` itself is not modified.
        """
        mat = np.asarray(mat)
        return mat - mat * mat

    def _feed_forward(self):
        """
        Run one pass over all data points, updating the weights after each.

        For every data point x with target t, each unit k with output a_k
        gets the update ``learn_rate * (t - a_k) * (a_k - a_k**2) * x``
        added to its own weight column. The weights are printed once the
        pass is complete. Returns None.
        """
        for i in range(self.num_data):
            data_col = self.data[:, i].reshape(-1, 1)    # (num_visible+1, 1)

            guess = self._activated(data_col)            # (num_hidden, 1)
            error = self.targets[i] - guess
            # Per-unit step size; every unit uses its own error and slope
            # rather than sharing the values of unit 0.
            step = (error * self.learn_rate) * self._gradient(guess)

            # Broadcasting (num_visible+1, 1) * (1, num_hidden) forms the
            # outer product, giving one update column per unit.
            wt_change = data_col * step.T
            self.weights = wt_change + self.weights

        print("New weights: ",self.weights)

    def _prop_backward(self):
        """Placeholder: not implemented, always returns None."""
        return None

    def _calc_error(self, mat):
        """Placeholder: not implemented, always returns None."""
        return None


In [283]:
# See www.cse.unsw.edu.au/~cs9417ml/MLP2/
# Toy problem: a 3 x 5000 matrix whose entries are sign(1 - 2u) for u drawn
# uniformly from [0, 1). Row 0 is the row MLP reads as targets; it is
# overwritten with row 1, so each target equals the point's first feature.
uniform_draws = np.random.rand(3, 5000)
sample_data = np.sign(1 - 2 * uniform_draws)
sample_data[0] = sample_data[1]
# TODO: binary target values for the data still need to be written for the MLP.
mat_dbg(sample_data)
MLP_1 = MLP(sample_data, num_hidden=1, learn_rate=0.05)
print("Weights^T: \n", MLP_1.weights.T)
print("Targets: ")
print(MLP_1.targets)
print("Data: \n", MLP_1.data)

(3, 5000) : 
 [[-1.  1.  1. ...,  1.  1.  1.]
 [-1.  1.  1. ...,  1.  1.  1.]
 [ 1.  1. -1. ...,  1.  1.  1.]]
Weights^T: 
 [[ 0.06999576  0.03027737  0.04028881]]
Targets: 
[-1.  1.  1. ...,  1.  1.  1.]
Data: 
 [[ 1.  1.  1. ...,  1.  1.  1.]
 [-1.  1.  1. ...,  1.  1.  1.]
 [ 1.  1. -1. ...,  1.  1.  1.]]


In [284]:
# Five passes over the data; each call prints the weights after its pass.
NUM_PASSES = 5
for pass_idx in range(NUM_PASSES):
    MLP_1._feed_forward()

New weights:  [[-1.25291073]
 [ 4.22680395]
 [-0.00575931]]
New weights:  [[-1.40913934]
 [ 4.77291374]
 [-0.00583104]]
New weights:  [[-1.50271854]
 [ 5.08822824]
 [-0.00588181]]
New weights:  [[-1.56993042]
 [ 5.3105247 ]
 [-0.00592042]]
New weights:  [[-1.62247406]
 [ 5.48226948]
 [-0.00595104]]
