In [14]:
import numpy as np

def tanh(x):
    return np.tanh(x)

def tanh_deriv(x):
    return 1.0 - np.tanh(x)**2

def logistic(x):
    return 1/(1 + np.exp(-x))

def logistic_derivative(x):
    return logistic(x)*(1-logistic(x))

class NeuralNetwork:
    def __init__(self, layers, activation='tanh'):
        """
        :param layers: A list containing the number of units in each layer.
        Should be at least two values
        :param activation: The activation function to be used. Can be
        "logistic" or "tanh"
        """
        if activation == 'logistic':
            self.activation = logistic
            self.activation_deriv = logistic_derivative
        elif activation == 'tanh':
            self.activation = tanh
            self.activation_deriv = tanh_deriv

        self.weights = []
        for i in range(1, len(layers) - 1):
            self.weights.append((2*np.random.random((layers[i - 1] + 1, layers[i]
                                + 1))-1)*0.25)
        self.weights.append((2*np.random.random((layers[i] + 1, layers[i +
                            1]))-1)*0.25)
        
        
        
    def fit(self, X, y, learning_rate=0.2, epochs=1):
        X = np.atleast_2d(X)
        temp = np.ones([X.shape[0], X.shape[1]+1])
        temp[:, 0:-1] = X  # adding the bias unit to the input layer
        X = temp
        y = np.array(y)

        for k in range(epochs):
            i = np.random.randint(X.shape[0])
            a = [X[i]]

            #a ist ein beliebier input
            
            for l in range(len(self.weights)):#über alle gewichte
                a.append(self.activation(np.dot(a[l], self.weights[l])))
        
            error = y[i] - a[-1]#a[-1] ist der output vom mlp
            deltas = [error * self.activation_deriv(a[-1])]
            
            print deltas

            for l in range(len(a) - 2, 0, -1): # we need to begin at the second to last layer
                deltas.append(deltas[-1].dot(self.weights[l].T)*self.activation_deriv(a[l]))
            print "deltas", deltas    
            deltas.reverse()
            print self.weights
            for i in range(len(self.weights)):
                print "-------------------",i
                layer = np.atleast_2d(a[i])
                print "layer", layer
                delta = np.atleast_2d(deltas[i])
                print "delta", delta
                self.weights[i] += learning_rate * layer.T.dot(delta)
                print "weights",self.weights[i]
                
                
    def predict(self, x):
        x = np.array(x)
        temp = np.ones(x.shape[0]+1)
        temp[0:-1] = x
        a = temp
        for l in range(0, len(self.weights)):
            a = self.activation(np.dot(a, self.weights[l]))
        return a
    
 

nn = NeuralNetwork([2,3,1], 'tanh')
X = np.array([[0, 0], [0, 1], [1, 0], [1, 1]])
y = np.array([0, 1, 1, 0])
nn.fit(X, y)
#for i in [[0, 0], [0, 1], [1, 0], [1,1]]:
    #print(i,nn.predict(i))

[array([ 1.05343625])]
deltas [array([ 1.05343625]), array([ 0.02019361,  0.06491458,  0.15016323, -0.11061611])]
[array([[-0.01973599,  0.09312209, -0.19961559,  0.04555807],
       [ 0.13307737,  0.11002721,  0.21148196, -0.05045024],
       [-0.05697868,  0.02242517, -0.17824634, -0.00578768]]), array([[ 0.01928187],
       [ 0.0624408 ],
       [ 0.16192709],
       [-0.10517103]])]
------------------- 0
layer [[ 1.  0.  1.]]
delta [[ 0.02019361  0.06491458  0.15016323 -0.11061611]]
weights [[-0.01569727  0.10610501 -0.16958295  0.02343485]
 [ 0.13307737  0.11002721  0.21148196 -0.05045024]
 [-0.05293996  0.03540809 -0.1482137  -0.0279109 ]]
------------------- 1
layer [[-0.07656453  0.11503576 -0.36084924  0.03974944]]
delta [[ 1.05343625]]
weights [[ 0.0031507 ]
 [ 0.08667737]
 [ 0.08590076]
 [-0.09679633]]
