<a href="https://colab.research.google.com/github/tayfununal/2-Hidden-Layer-Neural-Networks/blob/master/one_hiddne_layer_experiment.ipynb" target="_parent"><img src="https://colab.research.google.com/assets/colab-badge.svg" alt="Open In Colab"/></a>

In [None]:
!pip install playground-data

In [None]:
import numpy as np
import matplotlib.pyplot as plt
import pandas as pd
import plygdata as pg
import json
import requests

In [None]:
# Download the pre-generated XOR datasets. A timeout keeps the notebook from
# hanging on a stalled connection, and raise_for_status() surfaces HTTP errors
# here instead of letting an error page reach the JSON parser.
response = requests.get("https://raw.githubusercontent.com/tayfununal/2-Hidden-Layer-Neural-Networks/master/produced_XOR_Datas.json", timeout=30)
response.raise_for_status()
Datas = json.loads(response.text)

In [None]:
# Pick the dataset stored under key '1' of the downloaded JSON and convert it
# to a NumPy array.
data_one = np.array(Datas['1'])
# NOTE(review): presumably validation_size=0.2 holds out 20% of the rows as the
# test split - confirm against the plygdata documentation.
X_train, y_train, X_test, y_test = pg.split_data(data_one, validation_size=0.2)

In [None]:
# Transpose every split in one pass.
# NOTE(review): presumably this turns (samples, features) into
# (features, samples), the layout the network functions index with
# shape[0] / shape[1] - confirm against the output of pg.split_data.
X_train, y_train, X_test, y_test = (
    split.T for split in (X_train, y_train, X_test, y_test)
)
print("Shape of X_train:", X_train.shape,
      "\nShape of y_train:", y_train.shape,
      "\nShape of X_test:", X_test.shape,
      "\nShape of y_test:", y_test.shape)

In [None]:
def initialization_parameters(x, y, num_node):
  """Build the initial weights and biases of a one-hidden-layer network.

  Only the first axis of ``x`` and ``y`` is read: ``x.shape[0]`` sizes the
  input layer and ``y.shape[0]`` sizes the output layer.

  Args:
    x: Array whose first dimension is the number of input rows fed to W1.
    y: Array whose first dimension is the number of output rows.
    num_node: Number of hidden units.

  Returns:
    Dict with 'W1' of shape (num_node, x.shape[0]), 'b1' of shape
    (num_node, 1), 'W2' of shape (y.shape[0], num_node) and 'b2' of shape
    (y.shape[0], 1). Weights are standard-normal draws scaled by 0.001;
    biases are zeros.
  """
  n_in, n_out = x.shape[0], y.shape[0]
  scale = 0.001

  # Draw order (W1 first, then W2) is kept so a fixed seed gives the same values.
  hidden_weights = np.random.randn(num_node, n_in) * scale
  hidden_bias = np.zeros((num_node, 1))
  output_weights = np.random.randn(n_out, num_node) * scale
  output_bias = np.zeros((n_out, 1))

  parameters = {'W1': hidden_weights,
                'b1': hidden_bias,
                'W2': output_weights,
                'b2': output_bias}

  # Sanity-check every tensor against the layer sizes it was built from.
  expected_shapes = {'W1': (num_node, n_in),
                     'b1': (num_node, 1),
                     'W2': (n_out, num_node),
                     'b2': (n_out, 1)}
  for key, shape in expected_shapes.items():
    assert parameters[key].shape == shape

  return parameters

def sigmoid(x):
  """Return the logistic sigmoid 1 / (1 + exp(-x)), element-wise.

  Evaluated as exp(-log(1 + exp(-x))) through ``np.logaddexp`` so that large
  negative inputs do not overflow ``exp`` (the naive form raises a
  RuntimeWarning there); the result saturates cleanly at 0 and 1.

  Args:
    x: Scalar or array-like of pre-activations.

  Returns:
    Sigmoid of ``x`` with the same shape as the input.
  """
  # logaddexp(0, -x) == log(exp(0) + exp(-x)) == log(1 + exp(-x)), computed stably.
  return np.exp(-np.logaddexp(0, np.negative(x)))

def relu(x):
  """Apply the rectified linear unit element-wise: max(0, x)."""
  floor = 0
  rectified = np.maximum(floor, x)
  return rectified

def reluDerivative(x):
  """Return the ReLU derivative of ``x``: 1 where x > 0, otherwise 0.

  The result is a new array; the argument is left untouched. (Overwriting the
  input in place would corrupt whatever array the caller passed in, e.g. a
  cached activation.)

  Args:
    x: Scalar or array-like of values at which to evaluate the derivative.

  Returns:
    Array of 0/1 values with the same shape and dtype as ``x``.
  """
  values = np.asarray(x)
  return (values > 0).astype(values.dtype)

def forward_prop(x,parameters):
  """Run the forward pass: linear -> ReLU -> linear -> sigmoid.

  Args:
    x: Input array; multiplied as ``np.dot(W1, x)``, so its first axis must
      match the second axis of W1.
    parameters: Dict holding 'W1', 'b1', 'W2' and 'b2'.

  Returns:
    Tuple ``(A2, cache)`` where A2 is the sigmoid output and cache is a dict
    with the intermediate values 'Z1', 'A1', 'Z2' and 'A2'.
  """
  W1 = parameters['W1']
  b1 = parameters['b1']
  W2 = parameters['W2']
  b2 = parameters['b2']

  Z1 = np.dot(W1, x) + b1
  A1 = relu(Z1)
  Z2 = np.dot(W2, A1) + b2
  A2 = sigmoid(Z2)

  # One row per output unit (rows of W2), one column per column of x. The row
  # count is taken from W2 rather than hard-coded to 1 so networks whose
  # output layer was sized from y.shape[0] > 1 also pass.
  assert (A2.shape == (W2.shape[0], x.shape[1]))
  cache = {
      'Z1' : Z1,
      'A1' : A1,
      'Z2' : Z2,
      'A2' : A2
  }
  return A2, cache

def backward_prop(x, y, parameters, cache, learning_rate = 0.1, lambd=0.1):
  """Compute the gradients and apply one gradient-descent update.

  The gradients include an L2 weight penalty of ``(lambd / m) * W`` on both
  weight matrices. Neither ``parameters`` nor ``cache`` is modified; a new
  parameter dict is returned.

  Args:
    x: Input array that produced ``cache``.
    y: Target array; ``y.shape[1]`` is used as the sample count m.
    parameters: Dict holding 'W1', 'b1', 'W2' and 'b2'.
    cache: Dict holding the activations 'A1' and 'A2' of the forward pass.
    learning_rate: Step size of the update.
    lambd: L2 regularization strength.

  Returns:
    New dict with the updated 'W1', 'b1', 'W2' and 'b2'.
  """
  m = y.shape[1]

  W1 = parameters['W1']
  b1 = parameters['b1']
  W2 = parameters['W2']
  b2 = parameters['b2']

  A1 = cache['A1']
  A2 = cache['A2']

  # Calculations of backward propagation: dW1, db1, dW2, db2
  dZ2 = A2 - y
  dW2 = (1 / m) * np.dot(dZ2, A1.T) + (lambd / m) * W2
  db2 = (1 / m) * np.sum(dZ2, axis = 1, keepdims = True)

  # ReLU derivative evaluated on A1: 1 where the unit was active, else 0.
  # Built as a fresh array so the cached activation is not overwritten.
  relu_grad = (A1 > 0).astype(A1.dtype)
  dZ1 = np.multiply(np.dot(W2.T, dZ2), relu_grad)
  dW1 = (1 / m) * np.dot(dZ1, x.T) + (lambd / m) * W1
  db1 = (1 / m) * np.sum(dZ1 , axis = 1, keepdims = True)

  # Updating parameters
  W1 = W1 - learning_rate * dW1
  b1 = b1 - learning_rate * db1
  W2 = W2 - learning_rate * dW2
  b2 = b2 - learning_rate * db2

  parameters = {'W1':W1,
                'b1':b1,
                'W2':W2,
                'b2':b2}
  return parameters

def cross_entropy_cost(y, A2, parameters, lambd = 0.1):
  """Return the L2-regularized binary cross-entropy cost.

  Args:
    y: Target array; ``y.shape[1]`` is used as the sample count m.
    A2: Predicted probabilities, same shape as ``y``.
    parameters: Dict holding the weight matrices 'W1' and 'W2'.
    lambd: L2 regularization strength.

  Returns:
    The cost, squeezed to drop unnecessary dimensions.
  """
  eps = 1e-15  # keeps log() away from zero
  n_samples = y.shape[1]

  log_likelihood = np.log(A2 + eps) * y + (1 - y) * np.log(1 - A2 + eps)
  data_term = (- 1.0 / n_samples) * np.sum(log_likelihood)

  squared_weights = np.sum(np.square(parameters["W1"])) + np.sum(np.square(parameters["W2"]))
  penalty = squared_weights * (lambd / (2 * n_samples))

  return np.squeeze(data_term + penalty)

In [None]:
def nn_model(x, y, parameters, number_of_iter = 1000, learning_rate = 0.3, lambd = 0.3):
  """Train the network with full-batch gradient descent.

  The same ``lambd`` is used for the gradient step and for the reported cost,
  so the logged values are the objective that is actually being minimised.

  Args:
    x: Training inputs, passed to ``forward_prop``.
    y: Training targets.
    parameters: Initial parameter dict ('W1', 'b1', 'W2', 'b2').
    number_of_iter: Iteration counter limit; entry 1 is the cost before any
      update, so ``number_of_iter - 1`` updates are performed.
    learning_rate: Step size handed to ``backward_prop``.
    lambd: L2 regularization strength for both the update and the cost.

  Returns:
    Tuple ``(cost_value, parameters)``: a dict mapping iteration number to
    cost (iteration 1 and every 100th iteration) and the trained parameters.
  """
  cost_value = {}
  A2, cache = forward_prop(x, parameters)
  cost_value[1] = cross_entropy_cost(y, A2, parameters, lambd=lambd)

  for i in range(1, number_of_iter):
    parameters = backward_prop(x, y, parameters, cache,
                               learning_rate=learning_rate, lambd=lambd)
    A2, cache = forward_prop(x, parameters)

    # The cost is only needed for reporting, so evaluate it on logging steps.
    if (i + 1) % 100 == 0:
      cost = cross_entropy_cost(y, A2, parameters, lambd=lambd)
      cost_value[i + 1] = cost
      print("%i."%(i+1),cost)

  return cost_value, parameters

In [None]:
# Fix the seed so the random weight initialisation is reproducible.
np.random.seed(656562)
# Size the network from the training split it is trained on. Only shape[0] of
# each array is read, so the held-out split does not need to be involved here.
parameters = initialization_parameters(X_train, y_train, 10)
cost_value, parameters = nn_model(X_train, y_train, parameters, number_of_iter=1000)