# Tests for Dense Layer

To make sure that the output from the GPU is correct, you should test it against what you get from the original CPU implementation. The following code runs the original implementation on the CPU and the GPU implementation on the same inputs, and checks that their results match.

You should do the same for any other layer you implement.

In [1]:
import numpy as np

import pyopencl as cl
import pyopencl.array as cl_array
import PyNetwork
from PyNetwork.layers.Dense_GPU import Dense_GPU

from PyNetwork.gpu.GPUNN import GPUOPERATOR

In [2]:
# from PyNetwork.gpu.c_code import c_code

In [3]:
# Dimensions shared by the CPU reference layer and the GPU layer under test.
input_shape = (10,)
output_nodes = 100

# CPU reference layer: a 'relu' Dense layer built for the input shape above.
layer = PyNetwork.layers.Dense(output_nodes, 'relu')
layer.build(input_shape)

In [4]:
# Set up OpenCL: take every device of the first platform returned, create a
# context over those devices and a command queue on that context.
platform = cl.get_platforms()
devices = platform[0].get_devices()
context = cl.Context(devices)
queue = cl.CommandQueue(context)
# Helper object passed to the GPU layer; it is created with the same context
# and queue as everything else in this notebook.
gpuoperator = GPUOPERATOR(context=context, queue=queue)

In [5]:
# GPU layer under test, configured with the same node count and activation as
# the CPU reference layer and built for the same input shape.
layer_gpu = Dense_GPU(context=context, queue=queue, gpuoperator=gpuoperator, 
                      hidden_nodes=output_nodes, activation_function='relu')
layer_gpu.build(input_shape)

In [6]:
# Give the CPU layer the GPU layer's parameters so both layers compute with the
# same weights and bias; otherwise their outputs could not be compared.
# NOTE(review): if Dense_GPU keeps W and b as device arrays, the CPU layer may
# need host copies (e.g. via .get()) instead — confirm against Dense_GPU.
layer.W = layer_gpu.W
layer.b = layer_gpu.b

In [7]:
# Random float32 batch with values in [-0.5, 0.5), plus a copy on the device.
# NOTE(review): n_datapoints, z_in and z_in_gpu are all assigned again in the
# "Test Predict" cells below, so this cell looks redundant — confirm before
# removing it.
n_datapoints = 20
z_in = np.random.rand(n_datapoints, *input_shape).astype(np.float32) - 0.5
z_in_gpu = cl_array.to_device(queue, z_in)

# Test Predict

In [8]:
# Fresh random float32 batch with values in [-0.5, 0.5); this replaces any
# z_in created by an earlier cell.
n_datapoints = 20
z_in = np.random.rand(n_datapoints, *input_shape).astype(np.float32) - 0.5

# Reference result from the CPU layer. With output_only=False, predict returns
# two values, unpacked here as (a_true, z_out_true).
a_true, z_out_true = layer.predict(z_in, output_only=False)

In [9]:
# Run the same batch through the GPU layer; the host array is copied to the
# device first so the GPU layer receives a pyopencl array.
z_in_gpu = cl_array.to_device(queue, z_in)
a_true_gpu, z_out_true_gpu = layer_gpu.predict(z_in_gpu, output_only=False)

# Compare both GPU results with the CPU reference (a_true, z_out_true).
# Without these checks the predict test computes values but verifies nothing.
# assumes both GPU results are pyopencl arrays (hence .get()), like the other
# GPU outputs checked in this notebook — TODO confirm
# decimal=5 leaves headroom for float32 rounding differences between devices.
np.testing.assert_almost_equal(a_true_gpu.get(), a_true, decimal=5)
np.testing.assert_almost_equal(z_out_true_gpu.get(), z_out_true, decimal=5)

# Test Backprop

In [10]:
# Random float32 inputs for the backprop step, values in [0, 1):
#   g_prime   has shape (n_datapoints, *input_shape)
#   new_delta has shape (n_datapoints, output_nodes)
g_prime = np.random.rand(n_datapoints, *input_shape).astype(np.float32)
new_delta = np.random.rand(n_datapoints, output_nodes).astype(np.float32)

# Reference delta from the CPU layer.
delta_true = layer.get_delta_backprop_(g_prime, new_delta)

In [11]:
# Copy both backprop inputs to the device, in the same order as before
# (g_prime first, then new_delta).
g_prime_gpu, new_delta_gpu = (
    cl_array.to_device(queue, host_array)
    for host_array in (g_prime, new_delta)
)

# Delta computed by the GPU layer from the device copies.
delta_true_gpu = layer_gpu.get_delta_backprop_(g_prime_gpu, new_delta_gpu)

In [12]:
# The GPU delta, copied back to the host with .get(), must match the CPU
# reference to numpy's default precision for assert_almost_equal.
np.testing.assert_almost_equal(delta_true_gpu.get(), delta_true)

# Test Weight Gradients

In [13]:
# Random float32 inputs for the weight-gradient step, values in [0, 1):
#   delta  has shape (n_datapoints, *input_shape)
#   prev_z has shape (n_datapoints, output_nodes)
# NOTE(review): delta is sized by input_shape and prev_z by output_nodes, the
# reverse of g_prime/new_delta in the backprop test — confirm this is the
# shape convention get_weight_grad_ expects.
delta = np.random.rand(n_datapoints, *input_shape).astype(np.float32)
prev_z = np.random.rand(n_datapoints, output_nodes).astype(np.float32)

# Reference gradients from the CPU layer; two values are returned and unpacked
# as (delta_grad_true, w_grad_true).
delta_grad_true, w_grad_true = layer.get_weight_grad_(delta, prev_z)

In [14]:
# Copy both weight-gradient inputs to the device, in the same order as before
# (delta first, then prev_z).
delta_gpu, prev_z_gpu = (
    cl_array.to_device(queue, host_array)
    for host_array in (delta, prev_z)
)

# Gradients computed by the GPU layer from the device copies.
delta_grad_true_gpu, w_grad_true_gpu = layer_gpu.get_weight_grad_(
    delta_gpu, prev_z_gpu
)

In [15]:
# Small float32 host arrays and their device copies.
# NOTE(review): a, a_gpu, b and b_gpu are not used by any other cell shown in
# this notebook; this looks like leftover scratch code — confirm before
# removing it.
a = np.array([1,2,5]).astype(np.float32)
a_gpu = cl_array.to_device(queue, a)

b = np.array([10]).astype(np.float32)
b_gpu = cl_array.to_device(queue, b)

In [16]:
# First value returned by get_weight_grad_: the GPU result (actual) must match
# the CPU reference (desired). Arguments follow numpy's (actual, desired)
# order, as in the backprop check, so failure messages label each side
# correctly.
np.testing.assert_almost_equal(delta_grad_true_gpu.get(), delta_grad_true)

In [17]:
# Second value returned by get_weight_grad_: the GPU result (actual) must match
# the CPU reference (desired). Arguments follow numpy's (actual, desired)
# order, as in the backprop check, so failure messages label each side
# correctly.
np.testing.assert_almost_equal(w_grad_true_gpu.get(), w_grad_true)