-
Notifications
You must be signed in to change notification settings - Fork 657
New issue
Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.
By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.
Already on GitHub? Sign in to your account
super-kernel functionality #67
Comments
I believe this is what #54 was aiming for, just fyi. |
So I've had a bit of a revelation: if we vectorize this, we could remove the need to jump from kernel to kernel. Here is a quick gist that may actually work: function relu(value) {
return Math.max(0, value[this.thread.y][this.thread.x]);
}
function add(left, right) {
// Element-wise sum of two matrices at the current GPU thread's
// (y, x) output coordinate.
var row = this.thread.y;
var col = this.thread.x;
return left[row][col] + right[row][col];
}
function multiply(left, right) {
// Dot product of row this.thread.y of `left` with column
// this.thread.x of `right`; the shared (inner) dimension is
// hard-coded to 512 to match the benchmark's matrix size.
var total = 0;
for (var k = 0; k < 512; k++) {
total += left[this.thread.y][k] * right[k][this.thread.x];
}
return total;
}
// Construct a GPU instance targeting the WebGL backend.
// NOTE(review): later in this thread the constructor is invoked as
// `new GPU({...})` — confirm whether the `new`-less call is supported.
const gpu = GPU({ mode: 'webgl' });
// Proposed fused "super-kernel": relu/add/multiply are registered as
// device functions and composed inside ONE kernel, so intermediate
// matrices never round-trip between GPU and CPU.
const layerForward = gpu
.addFunction(relu)
.addFunction(add)
.addFunction(multiply)
.createKernel(function(weightMatrix, inputMatrix, transitionMatrix, previousOutputMatrix, biasMatrix) {
// relu(W·input + T·prevOutput + bias) — one RNN layer forward pass.
return relu(
add(
add(
multiply(
weightMatrix,
inputMatrix
),
multiply(
transitionMatrix,
previousOutputMatrix
)
),
biasMatrix
)
);
}); This is a recurrent neural net layer, more to come. |
Just a quick note: unfortunately in JavaScript, "this" refers to the current function, so it might not work unless we use compilation to hijack what "this" means, or pass this.thread.x/y/z as arguments. The first example could be implemented by having combineKernels use the outputToTexture flag transparently. For the first example, we could return array-size outputs, but in the second example, we can only return singular values. |
Bah, we can just pass x & y via args. It was just a pseudo script. |
Which do you think would be faster? |
Tried it locally, and the above is about 100 to 150 ms faster than multiple kernels! |
Actual code: var mat_size = 512;
function splitArray(array, part) {
// Partition `array` into consecutive chunks of length `part`;
// the final chunk may be shorter when array.length is not a
// multiple of `part`.
var chunks = [];
var offset = 0;
while (offset < array.length) {
chunks.push(array.slice(offset, offset + part));
offset += part;
}
return chunks;
}
function randomNestedArray(matSize) {
// Build a matSize x matSize matrix (array of row arrays) filled
// with uniform random numbers in [0, 1).
var total = matSize * matSize;
var flat = [];
for (var n = 0; n < total; n++) {
flat.push(Math.random());
}
// Chunk the flat list into matSize rows of matSize values each.
return splitArray(flat, matSize);
}
function relu(x) {
// Rectified linear unit: negative inputs clamp to 0,
// non-negative inputs pass through unchanged.
return Math.max(0, x);
}
function add(left, right) {
// Scalar addition of two matrix terms.
// BUG FIX: the original body returned `left * right` (a product),
// which contradicts the function's name, the earlier `add`
// definition in this thread, and its use for summing the two
// matrix products plus the bias term in the kernel below.
return left + right;
}
function multiply(left, right, y, x) {
// Dot product of row `y` of `left` with column `x` of `right`.
// The inner dimension is hard-coded to 512 to match mat_size;
// thread coordinates are passed explicitly as `y`/`x` args
// instead of being read from `this.thread`.
var acc = 0;
var k = 0;
while (k < 512) {
acc += left[y][k] * right[k][x];
k++;
}
return acc;
}
// CPU-mode instance used as a timing baseline.
var cpu = new GPU({ mode: 'cpu' });
// WebGL-backed instance for the GPU run.
var gpu = new GPU({ mode: 'webgl' });
// Build and time the fused "super-kernel" once per backend.
[cpu, gpu].forEach(function(gpu) {
const layerForward = gpu
.addFunction(relu)
.addFunction(add)
// .addFunction(multiply, {
// left: Array,
// right: Array,
// returns: Number
// })
.createKernel(function(weightMatrix, inputMatrix, transitionMatrix, previousOutputMatrix, biasMatrix) {
// The two matrix multiplies are inlined here (rather than calling
// the multiply device function, whose registration is commented
// out above); both dot products share one loop over the inner
// dimension, which is hard-coded to 512 to match mat_size.
var weightAndMatrix = 0;
var transitionAndPreviousOutput = 0;
for (var i = 0; i < 512; i++) {
weightAndMatrix += weightMatrix[this.thread.y][i] * inputMatrix[i][this.thread.x];
transitionAndPreviousOutput += transitionMatrix[this.thread.y][i] * previousOutputMatrix[i][this.thread.x];
}
// relu((W·input) ⊕ (T·prevOutput) ⊕ bias) — one RNN layer step.
return relu(
add(
add(
weightAndMatrix,
transitionAndPreviousOutput
),
biasMatrix[this.thread.y][this.thread.x]
)
);
}, { dimensions: [mat_size, mat_size] });
// Time a single forward pass on five fresh random matrices.
console.time(gpu.mode);
console.log(layerForward(
randomNestedArray(mat_size),
randomNestedArray(mat_size),
randomNestedArray(mat_size),
randomNestedArray(mat_size),
randomNestedArray(mat_size)
));
console.timeEnd(gpu.mode);
});
// Separate single-purpose kernels, used below to time the
// kernel-per-operation approach against the fused kernel above.
// Element-wise matrix addition.
var addKernel = gpu.createKernel(function(left, right) {
return left[this.thread.y][this.thread.x] + right[this.thread.y][this.thread.x];
}, { dimensions: [mat_size, mat_size] });
// Matrix product; inner dimension hard-coded to 512 (= mat_size).
var multiplyKernel = gpu.createKernel(function(left, right) {
var sum = 0;
for (var i = 0; i < 512; i++) {
sum += left[this.thread.y][i] * right[i][this.thread.x];
}
return sum;
}, { dimensions: [mat_size, mat_size] });
// Element-wise ReLU over a matrix.
var reluKernel = gpu.createKernel(function(value) {
return Math.max(0, value[this.thread.y][this.thread.x]);
}, { dimensions: [mat_size, mat_size] });
// Time the chained-kernels pipeline: each kernel's result returns to
// the CPU before being fed to the next kernel — the overhead the
// fused super-kernel above is designed to avoid.
console.time('nested');
console.log(
reluKernel(
addKernel(
addKernel(
multiplyKernel(
randomNestedArray(mat_size),
randomNestedArray(mat_size)
),
multiplyKernel(
randomNestedArray(mat_size),
randomNestedArray(mat_size)
)
),
randomNestedArray(mat_size)
)
)
);
console.timeEnd('nested'); |
Related issue here: #77 |
Not even sure it is possible, but I'd love to see something like this:
combineKernels would change multiply & add so that they don't return data to the CPU, but rather the function returned from combineKernels
would obtain the data from the GPU. What would this approach be called? The text was updated successfully, but these errors were encountered: