add pointer handling for function arguments

cucapra · Apr 26, 2021 · 14d7be3 · 14d7be3
1 parent af42790
commit 14d7be3
Show file tree

Hide file tree

Showing 9 changed files with 703 additions and 11 deletions.
diff --git a/cdios-tests/2d-matrices-add.c b/cdios-tests/2d-matrices-add.c
@@ -6,6 +6,8 @@
 #define QUATERNION_DIM 4
 #define SIZE 5
 
+void nested_pointer(float **test, int r, int c) {}
+
 // ---------------------QR FACTORIZATION---------------------------------
 float sgn(float v) { return (v > 0) - (v < 0); }
 

diff --git a/compile-out/kernel.c b/compile-out/kernel.c
@@ -0,0 +1,56 @@
+#include <float.h>
+#include <math.h>
+#include <stdint.h>
+#include <stdio.h>
+#include <stdlib.h>
+#include <xtensa/sim.h>
+#include <xtensa/tie/xt_pdxn.h>
+#include <xtensa/tie/xt_timer.h>
+#include <xtensa/xt_profiling.h>
+/*
+Git revision: af42790
+
+Warning: dirty git status:
+ cdios-tests/2d-matrices-add.c |  2 ++
+ cdios.py                      |  2 +-
+ src/c-meta.rkt                | 59 +++++++++++++++++++++++++++++++++++--------
+ 3 files changed, 51 insertions(+), 12 deletions(-)
+
+*/
+int __attribute__((section(".dram0.data"))) Z[4] = {0, 0, 0, 0};
+float __attribute__((section(".dram0.data"))) v_0[4] = {0.0, 0, 0, 0};
+int __attribute__((section(".dram0.data"))) v_1[4] = {0, 0, 2, 2};
+int __attribute__((section(".dram0.data"))) v_1_0[4] = {0, 0, 2, 2};
+int __attribute__((section(".dram0.data"))) v_3[4] = {0, 1, 0, 1};
+int __attribute__((section(".dram0.data"))) v_3_0[4] = {0, 1, 0, 1};
+int __attribute__((section(".dram0.data"))) v_6[4] = {1, 1, 3, 3};
+int __attribute__((section(".dram0.data"))) v_6_0[4] = {1, 1, 3, 3};
+int __attribute__((section(".dram0.data"))) v_8[4] = {2, 3, 2, 3};
+int __attribute__((section(".dram0.data"))) v_8_0[4] = {2, 3, 2, 3};
+void kernel(float * a_in, float * b_in, float * c_out) {
+float * __restrict a_in_mut = a_in;
+  valign align_a_in;
+  align_a_in = PDX_LA_MXF32_PP((xb_vecMxf32 *) a_in);
+  float * __restrict b_in_mut = b_in;
+  valign align_b_in;
+  align_b_in = PDX_LA_MXF32_PP((xb_vecMxf32 *) b_in);
+  float * __restrict c_out_mut = c_out;
+  valign align_c_out;
+  xb_vecMxf32 a_in_0_4;
+  PDX_LAV_MXF32_XP(a_in_0_4, align_a_in, (xb_vecMxf32 *) a_in_mut, 16);
+  xb_vecMxf32 b_in_0_4;
+  PDX_LAV_MXF32_XP(b_in_0_4, align_b_in, (xb_vecMxf32 *) b_in_mut, 16);
+  xb_vecMxf32 v_2;
+  v_2 = PDX_MOV_MXF32_FROM_MX32(PDX_SHFL_MX32(PDX_MOV_MX32_FROM_MXF32(a_in_0_4), *((xb_vecMx32 *) v_1_0)));
+  xb_vecMxf32 v_4;
+  v_4 = PDX_MOV_MXF32_FROM_MX32(PDX_SHFL_MX32(PDX_MOV_MX32_FROM_MXF32(b_in_0_4), *((xb_vecMx32 *) v_3_0)));
+  xb_vecMxf32 v_5 = PDX_MUL_MXF32(v_2, v_4);
+  xb_vecMxf32 v_7;
+  v_7 = PDX_MOV_MXF32_FROM_MX32(PDX_SHFL_MX32(PDX_MOV_MX32_FROM_MXF32(a_in_0_4), *((xb_vecMx32 *) v_6_0)));
+  xb_vecMxf32 v_9;
+  v_9 = PDX_MOV_MXF32_FROM_MX32(PDX_SHFL_MX32(PDX_MOV_MX32_FROM_MXF32(b_in_0_4), *((xb_vecMx32 *) v_8_0)));
+  xb_vecMxf32 v_10 = v_5;
+  PDX_MULA_MXF32(v_10, v_7, v_9);
+  PDX_SAV_MXF32_XP(v_10, align_c_out, (xb_vecMxf32 *) c_out, 16);
+  PDX_SAPOS_MXF32_FP(align_c_out, (xb_vecMxf32 *) c_out);
+}
diff --git a/compile-out/outputs.rkt b/compile-out/outputs.rkt
@@ -0,0 +1 @@
+'((c_out 4))
diff --git a/compile-out/prelude.rkt b/compile-out/prelude.rkt
@@ -0,0 +1,6 @@
+(prog
+ (list
+  (vec-const 'Z '#(0.0) 'float)
+  (vec-extern-decl 'a_in 4 'extern-input-array)
+  (vec-extern-decl 'b_in 4 'extern-input-array)
+  (vec-extern-decl 'c_out 4 'extern-output)))
diff --git a/compile-out/preprocessed.c b/compile-out/preprocessed.c
@@ -0,0 +1,271 @@
+
+
+
+
+
+
+
+
+void nested_pointer(float **test, int r, int c) {}
+
+
+float sgn(float v) { return (v > 0) - (v < 0); }
+
+
+void naive_fixed_transpose(float a[5][5]) {
+    for (int i = 0; i < 5; i++) {
+        for (int j = i + 1; j < 5; j++) {
+            float tmp = a[i][j];
+            a[i][j] = a[j][i];
+            a[j][i] = tmp;
+        }
+    }
+}
+
+
+
+
+
+float naive_norm(float *x, int m) {
+    float sum = 0;
+    for (int i = 0; i < m; i++) {
+        sum += pow(x[i], 2);
+    }
+    return sqrt(sum);
+}
+
+
+void naive_fixed_matrix_multiply(float a[5][5], float b[5][5],
+                                 float c[5][5]) {
+    for (int y = 0; y < 5; y++) {
+        for (int x = 0; x < 5; x++) {
+            c[y][x] = 0;
+            for (int k = 0; k < 5; k++) {
+                c[y][x] += a[y][k] * b[k][x];
+            }
+        }
+    }
+}
+
+
+void naive_fixed_qr_decomp(float A[5][5], float Q[5][5],
+                           float R[5][5]) {
+
+    for (int i = 0; i < 5; i++) {
+        for (int j = 0; j < 5; j++) {
+            R[i][j] = A[i][j];
+        }
+    }
+
+
+    float I[5][5];
+    for (int i = 0; i < 5; i++) {
+        for (int j = 0; j < 5; j++) {
+            I[i][j] = ((i == j) ? 1.0 : 0.0);
+        }
+    }
+
+
+    for (int k = 0; k < 5 - 1; k++) {
+        int m = 5 - k;
+
+        float x[m];
+        float e[m];
+        for (int i = 0; i < m; i++) {
+            int row = k + i;
+            x[i] = R[row][k];
+            e[i] = I[row][k];
+        }
+
+        float alpha = -sgn(x[0]) * naive_norm(x, m);
+
+        float u[m];
+        float v[m];
+        for (int i = 0; i < m; i++) {
+            u[i] = x[i] + alpha * e[i];
+        }
+        float norm_u = naive_norm(u, m);
+        for (int i = 0; i < m; i++) {
+            v[i] = u[i] / norm_u;
+        }
+
+        float q_min[m][m];
+        for (int i = 0; i < m; i++) {
+            for (int j = 0; j < m; j++) {
+                float q_min_i = ((i == j) ? 1.0 : 0.0) - 2 * v[i] * v[j];
+                q_min[i][j] = q_min_i;
+            }
+        }
+
+        float q_t[5][5];
+        for (int i = 0; i < 5; i++) {
+            for (int j = 0; j < 5; j++) {
+                float q_t_i = 0;
+                if ((i < k) || (j < k)) {
+                    q_t_i = (i == j) ? 1.0 : 0.0;
+                } else {
+                    q_t_i = q_min[(i - k)][(j - k)];
+                }
+                q_t[i][j] = q_t_i;
+            }
+        }
+
+        if (k == 0) {
+
+            for (int i = 0; i < 5; i++) {
+                for (int j = 0; j < 5; j++) {
+                    Q[i][j] = q_t[i][j];
+                }
+            }
+            naive_fixed_matrix_multiply(q_t, A, R);
+        } else {
+            float res[5][5];
+            naive_fixed_matrix_multiply(q_t, Q, res);
+
+            for (int i = 0; i < 5; i++) {
+                for (int j = 0; j < 5; j++) {
+                    Q[i][j] = res[i][j];
+                }
+            }
+            naive_fixed_matrix_multiply(q_t, R, res);
+
+            for (int i = 0; i < 5; i++) {
+                for (int j = 0; j < 5; j++) {
+                    R[i][j] = res[i][j];
+                }
+            }
+        }
+    }
+    naive_fixed_transpose(Q);
+}
+
+
+
+
+void naive_cross_product(float lhs[3], float rhs[3], float result[3]) {
+    result[0] = lhs[1] * rhs[2] - lhs[2] * rhs[1];
+    result[1] = lhs[2] * rhs[0] - lhs[0] * rhs[2];
+    result[2] = lhs[0] * rhs[1] - lhs[1] * rhs[0];
+}
+
+
+void naive_dot_product(float a_in[4], float b_in[4],
+                       float c_out) {
+    for (int i = 0; i < 4; i++) {
+        c_out += a_in[i] * b_in[i];
+    }
+}
+
+
+void quaternion_matrix_vec_mult(float a_in[4][4],
+                                float b_in[4],
+                                float c_out[4]) {
+    for (int i = 0; i < 4; i++) {
+        float sum = 0.0;
+        for (int k = 0; k < 4; k++) {
+            sum += a_in[i][k] * b_in[k];
+        }
+        c_out[i] = sum;
+    }
+}
+
+
+
+void naive_quaternion_product(float a_in[4],
+                              float b_in[4],
+                              float c_out[4]) {
+    float A_matrix[4][4];
+    A_matrix[0][0] = a_in[0];
+    A_matrix[0][1] = a_in[1];
+    A_matrix[0][2] = a_in[2];
+    A_matrix[0][3] = a_in[3];
+
+    A_matrix[1][0] = -a_in[1];
+    A_matrix[1][1] = a_in[0];
+    A_matrix[1][2] = a_in[3];
+    A_matrix[1][3] = -a_in[2];
+
+    A_matrix[2][0] = -a_in[2];
+    A_matrix[2][1] = -a_in[3];
+    A_matrix[2][2] = a_in[0];
+    A_matrix[2][3] = a_in[1];
+
+    A_matrix[3][0] = -a_in[3];
+    A_matrix[3][1] = a_in[2];
+    A_matrix[3][2] = -a_in[1];
+    A_matrix[3][3] = a_in[0];
+
+    quaternion_matrix_vec_mult(A_matrix, b_in, c_out);
+}
+
+
+
+void add_matrices(float a[3][3], float b[3][3],
+                  float c[3][3]) {
+
+    for (int i = 0; i < 3; i++) {
+        for (int j = 0; j < 3; j++) {
+            c[i][j] = a[i][j] + b[i][j];
+        }
+    }
+}
+
+void multiply_matrices(float a_in[3][3], float b_in[3][3],
+                       float c_out[3][3]) {
+    for (int i = 0; i < 3; i++) {
+        for (int j = 0; j < 3; j++) {
+            float sum = 0.0;
+            for (int k = 0; k < 3; k++) {
+                sum += a_in[i][k] * b_in[k][j];
+            }
+            c_out[i][j] = sum;
+        }
+    }
+}
+
+void matrix_multiply(float a_in[2 * 2], float b_in[2 * 2],
+                     float c_out[2 * 2]) {
+    float test4d[3][3][3][3];
+    test4d[2][2][2][2];
+    test4d[0][0][1][0] = 3.0;
+    test4d[0][0][1][0] += test4d[0][0][1][0];
+
+    float test[3][3];
+    test[1][1] = 3;
+    for (int y = 0; y < 3; y++) {
+        for (int x = 0; x < 3; x++) {
+            test[y][x] = 1;
+        }
+    }
+
+
+
+    float extra[3][3];
+    for (int i = 0; i < 3; i++) {
+        for (int j = 0; j < 3; j++) {
+            float sum = 0.0;
+            for (int k = 0; k < 3; k++) {
+                sum += test[i][k] * test[k][j];
+            }
+            extra[i][j] = sum;
+        }
+    }
+
+
+    for (int i = 0; i < 3; i++) {
+        for (int j = 0; j < 3; j++) {
+            extra[i][j] = extra[i][j] + extra[i][j];
+        }
+    }
+
+
+    for (int y = 0; y < 2; y++) {
+        for (int x = 0; x < 2; x++) {
+            c_out[2 * y + x] = 0;
+            for (int k = 0; k < 2; k++) {
+                c_out[2 * y + x] +=
+                    a_in[2 * y + k] * b_in[2 * k + x];
+            }
+        }
+    }
+}