1+ float *a &[1] = 0000022c648e3570
2+ float *a_grad &[1] = 0000022c648e3580
3+ float *b &[1] = 0000022c648e3590
4+ float *b_grad &[1] = 0000022c648e3560
5+ float *g &[1] = 0000022c648e3540
6+ COMMENT: g gradient update
7+ COMMENT: g fwd
8+ # n4_c[0] := (a[0] + b[0]);
9+ n4_c[0]{=MAYBE UNINITIALIZED} = -2000e-3 = (a[0]{=-4000e-3} + b[0]{=2000e-3})
10+ # n19_c[0] := ((n4_c[0] + n4_c[0]) + 1);
11+ n19_c[0]{=MAYBE UNINITIALIZED} = -3000e-3 = ((n4_c[0]{=-2000e-3} + n4_c[0]{=-2000e-3}) + (float)(1))
12+ # n42[0] := (b[0] - a[0]);
13+ n42[0]{=MAYBE UNINITIALIZED} = 6000e-3 = (b[0]{=2000e-3} - a[0]{=-4000e-3})
14+ # n31[0] := (b[0] + a[0]);
15+ n31[0]{=MAYBE UNINITIALIZED} = -2000e-3 = (b[0]{=2000e-3} + a[0]{=-4000e-3})
16+ # n14_d[0] := fma(a[0], b[0], (b[0] * (b[0] * b[0])));
17+ n14_d[0]{=MAYBE UNINITIALIZED} = 0e-3 = fmaf(a[0]{=-4000e-3}, b[0]{=2000e-3}, (b[0]{=2000e-3} * (b[0]{=2000e-3} * b[0]{=2000e-3})))
18+ # n40_d[0] := (fma(n14_d[0], 2, n14_d[0]) + relu(n31[0]));
19+ n40_d[0]{=MAYBE UNINITIALIZED} = 0e-3 = (fmaf(n14_d[0]{=0e-3}, (float)(2), n14_d[0]{=0e-3}) + fmaxf(0.0, n31[0]{=-2000e-3}))
20+ # e[0] :=$ (fma(-1, a[0], ((n19_c[0] + 1) + n19_c[0])) -$ (fma(3, n40_d[0], n40_d[0]) + relu(n42[0])));
21+ e[0]{=MAYBE UNINITIALIZED} = -7000e-3 = (fmaf((float)(-1), a[0]{=-4000e-3}, ((n19_c[0]{=-3000e-3} + (float)(1)) + n19_c[0]{=-3000e-3})) - (fmaf((float)(3), n40_d[0]{=0e-3}, n40_d[0]{=0e-3}) + fmaxf(0.0, n42[0]{=6000e-3})))
22+ # f[0] := (e[0] * e[0]);
23+ f[0]{=MAYBE UNINITIALIZED} = 49000e-3 = (e[0]{=-7000e-3} * e[0]{=-7000e-3})
24+ # g[0] := ((f[0] / 2) + (10 / f[0]));
25+ g[0]{=MAYBE UNINITIALIZED} = 24704e-3 = ((f[0]{=49000e-3} / (float)(2)) + ((float)(10) / f[0]{=49000e-3}))
26+ COMMENT: end
27+ COMMENT: g zero grads
28+ # a_grad := 0
29+ a_grad[0]{=MAYBE UNINITIALIZED} = 0e-3 = (float)(0)
30+ # b_grad := 0
31+ b_grad[0]{=MAYBE UNINITIALIZED} = 0e-3 = (float)(0)
32+ # n4_c_grad := 0
33+ n4_c_grad[0]{=MAYBE UNINITIALIZED} = 0e-3 = (float)(0)
34+ # n19_c_grad := 0
35+ n19_c_grad[0]{=MAYBE UNINITIALIZED} = 0e-3 = (float)(0)
36+ # n14_d_grad := 0
37+ n14_d_grad[0]{=MAYBE UNINITIALIZED} = 0e-3 = (float)(0)
38+ # n40_d_grad := 0
39+ n40_d_grad[0]{=MAYBE UNINITIALIZED} = 0e-3 = (float)(0)
40+ # f_grad := 0
41+ f_grad[0]{=MAYBE UNINITIALIZED} = 0e-3 = (float)(0)
42+ COMMENT: end
43+ COMMENT: g bprop
44+ # f.grad[0] := fma(1, (-10 / (f[0] * f[0])), f.grad[0]);
45+ f_grad[0]{=MAYBE UNINITIALIZED} = -4e-3 = fmaf((float)(1), ((float)(-10) / (f[0]{=49000e-3} * f[0]{=49000e-3})), f_grad[0]{=0e-3})
46+ # f.grad[0] := (f.grad[0] + 0.5);
47+ f_grad[0]{=MAYBE UNINITIALIZED} = 495e-3 = (f_grad[0]{=-4e-3} + (float)(0.5))
48+ # n40_d.grad[0] := fma(-1, ((2 * e[0]) * f.grad[0]), n40_d.grad[0]);
49+ n40_d_grad[0]{=MAYBE UNINITIALIZED} = 6941e-3 = fmaf((float)(-1), (((float)(2) * e[0]{=-7000e-3}) * f_grad[0]{=495e-3}), n40_d_grad[0]{=0e-3})
50+ # n40_d.grad[0] := fma(3, (-1 * ((2 * e[0]) * f.grad[0])), n40_d.grad[0]);
51+ n40_d_grad[0]{=MAYBE UNINITIALIZED} = 27766e-3 = fmaf((float)(3), ((float)(-1) * (((float)(2) * e[0]{=-7000e-3}) * f_grad[0]{=495e-3})), n40_d_grad[0]{=6941e-3})
52+ # n14_d.grad[0] := (n14_d.grad[0] + n40_d.grad[0]);
53+ n14_d_grad[0]{=MAYBE UNINITIALIZED} = 27766e-3 = (n14_d_grad[0]{=0e-3} + n40_d_grad[0]{=27766e-3})
54+ # n14_d.grad[0] := fma(n40_d.grad[0], 2, n14_d.grad[0]);
55+ n14_d_grad[0]{=MAYBE UNINITIALIZED} = 83300e-3 = fmaf(n40_d_grad[0]{=27766e-3}, (float)(2), n14_d_grad[0]{=27766e-3})
56+ # a.grad[0] := fma(n14_d.grad[0], b[0], a.grad[0]);
57+ a_grad[0]{=MAYBE UNINITIALIZED} = 166600e-3 = fmaf(n14_d_grad[0]{=83300e-3}, b[0]{=2000e-3}, a_grad[0]{=0e-3})
58+ # b.grad[0] := fma(a[0], n14_d.grad[0], b.grad[0]);
59+ b_grad[0]{=MAYBE UNINITIALIZED} = -333201e-3 = fmaf(a[0]{=-4000e-3}, n14_d_grad[0]{=83300e-3}, b_grad[0]{=0e-3})
60+ # b.grad[0] := fma((3 * (b[0] * b[0])), n14_d.grad[0], b.grad[0]);
61+ b_grad[0]{=MAYBE UNINITIALIZED} = 666402e-3 = fmaf(((float)(3) * (b[0]{=2000e-3} * b[0]{=2000e-3})), n14_d_grad[0]{=83300e-3}, b_grad[0]{=-333201e-3})
62+ # b.grad[0] := (b.grad[0] + relu_gate(n31[0], n40_d.grad[0]));
63+ b_grad[0]{=MAYBE UNINITIALIZED} = 666402e-3 = (b_grad[0]{=666402e-3} + (n31[0]{=-2000e-3} > 0.0 ? n40_d_grad[0]{=27766e-3} : 0.0))
64+ # a.grad[0] := (a.grad[0] + relu_gate(n31[0], n40_d.grad[0]));
65+ a_grad[0]{=MAYBE UNINITIALIZED} = 166600e-3 = (a_grad[0]{=166600e-3} + (n31[0]{=-2000e-3} > 0.0 ? n40_d_grad[0]{=27766e-3} : 0.0))
66+ # b.grad[0] :=$ (b.grad[0] + relu_gate(n42[0], (-1 * ((2 * e[0]) * f.grad[0]))));
67+ b_grad[0]{=MAYBE UNINITIALIZED} = 673344e-3 = (b_grad[0]{=666402e-3} + (n42[0]{=6000e-3} > 0.0 ? ((float)(-1) * (((float)(2) * e[0]{=-7000e-3}) * f_grad[0]{=495e-3})) : 0.0))
68+ # a.grad[0] :=$ (a.grad[0] - relu_gate(n42[0], (-1 * ((2 * e[0]) * f.grad[0]))));
69+ a_grad[0]{=MAYBE UNINITIALIZED} = 159658e-3 = (a_grad[0]{=166600e-3} - (n42[0]{=6000e-3} > 0.0 ? ((float)(-1) * (((float)(2) * e[0]{=-7000e-3}) * f_grad[0]{=495e-3})) : 0.0))
70+ # n19_c.grad[0] := fma((2 * e[0]), f.grad[0], n19_c.grad[0]);
71+ n19_c_grad[0]{=MAYBE UNINITIALIZED} = -6941e-3 = fmaf(((float)(2) * e[0]{=-7000e-3}), f_grad[0]{=495e-3}, n19_c_grad[0]{=0e-3})
72+ # n19_c.grad[0] := fma((2 * e[0]), f.grad[0], n19_c.grad[0]);
73+ n19_c_grad[0]{=MAYBE UNINITIALIZED} = -13883e-3 = fmaf(((float)(2) * e[0]{=-7000e-3}), f_grad[0]{=495e-3}, n19_c_grad[0]{=-6941e-3})
74+ # n4_c.grad[0] := (n4_c.grad[0] + n19_c.grad[0]);
75+ n4_c_grad[0]{=MAYBE UNINITIALIZED} = -13883e-3 = (n4_c_grad[0]{=0e-3} + n19_c_grad[0]{=-13883e-3})
76+ # n4_c.grad[0] := (n4_c.grad[0] + n19_c.grad[0]);
77+ n4_c_grad[0]{=MAYBE UNINITIALIZED} = -27766e-3 = (n4_c_grad[0]{=-13883e-3} + n19_c_grad[0]{=-13883e-3})
78+ # a.grad[0] := (a.grad[0] + n4_c.grad[0]);
79+ a_grad[0]{=MAYBE UNINITIALIZED} = 131892e-3 = (a_grad[0]{=159658e-3} + n4_c_grad[0]{=-27766e-3})
80+ # b.grad[0] := (b.grad[0] + n4_c.grad[0]);
81+ b_grad[0]{=MAYBE UNINITIALIZED} = 645577e-3 = (b_grad[0]{=673344e-3} + n4_c_grad[0]{=-27766e-3})
82+ # a.grad[0] := fma(-1, ((2 * e[0]) * f.grad[0]), a.grad[0]);
83+ a_grad[0]{=MAYBE UNINITIALIZED} = 138833e-3 = fmaf((float)(-1), (((float)(2) * e[0]{=-7000e-3}) * f_grad[0]{=495e-3}), a_grad[0]{=131892e-3})
84+ COMMENT: end
85+ COMMENT: end
0 commit comments