Commit 58c7187

Merge pull request #369 from ahrefs/feature/record-syntax
Replace string-based inline tensor definitions with record syntax
2 parents 7fe3406 + 96f754c; commit 58c7187

29 files changed: +494 −208 lines
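At a glance, the change swaps the old string-literal declaration form for a record form. A before/after sketch, using a line taken from the `bin/hello_world.ml` hunk below:

    (* Before: the tensor [hey] is introduced by a string literal. *)
    let%op y = ("hey" * 'q' 2.0) + 'p' 1.0 in

    (* After: the same tensor introduced with record syntax; punning on
       [hey] keeps the default initialization. *)
    let%op y = ({ hey } * 'q' 2.0) + 'p' 1.0 in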

CLAUDE.md

Lines changed: 11 additions & 1 deletion
@@ -151,9 +151,19 @@ opam install cudajit # for CUDA backend
 - `%cd` requires `NTDSL` module in scope (from `Operation.NTDSL`)
 - `%op` requires `TDSL` module in scope (from `Operation.TDSL`)
-- Inline tensor declarations using string literals
+- Record syntax for inline tensor declarations: `{ tensor_name }` or `{ tensor_name = init_expr }`
 - Generalized einsum notation for complex tensor operations
+
+**Key differences between %op and %cd**:
+- `%op` allows initialization expressions (`{ x = uniform () }`), used for model parameters
+- `%cd` is self-referential only (`{ x }`), used in computation graphs where tensors are defined by operations
+
+**Record syntax features**:
+- OCaml punning: `{ x }` expands to default initialization (`uniform ()` for parameters in `%op`)
+- Shorthand field names: `o` → `output_dims`, `i` → `input_dims`, `b` → `batch_dims`
+- Additional fields map to labeled arguments of tensor creation functions
+- Dimension specification: lists `[...]` for output, tuples `(...)` for input, arrays `[|...|]` for batch
 
 ## Common Development Tasks
 
 ### Adding New Operations
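A minimal sketch of these `%op` features (the layer shape and the dimension value 16 are illustrative; the `uniform ()` and `o = [ ... ]` forms mirror the `lib/nn_blocks.ml` hunk below):

    (* Punning: under %op, { w } gets the default uniform () initialization. *)
    let%op f x = { w } * x in

    (* Explicit initialization expression, plus the [o] shorthand for output_dims. *)
    let%op layer x = relu (({ w = uniform () } * x) + { b = 0.; o = [ 16 ] }) in

Under `%cd`, only the self-referential `{ x }` form applies, since those tensors are defined by the operations of the computation graph.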

bin/compilation_speed.ml

Lines changed: 1 addition & 1 deletion
@@ -16,7 +16,7 @@ let benchmark_overhead backend () =
   CDSL.disable_all_debugs ();
   Stdio.prerr_endline @@ "\n\n****** Benchmarking " ^ Backend.name ^ " ******";
   let init_time = Time_now.nanoseconds_since_unix_epoch () in
-  let%op f = (3 *. ("x" [ 5 ] **. 2)) - (4 *. x) + 5 in
+  let%op f = (3 *. ({ x; o = [ 5 ] } **. 2)) - (4 *. x) + 5 in
   Train.set_hosted f.value;

   (* Train.every_non_literal_on_host f; *)

bin/hello_world.ml

Lines changed: 2 additions & 2 deletions
@@ -23,7 +23,7 @@ let hello1 () =
 let hello2 () =
   let module Backend = (val Backends.fresh_backend ()) in
   (* Hey is inferred to be a matrix. *)
-  let%op y = ("hey" * 'q' 2.0) + 'p' 1.0 in
+  let%op y = ({ hey } * 'q' 2.0) + 'p' 1.0 in
   (* Punning for ["hey"] above introduced the [hey] identifier. *)
   Train.every_non_literal_on_host y;
   ignore (Train.forward_once (module Backend) y);

@@ -106,7 +106,7 @@ let hello6 () =
   in

   (* "Hey" is inferred to be a scalar. *)
-  let%op y = 2 *. "hey" in
+  let%op y = 2 *. { hey } in
   ignore (Train.forward_once backend y);
   (* Train.printf ~here:[%here] ~with_code:false ~with_grad:false hey; *)
   Train.printf ~here:[%here] ~with_code:false ~with_grad:false y

bin/hello_world_op.ml

Lines changed: 3 additions & 3 deletions
@@ -27,7 +27,7 @@ let%track2_sexp _Pointwise_multiplication_dims_1 (() : unit) : unit =
   in

   (* "Hey" is inferred to be a scalar. *)
-  let%op ya = 2 *. "hey" 7.0 in
+  let%op ya = 2 *. { hey = 7.0 } in
   ignore (Train.forward_once backend ya);
   Train.printf ~here:[%here] ~with_code:false ~with_grad:false ya

@@ -44,7 +44,7 @@ let%track2_sexp _Matrix_multiplication_dims_1x1 (() : unit) : unit =
   in

   (* Hey is inferred to be a matrix because of matrix multiplication [*]. *)
-  let%op yb = ("hey" 7.0 * 'q' 2.0) + 'p' 1.0 in
+  let%op yb = ({ hey = 7.0 } * 'q' 2.0) + 'p' 1.0 in
   ignore (Train.forward_once backend yb);
   (* Punning for ["hey"] above introduced the [hey] identifier. *)
   Train.printf ~here:[%here] ~with_code:false ~with_grad:false hey;

@@ -172,7 +172,7 @@ let%track2_sexp _Matrix_multiplication_dims_2x3 (() : unit) : unit =
   in

   (* Hey is inferred to be a matrix. *)
-  let%op yc = ("hey" 7.0 * [ 2; 3 ]) + [ 4; 5; 6 ] in
+  let%op yc = ({ hey = 7.0 } * [ 2; 3 ]) + [ 4; 5; 6 ] in
   ignore (Train.forward_once backend yc);
   Train.printf ~here:[%here] ~with_code:false ~with_grad:false hey;
   Train.printf ~here:[%here] ~with_code:false ~with_grad:false yc

bin/micrograd_basic.ml

Lines changed: 2 additions & 2 deletions
@@ -9,7 +9,7 @@ let _get_local_debug_runtime = Utils.get_local_debug_runtime

 let%diagn_sexp () =
   let module Backend = (val Backends.fresh_backend ~backend_name:"multicore_cc" ()) in
-  let%op c = "a" [ -4 ] + "b" [ 2 ] in
+  let%op c = { a = [ -4 ] } + { b = [ 2 ] } in
   let%op d = c + c + 1 in
   (* let%op c = c + 1 + c + ~-a in *)
   (* Uncomment just the first "fully on host" line to see which arrays can be virtual, and just the

@@ -25,7 +25,7 @@ let%diagn_sexp () =
   Train.printf ~here:[%here] ~with_code:false ~with_grad:true b

 let%diagn_sexp _suspended () : unit =
-  let%op c = "a" [ -4 ] + "b" [ 2 ] in
+  let%op c = { a = [ -4 ] } + { b = [ 2 ] } in
   let%op d = (a *. b) + (b **. 3) in
   let%op c = c + c + 1 in
   let%op c = c + 1 + c + ~-a in

bin/micrograd_demo_logging.ml

Lines changed: 2 additions & 2 deletions
@@ -12,7 +12,7 @@ module type Backend = Ir.Backend_intf.Backend
 let () =
   Tensor.unsafe_reinitialize ();
   let module Backend = (val Backends.fresh_backend ()) in
-  let%op c = "a" [ -4 ] + "b" [ 2 ] in
+  let%op c = { a = [ -4 ] } + { b = [ 2 ] } in
   let%op d = (a *. b) + (b **. 3) in
   let%op c = c + c + 1 in
   let%op c = c + 1 + c + ~-a in

@@ -33,7 +33,7 @@ let () =
 let _suspended () =
   Tensor.unsafe_reinitialize ();
   let module Backend = (val Backends.fresh_backend ()) in
-  let%op c = "a" [ -4 ] + "b" [ 2 ] in
+  let%op c = { a = [ -4 ] } + { b = [ 2 ] } in
   let%op d = (a *. b) + (b **. 3) in
   let%op c = c + c + 1 in
   let%op c = c + 1 + c + ~-a in

bin/moons_benchmark.ml

Lines changed: 7 additions & 4 deletions
@@ -64,13 +64,16 @@ let classify_moons ~seed ~on_device ~inlining_cutoff ~num_streams ~batch_size ~b

   let init_time = Time_now.nanoseconds_since_unix_epoch () in
   let%op mlp x =
-    "w4"
+    { w4 }
     * relu
-        ("b3" hid_dim_3
-        + ("w3" * relu ("b2" hid_dim_2 + ("w2" * relu ("b1" hid_dim_1 + ("w1" * x))))))
+        ({ b3; o = [ hid_dim_3 ] }
+        + { w3 }
+          * relu
+              ({ b2; o = [ hid_dim_2 ] }
+              + ({ w2 } * relu ({ b1; o = [ hid_dim_1 ] } + ({ w1 } * x)))))
   in
   (* TINY for debugging: *)
-  (* let%op mlp x = "w2" * relu("b1" hid_dim + ("w1" * x)) in *)
+  (* let%op mlp x = { w2 } * relu({ b1; o = [ hid_dim ] } + ({ w1 } * x)) in *)
   let%op loss_fn ~output ~expectation = relu (!..1 - (expectation *. output)) in
   let start_time = ref None in
   let weight_decay = 0.0002 in
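Note how the bias declarations migrate: the old syntax passed the hidden dimension as a bare trailing argument, while the record syntax names it via the `o` (output_dims) shorthand. Side by side, from the hunk above:

    (* old *) "b3" hid_dim_3
    (* new *) { b3; o = [ hid_dim_3 ] }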

bin/zero2hero_1of7.ml

Lines changed: 4 additions & 4 deletions
@@ -17,7 +17,7 @@ let _get_local_debug_runtime = Utils.get_local_debug_runtime

 let _suspended () =
   let module Backend = (val Backends.fresh_backend ()) in
-  let%op v = ("w" [ (-3, 1) ] * "x" [ 2; 0 ]) + "b" [ 6.7 ] in
+  let%op v = ({ w = [ (-3, 1) ] } * { x = [ 2; 0 ] }) + { b = [ 6.7 ] } in
   Train.every_non_literal_on_host v;
   let code = Train.grad_update v in
   let stream = Backend.(new_stream @@ get_device ~ordinal:0) in

@@ -131,9 +131,9 @@ let _suspended () =
   ()

 let _suspended () =
-  let%op e = "a" [ 2 ] *. "b" [ -3 ] in
-  let%op d = e + "c" [ 10 ] in
-  let%op l = d *. "f" [ -2 ] in
+  let%op e = { a = [ 2 ] } *. { b = [ -3 ] } in
+  let%op d = e + { c = [ 10 ] } in
+  let%op l = d *. { f = [ -2 ] } in
   Train.every_non_literal_on_host l;
   let module Backend = (val Backends.fresh_backend ()) in
   let ctx = Train.update_once (module Backend) ~hosted:true l in

lib/nn_blocks.ml

Lines changed: 1 addition & 1 deletion
@@ -7,7 +7,7 @@ module NTDSL = Operation.NTDSL

 type mlp_layer_config = { label : string list; hid_dim : int }

-let%op mlp_layer ~config x = relu (("w" * x) + "b" config.hid_dim)
+let%op mlp_layer ~config x = relu (({ w = uniform () } * x) + { b = 0.; o = [ config.hid_dim ] })

 type mlp_config = { label : string list; hid_dims : int list }
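A hedged usage sketch of the updated layer; the call shape is assumed from the signature in the hunk, and the consumer of the `label` field is not shown in this diff:

    let config = { label = [ "layer1" ]; hid_dim = 16 } in
    (* [x] is an input tensor; [w] and [b] are created by mlp_layer itself. *)
    let y = mlp_layer ~config x in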

lib/operation.ml

Lines changed: 7 additions & 6 deletions
@@ -639,13 +639,14 @@ module TDSL = struct
   (** The default initialization operation for {!param} calls. *)
   let default_param_init = ref (uniform ~grad_spec:Require_grad)

-  let param ?value ?values =
+  let param ?value ?values ?param_init =
     let t =
-      match (value, values) with
-      | Some _, Some _ -> invalid_arg "TDSL.param: both value and values are set"
-      | Some value, None -> Tensor.term_init ~grad_spec:Require_grad [| value |]
-      | None, Some values -> Tensor.term_init ~grad_spec:Require_grad values
-      | None, None -> !default_param_init ()
+      match (value, values, param_init) with
+      | Some value, None, None -> Tensor.term_init ~grad_spec:Require_grad [| value |]
+      | None, Some values, None -> Tensor.term_init ~grad_spec:Require_grad values
+      | None, None, Some param_init -> param_init
+      | None, None, None -> !default_param_init ()
+      | _ -> invalid_arg "TDSL.param: at most one of value, values, and param_init can be set"
     in
     Tensor.param ~t
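The new `?param_init` argument lets a caller supply a ready-made initialization, with at most one of the three optional arguments permitted. A sketch of the resulting call patterns (call sites are hypothetical, and `TDSL.param` may take further arguments not visible in this hunk):

    param ~value:0.5                   (* init from a single value *)
    param ~values:[| 0.1; 0.2 |]       (* init from an array *)
    param ~param_init:(uniform ~grad_spec:Require_grad ())
                                       (* caller-supplied init, as with the
                                          { w = uniform () } record field *)
    param                              (* falls back to !default_param_init *)
    (* Combining two or more of these raises Invalid_argument. *)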
