Skip to content

Commit 153e04b

Browse files
committed
Fixed: correct surjectivity testing for initialization; problem spotted and fixed by Claude Opus with my guidance on the surjectivity algo/heuristic
Signed-off-by: Lukasz Stafiniak <lukstafi@gmail.com>
1 parent 2312d1d commit 153e04b

File tree

7 files changed

+363
-22
lines changed

7 files changed

+363
-22
lines changed

arrayjit/lib/assignments.ml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -96,7 +96,7 @@ let get_name_exn asgns =
9696
if String.is_empty result then invalid_arg "Assignments.get_name: no comments in code" else result
9797

9898
let is_total ~initialize_neutral ~projections =
99-
initialize_neutral && Indexing.is_bijective projections
99+
initialize_neutral && Indexing.is_surjective projections
100100

101101
(** Returns materialized nodes in the sense of {!Tnode.is_in_context_force}. NOTE: it must be called
102102
after compilation; otherwise, it will disrupt memory mode inference. *)

arrayjit/lib/indexing.ml

Lines changed: 33 additions & 19 deletions
Original file line numberDiff line numberDiff line change
@@ -149,10 +149,9 @@ let iterated dim = dim > 1
149149
let opt_symbol d = if iterated d then Some (get_symbol ()) else None
150150
let opt_iterator = function None -> Fixed_idx 0 | Some sym -> Iterator sym
151151

152-
let is_bijective proj =
153-
(* For bijection, we need the assignment to be both injective and surjective.
154-
We check surjectivity (all target positions are written) and that each source
155-
position maps to exactly one target position. *)
152+
let is_surjective proj =
153+
(* For surjectivity, we check if all target (LHS) positions will be written to.
154+
This is used to determine if we need to zero-initialize before assignment. *)
156155

157156
(* Check if there are any fixed indices (except Fixed_idx 0 when dim is 1) *)
158157
let has_non_trivial_fixed =
@@ -163,7 +162,7 @@ let is_bijective proj =
163162
in
164163
if has_non_trivial_fixed then false
165164
else
166-
(* Collect symbols used in LHS with their properties *)
165+
(* Collect symbols used in LHS *)
167166
let lhs_symbols, has_affine, has_sub_axis =
168167
Array.fold proj.project_lhs ~init:([], false, false)
169168
~f:(fun (syms, has_aff, has_sub) idx ->
@@ -181,24 +180,24 @@ let is_bijective proj =
181180
let lhs_symbol_set = Set.of_list (module Symbol) lhs_symbols in
182181
let product_symbol_set = Set.of_array (module Symbol) proj.product_iterators in
183182

184-
(* Basic check: All lhs symbols must be from product iterators (no bound symbols) *)
183+
(* All lhs symbols must be from product iterators (no bound symbols) *)
185184
if not (Set.is_subset lhs_symbol_set ~of_:product_symbol_set) then false
186185
else if has_sub_axis then
187-
(* Conservative: Sub_axis case is complex, so assume non-bijective.
186+
(* Conservative: Sub_axis case is complex, so assume non-surjective.
188187
This is pessimistic but safe - Sub_axis would require comparing
189188
lhs_dims and product_space dimensions carefully. *)
190189
false
191190
else if has_affine then
192-
(* For Affine indices: check that coefficient=1 symbols don't have
193-
dimensions smaller than any stride coefficients used *)
191+
(* For Affine indices with strides: check coefficient compatibility.
192+
A strided access pattern may skip elements. *)
194193
let symbol_dims =
195194
Array.filter_mapi proj.product_iterators ~f:(fun i sym ->
196195
if Set.mem lhs_symbol_set sym then Some (sym, proj.product_space.(i))
197196
else None)
198197
|> Array.to_list
199198
|> Map.of_alist_exn (module Symbol)
200199
in
201-
let check_affine_valid =
200+
let check_affine_surjective =
202201
Array.for_all proj.project_lhs ~f:(function
203202
| Affine { symbols; _ } ->
204203
(* Find max dimension of coeff=1 symbols *)
@@ -208,22 +207,37 @@ let is_bijective proj =
208207
|> List.max_elt ~compare:Int.compare
209208
|> Option.value ~default:Int.max_value
210209
in
211-
(* Check that it's not smaller than any stride coefficient *)
210+
(* Check that coeff=1 dimension is not smaller than any stride *)
212211
List.for_all symbols ~f:(fun (coeff, _) ->
213212
coeff = 1 || max_coeff1_dim >= coeff)
214213
| _ -> true)
215214
in
216-
if not check_affine_valid then false
215+
if not check_affine_surjective then false
217216
else
218-
(* Final check: number of unique symbols must equal number of LHS dims
219-
AND the symbols must equal product iterators *)
220-
Set.length lhs_symbol_set = Array.length proj.project_lhs
221-
&& Set.equal lhs_symbol_set product_symbol_set
217+
(* Check that we have enough unique symbols to cover all LHS dimensions *)
218+
Set.length lhs_symbol_set >= Array.length proj.project_lhs
222219
else
223220
(* Simple case: only Iterator and Fixed_idx *)
224-
(* Need all dimensions covered and symbols to match exactly *)
225-
Set.length lhs_symbol_set = Array.length proj.project_lhs
226-
&& Set.equal lhs_symbol_set product_symbol_set
221+
(* Need enough unique symbols to cover all dimensions *)
222+
Set.length lhs_symbol_set >= Array.length proj.project_lhs
223+
224+
(* For backwards compatibility, keep is_bijective as an alias that checks
225+
both surjectivity and injectivity (stricter than just surjectivity) *)
226+
let is_bijective proj =
227+
is_surjective proj &&
228+
let lhs_symbols =
229+
Array.concat_map proj.project_lhs ~f:(function
230+
| Iterator s -> [| s |]
231+
| Fixed_idx _ -> [||]
232+
| Affine { symbols; _ } ->
233+
List.filter_map symbols ~f:(fun (coeff, s) ->
234+
if coeff = 1 then Some s else None)
235+
|> Array.of_list
236+
| Sub_axis -> [||])
237+
|> Set.of_array (module Symbol)
238+
in
239+
(* For bijectivity, also need exact match of symbols *)
240+
Set.equal lhs_symbols (Set.of_array (module Symbol) proj.product_iterators)
227241

228242
(** Projections for a pointwise unary operator. Provide only one of [debug_info] or [derived_for].
229243
*)

bin/einsum_trivia.ml

Lines changed: 29 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -3,6 +3,7 @@ open Ocannl
33
module IDX = Train.IDX
44
module CDSL = Train.CDSL
55
module TDSL = Operation.TDSL
6+
module NTDSL = Operation.NTDSL
67

78
module type Backend = Ir.Backend_intf.Backend
89

@@ -37,7 +38,7 @@ let _suspended () =
3738
ignore (Train.forward_once backend ho2);
3839
Train.printf ~here:[%here] ~with_code:false ~with_grad:false ho2
3940

40-
let () =
41+
let _suspended () =
4142
let module Backend = (val Backends.fresh_backend ()) in
4243
let backend =
4344
(module Backend : Backend
@@ -59,3 +60,30 @@ let () =
5960
"a|i->h; b|h->o => i->o" b in Utils.capture_stdout_logs (fun () -> ignore (Train.forward_once backend f)); *)
6061
(* Train.printf ~here:[%here] ~with_code:false ~with_grad:false a2; *)
6162
Train.printf ~here:[%here] ~with_code:false ~with_grad:false c
63+
64+
let () =
65+
Tensor.unsafe_reinitialize ();
66+
let module Backend = (val Backends.fresh_backend ()) in
67+
let backend =
68+
(module Backend : Backend
69+
with type buffer_ptr = Backend.buffer_ptr
70+
and type dev = Backend.dev
71+
and type runner = Backend.runner
72+
and type event = Backend.event
73+
and type optimize_ctx = Backend.optimize_ctx)
74+
in
75+
76+
let ri = TDSL.range 3 in
77+
let%op ti = ri ++ "i=>i0" in
78+
(* Write position 2 of ti, otherwise shape inference concludes it's dim-1 and broadcasted. *)
79+
let%cd _ = ti =: 0 ++ "i=>i2" in
80+
let rj = TDSL.range 4 in
81+
let%op tj = rj ++ "j=>j1" in
82+
let rk = TDSL.range 5 in
83+
let%op tk = rk ++ "k=>k2" in
84+
let positions = TDSL.outer_sum "ijl;kl=>ijkl" (TDSL.outer_sum "il;jl=>ijl" ti tj ()) tk () in
85+
Train.set_hosted tk.value;
86+
ignore (Train.forward_once backend positions);
87+
Train.printf ~here:[%here] ~with_code:false ~with_grad:false positions;
88+
Train.printf ~here:[%here] ~with_code:false ~with_grad:false ti;
89+
Train.printf ~here:[%here] ~with_code:false ~with_grad:false tk

test/einsum/dune

Lines changed: 9 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -33,13 +33,21 @@
3333
(preprocess
3434
(pps ppx_here ppx_ocannl)))
3535

36+
(test
37+
(name test_surjectivity)
38+
(deps ocannl_config)
39+
(modules test_surjectivity)
40+
(libraries ocannl)
41+
(preprocess
42+
(pps ppx_here ppx_ocannl)))
43+
3644
(library
3745
(name einsum_tutorials)
3846
(package neural_nets_lib)
3947
(inline_tests
4048
(deps ocannl_config))
4149
(libraries base dynlink ocannl)
42-
(modules einsum_trivia)
50+
(modules einsum_trivia surjectivity)
4351
(preprocess
4452
(pps ppx_here ppx_expect ppx_inline_test ppx_ocannl))
4553
(modes best))

test/einsum/surjectivity.ml

Lines changed: 159 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,159 @@
1+
open Base
2+
open Ocannl
3+
module IDX = Train.IDX
4+
module CDSL = Train.CDSL
5+
module TDSL = Operation.TDSL
6+
module NTDSL = Operation.NTDSL
7+
8+
module type Backend = Ir.Backend_intf.Backend
9+
10+
let%expect_test "diagonal_tensor_initialization" =
11+
Tensor.unsafe_reinitialize ();
12+
let module Backend = (val Backends.fresh_backend ()) in
13+
let backend =
14+
(module Backend : Backend
15+
with type buffer_ptr = Backend.buffer_ptr
16+
and type dev = Backend.dev
17+
and type runner = Backend.runner
18+
and type event = Backend.event
19+
and type optimize_ctx = Backend.optimize_ctx)
20+
in
21+
22+
(* Create a diagonal tensor using einsum: i->ii *)
23+
let input = TDSL.range 5 in
24+
let%op diagonal = input ++ "i=>ii" in
25+
26+
(* Ensure the diagonal tensor is hosted *)
27+
Train.set_hosted diagonal.value;
28+
ignore (Train.forward_once backend diagonal);
29+
30+
(* Print the diagonal tensor *)
31+
Train.printf ~here:[%here] ~with_code:false ~with_grad:false diagonal;
32+
[%expect {|
33+
HERE: test/einsum/surjectivity.ml:31:21
34+
┌──────────────────────────────────────┐
35+
│[1]: =>_diagonal shape 0:6,1:6 │
36+
│┌──────┬─────────────────────────────┐│
37+
││ │axis 1 ││
38+
│├──────┼─────────────────────────────┤│
39+
││axis 0│ 0.00 0.00 ... 0.00 0.00 ││
40+
││ │ 0.00 1.00 ... 0.00 0.00 ││
41+
││ │ ... ... ... ... ... ││
42+
││ │ 0.00 0.00 ... 4.00 0.00 ││
43+
││ │ 0.00 0.00 ... 0.00 5.00 ││
44+
│└──────┴─────────────────────────────┘│
45+
└──────────────────────────────────────┘
46+
|}]
47+
48+
let%expect_test "sparse_assignment_with_fixed_indices" =
49+
Tensor.unsafe_reinitialize ();
50+
let module Backend = (val Backends.fresh_backend ()) in
51+
let backend =
52+
(module Backend : Backend
53+
with type buffer_ptr = Backend.buffer_ptr
54+
and type dev = Backend.dev
55+
and type runner = Backend.runner
56+
and type event = Backend.event
57+
and type optimize_ctx = Backend.optimize_ctx)
58+
in
59+
60+
(* Create a sparse tensor using fixed indices: i->i0j *)
61+
let input = TDSL.range 4 in
62+
let%op sparse = input ++ "i=>i0j" in
63+
64+
Train.set_hosted sparse.value;
65+
ignore (Train.forward_once backend sparse);
66+
67+
Train.printf ~here:[%here] ~with_code:false ~with_grad:false sparse;
68+
[%expect {|
69+
HERE: test/einsum/surjectivity.ml:64:21
70+
┌─────────────────────────────────┐
71+
│[1]: =>_sparse shape 0:5,1:1,2:1 │
72+
│┌──────┬──────┐ │
73+
││ │axis 2│ │
74+
│├──────┼──────┤ │
75+
││0 @ 0│ 0.00 │ │
76+
││axis 1│ │ │
77+
│├──────┼──────┤ │
78+
││1 @ 0│ 1.00 │ │
79+
││axis 1│ │ │
80+
│├──────┼──────┤ │
81+
││2 @ 0│ 2.00 │ │
82+
││axis 1│ │ │
83+
│├──────┼──────┤ │
84+
││3 @ 0│ 3.00 │ │
85+
││axis 1│ │ │
86+
│├──────┼──────┤ │
87+
││4 @ 0│ 4.00 │ │
88+
││axis 1│ │ │
89+
│└──────┴──────┘ │
90+
└─────────────────────────────────┘
91+
|}]
92+
93+
let%expect_test "multiple_sparse_axes" =
94+
Tensor.unsafe_reinitialize ();
95+
let module Backend = (val Backends.fresh_backend ()) in
96+
let backend =
97+
(module Backend : Backend
98+
with type buffer_ptr = Backend.buffer_ptr
99+
and type dev = Backend.dev
100+
and type runner = Backend.runner
101+
and type event = Backend.event
102+
and type optimize_ctx = Backend.optimize_ctx)
103+
in
104+
105+
(* Test with multiple fixed indices: ij->i1j2 *)
106+
let input = TDSL.range_of_shape ~output_dims:[3; 4] () in
107+
let%op sparse_multi = input ++ "ij=>i1j2" in
108+
109+
Train.set_hosted sparse_multi.value;
110+
ignore (Train.forward_once backend sparse_multi);
111+
112+
Train.printf ~here:[%here] ~with_code:false ~with_grad:false sparse_multi;
113+
[%expect {|
114+
HERE: test/einsum/surjectivity.ml:113:21
115+
┌───────────────────────────────────────────┐
116+
│[1]: =>_sparse_multi shape 0:3,1:2,2:4,3:3 │
117+
│┌──────┬──────────────────┐ │
118+
││0 @ 0 │axis 3 │ │
119+
│├──────┼──────────────────┤ │
120+
││0 @ 1│ 0.00 0.00 0.00 │ │
121+
││axis 2│ 0.00 0.00 0.00 │ │
122+
││ │ 0.00 0.00 0.00 │ │
123+
││ │ 0.00 0.00 0.00 │ │
124+
│├──────┼──────────────────┤ │
125+
││1 @ 10.00 0.00 0.00 │ │
126+
││axis 20.00 0.00 1.00 │ │
127+
││ │ 0.00 0.00 2.00 │ │
128+
││ │ 0.00 0.00 3.00 │ │
129+
│└──────┴──────────────────┘ │
130+
├───────────────────────────────────────────┤
131+
│┌──────┬──────────────────┐ │
132+
││1 @ 0 │axis 3 │ │
133+
│├──────┼──────────────────┤ │
134+
││0 @ 1│ 0.00 0.00 0.00 │ │
135+
││axis 2│ 0.00 0.00 0.00 │ │
136+
││ │ 0.00 0.00 0.00 │ │
137+
││ │ 0.00 0.00 0.00 │ │
138+
│├──────┼──────────────────┤ │
139+
││1 @ 1│ 0.00 0.00 4.00 │ │
140+
││axis 2│ 0.00 0.00 5.00 │ │
141+
││ │ 0.00 0.00 6.00 │ │
142+
││ │ 0.00 0.00 7.00 │ │
143+
│└──────┴──────────────────┘ │
144+
├───────────────────────────────────────────┤
145+
│┌──────┬─────────────────────┐ │
146+
││2 @ 0 │axis 3 │ │
147+
│├──────┼─────────────────────┤ │
148+
││0 @ 1│ 0.00 0.00 0.00 │ │
149+
││axis 2│ 0.00 0.00 0.00 │ │
150+
││ │ 0.00 0.00 0.00 │ │
151+
││ │ 0.00 0.00 0.00 │ │
152+
│├──────┼─────────────────────┤ │
153+
││1 @ 1│ 0.00 0.00 8.00 │ │
154+
││axis 2│ 0.00 0.00 9.00 │ │
155+
││ │ 0.00 0.00 1.00e+1 │ │
156+
││ │ 0.00 0.00 1.10e+1 │ │
157+
│└──────┴─────────────────────┘ │
158+
└───────────────────────────────────────────┘
159+
|}]
Lines changed: 54 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,54 @@
1+
Retrieving commandline, environment, or config file variable ocannl_log_level
2+
Found 0, in the config file
3+
4+
Testing diagonal tensor initialization:
5+
HERE: test/einsum/test_surjectivity.ml:24:21
6+
┌──────────────────────────────────────┐
7+
│[1]: =>_diagonal shape 0:6,1:6 │
8+
│┌──────┬─────────────────────────────┐│
9+
││ │axis 1 ││
10+
│├──────┼─────────────────────────────┤│
11+
││axis 0│ 0.00 0.00 ... 0.00 0.00 ││
12+
││ │ 0.00 1.00 ... 0.00 0.00 ││
13+
││ │ ... ... ... ... ... ││
14+
││ │ 0.00 0.00 ... 4.00 0.00 ││
15+
││ │ 0.00 0.00 ... 0.00 5.00 ││
16+
│└──────┴─────────────────────────────┘│
17+
└──────────────────────────────────────┘
18+
19+
20+
Testing sparse assignment with fixed index:
21+
HERE: test/einsum/test_surjectivity.ml:39:21
22+
┌─────────────────────────────┐
23+
│[1]: =>_sparse shape 0:5,1:1 │
24+
│┌──────┬──────┐ │
25+
││ │axis 1│ │
26+
│├──────┼──────┤ │
27+
││axis 0│ 0.00 │ │
28+
││ │ 1.00 │ │
29+
││ │ 2.00 │ │
30+
││ │ 3.00 │ │
31+
││ │ 4.00 │ │
32+
│└──────┴──────┘ │
33+
└─────────────────────────────┘
34+
35+
36+
Testing multiple sparse axes:
37+
HERE: test/einsum/test_surjectivity.ml:54:21
38+
┌───────────────────────────────────────┐
39+
│[1]: =>_result shape 0:3,1:2,2:4 │
40+
│┌──────┬──────────────────────────────┐│
41+
││ │axis 2 ││
42+
│├──────┼──────────────────────────────┤│
43+
││0 @ 0 │ 0.00 0.00 0.00 0.00 ││
44+
││axis 1│ 0.00 1.00 2.00 3.00 ││
45+
│├──────┼──────────────────────────────┤│
46+
││1 @ 0 │ 0.00 0.00 0.00 0.00 ││
47+
││axis 1│ 4.00 5.00 6.00 7.00 ││
48+
│├──────┼──────────────────────────────┤│
49+
││2 @ 0 │ 0.00 0.00 0.00 0.00 ││
50+
││axis 1│ 8.00 9.00 1.00e+1 1.10e+1 ││
51+
│└──────┴──────────────────────────────┘│
52+
└───────────────────────────────────────┘
53+
54+
All surjectivity tests completed.

0 commit comments

Comments
 (0)