ahrefs
diff --git a/‎bin/einsum_trivia.ml‎
Lines changed: 6 additions & 6 deletions b/‎bin/einsum_trivia.ml‎
Lines changed: 6 additions & 6 deletions
diff --git a/‎lib/ppx_cd.ml‎
Lines changed: 2 additions & 2 deletions b/‎lib/ppx_cd.ml‎
Lines changed: 2 additions & 2 deletions
diff --git a/‎lib/ppx_op.ml‎
Lines changed: 2 additions & 2 deletions b/‎lib/ppx_op.ml‎
Lines changed: 2 additions & 2 deletions
diff --git a/‎lib/syntax_extensions.md‎
Lines changed: 6 additions & 6 deletions b/‎lib/syntax_extensions.md‎
Lines changed: 6 additions & 6 deletions
diff --git a/‎test/einsum/einsum_trivia.ml‎
Lines changed: 12 additions & 12 deletions b/‎test/einsum/einsum_trivia.ml‎
Lines changed: 12 additions & 12 deletions
@@ -10,7 +10,7 @@ let _suspended () =
   let module Backend = (val Backends.fresh_backend ()) in
   let a = TDSL.range_of_shape ~label:[ "a" ] ~input_dims:[ 2 ] ~output_dims:[ 2 ] () in
   let b = TDSL.range_of_shape ~label:[ "b" ] ~input_dims:[ 2; 3; 4 ] ~output_dims:[ 2 ] () in
-  let%op c = a *+ "i->1; ij...->0 => ...->ji" b in
+  let%op c = a +* "i->1; ij...->0 => ...->ji" b in
   ignore (Train.forward_once (module Backend) c);
   Train.printf ~here:[%here] ~with_code:false ~with_grad:false c;
   Stdio.printf "\n%!"
@@ -50,12 +50,12 @@ let _suspended () =
 
   let a = TDSL.range_of_shape ~batch_dims:[ 2 ] ~input_dims:[ 3 ] ~output_dims:[ 4 ] () in
   let b = TDSL.range_of_shape ~batch_dims:[ 2 ] ~input_dims:[ 4 ] ~output_dims:[ 5 ] () in
-  let%op _ = a *+ "b|i->o; b|i->o => b|i->o" a in
-  let%op c = b *+ "b|h->o; b|i->h => b|i->o" a in
+  let%op _ = a +* "b|i->o; b|i->o => b|i->o" a in
+  let%op c = b +* "b|h->o; b|i->h => b|i->o" a in
   Utils.capture_stdout_logs (fun () -> ignore (Train.forward_once backend c));
-  (* let%op d = a *+ "a|i->h; b|h->o => ab|i->o" b in Utils.capture_stdout_logs (fun () ->
-     ignore (Train.forward_once backend d)); let%op e = a *+ "b|i->h; b|h->o => i->o" b in
-     Utils.capture_stdout_logs (fun () -> ignore (Train.forward_once backend e)); let%op f = a *+
+  (* let%op d = a +* "a|i->h; b|h->o => ab|i->o" b in Utils.capture_stdout_logs (fun () ->
+     ignore (Train.forward_once backend d)); let%op e = a +* "b|i->h; b|h->o => i->o" b in
+     Utils.capture_stdout_logs (fun () -> ignore (Train.forward_once backend e)); let%op f = a +*
      "a|i->h; b|h->o => i->o" b in Utils.capture_stdout_logs (fun () -> ignore (Train.forward_once backend f)); *)
   (* Train.printf ~here:[%here] ~with_code:false ~with_grad:false a2; *)
   Train.printf ~here:[%here] ~with_code:false ~with_grad:false c
 
@@ -992,7 +992,7 @@ let translate ?ident_label (expr : expression) : result =
         { res1 with typ = Tensor; expr = [%expr NTDSL.O.( **. ) [%e res1.expr] [%e expr2]] }
     | [%expr
         [%e? expr1]
-        *+ [%e? { pexp_desc = Pexp_constant (Pconst_string (spec_str, _, _)); _ }] [%e? expr2]]
+        +* [%e? { pexp_desc = Pexp_constant (Pconst_string (spec_str, _, _)); _ }] [%e? expr2]]
       when String.contains spec_str '>' ->
         let res1 = loop ~proj_in_scope expr1 in
         let res2 = loop ~proj_in_scope expr2 in
@@ -1007,7 +1007,7 @@ let translate ?ident_label (expr : expression) : result =
         }
     | [%expr
         [%e? expr1]
-        *+ [%e? { pexp_desc = Pexp_constant (Pconst_string (spec_str, _, _)); _ }]
+        +* [%e? { pexp_desc = Pexp_constant (Pconst_string (spec_str, _, _)); _ }]
              ([%e? { pexp_desc = Pexp_constant (Pconst_string _); _ } as head] :: [%e? rest])
              [%e? expr2]]
       when String.contains spec_str '>' ->
 
@@ -185,7 +185,7 @@ let rec translate ~num_configs ~is_toplevel ~opt_label ?label expr =
       )
   | [%expr
       [%e? expr1]
-      *+ [%e? { pexp_desc = Pexp_constant (Pconst_string (spec_str, _, _)); _ }] [%e? expr2]]
+      +* [%e? { pexp_desc = Pexp_constant (Pconst_string (spec_str, _, _)); _ }] [%e? expr2]]
     when String.contains spec_str '>' ->
       let vbs1, e1 = loop expr1 in
       let vbs2, e2 = loop expr2 in
@@ -199,7 +199,7 @@ let rec translate ~num_configs ~is_toplevel ~opt_label ?label expr =
       (vbs1, [%expr einsum1 ?label:[%e opt_expr ~loc label] [%e spec] [%e e1]])
   | [%expr
       [%e? expr1]
-      *+ [%e? { pexp_desc = Pexp_constant (Pconst_string (spec_str, _, _)); _ }]
+      +* [%e? { pexp_desc = Pexp_constant (Pconst_string (spec_str, _, _)); _ }]
            ([%e? { pexp_desc = Pexp_constant (Pconst_string _); _ } as head] :: [%e? rest])
            [%e? expr2]]
     when String.contains spec_str '>' ->
 
@@ -212,7 +212,7 @@ type Assignments.t =
 
 For example the binary case in pseudocode: `if initialize_neutral then lhs = 0; lhs = lhs accum (rhs1 op rhs2)` (assuming the neutral element of `accum` is 0). The representation also has a field `projections` which determines which loops should be run and how the tensor nodes should be indexed to perform the computation.
 
-The basic `%cd` syntax for assignments has the form: `<lhs> <asgn-op> <primitive-op-application[rhs1, rhs2?, rhs3?]>`. See [Primitive operations](#primitive-operations) for the syntax of primitive operation application, where `<rhs1>`, `<rhs2>` (for binary and ternary ops), `<rhs3>` (for ternary ops) are subexpressions. `<asgn-op>` starts with `=`, followed by `:` only if `initialize_neutral` is true, then followed by the operator syntax variant of a binary primitive operation. The fields `<lhs>`, `<rhs1>`, `<rhs2>`, `<rhs3>` will often be either special-purpose identifiers (specifically `v`, `t`, `t1`, `t2`, `t3`, `g`, `g1`, `g2`, `g3`) or identifiers bound to tensors. `<rhs1>`, `<rsh2>`, `<rsh3>` will also often be (non-differentiable) tensor expressions. The notation `<tensor>.grad` stands for the gradient node of the given tensor. For more about "slot fillers", and to learn about the operators `*+` and `++`, see the section [further features of the syntax extension %cd](#further-features-of-the-syntax-extension-cd).
+The basic `%cd` syntax for assignments has the form: `<lhs> <asgn-op> <primitive-op-application[rhs1, rhs2?, rhs3?]>`. See [Primitive operations](#primitive-operations) for the syntax of primitive operation application, where `<rhs1>`, `<rhs2>` (for binary and ternary ops), `<rhs3>` (for ternary ops) are subexpressions. `<asgn-op>` starts with `=`, followed by `:` only if `initialize_neutral` is true, then followed by the operator syntax variant of a binary primitive operation. The fields `<lhs>`, `<rhs1>`, `<rhs2>`, `<rhs3>` will often be either special-purpose identifiers (specifically `v`, `t`, `t1`, `t2`, `t3`, `g`, `g1`, `g2`, `g3`) or identifiers bound to tensors. `<rhs1>`, `<rhs2>`, `<rhs3>` will also often be (non-differentiable) tensor expressions. The notation `<tensor>.grad` stands for the gradient node of the given tensor. For more about "slot fillers", and to learn about the operators `+*` and `++`, see the section [further features of the syntax extension %cd](#further-features-of-the-syntax-extension-cd).
 
 How is the `projections` field determined? `projections` can be given explicitly as a labeled argument `~projections`. If they aren't but `%cd` realizes there is a `~projections` parameter in scope, it uses it -- see `lib/operation.ml` where this option is used to define tensor operations. If instead of `~projections` a `~logic` labeled argument is given, the string passed is used to determine projections. `~logic:"."` means a pointwise operation. `~logic:"@"` means an "output axes of rhs2 match input axes of rhs1" operation (matrix multiplication is a special case). `~logic:"T"` means transpose of input and output axes. The string passed to `~logic` can also use OCANNL's generalization of the einsum notation, allowing arbitrary permutations and reductions of axes. If no information is given, the default depends on the primitive operation, but it is almost always a pointwise operation.
 
@@ -318,9 +318,9 @@ let%op mlp_layer ~label ~hid_dim () x = relu ({ w } * x + { b; o = [ hid_dim ] }
 
 ## Using OCANNL's generalized einsum notation
 
-As we mentioned above, in the `%cd` syntax you can set up an arbitrary assignment with projections derived from a generalized einsum specification, by passing the specification as a string with the `~logic` label. However, both the `%cd` and `%op` syntaxes support built-in operators that take an einsum specification: `*+` binding to `NTDSL.einsum` resp. `TDSL.einsum`, and `++` binding to `NTDSL.einsum1` resp. `TDSL.einsum1`. `*+` is a "ternary" operator, binary wrt. tensor arguments, and `++` is a binary operator, unary postfix wrt. tensor arguments. The einsum specification string should directly follow `*+` and `++`.
+As we mentioned above, in the `%cd` syntax you can set up an arbitrary assignment with projections derived from a generalized einsum specification, by passing the specification as a string with the `~logic` label. However, both the `%cd` and `%op` syntaxes support built-in operators that take an einsum specification: `+*` binding to `NTDSL.einsum` resp. `TDSL.einsum`, and `++` binding to `NTDSL.einsum1` resp. `TDSL.einsum1`. `+*` is a "ternary" operator, binary wrt. tensor arguments, and `++` is a binary operator, unary postfix wrt. tensor arguments. The einsum specification string should directly follow `+*` and `++`.
 
-Both `*+` and `++` use addition for the accumulation operation; `*+` uses multiplication. You can verify that looking at the `Operation.einsum` and `Operation.einsum1` definitions. You can find examples of `*+` and `++` behavior in the test suite [einsum_trivia.ml](test/einsum_trivia.ml). A frequent use-case for `++` is to sum out all axes of a tensor:
+Both `+*` and `++` use addition for the accumulation operation; `+*` additionally uses multiplication as the binary operation combining its two tensor arguments. You can verify that by looking at the `Operation.einsum` and `Operation.einsum1` definitions. You can find examples of `+*` and `++` behavior in the test suite [einsum_trivia.ml](test/einsum/einsum_trivia.ml). A frequent use-case for `++` is to sum out all axes of a tensor:
 
 ```ocaml
   let%op scalar_loss = (margin_loss ++ "...|... => 0") /. !..batch_size in
@@ -365,8 +365,8 @@ The syntax of an axis spec:
 - A number specifies the particular dimension within the axis,
 - A `+` sign specifies a convolution input axis with the output on the left of `+` and the kernel on the right of `+`.
   - In both the output part and the kernel part you can prefix the axis variable by a constant coefficient with the `*` sign.
-  - The coefficient can directly only be an integer, e.g. `"2*i+3*k"`, but under the `%op` and `%cd` syntax extensions, it can also be an identifier of an integer value, e.g. `let stride = 2 and dilation = 3 in [%op "input" *+ "stride * a + dilation * b; b=>a," "kernel"]`.
-  - Note the comma above. The syntax extension's expansion of stride and dilation respects the "multichar" mode. Without the comma we are limited to single-character identifiers, e.g. `let s = 2 and d = 3 in [%op "input" *+ "is*a+d*bc;b=>iac" "kernel"]`.
+  - When written directly in the specification, the coefficient can only be an integer, e.g. `"2*i+3*k"`, but under the `%op` and `%cd` syntax extensions, it can also be an identifier of an integer value, e.g. `let stride = 2 and dilation = 3 in [%op "input" +* "stride * a + dilation * b; b=>a," "kernel"]`.
+  - Note the comma above. The syntax extension's expansion of stride and dilation respects the "multichar" mode. Without the comma we are limited to single-character identifiers, e.g. `let s = 2 and d = 3 in [%op "input" +* "is*a+d*bc;b=>iac" "kernel"]`.
 
 Examples:
 
@@ -385,7 +385,7 @@ Examples:
 
 ### Capturing the dimensions of selected axes for further computation or to add shape constraints
 
-The syntaxes `*+` and `++` accept an optional list of strings argument after the specification string. When passed, the strings should be some of the identifiers used in the specification. Both dimension variable and row variable labels are supported. This will introduce bindings for `Indexing.variable_ref` objects at the same point as the inline parameter definition bindings, and will pass these objects with the `~capture_dims` argument to `einsum` resp. `einsum1`. The bound objects can later be used with `Operation.embed_dim` or its alias `Operation.TDSL.O.dim` to embed the solved dimension of the corresponding variable (as a number) into a tensor expression. For a row variable, the number will be the product of the dimensions it resolved into.
+The syntaxes `+*` and `++` accept an optional list of strings argument after the specification string. When passed, the strings should be some of the identifiers used in the specification. Both dimension variable and row variable labels are supported. This will introduce bindings for `Indexing.variable_ref` objects at the same point as the inline parameter definition bindings, and will pass these objects with the `~capture_dims` argument to `einsum` resp. `einsum1`. The bound objects can later be used with `Operation.embed_dim` or its alias `Operation.TDSL.O.dim` to embed the solved dimension of the corresponding variable (as a number) into a tensor expression. For a row variable, the number will be the product of the dimensions it resolved into.
 
 ## Further features of the syntax extension %cd
 
 
@@ -225,7 +225,7 @@ let%expect_test "einsum outer product" =
 
   let a = TDSL.range_of_shape ~batch_dims:[] ~input_dims:[] ~output_dims:[ 2 ] () in
   let b = TDSL.range_of_shape ~batch_dims:[] ~input_dims:[] ~output_dims:[ 3 ] () in
-  let%op c = (a + 1) *+ "i; j => i->j" b in
+  let%op c = (a + 1) +* "i; j => i->j" b in
   ignore (Train.forward_once backend c);
   Train.printf ~here:[%here] ~with_code:false ~with_grad:false c;
   [%expect
@@ -244,7 +244,7 @@ let%expect_test "einsum outer product" =
     |}];
   let a = TDSL.range_of_shape ~batch_dims:[ 2 ] ~input_dims:[ 3 ] ~output_dims:[ 4 ] () in
   let b = TDSL.range_of_shape ~batch_dims:[ 5 ] ~input_dims:[ 6 ] ~output_dims:[ 7 ] () in
-  let%op c = a *+ "i|j->k; l|m->n => il|jm->kn" b in
+  let%op c = a +* "i|j->k; l|m->n => il|jm->kn" b in
   ignore (Train.forward_once backend c);
   Train.printf ~here:[%here] ~with_code:false ~with_grad:false c;
   [%expect
@@ -413,15 +413,15 @@ let%expect_test "einsum matrix/inner+outer products" =
 
   let a = TDSL.range_of_shape ~batch_dims:[ 2 ] ~input_dims:[ 3 ] ~output_dims:[ 4 ] () in
   let b = TDSL.range_of_shape ~batch_dims:[ 2 ] ~input_dims:[ 4 ] ~output_dims:[ 5 ] () in
-  let%op a2 = a *+ "b|i->o; b|i->o => b|i->o" a in
+  let%op a2 = a +* "b|i->o; b|i->o => b|i->o" a in
   let ctx = Train.forward_once backend a2 in
-  let%op c = b *+ "b|h->o; b|i->h => b|i->o" a in
+  let%op c = b +* "b|h->o; b|i->h => b|i->o" a in
   let ctx = Train.forward_once backend ~ctx c in
-  let%op d = a *+ "a|i->h; b|h->o => ab|i->o" b in
+  let%op d = a +* "a|i->h; b|h->o => ab|i->o" b in
   ignore (Train.forward_once backend ~ctx d);
-  let%op e = a *+ "b|i->h; b|h->o => i->o" b in
+  let%op e = a +* "b|i->h; b|h->o => i->o" b in
   ignore (Train.forward_once backend ~ctx e);
-  let%op f = a *+ "a|i->h; b|h->o => i->o" b in
+  let%op f = a +* "a|i->h; b|h->o => i->o" b in
   ignore (Train.forward_once backend ~ctx f);
   Train.printf ~here:[%here] ~with_code:false ~with_grad:false a2;
   [%expect
@@ -792,7 +792,7 @@ let%expect_test "einsum broadcast or sum out prefix axes" =
 
   let a = TDSL.range_of_shape ~batch_dims:[ 3 ] ~input_dims:[ 4 ] ~output_dims:[ 2 ] () in
   let b = TDSL.range_of_shape ~batch_dims:[ 3 ] ~input_dims:[ 1 ] ~output_dims:[ 4 ] () in
-  let%op c = a *+ "...|i->...; ...|...->i => ...|i" b in
+  let%op c = a +* "...|i->...; ...|...->i => ...|i" b in
   ignore (Train.forward_once backend c);
   Train.printf ~here:[%here] ~with_code:false ~with_grad:false c;
   [%expect
@@ -812,7 +812,7 @@ let%expect_test "einsum broadcast or sum out prefix axes" =
   (* Broadcast with a shift. *)
   let d = TDSL.range_of_shape ~input_dims:[ 2 ] ~output_dims:[ 3 ] () in
   let e = TDSL.range_of_shape ~input_dims:[ 4 ] ~output_dims:[ 3 ] () in
-  let%op f = d *+ "i->...;j->... => ...ij" e in
+  let%op f = d +* "i->...;j->... => ...ij" e in
   ignore (Train.forward_once backend f);
   Train.printf ~here:[%here] ~with_code:false ~with_grad:false f;
   [%expect
@@ -930,7 +930,7 @@ let%expect_test "einsum with fixed dim axes" =
 
   let a = TDSL.range_of_shape ~batch_dims:[ 3 ] ~input_dims:[ 4 ] ~output_dims:[ 2 ] () in
   let b = TDSL.range_of_shape ~batch_dims:[ 3 ] ~input_dims:[ 1 ] ~output_dims:[ 4 ] () in
-  let%op c = a *+ "...|i->1; ...|...->i => ...|i" b in
+  let%op c = a +* "...|i->1; ...|...->i => ...|i" b in
   ignore (Train.forward_once backend c);
   Train.printf ~here:[%here] ~with_code:false ~with_grad:false c;
   [%expect
@@ -1156,7 +1156,7 @@ let%expect_test "einsum with a leftmost input axis preserved as output axis" =
   let b =
     TDSL.range_of_shape ~label:[ "b" ] ~batch_dims:[ 3 ] ~input_dims:[ 2; 3 ] ~output_dims:[ 4 ] ()
   in
-  let%op c = a *+ "...|i->1; ...|j...->i => ...|ij" b in
+  let%op c = a +* "...|i->1; ...|j...->i => ...|ij" b in
   ignore (Train.forward_once backend c);
   Train.printf ~here:[%here] ~with_code:false ~with_grad:false c;
   [%expect
@@ -1190,7 +1190,7 @@ let%expect_test "einsum permuting two leftmost input axes as output axes" =
 
   let a = TDSL.range_of_shape ~label:[ "a" ] ~input_dims:[ 2 ] ~output_dims:[ 2 ] () in
   let b = TDSL.range_of_shape ~label:[ "b" ] ~input_dims:[ 2; 3; 4 ] ~output_dims:[ 2 ] () in
-  let%op c = a *+ "i->1; ij...->0 => ...->ji" b in
+  let%op c = a +* "i->1; ij...->0 => ...->ji" b in
   ignore (Train.forward_once backend c);
   Train.printf ~here:[%here] ~with_code:false ~with_grad:false c;
   [%expect