Formatting

lukstafi · lukstafi · commit 4acb6df4cc4b · 2025-08-31T15:49:32.000+02:00
diff --git a/arrayjit/lib/c_syntax.ml b/arrayjit/lib/c_syntax.ml
@@ -312,9 +312,10 @@ module C_syntax (B : C_syntax_config) = struct
     | For_loop { index = i; from_; to_; body; trace_it = _ } ->
         let header =
           let idx_type = if Utils.settings.big_models then "uint64_t " else "uint32_t " in
-          string ("for (" ^ idx_type) ^^ pp_symbol i ^^ string " = " ^^ PPrint.OCaml.int from_ ^^ semi
-          ^^ space ^^ pp_symbol i ^^ string " <= " ^^ PPrint.OCaml.int to_ ^^ semi ^^ space
-          ^^ string "++" ^^ pp_symbol i ^^ string ")"
+          string ("for (" ^ idx_type)
+          ^^ pp_symbol i ^^ string " = " ^^ PPrint.OCaml.int from_ ^^ semi ^^ space ^^ pp_symbol i
+          ^^ string " <= " ^^ PPrint.OCaml.int to_ ^^ semi ^^ space ^^ string "++" ^^ pp_symbol i
+          ^^ string ")"
         in
         let body_doc = ref (pp_ll body) in
         (if Utils.debug_log_from_routines () then
diff --git a/arrayjit/lib/metal_backend.ml b/arrayjit/lib/metal_backend.ml
@@ -433,7 +433,9 @@ end) : Ir.Backend_impl.Lowered_backend = struct
     let main_kernel_prefix = "kernel"
     let buffer_prefix = "device "
     let buffer_suffix = fun ~pos -> " [[buffer(" ^ Int.to_string pos ^ ")]]"
-    let arg_int_prefix = if Utils.settings.big_models then "const uint64_t& " else "const uint32_t& "
+
+    let arg_int_prefix =
+      if Utils.settings.big_models then "const uint64_t& " else "const uint32_t& "
 
     let extra_args =
       [
diff --git a/arrayjit/lib/ops.ml b/arrayjit/lib/ops.ml
@@ -17,9 +17,11 @@ type ('ocaml, 'impl) precision =
   | Byte : (char, uint8_elt) precision
   | Uint16 : (int, uint16_elt) precision
   | Int32 : (int32, int32_elt) precision
-  | Uint32 : (int32, int32_elt) precision  (** Using int32_elt representation but treating as unsigned *)
+  | Uint32 : (int32, int32_elt) precision
+      (** Using int32_elt representation but treating as unsigned *)
   | Int64 : (int64, int64_elt) precision
-  | Uint64 : (int64, int64_elt) precision  (** Using int64_elt representation but treating as unsigned *)
+  | Uint64 : (int64, int64_elt) precision
+      (** Using int64_elt representation but treating as unsigned *)
   | Uint4x32 : (Stdlib.Complex.t, Bigarray.complex64_elt) precision
       (** A 128-bit value that corresponds to e.g. CUDA's uint4 type. Luckily, the OCaml Bigarray
           library supports complex64_elt which is a 128-bit value, so we avoid dims conversions. *)
@@ -563,21 +565,32 @@ let binop_c_syntax prec v =
   | Mul, _ -> ("(", " *", ")")
   | Div, _ -> ("(", " /", ")")
   | ToPowOf, Double_prec _ -> ("pow(", ",", ")")
-  | ToPowOf, (Byte_prec _ | Uint16_prec _ | Int32_prec _ | Uint32_prec _ | Int64_prec _ | Uint64_prec _ | Fp8_prec _) ->
+  | ( ToPowOf,
+      ( Byte_prec _ | Uint16_prec _ | Int32_prec _ | Uint32_prec _ | Int64_prec _ | Uint64_prec _
+      | Fp8_prec _ ) ) ->
       invalid_arg "Ops.binop_c_syntax: ToPowOf not supported for integer precisions"
   | ToPowOf, _ -> ("powf(", ",", ")")
-  | Relu_gate, (Byte_prec _ | Uint16_prec _ | Int32_prec _ | Uint32_prec _ | Int64_prec _ | Uint64_prec _ | Fp8_prec _) -> ("(", " > 0 ?", " : 0)")
+  | ( Relu_gate,
+      ( Byte_prec _ | Uint16_prec _ | Int32_prec _ | Uint32_prec _ | Int64_prec _ | Uint64_prec _
+      | Fp8_prec _ ) ) ->
+      ("(", " > 0 ?", " : 0)")
   | Relu_gate, _ -> ("(", " > 0.0 ?", " : 0.0)")
-  | Satur01_gate, (Byte_prec _ | Uint16_prec _ | Int32_prec _ | Uint32_prec _ | Int64_prec _ | Uint64_prec _ | Fp8_prec _) ->
+  | ( Satur01_gate,
+      ( Byte_prec _ | Uint16_prec _ | Int32_prec _ | Uint32_prec _ | Int64_prec _ | Uint64_prec _
+      | Fp8_prec _ ) ) ->
       ("(abs(", " ) > 0 ? 0 : (", "))")
   | Satur01_gate, Single_prec _ ->
       (* This disagrees at 0 with the semantics. *)
       ("(fabsf(floorf(", ")) > 0.0 ? 0.0 : (", "))")
   | Satur01_gate, _ -> ("(fabs(floor(", ")) > 0.0 ? 0.0 : (", "))")
-  | Max, (Double_prec _ | Byte_prec _ | Uint16_prec _ | Int32_prec _ | Uint32_prec _ | Int64_prec _ | Uint64_prec _ | Fp8_prec _) ->
+  | ( Max,
+      ( Double_prec _ | Byte_prec _ | Uint16_prec _ | Int32_prec _ | Uint32_prec _ | Int64_prec _
+      | Uint64_prec _ | Fp8_prec _ ) ) ->
       ("fmax(", ",", ")")
   | Max, _ -> ("fmaxf(", ",", ")")
-  | Min, (Double_prec _ | Byte_prec _ | Uint16_prec _ | Int32_prec _ | Uint32_prec _ | Int64_prec _ | Uint64_prec _ | Fp8_prec _) ->
+  | ( Min,
+      ( Double_prec _ | Byte_prec _ | Uint16_prec _ | Int32_prec _ | Uint32_prec _ | Int64_prec _
+      | Uint64_prec _ | Fp8_prec _ ) ) ->
       ("fmin(", ",", ")")
   | Min, _ -> ("fminf(", ",", ")")
   | Mod, _ -> ("(", " %", ")")
@@ -654,43 +667,80 @@ let unop_c_syntax prec op =
   let fmax () =
     (* See: https://en.cppreference.com/w/c/numeric/math/fmax option (4) *)
     match prec with
-    | Double_prec _ | Byte_prec _ | Uint16_prec _ | Int32_prec _ | Uint32_prec _ | Int64_prec _ | Uint64_prec _ | Fp8_prec _ -> "fmax"
+    | Double_prec _ | Byte_prec _ | Uint16_prec _ | Int32_prec _ | Uint32_prec _ | Int64_prec _
+    | Uint64_prec _ | Fp8_prec _ ->
+        "fmax"
     | _ -> "fmaxf"
   in
   let fmin () =
     match prec with
-    | Double_prec _ | Byte_prec _ | Uint16_prec _ | Int32_prec _ | Uint32_prec _ | Int64_prec _ | Uint64_prec _ | Fp8_prec _ -> "fmin"
+    | Double_prec _ | Byte_prec _ | Uint16_prec _ | Int32_prec _ | Uint32_prec _ | Int64_prec _
+    | Uint64_prec _ | Fp8_prec _ ->
+        "fmin"
     | _ -> "fminf"
   in
   match (op, prec) with
   | Identity, _ -> ("", "")
-  | Relu, (Byte_prec _ | Uint16_prec _ | Int32_prec _ | Uint32_prec _ | Int64_prec _ | Uint64_prec _ | Fp8_prec _) -> ("fmax(0, ", ")")
+  | ( Relu,
+      ( Byte_prec _ | Uint16_prec _ | Int32_prec _ | Uint32_prec _ | Int64_prec _ | Uint64_prec _
+      | Fp8_prec _ ) ) ->
+      ("fmax(0, ", ")")
   | Relu, _ -> (fmax () ^ "(0.0, ", ")")
-  | Satur01, (Byte_prec _ | Uint16_prec _ | Int32_prec _ | Uint32_prec _ | Int64_prec _ | Uint64_prec _ | Fp8_prec _) -> ("fmax(0, fmin(1, ", "))")
+  | ( Satur01,
+      ( Byte_prec _ | Uint16_prec _ | Int32_prec _ | Uint32_prec _ | Int64_prec _ | Uint64_prec _
+      | Fp8_prec _ ) ) ->
+      ("fmax(0, fmin(1, ", "))")
   | Satur01, _ -> (fmax () ^ "(0.0, " ^ fmin () ^ "(1.0, ", "))")
-  | Exp, (Double_prec _ | Byte_prec _ | Uint16_prec _ | Int32_prec _ | Uint32_prec _ | Int64_prec _ | Uint64_prec _ | Fp8_prec _) -> ("exp(", ")")
+  | ( Exp,
+      ( Double_prec _ | Byte_prec _ | Uint16_prec _ | Int32_prec _ | Uint32_prec _ | Int64_prec _
+      | Uint64_prec _ | Fp8_prec _ ) ) ->
+      ("exp(", ")")
   | Exp, _ -> ("expf(", ")")
-  | Log, (Double_prec _ | Byte_prec _ | Uint16_prec _ | Int32_prec _ | Uint32_prec _ | Int64_prec _ | Uint64_prec _ | Fp8_prec _) -> ("log(", ")")
+  | ( Log,
+      ( Double_prec _ | Byte_prec _ | Uint16_prec _ | Int32_prec _ | Uint32_prec _ | Int64_prec _
+      | Uint64_prec _ | Fp8_prec _ ) ) ->
+      ("log(", ")")
   | Log, _ -> ("logf(", ")")
-  | Exp2, (Double_prec _ | Byte_prec _ | Uint16_prec _ | Int32_prec _ | Uint32_prec _ | Int64_prec _ | Uint64_prec _ | Fp8_prec _) -> ("exp2(", ")")
+  | ( Exp2,
+      ( Double_prec _ | Byte_prec _ | Uint16_prec _ | Int32_prec _ | Uint32_prec _ | Int64_prec _
+      | Uint64_prec _ | Fp8_prec _ ) ) ->
+      ("exp2(", ")")
   | Exp2, _ -> ("exp2f(", ")")
-  | Log2, (Double_prec _ | Byte_prec _ | Uint16_prec _ | Int32_prec _ | Uint32_prec _ | Int64_prec _ | Uint64_prec _ | Fp8_prec _) -> ("log2(", ")")
+  | ( Log2,
+      ( Double_prec _ | Byte_prec _ | Uint16_prec _ | Int32_prec _ | Uint32_prec _ | Int64_prec _
+      | Uint64_prec _ | Fp8_prec _ ) ) ->
+      ("log2(", ")")
   | Log2, _ -> ("log2f(", ")")
-  | Sin, (Double_prec _ | Byte_prec _ | Uint16_prec _ | Int32_prec _ | Uint32_prec _ | Int64_prec _ | Uint64_prec _ | Fp8_prec _) -> ("sin(", ")")
+  | ( Sin,
+      ( Double_prec _ | Byte_prec _ | Uint16_prec _ | Int32_prec _ | Uint32_prec _ | Int64_prec _
+      | Uint64_prec _ | Fp8_prec _ ) ) ->
+      ("sin(", ")")
   | Sin, _ -> ("sinf(", ")")
-  | Cos, (Double_prec _ | Byte_prec _ | Uint16_prec _ | Int32_prec _ | Uint32_prec _ | Int64_prec _ | Uint64_prec _ | Fp8_prec _) -> ("cos(", ")")
+  | ( Cos,
+      ( Double_prec _ | Byte_prec _ | Uint16_prec _ | Int32_prec _ | Uint32_prec _ | Int64_prec _
+      | Uint64_prec _ | Fp8_prec _ ) ) ->
+      ("cos(", ")")
   | Cos, _ -> ("cosf(", ")")
-  | Sqrt, (Double_prec _ | Byte_prec _ | Uint16_prec _ | Int32_prec _ | Uint32_prec _ | Int64_prec _ | Uint64_prec _ | Fp8_prec _) -> ("sqrt(", ")")
+  | ( Sqrt,
+      ( Double_prec _ | Byte_prec _ | Uint16_prec _ | Int32_prec _ | Uint32_prec _ | Int64_prec _
+      | Uint64_prec _ | Fp8_prec _ ) ) ->
+      ("sqrt(", ")")
   | Sqrt, _ -> ("sqrtf(", ")")
-  | Recip, (Byte_prec _ | Uint16_prec _ | Int32_prec _ | Uint32_prec _ | Int64_prec _ | Uint64_prec _ | Fp8_prec _) ->
+  | ( Recip,
+      ( Byte_prec _ | Uint16_prec _ | Int32_prec _ | Uint32_prec _ | Int64_prec _ | Uint64_prec _
+      | Fp8_prec _ ) ) ->
       invalid_arg "Ops.unop_c_syntax: Recip not supported for integer precisions"
   | Recip, _ -> ("(1.0 / (", "))")
-  | Recip_sqrt, (Byte_prec _ | Uint16_prec _ | Int32_prec _ | Uint32_prec _ | Int64_prec _ | Uint64_prec _ | Fp8_prec _) ->
+  | ( Recip_sqrt,
+      ( Byte_prec _ | Uint16_prec _ | Int32_prec _ | Uint32_prec _ | Int64_prec _ | Uint64_prec _
+      | Fp8_prec _ ) ) ->
       invalid_arg "Ops.unop_c_syntax: Recip_sqrt not supported for integer precisions"
   | Recip_sqrt, Double_prec _ -> ("(1.0 / sqrt(", "))")
   | Recip_sqrt, _ -> ("(1.0 / sqrtf(", "))")
   | Neg, _ -> ("(-(", "))")
-  | Tanh_approx, (Byte_prec _ | Uint16_prec _ | Int32_prec _ | Uint32_prec _ | Int64_prec _ | Uint64_prec _ | Fp8_prec _) ->
+  | ( Tanh_approx,
+      ( Byte_prec _ | Uint16_prec _ | Int32_prec _ | Uint32_prec _ | Int64_prec _ | Uint64_prec _
+      | Fp8_prec _ ) ) ->
       invalid_arg "Ops.unop_c_syntax: Tanh_approx not supported for integer precisions"
   | Tanh_approx, _ -> ("tanhf(", ")")
   | Not, _ -> ("(", " == 0.0 ? 1.0 : 0.0)")
@@ -709,10 +759,14 @@ let ternop_cd_syntax = function Where -> "where" | FMA -> "fma"
 
 let ternop_c_syntax prec op =
   match (op, prec) with
-  | Where, (Byte_prec _ | Uint16_prec _ | Int32_prec _ | Uint32_prec _ | Int64_prec _ | Uint64_prec _ | Fp8_prec _) ->
+  | ( Where,
+      ( Byte_prec _ | Uint16_prec _ | Int32_prec _ | Uint32_prec _ | Int64_prec _ | Uint64_prec _
+      | Fp8_prec _ ) ) ->
       ("((", ") != 0 ? (", ") : (", "))")
   | Where, _ -> ("((", ") != 0.0 ? (", ") : (", "))")
-  | FMA, (Double_prec _ | Byte_prec _ | Uint16_prec _ | Int32_prec _ | Uint32_prec _ | Int64_prec _ | Uint64_prec _ | Fp8_prec _) ->
+  | ( FMA,
+      ( Double_prec _ | Byte_prec _ | Uint16_prec _ | Int32_prec _ | Uint32_prec _ | Int64_prec _
+      | Uint64_prec _ | Fp8_prec _ ) ) ->
       ("fma(", ",", ",", ")")
   | FMA, _ -> ("fmaf(", ",", ",", ")")
 
@@ -745,16 +799,22 @@ let c_convert_precision ~from ~to_ =
   (* Conversions involving BFloat16 and other types *)
   | Bfloat16_prec _, Half_prec _ -> ("FLOAT_TO_HALF(bfloat16_to_single(", "))")
   | Half_prec _, Bfloat16_prec _ -> ("single_to_bfloat16(HALF_TO_FLOAT(", "))")
-  | Bfloat16_prec _, (Byte_prec _ | Uint16_prec _ | Int32_prec _ | Uint32_prec _ | Int64_prec _ | Uint64_prec _) ->
+  | ( Bfloat16_prec _,
+      (Byte_prec _ | Uint16_prec _ | Int32_prec _ | Uint32_prec _ | Int64_prec _ | Uint64_prec _) )
+    ->
       ("(" ^ c_typ_of_prec to_ ^ ")bfloat16_to_single(", ")")
-  | (Byte_prec _ | Uint16_prec _ | Int32_prec _ | Uint32_prec _ | Int64_prec _ | Uint64_prec _), Bfloat16_prec _ ->
+  | ( (Byte_prec _ | Uint16_prec _ | Int32_prec _ | Uint32_prec _ | Int64_prec _ | Uint64_prec _),
+      Bfloat16_prec _ ) ->
       ("single_to_bfloat16((float)", ")")
   (* Conversions involving FP8 and other types *)
   | Fp8_prec _, Half_prec _ -> ("FLOAT_TO_HALF(fp8_to_single(", "))")
   | Half_prec _, Fp8_prec _ -> ("single_to_fp8(HALF_TO_FLOAT(", "))")
-  | Fp8_prec _, (Byte_prec _ | Uint16_prec _ | Int32_prec _ | Uint32_prec _ | Int64_prec _ | Uint64_prec _) ->
+  | ( Fp8_prec _,
+      (Byte_prec _ | Uint16_prec _ | Int32_prec _ | Uint32_prec _ | Int64_prec _ | Uint64_prec _) )
+    ->
       ("(" ^ c_typ_of_prec to_ ^ ")fp8_to_single(", ")")
-  | (Byte_prec _ | Uint16_prec _ | Int32_prec _ | Uint32_prec _ | Int64_prec _ | Uint64_prec _), Fp8_prec _ ->
+  | ( (Byte_prec _ | Uint16_prec _ | Int32_prec _ | Uint32_prec _ | Int64_prec _ | Uint64_prec _),
+      Fp8_prec _ ) ->
       ("single_to_fp8((float)", ")")
   (* BFloat16 <-> FP8 conversions *)
   | Bfloat16_prec _, Fp8_prec _ -> ("single_to_fp8(bfloat16_to_single(", "))")
@@ -764,9 +824,12 @@ let c_convert_precision ~from ~to_ =
   | Single_prec _, Half_prec _ -> ("FLOAT_TO_HALF(", ")")
   | Half_prec _, Double_prec _ -> ("(double)HALF_TO_FLOAT(", ")")
   | Double_prec _, Half_prec _ -> ("FLOAT_TO_HALF((float)", ")")
-  | Half_prec _, (Byte_prec _ | Uint16_prec _ | Int32_prec _ | Uint32_prec _ | Int64_prec _ | Uint64_prec _) ->
+  | ( Half_prec _,
+      (Byte_prec _ | Uint16_prec _ | Int32_prec _ | Uint32_prec _ | Int64_prec _ | Uint64_prec _) )
+    ->
       ("(" ^ c_typ_of_prec to_ ^ ")HALF_TO_FLOAT(", ")")
-  | (Byte_prec _ | Uint16_prec _ | Int32_prec _ | Uint32_prec _ | Int64_prec _ | Uint64_prec _), Half_prec _ ->
+  | ( (Byte_prec _ | Uint16_prec _ | Int32_prec _ | Uint32_prec _ | Int64_prec _ | Uint64_prec _),
+      Half_prec _ ) ->
       ("FLOAT_TO_HALF((float)", ")")
   (* Uint4x32 conversions - special handling *)
   | Uint4x32_prec _, _ -> ("uint4x32_to_" ^ prec_string to_ ^ "(", ")")
diff --git a/lib/ppx_op.ml b/lib/ppx_op.ml
@@ -4,9 +4,11 @@ open Ppx_arrayjit.Ppx_helper
 open Ppx_shared
 
 let make_p ~opt_label ~loc ?value ?values ?param_init ~extra_args name =
-  let more_label = match opt_label with 
+  let more_label =
+    match opt_label with
     | Some (_label_name, label_pat) -> [%expr Some [%e pat2expr label_pat]]
-    | None -> [%expr None] in
+    | None -> [%expr None]
+  in
   let value = match value with Some c -> [%expr Some [%e c]] | None -> [%expr None] in
   let values = match values with Some c -> [%expr Some [%e c]] | None -> [%expr None] in
   let param_init =
@@ -264,7 +266,7 @@ let rec translate ~num_configs ~is_toplevel ~opt_label ?label expr =
       (* Check if there's a unit parameter or a labeled parameter with label "label" *)
       let rec find_unit_pos idx = function
         | [] -> None
-        | { pparam_desc = Pparam_val (Nolabel, _, pat); _ } :: _ 
+        | { pparam_desc = Pparam_val (Nolabel, _, pat); _ } :: _
           when match pat.ppat_desc with
                | Ppat_construct ({ txt = Lident "()"; _ }, None) -> true
                | _ -> false ->
@@ -280,9 +282,11 @@ let rec translate ~num_configs ~is_toplevel ~opt_label ?label expr =
       | Some unit_idx ->
           (* Split args at unit parameter *)
           let before_unit, unit_and_after = List.split_n args unit_idx in
-          let unit_param, after_unit = match unit_and_after with
+          let unit_param, after_unit =
+            match unit_and_after with
             | unit :: rest -> (unit, rest)
-            | [] -> failwith "Internal error: unit_and_after should not be empty" in
+            | [] -> failwith "Internal error: unit_and_after should not be empty"
+          in
           let opt_label = find_label_param before_unit in
           let vbs, inner_body =
             translate ~num_configs ~is_toplevel:false ~opt_label ?label
@@ -293,54 +297,61 @@ let rec translate ~num_configs ~is_toplevel ~opt_label ?label expr =
           let new_body = inner_body in
           ( no_vbs,
             if List.is_empty before_unit then
-              { expr with pexp_desc = Pexp_function ([unit_param], constr, Pfunction_body new_body) }
+              {
+                expr with
+                pexp_desc = Pexp_function ([ unit_param ], constr, Pfunction_body new_body);
+              }
             else
-              { expr with pexp_desc = Pexp_function (before_unit @ [unit_param], constr, Pfunction_body new_body) } )
+              {
+                expr with
+                pexp_desc =
+                  Pexp_function (before_unit @ [ unit_param ], constr, Pfunction_body new_body);
+              } )
       | None ->
-      (* No unit parameter, normal processing *)
-      let labels =
-        Option.to_list label
-        @ List.filter_map args ~f:(function
-            | { pparam_desc = Pparam_val (_, _, pat); _ } ->
-                let loc = pat.ppat_loc in
-                Some [%expr [%e pat2expr pat].Tensor.value.Ir.Tnode.label]
-            | _ -> None)
-      in
-      let label_locs = List.map labels ~f:(fun label -> label.pexp_loc) in
-      let label_starts = List.map label_locs ~f:(fun l -> l.loc_start) in
-      let label_ends = List.map label_locs ~f:(fun l -> l.loc_end) in
-      let label_loc =
-        if List.is_empty labels then loc
-        else
-          Location.
-            {
-              loc_start = List.reduce_exn label_starts ~f:min_pos;
-              loc_end = List.reduce_exn label_ends ~f:max_pos;
-              loc_ghost = false;
-            }
-      in
-      let label =
-        let loc = label_loc in
-        [%expr List.concat [%e Ast_builder.Default.elist ~loc labels]]
-      in
-      let vbs, body =
-        match body with
-        | Pfunction_body body ->
-            let vbs, body = loop ~label body in
-            (vbs, Pfunction_body body)
-        | Pfunction_cases (cases, loc, attrs) ->
-            let vbs, cases =
-              List.unzip
-              @@ List.map cases ~f:(fun ({ pc_rhs; _ } as c) ->
-                     let vbs, pc_rhs = loop ~label pc_rhs in
-                     (vbs, { c with pc_rhs }))
-            in
-            ( List.fold vbs
-                ~init:(Map.empty (module String))
-                ~f:(fun acc vbs -> Map.merge_disjoint_exn acc vbs),
-              Pfunction_cases (cases, loc, attrs) )
-      in
-      (vbs, { expr with pexp_desc = Pexp_function (args, constr, body) }) )
+          (* No unit parameter, normal processing *)
+          let labels =
+            Option.to_list label
+            @ List.filter_map args ~f:(function
+                | { pparam_desc = Pparam_val (_, _, pat); _ } ->
+                    let loc = pat.ppat_loc in
+                    Some [%expr [%e pat2expr pat].Tensor.value.Ir.Tnode.label]
+                | _ -> None)
+          in
+          let label_locs = List.map labels ~f:(fun label -> label.pexp_loc) in
+          let label_starts = List.map label_locs ~f:(fun l -> l.loc_start) in
+          let label_ends = List.map label_locs ~f:(fun l -> l.loc_end) in
+          let label_loc =
+            if List.is_empty labels then loc
+            else
+              Location.
+                {
+                  loc_start = List.reduce_exn label_starts ~f:min_pos;
+                  loc_end = List.reduce_exn label_ends ~f:max_pos;
+                  loc_ghost = false;
+                }
+          in
+          let label =
+            let loc = label_loc in
+            [%expr List.concat [%e Ast_builder.Default.elist ~loc labels]]
+          in
+          let vbs, body =
+            match body with
+            | Pfunction_body body ->
+                let vbs, body = loop ~label body in
+                (vbs, Pfunction_body body)
+            | Pfunction_cases (cases, loc, attrs) ->
+                let vbs, cases =
+                  List.unzip
+                  @@ List.map cases ~f:(fun ({ pc_rhs; _ } as c) ->
+                         let vbs, pc_rhs = loop ~label pc_rhs in
+                         (vbs, { c with pc_rhs }))
+                in
+                ( List.fold vbs
+                    ~init:(Map.empty (module String))
+                    ~f:(fun acc vbs -> Map.merge_disjoint_exn acc vbs),
+                  Pfunction_cases (cases, loc, attrs) )
+          in
+          (vbs, { expr with pexp_desc = Pexp_function (args, constr, body) }))
   | { pexp_desc = Pexp_function (args, constr, body); _ } ->
       let vbs, body =
         match body with
diff --git a/lib/train.ml b/lib/train.ml
diff --git a/test/ppx/test_ppx_op.ml b/test/ppx/test_ppx_op.ml