For more illustrative CI logs, add a moons_demo_parallel test run logging to stdout

lukstafi · lukstafi · commit e167b05ced9f · 2024-09-04T06:05:56.000+02:00
diff --git a/test/dune b/test/dune
@@ -1,3 +1,12 @@
+(test ; standalone test executable; per the commit message it logs to stdout for CI logs
+ (name moons_demo_parallel_run)
+ (package neural_nets_lib)
+ (modules moons_demo_parallel_run) ; only this module is part of the executable
+ (deps ocannl_config) ; declared as a dependency of running the test
+ (libraries ocannl)
+ (preprocess
+  (pps ppx_jane ppx_ocannl)))
+
 (library
  (name tutorials)
  (package neural_nets_lib)
diff --git a/test/moons_demo_parallel.ml b/test/moons_demo_parallel.ml
@@ -8,7 +8,7 @@ module CDSL = Train.CDSL
 module Utils = Arrayjit.Utils
 module Rand = Arrayjit.Rand.Lib
 
-let%expect_test "Half-moons data parallel" =
+let main () =
   let seed = 1 in
   let hid_dim = 16 in
   (* let hid_dim = 4 in *)
@@ -75,7 +75,10 @@ let%expect_test "Half-moons data parallel" =
       ]
   in
   Stdio.printf "\nHalf-moons scatterplot and decision boundary:\n";
-  PrintBox_text.output Stdio.stdout plot_moons;
+  PrintBox_text.output Stdio.stdout plot_moons
+
+let%expect_test "Half-moons data parallel" =
+  main ();
   (* NOTE: as of OCANNL 0.4, moons_demo_parallel, while deterministic on a single machine, gives
      slightly different results on machines with a different hardware, e.g. arm64, ppc. Here we list
      the results from the various CI targets. The first result is the one typically observed, the
diff --git a/test/moons_demo_parallel_run.ml b/test/moons_demo_parallel_run.ml
@@ -0,0 +1,84 @@
+open Base
+open Ocannl
+module Tn = Arrayjit.Tnode
+module IDX = Train.IDX
+module TDSL = Operation.TDSL
+module NTDSL = Operation.NTDSL
+module CDSL = Train.CDSL
+module Utils = Arrayjit.Utils
+module Rand = Arrayjit.Rand.Lib
+
+let main () =
+  let seed = 1 in
+  let hid_dim = 16 in
+  (* let hid_dim = 4 in *)
+  let batch_size = 120 in
+  (* let batch_size = 60 in *)
+  (* let batch_size = 20 in *)
+  let len = batch_size * 20 in
+  let init_lr = 0.1 in
+  (* let epochs = 10 in *)
+  let epochs = 20 in
+  (* let epochs = 1 in *)
+  let noise () = Rand.float_range (-0.1) 0.1 in
+  let moons_flat =
+    Array.concat_map (Array.create ~len ())
+      ~f:
+        Float.(
+          fun () ->
+            let i = Rand.int len in
+            let v = of_int i * pi / of_int len in
+            let c = cos v and s = sin v in
+            [| c + noise (); s + noise (); 1.0 - c + noise (); 0.5 - s + noise () |])
+  in
+  let moons_flat ~b = TDSL.init_const ~l:"moons_flat" ~b ~o:[ 2 ] moons_flat in
+  let moons_classes = Array.init (len * 2) ~f:(fun i -> if i % 2 = 0 then 1. else -1.) in
+  let moons_classes ~b = TDSL.init_const ~l:"moons_classes" ~b ~o:[ 1 ] moons_classes in
+  let%op mlp x = "b3" + ("w3" * ?/("b2" hid_dim + ("w2" * ?/("b1" hid_dim + ("w1" * x))))) in
+  (* let%op mlp x = "b" + ("w" * x) in *)
+  let%op loss_fn ~output ~expectation = ?/(!..1 - (expectation *. output)) in
+  (* We don't need a regularization term in the loss formula thanks to weight_decay built into
+     the sgd_update computation. *)
+  let weight_decay = 0.0002 in
+  (* The backend is obtained as a first-class module and unpacked as Backend below. *)
+  let backend = Arrayjit.Backends.fresh_backend () in
+  let per_batch_callback ~at_batch ~at_step ~learning_rate ~batch_loss ~epoch_loss =
+    if (at_batch + 1) % 20 = 0 then
+      Stdio.printf "Batch=%d, step=%d, lr=%f, batch loss=%f, epoch loss=%f\n%!" at_batch at_step
+        learning_rate batch_loss epoch_loss
+  in
+  (* Tn.print_accessible_headers (); *)
+  let per_epoch_callback ~at_step ~at_epoch ~learning_rate ~epoch_loss =
+    Stdio.printf "Epoch=%d, step=%d, lr=%f, epoch loss=%f\n%!" at_epoch at_step learning_rate
+      epoch_loss
+  in
+  let module Backend = (val backend) in
+  let inputs, outputs, _model_result, infer_callback, _batch_losses, _epoch_losses, _learning_rates
+      =
+    Train.example_train_loop ~seed ~batch_size ~max_num_devices:(batch_size / 2) ~init_lr
+      ~data_len:len ~epochs ~inputs:moons_flat ~outputs:moons_classes ~model:mlp ~loss_fn
+      ~weight_decay ~per_batch_callback ~per_epoch_callback
+      (module Backend)
+      ()
+  in
+  let points = Tensor.value_2d_points ~xdim:0 ~ydim:1 inputs in
+  let classes = Tensor.value_1d_points ~xdim:0 outputs in
+  let points1, points2 = Array.partitioni_tf points ~f:Float.(fun i _ -> classes.(i) > 0.) in
+  let callback (x, y) = Float.((infer_callback [| x; y |]).(0) >= 0.) in
+  let plot_moons =
+    let open PrintBox_utils in
+    plot ~no_axes:true ~size:(120, 40)
+      [
+        Scatterplot { points = points1; pixel = "#" };
+        Scatterplot { points = points2; pixel = "%" };
+        Boundary_map { pixel_false = "."; pixel_true = "*"; callback };
+      ]
+  in
+  Stdio.printf "\nHalf-moons scatterplot and decision boundary:\n";
+  PrintBox_text.output Stdio.stdout plot_moons
+
+
+let () =
+  (* Log at level 1 to get some insights; restore_settings runs even if main raises. *)
+  Utils.set_log_level 1;
+  Exn.protect ~f:main ~finally:Utils.restore_settings