File tree: 2 files changed, +14 -4 lines changed
Original file line number | Diff line number | Diff line change
@@ -47,9 +47,9 @@ let classify_moons ~seed ~on_device ~inlining_cutoff ~num_streams ~batch_size ~b
4747 let flat_len = data_len / 2 in
4848 (* Note: [minibatch_size = batch_size / num_streams] is the actual per-device batch used. *)
4949 (* let epochs = 200 in *)
50- (* let epochs = 100 in *)
50+ let epochs = 100 in
5151 (* TINY for debugging: *)
52- let epochs = 2 in
52+ (* let epochs = 2 in *)
5353 (* let epochs = 1 in *)
5454 (* let init_lr = 0.1 in *)
5555 let init_lr = 0.01 in
@@ -214,8 +214,13 @@ let _mem_benchmarks =
214214 ~f: (fun batch_size ->
215215 List. concat_map [ 0 ; (* 1; 2; *) 3 ] ~f: (fun inlining_cutoff ->
216216 List. concat_map [ (* 1; 3; *) 7 (* *) ] ~f: (fun seed ->
217- List. concat_map [ (* "gccjit" ; *) " cc" ; " cuda" ] ~f: (fun backend_name ->
218- List. concat_map [ (* CDSL.double; *) CDSL. single; CDSL. half ]
217+ List. concat_map
218+ [
219+ (* "gccjit" ; *)
220+ (* "cc"; *)
221+ " cuda" ;
222+ ] ~f: (fun backend_name ->
223+ List. concat_map [ (* CDSL.double; *) CDSL. single (* ; CDSL.half *) ]
219224 ~f: (fun value_prec ->
220225 [
221226 classify_moons ~seed ~on_device: true ~inlining_cutoff ~num_streams
Original file line number Diff line number Diff line change 1+ # This file is for tasks with a smaller granularity than issues, typically immediate tasks.
2+ (B) bin/moons_benchmark with the cc backend crashes with half-precision overflow
3+ (B) remove syncing from the data-parallel algorithm: stream-to-stream syncing is now automatic
4+ (A) cuda backend crashes in bin/moons_benchmark {cm:2024-11-22}
5+ (B) figure out why cuda backend parallelism slows down in later epochs
You can’t perform that action at this time.
0 commit comments