Skip to content

Commit 9dd686b

Browse files
committed
a TODO file
1 parent f571d9e commit 9dd686b

File tree

2 files changed

+14
-4
lines changed

2 files changed

+14
-4
lines changed

bin/moons_benchmark.ml

Lines changed: 9 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -47,9 +47,9 @@ let classify_moons ~seed ~on_device ~inlining_cutoff ~num_streams ~batch_size ~b
4747
let flat_len = data_len / 2 in
4848
(* Note: [minibatch_size = batch_size / num_streams] is the actual per-device batch used. *)
4949
(* let epochs = 200 in *)
50-
(* let epochs = 100 in *)
50+
let epochs = 100 in
5151
(* TINY for debugging: *)
52-
let epochs = 2 in
52+
(* let epochs = 2 in *)
5353
(* let epochs = 1 in *)
5454
(* let init_lr = 0.1 in *)
5555
let init_lr = 0.01 in
@@ -214,8 +214,13 @@ let _mem_benchmarks =
214214
~f:(fun batch_size ->
215215
List.concat_map [ 0; (* 1; 2; *) 3 ] ~f:(fun inlining_cutoff ->
216216
List.concat_map [ (* 1; 3; *) 7 (* *) ] ~f:(fun seed ->
217-
List.concat_map [ (* "gccjit" ; *) "cc"; "cuda" ] ~f:(fun backend_name ->
218-
List.concat_map [ (* CDSL.double; *) CDSL.single; CDSL.half ]
217+
List.concat_map
218+
[
219+
(* "gccjit" ; *)
220+
(* "cc"; *)
221+
"cuda";
222+
] ~f:(fun backend_name ->
223+
List.concat_map [ (* CDSL.double; *) CDSL.single (* ; CDSL.half *) ]
219224
~f:(fun value_prec ->
220225
[
221226
classify_moons ~seed ~on_device:true ~inlining_cutoff ~num_streams

todo.md

Lines changed: 5 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -0,0 +1,5 @@
1+
# This file tracks tasks of finer granularity than issues, typically immediate ones.
2+
(B) bin/moons_benchmark with the cc backend crashes with a half-precision overflow
3+
(B) remove syncing from the data-parallel algorithm: stream-to-stream syncing is now automatic
4+
(A) cuda backend crashes in bin/moons_benchmark {cm:2024-11-22}
5+
(B) figure out why cuda backend parallelism slows down in later epochs

0 commit comments

Comments
 (0)