Skip to content

Commit

Permalink
a TODO file
Browse files Browse the repository at this point in the history
  • Loading branch information
lukstafi committed Nov 22, 2024
1 parent f571d9e commit 9dd686b
Show file tree
Hide file tree
Showing 2 changed files with 14 additions and 4 deletions.
13 changes: 9 additions & 4 deletions bin/moons_benchmark.ml
Original file line number Diff line number Diff line change
Expand Up @@ -47,9 +47,9 @@ let classify_moons ~seed ~on_device ~inlining_cutoff ~num_streams ~batch_size ~b
let flat_len = data_len / 2 in
(* Note: [minibatch_size = batch_size / num_streams] is the actual per-device batch used. *)
(* let epochs = 200 in *)
(* let epochs = 100 in *)
let epochs = 100 in
(* TINY for debugging: *)
let epochs = 2 in
(* let epochs = 2 in *)
(* let epochs = 1 in *)
(* let init_lr = 0.1 in *)
let init_lr = 0.01 in
Expand Down Expand Up @@ -214,8 +214,13 @@ let _mem_benchmarks =
~f:(fun batch_size ->
List.concat_map [ 0; (* 1; 2; *) 3 ] ~f:(fun inlining_cutoff ->
List.concat_map [ (* 1; 3; *) 7 (* *) ] ~f:(fun seed ->
List.concat_map [ (* "gccjit" ; *) "cc"; "cuda" ] ~f:(fun backend_name ->
List.concat_map [ (* CDSL.double; *) CDSL.single; CDSL.half ]
List.concat_map
[
(* "gccjit" ; *)
(* "cc"; *)
"cuda";
] ~f:(fun backend_name ->
List.concat_map [ (* CDSL.double; *) CDSL.single (* ; CDSL.half *) ]
~f:(fun value_prec ->
[
classify_moons ~seed ~on_device:true ~inlining_cutoff ~num_streams
Expand Down
5 changes: 5 additions & 0 deletions todo.md
Original file line number Diff line number Diff line change
@@ -0,0 +1,5 @@
# This file tracks tasks of finer granularity than issues, typically immediate ones.
(B) bin/moons_benchmark with the cc backend crashes with half-precision overflow
(B) remove syncing from the data-parallel algorithm: stream-to-stream syncing is now automatic
(A) cuda backend crashes in bin/moons_benchmark {cm:2024-11-22}
(B) figure out why cuda backend parallelism slows down in later epochs

0 comments on commit 9dd686b

Please sign in to comment.