-
Notifications
You must be signed in to change notification settings - Fork 4
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
compute-engine gpu: add qs and allreduce runs
Signed-off-by: vsoch <[email protected]>
- Loading branch information
Showing
34 changed files
with
1,348 additions
and
328 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
36 changes: 36 additions & 0 deletions
36
...compute-engine/gpu/size16/results/osu-allreduce/osu-allreduce-16-iter-1-3561500966912.out
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,36 @@ | ||
58.145s: job.exception type=cancel severity=0 interrupted by ctrl-C | ||
58.552s: job.exception type=cancel severity=0 interrupted by ctrl-C | ||
flux-job: task(s) Terminated | ||
|
||
# OSU MPI-CUDA Allreduce Latency Test v5.8 | ||
# Size Avg Latency(us) | ||
4 337.07 | ||
8 333.06 | ||
16 334.79 | ||
32 340.88 | ||
64 333.40 | ||
128 341.31 | ||
256 343.44 | ||
512 356.03 | ||
1024 373.93 | ||
2048 411.85 | ||
4096 451.33 | ||
8192 746.66 | ||
16384 1038.96 | ||
32768 1323.51 | ||
65536 1420.76 | ||
131072 2002.24 | ||
262144 1318.68 | ||
524288 2188.49 | ||
1048576 3982.10 | ||
START OF JOBSPEC | ||
{"resources": [{"type": "node", "count": 16, "with": [{"type": "slot", "count": 8, "with": [{"type": "core", "count": 1}, {"type": "gpu", "count": 1}], "label": "task"}]}], "tasks": [{"command": ["/opt/osu-benchmark/build.openmpi/mpi/collective/osu_allreduce", "-d", "cuda", "H", "H"], "slot": "task", "count": {"per_slot": 1}}], "attributes": {"system": {"duration": 0, "cwd": "/home/sochat1_llnl_gov", "shell": {"options": {"rlimit": {"cpu": -1, "fsize": -1, "data": -1, "stack": 8388608, "core": 0, "nofile": 1048576, "as": -1, "rss": -1, "nproc": -1}, "cpu-affinity": "per-task", "gpu-affinity": "per-task"}}}, "user": {"study_id": "osu-allreduce-16-iter-1"}}, "version": 1} | ||
START OF EVENTLOG | ||
{"timestamp":1725922820.0990932,"name":"init"} | ||
{"timestamp":1725922820.1000268,"name":"starting"} | ||
{"timestamp":1725922820.779249,"name":"shell.init","context":{"service":"501043911-shell-f2cZAePdh","leader-rank":0,"size":16}} | ||
{"timestamp":1725922820.9687486,"name":"shell.start","context":{"taskmap":{"version":1,"map":[[0,16,8,1]]}}} | ||
{"timestamp":1725922878.296582,"name":"shell.task-exit","context":{"localid":1,"rank":65,"state":"Exited","pid":1487,"wait_status":15,"signaled":15,"exitcode":143}} | ||
{"timestamp":1725922878.8372781,"name":"complete","context":{"status":36608}} | ||
{"timestamp":1725922878.837321,"name":"done"} | ||
|
37 changes: 37 additions & 0 deletions
37
...compute-engine/gpu/size16/results/osu-allreduce/osu-allreduce-16-iter-2-4692083998720.out
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,37 @@ | ||
23.953s: job.exception type=cancel severity=0 interrupted by ctrl-C | ||
24.155s: job.exception type=cancel severity=0 interrupted by ctrl-C | ||
24.348s: job.exception type=cancel severity=0 interrupted by ctrl-C | ||
flux-job: task(s) Terminated | ||
|
||
# OSU MPI-CUDA Allreduce Latency Test v5.8 | ||
# Size Avg Latency(us) | ||
4 346.93 | ||
8 343.36 | ||
16 345.98 | ||
32 345.99 | ||
64 345.13 | ||
128 343.23 | ||
256 359.02 | ||
512 366.02 | ||
1024 379.76 | ||
2048 423.79 | ||
4096 467.01 | ||
8192 738.21 | ||
16384 1113.73 | ||
32768 1372.31 | ||
65536 1449.55 | ||
131072 2002.28 | ||
262144 1318.81 | ||
524288 2209.33 | ||
1048576 4025.37 | ||
START OF JOBSPEC | ||
{"resources": [{"type": "node", "count": 16, "with": [{"type": "slot", "count": 8, "with": [{"type": "core", "count": 1}, {"type": "gpu", "count": 1}], "label": "task"}]}], "tasks": [{"command": ["/opt/osu-benchmark/build.openmpi/mpi/collective/osu_allreduce", "-d", "cuda", "H", "H"], "slot": "task", "count": {"per_slot": 1}}], "attributes": {"system": {"duration": 0, "cwd": "/home/sochat1_llnl_gov", "shell": {"options": {"rlimit": {"cpu": -1, "fsize": -1, "data": -1, "stack": 8388608, "core": 0, "nofile": 1048576, "as": -1, "rss": -1, "nproc": -1}, "cpu-affinity": "per-task", "gpu-affinity": "per-task"}}}, "user": {"study_id": "osu-allreduce-16-iter-2"}}, "version": 1} | ||
START OF EVENTLOG | ||
{"timestamp":1725922887.4867351,"name":"init"} | ||
{"timestamp":1725922887.4880421,"name":"starting"} | ||
{"timestamp":1725922887.6449196,"name":"shell.init","context":{"service":"501043911-shell-f38FgPx4w","leader-rank":0,"size":16}} | ||
{"timestamp":1725922887.6735122,"name":"shell.start","context":{"taskmap":{"version":1,"map":[[0,16,8,1]]}}} | ||
{"timestamp":1725922911.4788885,"name":"shell.task-exit","context":{"localid":0,"rank":16,"state":"Exited","pid":1540,"wait_status":15,"signaled":15,"exitcode":143}} | ||
{"timestamp":1725922911.8023748,"name":"complete","context":{"status":36608}} | ||
{"timestamp":1725922911.8023956,"name":"done"} | ||
|
37 changes: 37 additions & 0 deletions
37
...compute-engine/gpu/size16/results/osu-allreduce/osu-allreduce-16-iter-3-5154749284352.out
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,37 @@ | ||
28.598s: job.exception type=cancel severity=0 interrupted by ctrl-C | ||
28.759s: job.exception type=cancel severity=0 interrupted by ctrl-C | ||
28.880s: job.exception type=cancel severity=0 interrupted by ctrl-C | ||
flux-job: task(s) Terminated | ||
|
||
# OSU MPI-CUDA Allreduce Latency Test v5.8 | ||
# Size Avg Latency(us) | ||
4 343.81 | ||
8 340.60 | ||
16 342.57 | ||
32 341.13 | ||
64 349.80 | ||
128 352.47 | ||
256 366.56 | ||
512 372.22 | ||
1024 389.31 | ||
2048 433.20 | ||
4096 469.32 | ||
8192 772.67 | ||
16384 1108.57 | ||
32768 1423.65 | ||
65536 1486.61 | ||
131072 1971.11 | ||
262144 1310.67 | ||
524288 2192.83 | ||
1048576 4009.07 | ||
START OF JOBSPEC | ||
{"resources": [{"type": "node", "count": 16, "with": [{"type": "slot", "count": 8, "with": [{"type": "core", "count": 1}, {"type": "gpu", "count": 1}], "label": "task"}]}], "tasks": [{"command": ["/opt/osu-benchmark/build.openmpi/mpi/collective/osu_allreduce", "-d", "cuda", "H", "H"], "slot": "task", "count": {"per_slot": 1}}], "attributes": {"system": {"duration": 0, "cwd": "/home/sochat1_llnl_gov", "shell": {"options": {"rlimit": {"cpu": -1, "fsize": -1, "data": -1, "stack": 8388608, "core": 0, "nofile": 1048576, "as": -1, "rss": -1, "nproc": -1}, "cpu-affinity": "per-task", "gpu-affinity": "per-task"}}}, "user": {"study_id": "osu-allreduce-16-iter-3"}}, "version": 1} | ||
START OF EVENTLOG | ||
{"timestamp":1725922915.0641441,"name":"init"} | ||
{"timestamp":1725922915.0654099,"name":"starting"} | ||
{"timestamp":1725922915.1928067,"name":"shell.init","context":{"service":"501043911-shell-f3LQaYUUF","leader-rank":0,"size":16}} | ||
{"timestamp":1725922915.2170558,"name":"shell.start","context":{"taskmap":{"version":1,"map":[[0,16,8,1]]}}} | ||
{"timestamp":1725922943.6773355,"name":"shell.task-exit","context":{"localid":0,"rank":64,"state":"Exited","pid":1619,"wait_status":15,"signaled":15,"exitcode":143}} | ||
{"timestamp":1725922944.1458526,"name":"complete","context":{"status":36608}} | ||
{"timestamp":1725922944.1458805,"name":"done"} | ||
|
Oops, something went wrong.