Skip to content

Commit 4e6935a

Browse files
authored
Bug Fix - Fix stderr message in gpu-copy benchmark (#673)
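Fix the ordering of the arguments in the stderr error messages: the rank (buffer/event index) is now passed before the CUDA error code, so the values match the order of the format specifiers.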
1 parent 96f5cce commit 4e6935a

File tree

1 file changed

+21
-21
lines changed
  • superbench/benchmarks/micro_benchmarks/gpu_copy_performance

1 file changed

+21
-21
lines changed

superbench/benchmarks/micro_benchmarks/gpu_copy_performance/gpu_copy.cu

Lines changed: 21 additions & 21 deletions
Original file line number | Diff line number | Diff line change
@@ -913,7 +913,7 @@ int RunAllToAllBench(const Opts &opts, int gpu_count, int src_rank, int dst_rank
913913

914914
for (int rank = 0; rank < gpu_count; rank++) {
915915
if (SetGpu(rank)) {
916-
fprintf(stderr, "RunAllToAllBench::SetGpu for rank %d error: %d\n", cuda_err, rank);
916+
fprintf(stderr, "RunAllToAllBench::SetGpu for rank %d error: %d\n", rank, cuda_err);
917917
return -1;
918918
}
919919

@@ -924,7 +924,7 @@ int RunAllToAllBench(const Opts &opts, int gpu_count, int src_rank, int dst_rank
924924
cuda_err = GpuMallocDataBuf(&(src_buffers_gpu[rank]), opts.size);
925925
#endif
926926
if (cuda_err != cudaSuccess) {
927-
fprintf(stderr, "RunAllToAllBench::cudaMalloc for src_buffers_gpu[%d] error: %d\n", cuda_err, rank);
927+
fprintf(stderr, "RunAllToAllBench::cudaMalloc for src_buffers_gpu[%d] error: %d\n", rank, cuda_err);
928928
return -1;
929929
}
930930
if (opts.check_data) {
@@ -933,7 +933,7 @@ int RunAllToAllBench(const Opts &opts, int gpu_count, int src_rank, int dst_rank
933933
}
934934
cuda_err = cudaMemcpy(src_buffers_gpu[rank], data_buffer_cpu, opts.size, cudaMemcpyDefault);
935935
if (cuda_err != cudaSuccess) {
936-
fprintf(stderr, "RunAllToAllBench::cudaMemcpy to src_buffers_gpu[%d] error: %d\n", cuda_err, rank);
936+
fprintf(stderr, "RunAllToAllBench::cudaMemcpy to src_buffers_gpu[%d] error: %d\n", rank, cuda_err);
937937
return -1;
938938
}
939939
}
@@ -945,7 +945,7 @@ int RunAllToAllBench(const Opts &opts, int gpu_count, int src_rank, int dst_rank
945945
cuda_err = GpuMallocDataBuf(&(dst_buffers_gpu[rank]), opts.size);
946946
#endif
947947
if (cuda_err != cudaSuccess) {
948-
fprintf(stderr, "RunAllToAllBench::cudaMalloc for dst_buffers_gpu[%d] error: %d\n", cuda_err, rank);
948+
fprintf(stderr, "RunAllToAllBench::cudaMalloc for dst_buffers_gpu[%d] error: %d\n", rank, cuda_err);
949949
return -1;
950950
}
951951

@@ -959,33 +959,33 @@ int RunAllToAllBench(const Opts &opts, int gpu_count, int src_rank, int dst_rank
959959
// Prepare events
960960
cuda_err = cudaEventCreate(&(start_events[rank]));
961961
if (cuda_err != cudaSuccess) {
962-
fprintf(stderr, "RunAllToAllBench::cudaEventCreate for start_events[%d] error: %d\n", cuda_err, rank);
962+
fprintf(stderr, "RunAllToAllBench::cudaEventCreate for start_events[%d] error: %d\n", rank, cuda_err);
963963
return -1;
964964
}
965965
cuda_err = cudaEventCreate(&(stop_events[rank]));
966966
if (cuda_err != cudaSuccess) {
967-
fprintf(stderr, "RunAllToAllBench::cudaEventCreate for stop_events[%d] error: %d\n", cuda_err, rank);
967+
fprintf(stderr, "RunAllToAllBench::cudaEventCreate for stop_events[%d] error: %d\n", rank, cuda_err);
968968
return -1;
969969
}
970970
}
971971

972972
// Prepare kernel arguments
973973
for (int rank = 0; rank < gpu_count; rank++) {
974974
if (SetGpu(rank)) {
975-
fprintf(stderr, "RunAllToAllBench::SetGpu for rank %d error: %d\n", cuda_err, rank);
975+
fprintf(stderr, "RunAllToAllBench::SetGpu for rank %d error: %d\n", rank, cuda_err);
976976
return -1;
977977
}
978978

979979
// Prepare destination buffer args
980980
cuda_err = cudaMalloc(&(dst_buffer_gpu_args[rank]), sizeof(uint8_t *) * gpu_count);
981981
if (cuda_err != cudaSuccess) {
982-
fprintf(stderr, "RunAllToAllBench::cudaMalloc for dst_buffer_gpu_args[%d] error: %d\n", cuda_err, rank);
982+
fprintf(stderr, "RunAllToAllBench::cudaMalloc for dst_buffer_gpu_args[%d] error: %d\n", rank, cuda_err);
983983
return -1;
984984
}
985985
cuda_err = cudaMemcpy(dst_buffer_gpu_args[rank], dst_buffers_gpu.data(), sizeof(uint8_t *) * gpu_count,
986986
cudaMemcpyDefault);
987987
if (cuda_err != cudaSuccess) {
988-
fprintf(stderr, "RunAllToAllBench::cudaMemcpy to dst_buffer_gpu_args[%d] error: %d\n", cuda_err, rank);
988+
fprintf(stderr, "RunAllToAllBench::cudaMemcpy to dst_buffer_gpu_args[%d] error: %d\n", rank, cuda_err);
989989
return -1;
990990
}
991991
}
@@ -998,15 +998,15 @@ int RunAllToAllBench(const Opts &opts, int gpu_count, int src_rank, int dst_rank
998998
}
999999

10001000
if (SetGpu(rank)) {
1001-
fprintf(stderr, "RunAllToAllBench::SetGpu for rank %d error: %d\n", cuda_err, rank);
1001+
fprintf(stderr, "RunAllToAllBench::SetGpu for rank %d error: %d\n", rank, cuda_err);
10021002
return -1;
10031003
}
10041004

10051005
if (i == opts.num_warm_up) {
10061006
cuda_err = cudaEventRecord(start_events[rank], streams[rank]);
10071007
if (cuda_err != cudaSuccess) {
1008-
fprintf(stderr, "RunAllToAllBench::cudaEventRecord for start_events[%d] error: %d\n", cuda_err,
1009-
rank);
1008+
fprintf(stderr, "RunAllToAllBench::cudaEventRecord for start_events[%d] error: %d\n", rank,
1009+
cuda_err);
10101010
return -1;
10111011
}
10121012
}
@@ -1017,8 +1017,8 @@ int RunAllToAllBench(const Opts &opts, int gpu_count, int src_rank, int dst_rank
10171017
if (i == opts.num_warm_up + opts.num_loops - 1) {
10181018
cuda_err = cudaEventRecord(stop_events[rank], streams[rank]);
10191019
if (cuda_err != cudaSuccess) {
1020-
fprintf(stderr, "RunAllToAllBench::cudaEventRecord for stop_events[%d] error: %d\n", cuda_err,
1021-
rank);
1020+
fprintf(stderr, "RunAllToAllBench::cudaEventRecord for stop_events[%d] error: %d\n", rank,
1021+
cuda_err);
10221022
return -1;
10231023
}
10241024
}
@@ -1030,7 +1030,7 @@ int RunAllToAllBench(const Opts &opts, int gpu_count, int src_rank, int dst_rank
10301030
}
10311031
cuda_err = cudaStreamSynchronize(streams[rank]);
10321032
if (cuda_err != cudaSuccess) {
1033-
fprintf(stderr, "RunAllToAllBench::cudaStreamSynchronize streams[%d] error: %d\n", cuda_err, rank);
1033+
fprintf(stderr, "RunAllToAllBench::cudaStreamSynchronize streams[%d] error: %d\n", rank, cuda_err);
10341034
return -1;
10351035
}
10361036
}
@@ -1045,7 +1045,7 @@ int RunAllToAllBench(const Opts &opts, int gpu_count, int src_rank, int dst_rank
10451045
float time_in_ms = 0;
10461046
cuda_err = cudaEventElapsedTime(&time_in_ms, start_events[rank], stop_events[rank]);
10471047
if (cuda_err != cudaSuccess) {
1048-
fprintf(stderr, "RunAllToAllBench::cudaEventElapsedTime for rank %d error: %d\n", cuda_err, rank);
1048+
fprintf(stderr, "RunAllToAllBench::cudaEventElapsedTime for rank %d error: %d\n", rank, cuda_err);
10491049
return -1;
10501050
}
10511051
double bw = opts.size * (gpu_count - 1) * opts.num_loops / gpu_count / time_in_ms / 1e6;
@@ -1072,8 +1072,8 @@ int RunAllToAllBench(const Opts &opts, int gpu_count, int src_rank, int dst_rank
10721072
}
10731073
cuda_err = cudaMemcpy(data_buffer_cpu, dst_buffers_gpu[curr_dst_rank], opts.size, cudaMemcpyDefault);
10741074
if (cuda_err != cudaSuccess) {
1075-
fprintf(stderr, "RunAllToAllBench::cudaMemcpy from dst_buffers_gpu[%d] error: %d\n", cuda_err,
1076-
curr_dst_rank);
1075+
fprintf(stderr, "RunAllToAllBench::cudaMemcpy from dst_buffers_gpu[%d] error: %d\n", curr_dst_rank,
1076+
cuda_err);
10771077
return -1;
10781078
}
10791079
for (uint64_t i = 0; i < opts.size / sizeof(uint64_t); i++) {
@@ -1100,17 +1100,17 @@ int RunAllToAllBench(const Opts &opts, int gpu_count, int src_rank, int dst_rank
11001100
for (int rank = 0; rank < gpu_count; rank++) {
11011101
cuda_err = cudaFree(src_buffers_gpu[rank]);
11021102
if (cuda_err != cudaSuccess) {
1103-
fprintf(stderr, "RunAllToAllBench::cudaFree for src_buffers_gpu[%d] error: %d\n", cuda_err, rank);
1103+
fprintf(stderr, "RunAllToAllBench::cudaFree for src_buffers_gpu[%d] error: %d\n", rank, cuda_err);
11041104
return -1;
11051105
}
11061106
cuda_err = cudaFree(dst_buffers_gpu[rank]);
11071107
if (cuda_err != cudaSuccess) {
1108-
fprintf(stderr, "RunAllToAllBench::cudaFree for dst_buffers_gpu[%d] error: %d\n", cuda_err, rank);
1108+
fprintf(stderr, "RunAllToAllBench::cudaFree for dst_buffers_gpu[%d] error: %d\n", rank, cuda_err);
11091109
return -1;
11101110
}
11111111
cuda_err = cudaFree(dst_buffer_gpu_args[rank]);
11121112
if (cuda_err != cudaSuccess) {
1113-
fprintf(stderr, "RunAllToAllBench::cudaFree for dst_buffer_gpu_args[%d] error: %d\n", cuda_err, rank);
1113+
fprintf(stderr, "RunAllToAllBench::cudaFree for dst_buffer_gpu_args[%d] error: %d\n", rank, cuda_err);
11141114
return -1;
11151115
}
11161116
}

0 commit comments

Comments
 (0)