Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
Menu
Open sidebar
tsoc
superbenchmark
Commits
4e6935ab
Unverified
Commit
4e6935ab
authored
Nov 27, 2024
by
pdr
Committed by
GitHub
Nov 27, 2024
Browse files
Bug Fix - Fix stderr message in gpu-copy benchmark (#673)
Fix ordering of args in err messages.
parent
96f5ccea
Changes
1
Hide whitespace changes
Inline
Side-by-side
Showing
1 changed file
with
21 additions
and
21 deletions
+21
-21
superbench/benchmarks/micro_benchmarks/gpu_copy_performance/gpu_copy.cu
...chmarks/micro_benchmarks/gpu_copy_performance/gpu_copy.cu
+21
-21
No files found.
superbench/benchmarks/micro_benchmarks/gpu_copy_performance/gpu_copy.cu
View file @
4e6935ab
...
...
@@ -913,7 +913,7 @@ int RunAllToAllBench(const Opts &opts, int gpu_count, int src_rank, int dst_rank
for
(
int
rank
=
0
;
rank
<
gpu_count
;
rank
++
)
{
if
(
SetGpu
(
rank
))
{
fprintf
(
stderr
,
"RunAllToAllBench::SetGpu for rank %d error: %d
\n
"
,
cuda_err
,
rank
);
fprintf
(
stderr
,
"RunAllToAllBench::SetGpu for rank %d error: %d
\n
"
,
rank
,
cuda_err
);
return
-
1
;
}
...
...
@@ -924,7 +924,7 @@ int RunAllToAllBench(const Opts &opts, int gpu_count, int src_rank, int dst_rank
cuda_err
=
GpuMallocDataBuf
(
&
(
src_buffers_gpu
[
rank
]),
opts
.
size
);
#endif
if
(
cuda_err
!=
cudaSuccess
)
{
fprintf
(
stderr
,
"RunAllToAllBench::cudaMalloc for src_buffers_gpu[%d] error: %d
\n
"
,
cuda_err
,
rank
);
fprintf
(
stderr
,
"RunAllToAllBench::cudaMalloc for src_buffers_gpu[%d] error: %d
\n
"
,
rank
,
cuda_err
);
return
-
1
;
}
if
(
opts
.
check_data
)
{
...
...
@@ -933,7 +933,7 @@ int RunAllToAllBench(const Opts &opts, int gpu_count, int src_rank, int dst_rank
}
cuda_err
=
cudaMemcpy
(
src_buffers_gpu
[
rank
],
data_buffer_cpu
,
opts
.
size
,
cudaMemcpyDefault
);
if
(
cuda_err
!=
cudaSuccess
)
{
fprintf
(
stderr
,
"RunAllToAllBench::cudaMemcpy to src_buffers_gpu[%d] error: %d
\n
"
,
cuda_err
,
rank
);
fprintf
(
stderr
,
"RunAllToAllBench::cudaMemcpy to src_buffers_gpu[%d] error: %d
\n
"
,
rank
,
cuda_err
);
return
-
1
;
}
}
...
...
@@ -945,7 +945,7 @@ int RunAllToAllBench(const Opts &opts, int gpu_count, int src_rank, int dst_rank
cuda_err
=
GpuMallocDataBuf
(
&
(
dst_buffers_gpu
[
rank
]),
opts
.
size
);
#endif
if
(
cuda_err
!=
cudaSuccess
)
{
fprintf
(
stderr
,
"RunAllToAllBench::cudaMalloc for dst_buffers_gpu[%d] error: %d
\n
"
,
cuda_err
,
rank
);
fprintf
(
stderr
,
"RunAllToAllBench::cudaMalloc for dst_buffers_gpu[%d] error: %d
\n
"
,
rank
,
cuda_err
);
return
-
1
;
}
...
...
@@ -959,12 +959,12 @@ int RunAllToAllBench(const Opts &opts, int gpu_count, int src_rank, int dst_rank
// Prepare events
cuda_err
=
cudaEventCreate
(
&
(
start_events
[
rank
]));
if
(
cuda_err
!=
cudaSuccess
)
{
fprintf
(
stderr
,
"RunAllToAllBench::cudaEventCreate for start_events[%d] error: %d
\n
"
,
cuda_err
,
rank
);
fprintf
(
stderr
,
"RunAllToAllBench::cudaEventCreate for start_events[%d] error: %d
\n
"
,
rank
,
cuda_err
);
return
-
1
;
}
cuda_err
=
cudaEventCreate
(
&
(
stop_events
[
rank
]));
if
(
cuda_err
!=
cudaSuccess
)
{
fprintf
(
stderr
,
"RunAllToAllBench::cudaEventCreate for stop_events[%d] error: %d
\n
"
,
cuda_err
,
rank
);
fprintf
(
stderr
,
"RunAllToAllBench::cudaEventCreate for stop_events[%d] error: %d
\n
"
,
rank
,
cuda_err
);
return
-
1
;
}
}
...
...
@@ -972,20 +972,20 @@ int RunAllToAllBench(const Opts &opts, int gpu_count, int src_rank, int dst_rank
// Prepare kernel arguments
for
(
int
rank
=
0
;
rank
<
gpu_count
;
rank
++
)
{
if
(
SetGpu
(
rank
))
{
fprintf
(
stderr
,
"RunAllToAllBench::SetGpu for rank %d error: %d
\n
"
,
cuda_err
,
rank
);
fprintf
(
stderr
,
"RunAllToAllBench::SetGpu for rank %d error: %d
\n
"
,
rank
,
cuda_err
);
return
-
1
;
}
// Prepare destination buffer args
cuda_err
=
cudaMalloc
(
&
(
dst_buffer_gpu_args
[
rank
]),
sizeof
(
uint8_t
*
)
*
gpu_count
);
if
(
cuda_err
!=
cudaSuccess
)
{
fprintf
(
stderr
,
"RunAllToAllBench::cudaMalloc for dst_buffer_gpu_args[%d] error: %d
\n
"
,
cuda_err
,
rank
);
fprintf
(
stderr
,
"RunAllToAllBench::cudaMalloc for dst_buffer_gpu_args[%d] error: %d
\n
"
,
rank
,
cuda_err
);
return
-
1
;
}
cuda_err
=
cudaMemcpy
(
dst_buffer_gpu_args
[
rank
],
dst_buffers_gpu
.
data
(),
sizeof
(
uint8_t
*
)
*
gpu_count
,
cudaMemcpyDefault
);
if
(
cuda_err
!=
cudaSuccess
)
{
fprintf
(
stderr
,
"RunAllToAllBench::cudaMemcpy to dst_buffer_gpu_args[%d] error: %d
\n
"
,
cuda_err
,
rank
);
fprintf
(
stderr
,
"RunAllToAllBench::cudaMemcpy to dst_buffer_gpu_args[%d] error: %d
\n
"
,
rank
,
cuda_err
);
return
-
1
;
}
}
...
...
@@ -998,15 +998,15 @@ int RunAllToAllBench(const Opts &opts, int gpu_count, int src_rank, int dst_rank
}
if
(
SetGpu
(
rank
))
{
fprintf
(
stderr
,
"RunAllToAllBench::SetGpu for rank %d error: %d
\n
"
,
cuda_err
,
rank
);
fprintf
(
stderr
,
"RunAllToAllBench::SetGpu for rank %d error: %d
\n
"
,
rank
,
cuda_err
);
return
-
1
;
}
if
(
i
==
opts
.
num_warm_up
)
{
cuda_err
=
cudaEventRecord
(
start_events
[
rank
],
streams
[
rank
]);
if
(
cuda_err
!=
cudaSuccess
)
{
fprintf
(
stderr
,
"RunAllToAllBench::cudaEventRecord for start_events[%d] error: %d
\n
"
,
cuda_err
,
rank
);
fprintf
(
stderr
,
"RunAllToAllBench::cudaEventRecord for start_events[%d] error: %d
\n
"
,
rank
,
cuda_err
);
return
-
1
;
}
}
...
...
@@ -1017,8 +1017,8 @@ int RunAllToAllBench(const Opts &opts, int gpu_count, int src_rank, int dst_rank
if
(
i
==
opts
.
num_warm_up
+
opts
.
num_loops
-
1
)
{
cuda_err
=
cudaEventRecord
(
stop_events
[
rank
],
streams
[
rank
]);
if
(
cuda_err
!=
cudaSuccess
)
{
fprintf
(
stderr
,
"RunAllToAllBench::cudaEventRecord for stop_events[%d] error: %d
\n
"
,
cuda_err
,
rank
);
fprintf
(
stderr
,
"RunAllToAllBench::cudaEventRecord for stop_events[%d] error: %d
\n
"
,
rank
,
cuda_err
);
return
-
1
;
}
}
...
...
@@ -1030,7 +1030,7 @@ int RunAllToAllBench(const Opts &opts, int gpu_count, int src_rank, int dst_rank
}
cuda_err
=
cudaStreamSynchronize
(
streams
[
rank
]);
if
(
cuda_err
!=
cudaSuccess
)
{
fprintf
(
stderr
,
"RunAllToAllBench::cudaStreamSynchronize streams[%d] error: %d
\n
"
,
cuda_err
,
rank
);
fprintf
(
stderr
,
"RunAllToAllBench::cudaStreamSynchronize streams[%d] error: %d
\n
"
,
rank
,
cuda_err
);
return
-
1
;
}
}
...
...
@@ -1045,7 +1045,7 @@ int RunAllToAllBench(const Opts &opts, int gpu_count, int src_rank, int dst_rank
float
time_in_ms
=
0
;
cuda_err
=
cudaEventElapsedTime
(
&
time_in_ms
,
start_events
[
rank
],
stop_events
[
rank
]);
if
(
cuda_err
!=
cudaSuccess
)
{
fprintf
(
stderr
,
"RunAllToAllBench::cudaEventElapsedTime for rank %d error: %d
\n
"
,
cuda_err
,
rank
);
fprintf
(
stderr
,
"RunAllToAllBench::cudaEventElapsedTime for rank %d error: %d
\n
"
,
rank
,
cuda_err
);
return
-
1
;
}
double
bw
=
opts
.
size
*
(
gpu_count
-
1
)
*
opts
.
num_loops
/
gpu_count
/
time_in_ms
/
1e6
;
...
...
@@ -1072,8 +1072,8 @@ int RunAllToAllBench(const Opts &opts, int gpu_count, int src_rank, int dst_rank
}
cuda_err
=
cudaMemcpy
(
data_buffer_cpu
,
dst_buffers_gpu
[
curr_dst_rank
],
opts
.
size
,
cudaMemcpyDefault
);
if
(
cuda_err
!=
cudaSuccess
)
{
fprintf
(
stderr
,
"RunAllToAllBench::cudaMemcpy from dst_buffers_gpu[%d] error: %d
\n
"
,
cu
da_err
,
cu
rr_dst_rank
);
fprintf
(
stderr
,
"RunAllToAllBench::cudaMemcpy from dst_buffers_gpu[%d] error: %d
\n
"
,
cu
rr_dst_rank
,
cu
da_err
);
return
-
1
;
}
for
(
uint64_t
i
=
0
;
i
<
opts
.
size
/
sizeof
(
uint64_t
);
i
++
)
{
...
...
@@ -1100,17 +1100,17 @@ int RunAllToAllBench(const Opts &opts, int gpu_count, int src_rank, int dst_rank
for
(
int
rank
=
0
;
rank
<
gpu_count
;
rank
++
)
{
cuda_err
=
cudaFree
(
src_buffers_gpu
[
rank
]);
if
(
cuda_err
!=
cudaSuccess
)
{
fprintf
(
stderr
,
"RunAllToAllBench::cudaFree for src_buffers_gpu[%d] error: %d
\n
"
,
cuda_err
,
rank
);
fprintf
(
stderr
,
"RunAllToAllBench::cudaFree for src_buffers_gpu[%d] error: %d
\n
"
,
rank
,
cuda_err
);
return
-
1
;
}
cuda_err
=
cudaFree
(
dst_buffers_gpu
[
rank
]);
if
(
cuda_err
!=
cudaSuccess
)
{
fprintf
(
stderr
,
"RunAllToAllBench::cudaFree for dst_buffers_gpu[%d] error: %d
\n
"
,
cuda_err
,
rank
);
fprintf
(
stderr
,
"RunAllToAllBench::cudaFree for dst_buffers_gpu[%d] error: %d
\n
"
,
rank
,
cuda_err
);
return
-
1
;
}
cuda_err
=
cudaFree
(
dst_buffer_gpu_args
[
rank
]);
if
(
cuda_err
!=
cudaSuccess
)
{
fprintf
(
stderr
,
"RunAllToAllBench::cudaFree for dst_buffer_gpu_args[%d] error: %d
\n
"
,
cuda_err
,
rank
);
fprintf
(
stderr
,
"RunAllToAllBench::cudaFree for dst_buffer_gpu_args[%d] error: %d
\n
"
,
rank
,
cuda_err
);
return
-
1
;
}
}
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment