Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
one
TransferBench
Commits
7644fef5
Commit
7644fef5
authored
Dec 12, 2024
by
srawat
Browse files
Refining API library
parent
38f89e59
Changes
2
Show whitespace changes
Inline
Side-by-side
Showing
2 changed files
with
8 additions
and
6 deletions
+8
-6
docs/doxygen/Doxyfile
docs/doxygen/Doxyfile
+1
-1
src/header/TransferBench.hpp
src/header/TransferBench.hpp
+7
-5
No files found.
docs/doxygen/Doxyfile
View file @
7644fef5
...
...
@@ -775,7 +775,7 @@ WARN_LOGFILE =
# spaces. See also FILE_PATTERNS and EXTENSION_MAPPING
# Note: If this tag is empty the current directory is searched.
INPUT = ../../src/header
INPUT = ../../src/header
\
../../src/include
# This tag can be used to specify the character encoding of the source files
...
...
src/header/TransferBench.hpp
View file @
7644fef5
...
...
@@ -20,6 +20,7 @@ OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
THE SOFTWARE.
*/
/**
#pragma once
#include <cstring>
#include <future>
...
...
@@ -41,6 +42,7 @@ THE SOFTWARE.
#include <hsa/hsa.h>
#include <hsa/hsa_ext_amd.h>
#endif
*/
namespace
TransferBench
{
...
...
@@ -118,7 +120,7 @@ namespace TransferBench
*/
struct
Transfer
{
size_t
numBytes
=
(
1
<<
26
);
///<
#
of bytes to Transfer
size_t
numBytes
=
(
1
<<
26
);
///<
Number
of bytes to Transfer
vector
<
MemDevice
>
srcs
=
{};
///< List of source memory devices
vector
<
MemDevice
>
dsts
=
{};
///< List of destination memory devices
ExeDevice
exeDevice
=
{};
///< Executor to use
...
...
@@ -132,8 +134,8 @@ namespace TransferBench
*/
struct
GeneralOptions
{
int
numIterations
=
10
;
///<
#
of timed iterations to perform. If negative, run for -numIterations seconds instead
int
numSubIterations
=
1
;
///<
#
of sub-iterations per iteration
int
numIterations
=
10
;
///<
Number
of timed iterations to perform. If negative, run for -numIterations seconds instead
int
numSubIterations
=
1
;
///<
Number
of sub-iterations per iteration
int
numWarmups
=
3
;
///< Number of un-timed warmup iterations to perform
int
recordPerIteration
=
0
;
///< Record per-iteration timing information
int
useInteractive
=
0
;
///< Pause for user-input before starting transfer loop
...
...
@@ -468,8 +470,8 @@ namespace {
int
constexpr
MAX_BLOCKSIZE
=
512
;
// Max threadblock size
int
constexpr
MAX_WAVEGROUPS
=
MAX_BLOCKSIZE
/
64
;
// Max wavegroups/warps
int
constexpr
MAX_UNROLL
=
8
;
// Max unroll factor
int
constexpr
MAX_SRCS
=
8
;
// Max
#
srcs per Transfer
int
constexpr
MAX_DSTS
=
8
;
// Max
#
dsts per Transfer
int
constexpr
MAX_SRCS
=
8
;
// Max
number of
srcs per Transfer
int
constexpr
MAX_DSTS
=
8
;
// Max
number of
dsts per Transfer
int
constexpr
MEMSET_CHAR
=
75
;
// Value to memset (char)
float
constexpr
MEMSET_VAL
=
13323083.0
f
;
// Value to memset (float)
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment