Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
one
TransferBench
Commits
437b6e70
Unverified
Commit
437b6e70
authored
Nov 29, 2023
by
gilbertlee-amd
Committed by
GitHub
Nov 29, 2023
Browse files
v1.40 Fixing USE_XCC_FILTER for preset configurations (#72)
parent
7a1dbd6a
Changes
3
Hide whitespace changes
Inline
Side-by-side
Showing
3 changed files
with
11 additions
and
1 deletion
+11
-1
CHANGELOG.md
CHANGELOG.md
+5
-0
src/TransferBench.cpp
src/TransferBench.cpp
+5
-0
src/include/EnvVars.hpp
src/include/EnvVars.hpp
+1
-1
No files found.
CHANGELOG.md
View file @
437b6e70
...
...
@@ -3,6 +3,11 @@
Documentation for TransferBench is available at [https://rocm.docs.amd.com/projects/TransferBench](https://rocm.docs.amd.com/projects/TransferBench).
## v1.40
### Fixes
* Fixing XCC defaulting to 0 instead of random for preset configs, ignoring XCC_PREF_TABLE
## v1.39
### Additions
...
...
src/TransferBench.cpp
View file @
437b6e70
...
...
@@ -1599,6 +1599,7 @@ void RunPeerToPeerBenchmarks(EnvVars const& ev, size_t N)
transfers
[
0
].
numSrcs
=
transfers
[
0
].
numDsts
=
1
;
transfers
[
0
].
exeType
=
IsGpuType
(
ev
.
useRemoteRead
?
dstType
:
srcType
)
?
gpuExeType
:
EXE_CPU
;
transfers
[
0
].
exeIndex
=
(
ev
.
useRemoteRead
?
dstIndex
:
srcIndex
);
transfers
[
0
].
exeSubIndex
=
-
1
;
transfers
[
0
].
numSubExecs
=
IsGpuType
(
transfers
[
0
].
exeType
)
?
ev
.
numGpuSubExecs
:
ev
.
numCpuSubExecs
;
// DST -> SRC
...
...
@@ -1612,6 +1613,7 @@ void RunPeerToPeerBenchmarks(EnvVars const& ev, size_t N)
transfers
[
1
].
dstIndex
.
push_back
(
srcIndex
);
transfers
[
1
].
exeType
=
IsGpuType
(
ev
.
useRemoteRead
?
srcType
:
dstType
)
?
gpuExeType
:
EXE_CPU
;
transfers
[
1
].
exeIndex
=
(
ev
.
useRemoteRead
?
srcIndex
:
dstIndex
);
transfers
[
1
].
exeSubIndex
=
-
1
;
transfers
[
1
].
numSubExecs
=
IsGpuType
(
transfers
[
1
].
exeType
)
?
ev
.
numGpuSubExecs
:
ev
.
numCpuSubExecs
;
}
...
...
@@ -1819,6 +1821,7 @@ void RunScalingBenchmark(EnvVars const& ev, size_t N, int const exeIndex, int co
transfers
[
0
].
numDsts
=
1
;
transfers
[
0
].
exeType
=
EXE_GPU_GFX
;
transfers
[
0
].
exeIndex
=
exeIndex
;
transfers
[
0
].
exeSubIndex
=
-
1
;
transfers
[
0
].
srcType
.
resize
(
1
,
MEM_GPU
);
transfers
[
0
].
dstType
.
resize
(
1
,
MEM_GPU
);
transfers
[
0
].
srcIndex
.
resize
(
1
);
...
...
@@ -1887,6 +1890,7 @@ void RunAllToAllBenchmark(EnvVars const& ev, size_t const numBytesPerTransfer, i
transfer
.
numSrcs
=
1
;
transfer
.
numDsts
=
1
;
transfer
.
exeType
=
EXE_GPU_GFX
;
transfer
.
exeSubIndex
=
-
1
;
transfer
.
srcType
.
resize
(
1
,
ev
.
useFineGrain
?
MEM_GPU_FINE
:
MEM_GPU
);
transfer
.
dstType
.
resize
(
1
,
ev
.
useFineGrain
?
MEM_GPU_FINE
:
MEM_GPU
);
transfer
.
srcIndex
.
resize
(
1
);
...
...
@@ -2459,6 +2463,7 @@ void RunSweepPreset(EnvVars const& ev, size_t const numBytesPerTransfer, int con
transfer
.
srcIndex
=
{
possibleTransfers
[
value
].
srcIndex
};
transfer
.
exeType
=
possibleTransfers
[
value
].
exeType
;
transfer
.
exeIndex
=
possibleTransfers
[
value
].
exeIndex
;
transfer
.
exeSubIndex
=
-
1
;
transfer
.
dstType
=
{
possibleTransfers
[
value
].
dstType
};
transfer
.
dstIndex
=
{
possibleTransfers
[
value
].
dstIndex
};
transfer
.
numSubExecs
=
IsGpuType
(
transfer
.
exeType
)
?
numGpuSubExecs
:
numCpuSubExecs
;
...
...
src/include/EnvVars.hpp
View file @
437b6e70
...
...
@@ -29,7 +29,7 @@ THE SOFTWARE.
#include "Compatibility.hpp"
#include "Kernels.hpp"
#define TB_VERSION "1.
39
"
#define TB_VERSION "1.
40
"
extern
char
const
MemTypeStr
[];
extern
char
const
ExeTypeStr
[];
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment