Unverified Commit 004710fb authored by gilbertlee-amd's avatar gilbertlee-amd Committed by GitHub
Browse files

Setting default GPU_KERNEL=3 for gfx942 (#64)

parent 82d55c36
# Changelog for TransferBench
## v1.34
### Added
- Set the default GPU_KERNEL to 3 for gfx942
## v1.33
### Added
- Adding ALWAYS_VALIDATE env var to allow for validation after every iteration instead of just once at the end of all iterations
......
......@@ -29,7 +29,7 @@ THE SOFTWARE.
#include "Compatibility.hpp"
#include "Kernels.hpp"
#define TB_VERSION "1.33"
#define TB_VERSION "1.34"
extern char const MemTypeStr[];
extern char const ExeTypeStr[];
......@@ -166,6 +166,7 @@ public:
else if (archName == "gfx90a") defaultGpuKernel = 9;
else if (archName == "gfx940") defaultGpuKernel = 6;
else if (archName == "gfx941") defaultGpuKernel = 6;
else if (archName == "gfx942") defaultGpuKernel = 3;
alwaysValidate = GetEnvVar("ALWAYS_VALIDATE" , 0);
blockSize = GetEnvVar("BLOCK_SIZE" , 256);
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment