Unverified commit 97b5e7fc, authored by Lisa and committed by GitHub
Browse files

Merge branch 'develop' into readme-updates

parents bbd61829 004710fb
# Changelog for TransferBench # Changelog for TransferBench
Full documentation for TransferBench is available at Documentation for TransferBench is available at
[https://rocm.docs.amd.com/projects/TransferBench](https://rocm.docs.amd.com/projects/TransferBench). [https://rocm.docs.amd.com/projects/TransferBench](https://rocm.docs.amd.com/projects/TransferBench).
## v1.34
### Additions
* Set `GPU_KERNEL=3` as default for gfx942
## v1.33 ## v1.33
### Additions ### Additions
......
rocm-docs-core==0.26.0 rocm-docs-core==0.27.0
...@@ -84,7 +84,9 @@ pygments==2.14.0 ...@@ -84,7 +84,9 @@ pygments==2.14.0
# pydata-sphinx-theme # pydata-sphinx-theme
# sphinx # sphinx
pyjwt[crypto]==2.6.0 pyjwt[crypto]==2.6.0
# via pygithub # via
# pygithub
# pyjwt
pynacl==1.5.0 pynacl==1.5.0
# via pygithub # via pygithub
pytz==2023.3.post1 pytz==2023.3.post1
...@@ -98,7 +100,7 @@ requests==2.28.2 ...@@ -98,7 +100,7 @@ requests==2.28.2
# via # via
# pygithub # pygithub
# sphinx # sphinx
rocm-docs-core==0.26.0 rocm-docs-core==0.27.0
# via -r requirements.in # via -r requirements.in
smmap==5.0.0 smmap==5.0.0
# via gitdb # via gitdb
......
...@@ -29,7 +29,7 @@ THE SOFTWARE. ...@@ -29,7 +29,7 @@ THE SOFTWARE.
#include "Compatibility.hpp" #include "Compatibility.hpp"
#include "Kernels.hpp" #include "Kernels.hpp"
#define TB_VERSION "1.33" #define TB_VERSION "1.34"
extern char const MemTypeStr[]; extern char const MemTypeStr[];
extern char const ExeTypeStr[]; extern char const ExeTypeStr[];
...@@ -166,6 +166,7 @@ public: ...@@ -166,6 +166,7 @@ public:
else if (archName == "gfx90a") defaultGpuKernel = 9; else if (archName == "gfx90a") defaultGpuKernel = 9;
else if (archName == "gfx940") defaultGpuKernel = 6; else if (archName == "gfx940") defaultGpuKernel = 6;
else if (archName == "gfx941") defaultGpuKernel = 6; else if (archName == "gfx941") defaultGpuKernel = 6;
else if (archName == "gfx942") defaultGpuKernel = 3;
alwaysValidate = GetEnvVar("ALWAYS_VALIDATE" , 0); alwaysValidate = GetEnvVar("ALWAYS_VALIDATE" , 0);
blockSize = GetEnvVar("BLOCK_SIZE" , 256); blockSize = GetEnvVar("BLOCK_SIZE" , 256);
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment