warnings.warn("TMA load is disabled as there is no TMA descriptor support!")
ifUSE_TMA_STOREandnotHAS_TMA_DESC:
USE_TMA_STORE=False
warnings.warn("TMA store is disabled as there is no TMA descriptor support!")
# TODO(shikaili): Check the readiness of WS on ROCm side in Meta's Triton.
ifuse_warp_specializationandtorch.version.hip:
warnings.warn("Warp specialization is disabled as it is not supported on ROCm.")
use_warp_specialization=False
ifuse_warp_specializationandnot_HAS_WS_SUPPORT:
warnings.warn(
"Warp specialization is disabled as the Triton build in current environment doesn't have such support. Please build from https://github.com/facebookexperimental/triton/tree/ws-3.2.x to enable it for best performance on Nvidia's SM90 GPUs."