Unverified commit 4aeba40d, authored by Lianmin Zheng and committed by GitHub
Browse files

[Sync] Update mxfp4.py (20250827) (#9724)


Co-authored-by: github-actions[bot] <github-actions[bot]@users.noreply.github.com>
Co-authored-by: Shiyang Chen <shiyang@x.ai>
parent 28684f90
...@@ -66,10 +66,15 @@ _is_hip = is_hip() ...@@ -66,10 +66,15 @@ _is_hip = is_hip()
if _is_hip: if _is_hip:
# import aiter # import aiter
try:
from aiter import ActivationType, QuantType, dtypes from aiter import ActivationType, QuantType, dtypes
from aiter.fused_moe import fused_moe from aiter.fused_moe import fused_moe
from aiter.ops.triton.quant import dynamic_mxfp4_quant from aiter.ops.triton.quant import dynamic_mxfp4_quant
from aiter.utility.fp4_utils import e8m0_shuffle from aiter.utility.fp4_utils import e8m0_shuffle
except ImportError as err:
ActivationType = QuantType = dtypes = fused_moe = dynamic_mxfp4_quant = (
e8m0_shuffle
) = err
def _swizzle_mxfp4(quant_tensor, scale, num_warps): def _swizzle_mxfp4(quant_tensor, scale, num_warps):
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment