Unverified commit 37bd8d6e, authored by Wentao Ye and committed by GitHub
Browse files

[Bug] DeepGemm: Fix TypeError: per_block_cast_to_fp8() missing 1 required...


[Bug] DeepGemm: Fix TypeError: per_block_cast_to_fp8() missing 1 required positional argument: 'use_ue8m0' for SM100 (#21187)
Signed-off-by: yewentao256 <zhyanwentao@126.com>
parent 468e2400
...@@ -99,7 +99,7 @@ def fp8_m_grouped_gemm_nt_masked(*args, **kwargs): ...@@ -99,7 +99,7 @@ def fp8_m_grouped_gemm_nt_masked(*args, **kwargs):
def per_block_cast_to_fp8(x, *args, **kwargs): def per_block_cast_to_fp8(x, *args, **kwargs):
if _per_block_cast_impl is not None and is_blackwell_deep_gemm_used(): if _per_block_cast_impl is not None and is_blackwell_deep_gemm_used():
return _per_block_cast_impl(x) return _per_block_cast_impl(x, use_ue8m0=True)
# TODO: refactor the `per_block_cast_to_fp8` from tests to vllm utils # TODO: refactor the `per_block_cast_to_fp8` from tests to vllm utils
from tests.kernels.quant_utils import per_block_cast_to_fp8 as _pbcf from tests.kernels.quant_utils import per_block_cast_to_fp8 as _pbcf
return _pbcf(x, *args, **kwargs) return _pbcf(x, *args, **kwargs)
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment