"vscode:/vscode.git/clone" did not exist on "2161efe9781cc0bee2f60342dffd0c1f7f0f2b57"
Unverified commit 86483ca7, authored by tomeras91, committed by GitHub
Browse files

[Bugfix] Disable FlashInfer TRTLLM BF16 path for non-gated MoE (#36146)


Signed-off-by: Tomer Asida <57313761+tomeras91@users.noreply.github.com>
parent b93a9e6f
......@@ -25,12 +25,12 @@ def _supports_current_device() -> bool:
 def _supports_no_act_and_mul() -> bool:
-    """Supports non-gated MoE."""
-    return True
+    """BF16 kernels do not support non-gated MoE"""
+    return False
 def _supports_activation(activation: MoEActivation) -> bool:
-    return activation in [MoEActivation.SILU, MoEActivation.RELU2_NO_MUL]
+    return activation in [MoEActivation.SILU]
 def _supports_routing_method_bf16(
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment