Unverified commit 432e1cbc, authored by Simon Danielsson, committed by GitHub
Browse files

[Bugfix]: Assertion error when using FlashInfer backend (#25933)


Signed-off-by: simondanielsson <simon.danielsson99@hotmail.com>
Co-authored-by: Cyrus Leung <tlleungac@connect.ust.hk>
parent 201c971e
@@ -508,7 +508,7 @@ class Fp8MoEMethod(FusedMoEMethodBase):
         self.layer = layer
         self.quant_config = quant_config
         self.weight_block_size = self.quant_config.weight_block_size
-        self.block_quant = self.weight_block_size is not None
+        self.block_quant: bool = self.weight_block_size is not None
         self.fused_experts: Optional[
             mk.FusedMoEModularKernel] = None  # type: ignore
@@ -1094,7 +1094,7 @@ class Fp8MoEMethod(FusedMoEMethodBase):
                 expert_map=expert_map,
             )
         elif self.flashinfer_moe_backend == FlashinferMoeBackend.CUTLASS:
-            assert self.block_quant is None
+            assert not self.block_quant
             assert (not renormalize and custom_routing_function is not None)
             assert activation == 'silu', (
                 f"Expected 'silu' activation but got {activation}")
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment