Commit a70bdf09 authored by maxiao1
Browse files

fix bug in loading Qwen3-VL-30B-A3B-Thinking

parent 1441a435
...@@ -284,6 +284,10 @@ def fused_experts( ...@@ -284,6 +284,10 @@ def fused_experts(
and moe_runner_config.activation.lower() == "silu") and moe_runner_config.activation.lower() == "silu")
) else 1 ) else 1
) )
filter_expert = (
moe_runner_config.num_experts is None
or moe_runner_config.num_experts != moe_runner_config.num_local_experts
)
if moe_runner_config.inplace: if moe_runner_config.inplace:
assert not moe_runner_config.no_combine, "no combine + inplace makes no sense" assert not moe_runner_config.no_combine, "no combine + inplace makes no sense"
torch.ops.sglang.inplace_fused_experts( torch.ops.sglang.inplace_fused_experts(
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment