fix bug in loading Qwen3-VL-30B-A3B-Thinking

a70bdf09 · maxiao1 · 1441a435 · a70bdf09
Commit a70bdf09 authored Nov 25, 2025 by maxiao1
Hide whitespace changes
Inline Side-by-side

Showing 1 changed file with 4 additions and 0 deletions

python/sglang/srt/layers/moe/fused_moe_triton/fused_moe.py +4 -0

No files found.
--- a/python/sglang/srt/layers/moe/fused_moe_triton/fused_moe.py
+++ b/python/sglang/srt/layers/moe/fused_moe_triton/fused_moe.py
@@ -284,6 +284,10 @@ def fused_experts(
                and moe_runner_config.activation.lower() == "silu")
        ) else 1
    )
+    filter_expert = (
+        moe_runner_config.num_experts is None
+        or moe_runner_config.num_experts != moe_runner_config.num_local_experts
+    )
    if moe_runner_config.inplace:
        assert not moe_runner_config.no_combine, "no combine + inplace makes no sense"
        torch.ops.sglang.inplace_fused_experts(