[Bugfix] Fix MoE Routing Simulation (#28002)

Signed-off-by: Tyler Michael Smith <tlrmchlsmth@gmail.com>

[Bugfix] Fix MoE Routing Simulation (#28002)
Signed-off-by: Tyler Michael Smith <tlrmchlsmth@gmail.com>
37587573 · Tyler Michael Smith · GitHub · ccd3e55e · 37587573 · 37587573
Unverified commit 37587573, authored Nov 03, 2025 by Tyler Michael Smith; committed by GitHub on Nov 03, 2025
Showing 2 changed files with 11 additions and 1 deletion

vllm/model_executor/layers/fused_moe/layer.py +1 -1

vllm/model_executor/layers/fused_moe/routing_simulator.py +10 -0

No files found.
--- a/vllm/model_executor/layers/fused_moe/layer.py
+++ b/vllm/model_executor/layers/fused_moe/layer.py
@@ -2066,7 +2066,7 @@ class FusedMoE(CustomOp):
            )
        # DeepSeekv2 uses grouped_top_k
-        if use_grouped_topk:
+        elif use_grouped_topk:
            assert topk_group is not None
            assert num_expert_group is not None
            if is_rocm_aiter_moe_enabled():

--- a/vllm/model_executor/layers/fused_moe/routing_simulator.py
+++ b/vllm/model_executor/layers/fused_moe/routing_simulator.py
@@ -14,6 +14,10 @@ from typing import Any
 import torch
+from vllm.logger import init_logger
+logger = init_logger(__name__)
 class RoutingStrategy(ABC):
    """Base class for token-to-expert routing strategies."""
@@ -290,6 +294,12 @@ class RoutingSimulator:
                f"Available strategies: "
                f"{list(RoutingSimulator._routing_strategies.keys())}"
            )
+        logger.warning_once(
+            "Simulating MoE routing using a %s strategy. "
+            "This should only be used for performance testing. "
+            "Model outputs will not be valid.",
+            strategy_name,
+        )
        strategy = RoutingSimulator._routing_strategies[strategy_name]
        return strategy.route_tokens(