[Bugfix] Fix MoE Routing Simulation (vllm-project#28002)

tlrmchlsmth · ZhengHongming888 · commit d7ce5fe22976 · 2025-11-08T08:32:52.000-08:00
Signed-off-by: Tyler Michael Smith <tlrmchlsmth@gmail.com>
diff --git a/vllm/model_executor/layers/fused_moe/layer.py b/vllm/model_executor/layers/fused_moe/layer.py
@@ -2066,7 +2066,7 @@ def select_experts(
             )
 
         # DeepSeekv2 uses grouped_top_k
-        if use_grouped_topk:
+        elif use_grouped_topk:
             assert topk_group is not None
             assert num_expert_group is not None
             if is_rocm_aiter_moe_enabled():
diff --git a/vllm/model_executor/layers/fused_moe/routing_simulator.py b/vllm/model_executor/layers/fused_moe/routing_simulator.py
@@ -14,6 +14,10 @@
 
 import torch
 
+from vllm.logger import init_logger
+
+logger = init_logger(__name__)
+
 
 class RoutingStrategy(ABC):
     """Base class for token-to-expert routing strategies."""
@@ -290,6 +294,12 @@ def simulate_routing(
                 f"Available strategies: "
                 f"{list(RoutingSimulator._routing_strategies.keys())}"
             )
+        logger.warning_once(
+            "Simulating MoE routing using a %s strategy. "
+            "This should only be used for performance testing. "
+            "Model outputs will not be valid.",
+            strategy_name,
+        )
 
         strategy = RoutingSimulator._routing_strategies[strategy_name]
         return strategy.route_tokens(

Original file line number	Diff line number	Diff line change
`@@ -2066,7 +2066,7 @@ def select_experts(`
`2066`	`2066`	`)`
`2067`	`2067`
`2068`	`2068`	`# DeepSeekv2 uses grouped_top_k`
`2069`		`- if use_grouped_topk:`
	`2069`	`+ elif use_grouped_topk:`
`2070`	`2070`	`assert topk_group is not None`
`2071`	`2071`	`assert num_expert_group is not None`
`2072`	`2072`	`if is_rocm_aiter_moe_enabled():`