Correct PPMissingLayer handling in Deepseek-V2-Lite PP deployment (#20665)

Signed-off-by: Seiji Eicher <seiji@anyscale.com>

Correct PPMissingLayer handling in Deepseek-V2-Lite PP deployment (#20665)
Signed-off-by: Seiji Eicher <seiji@anyscale.com>
ad6c2e1a · Seiji Eicher · GitHub · 49e8c7ea · ad6c2e1a
Unverified Commit ad6c2e1a authored Jul 09, 2025 by Seiji Eicher Committed by GitHub Jul 09, 2025
Show whitespace changes
Inline Side-by-side

Showing with 9 additions and 3 deletions

vllm/model_executor/models/deepseek_v2.py vllm/model_executor/models/deepseek_v2.py +9 -3

No files found.
--- a/vllm/model_executor/models/deepseek_v2.py
+++ b/vllm/model_executor/models/deepseek_v2.py
@@ -739,14 +739,20 @@ class DeepseekV2ForCausalLM(nn.Module, SupportsPP, MixtureOfExperts):
        self.num_expert_groups = config.n_group
        self.moe_layers: list[FusedMoE] = []
+        example_moe = None
        for layer in self.model.layers:
+            if isinstance(layer, PPMissingLayer):
+                continue
            assert isinstance(layer, DeepseekV2DecoderLayer)
            if isinstance(layer.mlp, DeepseekV2MoE):
+                # Pick last one layer since the first ones may be dense layers.
+                example_moe = layer.mlp
                self.moe_layers.append(layer.mlp.experts)
-        # Pick last one layer since the first ones may be dense layers.
-        example_moe = typing.cast(
-            DeepseekV2MoE, self.model.layers[config.num_hidden_layers - 1].mlp)
+        if example_moe is None:
+            raise RuntimeError("No DeepseekV2MoE layer found in model.layers.")
        self.num_logical_experts = example_moe.n_logical_experts
        self.num_physical_experts = example_moe.n_physical_experts
        self.num_local_physical_experts = example_moe.n_local_physical_experts