[BugFix] Fix glm4_moe_mtp load weights bug (#28805)

Signed-off-by: wuyaoxuehun <798143193@qq.com>

[BugFix] Fix glm4_moe_mtp load weights bug (#28805)
Signed-off-by: wuyaoxuehun <798143193@qq.com>
ab01cd14 · wuyaoxuehun · GitHub · 577bb34f · ab01cd14
Unverified commit ab01cd14, authored Nov 17, 2025 by wuyaoxuehun; committed by GitHub on Nov 17, 2025
Show whitespace changes
Inline Side-by-side

Showing with 3 additions and 4 deletions

vllm/model_executor/models/glm4_moe_mtp.py (+3 -4)

No files found.
--- a/vllm/model_executor/models/glm4_moe_mtp.py
+++ b/vllm/model_executor/models/glm4_moe_mtp.py
@@ -256,13 +256,12 @@ class Glm4MoeMTP(nn.Module, SupportsPP, Glm4MixtureOfExperts):
        params_dict = dict(self.named_parameters())
        loaded_params: set[str] = set()
-        spec_layer = self.model.mtp_start_layer_idx
        for name, loaded_weight in weights:
            if name == "lm_head.weight":
-                name = f"model.layers.{spec_layer}.shard_head.head.weight"
+                spec_layer = self.model.mtp_start_layer_idx
+                name = f"model.layers.{spec_layer}.shared_head.head.weight"
            elif name == "model.embed_tokens.weight":
-                # This name is same with local model, rewriting is not needed.
+                spec_layer = self.model.mtp_start_layer_idx
-                pass
            else:
                spec_layer = get_spec_layer_idx_from_weight_name(self.config, name)
                if spec_layer is None: