Unverified commit 471997ad, authored by JJJYmmm, committed by GitHub
Browse files

[Bugfix] fix Qwen3VLMoe load when pp > 1 (#25838)


Signed-off-by: liuye.hj <liuye.hj@alibaba-inc.com>
Co-authored-by: liuye.hj <liuye.hj@alibaba-inc.com>
parent b1ded114
......@@ -212,6 +212,8 @@ class Qwen3MoeLLMModel(Qwen3MoeModel):
# attempted to load as other weights later
is_expert_weight = True
name_mapped = name.replace(weight_name, param_name)
if is_pp_missing_parameter(name_mapped, self):
continue
if is_fused_expert:
loaded_weight = loaded_weight.transpose(-1,
-2) # no bias
......@@ -230,8 +232,6 @@ class Qwen3MoeLLMModel(Qwen3MoeModel):
name_mapped, params_dict, loaded_weight,
shard_id, num_experts)
else:
if is_pp_missing_parameter(name_mapped, self):
continue
# Skip loading extra parameters for GPTQ/modelopt models
if name_mapped.endswith(
ignore_suffixes
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment