Commit cf360956 authored by zhuwenwen
Browse files

support dsv32

parent 5eec6110
...@@ -1039,7 +1039,10 @@ class DeepseekV2ForCausalLM(nn.Module, SupportsPP, MixtureOfExperts): ...@@ -1039,7 +1039,10 @@ class DeepseekV2ForCausalLM(nn.Module, SupportsPP, MixtureOfExperts):
if is_pp_missing_parameter(name_mapped, self): if is_pp_missing_parameter(name_mapped, self):
continue continue
param = params_dict[name_mapped] try:
param = params_dict[name_mapped]
except Exception as e:
continue
# We should ask the weight loader to return success or not # We should ask the weight loader to return success or not
# here since otherwise we may skip experts with other # here since otherwise we may skip experts with other
# available replicas. # available replicas.
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment