Commit cf360956 authored by zhuwenwen
Browse files

support dsv32

parent 5eec6110
......@@ -1039,7 +1039,10 @@ class DeepseekV2ForCausalLM(nn.Module, SupportsPP, MixtureOfExperts):
if is_pp_missing_parameter(name_mapped, self):
continue
param = params_dict[name_mapped]
try:
param = params_dict[name_mapped]
except Exception as e:
continue
# We should ask the weight loader to return success or not
# here since otherwise we may skip experts with other
# available replicas.
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment