Commit 633f8199 authored by zhuwenwen
Browse files

support dsv32

parent ed3cdc81
......@@ -1123,7 +1123,10 @@ class DeepseekV2ForCausalLM(nn.Module, SupportsPP, MixtureOfExperts):
if is_pp_missing_parameter(name, self):
continue
try:
param = params_dict[name]
except Exception as e:
continue
weight_loader = getattr(param, "weight_loader",
default_weight_loader)
weight_loader(param, loaded_weight)
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment