Commit f9f4a735 authored by zhuwenwen
Browse files

update qwen&qwen2-moe and baichuan layout

parent ca7f98e5
......@@ -489,7 +489,7 @@ class BaiChuanBaseForCausalLM(nn.Module, SupportsLoRA, SupportsPP):
weight_loader = getattr(param, "weight_loader",
default_weight_loader)
weight_loader(param, loaded_weight)
loaded_params.add(name)
loaded_params.add(name)
if self.use_llama_nn and self.quant_method is None :
lay_key_words = [
......
......@@ -1028,7 +1028,7 @@ class QWenBaseModel(nn.Module, SupportsPP, SupportsLoRA):
weight_loader = getattr(param, "weight_loader",
default_weight_loader)
weight_loader(param, loaded_weight)
loaded_params.add(name)
loaded_params.add(name)
if self.use_llama_nn and self.quant_method is None :
lay_key_words = [
......
......@@ -553,7 +553,7 @@ class Qwen2MoeForCausalLM(nn.Module, SupportsPP):
weight_loader = getattr(param, "weight_loader",
default_weight_loader)
weight_loader(param, loaded_weight)
loaded_params.add(name)
loaded_params.add(name)
if self.use_llama_nn and self.quant_method is None:
lay_key_words = [
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment