update baichuan.py

277271f8 · zhuwenwen · 746d9b40 · 277271f8
Commit 277271f8 authored Apr 09, 2025 by zhuwenwen
Hide whitespace changes
Inline Side-by-side

Showing with 7 additions and 1 deletion

vllm/model_executor/models/baichuan.py vllm/model_executor/models/baichuan.py +7 -1

No files found.
--- a/vllm/model_executor/models/baichuan.py
+++ b/vllm/model_executor/models/baichuan.py
@@ -399,6 +399,12 @@ class BaiChuanModel(nn.Module):
            for layername in loaded_params:
                weight = params_dict[layername]
+                if "lm_head.weight" in layername and weight.shape[1] >= 4096:
+                    lay_key_words.append("lm_head.weight")
+                    combined_words = "|".join(lay_key_words)
+                    os.environ['LM_NN'] = '1'  
+                else:
+                    os.environ['LM_NN'] = '0' 
                matches = re.findall(combined_words, layername)
                if matches:      
                    # if self.use_gemm_pad and gemm_bank_conf(weight.data.shape[0]):
@@ -579,4 +585,4 @@ class BaiChuanForCausalLM(BaiChuanBaseForCausalLM):
    def __init__(self, *, vllm_config: VllmConfig, prefix: str = ""):
        super().__init__(vllm_config=vllm_config,
                         prefix=prefix,
                         position_embedding="ROPE")
\ No newline at end of file