[fix]修复ds3量化代码引入的报错

bcce8974 · 王敏 · 4fb33500 · bcce8974 · bcce8974
Commit bcce8974 authored Feb 26, 2025 by 王敏
Showing with 2 additions and 2 deletions

vllm/model_executor/model_loader/utils.py +1 -1

vllm/model_executor/models/deepseek_v2.py +1 -1

No files found.
--- a/vllm/model_executor/model_loader/utils.py
+++ b/vllm/model_executor/model_loader/utils.py
@@ -84,7 +84,7 @@ def get_model_architecture(
                                'Qwen2MoeForCausalLM', 'ChatGLMModel', 'ChatGLMForConditionalGeneration', 
                                'BaichuanForCausalLM', 'BloomForCausalLM', 'MedusaModel', 'MixtralForCausalLM', 
                                'MLPSpeculatorPreTrainedModel', 'FalconForCausalLM', 'DeepseekV2ForCausalLM', 
-                                'DeepseekV3ForCausalLM', 'DeepSeekMTP']  
+                                'DeepseekV3ForCausalLM', 'DeepSeekMTPModel']  
    if any(arch in architectures for arch in support_nn_architectures): 
        if os.getenv('LLAMA_NN') != '0': 
             if (architectures == ['QWenLMHeadModel'] or architectures == ['ChatGLMModel'] ) and visions != []:

--- a/vllm/model_executor/models/deepseek_v2.py
+++ b/vllm/model_executor/models/deepseek_v2.py
@@ -870,7 +870,7 @@ class DeepseekV2ForCausalLM(nn.Module, SupportsPP):
                    weight.data=weight.data.reshape(ori_shape[1],-1)
-        if self.config.quantization_config["quant_method"] == "awq" and not envs.VLLM_USE_TRITON_AWQ:
+        if hasattr(self.config, "quantization_config") and self.config.quantization_config["quant_method"] == "awq" and not envs.VLLM_USE_TRITON_AWQ:
            lay_key_words = [
                "self_attn.q_a_proj.qweight",
                "self_attn.q_b_proj.qweight",