修复 qwen3-moe-awq 的 bug：量化位数为 4 时，将环境变量 LLAMA_NN 和 LM_NN 设为 '0'

1a4e4cad · yangql · d36deb1a · 1a4e4cad
Commit 1a4e4cad authored Jun 04, 2025 by yangql
Hide whitespace changes
Inline Side-by-side

Showing with 3 additions and 0 deletions

vllm/model_executor/models/qwen3_moe.py vllm/model_executor/models/qwen3_moe.py +3 -0

No files found.
--- a/vllm/model_executor/models/qwen3_moe.py
+++ b/vllm/model_executor/models/qwen3_moe.py
@@ -332,6 +332,9 @@ class Qwen3MoeModel(nn.Module):
        self.padding_idx = config.pad_token_id
        self.vocab_size = config.vocab_size
        self.config = config
+        if self.config.quantization_config["bits"] == 4:
+            os.environ['LLAMA_NN'] = '0'
+            os.environ['LM_NN'] = '0'  
        self.embed_tokens = VocabParallelEmbedding(
            config.vocab_size,
            config.hidden_size,