Commit 07c69390 authored by zhuwenwen
Browse files

Update qwen3_moe.py

parent 90e10dee
...@@ -332,9 +332,9 @@ class Qwen3MoeModel(nn.Module): ...@@ -332,9 +332,9 @@ class Qwen3MoeModel(nn.Module):
self.padding_idx = config.pad_token_id self.padding_idx = config.pad_token_id
self.vocab_size = config.vocab_size self.vocab_size = config.vocab_size
self.config = config self.config = config
if self.config.quantization_config["bits"] == 4: # if self.config.quantization_config["bits"] == 4:
os.environ['LLAMA_NN'] = '0' # os.environ['LLAMA_NN'] = '0'
os.environ['LM_NN'] = '0' # os.environ['LM_NN'] = '0'
self.embed_tokens = VocabParallelEmbedding( self.embed_tokens = VocabParallelEmbedding(
config.vocab_size, config.vocab_size,
config.hidden_size, config.hidden_size,
...@@ -589,4 +589,4 @@ class Qwen3MoeForCausalLM(nn.Module, SupportsPP): ...@@ -589,4 +589,4 @@ class Qwen3MoeForCausalLM(nn.Module, SupportsPP):
self, self,
skip_prefixes=(["rotary_emb.inv_freq"]), skip_prefixes=(["rotary_emb.inv_freq"]),
) )
return loader.load_weights(weights) return loader.load_weights(weights)
\ No newline at end of file
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment