Unverified commit 4f204db5, authored by Yineng Zhang and committed by GitHub
Browse files

fix: resolve b200 dsv3 mtp issue (#7286)

parent 3eb4a800
......@@ -1932,6 +1932,8 @@ class DeepseekV2ForCausalLM(nn.Module):
self._weight_requant_ue8m0()
def _weight_requant_ue8m0(self):
if self.config.architectures[0] == "DeepseekV3ForCausalLMNextN":
return
weight_block_size = self.quant_config.weight_block_size
moe_layers = list(
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment