Unverified commit 4120a05f, authored by Jim Smith and committed by GitHub
Browse files

Fix AttributeError in Qwen3.5 GDN layers with quantized models (#37448)


Signed-off-by: Jim Smith <jim@joshua8.ai>
Signed-off-by: mgoin <mgoin64@gmail.com>
Signed-off-by: Michael Goin <mgoin64@gmail.com>
Co-authored-by: mgoin <mgoin64@gmail.com>
Co-authored-by: Xin Yang <105740670+xyang16@users.noreply.github.com>
parent 98ff0429
@@ -182,8 +182,8 @@ class Qwen3_5GatedDeltaNet(Qwen3NextGatedDeltaNet):
 # ============================================================
 mixed_qkvz, ba = torch.ops.vllm.gdn_in_proj(
 hidden_states,
-self.in_proj_qkvz.weight.shape[0],
-self.in_proj_ba.weight.shape[0],
+sum(self.in_proj_qkvz.output_sizes) // self.tp_size,
+sum(self.in_proj_ba.output_sizes) // self.tp_size,
 self.prefix,
 )
 qkv_size = (self.key_dim * 2 + self.value_dim) // self.tp_size
......
@@ -660,8 +660,8 @@ class Qwen3NextGatedDeltaNet(nn.Module, MambaBase):
 # ============================================================
 projected_states_qkvz, projected_states_ba = torch.ops.vllm.gdn_in_proj(
 hidden_states,
-self.in_proj_qkvz.weight.shape[0],
-self.in_proj_ba.weight.shape[0],
+sum(self.in_proj_qkvz.output_sizes) // self.tp_size,
+sum(self.in_proj_ba.output_sizes) // self.tp_size,
 self.prefix,
 )
 query, key, value, z, b, a = self.fix_query_key_value_ordering(
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment