Unverified commit cbc8457b, authored by vllmellm, committed by GitHub
Browse files

[Model] Switch to Fused RMS norm in Qwen2.5_VL model. (#22184)


Signed-off-by: kf <kuanfu.liu@embeddedllm.com>
Signed-off-by: tjtanaavllm <tunjian.tan@amd.com>
Signed-off-by: vllmellm <vllm.ellm@embeddedllm.com>
Co-authored-by: kf <kuanfu.liu@embeddedllm.com>
parent 4d4297e8
......
@@ -396,13 +396,13 @@ class Qwen2_5_VisionBlock(nn.Module):
max_seqlen: Optional[int] = None, # Only used for Flash Attention
seqlens: Optional[list[int]] = None, # Only used for xFormers
) -> torch.Tensor:
x = x + self.attn(self.norm1(x),
cu_seqlens=cu_seqlens,
rotary_pos_emb=rotary_pos_emb,
max_seqlen=max_seqlen,
seqlens=seqlens)
x = x + self.mlp(self.norm2(x))
x_attn = self.attn(self.norm1(x),
cu_seqlens=cu_seqlens,
rotary_pos_emb=rotary_pos_emb,
max_seqlen=max_seqlen,
seqlens=seqlens)
x_fused_norm, residual = self.norm2(x, residual=x_attn)
x = residual + self.mlp(x_fused_norm)
return x
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment