Unverified commit 48eb8eba, authored by Chenheli Hua, committed by GitHub
Browse files

[Temp fix] Disable torch.compile for Qwen2.5 VL's VisionBlock temporarily. (#27760)


Signed-off-by: Chenheli Hua <huachenheli@outlook.com>
Signed-off-by: Roger Wang <hey@rogerw.io>
Co-authored-by: Roger Wang <hey@rogerw.io>
parent b5d90f74
...@@ -460,15 +460,17 @@ class Qwen2_5_VisionAttention(nn.Module): ...@@ -460,15 +460,17 @@ class Qwen2_5_VisionAttention(nn.Module):
return output return output
@support_torch_compile( # (FIXME): Enable this after dynamic slicing is fixed
dynamic_arg_dims={ # See https://github.com/vllm-project/vllm/pull/27760
"x": 0, # @support_torch_compile(
"cu_seqlens": 0, # dynamic_arg_dims={
"rotary_pos_emb": 0, # "x": 0,
"seqlens": 0, # "cu_seqlens": 0,
}, # "rotary_pos_emb": 0,
mark_unbacked_dims={"seqlens": 0}, # "seqlens": 0,
) # },
# mark_unbacked_dims={"seqlens": 0},
# )
class Qwen2_5_VisionBlock(nn.Module): class Qwen2_5_VisionBlock(nn.Module):
def __init__( def __init__(
self, self,
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment