[Temp fix] Disable torch.compile for Qwen2.5 VL's VisionBlock temporarily. (#27760)

Signed-off-by: Chenheli Hua <huachenheli@outlook.com>
Signed-off-by: Roger Wang <hey@rogerw.io>
Co-authored-by: Roger Wang <hey@rogerw.io>

[Temp fix] Disable torch.compile for Qwen2.5 VL's VisionBlock temporarily. (#27760)
Signed-off-by: Chenheli Hua <huachenheli@outlook.com>
Signed-off-by: Roger Wang <hey@rogerw.io>
Co-authored-by: Roger Wang <hey@rogerw.io>
48eb8eba · Chenheli Hua · GitHub · b5d90f74 · 48eb8eba
Unverified Commit 48eb8eba authored Oct 29, 2025 by Chenheli Hua Committed by GitHub Oct 29, 2025
Show whitespace changes
Inline Side-by-side

Showing with 11 additions and 9 deletions

vllm/model_executor/models/qwen2_5_vl.py vllm/model_executor/models/qwen2_5_vl.py +11 -9

No files found.
--- a/vllm/model_executor/models/qwen2_5_vl.py
+++ b/vllm/model_executor/models/qwen2_5_vl.py
@@ -460,15 +460,17 @@ class Qwen2_5_VisionAttention(nn.Module):
        return output
-@support_torch_compile(
+# (FIXME): Enable this after dynamic slicing is fixed
-    dynamic_arg_dims={
+# See https://github.com/vllm-project/vllm/pull/27760
-        "x": 0,
+# @support_torch_compile(
-        "cu_seqlens": 0,
+#     dynamic_arg_dims={
-        "rotary_pos_emb": 0,
+#         "x": 0,
-        "seqlens": 0,
+#         "cu_seqlens": 0,
-    },
+#         "rotary_pos_emb": 0,
-    mark_unbacked_dims={"seqlens": 0},
+#         "seqlens": 0,
-)
+#     },
+#     mark_unbacked_dims={"seqlens": 0},
+# )
 class Qwen2_5_VisionBlock(nn.Module):
    def __init__(
        self,