[XPU]Fix crash due to removed VLLM_USE_V1 attribute (#28520)

Signed-off-by: chaojun-zhang <chaojun.zhang@intel.com>

[XPU]Fix crash due to removed VLLM_USE_V1 attribute (#28520)
Signed-off-by: chaojun-zhang <chaojun.zhang@intel.com>
a4730c1b · Chaojun Zhang · GitHub · d3ade61e · a4730c1b
Unverified · Commit a4730c1b, authored Nov 12, 2025 by Chaojun Zhang; committed by GitHub on Nov 12, 2025
Hide whitespace changes
Inline Side-by-side

Showing with 3 additions and 2 deletions

vllm/platforms/xpu.py +3 -2

No files found.
--- a/vllm/platforms/xpu.py
+++ b/vllm/platforms/xpu.py
@@ -65,7 +65,6 @@ class XPUPlatform(Platform):

        if use_sparse:
            raise NotImplementedError("Sparse Attention is not supported on XPU.")
-        use_v1 = envs.VLLM_USE_V1
        if not use_v1:
            raise ValueError("XPU backend only supports V1.")
        if selected_backend == AttentionBackendEnum.TRITON_ATTN:
@@ -115,7 +114,9 @@ class XPUPlatform(Platform):
    @classmethod
    def get_vit_attn_backend(
        cls, head_size: int, dtype: torch.dtype
-    ) -> AttentionBackendEnum:
+    ) -> "AttentionBackendEnum":
+        from vllm.attention.backends.registry import AttentionBackendEnum
+
        return AttentionBackendEnum.FLASH_ATTN

    @classmethod