[XPU] Fix circular import error. (#24927)

Signed-off-by: Kunshang Ji <kunshang.ji@intel.com>

[XPU] Fix circular import error. (#24927)
Signed-off-by: Kunshang Ji <kunshang.ji@intel.com>
5206ab20 · Kunshang Ji · GitHub · 0af3ce13 · 5206ab20
Unverified commit 5206ab20, authored Sep 16, 2025 by Kunshang Ji; committed by GitHub on Sep 16, 2025.
Hide whitespace changes
Inline Side-by-side

Showing 1 changed file with 5 additions and 1 deletion

vllm/platforms/xpu.py vllm/platforms/xpu.py +5 -1

No files found.
--- a/vllm/platforms/xpu.py
+++ b/vllm/platforms/xpu.py
@@ -9,7 +9,6 @@ import torch
 import vllm.envs as envs
 from vllm.logger import init_logger
 from vllm.utils import DEFAULT_MAX_NUM_BATCHED_TOKENS
-from vllm.v1.attention.backends.utils import set_kv_cache_layout
 from .interface import DeviceCapability, Platform, PlatformEnum, _Backend
@@ -164,11 +163,16 @@ class XPUPlatform(Platform):
            vllm_config.scheduler_config.max_num_batched_tokens = max(
                vllm_config.scheduler_config.max_model_len,
                DEFAULT_MAX_NUM_BATCHED_TOKENS)
+        from vllm.v1.attention.backends.utils import set_kv_cache_layout
        set_kv_cache_layout("NHD")
        logger.info("Setting VLLM_KV_CACHE_LAYOUT to 'NHD' for XPU; "
                    "only NHD layout is supported by XPU attention kernels.")
+    @classmethod
+    def support_hybrid_kv_cache(cls) -> bool:
+        return True
    @classmethod
    def is_pin_memory_available(cls):
        return True