[Platform] Allow platform use V1 Engine by default (#19792)

Signed-off-by: wangxiyuan <wangxiyuan1007@gmail.com>

[Platform] Allow platform use V1 Engine by default (#19792)
Signed-off-by: wangxiyuan <wangxiyuan1007@gmail.com>
257ab954 · wangxiyuan · GitHub · cca91a7a · 257ab954 · 257ab954
Unverified Commit 257ab954 authored Jun 18, 2025 by wangxiyuan Committed by GitHub Jun 18, 2025
Show whitespace changes
Inline Side-by-side

Showing with 20 additions and 9 deletions

vllm/engine/arg_utils.py vllm/engine/arg_utils.py +5 -9

vllm/platforms/cpu.py vllm/platforms/cpu.py +8 -0

vllm/platforms/interface.py vllm/platforms/interface.py +7 -0

No files found.
--- a/vllm/engine/arg_utils.py
+++ b/vllm/engine/arg_utils.py
@@ -1303,7 +1303,7 @@ class EngineArgs:
        # Skip this check if we are running on a non-GPU platform,
        # or if the device capability is not available
        # (e.g. in a Ray actor without GPUs).
-        from vllm.platforms import CpuArchEnum, current_platform
+        from vllm.platforms import current_platform
        if (current_platform.is_cuda()
                and current_platform.get_device_capability()
                and current_platform.get_device_capability().major < 8):
@@ -1445,13 +1445,9 @@ class EngineArgs:
            _raise_or_fallback(feature_name=name, recommend_to_remove=False)
            return False
-        # Non-[CUDA, TPU, x86 CPU] may be supported on V1,
-        # but off by default for now.
-        v0_hardware = not any(
-            (current_platform.is_cuda_alike(), current_platform.is_tpu(),
-             (current_platform.is_cpu()
-              and current_platform.get_cpu_architecture() == CpuArchEnum.X86)))
-        if v0_hardware and _warn_or_fallback(  # noqa: SIM103
+        # The platform may be supported on V1, but off by default for now.
+        if not current_platform.default_v1(  # noqa: SIM103
+                model_config=model_config) and _warn_or_fallback(
                    current_platform.device_name):
            return False
        #############################################################

--- a/vllm/platforms/cpu.py
+++ b/vllm/platforms/cpu.py
@@ -269,3 +269,11 @@ class CpuPlatform(Platform):
        model configuration.
        """
        return True
+    @classmethod
+    def default_v1(cls, model_config) -> bool:
+        """Returns whether the current platform can use v1 by default for the
+        supplied model configuration.
+        """
+        return cls.supports_v1(
+            model_config) and cls.get_cpu_architecture() == CpuArchEnum.X86
--- a/vllm/platforms/interface.py
+++ b/vllm/platforms/interface.py
@@ -479,6 +479,13 @@ class Platform:
        """
        return False
+    @classmethod
+    def default_v1(cls, model_config: ModelConfig) -> bool:
+        """
+        Returns whether the current platform supports v1 by default.
+        """
+        return cls.supports_v1(model_config)
    @classmethod
    def use_custom_allreduce(cls) -> bool:
        """