[Platform] Allow platforms to use the V1 Engine by default (#19792)

Signed-off-by: wangxiyuan <wangxiyuan1007@gmail.com>
2025-12-15 11:55:00 +08:00 · 2025-06-18 21:03:36 +08:00 · 2025-06-18 21:03:36 +08:00 · 257ab95439
commit 257ab95439
parent cca91a7a10
3 changed files with 20 additions and 9 deletions
--- a/vllm/engine/arg_utils.py
+++ b/vllm/engine/arg_utils.py
@ -1303,7 +1303,7 @@ class EngineArgs:
        # Skip this check if we are running on a non-GPU platform,
        # or if the device capability is not available
        # (e.g. in a Ray actor without GPUs).
-        from vllm.platforms import CpuArchEnum, current_platform
+        from vllm.platforms import current_platform
        if (current_platform.is_cuda()
                and current_platform.get_device_capability()
                and current_platform.get_device_capability().major < 8):
@ -1445,14 +1445,10 @@ class EngineArgs:
            _raise_or_fallback(feature_name=name, recommend_to_remove=False)
            return False
-        # Non-[CUDA, TPU, x86 CPU] may be supported on V1,
+        # The platform may be supported on V1, but off by default for now.
-        # but off by default for now.
+        if not current_platform.default_v1(  # noqa: SIM103
-        v0_hardware = not any(
+                model_config=model_config) and _warn_or_fallback(
-            (current_platform.is_cuda_alike(), current_platform.is_tpu(),
+                    current_platform.device_name):
             (current_platform.is_cpu()
              and current_platform.get_cpu_architecture() == CpuArchEnum.X86)))
        if v0_hardware and _warn_or_fallback(  # noqa: SIM103
                current_platform.device_name):
            return False
        #############################################################
--- a/vllm/platforms/cpu.py
+++ b/vllm/platforms/cpu.py
@ -269,3 +269,11 @@ class CpuPlatform(Platform):
        model configuration.
        """
        return True
    @classmethod
    def default_v1(cls, model_config) -> bool:
        """Tell whether V1 should be the default engine on this platform.

        V1 is the default only when the platform supports V1 for
        ``model_config`` and the CPU architecture is x86.
        """
        v1_supported = cls.supports_v1(model_config)
        if not v1_supported:
            # Mirrors the short-circuit of ``and``: the CPU architecture is
            # not queried when V1 is unsupported for this model.
            return v1_supported
        return cls.get_cpu_architecture() == CpuArchEnum.X86
--- a/vllm/platforms/interface.py
+++ b/vllm/platforms/interface.py
@ -479,6 +479,13 @@ class Platform:
        """
        return False
    @classmethod
    def default_v1(cls, model_config: ModelConfig) -> bool:
        """
        Report whether V1 is used by default on this platform.

        The base implementation defers entirely to `supports_v1` for the
        given model configuration; a platform can override this method to
        apply a stricter default.
        """
        v1_supported = cls.supports_v1(model_config)
        return v1_supported
    @classmethod
    def use_custom_allreduce(cls) -> bool:
        """