[Bugfix][Platform][CPU] Fix cuda platform detection on CPU backend edge case (#13358)

Signed-off-by: Isotr0py <2037008807@qq.com>
2026-07-29 05:01:19 +08:00 · 2025-02-17 02:55:27 +08:00 · 2025-02-17 02:55:27 +08:00 · d67cc21b78
commit d67cc21b78
parent e18227b04a
1 changed files with 9 additions and 2 deletions
--- a/vllm/platforms/__init__.py
+++ b/vllm/platforms/__init__.py
@@ -33,12 +33,19 @@ def cuda_platform_plugin() -> Optional[str]:
    is_cuda = False
    try:
+        from importlib.metadata import version
        from vllm.utils import import_pynvml
        pynvml = import_pynvml()
        pynvml.nvmlInit()
        try:
-            if pynvml.nvmlDeviceGetCount() > 0:
+            # NOTE: Edge case: vllm cpu build on a GPU machine.
-                is_cuda = True
+            # Third-party pynvml can be imported in cpu build,
+            # we need to check if vllm is built with cpu too.
+            # Otherwise, vllm will always activate cuda plugin
+            # on a GPU machine, even if in a cpu build.
+            is_cuda = (pynvml.nvmlDeviceGetCount() > 0
+                       and "cpu" not in version("vllm"))
        finally:
            pynvml.nvmlShutdown()
    except Exception as e: