[torch.compile] add warning for unsupported models (#10622)

Signed-off-by: youkaichao <youkaichao@gmail.com>
2026-07-14 07:27:10 +08:00 · 2024-11-24 23:27:51 -08:00 · 2024-11-24 23:27:51 -08:00 · 65813781a2
commit 65813781a2
parent 7c2134beda
3 changed files with 18 additions and 0 deletions
--- a/vllm/compilation/counter.py
+++ b/vllm/compilation/counter.py
@@ -5,6 +5,7 @@ from contextlib import contextmanager

@dataclasses.dataclass
 class CompilationCounter:
+    num_models_seen: int = 0
    num_graphs_seen: int = 0
    # including the splitting ops
    num_piecewise_graphs_seen: int = 0
--- a/vllm/compilation/decorators.py
+++ b/vllm/compilation/decorators.py
@@ -3,6 +3,7 @@ from typing import Dict, List, Optional, Union

 import torch

+from vllm.compilation.counter import compilation_counter
 from vllm.compilation.wrapper import TorchCompileWrapperWithCustomDispatcher
 from vllm.config import CompilationLevel, VllmConfig
 from vllm.logger import init_logger
@@ -130,6 +131,7 @@ def _support_torch_compile(cls: type,
        ] or not supports_dynamo()
        if self.do_not_compile:
            return
+        compilation_counter.num_models_seen += 1
        TorchCompileWrapperWithCustomDispatcher.__init__(
            self, compilation_level=vllm_config.compilation_config.level)

--- a/vllm/plugins/__init__.py
+++ b/vllm/plugins/__init__.py
@@ -80,6 +80,9 @@ def set_current_vllm_config(vllm_config: "VllmConfig"):
    """
    global _current_vllm_config
    old_vllm_config = _current_vllm_config
+    from vllm.compilation.counter import compilation_counter
+    from vllm.config import CompilationLevel
+    num_models_seen = compilation_counter.num_models_seen
    try:
        _current_vllm_config = vllm_config
        yield
@@ -88,6 +91,18 @@ def set_current_vllm_config(vllm_config: "VllmConfig"):
                     vllm_config.compilation_config.enabled_custom_ops)
        logger.debug("disabled custom ops: %s",
                     vllm_config.compilation_config.disabled_custom_ops)
+        if vllm_config.compilation_config.level == CompilationLevel.PIECEWISE \
+            and compilation_counter.num_models_seen == num_models_seen:
+            # If the model supports compilation,
+            # compilation_counter.num_models_seen should be increased
+            # by at least 1.
+            # If it is not increased, it means the model does not support
+            # compilation (does not have @support_torch_compile decorator).
+            logger.warning(
+                "`torch.compile` is turned on, but the model %s"
+                " does not support it. Please open an issue on GitHub"
+                " if you want it to be supported.",
+                vllm_config.model_config.model)
        _current_vllm_config = old_vllm_config