[torch.compile] add warning for unsupported models (#10622)

Signed-off-by: youkaichao <youkaichao@gmail.com>
2025-12-16 01:49:19 +08:00 · 2024-11-24 23:27:51 -08:00 · 2024-11-24 23:27:51 -08:00 · 65813781a2
commit 65813781a2
parent 7c2134beda
3 changed files with 18 additions and 0 deletions
--- a/vllm/compilation/counter.py
+++ b/vllm/compilation/counter.py
@ -5,6 +5,7 @@ from contextlib import contextmanager
@dataclasses.dataclass
 class CompilationCounter:
    num_models_seen: int = 0
    num_graphs_seen: int = 0
    # including the splitting ops
    num_piecewise_graphs_seen: int = 0
--- a/vllm/compilation/decorators.py
+++ b/vllm/compilation/decorators.py
@ -3,6 +3,7 @@ from typing import Dict, List, Optional, Union
 import torch
 from vllm.compilation.counter import compilation_counter
 from vllm.compilation.wrapper import TorchCompileWrapperWithCustomDispatcher
 from vllm.config import CompilationLevel, VllmConfig
 from vllm.logger import init_logger
@ -130,6 +131,7 @@ def _support_torch_compile(cls: type,
        ] or not supports_dynamo()
        if self.do_not_compile:
            return
        compilation_counter.num_models_seen += 1
        TorchCompileWrapperWithCustomDispatcher.__init__(
            self, compilation_level=vllm_config.compilation_config.level)
--- a/vllm/plugins/init.py
+++ b/vllm/plugins/init.py
@ -80,6 +80,9 @@ def set_current_vllm_config(vllm_config: "VllmConfig"):
    """
    global _current_vllm_config
    old_vllm_config = _current_vllm_config
    from vllm.compilation.counter import compilation_counter
    from vllm.config import CompilationLevel
    num_models_seen = compilation_counter.num_models_seen
    try:
        _current_vllm_config = vllm_config
        yield
@ -88,6 +91,18 @@ def set_current_vllm_config(vllm_config: "VllmConfig"):
                     vllm_config.compilation_config.enabled_custom_ops)
        logger.debug("disabled custom ops: %s",
                     vllm_config.compilation_config.disabled_custom_ops)
        # Warn when piecewise compilation was requested but no model class
        # registered itself with the compilation counter while this config
        # was active.
        if (vllm_config.compilation_config.level == CompilationLevel.PIECEWISE
                and compilation_counter.num_models_seen == num_models_seen):
            # `num_models_seen` holds the counter value captured before the
            # config was installed. A model that supports compilation bumps
            # the counter by at least 1 when it is constructed, so an
            # unchanged counter means the model does not support
            # compilation (does not have @support_torch_compile decorator).
            logger.warning(
                "`torch.compile` is turned on, but the model %s"
                " does not support it. Please open an issue on GitHub"
                # Leading space is required: adjacent literals are joined
                # verbatim, and without it the message reads "GitHubif".
                " if you want it to be supported.",
                vllm_config.model_config.model)
        _current_vllm_config = old_vllm_config