[CustomOp] Support object-level enable for CustomOp (#30547)

Signed-off-by: shen-shanshan <467638484@qq.com>
2026-05-09 17:23:38 +08:00 · 2025-12-15 11:02:09 +08:00 · 2025-12-15 11:02:09 +08:00 · 738648fb81
commit 738648fb81
parent 917fdae5b2
1 changed files with 7 additions and 2 deletions
--- a/vllm/model_executor/custom_op.py
+++ b/vllm/model_executor/custom_op.py
@@ -38,8 +38,9 @@ class CustomOp(nn.Module):
            )
        return super().__new__(op_cls_to_instantiate)

-    def __init__(self):
+    def __init__(self, enforce_enable: bool = False):
        super().__init__()
+        self._enforce_enable = enforce_enable
        self._forward_method = self.dispatch_forward()

    def forward(self, *args, **kwargs):
@@ -84,7 +85,11 @@ class CustomOp(nn.Module):
        # NOTE(woosuk): Here we assume that vLLM was built for only one
        # specific backend. Currently, we do not support dynamic dispatching.
        compilation_config = get_cached_compilation_config()
-        enabled = self.enabled()
+
+        # A CustomOp instance can be force-enabled, e.g., to use device-specific
+        # kernels in ViT models when graph mode is on. By default, it follows
+        # the compilation_config to determine whether to enable itself.
+        enabled = self._enforce_enable or self.enabled()
        if enabled:
            compilation_config.enabled_custom_ops.update([self.__class__.name])
        else: