[compile] Disable aot when eager backend is used. (#30810)

Signed-off-by: zhxchen17 <zhxchen17@fb.com>
2026-07-03 06:27:10 +08:00 · 2025-12-17 04:55:56 -05:00 · 2025-12-17 04:55:56 -05:00 · 177c391db2
commit 177c391db2
parent 519ef9a911
1 changed files with 9 additions and 2 deletions
--- a/vllm/compilation/decorators.py
+++ b/vllm/compilation/decorators.py
@ -435,7 +435,10 @@ def _support_torch_compile(
                return self.aot_compiled_fn(self, *args, **kwargs)

        if self.compiled:
-            assert not envs.VLLM_USE_AOT_COMPILE
+            assert (
+                not envs.VLLM_USE_AOT_COMPILE
+                or self.vllm_config.compilation_config.backend == "eager"
+            )
            return TorchCompileWithNoGuardsWrapper.__call__(self, *args, **kwargs)

        # This is the path for the first compilation.
@ -508,7 +511,11 @@ def _support_torch_compile(
            _torch27_patch_tensor_subclasses(),
            torch._inductor.config.patch(**inductor_config_patches),
        ):
-            if envs.VLLM_USE_AOT_COMPILE:
+            use_aot_compile = envs.VLLM_USE_AOT_COMPILE
+            if self.vllm_config.compilation_config.backend == "eager":
+                logger.warning("Detected eager backend, disabling AOT compile.")
+                use_aot_compile = False
+            if use_aot_compile:
                self.aot_compiled_fn = self.aot_compile(*args, **kwargs)
                output = self.aot_compiled_fn(self, *args, **kwargs)
                assert aot_compilation_path is not None