[compile] Disable aot when eager backend is used. (#30810)

Signed-off-by: zhxchen17 <zhxchen17@fb.com>

[compile] Disable aot when eager backend is used. (#30810)
Signed-off-by: zhxchen17 <zhxchen17@fb.com>
177c391d · Zhengxu Chen · GitHub · 519ef9a9 · 177c391d
Unverified commit 177c391d, authored Dec 17, 2025 by Zhengxu Chen; committed by GitHub on Dec 17, 2025.
Hide whitespace changes
Inline Side-by-side

Showing with 9 additions and 2 deletions

vllm/compilation/decorators.py → vllm/compilation/decorators.py (+9 additions, -2 deletions)

No files found.
--- a/vllm/compilation/decorators.py
+++ b/vllm/compilation/decorators.py
@@ -435,7 +435,10 @@ def _support_torch_compile(
                return self.aot_compiled_fn(self, *args, **kwargs)

        if self.compiled:
-            assert not envs.VLLM_USE_AOT_COMPILE
+            assert (
+                not envs.VLLM_USE_AOT_COMPILE
+                or self.vllm_config.compilation_config.backend == "eager"
+            )
            return TorchCompileWithNoGuardsWrapper.__call__(self, *args, **kwargs)

        # This is the path for the first compilation.
@@ -508,7 +511,11 @@ def _support_torch_compile(
            _torch27_patch_tensor_subclasses(),
            torch._inductor.config.patch(**inductor_config_patches),
        ):
-            if envs.VLLM_USE_AOT_COMPILE:
+            use_aot_compile = envs.VLLM_USE_AOT_COMPILE
+            if self.vllm_config.compilation_config.backend == "eager":
+                logger.warning("Detected eager backend, disabling AOT compile.")
+                use_aot_compile = False
+            if use_aot_compile:
                self.aot_compiled_fn = self.aot_compile(*args, **kwargs)
                output = self.aot_compiled_fn(self, *args, **kwargs)
                assert aot_compilation_path is not None