Unverified commit 177c391d, authored by Zhengxu Chen, committed by GitHub
Browse files

[compile] Disable aot when eager backend is used. (#30810)


Signed-off-by: zhxchen17 <zhxchen17@fb.com>
parent 519ef9a9
...@@ -435,7 +435,10 @@ def _support_torch_compile( ...@@ -435,7 +435,10 @@ def _support_torch_compile(
return self.aot_compiled_fn(self, *args, **kwargs) return self.aot_compiled_fn(self, *args, **kwargs)
if self.compiled: if self.compiled:
assert not envs.VLLM_USE_AOT_COMPILE assert (
not envs.VLLM_USE_AOT_COMPILE
or self.vllm_config.compilation_config.backend == "eager"
)
return TorchCompileWithNoGuardsWrapper.__call__(self, *args, **kwargs) return TorchCompileWithNoGuardsWrapper.__call__(self, *args, **kwargs)
# This is the path for the first compilation. # This is the path for the first compilation.
...@@ -508,7 +511,11 @@ def _support_torch_compile( ...@@ -508,7 +511,11 @@ def _support_torch_compile(
_torch27_patch_tensor_subclasses(), _torch27_patch_tensor_subclasses(),
torch._inductor.config.patch(**inductor_config_patches), torch._inductor.config.patch(**inductor_config_patches),
): ):
if envs.VLLM_USE_AOT_COMPILE: use_aot_compile = envs.VLLM_USE_AOT_COMPILE
if self.vllm_config.compilation_config.backend == "eager":
logger.warning("Detected eager backend, disabling AOT compile.")
use_aot_compile = False
if use_aot_compile:
self.aot_compiled_fn = self.aot_compile(*args, **kwargs) self.aot_compiled_fn = self.aot_compile(*args, **kwargs)
output = self.aot_compiled_fn(self, *args, **kwargs) output = self.aot_compiled_fn(self, *args, **kwargs)
assert aot_compilation_path is not None assert aot_compilation_path is not None
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment