Unverified Commit 73b24346 authored by Jee Jee Li's avatar Jee Jee Li Committed by GitHub
Browse files

[BugFix] Add env variable to control PDL in LoRA (#32836)


Signed-off-by: default avatarJee Jee Li <pandaleefree@gmail.com>
parent 7e67df55
...@@ -251,6 +251,7 @@ if TYPE_CHECKING: ...@@ -251,6 +251,7 @@ if TYPE_CHECKING:
VLLM_LOG_MODEL_INSPECTION: bool = False VLLM_LOG_MODEL_INSPECTION: bool = False
VLLM_DEBUG_MFU_METRICS: bool = False VLLM_DEBUG_MFU_METRICS: bool = False
VLLM_DISABLE_LOG_LOGO: bool = False VLLM_DISABLE_LOG_LOGO: bool = False
VLLM_LORA_DISABLE_PDL: bool = False
def get_default_cache_root(): def get_default_cache_root():
...@@ -1618,8 +1619,12 @@ environment_variables: dict[str, Callable[[], Any]] = { ...@@ -1618,8 +1619,12 @@ environment_variables: dict[str, Callable[[], Any]] = {
), ),
# Disable logging of vLLM logo at server startup time. # Disable logging of vLLM logo at server startup time.
"VLLM_DISABLE_LOG_LOGO": lambda: bool(int(os.getenv("VLLM_DISABLE_LOG_LOGO", "0"))), "VLLM_DISABLE_LOG_LOGO": lambda: bool(int(os.getenv("VLLM_DISABLE_LOG_LOGO", "0"))),
# Disable PDL for LoRA, as enabling PDL with LoRA on SM100 causes
# Triton compilation to fail.
"VLLM_LORA_DISABLE_PDL": lambda: bool(int(os.getenv("VLLM_LORA_DISABLE_PDL", "0"))),
} }
# --8<-- [end:env-vars-definition] # --8<-- [end:env-vars-definition]
......
...@@ -310,4 +310,9 @@ def supports_pdl(device: torch.device | None = None) -> bool: ...@@ -310,4 +310,9 @@ def supports_pdl(device: torch.device | None = None) -> bool:
Refer to: https://github.com/triton-lang/triton/blob/v3.5.0/python/tutorials/11-programmatic-dependent-launch.py Refer to: https://github.com/triton-lang/triton/blob/v3.5.0/python/tutorials/11-programmatic-dependent-launch.py
""" """
# PDL requires compute capability SM90 or above # PDL requires compute capability SM90 or above
return current_platform.is_cuda() and current_platform.has_device_capability(90)
return (
current_platform.is_cuda()
and current_platform.has_device_capability(90)
and not envs.VLLM_LORA_DISABLE_PDL
)
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment