Commit e4a84fdc authored by zhuwenwen
Browse files

set VLLM_USE_V1=1

parent 7151fd54
...@@ -1745,7 +1745,8 @@ class AsyncEngineArgs(EngineArgs): ...@@ -1745,7 +1745,8 @@ class AsyncEngineArgs(EngineArgs):
def _raise_or_fallback(feature_name: str, recommend_to_remove: bool): def _raise_or_fallback(feature_name: str, recommend_to_remove: bool):
if envs.is_set("VLLM_USE_V1") and envs.VLLM_USE_V1: # if envs.is_set("VLLM_USE_V1") and envs.VLLM_USE_V1:
if envs.VLLM_USE_V1:
raise NotImplementedError( raise NotImplementedError(
f"VLLM_USE_V1=1 is not supported with {feature_name}.") f"VLLM_USE_V1=1 is not supported with {feature_name}.")
msg = f"{feature_name} is not supported by the V1 Engine. " msg = f"{feature_name} is not supported by the V1 Engine. "
...@@ -1757,7 +1758,8 @@ def _raise_or_fallback(feature_name: str, recommend_to_remove: bool): ...@@ -1757,7 +1758,8 @@ def _raise_or_fallback(feature_name: str, recommend_to_remove: bool):
def _warn_or_fallback(feature_name: str) -> bool: def _warn_or_fallback(feature_name: str) -> bool:
if envs.is_set("VLLM_USE_V1") and envs.VLLM_USE_V1: # if envs.is_set("VLLM_USE_V1") and envs.VLLM_USE_V1:
if envs.VLLM_USE_V1:
logger.warning( logger.warning(
"Detected VLLM_USE_V1=1 with %s. Usage should " "Detected VLLM_USE_V1=1 with %s. Usage should "
"be considered experimental. Please report any " "be considered experimental. Please report any "
......
...@@ -665,7 +665,7 @@ environment_variables: dict[str, Callable[[], Any]] = { ...@@ -665,7 +665,7 @@ environment_variables: dict[str, Callable[[], Any]] = {
# If set, use the V1 code path. # If set, use the V1 code path.
"VLLM_USE_V1": "VLLM_USE_V1":
lambda: bool(int(os.getenv("VLLM_USE_V1", "0"))), lambda: bool(int(os.getenv("VLLM_USE_V1", "1"))),
# Disable aiter ops unless specifically enabled. # Disable aiter ops unless specifically enabled.
# Acts as a parent switch to enable the rest of the other operations. # Acts as a parent switch to enable the rest of the other operations.
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment