Commit 91577443 authored by zhuwenwen
Browse files

set VLLM_USE_TC_PAGED_ATTN=1

parent 905411f1
@@ -206,7 +206,7 @@ environment_variables: Dict[str, Callable[[], Any]] = {
     # flag to control vllm to use optimized tc paged attn kernels
     "VLLM_USE_TC_PAGED_ATTN":
-    lambda: (os.environ.get("VLLM_USE_TC_PAGED_ATTN", "False").lower() in
+    lambda: (os.environ.get("VLLM_USE_TC_PAGED_ATTN", "True").lower() in
              ("true", "1")),
     # flag to control if vllm print pa parameters
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment