Commit 4c167900 authored by zhuwenwen
Browse files

set VLLM_USE_TOPK_RENORM=1

parent 2fc5b0bb
...@@ -1235,7 +1235,7 @@ environment_variables: dict[str, Callable[[], Any]] = { ...@@ -1235,7 +1235,7 @@ environment_variables: dict[str, Callable[[], Any]] = {
# vLLM will use optimized topk_softmax + renormalize # vLLM will use optimized topk_softmax + renormalize
"VLLM_USE_TOPK_RENORM": "VLLM_USE_TOPK_RENORM":
lambda: lambda:
(os.environ.get("VLLM_USE_TOPK_RENORM", "False").lower() in (os.environ.get("VLLM_USE_TOPK_RENORM", "True").lower() in
("true", "1")), ("true", "1")),
} }
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment