Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
Menu
Open sidebar
OpenDAS
vllm_cscc
Commits
ee7a66dd
Unverified
Commit
ee7a66dd
authored
Sep 19, 2025
by
Lucia Fang
Committed by
GitHub
Sep 19, 2025
Browse files
allow disable flashinfer prefill (#25276)
Signed-off-by: Lu Fang <fanglu@fb.com>
parent
431535b5
Changes
2
Show whitespace changes
Inline
Side-by-side
Showing 2 changed files with 5 additions and 1 deletion
+5
-1
vllm/envs.py
vllm/envs.py
+3
-0
vllm/v1/attention/backends/mla/common.py
vllm/v1/attention/backends/mla/common.py
+2
-1
No files found.
vllm/envs.py
View file @
ee7a66dd
...
...
@@ -32,6 +32,7 @@ if TYPE_CHECKING:
     VLLM_CONFIG_ROOT: str = os.path.expanduser("~/.config/vllm")
     VLLM_USAGE_STATS_SERVER: str = "https://stats.vllm.ai"
     VLLM_NO_USAGE_STATS: bool = False
+    VLLM_DISABLE_FLASHINFER_PREFILL: bool = False
     VLLM_DO_NOT_TRACK: bool = False
     VLLM_USAGE_SOURCE: str = ""
     VLLM_CONFIGURE_LOGGING: int = 1
...
...
@@ -479,6 +480,8 @@ environment_variables: dict[str, Callable[[], Any]] = {
     lambda: os.environ.get("VLLM_USAGE_STATS_SERVER", "https://stats.vllm.ai"),
     "VLLM_NO_USAGE_STATS":
     lambda: os.environ.get("VLLM_NO_USAGE_STATS", "0") == "1",
+    "VLLM_DISABLE_FLASHINFER_PREFILL":
+    lambda: os.environ.get("VLLM_DISABLE_FLASHINFER_PREFILL", "0") == "1",
     "VLLM_DO_NOT_TRACK":
     lambda: (os.environ.get("VLLM_DO_NOT_TRACK", None) or os.environ.get(
         "DO_NOT_TRACK", None) or "0") == "1",
...
...
vllm/v1/attention/backends/mla/common.py
View file @
ee7a66dd
...
...
@@ -412,7 +412,8 @@ M = TypeVar("M", bound=MLACommonMetadata)
 def use_flashinfer_prefill() -> bool:
     # For blackwell default to flashinfer prefill if it's available since
     # it is faster than FA2.
-    return (flashinfer_available and not envs.VLLM_USE_CUDNN_PREFILL
+    return (not envs.VLLM_DISABLE_FLASHINFER_PREFILL and flashinfer_available
+            and not envs.VLLM_USE_CUDNN_PREFILL
             and current_platform.is_device_capability(100))
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment