Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
Menu
Open sidebar
OpenDAS
vllm_cscc
Commits
90bbe0a5
Unverified
Commit
90bbe0a5
authored
Aug 19, 2025
by
Wentao Ye
Committed by
GitHub
Aug 18, 2025
Browse files
[Log] Warning Once for Cutlass MLA (#23137)
Signed-off-by:
yewentao256
<
zhyanwentao@126.com
>
parent
e75f3422
Changes
1
Hide whitespace changes
Inline
Side-by-side
Showing
1 changed file
with
3 additions
and
3 deletions
+3
-3
vllm/v1/attention/backends/mla/cutlass_mla.py
vllm/v1/attention/backends/mla/cutlass_mla.py
+3
-3
No files found.
vllm/v1/attention/backends/mla/cutlass_mla.py
View file @
90bbe0a5
...
...
@@ -115,7 +115,7 @@ class CutlassMLAImpl(MLACommonImpl[MLACommonMetadata]):
self
.
_use_old_cutlass_mla
=
False
force_old_cutlass
=
os
.
environ
.
get
(
"FORCE_OLD_CUTLASS_MLA"
,
None
)
if
force_old_cutlass
:
logger
.
warning
(
"Forcing old cutlass mla kernel"
)
logger
.
warning
_once
(
"Forcing old cutlass mla kernel"
)
self
.
_use_old_cutlass_mla
=
True
# TODO: Currently, num_kv_splits is limited to 16 to avoid hanging
...
...
@@ -123,8 +123,8 @@ class CutlassMLAImpl(MLACommonImpl[MLACommonMetadata]):
# FORCE_NUM_KV_SPLITS=1
force_num_kv_splits
=
os
.
environ
.
get
(
"FORCE_NUM_KV_SPLITS"
,
None
)
if
force_num_kv_splits
:
logger
.
warning
(
"Forcing num_kv_splits to %d"
,
int
(
force_num_kv_splits
))
logger
.
warning
_once
(
"Forcing num_kv_splits to %d"
,
int
(
force_num_kv_splits
))
self
.
_num_kv_splits
=
int
(
force_num_kv_splits
)
else
:
self
.
_num_kv_splits
=
-
1
# => Auto-detect
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment