Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
Menu
Open sidebar
OpenDAS
vllm_cscc
Commits
7c3f88b2
Unverified
Commit
7c3f88b2
authored
Mar 30, 2026
by
Thomas Parnell
Committed by
GitHub
Mar 30, 2026
Browse files
[Bugfix] Remove false-positive format mismatch warnings in FLA ops (#38255)
Signed-off-by:
Thomas Parnell
<
tpa@zurich.ibm.com
>
parent
6557f493
Changes
2
Show whitespace changes
Inline
Side-by-side
Showing
2 changed files
with
0 additions
and
17 deletions
+0
-17
vllm/model_executor/layers/fla/ops/chunk.py
vllm/model_executor/layers/fla/ops/chunk.py
+0
-8
vllm/model_executor/layers/fla/ops/cumsum.py
vllm/model_executor/layers/fla/ops/cumsum.py
+0
-9
No files found.
vllm/model_executor/layers/fla/ops/chunk.py
View file @
7c3f88b2
...
...
@@ -7,7 +7,6 @@
# the following copyright notice:
# Copyright (c) 2023-2025, Songlin Yang, Yu Zhang
# ruff: noqa: E501
import
warnings
import
torch
...
...
@@ -184,13 +183,6 @@ def chunk_gated_delta_rule(
"ChunkGatedDeltaRuleFunction does not support float32. Please use bfloat16."
)
assert
len
(
beta
.
shape
)
==
3
,
"beta must be of shape [B, T, H]."
if
q
.
shape
[
1
]
<
q
.
shape
[
2
]:
warnings
.
warn
(
f
"Input tensor shape suggests potential format mismatch: seq_len (
{
q
.
shape
[
1
]
}
) < num_heads (
{
q
.
shape
[
2
]
}
). "
"This may indicate the inputs were passed in head-first format [B, H, T, ...] "
"Please verify your input tensor format matches the expected shape [B, T, H, ...]."
,
stacklevel
=
2
,
)
if
cu_seqlens
is
not
None
:
if
q
.
shape
[
0
]
!=
1
:
raise
ValueError
(
...
...
vllm/model_executor/layers/fla/ops/cumsum.py
View file @
7c3f88b2
...
...
@@ -7,7 +7,6 @@
# the following copyright notice:
# Copyright (c) 2023-2025, Songlin Yang, Yu Zhang
# ruff: noqa: E501
import
warnings
import
torch
...
...
@@ -252,14 +251,6 @@ def chunk_local_cumsum(
output_dtype
:
torch
.
dtype
|
None
=
torch
.
float
,
**
kwargs
,
)
->
torch
.
Tensor
:
if
not
head_first
and
g
.
shape
[
1
]
<
g
.
shape
[
2
]:
warnings
.
warn
(
f
"Input tensor shape suggests potential format mismatch: seq_len (
{
g
.
shape
[
1
]
}
) < num_heads (
{
g
.
shape
[
2
]
}
). "
"This may indicate the inputs were passed in head-first format [B, H, T, ...] "
"when head_first=False was specified. "
"Please verify your input tensor format matches the expected shape [B, T, H, ...]."
,
stacklevel
=
2
,
)
if
cu_seqlens
is
not
None
:
assert
g
.
shape
[
0
]
==
1
,
(
"Only batch size 1 is supported when cu_seqlens are provided"
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment