Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
Menu
Open sidebar
OpenDAS
vllm_cscc
Commits
853a8eb5
Unverified
Commit 853a8eb5 authored Nov 02, 2025 by Cyrus Leung
Committed by GitHub Nov 02, 2025
Browse files
[Bugfix] Fix Qwen Omni audio inference (#27920)
Signed-off-by: DarkLight1337 <tlleungac@connect.ust.hk>
parent
758ea2e9
Changes
2
Show whitespace changes
Inline
Side-by-side
Showing 2 changed files with 2 additions and 10 deletions
+2
-10
vllm/model_executor/models/qwen2_5_omni_thinker.py
vllm/model_executor/models/qwen2_5_omni_thinker.py
+2
-7
vllm/model_executor/models/qwen3_omni_moe_thinker.py
vllm/model_executor/models/qwen3_omni_moe_thinker.py
+0
-3
No files found.
vllm/model_executor/models/qwen2_5_omni_thinker.py
View file @
853a8eb5
...
...
@@ -130,6 +130,8 @@ class Qwen2_5OmniAudioFeatureInputs(TensorSchema):
        TensorShape("nmb", "tsl", dynamic_dims={"tsl"}),
    ]
    audio_feature_lengths: Annotated[torch.Tensor, TensorShape("na")]
    feature_attention_mask: Annotated[
        torch.Tensor | list[torch.Tensor],
        TensorShape("na", "msl", dynamic_dims={"msl"}),
...
...
@@ -732,13 +734,6 @@ class Qwen2_5OmniConditionalGenerationMixin:
        input_features = audio_input["input_features"]
        audio_feature_lengths = audio_input["audio_feature_lengths"]
        if audio_feature_lengths.shape[0] == 1:
            audio_feature_lengths = audio_feature_lengths.squeeze(0)
        elif audio_feature_lengths.shape[1] == 1:
            audio_feature_lengths = audio_feature_lengths.squeeze(1)
        else:
            raise AssertionError(audio_feature_lengths.shape)
        audio_feat_lengths, audio_output_lengths = (
            self.audio_tower._get_feat_extract_output_lengths(audio_feature_lengths)
        )
...
...
vllm/model_executor/models/qwen3_omni_moe_thinker.py
View file @
853a8eb5
...
...
@@ -99,7 +99,6 @@ from .utils import (
    AutoWeightsLoader,
    WeightsMapper,
    _merge_multimodal_embeddings,
    flatten_bn,
    maybe_prefix,
)
from .vision import (
...
...
@@ -1065,8 +1064,6 @@ class Qwen3OmniMoeConditionalGenerationMixin(Qwen2_5OmniConditionalGenerationMix
        input_features = audio_input["input_features"]
        audio_feature_lengths = audio_input["audio_feature_lengths"]
        audio_feature_lengths = flatten_bn(audio_feature_lengths, concat=True)
        audio_feat_lengths, audio_output_lengths = _get_feat_extract_output_lengths(
            audio_feature_lengths
        )
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment