Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
Menu
Open sidebar
OpenDAS
vllm_cscc
Commits
8ece6076
Unverified
Commit
8ece6076
authored
Jan 30, 2026
by
Nicolò Lucchesi
Committed by
GitHub
Jan 30, 2026
Browse files
[CI] Qwen3-ASR transcriptios tests (#33414)
Signed-off-by:
NickLucche
<
nlucches@redhat.com
>
parent
fd0e3772
Changes
1
Hide whitespace changes
Inline
Side-by-side
Showing
1 changed file
with
9 additions
and
5 deletions
+9
-5
tests/entrypoints/openai/test_transcription_validation.py
tests/entrypoints/openai/test_transcription_validation.py
+9
-5
No files found.
tests/entrypoints/openai/test_transcription_validation.py
View file @
8ece6076
...
...
@@ -20,7 +20,9 @@ MISTRAL_FORMAT_ARGS = [
@
pytest
.
mark
.
asyncio
@
pytest
.
mark
.
parametrize
(
"model_name"
,
[
"mistralai/Voxtral-Mini-3B-2507"
])
@
pytest
.
mark
.
parametrize
(
"model_name"
,
[
"mistralai/Voxtral-Mini-3B-2507"
,
"Qwen/Qwen3-ASR-0.6B"
]
)
async
def
test_basic_audio
(
mary_had_lamb
,
model_name
,
rocm_aiter_fa_attention
):
server_args
=
[
"--enforce-eager"
]
...
...
@@ -42,7 +44,7 @@ async def test_basic_audio(mary_had_lamb, model_name, rocm_aiter_fa_attention):
out
=
json
.
loads
(
transcription
)
out_text
=
out
[
"text"
]
out_usage
=
out
[
"usage"
]
assert
"Mary had a little lamb
,
"
in
out_text
assert
"Mary had a little lamb"
in
out_text
assert
out_usage
[
"seconds"
]
==
16
,
out_usage
[
"seconds"
]
...
...
@@ -89,10 +91,12 @@ async def test_basic_audio_with_lora(mary_had_lamb, rocm_aiter_fa_attention):
@
pytest
.
mark
.
asyncio
async
def
test_basic_audio_gemma
(
foscolo
,
rocm_aiter_fa_attention
):
@
pytest
.
mark
.
parametrize
(
"model_name"
,
[
"google/gemma-3n-E2B-it"
,
"Qwen/Qwen3-ASR-0.6B"
]
)
async
def
test_basic_audio_foscolo
(
foscolo
,
rocm_aiter_fa_attention
,
model_name
):
# Gemma accuracy on some of the audio samples we use is particularly bad,
# hence we use a different one here. WER is evaluated separately.
model_name
=
"google/gemma-3n-E2B-it"
server_args
=
[
"--enforce-eager"
]
add_attention_backend
(
server_args
,
rocm_aiter_fa_attention
)
...
...
@@ -109,4 +113,4 @@ async def test_basic_audio_gemma(foscolo, rocm_aiter_fa_attention):
temperature
=
0.0
,
)
out
=
json
.
loads
(
transcription
)[
"text"
]
assert
"
da cui vergine nacque Vener
e"
in
out
assert
"
ove il mio corpo fanciulletto giacqu
e"
in
out
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment