Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
Menu
Open sidebar
OpenDAS
vllm_cscc
Commits
58928475
Unverified
Commit
58928475
authored
Mar 06, 2026
by
Andreas Karatzas
Committed by
GitHub
Mar 06, 2026
Browse files
[ROCm][CI] Making entrypoints more deterministic on ROCm (#36293)
parent
1a971808
Changes
1
Hide whitespace changes
Inline
Side-by-side
Showing
1 changed file
with
8 additions
and
4 deletions
+8
-4
tests/entrypoints/openai/test_realtime_validation.py
tests/entrypoints/openai/test_realtime_validation.py
+8
-4
No files found.
tests/entrypoints/openai/test_realtime_validation.py
View file @
58928475
...
@@ -13,7 +13,7 @@ import websockets
...
@@ -13,7 +13,7 @@ import websockets
from
vllm.assets.audio
import
AudioAsset
from
vllm.assets.audio
import
AudioAsset
from
...utils
import
RemoteOpenAIServer
from
...utils
import
ROCM_ENV_OVERRIDES
,
ROCM_EXTRA_ARGS
,
RemoteOpenAIServer
from
.conftest
import
add_attention_backend
from
.conftest
import
add_attention_backend
MISTRAL_FORMAT_ARGS
=
[
MISTRAL_FORMAT_ARGS
=
[
...
@@ -23,7 +23,7 @@ MISTRAL_FORMAT_ARGS = [
...
@@ -23,7 +23,7 @@ MISTRAL_FORMAT_ARGS = [
"mistral"
,
"mistral"
,
"--load_format"
,
"--load_format"
,
"mistral"
,
"mistral"
,
]
]
+
ROCM_EXTRA_ARGS
MODEL_NAME
=
"mistralai/Voxtral-Mini-4B-Realtime-2602"
MODEL_NAME
=
"mistralai/Voxtral-Mini-4B-Realtime-2602"
...
@@ -77,7 +77,9 @@ async def test_multi_chunk_streaming(
...
@@ -77,7 +77,9 @@ async def test_multi_chunk_streaming(
add_attention_backend
(
server_args
,
rocm_aiter_fa_attention
)
add_attention_backend
(
server_args
,
rocm_aiter_fa_attention
)
with
RemoteOpenAIServer
(
model_name
,
server_args
)
as
remote_server
:
with
RemoteOpenAIServer
(
model_name
,
server_args
,
env_dict
=
ROCM_ENV_OVERRIDES
)
as
remote_server
:
ws_url
=
_get_websocket_url
(
remote_server
)
ws_url
=
_get_websocket_url
(
remote_server
)
async
with
websockets
.
connect
(
ws_url
)
as
ws
:
async
with
websockets
.
connect
(
ws_url
)
as
ws
:
# Receive session.created
# Receive session.created
...
@@ -178,7 +180,9 @@ async def test_empty_commit_does_not_crash_engine(
...
@@ -178,7 +180,9 @@ async def test_empty_commit_does_not_crash_engine(
add_attention_backend
(
server_args
,
rocm_aiter_fa_attention
)
add_attention_backend
(
server_args
,
rocm_aiter_fa_attention
)
with
RemoteOpenAIServer
(
model_name
,
server_args
)
as
remote_server
:
with
RemoteOpenAIServer
(
model_name
,
server_args
,
env_dict
=
ROCM_ENV_OVERRIDES
)
as
remote_server
:
ws_url
=
_get_websocket_url
(
remote_server
)
ws_url
=
_get_websocket_url
(
remote_server
)
# --- First connection: empty commit (no audio appended) ----------
# --- First connection: empty commit (no audio appended) ----------
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment