Unverified commit 58928475, authored by Andreas Karatzas and committed by GitHub
Browse files

[ROCm][CI] Making entrypoints more deterministic on ROCm (#36293)

parent 1a971808
...@@ -13,7 +13,7 @@ import websockets ...@@ -13,7 +13,7 @@ import websockets
from vllm.assets.audio import AudioAsset from vllm.assets.audio import AudioAsset
from ...utils import RemoteOpenAIServer from ...utils import ROCM_ENV_OVERRIDES, ROCM_EXTRA_ARGS, RemoteOpenAIServer
from .conftest import add_attention_backend from .conftest import add_attention_backend
MISTRAL_FORMAT_ARGS = [ MISTRAL_FORMAT_ARGS = [
...@@ -23,7 +23,7 @@ MISTRAL_FORMAT_ARGS = [ ...@@ -23,7 +23,7 @@ MISTRAL_FORMAT_ARGS = [
"mistral", "mistral",
"--load_format", "--load_format",
"mistral", "mistral",
] ] + ROCM_EXTRA_ARGS
MODEL_NAME = "mistralai/Voxtral-Mini-4B-Realtime-2602" MODEL_NAME = "mistralai/Voxtral-Mini-4B-Realtime-2602"
...@@ -77,7 +77,9 @@ async def test_multi_chunk_streaming( ...@@ -77,7 +77,9 @@ async def test_multi_chunk_streaming(
add_attention_backend(server_args, rocm_aiter_fa_attention) add_attention_backend(server_args, rocm_aiter_fa_attention)
with RemoteOpenAIServer(model_name, server_args) as remote_server: with RemoteOpenAIServer(
model_name, server_args, env_dict=ROCM_ENV_OVERRIDES
) as remote_server:
ws_url = _get_websocket_url(remote_server) ws_url = _get_websocket_url(remote_server)
async with websockets.connect(ws_url) as ws: async with websockets.connect(ws_url) as ws:
# Receive session.created # Receive session.created
...@@ -178,7 +180,9 @@ async def test_empty_commit_does_not_crash_engine( ...@@ -178,7 +180,9 @@ async def test_empty_commit_does_not_crash_engine(
add_attention_backend(server_args, rocm_aiter_fa_attention) add_attention_backend(server_args, rocm_aiter_fa_attention)
with RemoteOpenAIServer(model_name, server_args) as remote_server: with RemoteOpenAIServer(
model_name, server_args, env_dict=ROCM_ENV_OVERRIDES
) as remote_server:
ws_url = _get_websocket_url(remote_server) ws_url = _get_websocket_url(remote_server)
# --- First connection: empty commit (no audio appended) ---------- # --- First connection: empty commit (no audio appended) ----------
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment