diff --git a/tests/entrypoints/openai/test_realtime_validation.py b/tests/entrypoints/openai/test_realtime_validation.py index 273a034e1773..9a45ac293ef3 100644 --- a/tests/entrypoints/openai/test_realtime_validation.py +++ b/tests/entrypoints/openai/test_realtime_validation.py @@ -13,7 +13,7 @@ from vllm.assets.audio import AudioAsset -from ...utils import RemoteOpenAIServer +from ...utils import ROCM_ENV_OVERRIDES, ROCM_EXTRA_ARGS, RemoteOpenAIServer from .conftest import add_attention_backend MISTRAL_FORMAT_ARGS = [ @@ -23,7 +23,7 @@ "mistral", "--load_format", "mistral", -] +] + ROCM_EXTRA_ARGS MODEL_NAME = "mistralai/Voxtral-Mini-4B-Realtime-2602" @@ -77,7 +77,9 @@ async def test_multi_chunk_streaming( add_attention_backend(server_args, rocm_aiter_fa_attention) - with RemoteOpenAIServer(model_name, server_args) as remote_server: + with RemoteOpenAIServer( + model_name, server_args, env_dict=ROCM_ENV_OVERRIDES + ) as remote_server: ws_url = _get_websocket_url(remote_server) async with websockets.connect(ws_url) as ws: # Receive session.created @@ -178,7 +180,9 @@ async def test_empty_commit_does_not_crash_engine( add_attention_backend(server_args, rocm_aiter_fa_attention) - with RemoteOpenAIServer(model_name, server_args) as remote_server: + with RemoteOpenAIServer( + model_name, server_args, env_dict=ROCM_ENV_OVERRIDES + ) as remote_server: ws_url = _get_websocket_url(remote_server) # --- First connection: empty commit (no audio appended) ----------