We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 3790505, commit c870be6. Copy full SHA for c870be6
tests/layers/test_moba_attention.py
@@ -359,7 +359,7 @@ def test_server(self):
359
model=model_path,
360
tensor_parallel_size=2,
361
max_model_len=131072,
362
- engine_worker_queue_port=8793,
+ engine_worker_queue_port=int(os.getenv("FD_ENGINE_QUEUE_PORT")),
363
max_num_seqs=32,
364
quantization="wint4",
365
enable_chunked_prefill=True,
0 commit comments