diff --git a/vllm_omni/entrypoints/omni.py b/vllm_omni/entrypoints/omni.py index dc18978f96..59be966c33 100644 --- a/vllm_omni/entrypoints/omni.py +++ b/vllm_omni/entrypoints/omni.py @@ -371,9 +371,13 @@ def _start_stages(self, model: str) -> None: # Allocate endpoints for each stage total_stages = len(self.stage_configs) self._handshake_endpoints = {} + + # If --stage-id is not set, use local_only mode + local_only = self._single_stage_id is None + for sid in range(total_stages): - in_endpoint = get_engine_client_zmq_addr(local_only=False, host=self._zmq_master_address) - out_endpoint = get_engine_client_zmq_addr(local_only=False, host=self._zmq_master_address) + in_endpoint = get_engine_client_zmq_addr(local_only=local_only, host=self._zmq_master_address) + out_endpoint = get_engine_client_zmq_addr(local_only=local_only, host=self._zmq_master_address) self._handshake_endpoints[sid] = (in_endpoint, out_endpoint) logger.debug( f"[{self._name}] Allocated endpoints for stage-{sid}: in={in_endpoint}, out={out_endpoint}"