From b5b859363d8548505e27ff2ea523a6c542b3d13c Mon Sep 17 00:00:00 2001 From: fzyzcjy Date: Mon, 8 Dec 2025 22:09:08 +0800 Subject: [PATCH] Add data_parallel_rank to OpenAI completion and chat completion requests --- python/sglang/srt/entrypoints/openai/protocol.py | 6 ++++++ python/sglang/srt/entrypoints/openai/serving_chat.py | 1 + python/sglang/srt/entrypoints/openai/serving_completions.py | 1 + 3 files changed, 8 insertions(+) diff --git a/python/sglang/srt/entrypoints/openai/protocol.py b/python/sglang/srt/entrypoints/openai/protocol.py index 7f490e95cbaa..5e7d91878ba7 100644 --- a/python/sglang/srt/entrypoints/openai/protocol.py +++ b/python/sglang/srt/entrypoints/openai/protocol.py @@ -257,6 +257,9 @@ class CompletionRequest(BaseModel): bootstrap_port: Optional[Union[List[Optional[int]], int]] = None bootstrap_room: Optional[Union[List[int], int]] = None + # For data parallel rank routing + data_parallel_rank: Optional[int] = None + # For request id rid: Optional[Union[List[str], str]] = None # Extra key for classifying the request (e.g. cache_salt) @@ -530,6 +533,9 @@ class ChatCompletionRequest(BaseModel): bootstrap_port: Optional[Union[List[Optional[int]], int]] = None bootstrap_room: Optional[Union[List[int], int]] = None + # For data parallel rank routing + data_parallel_rank: Optional[int] = None + # OpenAI/SGLang default sampling parameters _DEFAULT_SAMPLING_PARAMS = { "temperature": 1.0, diff --git a/python/sglang/srt/entrypoints/openai/serving_chat.py b/python/sglang/srt/entrypoints/openai/serving_chat.py index 48197bd78645..05a8fe90aa02 100644 --- a/python/sglang/srt/entrypoints/openai/serving_chat.py +++ b/python/sglang/srt/entrypoints/openai/serving_chat.py @@ -210,6 +210,7 @@ def _convert_to_internal_request( bootstrap_host=request.bootstrap_host, bootstrap_port=request.bootstrap_port, bootstrap_room=request.bootstrap_room, + data_parallel_rank=request.data_parallel_rank, return_hidden_states=request.return_hidden_states, rid=request.rid, extra_key=self._compute_extra_key(request), diff --git 
a/python/sglang/srt/entrypoints/openai/serving_completions.py b/python/sglang/srt/entrypoints/openai/serving_completions.py index 67fe3c12933d..144b7d587bdd 100644 --- a/python/sglang/srt/entrypoints/openai/serving_completions.py +++ b/python/sglang/srt/entrypoints/openai/serving_completions.py @@ -116,6 +116,7 @@ def _convert_to_internal_request( bootstrap_host=request.bootstrap_host, bootstrap_port=request.bootstrap_port, bootstrap_room=request.bootstrap_room, + data_parallel_rank=request.data_parallel_rank, return_hidden_states=request.return_hidden_states, rid=request.rid, extra_key=self._compute_extra_key(request),