Skip to content
Merged
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
10 changes: 6 additions & 4 deletions components/src/dynamo/sglang/args.py
Original file line number Diff line number Diff line change
Expand Up @@ -369,10 +369,12 @@ async def parse_args(args: list[str]) -> Config:
server_args = ServerArgs.from_cli_args(parsed_args)

# Dynamo's streaming handlers expect disjoint output_ids from SGLang (only new
# tokens since last output), not cumulative tokens. When stream_output=True,
# SGLang sends disjoint segments which Dynamo passes through directly.
# Force stream_output=True for optimal streaming performance.
server_args.stream_output = True
# tokens since last output), not cumulative tokens.
# SGLang renamed stream_output -> incremental_streaming_output in PR #20614.
if hasattr(ServerArgs, "incremental_streaming_output"):
server_args.incremental_streaming_output = True
else:
server_args.stream_output = True

if dynamo_config.use_sglang_tokenizer:
warnings.warn(
Expand Down
Loading