diff --git a/python/sglang/srt/model_executor/model_runner.py b/python/sglang/srt/model_executor/model_runner.py index a1614e06b86e..b424326533e8 100644 --- a/python/sglang/srt/model_executor/model_runner.py +++ b/python/sglang/srt/model_executor/model_runner.py @@ -2783,7 +2783,7 @@ def _forward_raw( if ( forward_batch.num_token_non_padded is not None and forward_batch.global_num_tokens_gpu is not None - and require_gathered_buffer + and require_gathered_buffer(self.server_args) and not is_nsa_enable_prefill_cp() ): forward_batch.adjust_num_token_non_padded_for_attn_tp(