diff --git a/python/sglang/srt/models/qwen3.py b/python/sglang/srt/models/qwen3.py index f424052d1430..7e557a8d5b31 100644 --- a/python/sglang/srt/models/qwen3.py +++ b/python/sglang/srt/models/qwen3.py @@ -198,7 +198,9 @@ def forward_prepare_npu(self, positions, hidden_states, forward_batch): ) return q, k, v - def forward_prepare_aiter_fused_mrope(self, positions, hidden_states, forward_batch): + def forward_prepare_aiter_fused_mrope( + self, positions, hidden_states, forward_batch + ): """Fused QK-norm + 3D mRoPE + KV cache write for decode (ROCm/aiter). The fused HIP kernel replaces split → QK norm → mRoPE → cache write,