sgl-project · ByronHsu · Apr 26, 2026 · Apr 26, 2026 · gemini-code-assist · Apr 26, 2026
diff --git a/python/sglang/srt/models/qwen3_moe.py b/python/sglang/srt/models/qwen3_moe.py
@@ -335,6 +335,7 @@ def forward_normal(
         if (
             self.ep_size > 1
             and not should_allreduce_fusion
+            and not use_reduce_scatter
             and not should_use_dp_reduce_scatterv()
         ):
             final_hidden_states = moe_expert_parallel_all_reduce(final_hidden_states)