diff --git a/python/sglang/srt/models/qwen3_moe.py b/python/sglang/srt/models/qwen3_moe.py index 21412a161e40..dd9598c36fdb 100644 --- a/python/sglang/srt/models/qwen3_moe.py +++ b/python/sglang/srt/models/qwen3_moe.py @@ -335,6 +335,7 @@ def forward_normal( if ( self.ep_size > 1 and not should_allreduce_fusion + and not use_reduce_scatter and not should_use_dp_reduce_scatterv() ): final_hidden_states = moe_expert_parallel_all_reduce(final_hidden_states)