4 changes: 2 additions & 2 deletions python/sglang/srt/managers/scheduler.py
@@ -1438,7 +1438,7 @@ def get_next_batch_to_run(self) -> Optional[ScheduleBatch]:
        if need_dp_attn_preparation and not self.spec_algorithm.is_none():
            # In speculative decoding, prefill batches and decode batches cannot be processed in the same DP attention group.
            # We prepare idle batches in advance to skip preparing decode batches when there are prefill batches in the group.
-           new_batch, _ = self.prepare_dp_attn_batch(new_batch)
+           new_batch, _ = self.prepare_mlp_sync_batch(new_batch)
Contributor review comment (severity: medium):
This change replaces prepare_dp_attn_batch with prepare_mlp_sync_batch. Ensure that prepare_mlp_sync_batch covers all of the logic previously handled by prepare_dp_attn_batch, so the substitution does not regress DP attention preparation. Please confirm it is functionally equivalent (or an improvement) in the context of speculative decoding and MLP synchronization.

Suggested change:
-           new_batch, _ = self.prepare_mlp_sync_batch(new_batch)
+           new_batch, _ = self.prepare_mlp_sync_batch(new_batch)  # Ensure this function correctly handles DP attention preparation
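If the rename is purely mechanical, one way to address this concern is to keep the old entry point as a deprecated alias that forwards to the new method, which makes the intended equivalence explicit and protects any external callers. A minimal sketch, assuming prepare_mlp_sync_batch fully subsumes the old DP attention preparation; the shim itself is hypothetical and not part of this PR:

import warnings

class Scheduler:
    ...

    def prepare_dp_attn_batch(self, new_batch):
        # Hypothetical compatibility shim (not in this PR): forward the old
        # entry point to the new one so both names stay behaviorally identical.
        warnings.warn(
            "prepare_dp_attn_batch is deprecated; use prepare_mlp_sync_batch",
            DeprecationWarning,
            stacklevel=2,
        )
        return self.prepare_mlp_sync_batch(new_batch)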

        need_dp_attn_preparation = new_batch is None

        if new_batch is not None:
@@ -1454,7 +1454,7 @@ def get_next_batch_to_run(self) -> Optional[ScheduleBatch]:

        # Handle DP attention
        if need_dp_attn_preparation:
-           ret, _ = self.prepare_dp_attn_batch(ret)
+           ret, _ = self.prepare_mlp_sync_batch(ret)
Contributor review comment (severity: medium):

As in the previous comment, this change replaces prepare_dp_attn_batch with prepare_mlp_sync_batch. Verify that prepare_mlp_sync_batch correctly handles DP attention in this context as well.

Suggested change:
-           ret, _ = self.prepare_mlp_sync_batch(ret)
+           ret, _ = self.prepare_mlp_sync_batch(ret)  # Ensure this function correctly handles DP attention
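One lightweight way to verify the routing (rather than re-testing the full DP attention behavior) is to spy on the new method and assert that get_next_batch_to_run reaches it on the DP attention path. A sketch only: make_test_scheduler and its enable_dp_attention flag are hypothetical stand-ins for however the test suite constructs a scheduler.

from unittest.mock import patch

def test_dp_attn_path_uses_mlp_sync_batch():
    scheduler = make_test_scheduler(enable_dp_attention=True)  # hypothetical helper
    with patch.object(
        scheduler, "prepare_mlp_sync_batch", wraps=scheduler.prepare_mlp_sync_batch
    ) as spy:
        scheduler.get_next_batch_to_run()
    # With DP attention enabled, preparation should go through the new entry point.
    spy.assert_called()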


        return ret
