diff --git a/deepspeed/runtime/sequence_parallel/parallel_state_sp.py b/deepspeed/runtime/sequence_parallel/parallel_state_sp.py index c16880e15d42..806a58a23ff4 100644 --- a/deepspeed/runtime/sequence_parallel/parallel_state_sp.py +++ b/deepspeed/runtime/sequence_parallel/parallel_state_sp.py @@ -88,3 +88,9 @@ def get_sequence_parallel_rank(): def get_sequence_data_parallel_rank(): """Return my rank for the sequence data parallel group.""" return dist.get_rank(group=get_sequence_data_parallel_group()) + + +# since we only have 1 additional dimension over DP, we can just alias MP with SP +get_model_parallel_rank = get_sequence_parallel_rank +get_model_parallel_world_size = get_sequence_parallel_world_size +get_model_parallel_group = get_sequence_parallel_group