diff --git a/deepspeed/pt/deepspeed_lr_schedules.py b/deepspeed/pt/deepspeed_lr_schedules.py index 02f66a45aab4..996d41ae9088 100755 --- a/deepspeed/pt/deepspeed_lr_schedules.py +++ b/deepspeed/pt/deepspeed_lr_schedules.py @@ -679,7 +679,7 @@ def get_lr(self): if self.last_batch_iteration < 0: logger.warning( "Attempting to get learning rate from scheduler before it has started") - return 0.0 + return [0.0] gamma = self._get_gamma() return [ min_lr + (delta_lr * gamma) for min_lr,