diff --git a/nemo_reinforcer/distributed/virtual_cluster.py b/nemo_reinforcer/distributed/virtual_cluster.py index 8b6600353c..1213d8d897 100644 --- a/nemo_reinforcer/distributed/virtual_cluster.py +++ b/nemo_reinforcer/distributed/virtual_cluster.py @@ -160,7 +160,8 @@ def __init__( self._init_placement_groups(placement_group_strategy) # Reaching here means we were successful break - except ResourceInsufficientError: + except ResourceInsufficientError as e: + print(e) print( f"Retrying placement group creation... {i + 1}/{max_retries}. Next retry in {2**i} seconds." )