@@ -212,7 +212,7 @@ def collect_result(self, session):
212
212
for worker , (submission_id , submission_name ) in zip (workers ,
213
213
submissions ):
214
214
dt = worker .time_since_last_status_check ()
215
- if dt is not None and dt < self .time_between_collection :
215
+ if ( dt is not None ) and ( dt < self .time_between_collection ) :
216
216
self ._processing_worker_queue .put_nowait (
217
217
(worker , (submission_id , submission_name )))
218
218
time .sleep (0 )
@@ -231,20 +231,24 @@ def collect_result(self, session):
231
231
else :
232
232
self ._logger .info (f'Collecting results from worker { worker } ' )
233
233
returncode , stderr = worker .collect_results ()
234
+
234
235
if returncode :
235
236
if returncode == 124 :
236
237
self ._logger .info (
237
238
f'Worker { worker } killed due to timeout.'
238
239
)
240
+ submission_status = 'checking_error'
241
+ elif returncode == 2 :
242
+ # Error occurred when downloading the logs
243
+ submission_status = 'checking_error'
239
244
else :
240
245
self ._logger .info (
241
246
f'Worker { worker } killed due to an error '
242
247
f'during training: { stderr } '
243
248
)
244
- submission_status = 'training_error'
249
+ submission_status = 'training_error'
245
250
else :
246
251
submission_status = 'tested'
247
-
248
252
set_submission_state (
249
253
session , submission_id , submission_status
250
254
)
0 commit comments