mirror of
				https://github.com/clearml/clearml
				synced 2025-06-26 18:16:07 +00:00 
			
		
		
		
	Fix wait for jobs based on local/remote pool frequency
This commit is contained in:
		
							parent
							
								
									6bba270620
								
							
						
					
					
						commit
						6924f32d6c
					
				| @ -3206,7 +3206,7 @@ class PipelineDecorator(PipelineController): | ||||
|                             raise ValueError("Job was not created and is also not cached/executed") | ||||
|                         return "{}.{}".format(_node.executed, return_name) | ||||
| 
 | ||||
|                     _node.job.wait(pool_period=0.2) | ||||
|                     _node.job.wait(pool_period=1 if cls._debug_execute_step_process else 5) | ||||
|                     if _node.job.is_failed() and not _node.continue_on_fail: | ||||
|                         raise ValueError( | ||||
|                             'Pipeline step "{}", Task ID={} failed'.format(_node.name, _node.job.task_id())) | ||||
| @ -3224,9 +3224,9 @@ class PipelineDecorator(PipelineController): | ||||
|                     while True: | ||||
|                         # wait until job is completed | ||||
|                         if _node.job: | ||||
|                             _node.job.wait(pool_period=0.2) | ||||
|                             _node.job.wait(pool_period=1 if cls._debug_execute_step_process else 5) | ||||
|                         else: | ||||
|                             sleep(0.2) | ||||
|                             sleep(2) | ||||
|                             continue | ||||
|                         if _node.job.is_failed() or _node.job.is_aborted(): | ||||
|                             if cls._singleton._should_relaunch_node(_node): | ||||
| @ -3485,7 +3485,7 @@ class PipelineDecorator(PipelineController): | ||||
|                     for node in list(a_pipeline._nodes.values()): | ||||
|                         if node.executed or not node.job or node.job.is_stopped(): | ||||
|                             continue | ||||
|                         node.job.wait(pool_period=15) | ||||
|                         node.job.wait(pool_period=1 if cls._debug_execute_step_process else 5) | ||||
|                         waited = True | ||||
|                 # store the pipeline result if we have any: | ||||
|                 if return_value and pipeline_result is not None: | ||||
|  | ||||
		Loading…
	
		Reference in New Issue
	
	Block a user
	 allegroai
						allegroai