mirror of
https://github.com/clearml/clearml
synced 2025-06-26 18:16:07 +00:00
Initial beta version
This commit is contained in:
48
trains/backend_interface/task/development/stop_signal.py
Normal file
48
trains/backend_interface/task/development/stop_signal.py
Normal file
@@ -0,0 +1,48 @@
|
||||
from ....config import config
|
||||
from ....backend_interface import Task, TaskStatusEnum
|
||||
|
||||
|
||||
class TaskStopReason(object):
|
||||
stopped = "stopped"
|
||||
reset = "reset"
|
||||
status_changed = "status_changed"
|
||||
|
||||
|
||||
class TaskStopSignal(object):
|
||||
enabled = bool(config.get('development.support_stopping', False))
|
||||
|
||||
_number_of_consecutive_reset_tests = 4
|
||||
|
||||
_unexpected_statuses = (
|
||||
TaskStatusEnum.closed,
|
||||
TaskStatusEnum.stopped,
|
||||
TaskStatusEnum.failed,
|
||||
TaskStatusEnum.published,
|
||||
)
|
||||
|
||||
def __init__(self, task):
|
||||
assert isinstance(task, Task)
|
||||
self.task = task
|
||||
self._task_reset_state_counter = 0
|
||||
|
||||
def test(self):
|
||||
status = self.task.status
|
||||
message = self.task.data.status_message
|
||||
|
||||
if status == TaskStatusEnum.in_progress and "stopping" in message:
|
||||
return TaskStopReason.stopped
|
||||
|
||||
if status in self._unexpected_statuses and "worker" not in message:
|
||||
return TaskStopReason.status_changed
|
||||
|
||||
if status == TaskStatusEnum.created:
|
||||
self._task_reset_state_counter += 1
|
||||
|
||||
if self._task_reset_state_counter >= self._number_of_consecutive_reset_tests:
|
||||
return TaskStopReason.reset
|
||||
|
||||
self.task.get_logger().warning(
|
||||
"Task {} was reset! if state is consistent we shall terminate.".format(self.task.id),
|
||||
)
|
||||
else:
|
||||
self._task_reset_state_counter = 0
|
||||
26
trains/backend_interface/task/development/worker.py
Normal file
26
trains/backend_interface/task/development/worker.py
Normal file
@@ -0,0 +1,26 @@
|
||||
from socket import gethostname
|
||||
|
||||
import attr
|
||||
|
||||
from ....config import config, running_remotely, dev_worker_name
|
||||
|
||||
|
||||
@attr.s
|
||||
class DevWorker(object):
|
||||
prefix = attr.ib(type=str, default="MANUAL:")
|
||||
|
||||
report_period = float(config.get('development.worker.report_period_sec', 30.))
|
||||
report_stdout = bool(config.get('development.worker.log_stdout', True))
|
||||
|
||||
@classmethod
|
||||
def is_enabled(cls, model_updated=False):
|
||||
return False
|
||||
|
||||
def status_report(self, timestamp=None):
|
||||
return True
|
||||
|
||||
def register(self):
|
||||
return True
|
||||
|
||||
def unregister(self):
|
||||
return True
|
||||
Reference in New Issue
Block a user