mirror of
https://github.com/clearml/clearml-agent
synced 2025-06-26 18:16:15 +00:00
Print error on resource monitor failure
This commit is contained in:
parent
307ec9213e
commit
b6ca0fa6a5
@ -139,6 +139,7 @@ class ResourceMonitor(object):
|
|||||||
def _daemon(self):
|
def _daemon(self):
|
||||||
seconds_since_started = 0
|
seconds_since_started = 0
|
||||||
reported = 0
|
reported = 0
|
||||||
|
try:
|
||||||
while True:
|
while True:
|
||||||
last_report = time()
|
last_report = time()
|
||||||
current_report_frequency = (
|
current_report_frequency = (
|
||||||
@ -175,6 +176,8 @@ class ResourceMonitor(object):
|
|||||||
|
|
||||||
# count reported iterations
|
# count reported iterations
|
||||||
reported += 1
|
reported += 1
|
||||||
|
except Exception as ex:
|
||||||
|
log.exception("Error reporting monitoring info: %s", str(ex))
|
||||||
|
|
||||||
def _update_readouts(self):
|
def _update_readouts(self):
|
||||||
readouts = self._machine_stats()
|
readouts = self._machine_stats()
|
||||||
|
Loading…
Reference in New Issue
Block a user