mirror of
https://github.com/clearml/clearml
synced 2025-02-24 21:23:55 +00:00
Fix issue with A100 GPU monitoring
Some checks failed
CodeQL / Analyze (python) (push) Has been cancelled
Some checks failed
CodeQL / Analyze (python) (push) Has been cancelled
This commit is contained in:
parent
c46f254839
commit
342e1b35f8
@@ -486,7 +486,8 @@ class ResourceMonitor(BackgroundMonitor):
|
|||||||
# only monitor the active gpu's, if none were selected, monitor everything
|
# only monitor the active gpu's, if none were selected, monitor everything
|
||||||
if self._skip_nonactive_gpu(g):
|
if self._skip_nonactive_gpu(g):
|
||||||
continue
|
continue
|
||||||
stats["gpu_%d_temperature" % i] = float(g["temperature.gpu"])
|
if g["temperature.gpu"] is not None:
|
||||||
|
stats["gpu_%d_temperature" % i] = float(g["temperature.gpu"])
|
||||||
if g["utilization.gpu"] is not None:
|
if g["utilization.gpu"] is not None:
|
||||||
stats["gpu_%d_utilization" % i] = float(g["utilization.gpu"])
|
stats["gpu_%d_utilization" % i] = float(g["utilization.gpu"])
|
||||||
else:
|
else:
|
||||||
|
Loading…
Reference in New Issue
Block a user