Skip to content
Snippets Groups Projects
Commit ae970baa authored by Daniel CARRON, committed by André Anjos
Browse files

Added units to resources monitoring

parent 84c3a5f7
No related branches found
No related tags found
1 merge request: !6 "Making use of LightningDataModule and simplification of data loading"
...@@ -100,7 +100,7 @@ def gpu_constants(): ...@@ -100,7 +100,7 @@ def gpu_constants():
""" """
return run_nvidia_smi( return run_nvidia_smi(
("gpu_name", "driver_version", "memory.total"), ("gpu_name", "driver_version", "memory.total"),
("gpu_name", "gpu_driver_version", "gpu_memory_total"), ("gpu_name", "gpu_driver_version", "gpu_memory_total_GB"),
) )
...@@ -135,10 +135,10 @@ def gpu_log(): ...@@ -135,10 +135,10 @@ def gpu_log():
"utilization.gpu", "utilization.gpu",
), ),
( (
"gpu_memory_total", "gpu_memory_total_GB",
"gpu_memory_used", "gpu_memory_used_GB",
"gpu_memory_free", "gpu_memory_free_percent",
"gpu_percent", "gpu_usage_percent",
), ),
) )
...@@ -165,7 +165,7 @@ def cpu_constants(): ...@@ -165,7 +165,7 @@ def cpu_constants():
1. ``cpu_count`` (:py:class:`int`): number of logical CPUs available 1. ``cpu_count`` (:py:class:`int`): number of logical CPUs available
""" """
return ( return (
("cpu_memory_total", psutil.virtual_memory().total / GB), ("cpu_memory_total_GB", psutil.virtual_memory().total / GB),
("cpu_count", psutil.cpu_count(logical=True)), ("cpu_count", psutil.cpu_count(logical=True)),
) )
...@@ -245,9 +245,9 @@ class CPULogger: ...@@ -245,9 +245,9 @@ class CPULogger:
# at this point, but ensures to update counts later on # at this point, but ensures to update counts later on
gone.add(k) gone.add(k)
return ( return (
("cpu_memory_used", psutil.virtual_memory().used / GB), ("cpu_memory_used_GB", psutil.virtual_memory().used / GB),
("cpu_rss", sum([k.rss for k in memory_info]) / GB), ("cpu_rss_GB", sum([k.rss for k in memory_info]) / GB),
("cpu_vms", sum([k.vms for k in memory_info]) / GB), ("cpu_vms_GB", sum([k.vms for k in memory_info]) / GB),
("cpu_percent", sum(cpu_percent)), ("cpu_percent", sum(cpu_percent)),
("cpu_processes", len(self.cluster) - len(gone)), ("cpu_processes", len(self.cluster) - len(gone)),
("cpu_open_files", sum(open_files)), ("cpu_open_files", sum(open_files)),
......
0% Loading or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment