wookayin · Stonesjtu · Nov 10, 2018 · wookayin · Nov 10, 2018 · Stonesjtu
diff --git a/gpustat/__main__.py b/gpustat/__main__.py
@@ -11,12 +11,16 @@
 from .core import GPUStatCollection
 
 
-def print_gpustat(json=False, debug=False, **kwargs):
+def print_gpustat(json=False, debug=False, gpu_stat=None, **kwargs):
     '''
     Display the GPU query results into standard output.
     '''
+
     try:
-        gpu_stats = GPUStatCollection.new_query()
+        if gpu_stat is None:
+            gpu_stat = GPUStatCollection()
+        else:
+            gpu_stat.update()
     except Exception as e:
         sys.stderr.write('Error on querying NVIDIA devices.'
                          ' Use --debug flag for details\n')
@@ -32,9 +36,10 @@ def print_gpustat(json=False, debug=False, **kwargs):
         sys.exit(1)
 
     if json:
-        gpu_stats.print_json(sys.stdout)
+        gpu_stat.print_json(sys.stdout)
     else:
-        gpu_stats.print_formatted(sys.stdout, **kwargs)
+        gpu_stat.print_formatted(sys.stdout, **kwargs)
+    return gpu_stat
 
 
 def main(*argv):
@@ -88,6 +93,8 @@ def main(*argv):
     )
     args = parser.parse_args(argv[1:])
 
+    cached_stat = None
+
     if args.interval is None:  # with default value
         args.interval = 1.0
     if args.interval > 0:
@@ -102,7 +109,7 @@ def main(*argv):
                 try:
                     query_start = time.time()
                     with term.location(0, 0):
-                        print_gpustat(eol_char=term.clear_eol + '\n', **vars(args))  # noqa
+                        cached_stat = print_gpustat(gpu_stat=cached_stat, eol_char=term.clear_eol + '\n', **vars(args))  # noqa
                         print(term.clear_eos, end='')
                     query_duration = time.time() - query_start
                     sleep_duration = args.interval - query_duration
@@ -111,7 +118,7 @@ def main(*argv):
                 except KeyboardInterrupt:
                     exit(0)
     else:
-        print_gpustat(**vars(args))
+        print_gpustat(gpu_stat=cached_stat, **vars(args))
 
 
 if __name__ == '__main__':

diff --git a/gpustat/core.py b/gpustat/core.py
@@ -250,19 +250,38 @@ def jsonify(self):
 
 class GPUStatCollection(object):
 
-    def __init__(self, gpu_list):
+    def __init__(self, gpu_list=None):
+        """gpu_list is kept only for compatibility with existing callers;
+        update() below overwrites self.gpus with freshly queried data."""
         self.gpus = gpu_list
 
-        # attach additional system information
-        self.hostname = platform.node()
+        N.nvmlInit()
+        device_count = N.nvmlDeviceGetCount()
+        self.handles = [N.nvmlDeviceGetHandleByIndex(idx)
+                        for idx in range(device_count)]
+
+        self.update()
+
+    def __del__(self):
+        # Garbage collection may run late, so this is only a best-effort
+        # attempt to release NVML; any failure is deliberately ignored.
+        try:
+            N.nvmlShutdown()
+        except Exception:
+            pass
+
+    def update(self):
+        self._update_host()  # refresh query_time and hostname
+        self._update_gpu()  # rebuild self.gpus from the cached NVML handles
+
+    def _update_host(self):
+        """Refresh the query timestamp and the host name."""
         self.query_time = datetime.now()
+        self.hostname = platform.node()
 
-    @staticmethod
-    def new_query():
+    def _update_gpu(self):
         """Query the information of all the GPUs on local machine"""
 
-        N.nvmlInit()
-
         def get_gpu_info(handle):
             """Get one GPU information specified by nvml handle"""
 
@@ -365,17 +384,12 @@ def _decode(b):
             return gpu_info
 
         # 1. get the list of gpu and status
-        gpu_list = []
-        device_count = N.nvmlDeviceGetCount()
+        self.gpus = []
 
-        for index in range(device_count):
-            handle = N.nvmlDeviceGetHandleByIndex(index)
+        for handle in self.handles:
             gpu_info = get_gpu_info(handle)
             gpu_stat = GPUStat(gpu_info)
-            gpu_list.append(gpu_stat)
-
-        N.nvmlShutdown()
-        return GPUStatCollection(gpu_list)
+            self.gpus.append(gpu_stat)
 
     def __len__(self):
         return len(self.gpus)
@@ -471,7 +485,7 @@ def date_handler(obj):
 
 def new_query():
     '''
-    Obtain a new GPUStatCollection instance by querying nvidia-smi
+    Obtain a new GPUStatCollection instance by querying NVML
     to get the list of GPUs and running process information.
     '''
-    return GPUStatCollection.new_query()
+    return GPUStatCollection()