fix bug that stuck at evaluation (#53)

* fix bug that stuck at evaluation
* remove mode variable

fix bug that stuck at evaluation (#53)
* fix bug that stuck at evaluation
* remove mode variable
b8513677 · Cao Yuhang · Kai Chen · bef7c13a · b8513677
Commit b8513677, authored Apr 15, 2019 by Cao Yuhang; committed by Kai Chen, Apr 14, 2019
Show whitespace changes
Inline Side-by-side

Showing with 12 additions and 7 deletions

mmcv/runner/hooks/logger/text.py mmcv/runner/hooks/logger/text.py +12 -7

No files found.
--- a/mmcv/runner/hooks/logger/text.py
+++ b/mmcv/runner/hooks/logger/text.py
@@ -16,6 +16,15 @@ class TextLoggerHook(LoggerHook):
        super(TextLoggerHook, self).before_run(runner)
        self.start_iter = runner.iter
+    def _get_max_memory(self, runner):
+        mem = torch.cuda.max_memory_allocated()
+        mem_mb = torch.tensor([mem / (1024 * 1024)],
+                              dtype=torch.int,
+                              device=torch.device('cuda'))
+        if runner.world_size > 1:
+            dist.reduce(mem_mb, 0, op=dist.ReduceOp.MAX)
+        return mem_mb
    def log(self, runner):
        if runner.mode == 'train':
            lr_str = ', '.join(
@@ -38,13 +47,9 @@ class TextLoggerHook(LoggerHook):
                'time: {log[time]:.3f}, data_time: {log[data_time]:.3f}, '.
                format(log=runner.log_buffer.output))
        # statistic memory
-        if runner.mode == 'train' and torch.cuda.is_available():
+        # training mode if the output contains the key "time"
-            mem = torch.cuda.max_memory_allocated()
+        if 'time' in runner.log_buffer.output and torch.cuda.is_available():
-            mem_mb = torch.tensor([mem / (1024 * 1024)],
+            mem_mb = self._get_max_memory(runner)
-                                  dtype=torch.int,
-                                  device=torch.device('cuda'))
-            if runner.world_size > 1:
-                dist.reduce(mem_mb, 0, op=dist.ReduceOp.MAX)
            log_str += 'memory: {}, '.format(mem_mb.item())
        log_items = []
        for name, val in runner.log_buffer.output.items():