[fix] Pure cpu support for benchmarks/oss.py (#185)

* Now works on a machine without CUDA, which makes debugging and quick testing easier

[fix] Pure cpu support for benchmarks/oss.py (#185)
* Now works on a machine without CUDA, which makes debugging and quick testing easier
2fe93203 · Yuanyuan (Ana) Shen · GitHub · 34df6069 · 2fe93203
Unverified Commit 2fe93203 authored Nov 12, 2020 by Yuanyuan (Ana) Shen Committed by GitHub Nov 12, 2020
Hide whitespace changes
Inline Side-by-side

Showing with 5 additions and 4 deletions

benchmarks/oss.py benchmarks/oss.py +5 -4

No files found.
--- a/benchmarks/oss.py
+++ b/benchmarks/oss.py
@@ -104,7 +104,11 @@ def train(
        optimizer = model.sharded_optimizer

    else:
-        model = DDP(model, device_ids=[rank], find_unused_parameters=False)  # type: ignore
+        if args.cpu:
+            device_ids = None
+        else:
+            device_ids = [rank]
+        model = DDP(model, device_ids=device_ids, find_unused_parameters=False)  # type: ignore
        optimizer = (
            OSS(params=model.parameters(), optim=OPTIM, lr=1e-4, momentum=0.9)
            if optim_type == OptimType.oss_ddp
@@ -211,10 +215,7 @@ def train(

    training_stop = time.monotonic()
    img_per_sec = n_items / (training_stop - training_start) * args.epochs
-    max_memory = torch.cuda.max_memory_allocated(rank) / 2 ** 20
-
    logging.info(f"[{dist.get_rank()}] : Training done. {img_per_sec:.2f} img per sec inc. checkpoint")
-    logging.info(f"[{dist.get_rank()}] : Peak memory {max_memory:.1f}MiB")

    # Compute the mean and average img per second
    mean = sum(measurements) / len(measurements)