[fix] OSS restore state to proper device (#46)

* move the restored param groups to the original device
* add a corresponding test

[fix] OSS restore state to proper device (#46)
* move the restored param groups to the original device
* add a corresponding test
c2d6f4b6 · Benjamin Lefaudeux · GitHub · 9d6c7b6a · c2d6f4b6 · c2d6f4b6
Unverified Commit c2d6f4b6 authored Aug 20, 2020 by Benjamin Lefaudeux Committed by GitHub Aug 20, 2020
Show whitespace changes
Inline Side-by-side

Showing 2 changed files with 4 additions and 1 deletion

fairscale/optim/oss.py fairscale/optim/oss.py +1 -1

tests/optim/test_oss.py tests/optim/test_oss.py +3 -0

No files found.
--- a/fairscale/optim/oss.py
+++ b/fairscale/optim/oss.py
@@ -148,7 +148,7 @@ class OSS(Optimizer):
        self.load_local_state_dict(state_dict["state"][self.rank])
        # Restore the global param_groups
-        self.param_groups = state_dict["param_groups"]
+        self.param_groups = recursive_copy_to_device(state_dict["param_groups"], non_blocking=True, device=self._device)
    def add_param_group(self, param_group: dict) -> None:
        super().add_param_group(param_group)

--- a/tests/optim/test_oss.py
+++ b/tests/optim/test_oss.py
@@ -62,6 +62,9 @@ def test_state_dict():
    o.step()
    assert x == torch.tensor([0.9], device=DEVICE)
+    # Check that the exposed param_groups are on the proper device
+    assert o.param_groups[0]["params"][0].device == x.device
 def test_local_state_dict():
    x = torch.tensor([1.0], device=DEVICE, requires_grad=True)