revert gpus > num processes case

5cb7af7e · haileyschoelkopf · 62f4d663 · 5cb7af7e
Commit 5cb7af7e authored Jul 03, 2023 by haileyschoelkopf
Show whitespace changes
Inline Side-by-side

Showing with 20 additions and 25 deletions

lm_eval/models/huggingface.py lm_eval/models/huggingface.py +20 -25

No files found.
--- a/lm_eval/models/huggingface.py
+++ b/lm_eval/models/huggingface.py
@@ -174,8 +174,7 @@ class HFLM(LM):
                    )
                else:
                    pass
-            else:
+            elif gpus > accelerator.num_processes:
-                if gpus > accelerator.num_processes:
                # TODO: make sure there's still never an edge case where we unintentionally default to CPU
                eval_logger.warning(
                    "WARNING: The number of total system GPUs does not match the number of spawned processes. "
@@ -185,28 +184,24 @@ class HFLM(LM):
                )
                self._rank = accelerator.local_process_index
                self._world_size = accelerator.num_processes
+                # manually set model to use gpu, for case where many GPUs available but
+                # only seek to use one
+                self._device = (
+                    torch.device(f"cuda:{accelerator.local_process_index}")
+                    if torch.cuda.is_available()
+                    else torch.device("cpu")
+                )
+                self.model.to(self.device)
+            else:
                self._model = accelerator.prepare(self.model)
                self._device = torch.device(f"cuda:{accelerator.local_process_index}")
                self.accelerator = accelerator
                if self.accelerator.is_local_main_process:
                    eval_logger.info(f"Using {gpus} devices with data parallelism")
-                # manually set model to use gpu, for case where many GPUs available but
-                # only seek to use one
+                self._rank = self.accelerator.local_process_index
-                # self._device = (
+                self._world_size = self.accelerator.num_processes
-                #     torch.device(f"cuda:{accelerator.local_process_index}")
-                #     if torch.cuda.is_available()
-                #     else torch.device("cpu")
-                # )
-                # self.model.to(self.device)
-            # else:
-            #     self._model = accelerator.prepare(self.model)
-            #     self._device = torch.device(f"cuda:{accelerator.local_process_index}")
-            #     self.accelerator = accelerator
-            #     self._rank = self.accelerator.local_process_index
-            #     self._world_size = self.accelerator.num_processes
    @property
    def config(self):