Commit 0a7720e9 authored by Benjamin Fattori

multi-device: take minimum computed autobatch over all ranks

parent f4df3e48
@@ -354,8 +354,19 @@ class HFLM(LM):
            return batch_size

        batch_size = forward_batch()
        utils.clear_torch_cache()

        if self.world_size > 1:
            # if multi-GPU, always take minimum over all selected batch sizes
            max_rnk_bs = torch.tensor([batch_size], device=self.device)
            gathered = (
                self.accelerator.gather(max_rnk_bs).cpu().detach().numpy().tolist()
            )
            batch_size = min(gathered)
            utils.clear_torch_cache()
            return batch_size

        utils.clear_torch_cache()
        return batch_size
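The hunk above synchronizes the automatically detected batch size across data-parallel ranks: each rank probes its own maximum, then all ranks adopt the global minimum so collective forward passes stay in lockstep. Below is a minimal standalone sketch of the same gather-and-min pattern, assuming a job started with `accelerate launch`; the `probe_batch_size` helper and the variable names are illustrative stand-ins for the harness's `forward_batch` detection, not part of this commit.

```python
# Minimal sketch of the gather-and-min pattern, assuming an initialized
# `accelerate` process group (e.g. started via `accelerate launch script.py`).
# `probe_batch_size` is a hypothetical stand-in for per-rank autodetection.
import torch
from accelerate import Accelerator

accelerator = Accelerator()

def probe_batch_size() -> int:
    # Pretend each rank detected a different maximum batch size, as would
    # happen on GPUs with uneven amounts of free memory.
    return 64 // (accelerator.process_index + 1)

batch_size = probe_batch_size()

if accelerator.num_processes > 1:
    # gather() returns a tensor with one entry per rank; taking the minimum
    # guarantees every rank can actually fit the chosen batch size.
    local = torch.tensor([batch_size], device=accelerator.device)
    batch_size = min(accelerator.gather(local).cpu().tolist())

print(f"rank {accelerator.process_index}: batch_size = {batch_size}")
```

Without this synchronization, ranks with less free memory would pick smaller batch sizes than their peers, and mismatched batch shapes across ranks can stall or break collective operations.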