fix FSDP error with .prepare_model()

92561822 · Benjamin Fattori · 4cda3a1c · 92561822
Commit 92561822 authored Aug 26, 2023 by Benjamin Fattori
Hide whitespace changes
Inline Side-by-side

Showing with 10 additions and 4 deletions

lm_eval/models/huggingface.py lm_eval/models/huggingface.py +10 -4

No files found.
--- a/lm_eval/models/huggingface.py
+++ b/lm_eval/models/huggingface.py
@@ -20,7 +20,7 @@ from lm_eval.api.registry import register_model

 from lm_eval.utils import MultiTokenEOSCriteria, stop_sequences_criteria

-from accelerate import Accelerator, find_executable_batch_size
+from accelerate import Accelerator, find_executable_batch_size, DistributedType
 from typing import List, Optional, Union


@@ -289,9 +289,15 @@ class HFLM(LM):
                        "Failed to place model onto specified device. This may be because the model is quantized via `bitsandbytes`. If the desired GPU is being used, this message is safe to ignore."
                    )
            else:
-                self._model = accelerator.prepare_model(
-                    self.model, evaluation_mode=True
-                )
+                assert accelerator.distributed_type in [DistributedType.FSDP, DistributedType.MULTI_GPU], "Unsupported distributed type provided. Only DDP and FSDP are supported."
+                if accelerator.distributed_type == DistributedType.FSDP:
+                    self._model = accelerator.prepare(
+                        self.model
+                    )
+                else:
+                    self._model = accelerator.prepare_model(
+                        self.model, evaluation_mode = True 
+                    )
                self._device = torch.device(f"cuda:{accelerator.local_process_index}")
                self.accelerator = accelerator