Extend `dtype` command line flag to `HFLM` (#523)

* allow for hf-causal to take dtype arg
* document this change

Extend `dtype` command line flag to `HFLM` (#523)
* allow for hf-causal to take dtype arg
* document this change
8cff2bea · Hailey Schoelkopf · GitHub · 4e94af6f · 8cff2bea · 8cff2bea
Unverified Commit 8cff2bea authored May 25, 2023 by Hailey Schoelkopf Committed by GitHub May 25, 2023
Hide whitespace changes
Inline Side-by-side

Showing with 17 additions and 3 deletions

README.md README.md +2 -2

lm_eval/models/gpt2.py lm_eval/models/gpt2.py +15 -1

No files found.
--- a/README.md
+++ b/README.md
@@ -46,12 +46,12 @@ python main.py \
    --device cuda:0
 ```

-Additional arguments can be provided to the model constructor using the `--model_args` flag. Most notably, this supports the common practice of using the `revisions` feature on the Hub to store partially trained checkpoints:
+Additional arguments can be provided to the model constructor using the `--model_args` flag. Most notably, this supports the common practice of using the `revisions` feature on the Hub to store partially trained checkpoints, and it can also be used to specify the datatype for running a model:

 ```bash
 python main.py \
    --model hf-causal \
-    --model_args pretrained=EleutherAI/pythia-160m,revision=step100000 \
+    --model_args pretrained=EleutherAI/pythia-160m,revision=step100000,dtype="float" \
    --tasks lambada_openai,hellaswag \
    --device cuda:0
 ```

--- a/lm_eval/models/gpt2.py
+++ b/lm_eval/models/gpt2.py
 import torch
 import transformers
-from typing import Optional
+from typing import Optional, Union
 from lm_eval.base import BaseLM


+def _get_dtype(
+    dtype: Union[str, torch.dtype]
+) -> torch.dtype:
+    """Resolves a `str` `dtype` other than `auto` to the `torch` attribute of that name; any other value is returned unchanged. Does not use an instantiated HF AutoConfig"""
+    if isinstance(dtype, str) and dtype != "auto":
+        # Convert `str` args to torch dtype via attribute lookup on `torch`: `float16` -> `torch.float16`
+        _torch_dtype = getattr(torch, dtype)
+    else:
+        _torch_dtype = dtype
+    return _torch_dtype
+
+
 class HFLM(BaseLM):
    def __init__(
        self,
@@ -16,6 +28,7 @@ class HFLM(BaseLM):
        batch_size=1,
        load_in_8bit: Optional[bool] = False,
        trust_remote_code: Optional[bool] = False,
+        dtype: Optional[Union[str, torch.dtype]]="auto",
    ):
        super().__init__()

@@ -46,6 +59,7 @@ class HFLM(BaseLM):
            load_in_8bit=load_in_8bit,
            low_cpu_mem_usage=low_cpu_mem_usage,
            revision=revision,
+            torch_dtype=_get_dtype(dtype),
            trust_remote_code=trust_remote_code,
        ).to(self.device)
        self.gpt2.eval()