Commit d7b8fd9c authored by Konrad

tokenizer name property for cache_key

parent 615352c0
@@ -183,6 +183,12 @@ class LM(abc.ABC):
         # not support multi-device parallelism nor expect it.
         return self._world_size
 
+    @property
+    def get_tokenizer_name(self) -> str:
+        raise NotImplementedError(
+            "To use this model with chat templates, please implement the 'get_tokenizer_name' property."
+        )
+
     def set_cache_hook(self, cache_hook) -> None:
         self.cache_hook = cache_hook
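The base class now raises until a backend opts in. A minimal sketch of how a custom subclass could satisfy the contract (the subclass name and constructor are hypothetical, not part of this diff; other abstract LM methods are omitted):

    # Hypothetical backend: any model that wants chat-template request
    # caching exposes its tokenizer name through the new property.
    class MyAPIModel(LM):
        def __init__(self, tokenizer_name: str) -> None:
            super().__init__()
            self._tokenizer_name = tokenizer_name

        @property
        def get_tokenizer_name(self) -> str:
            # Replace '/' so the name is safe inside a cache file name,
            # mirroring the HFLM convention further down in this commit.
            return self._tokenizer_name.replace("/", "__")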
@@ -391,8 +391,7 @@ class Task(abc.ABC):
             if system_instruction is not None
             else ""
         )
-        if lm is not None and hasattr(lm, "tokenizer"):
-            cache_key += f"-{lm.tokenizer.name_or_path.replace('/', '__')}"
+        cache_key += f"-tokenizer{lm.get_tokenizer_name}" if apply_chat_template else ""
         cached_instances = load_from_cache(file_name=cache_key)
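Note that `get_tokenizer_name` is read without call parentheses because it is a `@property`, and the suffix only lands on the key when `apply_chat_template` is set. A worked example with hypothetical values:

    # Worked example (illustrative base key and model name):
    cache_key = "requests-mytask-0shot"
    tokenizer_name = "meta-llama/Llama-2-7b-hf".replace("/", "__")
    cache_key += f"-tokenizer{tokenizer_name}"
    # -> "requests-mytask-0shot-tokenizermeta-llama__Llama-2-7b-hf"

Keying the cache on tokenizer identity keeps chat-templated requests built for one model from being replayed against a model with a different chat template.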
@@ -415,6 +415,10 @@ class HFLM(TemplateLM):
     def world_size(self):
         return self._world_size
 
+    @property
+    def get_tokenizer_name(self) -> str:
+        return self.tokenizer.name_or_path.replace("/", "__")
+
     def _get_backend(
         self,
         config: Union[transformers.PretrainedConfig, transformers.AutoConfig],
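A minimal usage sketch, assuming `lm` is an HFLM instance wrapping the example checkpoint `EleutherAI/pythia-70m` (an assumed value for illustration):

    print(lm.get_tokenizer_name)  # property access, no parentheses
    # -> "EleutherAI__pythia-70m"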