fix params

22197e78 · Baber · d5c234ce · 22197e78 · 22197e78
Commit 22197e78 authored Oct 15, 2025 by Baber
Hide whitespace changes
Inline Side-by-side

Showing 2 changed files with 6 additions and 3 deletions

lm_eval/api/model.py +5 -2

lm_eval/models/utils.py +1 -1

No files found.
--- a/lm_eval/api/model.py
+++ b/lm_eval/api/model.py
@@ -336,7 +336,7 @@ class TemplateLM(LM):
        return self.eot_token_id
    @abc.abstractmethod
-    def tok_encode(self, string: str, **kwargs) -> list[int]:
+    def tok_encode(self, string: str, add_special_tokens=False, **kwargs) -> list[int]:
        """
        Tokenize a string using the model's tokenizer and return a list of token IDs.
        """
@@ -377,6 +377,7 @@ class TemplateLM(LM):
            This method does NOT handle empty context. The caller should
            handle empty context (see loglikelihood method).
        """
+        assert context, "Context cannot be empty!"
        import transformers
        n_spaces = len(context) - len(context.rstrip())
@@ -429,7 +430,9 @@ class TemplateLM(LM):
        new_reqs = []
        for context, continuation in [req.args for req in requests]:
            if context == "":
-                continuation_enc = self.tok_encode(continuation)
+                continuation_enc = self.tok_encode(
+                    continuation, add_special_tokens=False
+                )
                # BOS or EOS as context
                context_enc, continuation_enc = (
                    ([self.prefix_token_id], continuation_enc)

--- a/lm_eval/models/utils.py
+++ b/lm_eval/models/utils.py
@@ -150,7 +150,7 @@ class Grouper:
 def pad_and_concat(
    max_length: int,
-    tensors: List[torch.Tensor],
+    tensors: list[torch.Tensor],
    padding_side: Literal["right", "left"] = "right",
 ):
    """