Commit ecde9d2e authored by Tian Yun

Fixing stopping criteria

parent 1cd4ec01
@@ -121,6 +121,11 @@ class LM(abc.ABC):
 class BaseLM(LM):
+    @property
+    @abstractmethod
+    def eot_token(self):
+        pass
+
     @property
     @abstractmethod
     def eot_token_id(self):
@@ -354,8 +359,15 @@ class BaseLM(LM):
             isinstance(max_generation_length, int) or max_generation_length is None
         )
-        until = [stopping_criteria]
+        if stopping_criteria is None:
+            until = [self.eot_token]
+        else:
+            until = [stopping_criteria]
         primary_until = self.tok_encode(until[0])
+        if len(primary_until) == 0:
+            primary_until = torch.tensor([self.eot_token_id])
         context_enc = torch.tensor(
             [self.tok_encode(context)[self.max_gen_toks - self.max_length :]]
         ).to(self.device)
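The hunk above amounts to a small fallback chain for choosing the stop sequence: use the caller's stopping criterion if given, otherwise the model's end-of-text string, and if the stop string encodes to nothing, fall back to the end-of-text token id. A minimal, self-contained sketch of that logic follows; resolve_stopping_criteria, the character-level encoder, and the GPT-2-style values "<|endoftext|>" / 50256 are illustrative assumptions, not part of the commit.

import torch

def resolve_stopping_criteria(stopping_criteria, tok_encode, eot_token, eot_token_id):
    # No explicit stop string supplied: fall back to the end-of-text token.
    if stopping_criteria is None:
        until = [eot_token]
    else:
        until = [stopping_criteria]
    # Encode the primary stop string; if it encodes to nothing, fall back to
    # the end-of-text token id so generation can still terminate.
    primary_until = tok_encode(until[0])
    if len(primary_until) == 0:
        primary_until = torch.tensor([eot_token_id])
    return until, primary_until

# Toy usage with a character-level "tokenizer" and GPT-2-style EOT values.
until, primary_until = resolve_stopping_criteria(
    None, lambda s: [ord(c) for c in s], "<|endoftext|>", 50256
)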
@@ -72,6 +72,10 @@ class HFLM(BaseLM):
         # if gpus > 1:
         #     self.gpt2 = nn.DataParallel(self.gpt2)

+    @property
+    def eot_token(self):
+        return self.tokenizer.eos_token
+
     @property
     def eot_token_id(self):
         # we use EOT because end of *text* is more accurate for what we're doing than end of *sentence*
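For context on how the new abstract eot_token property is satisfied, here is a hedged sketch of a HuggingFace-backed implementation; the DummyHF class and its use of AutoTokenizer are assumptions for illustration and do not reproduce HFLM's actual constructor.

from transformers import AutoTokenizer

class DummyHF:
    def __init__(self):
        self.tokenizer = AutoTokenizer.from_pretrained("gpt2")

    @property
    def eot_token(self):
        # Stop *string*, e.g. "<|endoftext|>" for GPT-2 tokenizers.
        return self.tokenizer.eos_token

    @property
    def eot_token_id(self):
        # Matching token id, e.g. 50256 for GPT-2.
        return self.tokenizer.eos_token_id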