add hacky add_bos_token forcing for Gemma to VLLM too (#1857)

b3e4c49a · Hailey Schoelkopf · GitHub · 4bb77e82 · b3e4c49a
Unverified commit b3e4c49a, authored Jun 11, 2024 by Hailey Schoelkopf; committed by GitHub on Jun 11, 2024.
Hide whitespace changes
Inline Side-by-side

Showing with 6 additions and 0 deletions

lm_eval/models/vllm_causallms.py (+6 -0)

No files found.
--- a/lm_eval/models/vllm_causallms.py
+++ b/lm_eval/models/vllm_causallms.py
@@ -119,6 +119,12 @@ class VLLM(TemplateLM):
            tokenizer_revision=tokenizer_revision,
        )
        self.add_bos_token = add_bos_token
+        if "gemma" in pretrained.lower():
+            self.add_bos_token = True
+            eval_logger.info(
+                "Found 'gemma' in model name, a BOS token will be used as Gemma underperforms without it."
+            )
        self.custom_prefix_token_id = prefix_token_id
        if prefix_token_id is not None:
            eval_logger.info(