Unverified commit b3e4c49a, authored by Hailey Schoelkopf, committed by GitHub
Browse files

add hacky add_bos_token forcing for Gemma to VLLM too (#1857)

parent 4bb77e82
...@@ -119,6 +119,12 @@ class VLLM(TemplateLM): ...@@ -119,6 +119,12 @@ class VLLM(TemplateLM):
tokenizer_revision=tokenizer_revision, tokenizer_revision=tokenizer_revision,
) )
self.add_bos_token = add_bos_token self.add_bos_token = add_bos_token
if "gemma" in pretrained.lower():
self.add_bos_token = True
eval_logger.info(
"Found 'gemma' in model name, a BOS token will be used as Gemma underperforms without it."
)
self.custom_prefix_token_id = prefix_token_id self.custom_prefix_token_id = prefix_token_id
if prefix_token_id is not None: if prefix_token_id is not None:
eval_logger.info( eval_logger.info(
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment