Unverified commit b3e4c49a, authored by Hailey Schoelkopf, committed by GitHub
Browse files

add hacky add_bos_token forcing for Gemma to VLLM too (#1857)

parent 4bb77e82
......@@ -119,6 +119,12 @@ class VLLM(TemplateLM):
tokenizer_revision=tokenizer_revision,
)
self.add_bos_token = add_bos_token
if "gemma" in pretrained.lower():
self.add_bos_token = True
eval_logger.info(
"Found 'gemma' in model name, a BOS token will be used as Gemma underperforms without it."
)
self.custom_prefix_token_id = prefix_token_id
if prefix_token_id is not None:
eval_logger.info(
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment