"vscode:/vscode.git/clone" did not exist on "e6ab50dffa3c1bbf2d7107f2375db3287ddc2fa1"
Unverified commit 9884ad6e, authored by Hailey Schoelkopf, committed by GitHub
Browse files

Include recurrent_gemma model types in the force-BOS case (#2105)

parent 2b26690f
...@@ -257,10 +257,10 @@ class HFLM(TemplateLM): ...@@ -257,10 +257,10 @@ class HFLM(TemplateLM):
self.tokenizer = configure_pad_token(self.tokenizer, model_config=self.config) self.tokenizer = configure_pad_token(self.tokenizer, model_config=self.config)
self.add_bos_token = add_bos_token self.add_bos_token = add_bos_token
if getattr(self.config, "model_type", None) in ["gemma", "gemma2"]: if "gemma" in getattr(self.config, "model_type", ""):
self.add_bos_token = True self.add_bos_token = True
eval_logger.info( eval_logger.info(
f"Model type is '{self.config.model_type}', a BOS token will be used as Gemma underperforms without it." f"Model type is '{self.config.model_type}', part of the Gemma family--a BOS token will be used as Gemma underperforms without it."
) )
self._max_length = max_length self._max_length = max_length
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment