"""{{cookiecutter.modelname}} Model with a `language modeling` head on top for CLM fine-tuning. """,{{cookiecutter.uppercase_modelname}}_START_DOCSTRING
"""{{cookiecutter.modelname}} Model with a `language modeling` head on top for CLM fine-tuning. """,{{cookiecutter.uppercase_modelname}}_START_DOCSTRING
...
@@ -993,15 +991,12 @@ class TF{{cookiecutter.camelcase_modelname}}ForCausalLM(TF{{cookiecutter.camelca
...
@@ -993,15 +991,12 @@ class TF{{cookiecutter.camelcase_modelname}}ForCausalLM(TF{{cookiecutter.camelca
attentions=outputs.attentions,
attentions=outputs.attentions,
)
)
# Copied from transformers.models.bert.modeling_tf_bert.TFBertLMHeadModel.serving_output