Unverified Commit 71cced8a authored by vfbd, committed by GitHub

OPTForCausalLM lm_head input size should be config.word_embed_proj_dim (#17225)

parent 56f50590
@@ -786,7 +786,7 @@ class OPTForCausalLM(OPTPreTrainedModel):
         self.model = OPTModel(config)

         # the lm_head weight is automatically tied to the embed tokens weight
-        self.lm_head = nn.Linear(config.hidden_size, config.vocab_size, bias=False)
+        self.lm_head = nn.Linear(config.word_embed_proj_dim, config.vocab_size, bias=False)

         # Initialize weights and apply final processing
         self.post_init()
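
For context, a minimal sketch (not part of the commit) of why the input dimension matters: OPT variants such as OPT-350m use a word_embed_proj_dim smaller than hidden_size, the decoder projects its final hidden states back down to word_embed_proj_dim, and the tied embed_tokens weight has shape (vocab_size, word_embed_proj_dim), so lm_head must be declared with word_embed_proj_dim input features. The config values below are illustrative, assuming a transformers release with OPT support.

import torch
from transformers import OPTConfig, OPTForCausalLM

# Illustrative OPT-350m-style shapes: 512-dim embeddings are projected up
# to 1024-dim hidden states inside the decoder (assumed values, randomly
# initialized weights; no pretrained checkpoint is loaded).
config = OPTConfig(hidden_size=1024, word_embed_proj_dim=512, vocab_size=50272)
model = OPTForCausalLM(config)

# embed_tokens.weight has shape (vocab_size, word_embed_proj_dim); the tied
# lm_head.weight shares that shape, matching the fixed Linear declaration.
assert model.lm_head.weight.shape == (config.vocab_size, config.word_embed_proj_dim)

# The decoder maps hidden states back to word_embed_proj_dim before lm_head,
# so a forward pass produces vocab-sized logits as expected.
logits = model(input_ids=torch.tensor([[1, 2, 3]])).logits
assert logits.shape == (1, 3, config.vocab_size)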