"...git@developer.sourcefind.cn:chenpangpang/transformers.git" did not exist on "d740351f7dfd6176e40efaeca694aca5622a55cd"
Commit e0f867a9 authored by LysandreJik

XLNet bias fix on resize embeddings (cf #1124)

parent d7a4c325
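When `resize_token_embeddings` grows the vocabulary, weight tying copies only `weight` from the input embeddings to the output projection; an output bias (as in XLNet's LM head, cf #1124) keeps its old length, and the next forward pass fails with a shape mismatch. The diff below zero-pads the bias up to the new size. As a standalone illustration of the `torch.nn.functional.pad` call the patch adds (a sketch, not code from the commit):

```python
import torch
import torch.nn.functional as F

bias = torch.tensor([0.1, 0.2, 0.3])  # bias sized for a 3-token vocabulary
# pad takes (left, right) amounts for the last dimension: append 2 zeros on
# the right, as if the vocabulary had grown from 3 to 5 tokens.
padded = F.pad(bias, (0, 2), 'constant', 0)
print(padded)  # tensor([0.1000, 0.2000, 0.3000, 0.0000, 0.0000])
```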
@@ -327,6 +327,14 @@ class PreTrainedModel(nn.Module):
         else:
             first_module.weight = second_module.weight
 
+        if hasattr(first_module, 'bias') and first_module.bias is not None:
+            first_module.bias.data = torch.nn.functional.pad(
+                first_module.bias.data,
+                (0, first_module.weight.shape[0] - first_module.bias.shape[0]),
+                'constant',
+                0
+            )
+
     def resize_token_embeddings(self, new_num_tokens=None):
         """ Resize input token embeddings matrix of the model if new_num_tokens != config.vocab_size.
             Take care of tying weights embeddings afterwards if the model class has a `tie_weights()` method.
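A minimal sketch of the scenario the patch handles, built from plain `torch` modules; the names (`embedding`, `lm_head`) are illustrative, not the ones used in the repository:

```python
import torch
import torch.nn as nn

vocab_size, hidden, new_vocab_size = 8, 4, 10

embedding = nn.Embedding(vocab_size, hidden)        # input embeddings
lm_head = nn.Linear(hidden, vocab_size, bias=True)  # tied output projection

# Simulate resize_token_embeddings: build a larger embedding and copy the
# old rows over, as the resize helper does.
new_embedding = nn.Embedding(new_vocab_size, hidden)
new_embedding.weight.data[:vocab_size] = embedding.weight.data

# Re-tying copies only the weight, leaving the bias at the old size.
lm_head.weight = new_embedding.weight       # weight is now (10, 4)
assert lm_head.bias.shape[0] == vocab_size  # but bias is still (8,)

# The patched logic: zero-pad the bias on the right to match the weight rows.
if hasattr(lm_head, 'bias') and lm_head.bias is not None:
    lm_head.bias.data = torch.nn.functional.pad(
        lm_head.bias.data,
        (0, lm_head.weight.shape[0] - lm_head.bias.shape[0]),
        'constant',
        0,
    )
assert lm_head.bias.shape[0] == new_vocab_size  # bias now (10,)
```

Zero-padding leaves the logits of existing tokens unchanged and gives the newly added tokens a neutral starting bias.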