Fix #7331 (#7732)

1f1d950b · Lysandre Debut · GitHub · d9ffb87e · 1f1d950b
Unverified commit 1f1d950b, authored Oct 12, 2020 by Lysandre Debut; committed by GitHub on Oct 12, 2020.
Hide whitespace changes
Inline Side-by-side

Showing with 1 addition and 1 deletion

src/transformers/modeling_gpt2.py (+1 -1)

No files found.
--- a/src/transformers/modeling_gpt2.py
+++ b/src/transformers/modeling_gpt2.py
@@ -584,7 +584,7 @@ class GPT2Model(GPT2PreTrainedModel):
            # positions we want to attend and -10000.0 for masked positions.
            # Since we are adding it to the raw scores before the softmax, this is
            # effectively the same as removing these entirely.
-            attention_mask = attention_mask.to(dtype=next(self.parameters()).dtype)  # fp16 compatibility
+            attention_mask = attention_mask.to(dtype=self.dtype)  # fp16 compatibility
            attention_mask = (1.0 - attention_mask) * -10000.0

        # If a 2D ou 3D attention mask is provided for the cross-attention