Unverified Commit 9e80f972 authored by Sam Shleifer, committed by GitHub

Enable pegasus fp16 by clamping large activations (#7243)

* Clean clamp

* boom boom

* Take some other changes

* boom boom

* boom boom

* boom boom

* one chg

* fix test

* Use finfo

* style
parent be51c103
```diff
@@ -269,6 +269,9 @@ class EncoderLayer(nn.Module):
         x = residual + x
         if not self.normalize_before:
             x = self.final_layer_norm(x)
+        if torch.isinf(x).any() or torch.isnan(x).any():
+            clamp_value = torch.finfo(x.dtype).max - 1000
+            x = torch.clamp(x, min=-clamp_value, max=clamp_value)
         return x, attn_weights
```
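
The guard only fires once an activation has already saturated: float16 tops out at 65504, so large post-residual sums overflow to inf, and the clamp pulls them back just inside the representable range. A minimal standalone sketch of the same idea (the helper name `clamp_inf_nan` is illustrative, not part of the diff):

```python
import torch

def clamp_inf_nan(x: torch.Tensor) -> torch.Tensor:
    # Only clamp when something actually overflowed, keeping the common path cheap.
    if torch.isinf(x).any() or torch.isnan(x).any():
        # torch.finfo(torch.float16).max == 65504, so clamp_value == 64504.0 here.
        clamp_value = torch.finfo(x.dtype).max - 1000
        x = torch.clamp(x, min=-clamp_value, max=clamp_value)
    return x

# 1e5 is not representable in float16 and saturates to inf on conversion.
x = torch.tensor([1e5, -1e5, 3.0], dtype=torch.float16)
print(clamp_inf_nan(x))  # -> roughly tensor([ 64512., -64512., 3.], dtype=torch.float16)
```

Note that 64504 itself rounds to 64512 when stored back in float16, and that `torch.clamp` propagates NaNs unchanged; the NaN check mainly serves as an overflow signal here.
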
```diff
@@ -47,9 +47,11 @@ class PegasusXSUMIntegrationTest(AbstractSeq2SeqIntegrationTest):
         # Demonstrate fp16 issue, Contributions welcome!
         self.model.half()
         translated_tokens_fp16 = self.model.generate(**inputs, max_length=10)
-        decoded = self.tokenizer.batch_decode(translated_tokens_fp16, skip_special_tokens=True)
-        bad_fp16_result = ["unk_7unk_7unk_7unk_7unk_7unk_7unk_7", "unk_7unk_7unk_7unk_7unk_7unk_7unk_7"]
-        self.assertListEqual(decoded, bad_fp16_result)
+        decoded_fp16 = self.tokenizer.batch_decode(translated_tokens_fp16, skip_special_tokens=True)
+        assert decoded_fp16 == [
+            "California's largest electricity provider has begun",
+            "N-Dubz have revealed they were",
+        ]
 
 
 class PegasusConfigTests(unittest.TestCase):
```
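
The updated test expects real summaries in half precision rather than the old `unk_7` garbage. A hedged end-to-end sketch of the same scenario (the `google/pegasus-xsum` checkpoint name follows from the XSUM integration test; the input text is illustrative, and the rest assumes the standard transformers loading API and a CUDA device):

```python
from transformers import PegasusForConditionalGeneration, PegasusTokenizer

name = "google/pegasus-xsum"
tokenizer = PegasusTokenizer.from_pretrained(name)
# .half() is the step that produced unk_7 output before the clamp landed.
model = PegasusForConditionalGeneration.from_pretrained(name).half().to("cuda")

article = "PG&E stated it scheduled the blackouts in response to forecasts for high winds."
batch = tokenizer([article], return_tensors="pt", truncation=True).to("cuda")
summary_ids = model.generate(**batch, max_length=10)
print(tokenizer.batch_decode(summary_ids, skip_special_tokens=True))
```
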