"git@developer.sourcefind.cn:chenpangpang/transformers.git" did not exist on "471cce24b38c75226d1428eae899f03c9521a995"
Commit 35d32308 authored by thomwolf

adding back final dropout in T5

parent e74c73a8
@@ -629,6 +629,7 @@ class T5Stack(T5PreTrainedModel):
             all_attentions = all_attentions + (layer_outputs[1],)  # We keep only self-attention weights for now
         hidden_states = self.final_layer_norm(hidden_states)
+        hidden_states = self.dropout(hidden_states)
         # Add last layer
         if self.output_hidden_states:
 ...
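For reference, the restored line applies dropout once more after the stack's final layer norm, before the hidden states are returned. Below is a minimal, self-contained sketch of that pattern under stated assumptions: it is not the actual T5Stack, the class name TinyStack and all sizes are made up for illustration, and nn.LayerNorm stands in for T5's own RMS-style layer norm.

import torch
import torch.nn as nn

class TinyStack(nn.Module):
    # Illustrative stand-in for T5Stack (hypothetical class, not the real implementation).
    def __init__(self, d_model=8, dropout_rate=0.1, num_layers=2):
        super().__init__()
        self.block = nn.ModuleList([nn.Linear(d_model, d_model) for _ in range(num_layers)])
        self.final_layer_norm = nn.LayerNorm(d_model)  # T5 itself uses an RMS-style layer norm
        self.dropout = nn.Dropout(dropout_rate)

    def forward(self, hidden_states):
        for layer in self.block:
            hidden_states = layer(hidden_states)
        hidden_states = self.final_layer_norm(hidden_states)
        # The step re-added by this commit: a final dropout after the last layer norm.
        hidden_states = self.dropout(hidden_states)
        return hidden_states

if __name__ == "__main__":
    out = TinyStack()(torch.randn(1, 4, 8))
    print(out.shape)  # torch.Size([1, 4, 8])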