fix typo in comments (#6838)

6b242812 · Prajjwal Bhargava · GitHub · 7351ef83 · 6b242812
Unverified commit 6b242812, authored Sep 02, 2020 by Prajjwal Bhargava; committed by GitHub on Sep 02, 2020
Hide whitespace changes
Inline Side-by-side

Showing with 2 additions and 2 deletions

src/transformers/modeling_bert.py src/transformers/modeling_bert.py +2 -2

No files found.
--- a/src/transformers/modeling_bert.py
+++ b/src/transformers/modeling_bert.py
@@ -803,8 +803,8 @@ class BertModel(BertPreTrainedModel):
        # ourselves in which case we just need to make it broadcastable to all heads.
        extended_attention_mask: torch.Tensor = self.get_extended_attention_mask(attention_mask, input_shape, device)
-        # If a 2D ou 3D attention mask is provided for the cross-attention
+        # If a 2D or 3D attention mask is provided for the cross-attention
-        # we need to make broadcastabe to [batch_size, num_heads, seq_length, seq_length]
+        # we need to make broadcastable to [batch_size, num_heads, seq_length, seq_length]
        if self.config.is_decoder and encoder_hidden_states is not None:
            encoder_batch_size, encoder_sequence_length, _ = encoder_hidden_states.size()
            encoder_hidden_shape = (encoder_batch_size, encoder_sequence_length)