Commit f607d9e8 authored by Myle Ott

Small optimization for LSTM

parent 8fcdb9b7
@@ -245,7 +245,7 @@ class AttentionLayer(nn.Module):
                 float('-inf')
             ).type_as(attn_scores)  # FP16 support: cast to float and back
 
-        attn_scores = F.softmax(attn_scores.t(), dim=1).t()  # srclen x bsz
+        attn_scores = F.softmax(attn_scores, dim=0)  # srclen x bsz
 
         # sum weighted sources
         x = (attn_scores.unsqueeze(2) * source_hids).sum(dim=0)
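The change is behavior-preserving: for a srclen x bsz score tensor, taking softmax over dim=0 normalizes over source positions exactly as transposing, taking softmax over dim=1, and transposing back does, while skipping both transposes. A minimal sketch checking the equivalence (the shapes below are illustrative, not taken from the commit):

    import torch
    import torch.nn.functional as F

    srclen, bsz = 7, 3  # illustrative sizes; attn_scores is srclen x bsz in AttentionLayer
    attn_scores = torch.randn(srclen, bsz)

    # before: transpose to bsz x srclen, softmax over source positions, transpose back
    old = F.softmax(attn_scores.t(), dim=1).t()
    # after: softmax directly over the source dimension, no transposes
    new = F.softmax(attn_scores, dim=0)

    assert torch.allclose(old, new)  # identical attention weights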