Commit 90b2d8de authored by Zrachel, committed by Myle Ott

fix bug in lstm model (#68)

parent 884e3046
@@ -122,6 +122,8 @@ class LSTMDecoder(FairseqIncrementalDecoder):
             for layer in range(num_layers)
         ])
         self.attention = AttentionLayer(encoder_embed_dim, embed_dim)
+        if embed_dim != out_embed_dim:
+            self.additional_fc = Linear(embed_dim, out_embed_dim)
         self.fc_out = Linear(out_embed_dim, num_embeddings, dropout=dropout_out)
 
     def forward(self, input_tokens, encoder_out):
@@ -197,6 +199,9 @@ class LSTMDecoder(FairseqIncrementalDecoder):
         attn_scores = attn_scores.transpose(0, 2)
 
         # project back to size of vocabulary
+        if hasattr(self, 'additional_fc'):
+            x = self.additional_fc(x)
+            x = F.dropout(x, p=self.dropout_out, training=self.training)
         x = self.fc_out(x)
 
         return x, attn_scores
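For context on the fix: when the decoder's hidden size (`embed_dim`) differs from the output embedding size (`out_embed_dim`), `fc_out` would otherwise receive activations of the wrong width. The patch creates `additional_fc` to bridge the two sizes and applies it, with dropout, just before the vocabulary projection. Below is a minimal standalone sketch of the patched output path, not fairseq's actual module: the name `OutputProjection` and the dimensions are made up for illustration, and plain `nn.Linear` stands in for fairseq's `Linear` helper.

```python
import torch
import torch.nn as nn
import torch.nn.functional as F


class OutputProjection(nn.Module):
    """Sketch of the decoder output path after this commit (illustrative only)."""

    def __init__(self, embed_dim, out_embed_dim, num_embeddings, dropout_out=0.1):
        super().__init__()
        self.dropout_out = dropout_out
        if embed_dim != out_embed_dim:
            # the layer this commit adds: bridge embed_dim -> out_embed_dim
            self.additional_fc = nn.Linear(embed_dim, out_embed_dim)
        # final projection to vocabulary size
        self.fc_out = nn.Linear(out_embed_dim, num_embeddings)

    def forward(self, x):
        # mirror the hasattr() guard in the patched forward()
        if hasattr(self, 'additional_fc'):
            x = self.additional_fc(x)
            x = F.dropout(x, p=self.dropout_out, training=self.training)
        return self.fc_out(x)


# toy usage: hidden size 512, output embedding size 256, vocab of 1000
proj = OutputProjection(embed_dim=512, out_embed_dim=256, num_embeddings=1000)
logits = proj(torch.randn(8, 512))  # -> shape (8, 1000)
```

Note that the `hasattr()` guard means the extra layer exists only when the sizes differ, presumably so that configurations with matching sizes carry no extra parameters.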