"cacheflow/master/server.py" did not exist on "e9d3f2ff7772c8efe41dc805cec71c223ec18ec8"
Commit a0c5f9b8 authored by Myle Ott, committed by Facebook GitHub Bot

Allow TransformerSentenceEncoder to return only last state

Summary: Pull Request resolved: https://github.com/fairinternal/fairseq-py/pull/578

Differential Revision: D15352060

Pulled By: myleott

fbshipit-source-id: 7dc2fceca37ec96c89356662831b0d82f28bef6f
parent 52778827
@@ -152,7 +152,8 @@ class TransformerSentenceEncoder(nn.Module):
     def forward(
         self,
         tokens: torch.Tensor,
-        segment_labels: torch.Tensor
+        segment_labels: torch.Tensor,
+        last_state_only: bool = False,
     ) -> Tuple[torch.Tensor, torch.Tensor]:

         # compute padding mask. This is needed for multi-head attention
@@ -181,18 +182,25 @@ class TransformerSentenceEncoder(nn.Module):
         # B x T x C -> T x B x C
         x = x.transpose(0, 1)

-        inner_states = [x]
+        inner_states = []
+        if not last_state_only:
+            inner_states.append(x)

         for layer in self.layers:
             x, _ = layer(
                 x,
                 self_attn_padding_mask=padding_mask,
             )
-            inner_states.append(x)
+            if not last_state_only:
+                inner_states.append(x)

         # T x B x C -> B x T x C
         x = x.transpose(0, 1)

         sentence_rep = x[:, 0, :]

+        if last_state_only:
+            inner_states = [x]
+
         return inner_states, sentence_rep
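
For illustration, here is a minimal self-contained sketch of the pattern this diff introduces: a stack of layers whose forward pass either collects every intermediate state or, when last_state_only=True, skips that bookkeeping and returns only the final state. The ToyEncoder class below, its dimensions, and the call sites are hypothetical stand-ins, not fairseq's actual TransformerSentenceEncoder API.

    # Toy illustration of the last_state_only pattern (not fairseq code).
    from typing import List, Tuple

    import torch
    import torch.nn as nn


    class ToyEncoder(nn.Module):
        def __init__(self, dim: int = 16, num_layers: int = 3):
            super().__init__()
            # Stand-in "layers"; fairseq uses TransformerSentenceEncoderLayer here.
            self.layers = nn.ModuleList(
                nn.Linear(dim, dim) for _ in range(num_layers)
            )

        def forward(
            self,
            x: torch.Tensor,
            last_state_only: bool = False,
        ) -> Tuple[List[torch.Tensor], torch.Tensor]:
            inner_states = []
            if not last_state_only:
                inner_states.append(x)
            for layer in self.layers:
                x = layer(x)
                if not last_state_only:
                    inner_states.append(x)
            if last_state_only:
                # Only the final state is kept, so callers that need just the
                # top-layer output avoid holding every intermediate tensor.
                inner_states = [x]
            return inner_states, x


    encoder = ToyEncoder()
    tokens = torch.randn(2, 5, 16)  # B x T x C
    all_states, last = encoder(tokens)                    # len(all_states) == 4
    only_last, _ = encoder(tokens, last_state_only=True)  # len(only_last) == 1

Since the default is last_state_only=False, existing callers keep their previous behavior; only callers that opt in drop the per-layer state collection.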