Commit 41df5ff7 authored by rprenger

Fixing a bug where the wrong token was used to index the log probabilities

parent e0bf5199
...
@@ -270,7 +270,7 @@ def sample_sequence_batch(model, context_tokens, context_lengths,
         lengths = torch.ones([batch_size]).long().cuda() * maxlen
-        while context_length <= (maxlen):
+        while context_length < maxlen:
             types2use = None
             if counter == 0:
                 tokens2use = tokens[:, :context_length]
...
@@ -316,7 +316,7 @@ def sample_sequence_batch(model, context_tokens, context_lengths,
                 if output_logits is None:
                     output_context = F.log_softmax(output[:, :context_length, :], 2)
-                    indices = torch.unsqueeze(tokens[:, :context_length],2)
+                    indices = torch.unsqueeze(tokens[:, 1:context_length+1],2)
                     output_logits = torch.gather(output_context, 2, indices).squeeze(2)
                 else:
                     indices = torch.unsqueeze(new_tokens,1).unsqueeze(2)
...
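For context, a minimal standalone sketch of the off-by-one this commit fixes (toy tensors and made-up sizes, not the actual sample_sequence_batch code): the log-softmax of the output at position t is the model's distribution over the token at position t + 1, so the per-token log probabilities have to be gathered with the token indices shifted forward by one.

import torch
import torch.nn.functional as F

# Toy stand-ins; shapes mirror the real code: tokens is [batch, seq], output is [batch, seq, vocab].
batch_size, context_length, vocab_size = 2, 5, 10
tokens = torch.randint(vocab_size, (batch_size, context_length + 1))
output = torch.randn(batch_size, context_length, vocab_size)  # hypothetical model output
output_context = F.log_softmax(output, 2)

# Old indexing: pairs the distribution at position t with the token the model was
# conditioned on at t, i.e. a token it had already seen.
wrong_indices = torch.unsqueeze(tokens[:, :context_length], 2)
wrong_logits = torch.gather(output_context, 2, wrong_indices).squeeze(2)

# Fixed indexing: pairs the distribution at position t with the token at t + 1,
# the one the model actually had to predict.
fixed_indices = torch.unsqueeze(tokens[:, 1:context_length + 1], 2)
fixed_logits = torch.gather(output_context, 2, fixed_indices).squeeze(2)

The loop-bound change (<= to <) in the first hunk appears to be part of the same fix: stopping one step earlier keeps the shifted slice 1:context_length+1 within the token buffer.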