make RepetitionPenaltyLogitsProcessor faster (#9600)

a98173cc · LSinev · GitHub · a1ad16a4 · a98173cc
Unverified Commit a98173cc authored Jan 20, 2021 by LSinev Committed by GitHub Jan 20, 2021
Hide whitespace changes
Inline Side-by-side

Showing with 2 additions and 3 deletions

src/transformers/generation_logits_process.py src/transformers/generation_logits_process.py +2 -3

No files found.
--- a/src/transformers/generation_logits_process.py
+++ b/src/transformers/generation_logits_process.py
@@ -155,13 +155,12 @@ class RepetitionPenaltyLogitsProcessor(LogitsProcessor):
        self.penalty = penalty

    def __call__(self, input_ids: torch.LongTensor, scores: torch.FloatTensor) -> torch.FloatTensor:
-        ranges = torch.arange(scores.shape[0])
-        score = scores[ranges[:, None], input_ids]
+        score = torch.gather(scores, 1, input_ids)

        # if score < 0 then repetition penalty has to be multiplied to reduce the previous token probability
        score = torch.where(score < 0, score * self.penalty, score / self.penalty)

-        scores[ranges[:, None], input_ids] = score
+        scores.scatter_(1, input_ids, score)
        return scores