Unverified Commit 9bed3554 authored by Suraj Patil, committed by GitHub

[s2s] fix label_smoothed_nll_loss (#6344)

parent 99f73bcc
@@ -29,17 +29,15 @@ def label_smoothed_nll_loss(lprobs, target, epsilon, ignore_index=-100):
         pad_mask = target.eq(ignore_index)
         nll_loss.masked_fill_(pad_mask, 0.0)
         smooth_loss.masked_fill_(pad_mask, 0.0)
-        bs = pad_mask.long().sum()
     else:
         nll_loss = nll_loss.squeeze(-1)
         smooth_loss = smooth_loss.squeeze(-1)
-        bs = lprobs.shape[0]
 
     nll_loss = nll_loss.sum()  # mean()? Scared to break other math.
     smooth_loss = smooth_loss.sum()
     eps_i = epsilon / lprobs.size(-1)
     loss = (1.0 - epsilon) * nll_loss + eps_i * smooth_loss
-    return loss / bs, nll_loss / bs
+    return loss, nll_loss
 
 
 def encode_line(tokenizer, line, max_length, pad_to_max_length=True, return_tensors="pt"):
...
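
For context, here is a minimal, self-contained sketch of how the patched helper can be called. The removed normalizer bs = pad_mask.long().sum() counted padding positions rather than examples, so the old loss / bs divided by an unrelated quantity; after this change the function returns plain sums and leaves any normalization to the caller. The lines of the function above the diff hunk are reconstructed from the usual fairseq-style implementation and, like the toy shapes, pad id, and smoothing value below, are illustrative assumptions rather than part of this commit.

import torch
import torch.nn.functional as F


def label_smoothed_nll_loss(lprobs, target, epsilon, ignore_index=-100):
    # Post-patch behavior from the diff above; the gather/sum setup before the
    # hunk is reconstructed (fairseq-style) and is an assumption, not the diff.
    if target.dim() == lprobs.dim() - 1:
        target = target.unsqueeze(-1)
    nll_loss = -lprobs.gather(dim=-1, index=target)   # NLL of the gold token
    smooth_loss = -lprobs.sum(dim=-1, keepdim=True)   # uniform-smoothing term
    if ignore_index is not None:
        pad_mask = target.eq(ignore_index)
        nll_loss.masked_fill_(pad_mask, 0.0)          # zero out padded positions
        smooth_loss.masked_fill_(pad_mask, 0.0)
    else:
        nll_loss = nll_loss.squeeze(-1)
        smooth_loss = smooth_loss.squeeze(-1)

    nll_loss = nll_loss.sum()
    smooth_loss = smooth_loss.sum()
    eps_i = epsilon / lprobs.size(-1)
    loss = (1.0 - epsilon) * nll_loss + eps_i * smooth_loss
    return loss, nll_loss                             # sums; caller normalizes


# Toy usage (illustrative values only).
batch_size, seq_len, vocab_size = 2, 5, 11
pad_token_id = 0                                      # assumed pad id; must be a valid vocab index
epsilon = 0.1                                         # label-smoothing factor

logits = torch.randn(batch_size, seq_len, vocab_size)
labels = torch.randint(1, vocab_size, (batch_size, seq_len))
labels[1, 3:] = pad_token_id                          # pretend the second sequence is padded

lprobs = F.log_softmax(logits, dim=-1)
loss, nll_loss = label_smoothed_nll_loss(lprobs, labels, epsilon, ignore_index=pad_token_id)
print(loss.item(), nll_loss.item())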