Use FP32 for log probabilities (#19)

a90c97d7 · Woosuk Kwon · GitHub · e3f00d19 · a90c97d7
Commit a90c97d7 (unverified signature), authored by Woosuk Kwon on Mar 31, 2023; committed by GitHub on Mar 31, 2023.
Hide whitespace changes
Inline Side-by-side

Showing 1 changed file with 2 additions and 1 deletion

cacheflow/models/sample.py (+2 -1)

No files found.
--- a/cacheflow/models/sample.py
+++ b/cacheflow/models/sample.py
@@ -36,10 +36,11 @@ class Sampler(nn.Module):
            # Use in-place division to avoid creating a new tensor.
            logits.div_(t.unsqueeze(dim=1))
+        # We use float32 for probabilities and log probabilities.
        # Compute the probabilities.
        probs = torch.softmax(logits, dim=-1, dtype=torch.float)
        # Compute the log probabilities (before applying top-p).
-        logprobs = torch.log(probs, out=logits)
+        logprobs = torch.log(probs)
        # Apply top-p truncation.
        top_ps = _get_top_ps(input_metadata)