Use FP32 for log probabilities (#19)

2026-01-23 13:14:34 +08:00 · 2023-03-31 23:33:43 -07:00 · 2023-03-31 23:33:43 -07:00 · a90c97d727
commit a90c97d727
parent e3f00d191e
1 changed file with 2 additions and 1 deletion
--- a/cacheflow/models/sample.py
+++ b/cacheflow/models/sample.py
@@ -36,10 +36,11 @@ class Sampler(nn.Module):
            # Use in-place division to avoid creating a new tensor.
            logits.div_(t.unsqueeze(dim=1))

+        # We use float32 for probabilities and log probabilities.
        # Compute the probabilities.
        probs = torch.softmax(logits, dim=-1, dtype=torch.float)
        # Compute the log probabilities (before applying top-p).
-        logprobs = torch.log(probs, out=logits)
+        logprobs = torch.log(probs)

        # Apply top-p truncation.
        top_ps = _get_top_ps(input_metadata)