minor

Signed-off-by: Woosuk Kwon <woosuk.kwon@berkeley.edu>
2026-06-14 02:37:11 +08:00 · 2025-09-18 16:31:01 -07:00 · 2025-09-18 16:31:01 -07:00 · efda08481b
commit efda08481b
parent 82da219ff9
1 changed files with 2 additions and 2 deletions
--- a/vllm/v1/worker/gpu/sampler.py
+++ b/vllm/v1/worker/gpu/sampler.py
@@ -254,8 +254,8 @@ def compute_logprobs(
    )
    # NOTE(woosuk): Here, to save GPU memory, we do not materialize the full
-    # logprobs tensor. Instead, we only compute the logprobs of the topk + 1
+    # logprobs tensor. Instead, we only compute and return the logprobs of
-    # tokens.
+    # the topk + 1 tokens.
    BLOCK_SIZE = 1024
    _topk_logprobs_kernel[(batch_size, )](
        logprobs,