[Bugfix] Use random hidden states in dummy sampler run (#18543)

Signed-off-by: Bowen Wang <abmfy@icloud.com>
2025-12-10 06:45:01 +08:00 · 2025-05-22 06:48:56 -07:00 · 2025-05-22 06:48:56 -07:00 · 4e04eceb58
commit 4e04eceb58
parent 71075029f2
1 changed files with 4 additions and 0 deletions
--- a/vllm/v1/worker/gpu_model_runner.py
+++ b/vllm/v1/worker/gpu_model_runner.py
@@ -1721,6 +1721,10 @@ class GPUModelRunner(LoRAModelRunnerMixin):
        self,
        hidden_states: torch.Tensor,
    ) -> torch.Tensor:
+        # The dummy hidden states may contain special values,
+        # like `inf` or `nan`.
+        # To avoid breaking the sampler, we use a random tensor here instead.
+        hidden_states = torch.rand_like(hidden_states)

        logits = self.model.compute_logits(hidden_states, None)
        num_reqs = logits.size(0)