[ux] Switch a warning to debug about a PyTorch fallback (#23750)

Signed-off-by: Russell Bryant <rbryant@redhat.com>
This commit is contained in:
Russell Bryant 2025-09-25 10:38:16 -04:00 committed by GitHub
parent eb32335e35
commit 532a6cfccb
No known key found for this signature in database
GPG Key ID: B5690EEEBB952194

View File

@@ -109,9 +109,9 @@ class TopKTopPSampler(nn.Module):
# CPU-GPU synchronization while `flashinfer_sample` does.
if (k is None and p is None) or generators:
if generators:
logger.warning_once("FlashInfer 0.2.3+ does not support "
"per-request generators. Falling back to "
"PyTorch-native implementation.")
logger.debug_once("FlashInfer 0.2.3+ does not support "
"per-request generators. Falling back to "
"PyTorch-native implementation.")
return self.forward_native(logits, generators, k, p)
assert self.logprobs_mode not in (
"processed_logits", "processed_logprobs"