mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2026-03-16 16:17:27 +08:00
Minor
This commit is contained in:
parent
5323969fcf
commit
e2c7dedb3a
@@ -193,7 +193,7 @@ class TPUModelRunner:
|
||||
kv_caches,
|
||||
logits_indices,
|
||||
)
|
||||
# TODO
|
||||
# TODO(woosuk): Support sampling with temperature and top_p.
|
||||
next_token_ids = jnp.argmax(logits, axis=-1)
|
||||
return next_token_ids, new_kv_caches
|
||||
|
||||
|
||||
Loading…
x
Reference in New Issue
Block a user