mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2026-06-07 06:35:42 +08:00
Minor
This commit is contained in:
parent
5323969fcf
commit
e2c7dedb3a
@ -193,7 +193,7 @@ class TPUModelRunner:
|
|||||||
kv_caches,
|
kv_caches,
|
||||||
logits_indices,
|
logits_indices,
|
||||||
)
|
)
|
||||||
# TODO
|
# TODO(woosuk): Support sampling with temperature and top_p.
|
||||||
next_token_ids = jnp.argmax(logits, axis=-1)
|
next_token_ids = jnp.argmax(logits, axis=-1)
|
||||||
return next_token_ids, new_kv_caches
|
return next_token_ids, new_kv_caches
|
||||||
|
|
||||||
|
|||||||
Loading…
x
Reference in New Issue
Block a user