mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2026-05-05 11:11:21 +08:00
Fix scheduler
This commit is contained in:
parent
98eda57899
commit
b62170e4e3
@@ -666,6 +666,10 @@ class Scheduler:
|
|||||||
budget.add_num_batched_tokens(seq_group.request_id, num_new_tokens)
|
budget.add_num_batched_tokens(seq_group.request_id, num_new_tokens)
|
||||||
budget.add_num_seqs(seq_group.request_id, num_new_seqs)
|
budget.add_num_seqs(seq_group.request_id, num_new_seqs)
|
||||||
|
|
||||||
|
# FIXME(woosuk): For TPUs, we want to schedule only one prompt
|
||||||
|
# per scheduling step.
|
||||||
|
break
|
||||||
|
|
||||||
# Queue requests that couldn't be scheduled.
|
# Queue requests that couldn't be scheduled.
|
||||||
waiting_queue.extendleft(leftover_waiting_sequences)
|
waiting_queue.extendleft(leftover_waiting_sequences)
|
||||||
if len(seq_groups) > 0:
|
if len(seq_groups) > 0:
|
||||||
|
|||||||
Loading…
x
Reference in New Issue
Block a user