mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2026-04-01 03:17:03 +08:00
Update scheduler.py
Signed-off-by: Pr0Wh1teGivee <calvin_zhu0210@outlook.com>
Signed-off-by: weichen <calvin_zhu0210@outlook.com>
This commit is contained in:
parent
779769ea97
commit
6413793466
@ -21,7 +21,11 @@ logger = init_logger(__name__)
|
||||
|
||||
RunnerType = Literal["generate", "pooling", "draft"]
|
||||
SchedulerPolicy = Literal["fcfs", "priority", "sjf"]
|
||||
|
||||
""" SJF Scheduling Policy:
|
||||
SJF stands for shortest-job-first: requests are scheduled by total prompt +
|
||||
output length (shorter first), with aging to prevent starvation. For more
|
||||
information, please check: https://github.com/vllm-project/vllm/issues/29406
|
||||
"""
|
||||
|
||||
@config
|
||||
@dataclass
|
||||
|
||||
Loading…
x
Reference in New Issue
Block a user