mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2025-12-13 20:44:27 +08:00
[Bugfix] Significant performance drop on CPUs with --num-scheduler-steps > 1 (#11794)
This commit is contained in:
parent
973f5dc581
commit
a4e2b26856
@ -1157,6 +1157,12 @@ class EngineArgs:
|
|||||||
if self.enable_chunked_prefill and self.pipeline_parallel_size > 1:
|
if self.enable_chunked_prefill and self.pipeline_parallel_size > 1:
|
||||||
raise ValueError("Multi-Step Chunked-Prefill is not supported "
|
raise ValueError("Multi-Step Chunked-Prefill is not supported "
|
||||||
"for pipeline-parallel-size > 1")
|
"for pipeline-parallel-size > 1")
|
||||||
|
from vllm.platforms import current_platform
|
||||||
|
if current_platform.is_cpu():
|
||||||
|
logger.warning("Multi-Step (--num-scheduler-steps > 1) is "
|
||||||
|
"currently not supported for CPUs and has been "
|
||||||
|
"disabled.")
|
||||||
|
self.num_scheduler_steps = 1
|
||||||
|
|
||||||
# make sure num_lookahead_slots is set to the higher value depending on
|
# make sure num_lookahead_slots is set to the higher value depending on
|
||||||
# if we are using speculative decoding or multi-step
|
# if we are using speculative decoding or multi-step
|
||||||
|
|||||||
Loading…
x
Reference in New Issue
Block a user