mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2025-12-18 12:15:33 +08:00
[multi-step] Raise error if not using async engine (#7703)
This commit is contained in:
parent
1b32e02648
commit
91f4522cbf
@@ -1302,6 +1302,11 @@ class LLMEngine:
|
|||||||
raise NotImplementedError(
|
raise NotImplementedError(
|
||||||
"Pipeline parallelism is only supported through AsyncLLMEngine "
|
"Pipeline parallelism is only supported through AsyncLLMEngine "
|
||||||
"as performance will be severely degraded otherwise.")
|
"as performance will be severely degraded otherwise.")
|
||||||
|
|
||||||
|
if self.scheduler_config.num_scheduler_steps > 1:
|
||||||
|
raise NotImplementedError(
|
||||||
|
"Multiple scheduler steps (multi-step) are only supported "
|
||||||
|
"through AsyncLLMEngine. ")
|
||||||
seq_group_metadata_list, scheduler_outputs = self.scheduler[
|
seq_group_metadata_list, scheduler_outputs = self.scheduler[
|
||||||
0].schedule()
|
0].schedule()
|
||||||
|
|
||||||
|
|||||||
Loading…
x
Reference in New Issue
Block a user