mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2025-12-30 20:49:39 +08:00
[BugFix] Spec decode with VLLM_ENABLE_V1_MULTIPROCESSING=0 (#30319)
Signed-off-by: Chen Zhang <zhangch99@outlook.com>
This commit is contained in:
parent
41b6f9200f
commit
24b65eff0d
@@ -268,7 +268,8 @@ class InprocClient(EngineCoreClient):
         self.engine_core = EngineCore(*args, **kwargs)
 
     def get_output(self) -> EngineCoreOutputs:
-        outputs, _ = self.engine_core.step_fn()
+        outputs, model_executed = self.engine_core.step_fn()
+        self.engine_core.post_step(model_executed=model_executed)
         return outputs and outputs.get(0) or EngineCoreOutputs()
 
     def get_supported_tasks(self) -> tuple[SupportedTask, ...]:
Loading…
x
Reference in New Issue
Block a user