[BugFix] Spec decode with VLLM_ENABLE_V1_MULTIPROCESSING=0 (#30319)

Signed-off-by: Chen Zhang <zhangch99@outlook.com>
This commit is contained in:
Chen Zhang 2025-12-18 11:47:56 -08:00 committed by GitHub
parent 41b6f9200f
commit 24b65eff0d
No known key found for this signature in database
GPG Key ID: B5690EEEBB952194

View File

@ -268,7 +268,8 @@ class InprocClient(EngineCoreClient):
self.engine_core = EngineCore(*args, **kwargs)
def get_output(self) -> EngineCoreOutputs:
    """Run one in-process engine step and return its outputs.

    The engine is stepped exactly once per call, and ``post_step`` is
    then invoked with the flag reporting whether the model executed.
    NOTE(review): per the commit title, the ``post_step`` call is what
    makes speculative decoding work when
    ``VLLM_ENABLE_V1_MULTIPROCESSING=0`` -- confirm against
    ``EngineCore.post_step``.

    Returns:
        The entry stored under key ``0`` of the step outputs
        (presumably the single in-process client's index -- verify
        against ``EngineCore``), or a fresh empty ``EngineCoreOutputs``
        when the step produced nothing or that entry is missing/falsy.
    """
    # Step once only: a second ``step_fn()`` call would advance the
    # engine again and silently drop the first batch of outputs.
    outputs, model_executed = self.engine_core.step_fn()
    self.engine_core.post_step(model_executed=model_executed)

    # Same truthiness rules as ``outputs and outputs.get(0) or ...``,
    # spelled without the and/or idiom.
    client_outputs = outputs.get(0) if outputs else None
    return client_outputs or EngineCoreOutputs()
def get_supported_tasks(self) -> tuple[SupportedTask, ...]: