mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2026-01-23 10:24:28 +08:00
[BugFix] Fix pipeline parallel (#24621)
Signed-off-by: Nick Hill <nhill@redhat.com>
This commit is contained in:
parent
29799ddacc
commit
e2d8c27f68
@ -71,6 +71,10 @@ class UniProcExecutor(ExecutorBase):
|
||||
self.shutdown()
|
||||
return
|
||||
|
||||
def shutdown(self) -> None:
|
||||
if worker := self.driver_worker:
|
||||
worker.shutdown()
|
||||
|
||||
|
||||
UniProcExecutorAsync = UniProcExecutor
|
||||
|
||||
|
||||
@ -2070,7 +2070,6 @@ class GPUModelRunner(LoRAModelRunnerMixin, KVConnectorModelRunnerMixin):
|
||||
sampler_output = self._sample(logits, spec_decode_metadata)
|
||||
|
||||
with record_function_or_nullcontext("Bookkeep"):
|
||||
assert isinstance(hidden_states, torch.Tensor)
|
||||
(
|
||||
num_nans_in_logits,
|
||||
logprobs_lists,
|
||||
|
||||
@ -45,7 +45,8 @@ class KVConnectorModelRunnerMixin:
|
||||
|
||||
@staticmethod
|
||||
def ensure_kv_transfer_shutdown() -> None:
|
||||
if has_kv_transfer_group():
|
||||
# has_kv_transfer_group can be None during interpreter shutdown.
|
||||
if has_kv_transfer_group and has_kv_transfer_group():
|
||||
ensure_kv_transfer_shutdown()
|
||||
|
||||
@staticmethod
|
||||
|
||||
Loading…
x
Reference in New Issue
Block a user