mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2026-04-05 03:37:03 +08:00
[BugFix] Corner case that could cause out-of-sync with external launcher mode and dp >1 (#28774)
This commit is contained in:
parent
f77bce001a
commit
61485844fc
@ -2663,6 +2663,18 @@ class GPUModelRunner(
|
||||
return make_empty_encoder_model_runner_output(scheduler_output)
|
||||
|
||||
if not num_scheduled_tokens:
|
||||
if (
|
||||
self.parallel_config.distributed_executor_backend
|
||||
== "external_launcher"
|
||||
and self.parallel_config.data_parallel_size > 1
|
||||
):
|
||||
# this is a corner case when both external launcher
|
||||
# and DP are enabled, num_scheduled_tokens could be
|
||||
# 0, and has_unfinished_requests in the outer loop
|
||||
# returns True. before returning early here we call
|
||||
# dummy run to ensure coordinate_batch_across_dp
|
||||
# is called into to avoid out of sync issues.
|
||||
self._dummy_run(1)
|
||||
if not has_kv_transfer_group():
|
||||
# Return empty ModelRunnerOutput if no work to do.
|
||||
return EMPTY_MODEL_RUNNER_OUTPUT
|
||||
|
||||
Loading…
x
Reference in New Issue
Block a user