mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2026-05-25 23:37:54 +08:00
updated
Signed-off-by: Robert Shaw <robshaw@redhat.com>
This commit is contained in:
parent
e81c277e6e
commit
1dcd90065d
@ -431,11 +431,11 @@ class MPClient(EngineCoreClient):
|
|||||||
dp_rank = parallel_config.data_parallel_rank
|
dp_rank = parallel_config.data_parallel_rank
|
||||||
dp_local_size = parallel_config.data_parallel_size_local
|
dp_local_size = parallel_config.data_parallel_size_local
|
||||||
offline_mode = parallel_config.data_parallel_rank_local is not None
|
offline_mode = parallel_config.data_parallel_rank_local is not None
|
||||||
|
# If Internal DPLB, the Client manages local+remote EngineCores.
|
||||||
|
# Otherwise, the Client just manages the local EngineCores.
|
||||||
local_engines_only = (parallel_config.data_parallel_hybrid_lb
|
local_engines_only = (parallel_config.data_parallel_hybrid_lb
|
||||||
or parallel_config.data_parallel_external_lb)
|
or parallel_config.data_parallel_external_lb)
|
||||||
|
|
||||||
# If External DPLB, Client manages local EngineCores.
|
|
||||||
# If Internal DPLB, Client manages local+remote EngineCores.
|
|
||||||
num_ranks = dp_local_size if local_engines_only else dp_size
|
num_ranks = dp_local_size if local_engines_only else dp_size
|
||||||
self.engine_ranks_managed = ([dp_rank] if offline_mode else range(
|
self.engine_ranks_managed = ([dp_rank] if offline_mode else range(
|
||||||
dp_rank, dp_rank + num_ranks))
|
dp_rank, dp_rank + num_ranks))
|
||||||
@ -1020,7 +1020,6 @@ class DPLBAsyncMPClient(DPAsyncMPClient):
|
|||||||
self, request: EngineCoreRequest) -> EngineIdentity:
|
self, request: EngineCoreRequest) -> EngineIdentity:
|
||||||
# Engines are in rank order.
|
# Engines are in rank order.
|
||||||
if (eng_index := request.data_parallel_rank) is None:
|
if (eng_index := request.data_parallel_rank) is None:
|
||||||
# logger.info(f"{self.lb_engines=} | {self.core_engines=}")
|
|
||||||
if not self.lb_engines:
|
if not self.lb_engines:
|
||||||
return self.core_engine
|
return self.core_engine
|
||||||
# TODO use P2C alg for larger DP sizes
|
# TODO use P2C alg for larger DP sizes
|
||||||
|
|||||||
Loading…
x
Reference in New Issue
Block a user