From a46bc0a6a3a3923aba0390a4628cc9e908b12663 Mon Sep 17 00:00:00 2001 From: Robert Shaw Date: Sun, 20 Jul 2025 21:06:47 +0000 Subject: [PATCH] updated Signed-off-by: Robert Shaw --- vllm/v1/engine/core_client.py | 7 ++++++- 1 file changed, 6 insertions(+), 1 deletion(-) diff --git a/vllm/v1/engine/core_client.py b/vllm/v1/engine/core_client.py index aea0e1e6558d5..57b5ee70a5285 100644 --- a/vllm/v1/engine/core_client.py +++ b/vllm/v1/engine/core_client.py @@ -901,6 +901,10 @@ class DPAsyncMPClient(AsyncMPClient): assert self.stats_update_address is not None + assert len(self.engine_ranks_managed) > 1 + start_idx = self.engine_ranks_managed[0] + end_idx = self.engine_ranks_managed[-1] + async def run_engine_stats_update_task(): with make_zmq_socket(self.ctx, self.stats_update_address, zmq.XSUB) as socket, make_zmq_socket( @@ -947,6 +951,7 @@ class DPAsyncMPClient(AsyncMPClient): self.engines_running = True msg = msgspec.msgpack.encode( (target_eng_index, self.current_wave)) + logger.info("FIRST_REQ") await socket.send(msg) buf = None @@ -966,7 +971,7 @@ class DPAsyncMPClient(AsyncMPClient): self.engines_running = running # NOTE: counts include all global Cores. Slice # to get get the Core's managed by this client. - self.lb_engines = counts[self.engine_ranks_managed] + self.lb_engines = counts[start_idx:end_idx] resources.stats_update_task = asyncio.create_task( run_engine_stats_update_task())