From c481d30c17d3b51f8a3d4a9775e6d52a8eab8bbd Mon Sep 17 00:00:00 2001 From: "rshaw@neuralmagic.com" Date: Mon, 30 Jun 2025 01:39:15 +0000 Subject: [PATCH] update Signed-off-by: rshaw@neuralmagic.com --- .../kv_transfer/kv_connector/v1/nixl_connector.py | 5 ++++- 1 file changed, 4 insertions(+), 1 deletion(-) diff --git a/vllm/distributed/kv_transfer/kv_connector/v1/nixl_connector.py b/vllm/distributed/kv_transfer/kv_connector/v1/nixl_connector.py index 47433ae0dabbf..c5ff321cd9f53 100644 --- a/vllm/distributed/kv_transfer/kv_connector/v1/nixl_connector.py +++ b/vllm/distributed/kv_transfer/kv_connector/v1/nixl_connector.py @@ -333,7 +333,8 @@ class NixlConnectorWorker: self.nixl_wrapper = NixlWrapper(str(uuid.uuid4()), None, num_workers=None, - num_shared_workers=16) + # num_shared_workers=16) # setting this > 0 causes the notifs to be recved + num_shared_workers=None) # Map of engine_id -> {rank0: agent_name0, rank1: agent_name1..}. self._remote_agents: dict[str, dict[int, str]] = defaultdict(dict) @@ -819,6 +820,7 @@ class NixlConnectorWorker: """ notified_req_ids: set[str] = set() for notifs in self.nixl_wrapper.get_new_notifs().values(): + print(f"{notifs=}") for notif in notifs: req_id, tp_ratio = notif.decode("utf-8").rsplit(":", 1) self.consumer_notification_counts_by_req[req_id] += 1 @@ -853,6 +855,7 @@ class NixlConnectorWorker: xfer_state) # Done. + print(f"{len(new_handles)=}") if len(new_handles) == 0: start = time.perf_counter() self.nixl_wrapper.send_notif(agent_name, notif_id)