From 0abe10e4a7fd9b0d81d440008361abf46164451d Mon Sep 17 00:00:00 2001 From: Robert Shaw Date: Wed, 23 Jul 2025 15:21:46 +0000 Subject: [PATCH] updated Signed-off-by: Robert Shaw --- .../kv_transfer/kv_connector/v1/nixl_connector.py | 9 +++++++++ 1 file changed, 9 insertions(+) diff --git a/vllm/distributed/kv_transfer/kv_connector/v1/nixl_connector.py b/vllm/distributed/kv_transfer/kv_connector/v1/nixl_connector.py index 0c5986bfafaa0..590734a380b9a 100644 --- a/vllm/distributed/kv_transfer/kv_connector/v1/nixl_connector.py +++ b/vllm/distributed/kv_transfer/kv_connector/v1/nixl_connector.py @@ -893,6 +893,7 @@ class NixlConnectorWorker: return done_req_ids def start_load_kv(self, metadata: NixlConnectorMetadata): + start = time.perf_counter() """ Start loading by triggering non-blocking nixl_xfer. We check for these trnxs to complete in each step(). @@ -921,6 +922,10 @@ class NixlConnectorWorker: # Add to requests that are waiting to be read and track expiration. self._reqs_to_send.update(metadata.reqs_to_send) + end = time.perf_counter() + logger.info( + f"===== {len(metadata.reqs_to_recv)=}start_load_kv time: {end-start: 0.5f}s" + ) def _read_blocks_for_req(self, req_id: str, meta: ReqMeta): logger.debug( @@ -1019,10 +1024,14 @@ class NixlConnectorWorker: remote_xfer_side_handle, remote_block_descs_ids, notif_msg=notif_id, + skip_desc_merge=True, ) # Begin async xfer. + start = time.perf_counter() self.nixl_wrapper.transfer(handle) + end = time.perf_counter() + logger.info(f"TRANSFER TIME: {end-start :0.4f}s") # Use handle to check completion in future step(). # TODO (NickLucche) surface xfer elapsed time