diff --git a/vllm/distributed/kv_transfer/kv_connector/v1/nixl_connector.py b/vllm/distributed/kv_transfer/kv_connector/v1/nixl_connector.py index 51c59b0e7ad43..3008223243b16 100644 --- a/vllm/distributed/kv_transfer/kv_connector/v1/nixl_connector.py +++ b/vllm/distributed/kv_transfer/kv_connector/v1/nixl_connector.py @@ -923,9 +923,7 @@ class NixlConnectorWorker: # Add to requests that are waiting to be read and track expiration. self._reqs_to_send.update(metadata.reqs_to_send) end = time.perf_counter() - logger.info( - f"===== {len(metadata.reqs_to_recv)=}start_load_kv time: {end-start: 0.5f}s" - ) + logger.info(f"===== start_load_kv time: {end-start: 0.5f}s") def _read_blocks_for_req(self, req_id: str, meta: ReqMeta): logger.debug( @@ -941,7 +939,6 @@ class NixlConnectorWorker: def _read_blocks(self, local_block_ids: list[int], remote_block_ids: list[int], dst_engine_id: str, request_id: str): - start_all = time.perf_counter() # NOTE(rob): having the staging blocks be on the READER side is # not going to work well (since we will have to call rearrange tensors). # after we detect the txn is complete (which means we cannot make the @@ -1038,8 +1035,6 @@ class NixlConnectorWorker: # TODO (NickLucche) surface xfer elapsed time self._recving_transfers[request_id].append( (handle, time.perf_counter())) - end_all = time.perf_counter() - logger.info(f"TOTAL_TIME: {end_all-start_all :0.4f}s") def _get_block_descs_ids(self, engine_id: str,