mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2026-03-16 14:07:13 +08:00
updated
Signed-off-by: Robert Shaw <robshaw@redhat.com>
This commit is contained in:
parent
e82e9afeb7
commit
1588294a88
@ -923,9 +923,7 @@ class NixlConnectorWorker:
|
||||
# Add to requests that are waiting to be read and track expiration.
|
||||
self._reqs_to_send.update(metadata.reqs_to_send)
|
||||
end = time.perf_counter()
|
||||
logger.info(
|
||||
f"===== {len(metadata.reqs_to_recv)=}start_load_kv time: {end-start: 0.5f}s"
|
||||
)
|
||||
logger.info(f"===== start_load_kv time: {end-start: 0.5f}s")
|
||||
|
||||
def _read_blocks_for_req(self, req_id: str, meta: ReqMeta):
|
||||
logger.debug(
|
||||
@ -941,7 +939,6 @@ class NixlConnectorWorker:
|
||||
def _read_blocks(self, local_block_ids: list[int],
|
||||
remote_block_ids: list[int], dst_engine_id: str,
|
||||
request_id: str):
|
||||
start_all = time.perf_counter()
|
||||
# NOTE(rob): having the staging blocks be on the READER side is
|
||||
# not going to work well (since we will have to call rearrange tensors).
|
||||
# after we detect the txn is complete (which means we cannot make the
|
||||
@ -1038,8 +1035,6 @@ class NixlConnectorWorker:
|
||||
# TODO (NickLucche) surface xfer elapsed time
|
||||
self._recving_transfers[request_id].append(
|
||||
(handle, time.perf_counter()))
|
||||
end_all = time.perf_counter()
|
||||
logger.info(f"TOTAL_TIME: {end_all-start_all :0.4f}s")
|
||||
|
||||
def _get_block_descs_ids(self,
|
||||
engine_id: str,
|
||||
|
||||
Loading…
x
Reference in New Issue
Block a user