mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2026-03-25 05:55:52 +08:00
parent
ee2a4b0889
commit
dedb1a5424
@ -330,7 +330,10 @@ class NixlConnectorWorker:
|
||||
self.block_size = vllm_config.cache_config.block_size
|
||||
|
||||
# Agent.
|
||||
self.nixl_wrapper = NixlWrapper(str(uuid.uuid4()), None)
|
||||
self.nixl_wrapper = NixlWrapper(str(uuid.uuid4()),
|
||||
None,
|
||||
num_workers=None,
|
||||
num_shared_workers=16)
|
||||
# Map of engine_id -> {rank0: agent_name0, rank1: agent_name1..}.
|
||||
self._remote_agents: dict[str, dict[int, str]] = defaultdict(dict)
|
||||
|
||||
@ -986,9 +989,9 @@ class NixlConnectorWorker:
|
||||
|
||||
# Begin async xfer.
|
||||
start = time.perf_counter()
|
||||
# for handle in handles:
|
||||
# self.nixl_wrapper.transfer(handle)
|
||||
self.nixl_wrapper.transfer_batched(handles)
|
||||
for handle in handles:
|
||||
self.nixl_wrapper.transfer(handle)
|
||||
# self.nixl_wrapper.transfer_batched(handles)
|
||||
end = time.perf_counter()
|
||||
logger.info("======== LAUNCH TIME: %s ========", end - start)
|
||||
|
||||
|
||||
Loading…
x
Reference in New Issue
Block a user