mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2026-06-04 07:02:14 +08:00
format
Signed-off-by: inkcherry <mingzhi.liu@amd.com>
This commit is contained in:
parent
16d2a7a343
commit
374cc25e0f
@ -79,6 +79,7 @@ class MoRIIOConstants:
|
|||||||
|
|
||||||
VLLM_MORI_READ_ABORT_REQUEST_TIMEOUT = 3600
|
VLLM_MORI_READ_ABORT_REQUEST_TIMEOUT = 3600
|
||||||
|
|
||||||
|
|
||||||
try:
|
try:
|
||||||
from mori.io import (
|
from mori.io import (
|
||||||
BackendType,
|
BackendType,
|
||||||
@ -1293,7 +1294,8 @@ class MoRIIOConnectorScheduler:
|
|||||||
if delay_free_blocks:
|
if delay_free_blocks:
|
||||||
# Prefill request on remote. It will be read from D upon completion
|
# Prefill request on remote. It will be read from D upon completion
|
||||||
self._reqs_need_send[request.request_id] = (
|
self._reqs_need_send[request.request_id] = (
|
||||||
time.perf_counter() + MoRIIOConstants.VLLM_MORI_READ_ABORT_REQUEST_TIMEOUT
|
time.perf_counter()
|
||||||
|
+ MoRIIOConstants.VLLM_MORI_READ_ABORT_REQUEST_TIMEOUT
|
||||||
)
|
)
|
||||||
|
|
||||||
# If we execute in P-D serial mode, no notification port is needed.
|
# If we execute in P-D serial mode, no notification port is needed.
|
||||||
@ -1508,8 +1510,8 @@ class MoRIIOConnectorWorker:
|
|||||||
remote_ip: IP address of remote node
|
remote_ip: IP address of remote node
|
||||||
"""
|
"""
|
||||||
|
|
||||||
|
# synchronization to prevent dirty reads between
|
||||||
# synchronization to prevent dirty reads between transfer and attention operations
|
# transfer and attention operations
|
||||||
# we can consider removing this synchronization after ibgda is enabled.
|
# we can consider removing this synchronization after ibgda is enabled.
|
||||||
# when mori-io supports ibgda functionality
|
# when mori-io supports ibgda functionality
|
||||||
|
|
||||||
@ -1934,18 +1936,17 @@ class MoRIIOConnectorWorker:
|
|||||||
to track which workers are done.
|
to track which workers are done.
|
||||||
"""
|
"""
|
||||||
|
|
||||||
done_sending, done_recving = set() ,set()
|
done_sending, done_recving = set(), set()
|
||||||
|
|
||||||
if self.is_producer:
|
if self.is_producer:
|
||||||
done_sending = self.moriio_wrapper.pop_finished_req_ids()
|
done_sending = self.moriio_wrapper.pop_finished_req_ids()
|
||||||
|
|
||||||
else:
|
else:
|
||||||
if self.mode == MoRIIOMode.WRITE:
|
if self.mode == MoRIIOMode.WRITE:
|
||||||
done_recving = self.moriio_wrapper.pop_finished_write_req_ids()
|
done_recving = self.moriio_wrapper.pop_finished_write_req_ids()
|
||||||
else:
|
else:
|
||||||
done_recving = self._pop_done_transfers()
|
done_recving = self._pop_done_transfers()
|
||||||
|
|
||||||
|
|
||||||
return done_sending, done_recving
|
return done_sending, done_recving
|
||||||
|
|
||||||
def _pop_done_transfers(self) -> set[str]:
|
def _pop_done_transfers(self) -> set[str]:
|
||||||
|
|||||||
Loading…
x
Reference in New Issue
Block a user