mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2025-12-10 23:55:19 +08:00
[bugfix][distributed] fix multi-node bug for shared memory (#6597)
This commit is contained in:
parent
f0bbfaf917
commit
07eb6f19f3
@@ -108,8 +108,14 @@ class ShmRingBuffer:
|
|||||||
# created by the process. The following patch is a workaround.
|
# created by the process. The following patch is a workaround.
|
||||||
with patch("multiprocessing.resource_tracker.register",
|
with patch("multiprocessing.resource_tracker.register",
|
||||||
lambda *args, **kwargs: None):
|
lambda *args, **kwargs: None):
|
||||||
self.shared_memory = shared_memory.SharedMemory(name=name)
|
try:
|
||||||
assert self.shared_memory.size == self.total_bytes_of_buffer
|
self.shared_memory = shared_memory.SharedMemory(name=name)
|
||||||
|
assert self.shared_memory.size == self.total_bytes_of_buffer # noqa
|
||||||
|
except FileNotFoundError:
|
||||||
|
# we might deserialize the object in a different node
|
||||||
|
# in this case, this object is not used,
|
||||||
|
# and we should suppress the error
|
||||||
|
pass
|
||||||
|
|
||||||
def __reduce__(self):
|
def __reduce__(self):
|
||||||
return (
|
return (
|
||||||
|
|||||||
Loading…
x
Reference in New Issue
Block a user