mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2025-12-10 14:15:55 +08:00
[bugfix][distributed] fix multi-node bug for shared memory (#6597)
This commit is contained in:
parent
f0bbfaf917
commit
07eb6f19f3
@ -108,8 +108,14 @@ class ShmRingBuffer:
|
||||
# created by the process. The following patch is a workaround.
|
||||
with patch("multiprocessing.resource_tracker.register",
|
||||
lambda *args, **kwargs: None):
|
||||
self.shared_memory = shared_memory.SharedMemory(name=name)
|
||||
assert self.shared_memory.size == self.total_bytes_of_buffer
|
||||
try:
|
||||
self.shared_memory = shared_memory.SharedMemory(name=name)
|
||||
assert self.shared_memory.size == self.total_bytes_of_buffer # noqa
|
||||
except FileNotFoundError:
|
||||
# we might deserialize the object in a different node
|
||||
# in this case, this object is not used,
|
||||
# and we should suppress the error
|
||||
pass
|
||||
|
||||
def __reduce__(self):
|
||||
return (
|
||||
|
||||
Loading…
x
Reference in New Issue
Block a user