Merge b9968373c3d95db7abc58f2c71b8b136373a4779 into 254f6b986720c92ddf97fbb1a6a6465da8e87e29

2026-05-30 01:57:05 +08:00 · 2025-12-25 00:06:35 +00:00 · 2025-12-25 00:06:35 +00:00 · fee1157f8f
commit fee1157f8f
parent 254f6b9867 b9968373c3
1 changed file with 4 additions and 1 deletion
--- a/vllm/v1/request.py
+++ b/vllm/v1/request.py
@@ -3,6 +3,7 @@
 import enum
 import time
 import weakref
 from collections.abc import Callable, Mapping
 from functools import partial
 from typing import TYPE_CHECKING, Any, Optional
@@ -132,7 +133,9 @@ class Request:
        self.block_hashes: list[BlockHash] = []
        self.get_hash_new_full_blocks: Callable[[], list[BlockHash]] | None = None
        if block_hasher is not None:
-            self.get_hash_new_full_blocks = partial(block_hasher, self)
+            # Pass a weakref proxy to break the cycle: Request -> partial -> Request.
            # The Request is then freed by refcounting, without waiting for cyclic GC.
            self.get_hash_new_full_blocks = partial(block_hasher, weakref.proxy(self))
            self.block_hashes = self.get_hash_new_full_blocks()
        self.skip_reading_prefix_cache = self.get_skip_reading_prefix_cache()