mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2025-12-09 21:55:50 +08:00
OffloadingConnector: Fix GPU block tracking bug (#25856)
Signed-off-by: Or Ozeri <oro@il.ibm.com>
This commit is contained in:
parent
fb610ae684
commit
cfd302db9b
@@ -278,8 +278,9 @@ class OffloadingConnectorScheduler:
|
||||
req, start_idx=start_block_idx, end_idx=num_blocks)
|
||||
store_output = self.manager.prepare_store(new_block_hashes)
|
||||
if store_output is None:
|
||||
- logger.warning("Cannot store %s blocks", num_new_blocks)
|
||||
- break
|
||||
+ logger.warning("Request %s: cannot store %s blocks", req_id,
|
||||
+ num_new_blocks)
|
||||
+ continue
|
||||
|
||||
self._next_stored_block_idx[req_id] = num_blocks
|
||||
|
||||
|
||||
Loading…
x
Reference in New Issue
Block a user