mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2026-04-06 05:27:04 +08:00
fix
Signed-off-by: Woosuk Kwon <woosuk.kwon@berkeley.edu>
This commit is contained in:
parent
5c133fc860
commit
e47bb9970b
@@ -118,7 +118,7 @@ class BlockTables:
         # no clear upper bound on the number of new blocks.
         new_block_ids_cpu = torch.empty(
             self.num_kv_cache_groups,
-            max(len(b) for b in new_block_ids),
+            max(x[-1] for x in cu_num_new_blocks),
             dtype=torch.int32,
             device="cpu",
             pin_memory=self.pin_memory,
Loading…
x
Reference in New Issue
Block a user