mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2026-05-13 22:41:23 +08:00
fix
Signed-off-by: Woosuk Kwon <woosuk.kwon@berkeley.edu>
This commit is contained in:
parent
5c133fc860
commit
e47bb9970b
@@ -118,7 +118,7 @@ class BlockTables:
|
|||||||
# no clear upper bound on the number of new blocks.
|
# no clear upper bound on the number of new blocks.
|
||||||
new_block_ids_cpu = torch.empty(
|
new_block_ids_cpu = torch.empty(
|
||||||
self.num_kv_cache_groups,
|
self.num_kv_cache_groups,
|
||||||
max(len(b) for b in new_block_ids),
|
max(x[-1] for x in cu_num_new_blocks),
|
||||||
dtype=torch.int32,
|
dtype=torch.int32,
|
||||||
device="cpu",
|
device="cpu",
|
||||||
pin_memory=self.pin_memory,
|
pin_memory=self.pin_memory,
|
||||||
|
|||||||
Loading…
x
Reference in New Issue
Block a user