mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2026-04-08 13:47:06 +08:00
update
Signed-off-by: Woosuk Kwon <woosuk.kwon@berkeley.edu>
This commit is contained in:
parent
a98eff0762
commit
323a05b3c5
@ -136,4 +136,4 @@ def init_kv_cache(
|
||||
kv_cache_raw_tensors = _allocate_kv_cache(kv_cache_config, device)
|
||||
kv_caches = _reshape_kv_cache(kv_cache_config, kv_cache_raw_tensors,
|
||||
attn_backends)
|
||||
bind_kv_cache(forward_context, kv_caches, runner_kv_caches)
|
||||
bind_kv_cache(kv_caches, forward_context, runner_kv_caches)
|
||||
|
||||
Loading…
x
Reference in New Issue
Block a user