mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2026-01-28 09:17:13 +08:00
[V1] Allow sliding window + prefix caching (#13069)
Signed-off-by: Woosuk Kwon <woosuk.kwon@berkeley.edu>
This commit is contained in:
parent
f5d3acd474
commit
53be4a8634
@@ -1146,7 +1146,7 @@ class CacheConfig:
         if not self.enable_prefix_caching:
             return
 
-        if self.sliding_window is not None:
+        if self.sliding_window is not None and not envs.VLLM_USE_V1:
             raise NotImplementedError(
                 "Prefix caching is not supported with sliding window. "
                 "Run with --disable-sliding-window to use prefix caching.")
Loading…
x
Reference in New Issue
Block a user