diff --git a/vllm/v1/core/single_type_kv_cache_manager.py b/vllm/v1/core/single_type_kv_cache_manager.py index 38da13a83f3ac..8444ee5ef425f 100644 --- a/vllm/v1/core/single_type_kv_cache_manager.py +++ b/vllm/v1/core/single_type_kv_cache_manager.py @@ -318,7 +318,7 @@ class FullAttentionManager(SingleTypeKVCacheManager): ) -> tuple[list[KVCacheBlock], ...]: assert isinstance( kv_cache_spec, - FullAttentionSpec | ChunkedLocalAttentionSpec | FullDiffkvAttentionSpec + FullAttentionSpec | ChunkedLocalAttentionSpec | FullDiffkvAttentionSpec, ), ( "FullAttentionManager can only be used for full attention " "and chunked local attention groups"