diff --git a/vllm/v1/core/kv_cache_coordinator.py b/vllm/v1/core/kv_cache_coordinator.py index 0cce2ec81e08a..258805843e227 100644 --- a/vllm/v1/core/kv_cache_coordinator.py +++ b/vllm/v1/core/kv_cache_coordinator.py @@ -130,10 +130,10 @@ class KVCacheCoordinator(ABC): Args: request_id: The request ID. - block_hashes: The block hashes of the request. + num_running_requests: The number of requests in the RUNNING state. Returns: - The number of common prefix blocks. + list[int]: The number of common prefix blocks. """ num_blocks_per_group = [ manager.get_num_common_prefix_blocks(request_id, diff --git a/vllm/v1/core/single_type_kv_cache_manager.py b/vllm/v1/core/single_type_kv_cache_manager.py index e8a44c7773a71..714f49494c9a1 100644 --- a/vllm/v1/core/single_type_kv_cache_manager.py +++ b/vllm/v1/core/single_type_kv_cache_manager.py @@ -181,7 +181,7 @@ class SingleTypeKVCacheManager(ABC): Args: request_id: The request ID. - block_hashes: The block hashes of the request. + num_running_requests: The number of requests in the RUNNING state. Returns: The number of common prefix blocks.