mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2025-12-30 15:31:49 +08:00
[V1][Minor] Remove outdated comment (#12968)
Signed-off-by: Woosuk Kwon <woosuk.kwon@berkeley.edu>
This commit is contained in:
parent
86222a3dab
commit
870c37481e
@@ -205,8 +205,6 @@ class KVCacheManager:
|
||||
# Should not exceed the maximum number of blocks per request.
|
||||
# This is especially because the block table has the shape
|
||||
# [..., max_num_blocks_per_req].
|
||||
# TODO(woosuk): Check and reject requests if
|
||||
# num_prompt_tokens + max_tokens > max_model_len.
|
||||
self.max_num_blocks_per_req - len(req_blocks),
|
||||
)
|
||||
assert num_new_blocks > 0
|
||||
|
||||
Loading…
x
Reference in New Issue
Block a user