mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2026-03-20 14:50:20 +08:00
[Misc] Remove redundant comment (#16703)
Signed-off-by: Jade Zheng <zheng.shoujian@outlook.com>
This commit is contained in:
parent
93e561ec4d
commit
8a7368e069
@@ -540,9 +540,6 @@ class GPUModelRunner(LoRAModelRunnerMixin):
|
||||
# because M (max_model_len) is not necessarily divisible by block_size.
|
||||
block_table_indices = (req_indices * self.max_num_blocks_per_req +
|
||||
positions_np // self.block_size)
|
||||
# NOTE(woosuk): We use torch.index_select instead of np.take here
|
||||
# because torch.index_select is much faster than np.take for large
|
||||
# tensors.
|
||||
block_table_cpu = self.input_batch.block_table.get_cpu_tensor()
|
||||
block_numbers = block_table_cpu.flatten()[block_table_indices].numpy()
|
||||
block_offsets = positions_np % self.block_size
|
||||
|
||||
Loading…
x
Reference in New Issue
Block a user