mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2026-04-07 23:47:05 +08:00
fix
Signed-off-by: Woosuk Kwon <woosuk.kwon@berkeley.edu>
This commit is contained in:
parent
17c2c106b1
commit
42f99150c1
@@ -293,7 +293,7 @@ class GPUModelRunner:
|
||||
query_start_loc_gpu = query_start_loc.gpu[:num_reqs + 1]
|
||||
query_start_loc_cpu = query_start_loc.cpu[:num_reqs + 1]
|
||||
seq_lens_gpu = self.input_buffers.seq_lens.gpu[:num_reqs]
|
||||
- seq_lens_cpu = self.input_buffers.seq_lens.np[:num_reqs]
|
||||
+ seq_lens_cpu = self.input_buffers.seq_lens.cpu[:num_reqs]
|
||||
seq_lens_np = self.input_buffers.seq_lens.np[:num_reqs]
|
||||
|
||||
# Some input token ids are directly read from the last sampled tokens.
|
||||
|
||||
Loading…
x
Reference in New Issue
Block a user