mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2026-03-31 00:37:07 +08:00
fix TP
This commit is contained in:
parent
984ffddda6
commit
0a02744dc8
@ -1975,7 +1975,8 @@ class CUDAGraphRunner(nn.Module):
|
||||
|
||||
# Copy the input tensors to the input buffers.
|
||||
self.input_buffers["input_ids"].copy_(input_ids, non_blocking=True)
|
||||
self.input_buffers["positions"].copy_(positions, non_blocking=True)
|
||||
if positions is not None:
|
||||
self.input_buffers["positions"].copy_(positions, non_blocking=True)
|
||||
|
||||
if self.backend_name != "NO_ATTENTION":
|
||||
self.input_buffers["slot_mapping"].copy_(
|
||||
|
||||
Loading…
x
Reference in New Issue
Block a user