mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2026-04-07 18:27:04 +08:00
minor change
Signed-off-by: Sage Moore <sage@neuralmagic.com>
This commit is contained in:
parent
90330563c6
commit
376e7eb838
@@ -266,7 +266,7 @@ class FlashAttentionMetadataBuilder(
|
||||
use_cascade = common_prefix_len > 0
|
||||
|
||||
if use_cascade:
|
||||
cu_prefix_query_lens = torch.tensor([0,num_actual_tokens],
|
||||
cu_prefix_query_lens = torch.tensor([0, num_actual_tokens],
|
||||
dtype=torch.int32,
|
||||
device=self.runner.device)
|
||||
prefix_kv_lens = torch.tensor([common_prefix_len],
|
||||
|
||||
Loading…
x
Reference in New Issue
Block a user