mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2026-04-17 19:17:03 +08:00
Signed-off-by: Xiake Sun <xiake.sun@amd.com>
This commit is contained in:
parent
d64429bb36
commit
60e089f0b9
@@ -729,7 +729,7 @@ class AiterFlashAttentionImpl(AttentionImpl):
|
||||
cu_seqlens_k=attn_metadata.prefill_metadata.query_start_loc,
|
||||
max_seqlen_q=attn_metadata.prefill_metadata.max_query_len,
|
||||
max_seqlen_k=attn_metadata.prefill_metadata.max_seq_len,
|
||||
-min_seqlen_q=attn_metadata.prefill_metadata.min_query_len,
|
||||
+min_seqlen_q=1,
|
||||
dropout_p=0.0,
|
||||
softmax_scale=self.scale,
|
||||
causal=True,
|
||||
@@ -759,7 +759,7 @@ class AiterFlashAttentionImpl(AttentionImpl):
|
||||
cu_seqlens_q=attn_metadata.extend_metadata.query_start_loc,
|
||||
max_seqlen_q=attn_metadata.extend_metadata.max_query_len,
|
||||
max_seqlen_k=attn_metadata.extend_metadata.max_seq_len,
|
||||
-min_seqlen_q=attn_metadata.extend_metadata.min_query_len,
|
||||
+min_seqlen_q=1,
|
||||
block_table=attn_metadata.block_table[
|
||||
num_decodes : num_decodes + num_extends
|
||||
],
|
||||
|
||||
Loading…
x
Reference in New Issue
Block a user