mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2025-12-17 21:25:58 +08:00
Signed-off-by: tjtanaa <tunjian.tan@embeddedllm.com>
This commit is contained in:
parent
a810b5b088
commit
7de18d541b
@ -98,17 +98,17 @@ class AiterMLAMetadataBuilder(MLACommonMetadataBuilder[AiterMLAMetadata]):
|
|||||||
paged_kv_last_page_len,
|
paged_kv_last_page_len,
|
||||||
)
|
)
|
||||||
|
|
||||||
def _build_decode(self, block_table: torch.Tensor,
|
def _build_decode(self, block_table_tensor: torch.Tensor,
|
||||||
seq_lens: torch.Tensor) -> AiterMLADecodeMetadata:
|
seq_lens: torch.Tensor) -> AiterMLADecodeMetadata:
|
||||||
|
|
||||||
(
|
(
|
||||||
paged_kv_indices,
|
paged_kv_indices,
|
||||||
paged_kv_indptr,
|
paged_kv_indptr,
|
||||||
paged_last_page_len,
|
paged_last_page_len,
|
||||||
) = self._get_paged_kv_tensors(block_table, seq_lens)
|
) = self._get_paged_kv_tensors(block_table_tensor, seq_lens)
|
||||||
|
|
||||||
attn_metadata = AiterMLADecodeMetadata(
|
attn_metadata = AiterMLADecodeMetadata(
|
||||||
block_table=block_table,
|
block_table=block_table_tensor,
|
||||||
seq_lens=seq_lens,
|
seq_lens=seq_lens,
|
||||||
paged_kv_indptr=paged_kv_indptr,
|
paged_kv_indptr=paged_kv_indptr,
|
||||||
paged_kv_indices=paged_kv_indices,
|
paged_kv_indices=paged_kv_indices,
|
||||||
|
|||||||
Loading…
x
Reference in New Issue
Block a user