mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2026-05-24 00:31:19 +08:00
[Bugfix][ROCm] Fix AITER MLA V1 (#17880)
Signed-off-by: vllmellm <vllm.ellm@embeddedllm.com>
This commit is contained in:
parent
ff8c400502
commit
217db4baa6
@ -95,8 +95,7 @@ class AiterMLAMetadataBuilder(MLACommonMetadataBuilder[AiterMLAMetadata]):
|
|||||||
paged_kv_last_page_len,
|
paged_kv_last_page_len,
|
||||||
)
|
)
|
||||||
|
|
||||||
def _build_decode(self, input_positions: torch.Tensor,
|
def _build_decode(self, block_table: torch.Tensor,
|
||||||
block_table: torch.Tensor,
|
|
||||||
seq_lens: torch.Tensor) -> AiterMLADecodeMetadata:
|
seq_lens: torch.Tensor) -> AiterMLADecodeMetadata:
|
||||||
|
|
||||||
(
|
(
|
||||||
@ -106,7 +105,6 @@ class AiterMLAMetadataBuilder(MLACommonMetadataBuilder[AiterMLAMetadata]):
|
|||||||
) = self._get_paged_kv_tensors(block_table, seq_lens)
|
) = self._get_paged_kv_tensors(block_table, seq_lens)
|
||||||
|
|
||||||
attn_metadata = AiterMLADecodeMetadata(
|
attn_metadata = AiterMLADecodeMetadata(
|
||||||
input_positions=input_positions,
|
|
||||||
block_table=block_table,
|
block_table=block_table,
|
||||||
seq_lens=seq_lens,
|
seq_lens=seq_lens,
|
||||||
paged_kv_indptr=paged_kv_indptr,
|
paged_kv_indptr=paged_kv_indptr,
|
||||||
|
|||||||
Loading…
x
Reference in New Issue
Block a user