Update vllm/attention/backends/mla/utils.py

Co-authored-by: Michael Goin <mgoin64@gmail.com>
This commit is contained in:
Lucas Wilkinson 2025-01-29 22:51:37 -05:00 committed by GitHub
parent 4880a43d20
commit aa19f297d2
No known key found for this signature in database
GPG Key ID: B5690EEEBB952194

View File

@@ -161,7 +161,7 @@ class MLAImplCommon(AttentionImpl):
def _v_up_proj_and_o_proj(self, x):
if envs.VLLM_MLA_PERFORM_MATRIX_ABSORPTION:
-return self.o_proj_absored(
+return self.o_proj_absorbed(
x.reshape(-1, self.num_heads * self.kv_lora_rank))[0]
else:
x = torch.einsum("bnl,lnv->bnv", x, self.W_UV)