mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2026-05-30 05:07:04 +08:00
[XPU]Fix flash_attn_varlen_func interface on xpu (#22350)
Signed-off-by: Kunshang Ji <kunshang.ji@intel.com>
This commit is contained in:
parent
1dc8a70b6d
commit
6b47ef24de
@@ -271,6 +271,7 @@ class ipex_ops:
         k_descale=None,
         v_descale=None,
         num_splits=0,
+        s_aux: Optional[torch.Tensor] = None,
     ):
         if cu_seqlens_k is None:
             # cu_seqlens_k is not used in ipex kernel.
Loading…
x
Reference in New Issue
Block a user