diff --git a/vllm/_ipex_ops.py b/vllm/_ipex_ops.py index 7533bf5ef7e60..79e3e448cada3 100644 --- a/vllm/_ipex_ops.py +++ b/vllm/_ipex_ops.py @@ -271,6 +271,7 @@ class ipex_ops: k_descale=None, v_descale=None, num_splits=0, + s_aux: Optional[torch.Tensor] = None, ): if cu_seqlens_k is None: # cu_seqlens_k is not used in ipex kernel.