diff --git a/vllm/_custom_ops.py b/vllm/_custom_ops.py index b5b0115f4cf3b..415345cdc7b6b 100644 --- a/vllm/_custom_ops.py +++ b/vllm/_custom_ops.py @@ -256,8 +256,8 @@ def copy_subranges( tgt_matrix: torch.Tensor, num_subranges: int, ) -> None: - torch.ops._C.copy_subranges(src_matrix, diff_matrix, tgt_matrix, - num_subranges) + torch.ops._C.copy_subranges.default(src_matrix, diff_matrix, tgt_matrix, + num_subranges) # fused quant layer norm ops