diff --git a/vllm/lora/ops/triton_ops/lora_kernel_metadata.py b/vllm/lora/ops/triton_ops/lora_kernel_metadata.py index 1dcdfc814a891..055e78f406f3e 100644 --- a/vllm/lora/ops/triton_ops/lora_kernel_metadata.py +++ b/vllm/lora/ops/triton_ops/lora_kernel_metadata.py @@ -111,7 +111,7 @@ class LoRAKernelMeta: # active_lora_ids, num_tokens_per_lora lora_ids, num_tokens_per_lora = torch.unique(token_lora_mapping, - sorted=False, + sorted=True, return_counts=True) self.active_lora_ids[:lora_ids.size(0)].copy_(lora_ids, non_blocking=True)