diff --git a/vllm/entrypoints/llm.py b/vllm/entrypoints/llm.py index 9c3d3bb454c5..c9ab68525503 100644 --- a/vllm/entrypoints/llm.py +++ b/vllm/entrypoints/llm.py @@ -155,4 +155,8 @@ class LLM: pbar.update(1) if use_tqdm: pbar.close() + # Sort the outputs by request ID. + # This is necessary because some requests may be finished earlier than + # its previous requests. + outputs = sorted(outputs, key=lambda x: int(x.request_id)) return outputs