[Bugfix] Incorrect MM data format in vllm bench throughput (#26395)

Signed-off-by: DarkLight1337 <tlleungac@connect.ust.hk>
2026-07-03 03:07:09 +08:00 · 2025-10-08 13:52:19 +08:00 · 2025-10-08 13:52:19 +08:00 · 0d4f48fa10
commit 0d4f48fa10
parent 127c8b782a
1 changed files with 8 additions and 8 deletions
--- a/vllm/benchmarks/throughput.py
+++ b/vllm/benchmarks/throughput.py
@@ -201,16 +201,16 @@ async def run_vllm_async(
        sampling_params: list[SamplingParams] = []
        lora_requests: list[Optional[LoRARequest]] = []
        for request in requests:
-            prompts.append(
+            prompt = (
-                TokensPrompt(
+                TokensPrompt(prompt_token_ids=request.prompt["prompt_token_ids"])
-                    prompt_token_ids=request.prompt["prompt_token_ids"],
-                    multi_modal_data=request.multi_modal_data,
-                )
                if "prompt_token_ids" in request.prompt
-                else TextPrompt(
+                else TextPrompt(prompt=request.prompt)
-                    prompt=request.prompt, multi_modal_data=request.multi_modal_data
-                )
            )
+            if request.multi_modal_data:
+                assert isinstance(request.multi_modal_data, dict)
+                prompt["multi_modal_data"] = request.multi_modal_data
            sampling_params.append(
                SamplingParams(
                    n=n,