[Bugfix] Fix default MM LoRA alignment for single str prompts (#29140)
Signed-off-by: Alex-Brooks <Alex.Brooks@ibm.com>
This commit is contained in:
parent 30b9c67743
commit b4734b9550
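
Background on the fix: in Python a plain str is itself a collections.abc.Sequence, so the old check in the LLM class below let a single string prompt through unwrapped, and downstream code that pairs each prompt with its resolved default multimodal LoRA request then walked the string character by character. A minimal standalone sketch of the pitfall (hypothetical prompt value, not vLLM code):

from collections.abc import Sequence

prompt = "describe the audio"
print(isinstance(prompt, Sequence))  # True -- a str is a Sequence of chars

# Old check: the bare string slips through unwrapped
prompts = prompt
if not isinstance(prompts, Sequence):
    prompts = [prompts]
print(len(prompts))  # 18 -- downstream sees one "prompt" per character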
@@ -5,7 +5,9 @@ Tests for applying default registered multimodal loras.
 """
 
 import os
+import unittest.mock as mock
 
 import pytest
+from huggingface_hub import snapshot_download
 
 from vllm.lora.request import LoRARequest
@@ -114,3 +116,36 @@ def test_default_mm_lora_fails_with_overridden_lora_request(
         default_mm_loras={"audio": IMAGE_LORA_PATH},
         expected_suffix=RESPONSE_SUFFIX_WITH_LORA,
     )
+
+
+def test_default_mm_lora_does_not_expand_string_reqs(vllm_runner):
+    class MockEngineException(Exception):
+        pass
+
+    # Regression test for ensuring default multimodal lora resolution
+    # does not expand the lora req if the prompt type is a string.
+    vllm_runner_kwargs = {
+        **VLLM_RUNNER_BASE_KWARGS,
+        **{"default_mm_loras": {"audio": AUDIO_LORA_PATH}},
+    }
+
+    # Avoid the full generation call since these tests are expensive;
+    # just check what lora request is actually submitted to the engine
+    mock_err = "Engine is mocked for this test"
+
+    with (
+        mock.patch(
+            "vllm.v1.engine.llm_engine.LLMEngine.add_request",
+            side_effect=MockEngineException(mock_err),
+        ) as mock_add_request,
+        vllm_runner(**vllm_runner_kwargs) as vllm_model,
+    ):
+        # Die once we actually submit the request to the engine
+        with pytest.raises(MockEngineException):
+            vllm_model.llm.generate(prompts=AUDIO_PROMPT)
+
+        # Then check to make sure the submitted lora request
+        # and text prompt were zipped together correctly
+        engine_args, engine_kwargs = mock_add_request.call_args
+        assert engine_kwargs["lora_request"] is None
+        assert engine_kwargs["prompt_text"] == AUDIO_PROMPT
@@ -466,7 +466,7 @@ class LLM:
         ):
             return lora_request
 
-        if not isinstance(prompts, Sequence):
+        if not isinstance(prompts, Sequence) or isinstance(prompts, str):
             prompts = [prompts]
 
         optional_loras = (
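
The patched branch in isolation (a sketch under the same assumptions, not vLLM internals): the extra isinstance(prompts, str) test wraps a bare string into a one-element list, so the later per-prompt LoRA alignment sees exactly one prompt.

from collections.abc import Sequence

prompts = "describe the audio"
# Fixed check: wrap a bare str into a one-element list before zipping
# prompts against their resolved LoRA requests
if not isinstance(prompts, Sequence) or isinstance(prompts, str):
    prompts = [prompts]
assert prompts == ["describe the audio"]  # one prompt, one LoRA request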