[CI/Build] Fix LoRA OOM (#16624)

Signed-off-by: Jee Jee Li <pandaleefree@gmail.com>
2026-06-01 11:27:04 +08:00 · 2025-04-15 16:38:19 +08:00 · 2025-04-15 16:38:19 +08:00 · 1575c1701a
commit 1575c1701a
parent 6ae996a873
1 changed files with 13 additions and 4 deletions
--- a/tests/lora/test_minicpmv_tp.py
+++ b/tests/lora/test_minicpmv_tp.py
@ -66,8 +66,12 @@ def test_minicpmv_lora(minicpmv_lora_files):
        max_loras=2,
        max_lora_rank=8,
        enforce_eager=True,
        max_model_len=2048,
        limit_mm_per_prompt={
            "image": 2,
            "video": 0
        },
        trust_remote_code=True,
        enable_chunked_prefill=True,
    )
    output1 = do_sample(llm, minicpmv_lora_files, lora_id=1)
    for i in range(len(EXPECTED_OUTPUT)):
@ -91,9 +95,11 @@ def test_minicpmv_tp4_wo_fully_sharded_loras(minicpmv_lora_files):
        max_loras=4,
        max_lora_rank=64,
        tensor_parallel_size=4,
        limit_mm_per_prompt={
            "image": 2,
            "video": 0
        },
        trust_remote_code=True,
        enforce_eager=True,
        enable_chunked_prefill=True,
    )
    output_tp = do_sample(llm, minicpmv_lora_files, lora_id=1)
    for i in range(len(EXPECTED_OUTPUT)):
@ -115,8 +121,11 @@ def test_minicpmv_tp4_fully_sharded_loras(minicpmv_lora_files):
        max_lora_rank=8,
        tensor_parallel_size=4,
        trust_remote_code=True,
        limit_mm_per_prompt={
            "image": 1,
            "video": 0
        },
        fully_sharded_loras=True,
        enable_chunked_prefill=True,
    )
    output_tp = do_sample(llm, minicpmv_lora_files, lora_id=1)
    for i in range(len(EXPECTED_OUTPUT)):