[CI/Build] Enable phi2 lora test (#20540)

Signed-off-by: Jee Jee Li <pandaleefree@gmail.com>
Jee Jee Li 2025-07-07 13:10:41 +08:00 committed by GitHub
parent 6e2c19ce22
commit 2e610deb72


@@ -1,8 +1,6 @@
 # SPDX-License-Identifier: Apache-2.0
 # SPDX-FileCopyrightText: Copyright contributors to the vLLM project
-import pytest
 import vllm
 from vllm.lora.request import LoRARequest
@@ -49,9 +47,6 @@ def do_sample(llm: vllm.LLM, lora_path: str, lora_id: int) -> list[str]:
     return generated_texts


-# Skipping for V1 for now as we are hitting,
-# "Head size 80 is not supported by FlashAttention." error.
-@pytest.mark.skip(reason="Head size 80 is not supported by FlashAttention")
 def test_phi2_lora(phi2_lora_files):
     # We enable enforce_eager=True here to reduce VRAM usage for lora-test CI,
     # Otherwise, the lora-test will fail due to CUDA OOM.
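For context, the pattern the re-enabled test exercises is a phi-2 base model served through vLLM with a LoRA adapter attached per request, using enforce_eager=True to keep VRAM usage low enough for the LoRA CI job. The sketch below is illustrative only: the base model id, prompt, and sampling values are assumptions, and it is not the exact body of the vLLM test file, but it shows the enable_lora / LoRARequest / enforce_eager combination the commit comment refers to.

    # Minimal sketch, assuming microsoft/phi-2 as the base model and an
    # already-downloaded LoRA adapter directory; not the actual vLLM test body.
    import vllm
    from vllm import SamplingParams
    from vllm.lora.request import LoRARequest


    def run_phi2_lora(lora_path: str) -> list[str]:
        # enforce_eager=True skips CUDA graph capture, trading some speed for
        # lower VRAM usage so the LoRA CI job does not hit CUDA OOM.
        llm = vllm.LLM(
            model="microsoft/phi-2",  # assumed base model for a phi-2 LoRA test
            enable_lora=True,
            max_loras=2,
            enforce_eager=True,
        )
        prompts = ["Write a short greeting."]  # illustrative prompt
        sampling_params = SamplingParams(temperature=0, max_tokens=32)
        outputs = llm.generate(
            prompts,
            sampling_params,
            # The LoRA adapter is selected per request; the integer id (here 1)
            # must be a positive, stable identifier for this adapter.
            lora_request=LoRARequest("phi2-adapter", 1, lora_path),
        )
        return [o.outputs[0].text for o in outputs]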