[CI/Build] Skip Mllama HF runner tests with Transformers v4.55.0 (#22659)
Signed-off-by: Isotr0py <2037008807@qq.com>
parent 84cf78acee
commit c90fb03df5
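The change below guards four mllama HF-runner tests with a pytest.mark.skipif decorator so they are skipped when the installed Transformers build is exactly the affected 4.55.0 release. A minimal, self-contained sketch of that guard (the test name and body here are illustrative placeholders, not part of the commit):

    import pytest
    from transformers import __version__ as TRANSFORMERS_VERSION


    @pytest.mark.skipif(
        TRANSFORMERS_VERSION == "4.55.0",
        reason="Transformers v4.55.0 has a regression issue on mllama, "
        "see: https://github.com/huggingface/transformers/pull/40083")
    def test_guard_sketch():
        # Placeholder body; the real tests drive the mllama HF runner checks.
        assert True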
@@ -6,6 +6,7 @@ from typing import Optional, overload
 import pytest
 import torch
 from transformers import AutoConfig, AutoModelForImageTextToText, AutoTokenizer
+from transformers import __version__ as TRANSFORMERS_VERSION

 from vllm import LLM, SamplingParams
 from vllm.attention.backends.flash_attn import FlashAttentionMetadata
@@ -285,6 +286,10 @@ def clear_cache():
 @pytest.mark.parametrize("max_tokens", [128])
 @pytest.mark.parametrize("num_logprobs", [5])
 @pytest.mark.parametrize("attn_backend", LIST_ENC_DEC_SUPPORTED_BACKENDS)
+@pytest.mark.skipif(
+    TRANSFORMERS_VERSION == "4.55.0",
+    reason="Transformers v4.55.0 has a regression issue on mllama, "
+    "see: https://github.com/huggingface/transformers/pull/40083")
 def test_models_single_leading_image(hf_runner, vllm_runner, image_assets,
                                      model, sizes, dtype, max_tokens,
                                      num_logprobs,
@@ -313,6 +318,10 @@ def test_models_single_leading_image(hf_runner, vllm_runner, image_assets,
 @pytest.mark.parametrize("max_tokens", [128])
 @pytest.mark.parametrize("num_logprobs", [5])
 @pytest.mark.parametrize("attn_backend", LIST_ENC_DEC_SUPPORTED_BACKENDS)
+@pytest.mark.skipif(
+    TRANSFORMERS_VERSION == "4.55.0",
+    reason="Transformers v4.55.0 has a regression issue on mllama, "
+    "see: https://github.com/huggingface/transformers/pull/40083")
 def test_models_multi_leading_images(hf_runner, vllm_runner, image_assets,
                                      model, dtype, max_tokens, num_logprobs,
                                      attn_backend: _Backend) -> None:
@@ -362,6 +371,10 @@ def test_models_multi_leading_images(hf_runner, vllm_runner, image_assets,
 @pytest.mark.parametrize("max_tokens", [128])
 @pytest.mark.parametrize("num_logprobs", [5])
 @pytest.mark.parametrize("attn_backend", LIST_ENC_DEC_SUPPORTED_BACKENDS)
+@pytest.mark.skipif(
+    TRANSFORMERS_VERSION == "4.55.0",
+    reason="Transformers v4.55.0 has a regression issue on mllama, "
+    "see: https://github.com/huggingface/transformers/pull/40083")
 def test_models_interleaved_images(hf_runner, vllm_runner, image_assets, model,
                                    dtype, max_tokens, num_logprobs,
                                    attn_backend: _Backend) -> None:
@@ -402,6 +415,10 @@ def test_models_interleaved_images(hf_runner, vllm_runner, image_assets, model,
 @pytest.mark.parametrize("dtype", ["bfloat16"])
 @pytest.mark.parametrize("max_tokens", [64])
 @pytest.mark.parametrize("num_logprobs", [5])
+@pytest.mark.skipif(
+    TRANSFORMERS_VERSION == "4.55.0",
+    reason="Transformers v4.55.0 has a regression issue on mllama, "
+    "see: https://github.com/huggingface/transformers/pull/40083")
 def test_models_distributed(
     hf_runner,
     vllm_runner,
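Note that the added guard compares the version string for exact equality, so only 4.55.0 itself is skipped and every other installed Transformers release still runs these tests. If a regression ever spanned several releases, a range check would be needed instead; a hypothetical variant (not what this commit does) using packaging's version parser could look like:

    import pytest
    from packaging.version import Version
    from transformers import __version__ as TRANSFORMERS_VERSION

    # Assumed bounds for illustration only.
    BROKEN_SINCE = Version("4.55.0")
    FIXED_IN = Version("4.55.1")


    @pytest.mark.skipif(
        BROKEN_SINCE <= Version(TRANSFORMERS_VERSION) < FIXED_IN,
        reason="Installed Transformers release regresses mllama, "
        "see: https://github.com/huggingface/transformers/pull/40083")
    def test_range_guard_sketch():
        # Placeholder body for the range-based skip pattern.
        assert True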