diff --git a/requirements/common.txt b/requirements/common.txt index 6bc71df24f0e6..3c3ac0abf50f3 100644 --- a/requirements/common.txt +++ b/requirements/common.txt @@ -7,7 +7,7 @@ requests >= 2.26.0 tqdm blake3 py-cpuinfo -transformers >= 4.55.0 +transformers >= 4.55.2 tokenizers >= 0.21.1 # Required for fast incremental detokenization. protobuf # Required by LlamaTokenizer. fastapi[standard] >= 0.115.0 # Required by FastAPI's form models in the OpenAI API server's audio transcriptions endpoint. diff --git a/requirements/test.in b/requirements/test.in index 6652bfdfe66c9..7f141fe281d62 100644 --- a/requirements/test.in +++ b/requirements/test.in @@ -34,7 +34,7 @@ opencv-python-headless >= 4.11.0 # required for video test datamodel_code_generator # required for minicpm3 test lm-eval[api]==0.4.8 # required for model evaluation test mteb[bm25s]>=1.38.11, <2 # required for mteb test -transformers==4.55.0 +transformers==4.55.2 tokenizers==0.21.1 schemathesis>=3.39.15 # Required for openai schema test. # quantization diff --git a/requirements/test.txt b/requirements/test.txt index ff9886a315976..48eb09811bcc6 100644 --- a/requirements/test.txt +++ b/requirements/test.txt @@ -1139,7 +1139,7 @@ tqdm==4.66.6 # transformers tqdm-multiprocess==0.0.11 # via lm-eval -transformers==4.55.0 +transformers==4.55.2 # via # -r requirements/test.in # genai-perf diff --git a/tests/models/multimodal/generation/test_mllama.py b/tests/models/multimodal/generation/test_mllama.py index b413c4d6b3667..1c32cc6d71c04 100644 --- a/tests/models/multimodal/generation/test_mllama.py +++ b/tests/models/multimodal/generation/test_mllama.py @@ -5,6 +5,7 @@ from typing import Optional, overload import pytest import torch +from packaging.version import Version from transformers import AutoConfig, AutoModelForImageTextToText, AutoTokenizer from transformers import __version__ as TRANSFORMERS_VERSION @@ -287,8 +288,8 @@ def clear_cache(): @pytest.mark.parametrize("num_logprobs", [5]) @pytest.mark.parametrize("attn_backend", LIST_ENC_DEC_SUPPORTED_BACKENDS) @pytest.mark.skipif( - TRANSFORMERS_VERSION == "4.55.0", - reason="Transformers v4.55.0 has a regression issue on mllama, " + Version(TRANSFORMERS_VERSION) <= Version("4.55.2"), + reason="Transformers v4.55 has a regression issue on mllama, " "see: https://github.com/huggingface/transformers/pull/40083") def test_models_single_leading_image(hf_runner, vllm_runner, image_assets, model, sizes, dtype, max_tokens, @@ -319,8 +320,8 @@ def test_models_single_leading_image(hf_runner, vllm_runner, image_assets, @pytest.mark.parametrize("num_logprobs", [5]) @pytest.mark.parametrize("attn_backend", LIST_ENC_DEC_SUPPORTED_BACKENDS) @pytest.mark.skipif( - TRANSFORMERS_VERSION == "4.55.0", - reason="Transformers v4.55.0 has a regression issue on mllama, " + Version(TRANSFORMERS_VERSION) <= Version("4.55.2"), + reason="Transformers v4.55 has a regression issue on mllama, " "see: https://github.com/huggingface/transformers/pull/40083") def test_models_multi_leading_images(hf_runner, vllm_runner, image_assets, model, dtype, max_tokens, num_logprobs, @@ -372,8 +373,8 @@ def test_models_multi_leading_images(hf_runner, vllm_runner, image_assets, @pytest.mark.parametrize("num_logprobs", [5]) @pytest.mark.parametrize("attn_backend", LIST_ENC_DEC_SUPPORTED_BACKENDS) @pytest.mark.skipif( - TRANSFORMERS_VERSION == "4.55.0", - reason="Transformers v4.55.0 has a regression issue on mllama, " + Version(TRANSFORMERS_VERSION) <= Version("4.55.2"), + reason="Transformers v4.55 has a regression issue on mllama, " "see: https://github.com/huggingface/transformers/pull/40083") def test_models_interleaved_images(hf_runner, vllm_runner, image_assets, model, dtype, max_tokens, num_logprobs, @@ -416,8 +417,8 @@ def test_models_interleaved_images(hf_runner, vllm_runner, image_assets, model, @pytest.mark.parametrize("max_tokens", [64]) @pytest.mark.parametrize("num_logprobs", [5]) @pytest.mark.skipif( - TRANSFORMERS_VERSION == "4.55.0", - reason="Transformers v4.55.0 has a regression issue on mllama, " + Version(TRANSFORMERS_VERSION) <= Version("4.55.2"), + reason="Transformers v4.55 has a regression issue on mllama, " "see: https://github.com/huggingface/transformers/pull/40083") def test_models_distributed( hf_runner,