diff --git a/tests/lora/test_llama_tp.py b/tests/lora/test_llama_tp.py index 91afa42faf95..9068d3c0e536 100644 --- a/tests/lora/test_llama_tp.py +++ b/tests/lora/test_llama_tp.py @@ -4,6 +4,8 @@ import subprocess import sys from typing import Union +import pytest + import vllm from vllm import LLM from vllm.lora.request import LoRARequest @@ -149,6 +151,8 @@ def test_llama_lora_tp4_fully_sharded_loras(sql_lora_files): generate_and_test(llm, sql_lora_files) +@pytest.mark.skip(reason=("Skipping this test as tensorizer is not " + "working with LoRA as of #19619")) @multi_gpu_test(num_gpus=2) @create_new_process_for_each_test() def test_tp2_serialize_and_deserialize_lora(tmp_path, sql_lora_files,