[Quantization] Skip Fp4 Test for compressed-tensors (#19217)

This commit is contained in:
Dipika Sikka 2025-06-05 14:21:53 -04:00 committed by GitHub
parent 9ef9173cfa
commit aa49f14832
No known key found for this signature in database
GPG Key ID: B5690EEEBB952194

View File

@@ -651,6 +651,7 @@ def test_compressed_tensors_2of4_sparse_compressed(vllm_runner, args_2of4):
assert output
@pytest.mark.skip(reason="Skip until the model config is updated")
def test_compressed_tensors_nvfp4a16(vllm_runner):
# run weight only example
model = "nm-testing/TinyLlama-1.1B-Chat-v1.0-FP4"