diff --git a/.buildkite/test-pipeline.yaml b/.buildkite/test-pipeline.yaml index 23830c4e0781..10d1c33f816b 100644 --- a/.buildkite/test-pipeline.yaml +++ b/.buildkite/test-pipeline.yaml @@ -460,6 +460,7 @@ steps: - tests/compile commands: - pytest -v -s compile/test_basic_correctness.py + - pytest -v -s compile/test_multimodal_compile.py - pytest -v -s compile/piecewise/ - label: PyTorch Fullgraph Test # 22min diff --git a/tests/compile/test_multimodal_compile.py b/tests/compile/test_multimodal_compile.py index 6c195dd93f42..2727821162ec 100644 --- a/tests/compile/test_multimodal_compile.py +++ b/tests/compile/test_multimodal_compile.py @@ -4,10 +4,12 @@ import pytest from vllm.compilation.counter import compilation_counter from vllm.config.compilation import CompilationMode +from vllm.platforms import current_platform # forked needed to workaround https://github.com/vllm-project/vllm/issues/21073 @pytest.mark.forked +@pytest.mark.skipif(not current_platform.is_cuda(), reason="Skip if not cuda") def test_qwen2_5_vl_compilation(vllm_runner, monkeypatch): """Test that Qwen2.5-VL vision submodules are compiled.