[XPU][CI] add v1/core test in xpu hardware ci (#20537)
Signed-off-by: Ma, Liangliang <liangliang.ma@intel.com>
commit 2c5ebec064
parent 2e610deb72
@@ -27,4 +27,6 @@ docker run \
   "${image_name}" \
   sh -c '
     VLLM_USE_V1=1 python3 examples/offline_inference/basic/generate.py --model facebook/opt-125m --block-size 64 --enforce-eager
+    cd tests
+    pytest -v -s v1/core
   '
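The two added lines run the v1 core test suite inside the same container shell, right after the existing offline-inference smoke test. Below is a minimal sketch of reproducing that sequence outside the CI script; it assumes a local vLLM checkout (so the examples/ and tests/ directories exist) and an XPU-capable install. The model name, flags, and environment variable are copied from the hunk; everything else is illustrative.

# Sketch only: mirrors the two-step CI sequence from the hunk above
# (offline-inference smoke test, then the newly added v1/core pytest run).
# Assumes it is launched from the root of a vLLM checkout.
import os
import subprocess

env = dict(os.environ, VLLM_USE_V1="1")  # same env var the CI script sets

# Step 1: the existing smoke test (arguments copied from the diff).
subprocess.run(
    [
        "python3", "examples/offline_inference/basic/generate.py",
        "--model", "facebook/opt-125m",
        "--block-size", "64",
        "--enforce-eager",
    ],
    env=env,
    check=True,
)

# Step 2: the newly added v1 core tests, run from the tests/ directory,
# matching `cd tests` followed by `pytest -v -s v1/core` in the container.
subprocess.run(["pytest", "-v", "-s", "v1/core"], cwd="tests", env=env, check=True)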
@@ -47,7 +47,7 @@ FROM vllm-base AS vllm-openai
 
 # install additional dependencies for openai api server
 RUN --mount=type=cache,target=/root/.cache/pip \
-    pip install accelerate hf_transfer 'modelscope!=1.15.0'
+    pip install accelerate hf_transfer pytest 'modelscope!=1.15.0'
 
 ENV VLLM_USAGE_SOURCE production-docker-image \
     TRITON_XPU_PROFILE 1
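The only functional change here is adding pytest to the image's extra dependencies so the test run introduced above can execute inside the container. The snippet below is a purely illustrative sanity check, not part of the CI, that the listed packages resolve inside the built image; it assumes the importable module names match the pip package names.

# Sketch only: verify the packages installed by the RUN line above
# (including the newly added pytest) are importable in the image.
import importlib.util

for pkg in ("accelerate", "hf_transfer", "modelscope", "pytest"):
    if importlib.util.find_spec(pkg) is None:
        raise SystemExit(f"missing dependency in image: {pkg}")
print("all dependencies needed for the v1/core run are present")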
@@ -93,10 +93,6 @@ class XPUPlatform(Platform):
                 "mode.")
             model_config.enforce_eager = True
 
-        if vllm_config.speculative_config is not None:
-            raise NotImplementedError(
-                "XPU does not support speculative decoding")
-
         if vllm_config.device_config is not None:
             assert vllm_config.device_config.device_type == "xpu"
 
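The four removed lines drop the hard NotImplementedError that previously rejected any speculative_config on XPU, leaving the eager-mode fallback and the device-type assertion in place. Below is a simplified, self-contained sketch of the resulting control flow; the dataclasses and function signature are stand-ins reconstructed only from the context visible in this hunk (the real logic most likely lives in XPUPlatform.check_and_update_config and operates on vLLM's own config objects).

# Illustrative stand-in for the XPU platform check after this commit.
# Only the logic visible in the hunk is reproduced here.
from dataclasses import dataclass
from typing import Optional


@dataclass
class _ModelConfig:
    enforce_eager: bool = False


@dataclass
class _DeviceConfig:
    device_type: str = "xpu"


@dataclass
class _VllmConfig:
    model_config: _ModelConfig
    device_config: Optional[_DeviceConfig]
    speculative_config: Optional[object] = None


def check_and_update_config(vllm_config: _VllmConfig) -> None:
    # XPU falls back to eager mode (the truncated warning in the context
    # lines above ends in "mode.").
    vllm_config.model_config.enforce_eager = True

    # Before this commit, a non-None speculative_config raised
    # NotImplementedError here; that guard is removed by the hunk above.

    if vllm_config.device_config is not None:
        assert vllm_config.device_config.device_type == "xpu"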