[XPU] fix xpu to set cudagraph batch sizes (#23044)

Signed-off-by: calvin chen <wen.chen@dynamia.ai>
2025-12-15 01:05:28 +08:00 · 2025-08-18 05:45:42 +08:00 · 2025-08-18 05:45:42 +08:00 · 21e39436c8
commit 21e39436c8
parent 6d243efeda
1 changed file with 4 additions and 2 deletions
--- a/vllm/v1/worker/gpu_model_runner.py
+++ b/vllm/v1/worker/gpu_model_runner.py
@@ -232,8 +232,10 @@ class GPUModelRunner(LoRAModelRunnerMixin, KVConnectorModelRunnerMixin):
        # The convention is different.
        # self.cudagraph_batch_sizes sorts in ascending order.
        # The batch sizes in the config are in descending order.
-        self.cudagraph_batch_sizes = list(
-            reversed(self.compilation_config.cudagraph_capture_sizes))
+        if self.compilation_config.cudagraph_capture_sizes and \
+                self.compilation_config.cudagraph_mode != CUDAGraphMode.NONE:
+            self.cudagraph_batch_sizes = list(
+                reversed(self.compilation_config.cudagraph_capture_sizes))
        # Cache the device properties.
        self._init_device_properties()