Change size of single CUDA graph for CI to 4 (#26089)

Signed-off-by: Thomas Parnell <tpa@zurich.ibm.com>
Signed-off-by: yewentao256 <zhyanwentao@126.com>
This commit is contained in:
Thomas Parnell 2025-10-02 16:14:28 +02:00 committed by yewentao256
parent 5a083ce2ea
commit 83fa298682

View File

@@ -732,7 +732,7 @@ class VllmRunner:
set_default_torch_num_threads(default_torch_num_threads))
if not kwargs.get("compilation_config", None):
-kwargs["compilation_config"] = {"cudagraph_capture_sizes": [8]}
+kwargs["compilation_config"] = {"cudagraph_capture_sizes": [4]}
with init_ctx:
self.llm = LLM(