[CI] Add comment about the single cudagraph capture size that is used (#26252)

2026-03-16 13:47:18 +08:00 · 2025-10-06 04:35:37 +02:00 · 2025-10-06 04:35:37 +02:00 · d3c84297c3
commit d3c84297c3
parent f509a20846
1 changed files with 4 additions and 0 deletions
--- a/tests/conftest.py
+++ b/tests/conftest.py
@@ -740,6 +740,10 @@ class VllmRunner:
        )

        if not kwargs.get("compilation_config", None):
+            # Note(@tdoublep): This is set to 4 because some tests (e.g., hybrid
+            # model tests) may set max_num_seqs=4. If the smallest entry in
+            # cudagraph_capture_sizes exceeds max_num_seqs, *no* graphs are
+            # captured, which can trigger edge cases that we don't handle yet.
            kwargs["compilation_config"] = {"cudagraph_capture_sizes": [4]}

        with init_ctx: