From 5cdd66450910589c8e1a3d25e80711b0b6e51eb1 Mon Sep 17 00:00:00 2001
From: Lucas Wilkinson
Date: Tue, 2 Dec 2025 19:56:54 -0500
Subject: [PATCH] [BugFix] Fix assert in `build_for_cudagraph_capture` (#29893)

Signed-off-by: Lucas Wilkinson
---
 vllm/v1/worker/gpu_model_runner.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/vllm/v1/worker/gpu_model_runner.py b/vllm/v1/worker/gpu_model_runner.py
index ee28f477a26ad..8c22ada029b1a 100644
--- a/vllm/v1/worker/gpu_model_runner.py
+++ b/vllm/v1/worker/gpu_model_runner.py
@@ -4000,7 +4000,7 @@ class GPUModelRunner(
 num_reqs=num_reqs_padded,
 max_query_len=max_query_len,
 ubatch_slices=ubatch_slices,
- for_cudagraph_capture=True,
+ for_cudagraph_capture=is_graph_capturing,
 )

 with self.maybe_dummy_run_with_lora(