[BugFix] Fix AssertionError: DCP not support reorder_batch_threshold > 1 now. (#28751)

Signed-off-by: Lucas Wilkinson <lwilkins@redhat.com>
This commit is contained in:
Lucas Wilkinson 2025-11-15 17:35:06 -05:00 committed by GitHub
parent 2bb4435cb7
commit be263f7645
No known key found for this signature in database
GPG Key ID: B5690EEEBB952194

View File

@ -630,16 +630,6 @@ class GPUModelRunner(
return
if self.reorder_batch_threshold is not None:
# NOTE(lucas): currently no backend supports the custom masking
# required for DCP with q_len > 1, so we assert here. Remove this
# assert once the custom mask is support is added to FA3.
if (
self.dcp_world_size > 1
and envs.VLLM_ATTENTION_BACKEND != "FLASH_ATTN_MLA"
):
assert self.reorder_batch_threshold == 1, (
"DCP not support reorder_batch_threshold > 1 now."
)
reorder_batch_to_split_decodes_and_prefills(
self.input_batch,
scheduler_output,