[BugFix] Fix false assertion with spec-decode=[2,4,..] and TP>2 (#29036)

Signed-off-by: Lucas Wilkinson <lwilkins@redhat.com>
This commit is contained in:
Lucas Wilkinson 2025-11-19 16:43:54 -05:00 committed by GitHub
parent 22e44ad589
commit 8f4f77a727
No known key found for this signature in database
GPG Key ID: B5690EEEBB952194

View File

@@ -921,7 +921,7 @@ class CompilationConfig:
self, uniform_decode_query_len: int, tensor_parallel_size: int
):
multiple_of = uniform_decode_query_len
- if tensor_parallel_size > 1:
+ if tensor_parallel_size > 1 and self.pass_config.enable_sequence_parallelism:
multiple_of = max(uniform_decode_query_len, tensor_parallel_size)
if (
multiple_of % uniform_decode_query_len != 0