mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2025-12-24 13:06:01 +08:00
[BugFix] fix CUTLASS MLA full cudagraph (#23200)
Signed-off-by: Lucas Wilkinson <lwilkins@redhat.com>
This commit is contained in:
parent
0f4f0191d8
commit
14e2b0730b
@@ -21,7 +21,7 @@ logger = init_logger(__name__)
 
 class CutlassMLAMetadataBuilder(MLACommonMetadataBuilder[MLACommonMetadata]):
     # enable full CUDA Graph support for decode-only capture
-    attn_cudagraph_support: ClassVar[
+    cudagraph_support: ClassVar[
         AttentionCGSupport] = AttentionCGSupport.UNIFORM_SINGLE_TOKEN_DECODE
 
 
Loading…
x
Reference in New Issue
Block a user