diff --git a/vllm/v1/attention/backends/utils.py b/vllm/v1/attention/backends/utils.py index 0bd7eaf7f8154..e738d11665683 100644 --- a/vllm/v1/attention/backends/utils.py +++ b/vllm/v1/attention/backends/utils.py @@ -43,6 +43,7 @@ class CommonAttentionMetadata: max_query_len: int """Longest query in batch""" + M = TypeVar("M")