[Bugfix] Misaligned params in TreeAttentionImpl (#22226)

Signed-off-by: DarkLight1337 <tlleungac@connect.ust.hk>
2025-12-15 13:05:47 +08:00 · 2025-08-05 13:40:09 +08:00 · 2025-08-05 13:40:09 +08:00 · cdfd6871a5
commit cdfd6871a5
parent 4b3e4474d7
1 changed files with 1 additions and 5 deletions
--- a/vllm/v1/attention/backends/tree_attn.py
+++ b/vllm/v1/attention/backends/tree_attn.py
@@ -4,7 +4,7 @@
 import ast
 from dataclasses import dataclass
-from typing import TYPE_CHECKING, Any, Optional
+from typing import TYPE_CHECKING, Optional
 import torch
@@ -313,15 +313,11 @@ class TreeAttentionImpl(AttentionImpl):
         alibi_slopes: Optional[list[float]],
         sliding_window: Optional[int],
         kv_cache_dtype: str,
-        blocksparse_params: Optional[dict[str, Any]] = None,
         logits_soft_cap: Optional[float] = None,
         attn_type: AttentionType = AttentionType.DECODER,
         kv_sharing_target_layer_name: Optional[str] = None,
         use_irope: bool = False,
     ) -> None:
-        if blocksparse_params is not None:
-            raise ValueError(
-                "TreeAttention does not support block-sparse attention.")
         self.num_heads = num_heads
         self.head_size = head_size
         self.scale = float(scale)