From 5ea71ff46fe503df12f18ad41d40f5c2b18dcfcd Mon Sep 17 00:00:00 2001 From: Giancarlo Delfin <32987265+TheEpicDolphin@users.noreply.github.com> Date: Mon, 4 Aug 2025 19:11:06 -0700 Subject: [PATCH] =?UTF-8?q?[V1]=20reduce=20block=20size=20for=20tree=20att?= =?UTF-8?q?ention=20correctness=20test=20to=20fix=20'ou=E2=80=A6=20(#22207?= =?UTF-8?q?)?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Signed-off-by: Giancarlo Delfin --- tests/v1/spec_decode/test_tree_attention.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/tests/v1/spec_decode/test_tree_attention.py b/tests/v1/spec_decode/test_tree_attention.py index 42468daa62a9a..456ce712d36e4 100644 --- a/tests/v1/spec_decode/test_tree_attention.py +++ b/tests/v1/spec_decode/test_tree_attention.py @@ -155,7 +155,7 @@ def test_tree_attn_correctness() -> None: dim_per_head = 128 num_kv_heads = 2 - block_size = 128 + block_size = 32 max_sequence_length = 8192 randomize_blocks = True for batch_size in [1, 16, 32]: