mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2025-12-10 06:45:01 +08:00
[V1] reduce block size for tree attention correctness test to fix 'ou… (#22207)
Signed-off-by: Giancarlo Delfin <gdelfin@meta.com>
This commit is contained in:
parent
7175817637
commit
5ea71ff46f
@ -155,7 +155,7 @@ def test_tree_attn_correctness() -> None:
|
|||||||
|
|
||||||
dim_per_head = 128
|
dim_per_head = 128
|
||||||
num_kv_heads = 2
|
num_kv_heads = 2
|
||||||
block_size = 128
|
block_size = 32
|
||||||
max_sequence_length = 8192
|
max_sequence_length = 8192
|
||||||
randomize_blocks = True
|
randomize_blocks = True
|
||||||
for batch_size in [1, 16, 32]:
|
for batch_size in [1, 16, 32]:
|
||||||
|
|||||||
Loading…
x
Reference in New Issue
Block a user