mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2025-12-13 19:15:34 +08:00
[Bugfix] Reduce moe_sum test size to avoid OOM (#18484)
Signed-off-by: Bill Nell <bnell@redhat.com>
This commit is contained in:
parent
c154d89306
commit
c6c10ca920
@@ -577,7 +577,7 @@ def test_moe_align_block_size_opcheck():
 num_tokens_post_pad))
 
 
-@pytest.mark.parametrize("m", [1, 33, 222, 1024 * 128])
+@pytest.mark.parametrize("m", [1, 33, 64, 222])
 @pytest.mark.parametrize("topk", TOP_KS)
 @pytest.mark.parametrize("k", [128, 511, 1024])
 @pytest.mark.parametrize("dtype",
Loading…
x
Reference in New Issue
Block a user