mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2026-05-24 02:44:27 +08:00
[CI] Skip ci failure test (#30804)
Signed-off-by: yewentao256 <zhyanwentao@126.com> (cherry picked from commit b6ec077e058e15e5b853793924e6643ec6c579aa)
This commit is contained in:
parent
16484d394c
commit
4cd332f3cf
@ -523,6 +523,8 @@ CUSTOM_OPS_QUANT_RMS_NORM = ["+quant_fp8,+rms_norm"]
|
|||||||
list[tuple[Any, ...]](flat_product(MODELS_GROUP_FP8, CUSTOM_OPS_QUANT_RMS_NORM)),
|
list[tuple[Any, ...]](flat_product(MODELS_GROUP_FP8, CUSTOM_OPS_QUANT_RMS_NORM)),
|
||||||
)
|
)
|
||||||
@pytest.mark.parametrize("inductor_graph_partition", [True, False])
|
@pytest.mark.parametrize("inductor_graph_partition", [True, False])
|
||||||
|
# TODO: remove skip after we fix the fusion thoroughly
|
||||||
|
@pytest.mark.skipif(is_blackwell(), reason="Temporarily disabled on Blackwell")
|
||||||
def test_rms_group_quant(
|
def test_rms_group_quant(
|
||||||
model_name: str,
|
model_name: str,
|
||||||
model_kwargs: dict[str, Any],
|
model_kwargs: dict[str, Any],
|
||||||
@ -562,7 +564,7 @@ def test_rms_group_quant(
|
|||||||
splitting_ops=splitting_ops,
|
splitting_ops=splitting_ops,
|
||||||
# Common
|
# Common
|
||||||
mode=CompilationMode.VLLM_COMPILE,
|
mode=CompilationMode.VLLM_COMPILE,
|
||||||
pass_config=PassConfig(eliminate_noops=True, enable_fusion=True),
|
pass_config=PassConfig(eliminate_noops=True, fuse_norm_quant=True),
|
||||||
# Inductor caches custom passes by default as well via uuid
|
# Inductor caches custom passes by default as well via uuid
|
||||||
inductor_compile_config={"force_disable_caches": True},
|
inductor_compile_config={"force_disable_caches": True},
|
||||||
)
|
)
|
||||||
|
|||||||
Loading…
x
Reference in New Issue
Block a user