[CI Failure] Fix test_kv_cache_model_load_and_run (#27717)

Signed-off-by: Huamin Li <3ericli@gmail.com>
Huamin Li authored 2025-10-30 05:27:53 -07:00; committed by GitHub
parent 4464723f22
commit 1994de99ea


@@ -49,7 +49,18 @@ def test_model_load_and_run(
 KV_CACHE_MODELS = [
     # AutoFP8 format using separate .k_scale and .v_scale
-    "nm-testing/Qwen2-1.5B-Instruct-FP8-K-V",
+    # The original checkpoint below was removed from the Hub. To unblock CI and
+    # until a small replacement with split K/V scales is found, skip this case.
+    # See PR #27717 for context.
+    pytest.param(
+        "nm-testing/Qwen2-1.5B-Instruct-FP8-K-V",
+        marks=pytest.mark.skip(
+            reason=(
+                "Checkpoint removed from HF; temporarily disabling this "
+                "AutoFP8 split K/V case (PR #27717)."
+            )
+        ),
+    ),
 ]
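
For reference, a minimal self-contained sketch of the pytest mechanism this change relies on: a pytest.param entry carrying pytest.mark.skip is still collected by @pytest.mark.parametrize, but the corresponding test case is reported as skipped instead of running. The parametrize wiring, the placeholder model ID, and the test body below are illustrative assumptions, not the actual vLLM test.

import pytest

# Illustrative list mirroring the shape of KV_CACHE_MODELS above; the second
# entry is wrapped in pytest.param so a skip marker can be attached to it.
MODELS = [
    "some-org/available-checkpoint",  # hypothetical entry, runs normally
    pytest.param(
        "nm-testing/Qwen2-1.5B-Instruct-FP8-K-V",
        marks=pytest.mark.skip(reason="Checkpoint removed from HF."),
    ),
]


@pytest.mark.parametrize("model_id", MODELS)
def test_kv_cache_model_load_and_run(model_id: str) -> None:
    # The skipped entry never reaches this body; pytest reports it as skipped
    # instead of failing the CI run when the checkpoint cannot be downloaded.
    assert model_id

Running pytest with -rs lists each skip reason in the short test summary, so the disabled case remains visible in CI output until a replacement checkpoint is found.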