diff --git a/tests/models/quantization/test_gguf.py b/tests/models/quantization/test_gguf.py index eafdfd1b09aff..32f9472c12d5e 100644 --- a/tests/models/quantization/test_gguf.py +++ b/tests/models/quantization/test_gguf.py @@ -38,7 +38,7 @@ class GGUFTestConfig(NamedTuple): LLAMA_CONFIG = GGUFTestConfig( original_model="meta-llama/Llama-3.2-1B-Instruct", gguf_repo="bartowski/Llama-3.2-1B-Instruct-GGUF", - gguf_filename="Llama-3.2-1B-Instruct-IQ4_XS.gguf", + gguf_filename="Llama-3.2-1B-Instruct-Q6_K.gguf", ) QWEN2_CONFIG = GGUFTestConfig(