diff --git a/tests/models/test_gptq_marlin.py b/tests/models/test_gptq_marlin.py index e30100d9bf573..4abbc41c9c287 100644 --- a/tests/models/test_gptq_marlin.py +++ b/tests/models/test_gptq_marlin.py @@ -40,6 +40,9 @@ MODELS = [ ("TheBloke/TinyLlama-1.1B-Chat-v1.0-GPTQ", "gptq-8bit-128g-actorder_True"), # 8-bit, act_order==True, group_size=32 ("TheBloke/TinyLlama-1.1B-Chat-v1.0-GPTQ", "gptq-8bit-32g-actorder_True"), + + # 4-bit, act_order==True, group_size=128 + ("TechxGenus/gemma-1.1-2b-it-GPTQ", "main"), ]