Allow torchao quantization in SiglipMLP (#15575)

2025-12-24 13:16:01 +08:00 · 2025-03-26 22:45:51 -07:00 · 2025-03-26 22:45:51 -07:00 · dcf2a590f5
commit dcf2a590f5
parent 54aa619459
1 changed file with 4 additions and 2 deletions
--- a/vllm/model_executor/models/siglip.py
+++ b/vllm/model_executor/models/siglip.py
@@ -208,8 +208,10 @@ class SiglipMLP(nn.Module):

        self.config = config
        self.activation_fn = get_act_fn(config.hidden_act)
-        # Special handling for BNB quantization
-        if quant_config and quant_config.get_name() == "bitsandbytes":
+        # Special handling for BNB and torchao quantization
+        if quant_config and quant_config.get_name() in [
+                "bitsandbytes", "torchao"
+        ]:
            quantizable = True
        else:
            # For other quantization, we require the hidden size to be a