mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2026-05-24 00:04:32 +08:00
Allow torchao quantization in SiglipMLP (#15575)
This commit is contained in:
parent
54aa619459
commit
dcf2a590f5
@@ -208,8 +208,10 @@ class SiglipMLP(nn.Module):
|
|||||||
|
|
||||||
self.config = config
|
self.config = config
|
||||||
self.activation_fn = get_act_fn(config.hidden_act)
|
self.activation_fn = get_act_fn(config.hidden_act)
|
||||||
# Special handling for BNB quantization
|
# Special handling for BNB and torchao quantization
|
||||||
if quant_config and quant_config.get_name() == "bitsandbytes":
|
if quant_config and quant_config.get_name() in [
|
||||||
|
"bitsandbytes", "torchao"
|
||||||
|
]:
|
||||||
quantizable = True
|
quantizable = True
|
||||||
else:
|
else:
|
||||||
# For other quantization, we require the hidden size to be a
|
# For other quantization, we require the hidden size to be a
|
||||||
|
|||||||
Loading…
x
Reference in New Issue
Block a user