mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2025-12-09 21:55:50 +08:00
Improve the robustness of parsing VLM configs in AutoRound (#18894)
Signed-off-by: wenhuach21 <wenhua.cheng@intel.com>
This commit is contained in:
parent
3132290a14
commit
3de3eadf5b
@@ -116,8 +116,9 @@ class AutoRoundConfig(QuantizationConfig):
         quantized = True
         if self.block_name_to_quantize:
-            quantized = any(name in layer_name
-                            for name in self.block_name_to_quantize)
+            quantized = any(
+                layer_name.startswith(name)
+                for name in self.block_name_to_quantize)
         elif isinstance(layer, ParallelLMHead):
             quantized = False
|
||||
|
||||
Loading…
x
Reference in New Issue
Block a user