mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2026-05-05 12:31:23 +08:00
[XPU] Fix AWQ skipped layer detection in IPEX quantization (#29774)
Signed-off-by: Fanli Lin <fanli.lin@intel.com>
This commit is contained in:
parent
f0a28bf661
commit
f37e8938d2
@@ -150,7 +150,10 @@ class IPEXConfig(QuantizationConfig):
|
|||||||
if isinstance(layer, LinearBase):
|
if isinstance(layer, LinearBase):
|
||||||
if self.method == "awq":
|
if self.method == "awq":
|
||||||
if is_layer_skipped(
|
if is_layer_skipped(
|
||||||
prefix, self.modules_to_not_convert, self.packed_modules_mapping
|
prefix,
|
||||||
|
self.modules_to_not_convert,
|
||||||
|
self.packed_modules_mapping,
|
||||||
|
skip_with_substr=True,
|
||||||
):
|
):
|
||||||
return UnquantizedLinearMethod()
|
return UnquantizedLinearMethod()
|
||||||
return IPEXAWQLinearMethod(self)
|
return IPEXAWQLinearMethod(self)
|
||||||
|
|||||||
Loading…
x
Reference in New Issue
Block a user