mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2026-04-30 07:36:38 +08:00
[moe][quant] add weight name case for offset (#15515)
Signed-off-by: Mengqing Cao <cmq0113@163.com>
This commit is contained in:
parent
7f301dd8ef
commit
fb22be5817
@@ -699,8 +699,9 @@ class FusedMoE(torch.nn.Module):
|
|||||||
tp_rank=self.tp_rank)
|
tp_rank=self.tp_rank)
|
||||||
return
|
return
|
||||||
|
|
||||||
# Case weight scales and zero_points
|
# Case weight scales, zero_points and offset
|
||||||
if ("scale" in weight_name or "zero" in weight_name):
|
if ("scale" in weight_name or "zero" in weight_name
|
||||||
|
or "offset" in weight_name):
|
||||||
# load the weight scales and zp based on the quantization scheme
|
# load the weight scales and zp based on the quantization scheme
|
||||||
# supported weight scales/zp can be found in
|
# supported weight scales/zp can be found in
|
||||||
# FusedMoeWeightScaleSupported
|
# FusedMoeWeightScaleSupported
|
||||||
|
|||||||
Loading…
x
Reference in New Issue
Block a user