mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2025-12-12 08:47:07 +08:00
[Bugfix] fix qwen3 moe fp8 accuracy issue (#23031)
Signed-off-by: Jinzhen Lin <jinzhen.ljz@antgroup.com>
This commit is contained in:
parent
bf7f470b22
commit
a258ad8bcc
@@ -125,6 +125,10 @@ class Fp8Config(QuantizationConfig):
         ignored_layers = cls.get_from_keys_or(config, ["ignored_layers"], None)
         weight_block_size = cls.get_from_keys_or(config, ["weight_block_size"],
                                                  None)
+        if not ignored_layers:
+            ignored_layers = cls.get_from_keys_or(config,
+                                                  ["modules_to_not_convert"],
+                                                  None)
         return cls(is_checkpoint_fp8_serialized=is_checkpoint_fp8_serialized,
                    activation_scheme=activation_scheme,
                    ignored_layers=ignored_layers,
Loading…
x
Reference in New Issue
Block a user