mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2026-06-06 02:09:08 +08:00
fix: gptq marlin weight loading failure (#23066)
This commit is contained in:
parent
21e39436c8
commit
0fc8fa751a
@ -56,7 +56,7 @@ def get_moe_quant_method(
|
|||||||
# Dynamic per module/layer rules may override base config
|
# Dynamic per module/layer rules may override base config
|
||||||
override_config(cloned_config, prefix=prefix)
|
override_config(cloned_config, prefix=prefix)
|
||||||
|
|
||||||
return moe_method_cls(cloned_config)
|
return moe_method_cls(cloned_config, layer.moe_config)
|
||||||
return None
|
return None
|
||||||
|
|
||||||
|
|
||||||
|
|||||||
Loading…
x
Reference in New Issue
Block a user