Mirror of https://git.datalinker.icu/vllm-project/vllm.git (synced 2025-12-18 00:35:01 +08:00)
[Bugfix] Fix Granite 3.0 MoE model loading (#12446)
Signed-off-by: DarkLight1337 <tlleungac@connect.ust.hk>
This commit is contained in:
parent 0cc6b383d7
commit 5204ff5c3f
@@ -348,6 +348,7 @@ class GraniteMoeForCausalLM(nn.Module, SupportsLoRA, SupportsPP):
 
         self.config = config
         self.lora_config = lora_config
+        self.quant_config = quant_config  # Required by MixtralForCausalLM
 
         self.model = GraniteMoeModel(vllm_config=vllm_config,
                                      prefix=maybe_prefix(prefix, "model"))
Loading…
x
Reference in New Issue
Block a user