mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2026-05-30 04:37:04 +08:00
[BUGFIX] KeyError 'layers.14.mlp.gate.g_idx' for Qwen3-MoE with GPTQ on ROCm (#22017)
This commit is contained in:
parent
384a052971
commit
1e55dfa7e5
@@ -149,7 +149,7 @@ class Qwen3MoeSparseMoeBlock(nn.Module):
         self.gate = ReplicatedLinear(config.hidden_size,
                                      config.num_experts,
                                      bias=False,
-                                     quant_config=None,
+                                     quant_config=quant_config,
                                      prefix=f"{prefix}.gate")
 
     def forward(self, hidden_states: torch.Tensor) -> torch.Tensor:
Loading…
x
Reference in New Issue
Block a user