mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2025-12-09 23:54:56 +08:00
[Bug] Fix Unexpected Keyword Argument 'w1_bias' (#22757)
Signed-off-by: yewentao256 <zhyanwentao@126.com>
This commit is contained in:
parent
4082338a25
commit
77a6bf07ae
@@ -475,12 +475,11 @@ class UnquantizedFusedMoEMethod(FusedMoEMethodBase, CustomOp):
|
||||
activation=activation,
|
||||
apply_router_weight_on_input=apply_router_weight_on_input)
|
||||
else:
|
||||
return self.fused_experts(
|
||||
# add w1_bias/w2_bias to kwargs if they exist
|
||||
kwargs = dict(
|
||||
hidden_states=x,
|
||||
w1=layer.w13_weight,
|
||||
w2=layer.w2_weight,
|
||||
w1_bias=layer.w13_bias if self.has_bias else None,
|
||||
w2_bias=layer.w2_bias if self.has_bias else None,
|
||||
topk_weights=topk_weights,
|
||||
topk_ids=topk_ids,
|
||||
inplace=True,
|
||||
@@ -489,6 +488,17 @@ class UnquantizedFusedMoEMethod(FusedMoEMethodBase, CustomOp):
|
||||
global_num_experts=global_num_experts,
|
||||
expert_map=expert_map,
|
||||
)
|
||||
if isinstance(self.fused_experts,
|
||||
FusedMoEModularKernel) and self.has_bias:
|
||||
raise ValueError(
|
||||
"FusedMoEModularKernel does not support bias.")
|
||||
if self.has_bias:
|
||||
kwargs.update({
|
||||
"w1_bias": getattr(layer, "w13_bias", None),
|
||||
"w2_bias": getattr(layer, "w2_bias", None),
|
||||
})
|
||||
|
||||
return self.fused_experts(**kwargs)
|
||||
|
||||
def forward_cpu(
|
||||
self,
|
||||
|
||||
Loading…
x
Reference in New Issue
Block a user