mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2026-06-08 03:29:06 +08:00
[Bugfix] deepseek-V3.2 self.weights_proj has no bias (#30841)
Signed-off-by: baoqian <1354987947@qq.com>
Signed-off-by: baoqian426 <1354987947@qq.com>
This commit is contained in:
parent 4bf6c23668
commit 84896fda22
@@ -835,7 +835,11 @@ class Indexer(nn.Module):
         )
         self.k_norm = LayerNorm(self.head_dim, eps=1e-6)
         self.weights_proj = ReplicatedLinear(
-            hidden_size, self.n_head, quant_config=None, prefix=f"{prefix}.weights_proj"
+            hidden_size,
+            self.n_head,
+            bias=False,
+            quant_config=None,
+            prefix=f"{prefix}.weights_proj",
         )
         self.softmax_scale = self.head_dim**-0.5
 
Loading…
x
Reference in New Issue
Block a user