[Bugfix] DeepSeek-V3.2: self.weights_proj has no bias, so create it with bias=False (#30841)

Signed-off-by: baoqian <1354987947@qq.com>
Signed-off-by: baoqian426 <1354987947@qq.com>
This commit is contained in:
baoqian426 2025-12-17 19:32:34 +08:00 committed by GitHub
parent 4bf6c23668
commit 84896fda22
No known key found for this signature in database
GPG Key ID: B5690EEEBB952194

View File

@@ -835,7 +835,11 @@ class Indexer(nn.Module):
)
self.k_norm = LayerNorm(self.head_dim, eps=1e-6)
self.weights_proj = ReplicatedLinear(
-hidden_size, self.n_head, quant_config=None, prefix=f"{prefix}.weights_proj"
+hidden_size,
+self.n_head,
+bias=False,
+quant_config=None,
+prefix=f"{prefix}.weights_proj",
)
self.softmax_scale = self.head_dim**-0.5