Bugfix for whisper quantization due to fake k_proj bias (#12524)

Signed-off-by: mgoin <michael@neuralmagic.com>
2026-06-27 20:57:22 +08:00 · 2025-01-28 23:49:03 -05:00 · 2025-01-28 23:49:03 -05:00 · bd02164cf9
commit bd02164cf9
parent 46fb056749
1 changed file with 1 addition and 1 deletion
--- a/vllm/model_executor/models/whisper.py
+++ b/vllm/model_executor/models/whisper.py
@@ -743,7 +743,7 @@ def _create_fake_bias_for_k_proj(
    So that the bias for k_proj in qkv_proj can be initialized with zeros.
    """
    for name, weight in weights:
-        if ".self_attn.k_proj.weight" in name:
+        if name.endswith(".self_attn.k_proj.weight"):
            bias = torch.zeros(weight.size(0))
            bias_name = name.replace("weight", "bias")
            yield from [(name, weight), (bias_name, bias)]