[BugFix] Fix DeepGEMM warmup, no m.weight_scale_inv (#25206)

Signed-off-by: Lucas Wilkinson <lwilkins@redhat.com>
2026-03-16 16:27:15 +08:00 · 2025-09-18 17:26:28 -04:00 · 2025-09-18 17:26:28 -04:00 · 9fac6aa30b
commit 9fac6aa30b
parent a53ad626d6
1 changed file with 1 addition and 1 deletion
--- a/vllm/model_executor/warmup/deep_gemm_warmup.py
+++ b/vllm/model_executor/warmup/deep_gemm_warmup.py
@@ -36,7 +36,7 @@ def _extract_data_from_linear_base_module(
    assert m.quant_method.quant_config is not None

    w = m.weight
-    ws = m.weight_scale_inv
+    ws = m.weight_scale
    quant_block_size = m.quant_method.quant_config.weight_block_size

    assert isinstance(w, torch.Tensor)