mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2026-01-26 08:44:29 +08:00
[BugFix] Fix DeepGEMM warmup, no m.weight_scale_inv (#25206)
Signed-off-by: Lucas Wilkinson <lwilkins@redhat.com>
This commit is contained in:
parent
a53ad626d6
commit
9fac6aa30b
@@ -36,7 +36,7 @@ def _extract_data_from_linear_base_module(
|
||||
assert m.quant_method.quant_config is not None
|
||||
|
||||
w = m.weight
|
||||
- ws = m.weight_scale_inv
|
||||
+ ws = m.weight_scale
|
||||
quant_block_size = m.quant_method.quant_config.weight_block_size
|
||||
|
||||
assert isinstance(w, torch.Tensor)
|
||||
|
||||
Loading…
x
Reference in New Issue
Block a user