mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2026-05-14 17:47:57 +08:00
[BugFix] Fix DeepGEMM warmup, no m.weight_scale_inv (#25206)
Signed-off-by: Lucas Wilkinson <lwilkins@redhat.com>
This commit is contained in:
parent
a53ad626d6
commit
9fac6aa30b
@@ -36,7 +36,7 @@ def _extract_data_from_linear_base_module(
|
|||||||
assert m.quant_method.quant_config is not None
|
assert m.quant_method.quant_config is not None
|
||||||
|
|
||||||
w = m.weight
|
w = m.weight
|
||||||
ws = m.weight_scale_inv
|
ws = m.weight_scale
|
||||||
quant_block_size = m.quant_method.quant_config.weight_block_size
|
quant_block_size = m.quant_method.quant_config.weight_block_size
|
||||||
|
|
||||||
assert isinstance(w, torch.Tensor)
|
assert isinstance(w, torch.Tensor)
|
||||||
|
|||||||
Loading…
x
Reference in New Issue
Block a user