mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2025-12-15 01:55:36 +08:00
[Bug] Fix AttributeError: 'QKVParallelLinear' object has no attribute 'orig_dtype' (#25958)
Signed-off-by: yewentao256 <zhyanwentao@126.com>
This commit is contained in:
parent
a2e6fa7e03
commit
e6a226efba
@@ -66,6 +66,7 @@ class CompressedTensorsW8A8Fp8(CompressedTensorsScheme):
         output_size_per_partition = sum(output_partition_sizes)
         layer.logical_widths = output_partition_sizes
         layer.weight_block_size = None
+        layer.orig_dtype = params_dtype
 
         if self.strategy == QuantizationStrategy.BLOCK:
             assert self.weight_block_size is not None
Loading…
x
Reference in New Issue
Block a user