[Bugfix] Fix Qwen2.5-VL quantized model weights loading (#23512)

Signed-off-by: Zifei Tong <zifeitong@gmail.com>
This commit is contained in:
zifeitong 2025-08-24 19:40:22 -07:00 committed by GitHub
parent 39971db3aa
commit a71e4765cc
No known key found for this signature in database
GPG Key ID: B5690EEEBB952194

View File

@@ -852,6 +852,10 @@ class Qwen2_5_VLForConditionalGeneration(nn.Module, SupportsMultiModal,
SupportsLoRA, SupportsPP,
SupportsQuant):
packed_modules_mapping = {
"gate_up_proj": ["gate_proj", "up_proj"],
}
# To ensure correct weight loading and mapping.
hf_to_vllm_mapper = WeightsMapper(
orig_to_new_prefix={