mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2026-05-30 18:07:15 +08:00
[Bugfix] Fix Qwen2.5-VL quantized model weights loading (#23512)
Signed-off-by: Zifei Tong <zifeitong@gmail.com>
This commit is contained in:
parent
39971db3aa
commit
a71e4765cc
@ -852,6 +852,10 @@ class Qwen2_5_VLForConditionalGeneration(nn.Module, SupportsMultiModal,
|
|||||||
SupportsLoRA, SupportsPP,
|
SupportsLoRA, SupportsPP,
|
||||||
SupportsQuant):
|
SupportsQuant):
|
||||||
|
|
||||||
|
packed_modules_mapping = {
|
||||||
|
"gate_up_proj": ["gate_proj", "up_proj"],
|
||||||
|
}
|
||||||
|
|
||||||
# To ensure correct weight loading and mapping.
|
# To ensure correct weight loading and mapping.
|
||||||
hf_to_vllm_mapper = WeightsMapper(
|
hf_to_vllm_mapper = WeightsMapper(
|
||||||
orig_to_new_prefix={
|
orig_to_new_prefix={
|
||||||
|
|||||||
Loading…
x
Reference in New Issue
Block a user