mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2026-05-31 06:37:04 +08:00
[Bugfix] Fix Qwen3VLMoe weight loading when pipeline parallelism (pp) > 1 (#25838)
Signed-off-by: liuye.hj <liuye.hj@alibaba-inc.com>
Co-authored-by: liuye.hj <liuye.hj@alibaba-inc.com>
This commit is contained in:
parent
b1ded114b9
commit
471997adf6
@ -212,6 +212,8 @@ class Qwen3MoeLLMModel(Qwen3MoeModel):
|
|||||||
# attempted to load as other weights later
|
# attempted to load as other weights later
|
||||||
is_expert_weight = True
|
is_expert_weight = True
|
||||||
name_mapped = name.replace(weight_name, param_name)
|
name_mapped = name.replace(weight_name, param_name)
|
||||||
|
if is_pp_missing_parameter(name_mapped, self):
|
||||||
|
continue
|
||||||
if is_fused_expert:
|
if is_fused_expert:
|
||||||
loaded_weight = loaded_weight.transpose(-1,
|
loaded_weight = loaded_weight.transpose(-1,
|
||||||
-2) # no bias
|
-2) # no bias
|
||||||
@ -230,8 +232,6 @@ class Qwen3MoeLLMModel(Qwen3MoeModel):
|
|||||||
name_mapped, params_dict, loaded_weight,
|
name_mapped, params_dict, loaded_weight,
|
||||||
shard_id, num_experts)
|
shard_id, num_experts)
|
||||||
else:
|
else:
|
||||||
if is_pp_missing_parameter(name_mapped, self):
|
|
||||||
continue
|
|
||||||
# Skip loading extra parameters for GPTQ/modelopt models
|
# Skip loading extra parameters for GPTQ/modelopt models
|
||||||
if name_mapped.endswith(
|
if name_mapped.endswith(
|
||||||
ignore_suffixes
|
ignore_suffixes
|
||||||
|
|||||||
Loading…
x
Reference in New Issue
Block a user