mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2025-12-19 03:55:01 +08:00
[Model] Add packed_modules_mapping for Qwen3-MOE (#18118)
Signed-off-by: Jee Jee Li <pandaleefree@gmail.com>
This commit is contained in:
parent
8f5dc41481
commit
63dc3426e0
@@ -475,6 +475,17 @@ class Qwen3MoeModel(nn.Module):
 
 
 class Qwen3MoeForCausalLM(nn.Module, SupportsPP):
+    packed_modules_mapping = {
+        "qkv_proj": [
+            "q_proj",
+            "k_proj",
+            "v_proj",
+        ],
+        "gate_up_proj": [
+            "gate_proj",
+            "up_proj",
+        ],
+    }
 
     fall_back_to_pt_during_load = False
 
Loading…
x
Reference in New Issue
Block a user