mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2025-12-16 08:56:02 +08:00
[ROCm][BugFix] Fix shared expert loading error when VLLM_ROCM_USE_AITER_FUSION_SHARED_EXPERTS is disabled (#28633)
Signed-off-by: ganyi <ygan@amd.com>
This commit is contained in:
parent
20e4497be2
commit
7218f83992
@ -287,7 +287,10 @@ class DeepseekV2MoE(nn.Module):
|
|||||||
)
|
)
|
||||||
|
|
||||||
self.is_rocm_aiter_moe_enabled = rocm_aiter_ops.is_fused_moe_enabled()
|
self.is_rocm_aiter_moe_enabled = rocm_aiter_ops.is_fused_moe_enabled()
|
||||||
if config.n_shared_experts is None or self.is_rocm_aiter_moe_enabled:
|
self.is_fusion_moe_shared_experts_enabled = (
|
||||||
|
rocm_aiter_ops.is_fusion_moe_shared_experts_enabled()
|
||||||
|
)
|
||||||
|
if config.n_shared_experts is None or self.is_fusion_moe_shared_experts_enabled:
|
||||||
self.shared_experts = None
|
self.shared_experts = None
|
||||||
else:
|
else:
|
||||||
intermediate_size = config.moe_intermediate_size * config.n_shared_experts
|
intermediate_size = config.moe_intermediate_size * config.n_shared_experts
|
||||||
@ -327,7 +330,7 @@ class DeepseekV2MoE(nn.Module):
|
|||||||
num_redundant_experts=self.n_redundant_experts,
|
num_redundant_experts=self.n_redundant_experts,
|
||||||
is_sequence_parallel=self.is_sequence_parallel,
|
is_sequence_parallel=self.is_sequence_parallel,
|
||||||
n_shared_experts=config.n_shared_experts
|
n_shared_experts=config.n_shared_experts
|
||||||
if rocm_aiter_ops.is_fusion_moe_shared_experts_enabled()
|
if self.is_fusion_moe_shared_experts_enabled
|
||||||
else None,
|
else None,
|
||||||
)
|
)
|
||||||
|
|
||||||
|
|||||||
Loading…
x
Reference in New Issue
Block a user