[Misc] duplicate code in deepseek_v2 (#14106)

This commit is contained in:
wang.yuqi 2025-03-03 14:10:11 +08:00 committed by GitHub
parent 09e56f9262
commit e584b85afd
No known key found for this signature in database
GPG Key ID: B5690EEEBB952194

View File

@@ -105,7 +105,6 @@ class DeepseekV2MoE(nn.Module):
self.tp_size = get_tensor_model_parallel_world_size()
self.routed_scaling_factor = config.routed_scaling_factor
self.n_shared_experts = config.n_shared_experts
self.routed_scaling_factor = config.routed_scaling_factor
if config.hidden_act != "silu":
raise ValueError(f"Unsupported activation: {config.hidden_act}. "