[Bugfix] fix dots.llm1.inst (#29687)

Signed-off-by: zjy0516 <riverclouds.zhu@qq.com> Co-authored-by: Roger Wang <hey@rogerw.io>
2026-06-08 01:42:14 +08:00 · 2025-11-29 07:25:26 +08:00 · 2025-11-29 07:25:26 +08:00 · a51f4186f2
commit a51f4186f2
parent 7675ba30de
1 changed files with 6 additions and 5 deletions
--- a/vllm/model_executor/models/dots1.py
+++ b/vllm/model_executor/models/dots1.py
@ -181,13 +181,14 @@ class Dots1MoE(nn.Module):
        hidden_states = hidden_states.view(-1, hidden_dim)
        router_logits, _ = self.gate(hidden_states)
        final_hidden_states = (
            self.experts(hidden_states=hidden_states, router_logits=router_logits)
            * self.routed_scaling_factor
        )
        shared_out, routed_out = self.experts(
            hidden_states=hidden_states, router_logits=router_logits
        )
        if self.shared_experts is not None:
-            final_hidden_states = final_hidden_states[0] + final_hidden_states[1]
+            final_hidden_states = (routed_out + shared_out) * self.routed_scaling_factor
        else:
            final_hidden_states = routed_out * self.routed_scaling_factor
        if self.tp_size > 1:
            final_hidden_states = tensor_model_parallel_all_reduce(final_hidden_states)