[Doc] Fixed shape description for fused_batched_moe.py (#25668)

Signed-off-by: Egor <e.a.krivov@gmail.com>
Signed-off-by: yewentao256 <zhyanwentao@126.com>
2026-07-16 13:47:23 +08:00 · 2025-10-03 13:00:23 +02:00 · 2025-10-03 13:00:23 +02:00 · 564233d550
commit 564233d550
parent 2bcc745042
1 changed files with 1 additions and 1 deletions
--- a/vllm/model_executor/layers/fused_moe/fused_batched_moe.py
+++ b/vllm/model_executor/layers/fused_moe/fused_batched_moe.py
@@ -355,7 +355,7 @@ def batched_triton_kernel(

 def invoke_moe_batched_triton_kernel(
        A: torch.Tensor,  # [E, max_tokens, K]
-        B: torch.Tensor,  # [E, K, N]
+        B: torch.Tensor,  # [E, N, K]
        C: torch.Tensor,  # [E, max_tokens, N]
        expert_num_tokens: torch.Tensor,  # [E]
        compute_type: tl.dtype,