From aa5053e3feb26c7de244b204bccc8d403b5b3df5 Mon Sep 17 00:00:00 2001 From: Egor Date: Fri, 3 Oct 2025 13:00:23 +0200 Subject: [PATCH] [Doc] Fixed shape description for fused_batched_moe.py (#25668) Signed-off-by: Egor --- vllm/model_executor/layers/fused_moe/fused_batched_moe.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/vllm/model_executor/layers/fused_moe/fused_batched_moe.py b/vllm/model_executor/layers/fused_moe/fused_batched_moe.py index 660bae3146026..e49750bc92b3b 100644 --- a/vllm/model_executor/layers/fused_moe/fused_batched_moe.py +++ b/vllm/model_executor/layers/fused_moe/fused_batched_moe.py @@ -355,7 +355,7 @@ def batched_triton_kernel( def invoke_moe_batched_triton_kernel( A: torch.Tensor, # [E, max_tokens, K] - B: torch.Tensor, # [E, K, N] + B: torch.Tensor, # [E, N, K] C: torch.Tensor, # [E, max_tokens, N] expert_num_tokens: torch.Tensor, # [E] compute_type: tl.dtype,