Fix precommit fail in fused_moe intermediate_cache2 chunking (#13772)

Signed-off-by: mgoin <mgoin64@gmail.com>
2026-06-10 21:15:44 +08:00 · 2025-02-24 12:25:47 -05:00 · 2025-02-24 12:25:47 -05:00 · db986c19ea
commit db986c19ea
parent 227578480d
1 changed file with 2 additions and 1 deletion
--- a/vllm/model_executor/layers/fused_moe/fused_moe.py
+++ b/vllm/model_executor/layers/fused_moe/fused_moe.py
@@ -1271,7 +1271,8 @@ def fused_experts_impl(hidden_states: torch.Tensor,
            # so the cache size and config are already set correctly and
            # do not need to be adjusted.
            intermediate_cache1 = intermediate_cache1[:tokens_in_chunk]
-            intermediate_cache2 = intermediate_cache2[:tokens_in_chunk * topk_ids.shape[1]]
+            intermediate_cache2 = intermediate_cache2[:tokens_in_chunk *
+                                                      topk_ids.shape[1]]
            intermediate_cache3 = intermediate_cache3[:tokens_in_chunk]
            config = get_config_func(tokens_in_chunk)