mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2025-12-23 04:45:01 +08:00
Fix precommit fail in fused_moe intermediate_cache2 chunking (#13772)
Signed-off-by: mgoin <mgoin64@gmail.com>
This commit is contained in:
parent
227578480d
commit
db986c19ea
@@ -1271,7 +1271,8 @@ def fused_experts_impl(hidden_states: torch.Tensor,
|
|||||||
# so the cache size and config are already set correctly and
|
# so the cache size and config are already set correctly and
|
||||||
# do not need to be adjusted.
|
# do not need to be adjusted.
|
||||||
intermediate_cache1 = intermediate_cache1[:tokens_in_chunk]
|
intermediate_cache1 = intermediate_cache1[:tokens_in_chunk]
|
||||||
intermediate_cache2 = intermediate_cache2[:tokens_in_chunk * topk_ids.shape[1]]
|
intermediate_cache2 = intermediate_cache2[:tokens_in_chunk *
|
||||||
|
topk_ids.shape[1]]
|
||||||
intermediate_cache3 = intermediate_cache3[:tokens_in_chunk]
|
intermediate_cache3 = intermediate_cache3[:tokens_in_chunk]
|
||||||
config = get_config_func(tokens_in_chunk)
|
config = get_config_func(tokens_in_chunk)
|
||||||
|
|
||||||
|
|||||||
Loading…
x
Reference in New Issue
Block a user