[BugFix] Illegal memory access for MoE On H20 (#13693)

This commit is contained in:
Zhonghua Deng 2025-02-24 23:37:32 +08:00 committed by GitHub
parent 781096e385
commit ccc00515fd
No known key found for this signature in database
GPG Key ID: B5690EEEBB952194

View File

@@ -1271,7 +1271,7 @@ def fused_experts_impl(hidden_states: torch.Tensor,
# so the cache size and config are already set correctly and
# do not need to be adjusted.
intermediate_cache1 = intermediate_cache1[:tokens_in_chunk]
-intermediate_cache2 = intermediate_cache2[:tokens_in_chunk]
+intermediate_cache2 = intermediate_cache2[:tokens_in_chunk * topk_ids.shape[1]]
intermediate_cache3 = intermediate_cache3[:tokens_in_chunk]
config = get_config_func(tokens_in_chunk)