Merge a4af2e7b3a7fff90d54e579ba3fb124281c3403f into 254f6b986720c92ddf97fbb1a6a6465da8e87e29

This commit is contained in:
Andrey Khalyavin 2025-12-25 08:07:30 +08:00 committed by GitHub
commit afcaa3718f
No known key found for this signature in database
GPG Key ID: B5690EEEBB952194

View File

@@ -312,7 +312,7 @@ class BatchedDeepGemmExperts(mk.FusedMoEPermuteExpertsUnpermute):
num_dispatchers = self.num_dispatchers
num_experts = local_num_experts
max_num_tokens = M if self.max_num_tokens is None else self.max_num_tokens
-workspace13 = (num_experts, max_num_tokens * num_dispatchers, max(K, N))
+workspace13 = (num_experts, max_num_tokens * num_dispatchers, N)
workspace2 = (num_experts, max_num_tokens * num_dispatchers, (N // 2))
output = (num_experts, max_num_tokens * num_dispatchers, K)
return (workspace13, workspace2, output)