[BugFix] Workspace allocation during profile run : DeepEPHighThroughput + DeepGEMM (#30899)

(cherry picked from commit e3fc374a9a69dddb16885d810f1e28d3fdd39ebd)
This commit is contained in:
Varun Sundar Rabindranath 2025-12-17 18:00:59 -05:00 committed by Kevin H. Luu
parent 682c38583c
commit 17f3988094

View File

@@ -795,7 +795,10 @@ class FusedMoEModularKernel(torch.nn.Module):
top_k,
global_num_experts,
local_num_experts,
expert_tokens_meta,
# expert_tokens_meta helps in allocating the optimal/minimal
# amount of workspace. Pass None so that we allocate for
# the worst-case scenario.
expert_tokens_meta=None,
)
)