[XPU] Enable custom routing functions in IPEX for Llama4 (#28004)

Signed-off-by: frost-intel <frost.mitchell@intel.com>
This commit is contained in:
Frost Mitchell 2025-11-05 08:39:57 -05:00 committed by GitHub
parent 6ab183813c
commit 6e97eccf5d
No known key found for this signature in database
GPG Key ID: B5690EEEBB952194

View File

@@ -915,7 +915,6 @@ class UnquantizedFusedMoEMethod(FusedMoEMethodBase, CustomOp):
or logical_replica_count is not None
):
raise NotImplementedError("Expert load balancing is not supported for XPU.")
-assert custom_routing_function is None
return layer.ipex_fusion(
x,
use_grouped_topk,
@@ -924,6 +923,7 @@ class UnquantizedFusedMoEMethod(FusedMoEMethodBase, CustomOp):
renormalize,
topk_group,
num_expert_group,
+custom_routing_function=custom_routing_function,
)
def forward_tpu(