change top level interface to mk

2026-06-06 02:35:41 +08:00 · 2025-12-19 22:16:28 +00:00 · 2025-12-19 22:16:28 +00:00 · 60279d272e
commit 60279d272e
parent f790068600
1 changed file with 4 additions and 0 deletions
--- a/vllm/model_executor/layers/fused_moe/unquantized_fused_moe_method.py
+++ b/vllm/model_executor/layers/fused_moe/unquantized_fused_moe_method.py
@@ -31,6 +31,10 @@ from vllm.model_executor.utils import set_weight_attrs
 from vllm.platforms import current_platform
 from vllm.platforms.interface import CpuArchEnum
 from vllm.utils.flashinfer import has_flashinfer_cutlass_fused_moe
+import vllm.model_executor.layers.fused_moe.modular_kernel as mk
+from vllm.model_executor.layers.fused_moe.prepare_finalize import (
+    MoEPrepareAndFinalizeNoEP,
+)

 if current_platform.is_cuda_alike():
    from .fused_batched_moe import BatchedTritonExperts