# Patch summary: a single hunk against
# vllm/model_executor/layers/moe/grouped_gemm_no_abstraction.py.
# It removes the leading "# " from three call lines so they become live
# statements:
#   run_batched_deepgemm_masked_bf16(512, 8, 1024, 512)
#   run_triton_group_gemm_contiguous_bf16(512, 8, 1024, 512, 4)
#   run_triton_group_gemm_masked_bf16(512, 8, 1024, 512)
# The context lines show run_batched_deepgemm_contiguous_bf16(...) is already
# live and run_batched_deepgemm_masked_fp8(...) stays commented out.
#
# NOTE(review): this patch text arrived with its line breaks collapsed; the
# breaks below are restored from the standard unified-diff layout. The hunk
# header counts six old lines but only five non-blank ones are visible, so one
# blank context line is assumed directly after the hunk header - TODO confirm
# against the target file.
# NOTE(review): indentation of the call lines cannot be recovered from the
# collapsed text; they are shown at column 0 (presumably module-level
# statements) - confirm before applying.
diff --git a/vllm/model_executor/layers/moe/grouped_gemm_no_abstraction.py b/vllm/model_executor/layers/moe/grouped_gemm_no_abstraction.py
index 128201f6f34d..d73daaa846a6 100644
--- a/vllm/model_executor/layers/moe/grouped_gemm_no_abstraction.py
+++ b/vllm/model_executor/layers/moe/grouped_gemm_no_abstraction.py
@@ -351,6 +351,6 @@ def run_triton_group_gemm_masked_bf16(
 
 # run_batched_deepgemm_masked_fp8(512, 8, 1024, 512)
 run_batched_deepgemm_contiguous_bf16(512, 8, 1024, 512)
-# run_batched_deepgemm_masked_bf16(512, 8, 1024, 512)
-# run_triton_group_gemm_contiguous_bf16(512, 8, 1024, 512, 4)
-# run_triton_group_gemm_masked_bf16(512, 8, 1024, 512)
+run_batched_deepgemm_masked_bf16(512, 8, 1024, 512)
+run_triton_group_gemm_contiguous_bf16(512, 8, 1024, 512, 4)
+run_triton_group_gemm_masked_bf16(512, 8, 1024, 512)