From 9101d832e6fe3811db8faa739f4a7e6e2f32a240 Mon Sep 17 00:00:00 2001 From: Woosuk Kwon Date: Mon, 18 Mar 2024 11:26:24 -0700 Subject: [PATCH] [Bugfix] Make moe_align_block_size AMD-compatible (#3470) --- csrc/moe_align_block_size_kernels.cu | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/csrc/moe_align_block_size_kernels.cu b/csrc/moe_align_block_size_kernels.cu index 138615a4bfba..e01b23685ef4 100644 --- a/csrc/moe_align_block_size_kernels.cu +++ b/csrc/moe_align_block_size_kernels.cu @@ -111,7 +111,8 @@ void moe_align_block_size( // set dynamic shared mem auto kernel = vllm::moe_align_block_size_kernel; - AT_CUDA_CHECK(cudaFuncSetAttribute(kernel, cudaFuncAttributeMaxDynamicSharedMemorySize, shared_mem)); + AT_CUDA_CHECK( + VLLM_DevFuncAttribute_SET_MaxDynamicSharedMemorySize((void *)kernel, shared_mem)); kernel<<<1, num_experts, shared_mem, stream>>>( topk_ids.data_ptr(), sorted_token_ids.data_ptr(),