mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2025-12-11 09:06:01 +08:00
[ROCm][Kernel] Using the correct warp_size value
This commit is contained in:
parent
75404d041b
commit
5b19b93082
@@ -207,8 +207,8 @@ __global__ void sgl_moe_align_block_size_kernel(
|
|||||||
__shared__ int32_t shared_counts[32][8];
|
__shared__ int32_t shared_counts[32][8];
|
||||||
__shared__ int32_t local_offsets[256];
|
__shared__ int32_t local_offsets[256];
|
||||||
|
|
||||||
const int warp_id = threadIdx.x / WARP_SIZE;
|
const int warp_id = threadIdx.x / 32;
|
||||||
const int lane_id = threadIdx.x % WARP_SIZE;
|
const int lane_id = threadIdx.x % 32;
|
||||||
const int experts_per_warp = 8;
|
const int experts_per_warp = 8;
|
||||||
const int my_expert_start = warp_id * experts_per_warp;
|
const int my_expert_start = warp_id * experts_per_warp;
|
||||||
|
|
||||||
|
|||||||
Loading…
x
Reference in New Issue
Block a user