mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2025-12-13 18:05:49 +08:00
[Bugfix] DeepGemm utils : Fix hardcoded type-cast (#21517)
Signed-off-by: Varun Sundar Rabindranath <vsundarr@redhat.com>
Co-authored-by: Varun Sundar Rabindranath <vsundarr@redhat.com>
This commit is contained in:
parent
ce3a9b1378
commit
2212cd6cfb
@@ -52,7 +52,7 @@ def compute_aligned_M(M: int, num_topk: int, local_num_experts: int,
 @triton.jit
 def apply_expert_map(expert_id, expert_map):
     if expert_id != -1:
-        expert_id = tl.load(expert_map + expert_id).to(tl.int64)
+        expert_id = tl.load(expert_map + expert_id).to(expert_id.dtype)
     return expert_id
 
 
Loading…
x
Reference in New Issue
Block a user