From 2212cd6cfb62196d1b26b0a6e4dcb10a1ea5f7d8 Mon Sep 17 00:00:00 2001
From: Varun Sundar Rabindranath <varunsundar08@gmail.com>
Date: Fri, 25 Jul 2025 08:47:29 +0530
Subject: [PATCH] [Bugfix] DeepGemm utils : Fix hardcoded type-cast (#21517)

Signed-off-by: Varun Sundar Rabindranath <vsundarr@redhat.com>
Co-authored-by: Varun Sundar Rabindranath <vsundarr@redhat.com>
---
 vllm/model_executor/layers/fused_moe/deep_gemm_utils.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/vllm/model_executor/layers/fused_moe/deep_gemm_utils.py b/vllm/model_executor/layers/fused_moe/deep_gemm_utils.py
index 8cc5a747c6731..c8469501af5db 100644
--- a/vllm/model_executor/layers/fused_moe/deep_gemm_utils.py
+++ b/vllm/model_executor/layers/fused_moe/deep_gemm_utils.py
@@ -52,7 +52,7 @@ def compute_aligned_M(M: int, num_topk: int, local_num_experts: int,
 @triton.jit
 def apply_expert_map(expert_id, expert_map):
     if expert_id != -1:
-        expert_id = tl.load(expert_map + expert_id).to(tl.int64)
+        expert_id = tl.load(expert_map + expert_id).to(expert_id.dtype)
     return expert_id