From b166ef20e1e5256913b34456507d89850a8dba38 Mon Sep 17 00:00:00 2001
From: zzhxxx
Date: Thu, 18 Dec 2025 12:45:56 +0800
Subject: [PATCH] [refactor] Add prefix support to embed_tokens in DeepSeek MTP (#30788)

Signed-off-by: zzhx1
---
 vllm/model_executor/models/deepseek_mtp.py | 1 +
 1 file changed, 1 insertion(+)

diff --git a/vllm/model_executor/models/deepseek_mtp.py b/vllm/model_executor/models/deepseek_mtp.py
index ca77b8322e2e8..c25e8422da157 100644
--- a/vllm/model_executor/models/deepseek_mtp.py
+++ b/vllm/model_executor/models/deepseek_mtp.py
@@ -141,6 +141,7 @@ class DeepSeekMultiTokenPredictor(nn.Module):
         self.embed_tokens = VocabParallelEmbedding(
             config.vocab_size,
             config.hidden_size,
+            prefix=maybe_prefix(prefix, "embed_tokens"),
         )
         self.logits_processor = LogitsProcessor(config.vocab_size)
 