From 6fb0215eee44cf5e4b28f57e6739ef4a51945127 Mon Sep 17 00:00:00 2001
From: Luke
Date: Sun, 23 Nov 2025 06:43:21 -0500
Subject: [PATCH] [Bugfix] Use lazy string reference for DeepseekV3Config in config registry (#28958)

Signed-off-by: Luke
Signed-off-by: Isotr0py
Co-authored-by: Isotr0py
---
 vllm/transformers_utils/config.py           | 4 ++--
 vllm/transformers_utils/configs/__init__.py | 6 ++++++
 2 files changed, 8 insertions(+), 2 deletions(-)

diff --git a/vllm/transformers_utils/config.py b/vllm/transformers_utils/config.py
index db7bf228f411d..3d282da8c6112 100644
--- a/vllm/transformers_utils/config.py
+++ b/vllm/transformers_utils/config.py
@@ -27,7 +27,7 @@ from huggingface_hub.utils import (
     RevisionNotFoundError,
 )
 from packaging.version import Version
-from transformers import DeepseekV3Config, GenerationConfig, PretrainedConfig
+from transformers import GenerationConfig, PretrainedConfig
 from transformers.configuration_utils import ALLOWED_LAYER_TYPES
 from transformers.models.auto.image_processing_auto import get_image_processor_config
 from transformers.models.auto.modeling_auto import (
@@ -84,7 +84,7 @@ _CONFIG_REGISTRY: dict[str, type[PretrainedConfig]] = LazyConfigDict(
     afmoe="AfmoeConfig",
     chatglm="ChatGLMConfig",
     deepseek_vl_v2="DeepseekVLV2Config",
-    deepseek_v32=DeepseekV3Config,
+    deepseek_v32="DeepseekV3Config",
     flex_olmo="FlexOlmoConfig",
     kimi_linear="KimiLinearConfig",
     kimi_vl="KimiVLConfig",
diff --git a/vllm/transformers_utils/configs/__init__.py b/vllm/transformers_utils/configs/__init__.py
index dcae05a15fec3..d28fd8d033373 100644
--- a/vllm/transformers_utils/configs/__init__.py
+++ b/vllm/transformers_utils/configs/__init__.py
@@ -5,8 +5,13 @@ Model configs may be defined in this directory for the following reasons:
 
 - There is no configuration file defined by HF Hub or Transformers library.
 - There is a need to override the existing config to support vLLM.
+- The HF model_type isn't recognized by the Transformers library but can
+  be mapped to an existing Transformers config, such as
+  deepseek-ai/DeepSeek-V3.2-Exp.
 """
 
+from transformers import DeepseekV3Config
+
 from vllm.transformers_utils.configs.afmoe import AfmoeConfig
 from vllm.transformers_utils.configs.chatglm import ChatGLMConfig
 from vllm.transformers_utils.configs.deepseek_vl2 import DeepseekVLV2Config
@@ -44,6 +49,7 @@ __all__ = [
     "AfmoeConfig",
     "ChatGLMConfig",
     "DeepseekVLV2Config",
+    "DeepseekV3Config",
     "DotsOCRConfig",
     "EAGLEConfig",
     "FlexOlmoConfig",