Unverified commit 6fb0215e, authored by Luke, committed by GitHub
Browse files

[Bugfix] Use lazy string reference for DeepseekV3Config in config registry (#28958)


Signed-off-by: Luke <yq0536@gmail.com>
Signed-off-by: Isotr0py <mozf@mail2.sysu.edu.cn>
Co-authored-by: Isotr0py <mozf@mail2.sysu.edu.cn>
parent 55c21c88
...@@ -27,7 +27,7 @@ from huggingface_hub.utils import ( ...@@ -27,7 +27,7 @@ from huggingface_hub.utils import (
RevisionNotFoundError, RevisionNotFoundError,
) )
from packaging.version import Version from packaging.version import Version
from transformers import DeepseekV3Config, GenerationConfig, PretrainedConfig from transformers import GenerationConfig, PretrainedConfig
from transformers.configuration_utils import ALLOWED_LAYER_TYPES from transformers.configuration_utils import ALLOWED_LAYER_TYPES
from transformers.models.auto.image_processing_auto import get_image_processor_config from transformers.models.auto.image_processing_auto import get_image_processor_config
from transformers.models.auto.modeling_auto import ( from transformers.models.auto.modeling_auto import (
...@@ -84,7 +84,7 @@ _CONFIG_REGISTRY: dict[str, type[PretrainedConfig]] = LazyConfigDict( ...@@ -84,7 +84,7 @@ _CONFIG_REGISTRY: dict[str, type[PretrainedConfig]] = LazyConfigDict(
afmoe="AfmoeConfig", afmoe="AfmoeConfig",
chatglm="ChatGLMConfig", chatglm="ChatGLMConfig",
deepseek_vl_v2="DeepseekVLV2Config", deepseek_vl_v2="DeepseekVLV2Config",
deepseek_v32=DeepseekV3Config, deepseek_v32="DeepseekV3Config",
flex_olmo="FlexOlmoConfig", flex_olmo="FlexOlmoConfig",
kimi_linear="KimiLinearConfig", kimi_linear="KimiLinearConfig",
kimi_vl="KimiVLConfig", kimi_vl="KimiVLConfig",
......
...@@ -5,8 +5,13 @@ Model configs may be defined in this directory for the following reasons: ...@@ -5,8 +5,13 @@ Model configs may be defined in this directory for the following reasons:
- There is no configuration file defined by HF Hub or Transformers library. - There is no configuration file defined by HF Hub or Transformers library.
- There is a need to override the existing config to support vLLM. - There is a need to override the existing config to support vLLM.
- The HF model_type isn't recognized by the Transformers library but can
be mapped to an existing Transformers config, such as
deepseek-ai/DeepSeek-V3.2-Exp.
""" """
from transformers import DeepseekV3Config
from vllm.transformers_utils.configs.afmoe import AfmoeConfig from vllm.transformers_utils.configs.afmoe import AfmoeConfig
from vllm.transformers_utils.configs.chatglm import ChatGLMConfig from vllm.transformers_utils.configs.chatglm import ChatGLMConfig
from vllm.transformers_utils.configs.deepseek_vl2 import DeepseekVLV2Config from vllm.transformers_utils.configs.deepseek_vl2 import DeepseekVLV2Config
...@@ -44,6 +49,7 @@ __all__ = [ ...@@ -44,6 +49,7 @@ __all__ = [
"AfmoeConfig", "AfmoeConfig",
"ChatGLMConfig", "ChatGLMConfig",
"DeepseekVLV2Config", "DeepseekVLV2Config",
"DeepseekV3Config",
"DotsOCRConfig", "DotsOCRConfig",
"EAGLEConfig", "EAGLEConfig",
"FlexOlmoConfig", "FlexOlmoConfig",
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment