Unverified commit 8e797a47, authored by Rain Jiang and committed by GitHub
Browse files

fix: the hard-coded HF repo name comparison for deepseek-ocr (#12031)


Co-authored-by: gemini-code-assist[bot] <176961590+gemini-code-assist[bot]@users.noreply.github.com>
parent aa3003f1
...@@ -197,10 +197,14 @@ def get_config( ...@@ -197,10 +197,14 @@ def get_config(
config = AutoConfig.from_pretrained( config = AutoConfig.from_pretrained(
model, trust_remote_code=trust_remote_code, revision=revision, **kwargs model, trust_remote_code=trust_remote_code, revision=revision, **kwargs
) )
if "deepseek-ai/DeepSeek-OCR" in model: if (
getattr(config, "auto_map", None) is not None
and config.auto_map.get("AutoModel")
== "modeling_deepseekocr.DeepseekOCRForCausalLM"
):
config.model_type = "deepseek-ocr" config.model_type = "deepseek-ocr"
# Due to an unknown reason, Hugging Face’s AutoConfig mistakenly recognizes the configuration of deepseek-ocr as deepseekvl2. # TODO: Remove this workaround when AutoConfig correctly identifies deepseek-ocr.
# This is a temporary workaround and will require further optimization. # Hugging Face's AutoConfig currently misidentifies it as deepseekvl2.
except ValueError as e: except ValueError as e:
if not "deepseek_v32" in str(e): if not "deepseek_v32" in str(e):
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment