"vscode:/vscode.git/clone" did not exist on "30d8b2daff2749770ad8fe08d75900e7caf36aec"
Unverified Commit 8e797a47 authored by Rain Jiang, committed by GitHub
Browse files

fix: the hardcoded hf repo name comparison for deepseek-ocr (#12031)


Co-authored-by: gemini-code-assist[bot] <176961590+gemini-code-assist[bot]@users.noreply.github.com>
parent aa3003f1
......@@ -197,10 +197,14 @@ def get_config(
config = AutoConfig.from_pretrained(
model, trust_remote_code=trust_remote_code, revision=revision, **kwargs
)
if "deepseek-ai/DeepSeek-OCR" in model:
if (
getattr(config, "auto_map", None) is not None
and config.auto_map.get("AutoModel")
== "modeling_deepseekocr.DeepseekOCRForCausalLM"
):
config.model_type = "deepseek-ocr"
# Due to an unknown reason, Hugging Face’s AutoConfig mistakenly recognizes the configuration of deepseek-ocr as deepseekvl2.
# This is a temporary workaround and will require further optimization.
# TODO: Remove this workaround when AutoConfig correctly identifies deepseek-ocr.
# Hugging Face's AutoConfig currently misidentifies it as deepseekvl2.
except ValueError as e:
if not "deepseek_v32" in str(e):
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment