Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
zhougaofeng
internlm2-math-7B
Commits
f6336192
Commit
f6336192
authored
Jun 11, 2024
by
zhougaofeng
Browse files
Upload New File
parent
34ce9ee3
Pipeline
#1147
canceled with stages
Changes
1
Pipelines
1
Hide whitespace changes
Inline
Side-by-side
Showing
1 changed file
with
1295 additions
and
0 deletions
+1295
-0
src/llmfactory/extras/constants.py
src/llmfactory/extras/constants.py
+1295
-0
No files found.
src/llmfactory/extras/constants.py
0 → 100644
View file @
f6336192
from
collections
import
OrderedDict
,
defaultdict
from
enum
import
Enum
from
typing
import
Dict
,
Optional
# --- File names -------------------------------------------------------------
DATA_CONFIG = "dataset_info.json"
RUNNING_LOG = "running_log.txt"
TRAINER_CONFIG = "trainer_config.yaml"
TRAINER_LOG = "trainer_log.jsonl"
V_HEAD_WEIGHTS_NAME = "value_head.bin"
V_HEAD_SAFE_WEIGHTS_NAME = "value_head.safetensors"

# --- Data handling ----------------------------------------------------------
# Maps a file extension to a type name; note that "jsonl" maps to "json" and
# "txt" maps to "text".
FILEEXT2TYPE = {
    "arrow": "arrow",
    "csv": "csv",
    "json": "json",
    "jsonl": "json",
    "parquet": "parquet",
    "txt": "text",
}
IGNORE_INDEX = -100
IMAGE_TOKEN = "<image>"
CHOICES = ["A", "B", "C", "D"]
SUBJECTS = [
    "Average",
    "STEM",
    "Social Sciences",
    "Humanities",
    "Other",
]

# --- Training options -------------------------------------------------------
METHODS = ["full", "freeze", "lora"]
PEFT_METHODS = ["lora"]
# Display name -> short stage identifier.
TRAINING_STAGES = {
    "Supervised Fine-Tuning": "sft",
    "Reward Modeling": "rm",
    "PPO": "ppo",
    "DPO": "dpo",
    "KTO": "kto",
    "ORPO": "orpo",
    "Pre-Training": "pt",
}
STAGES_USE_PAIR_DATA = ["rm", "dpo", "orpo"]
LAYERNORM_NAMES = {"norm", "ln"}
MOD_SUPPORTED_MODELS = [
    "bloom",
    "falcon",
    "gemma",
    "llama",
    "mistral",
    "mixtral",
    "phi",
    "starcoder2",
]
SUPPORTED_CLASS_FOR_S2ATTN = ["llama"]

# --- Model registries (filled in by register_model_group) --------------------
SUPPORTED_MODELS = OrderedDict()
# Both default to "" for a prefix that was never registered.
DEFAULT_MODULE = defaultdict(str)
DEFAULT_TEMPLATE = defaultdict(str)
VISION_MODELS = set()
class DownloadSource(str, Enum):
    """Keys used to tag the per-source repository ids of a registered model.

    Members are also ``str`` instances, so each compares equal to its raw
    value ("hf" / "ms").
    """

    # NOTE(review): "hf" presumably stands for the Hugging Face Hub - confirm
    # against the code that consumes this enum.
    DEFAULT = "hf"
    MODELSCOPE = "ms"
def register_model_group(
    models: Dict[str, Dict[DownloadSource, str]],
    module: Optional[str] = None,
    template: Optional[str] = None,
    vision: bool = False,
) -> None:
    """Register a group of models that share one name prefix.

    Every entry of ``models`` is stored in ``SUPPORTED_MODELS`` in iteration
    order. The group's prefix is the part of each model name before the first
    ``"-"``; the optional defaults are recorded under that prefix.

    Args:
        models: Maps a model name to a ``{DownloadSource: path}`` dict.
        module: If given, stored as ``DEFAULT_MODULE[prefix]``.
        template: If given, stored as ``DEFAULT_TEMPLATE[prefix]``.
        vision: If true, the prefix is added to ``VISION_MODELS``.

    Raises:
        AssertionError: If the model names do not all share the same prefix.
            Nothing is registered in that case.
    """
    # Validate the whole group before touching any registry, so a malformed
    # group is rejected as a unit instead of being half-registered.
    prefixes = {name.split("-")[0] for name in models}
    if len(prefixes) > 1:
        # Raised explicitly rather than via `assert` so the check still runs
        # under `python -O`; the exception type is kept unchanged.
        raise AssertionError("prefix should be identical.")
    if not prefixes:
        # Empty group: there is no prefix to key the defaults on, and using
        # None as a registry key would only pollute the lookup tables.
        return

    (prefix,) = prefixes
    SUPPORTED_MODELS.update(models)

    if module is not None:
        DEFAULT_MODULE[prefix] = module
    if template is not None:
        DEFAULT_TEMPLATE[prefix] = template
    if vision:
        VISION_MODELS.add(prefix)
# Baichuan group: names share the "Baichuan" prefix, which receives the
# default module "W_pack" and the template "baichuan".
register_model_group(
    models={
        "Baichuan-7B-Base": {
            DownloadSource.DEFAULT: "baichuan-inc/Baichuan-7B",
            DownloadSource.MODELSCOPE: "baichuan-inc/baichuan-7B",
        },
        "Baichuan-13B-Base": {
            DownloadSource.DEFAULT: "baichuan-inc/Baichuan-13B-Base",
            DownloadSource.MODELSCOPE: "baichuan-inc/Baichuan-13B-Base",
        },
        "Baichuan-13B-Chat": {
            DownloadSource.DEFAULT: "baichuan-inc/Baichuan-13B-Chat",
            DownloadSource.MODELSCOPE: "baichuan-inc/Baichuan-13B-Chat",
        },
    },
    module="W_pack",
    template="baichuan",
)
# Baichuan2 group: prefix "Baichuan2", default module "W_pack", template
# "baichuan2".
register_model_group(
    models={
        "Baichuan2-7B-Base": {
            DownloadSource.DEFAULT: "baichuan-inc/Baichuan2-7B-Base",
            DownloadSource.MODELSCOPE: "baichuan-inc/Baichuan2-7B-Base",
        },
        "Baichuan2-13B-Base": {
            DownloadSource.DEFAULT: "baichuan-inc/Baichuan2-13B-Base",
            DownloadSource.MODELSCOPE: "baichuan-inc/Baichuan2-13B-Base",
        },
        "Baichuan2-7B-Chat": {
            DownloadSource.DEFAULT: "baichuan-inc/Baichuan2-7B-Chat",
            DownloadSource.MODELSCOPE: "baichuan-inc/Baichuan2-7B-Chat",
        },
        "Baichuan2-13B-Chat": {
            DownloadSource.DEFAULT: "baichuan-inc/Baichuan2-13B-Chat",
            DownloadSource.MODELSCOPE: "baichuan-inc/Baichuan2-13B-Chat",
        },
    },
    module="W_pack",
    template="baichuan2",
)
# BLOOM group: prefix "BLOOM", default module "query_key_value"; no template
# is registered for this prefix.
register_model_group(
    models={
        "BLOOM-560M": {
            DownloadSource.DEFAULT: "bigscience/bloom-560m",
            DownloadSource.MODELSCOPE: "AI-ModelScope/bloom-560m",
        },
        "BLOOM-3B": {
            DownloadSource.DEFAULT: "bigscience/bloom-3b",
            DownloadSource.MODELSCOPE: "AI-ModelScope/bloom-3b",
        },
        "BLOOM-7B1": {
            DownloadSource.DEFAULT: "bigscience/bloom-7b1",
            DownloadSource.MODELSCOPE: "AI-ModelScope/bloom-7b1",
        },
    },
    module="query_key_value",
)
# BLOOMZ group: prefix "BLOOMZ", default module "query_key_value"; no template
# is registered for this prefix.
register_model_group(
    models={
        "BLOOMZ-560M": {
            DownloadSource.DEFAULT: "bigscience/bloomz-560m",
            DownloadSource.MODELSCOPE: "AI-ModelScope/bloomz-560m",
        },
        "BLOOMZ-3B": {
            DownloadSource.DEFAULT: "bigscience/bloomz-3b",
            DownloadSource.MODELSCOPE: "AI-ModelScope/bloomz-3b",
        },
        "BLOOMZ-7B1-mt": {
            DownloadSource.DEFAULT: "bigscience/bloomz-7b1-mt",
            DownloadSource.MODELSCOPE: "AI-ModelScope/bloomz-7b1-mt",
        },
    },
    module="query_key_value",
)
# BlueLM group: prefix "BlueLM", template "bluelm".
register_model_group(
    models={
        "BlueLM-7B-Base": {
            DownloadSource.DEFAULT: "vivo-ai/BlueLM-7B-Base",
            DownloadSource.MODELSCOPE: "vivo-ai/BlueLM-7B-Base",
        },
        "BlueLM-7B-Chat": {
            DownloadSource.DEFAULT: "vivo-ai/BlueLM-7B-Chat",
            DownloadSource.MODELSCOPE: "vivo-ai/BlueLM-7B-Chat",
        },
    },
    template="bluelm",
)
# Breeze group: prefix "Breeze", template "breeze". Neither entry lists a
# ModelScope id.
register_model_group(
    models={
        "Breeze-7B": {
            DownloadSource.DEFAULT: "MediaTek-Research/Breeze-7B-Base-v1_0",
        },
        "Breeze-7B-Chat": {
            DownloadSource.DEFAULT: "MediaTek-Research/Breeze-7B-Instruct-v1_0",
        },
    },
    template="breeze",
)
# ChatGLM2 group: prefix "ChatGLM2", default module "query_key_value",
# template "chatglm2".
register_model_group(
    models={
        "ChatGLM2-6B-Chat": {
            DownloadSource.DEFAULT: "THUDM/chatglm2-6b",
            DownloadSource.MODELSCOPE: "ZhipuAI/chatglm2-6b",
        }
    },
    module="query_key_value",
    template="chatglm2",
)
# ChatGLM3 group: prefix "ChatGLM3", default module "query_key_value",
# template "chatglm3".
register_model_group(
    models={
        "ChatGLM3-6B-Base": {
            DownloadSource.DEFAULT: "THUDM/chatglm3-6b-base",
            DownloadSource.MODELSCOPE: "ZhipuAI/chatglm3-6b-base",
        },
        "ChatGLM3-6B-Chat": {
            DownloadSource.DEFAULT: "THUDM/chatglm3-6b",
            DownloadSource.MODELSCOPE: "ZhipuAI/chatglm3-6b",
        },
    },
    module="query_key_value",
    template="chatglm3",
)
# ChineseLLaMA2 group: prefix "ChineseLLaMA2", template "llama2_zh". The
# "-Chat" names point at the "chinese-alpaca-2" repositories.
register_model_group(
    models={
        "ChineseLLaMA2-1.3B": {
            DownloadSource.DEFAULT: "hfl/chinese-llama-2-1.3b",
            DownloadSource.MODELSCOPE: "AI-ModelScope/chinese-llama-2-1.3b",
        },
        "ChineseLLaMA2-7B": {
            DownloadSource.DEFAULT: "hfl/chinese-llama-2-7b",
            DownloadSource.MODELSCOPE: "AI-ModelScope/chinese-llama-2-7b",
        },
        "ChineseLLaMA2-13B": {
            DownloadSource.DEFAULT: "hfl/chinese-llama-2-13b",
            DownloadSource.MODELSCOPE: "AI-ModelScope/chinese-llama-2-13b",
        },
        "ChineseLLaMA2-1.3B-Chat": {
            DownloadSource.DEFAULT: "hfl/chinese-alpaca-2-1.3b",
            DownloadSource.MODELSCOPE: "AI-ModelScope/chinese-alpaca-2-1.3b",
        },
        "ChineseLLaMA2-7B-Chat": {
            DownloadSource.DEFAULT: "hfl/chinese-alpaca-2-7b",
            DownloadSource.MODELSCOPE: "AI-ModelScope/chinese-alpaca-2-7b",
        },
        "ChineseLLaMA2-13B-Chat": {
            DownloadSource.DEFAULT: "hfl/chinese-alpaca-2-13b",
            DownloadSource.MODELSCOPE: "AI-ModelScope/chinese-alpaca-2-13b",
        },
    },
    template="llama2_zh",
)
# CommandR group: prefix "CommandR", template "cohere". The last entry lists
# no ModelScope id.
register_model_group(
    models={
        "CommandR-35B-Chat": {
            DownloadSource.DEFAULT: "CohereForAI/c4ai-command-r-v01",
            DownloadSource.MODELSCOPE: "AI-ModelScope/c4ai-command-r-v01",
        },
        "CommandR-Plus-104B-Chat": {
            DownloadSource.DEFAULT: "CohereForAI/c4ai-command-r-plus",
            DownloadSource.MODELSCOPE: "AI-ModelScope/c4ai-command-r-plus",
        },
        "CommandR-35B-4bit-Chat": {
            DownloadSource.DEFAULT: "CohereForAI/c4ai-command-r-v01-4bit",
            DownloadSource.MODELSCOPE: "mirror013/c4ai-command-r-v01-4bit",
        },
        "CommandR-Plus-104B-4bit-Chat": {
            DownloadSource.DEFAULT: "CohereForAI/c4ai-command-r-plus-4bit",
        },
    },
    template="cohere",
)
# DBRX group: prefix "DBRX", default module "Wqkv", template "dbrx".
register_model_group(
    models={
        "DBRX-132B-Base": {
            DownloadSource.DEFAULT: "databricks/dbrx-base",
            DownloadSource.MODELSCOPE: "AI-ModelScope/dbrx-base",
        },
        "DBRX-132B-Chat": {
            DownloadSource.DEFAULT: "databricks/dbrx-instruct",
            DownloadSource.MODELSCOPE: "AI-ModelScope/dbrx-instruct",
        },
    },
    module="Wqkv",
    template="dbrx",
)
# DeepSeek group: prefix "DeepSeek", template "deepseek". The two
# "DeepSeek-MoE-16B-v2-*" entries list no ModelScope id.
register_model_group(
    models={
        "DeepSeek-LLM-7B-Base": {
            DownloadSource.DEFAULT: "deepseek-ai/deepseek-llm-7b-base",
            DownloadSource.MODELSCOPE: "deepseek-ai/deepseek-llm-7b-base",
        },
        "DeepSeek-LLM-67B-Base": {
            DownloadSource.DEFAULT: "deepseek-ai/deepseek-llm-67b-base",
            DownloadSource.MODELSCOPE: "deepseek-ai/deepseek-llm-67b-base",
        },
        "DeepSeek-LLM-7B-Chat": {
            DownloadSource.DEFAULT: "deepseek-ai/deepseek-llm-7b-chat",
            DownloadSource.MODELSCOPE: "deepseek-ai/deepseek-llm-7b-chat",
        },
        "DeepSeek-LLM-67B-Chat": {
            DownloadSource.DEFAULT: "deepseek-ai/deepseek-llm-67b-chat",
            DownloadSource.MODELSCOPE: "deepseek-ai/deepseek-llm-67b-chat",
        },
        "DeepSeek-Math-7B-Base": {
            DownloadSource.DEFAULT: "deepseek-ai/deepseek-math-7b-base",
            DownloadSource.MODELSCOPE: "deepseek-ai/deepseek-math-7b-base",
        },
        "DeepSeek-Math-7B-Chat": {
            DownloadSource.DEFAULT: "deepseek-ai/deepseek-math-7b-instruct",
            DownloadSource.MODELSCOPE: "deepseek-ai/deepseek-math-7b-instruct",
        },
        "DeepSeek-MoE-16B-Base": {
            DownloadSource.DEFAULT: "deepseek-ai/deepseek-moe-16b-base",
            DownloadSource.MODELSCOPE: "deepseek-ai/deepseek-moe-16b-base",
        },
        "DeepSeek-MoE-16B-v2-Base": {
            DownloadSource.DEFAULT: "deepseek-ai/DeepSeek-V2-Lite",
        },
        "DeepSeek-MoE-236B-Base": {
            DownloadSource.DEFAULT: "deepseek-ai/DeepSeek-V2",
            DownloadSource.MODELSCOPE: "deepseek-ai/DeepSeek-V2",
        },
        "DeepSeek-MoE-16B-Chat": {
            DownloadSource.DEFAULT: "deepseek-ai/deepseek-moe-16b-chat",
            DownloadSource.MODELSCOPE: "deepseek-ai/deepseek-moe-16b-chat",
        },
        "DeepSeek-MoE-16B-v2-Chat": {
            DownloadSource.DEFAULT: "deepseek-ai/DeepSeek-V2-Lite-Chat",
        },
        "DeepSeek-MoE-236B-Chat": {
            DownloadSource.DEFAULT: "deepseek-ai/DeepSeek-V2-Chat",
            DownloadSource.MODELSCOPE: "deepseek-ai/DeepSeek-V2-Chat",
        },
    },
    template="deepseek",
)
# DeepSeekCoder group: prefix "DeepSeekCoder", template "deepseekcoder". The
# two 7B (v1.5) entries list no ModelScope id.
register_model_group(
    models={
        "DeepSeekCoder-6.7B-Base": {
            DownloadSource.DEFAULT: "deepseek-ai/deepseek-coder-6.7b-base",
            DownloadSource.MODELSCOPE: "deepseek-ai/deepseek-coder-6.7b-base",
        },
        "DeepSeekCoder-7B-Base": {
            DownloadSource.DEFAULT: "deepseek-ai/deepseek-coder-7b-base-v1.5",
        },
        "DeepSeekCoder-33B-Base": {
            DownloadSource.DEFAULT: "deepseek-ai/deepseek-coder-33b-base",
            DownloadSource.MODELSCOPE: "deepseek-ai/deepseek-coder-33b-base",
        },
        "DeepSeekCoder-6.7B-Chat": {
            DownloadSource.DEFAULT: "deepseek-ai/deepseek-coder-6.7b-instruct",
            DownloadSource.MODELSCOPE: "deepseek-ai/deepseek-coder-6.7b-instruct",
        },
        "DeepSeekCoder-7B-Chat": {
            DownloadSource.DEFAULT: "deepseek-ai/deepseek-coder-7b-instruct-v1.5",
        },
        "DeepSeekCoder-33B-Chat": {
            DownloadSource.DEFAULT: "deepseek-ai/deepseek-coder-33b-instruct",
            DownloadSource.MODELSCOPE: "deepseek-ai/deepseek-coder-33b-instruct",
        },
    },
    template="deepseekcoder",
)
# Falcon group: prefix "Falcon", default module "query_key_value", template
# "falcon". "Falcon-11B" lists no ModelScope id.
register_model_group(
    models={
        "Falcon-7B": {
            DownloadSource.DEFAULT: "tiiuae/falcon-7b",
            DownloadSource.MODELSCOPE: "AI-ModelScope/falcon-7b",
        },
        "Falcon-11B": {
            DownloadSource.DEFAULT: "tiiuae/falcon-11B",
        },
        "Falcon-40B": {
            DownloadSource.DEFAULT: "tiiuae/falcon-40b",
            DownloadSource.MODELSCOPE: "AI-ModelScope/falcon-40b",
        },
        "Falcon-180B": {
            DownloadSource.DEFAULT: "tiiuae/falcon-180b",
            DownloadSource.MODELSCOPE: "modelscope/falcon-180B",
        },
        "Falcon-7B-Chat": {
            DownloadSource.DEFAULT: "tiiuae/falcon-7b-instruct",
            DownloadSource.MODELSCOPE: "AI-ModelScope/falcon-7b-instruct",
        },
        "Falcon-40B-Chat": {
            DownloadSource.DEFAULT: "tiiuae/falcon-40b-instruct",
            DownloadSource.MODELSCOPE: "AI-ModelScope/falcon-40b-instruct",
        },
        "Falcon-180B-Chat": {
            DownloadSource.DEFAULT: "tiiuae/falcon-180b-chat",
            DownloadSource.MODELSCOPE: "modelscope/falcon-180B-chat",
        },
    },
    module="query_key_value",
    template="falcon",
)
# Gemma group: prefix "Gemma", template "gemma".
# The ModelScope ids of "Gemma-7B" and "Gemma-2B-Chat" were swapped (the 7B
# base model pointed at gemma-2b-it and the 2B chat model at gemma-7b); each
# entry now mirrors the size and variant of its DEFAULT repository.
register_model_group(
    models={
        "Gemma-2B": {
            DownloadSource.DEFAULT: "google/gemma-2b",
            DownloadSource.MODELSCOPE: "AI-ModelScope/gemma-2b",
        },
        "Gemma-7B": {
            DownloadSource.DEFAULT: "google/gemma-7b",
            DownloadSource.MODELSCOPE: "AI-ModelScope/gemma-7b",
        },
        "Gemma-2B-Chat": {
            DownloadSource.DEFAULT: "google/gemma-2b-it",
            DownloadSource.MODELSCOPE: "AI-ModelScope/gemma-2b-it",
        },
        "Gemma-7B-Chat": {
            DownloadSource.DEFAULT: "google/gemma-7b-it",
            DownloadSource.MODELSCOPE: "AI-ModelScope/gemma-7b-it",
        },
    },
    template="gemma",
)
# CodeGemma group: prefix "CodeGemma", template "gemma". Only the chat entry
# lists a ModelScope id.
register_model_group(
    models={
        "CodeGemma-2B": {
            DownloadSource.DEFAULT: "google/codegemma-1.1-2b",
        },
        "CodeGemma-7B": {
            DownloadSource.DEFAULT: "google/codegemma-7b",
        },
        "CodeGemma-7B-Chat": {
            DownloadSource.DEFAULT: "google/codegemma-1.1-7b-it",
            DownloadSource.MODELSCOPE: "AI-ModelScope/codegemma-7b-it",
        },
    },
    template="gemma",
)
# InternLM group: prefix "InternLM", template "intern".
register_model_group(
    models={
        "InternLM-7B": {
            DownloadSource.DEFAULT: "internlm/internlm-7b",
            DownloadSource.MODELSCOPE: "Shanghai_AI_Laboratory/internlm-7b",
        },
        "InternLM-20B": {
            DownloadSource.DEFAULT: "internlm/internlm-20b",
            DownloadSource.MODELSCOPE: "Shanghai_AI_Laboratory/internlm-20b",
        },
        "InternLM-7B-Chat": {
            DownloadSource.DEFAULT: "internlm/internlm-chat-7b",
            DownloadSource.MODELSCOPE: "Shanghai_AI_Laboratory/internlm-chat-7b",
        },
        "InternLM-20B-Chat": {
            DownloadSource.DEFAULT: "internlm/internlm-chat-20b",
            DownloadSource.MODELSCOPE: "Shanghai_AI_Laboratory/internlm-chat-20b",
        },
    },
    template="intern",
)
# InternLM2 group: prefix "InternLM2", default module "wqkv", template
# "intern2".
register_model_group(
    models={
        "InternLM2-7B": {
            DownloadSource.DEFAULT: "internlm/internlm2-7b",
            DownloadSource.MODELSCOPE: "Shanghai_AI_Laboratory/internlm2-7b",
        },
        "InternLM2-20B": {
            DownloadSource.DEFAULT: "internlm/internlm2-20b",
            DownloadSource.MODELSCOPE: "Shanghai_AI_Laboratory/internlm2-20b",
        },
        "InternLM2-7B-Chat": {
            DownloadSource.DEFAULT: "internlm/internlm2-chat-7b",
            DownloadSource.MODELSCOPE: "Shanghai_AI_Laboratory/internlm2-chat-7b",
        },
        "InternLM2-20B-Chat": {
            DownloadSource.DEFAULT: "internlm/internlm2-chat-20b",
            DownloadSource.MODELSCOPE: "Shanghai_AI_Laboratory/internlm2-chat-20b",
        },
    },
    module="wqkv",
    template="intern2",
)
# Single-model group with no default module or template.
# NOTE(review): the registered name is spelled "Jambda" while both repository
# ids say "Jamba" - this looks like a typo, but renaming it changes the key
# under which the model is registered; confirm before changing.
register_model_group(
    models={
        "Jambda-v0.1": {
            DownloadSource.DEFAULT: "ai21labs/Jamba-v0.1",
            DownloadSource.MODELSCOPE: "AI-ModelScope/Jamba-v0.1",
        }
    },
)
# LingoWhale group: prefix "LingoWhale", default module "qkv_proj"; no
# template is registered for this prefix.
register_model_group(
    models={
        "LingoWhale-8B": {
            DownloadSource.DEFAULT: "deeplang-ai/LingoWhale-8B",
            DownloadSource.MODELSCOPE: "DeepLang/LingoWhale-8B",
        }
    },
    module="qkv_proj",
)
# LLaMA group: prefix "LLaMA"; neither a default module nor a template is
# registered.
register_model_group(
    models={
        "LLaMA-7B": {
            DownloadSource.DEFAULT: "huggyllama/llama-7b",
            DownloadSource.MODELSCOPE: "skyline2006/llama-7b",
        },
        "LLaMA-13B": {
            DownloadSource.DEFAULT: "huggyllama/llama-13b",
            DownloadSource.MODELSCOPE: "skyline2006/llama-13b",
        },
        "LLaMA-30B": {
            DownloadSource.DEFAULT: "huggyllama/llama-30b",
            DownloadSource.MODELSCOPE: "skyline2006/llama-30b",
        },
        "LLaMA-65B": {
            DownloadSource.DEFAULT: "huggyllama/llama-65b",
            DownloadSource.MODELSCOPE: "skyline2006/llama-65b",
        },
    }
)
# LLaMA2 group: prefix "LLaMA2", template "llama2".
register_model_group(
    models={
        "LLaMA2-7B": {
            DownloadSource.DEFAULT: "meta-llama/Llama-2-7b-hf",
            DownloadSource.MODELSCOPE: "modelscope/Llama-2-7b-ms",
        },
        "LLaMA2-13B": {
            DownloadSource.DEFAULT: "meta-llama/Llama-2-13b-hf",
            DownloadSource.MODELSCOPE: "modelscope/Llama-2-13b-ms",
        },
        "LLaMA2-70B": {
            DownloadSource.DEFAULT: "meta-llama/Llama-2-70b-hf",
            DownloadSource.MODELSCOPE: "modelscope/Llama-2-70b-ms",
        },
        "LLaMA2-7B-Chat": {
            DownloadSource.DEFAULT: "meta-llama/Llama-2-7b-chat-hf",
            DownloadSource.MODELSCOPE: "modelscope/Llama-2-7b-chat-ms",
        },
        "LLaMA2-13B-Chat": {
            DownloadSource.DEFAULT: "meta-llama/Llama-2-13b-chat-hf",
            DownloadSource.MODELSCOPE: "modelscope/Llama-2-13b-chat-ms",
        },
        "LLaMA2-70B-Chat": {
            DownloadSource.DEFAULT: "meta-llama/Llama-2-70b-chat-hf",
            DownloadSource.MODELSCOPE: "modelscope/Llama-2-70b-chat-ms",
        },
    },
    template="llama2",
)
# LLaMA3 group: prefix "LLaMA3", template "llama3". The last entry lists no
# ModelScope id.
register_model_group(
    models={
        "LLaMA3-8B": {
            DownloadSource.DEFAULT: "meta-llama/Meta-Llama-3-8B",
            DownloadSource.MODELSCOPE: "LLM-Research/Meta-Llama-3-8B",
        },
        "LLaMA3-70B": {
            DownloadSource.DEFAULT: "meta-llama/Meta-Llama-3-70B",
            DownloadSource.MODELSCOPE: "LLM-Research/Meta-Llama-3-70B",
        },
        "LLaMA3-8B-Chat": {
            DownloadSource.DEFAULT: "meta-llama/Meta-Llama-3-8B-Instruct",
            DownloadSource.MODELSCOPE: "LLM-Research/Meta-Llama-3-8B-Instruct",
        },
        "LLaMA3-70B-Chat": {
            DownloadSource.DEFAULT: "meta-llama/Meta-Llama-3-70B-Instruct",
            DownloadSource.MODELSCOPE: "LLM-Research/Meta-Llama-3-70B-Instruct",
        },
        "LLaMA3-8B-Chinese-Chat": {
            DownloadSource.DEFAULT: "shenzhi-wang/Llama3-8B-Chinese-Chat",
            DownloadSource.MODELSCOPE: "LLM-Research/Llama3-8B-Chinese-Chat",
        },
        "LLaMA3-70B-Chinese-Chat": {
            DownloadSource.DEFAULT: "shenzhi-wang/Llama3-70B-Chinese-Chat",
        },
    },
    template="llama3",
)
# LLaVA1.5 group: prefix "LLaVA1.5", template "vicuna"; vision=True adds the
# prefix to VISION_MODELS. No ModelScope ids are listed.
register_model_group(
    models={
        "LLaVA1.5-7B-Chat": {
            DownloadSource.DEFAULT: "llava-hf/llava-1.5-7b-hf",
        },
        "LLaVA1.5-13B-Chat": {
            DownloadSource.DEFAULT: "llava-hf/llava-1.5-13b-hf",
        },
    },
    template="vicuna",
    vision=True,
)
# Mistral group: prefix "Mistral", template "mistral".
register_model_group(
    models={
        "Mistral-7B-v0.1": {
            DownloadSource.DEFAULT: "mistralai/Mistral-7B-v0.1",
            DownloadSource.MODELSCOPE: "AI-ModelScope/Mistral-7B-v0.1",
        },
        "Mistral-7B-v0.1-Chat": {
            DownloadSource.DEFAULT: "mistralai/Mistral-7B-Instruct-v0.1",
            DownloadSource.MODELSCOPE: "AI-ModelScope/Mistral-7B-Instruct-v0.1",
        },
        "Mistral-7B-v0.2": {
            DownloadSource.DEFAULT: "alpindale/Mistral-7B-v0.2-hf",
            DownloadSource.MODELSCOPE: "AI-ModelScope/Mistral-7B-v0.2-hf",
        },
        "Mistral-7B-v0.2-Chat": {
            DownloadSource.DEFAULT: "mistralai/Mistral-7B-Instruct-v0.2",
            DownloadSource.MODELSCOPE: "AI-ModelScope/Mistral-7B-Instruct-v0.2",
        },
    },
    template="mistral",
)
# Mixtral group: prefix "Mixtral", registered with the same template name as
# the Mistral group ("mistral"). The last entry lists no ModelScope id.
register_model_group(
    models={
        "Mixtral-8x7B-v0.1": {
            DownloadSource.DEFAULT: "mistralai/Mixtral-8x7B-v0.1",
            DownloadSource.MODELSCOPE: "AI-ModelScope/Mixtral-8x7B-v0.1",
        },
        "Mixtral-8x7B-v0.1-Chat": {
            DownloadSource.DEFAULT: "mistralai/Mixtral-8x7B-Instruct-v0.1",
            DownloadSource.MODELSCOPE: "AI-ModelScope/Mixtral-8x7B-Instruct-v0.1",
        },
        "Mixtral-8x22B-v0.1": {
            DownloadSource.DEFAULT: "mistralai/Mixtral-8x22B-v0.1",
            DownloadSource.MODELSCOPE: "AI-ModelScope/Mixtral-8x22B-v0.1",
        },
        "Mixtral-8x22B-v0.1-Chat": {
            DownloadSource.DEFAULT: "mistralai/Mixtral-8x22B-Instruct-v0.1",
        },
    },
    template="mistral",
)
# OLMo group: prefix "OLMo"; no default module or template, and no ModelScope
# ids are listed.
register_model_group(
    models={
        "OLMo-1B": {
            DownloadSource.DEFAULT: "allenai/OLMo-1B-hf",
        },
        "OLMo-7B": {
            DownloadSource.DEFAULT: "allenai/OLMo-7B-hf",
        },
        "OLMo-1.7-7B": {
            DownloadSource.DEFAULT: "allenai/OLMo-1.7-7B-hf",
        },
    },
)
# OpenChat group: prefix "OpenChat3.5", template "openchat".
register_model_group(
    models={
        "OpenChat3.5-7B-Chat": {
            DownloadSource.DEFAULT: "openchat/openchat-3.5-0106",
            DownloadSource.MODELSCOPE: "xcwzxcwz/openchat-3.5-0106",
        }
    },
    template="openchat",
)
# Orion group: prefix "Orion", template "orion".
register_model_group(
    models={
        "Orion-14B-Base": {
            DownloadSource.DEFAULT: "OrionStarAI/Orion-14B-Base",
            DownloadSource.MODELSCOPE: "OrionStarAI/Orion-14B-Base",
        },
        "Orion-14B-Chat": {
            DownloadSource.DEFAULT: "OrionStarAI/Orion-14B-Chat",
            DownloadSource.MODELSCOPE: "OrionStarAI/Orion-14B-Chat",
        },
        "Orion-14B-Long-Chat": {
            DownloadSource.DEFAULT: "OrionStarAI/Orion-14B-LongChat",
            DownloadSource.MODELSCOPE: "OrionStarAI/Orion-14B-LongChat",
        },
        "Orion-14B-RAG-Chat": {
            DownloadSource.DEFAULT: "OrionStarAI/Orion-14B-Chat-RAG",
            DownloadSource.MODELSCOPE: "OrionStarAI/Orion-14B-Chat-RAG",
        },
        "Orion-14B-Plugin-Chat": {
            DownloadSource.DEFAULT: "OrionStarAI/Orion-14B-Chat-Plugin",
            DownloadSource.MODELSCOPE: "OrionStarAI/Orion-14B-Chat-Plugin",
        },
    },
    template="orion",
)
# PaliGemma group: prefix "PaliGemma"; vision=True adds the prefix to
# VISION_MODELS. No template, default module or ModelScope ids are given.
register_model_group(
    models={
        "PaliGemma-3B-pt-224": {
            DownloadSource.DEFAULT: "google/paligemma-3b-pt-224",
        },
        "PaliGemma-3B-pt-448": {
            DownloadSource.DEFAULT: "google/paligemma-3b-pt-448",
        },
        "PaliGemma-3B-pt-896": {
            DownloadSource.DEFAULT: "google/paligemma-3b-pt-896",
        },
        "PaliGemma-3B-mix-224": {
            DownloadSource.DEFAULT: "google/paligemma-3b-mix-224",
        },
        "PaliGemma-3B-mix-448": {
            DownloadSource.DEFAULT: "google/paligemma-3b-mix-448",
        },
    },
    vision=True,
)
# Phi group: prefix "Phi"; neither a default module nor a template is
# registered.
register_model_group(
    models={
        "Phi-1.5-1.3B": {
            DownloadSource.DEFAULT: "microsoft/phi-1_5",
            DownloadSource.MODELSCOPE: "allspace/PHI_1-5",
        },
        "Phi-2-2.7B": {
            DownloadSource.DEFAULT: "microsoft/phi-2",
            DownloadSource.MODELSCOPE: "AI-ModelScope/phi-2",
        },
    }
)
# Phi3 group: prefix "Phi3", default module "qkv_proj", template "phi".
register_model_group(
    models={
        "Phi3-3.8B-4k-Chat": {
            DownloadSource.DEFAULT: "microsoft/Phi-3-mini-4k-instruct",
            DownloadSource.MODELSCOPE: "LLM-Research/Phi-3-mini-4k-instruct",
        },
        "Phi3-3.8B-128k-Chat": {
            DownloadSource.DEFAULT: "microsoft/Phi-3-mini-128k-instruct",
            DownloadSource.MODELSCOPE: "LLM-Research/Phi-3-mini-128k-instruct",
        },
    },
    module="qkv_proj",
    template="phi",
)
# Qwen group: prefix "Qwen", default module "c_attn", template "qwen". Covers
# base, chat and Int8/Int4 chat repositories.
register_model_group(
    models={
        "Qwen-1.8B": {
            DownloadSource.DEFAULT: "Qwen/Qwen-1_8B",
            DownloadSource.MODELSCOPE: "qwen/Qwen-1_8B",
        },
        "Qwen-7B": {
            DownloadSource.DEFAULT: "Qwen/Qwen-7B",
            DownloadSource.MODELSCOPE: "qwen/Qwen-7B",
        },
        "Qwen-14B": {
            DownloadSource.DEFAULT: "Qwen/Qwen-14B",
            DownloadSource.MODELSCOPE: "qwen/Qwen-14B",
        },
        "Qwen-72B": {
            DownloadSource.DEFAULT: "Qwen/Qwen-72B",
            DownloadSource.MODELSCOPE: "qwen/Qwen-72B",
        },
        "Qwen-1.8B-Chat": {
            DownloadSource.DEFAULT: "Qwen/Qwen-1_8B-Chat",
            DownloadSource.MODELSCOPE: "qwen/Qwen-1_8B-Chat",
        },
        "Qwen-7B-Chat": {
            DownloadSource.DEFAULT: "Qwen/Qwen-7B-Chat",
            DownloadSource.MODELSCOPE: "qwen/Qwen-7B-Chat",
        },
        "Qwen-14B-Chat": {
            DownloadSource.DEFAULT: "Qwen/Qwen-14B-Chat",
            DownloadSource.MODELSCOPE: "qwen/Qwen-14B-Chat",
        },
        "Qwen-72B-Chat": {
            DownloadSource.DEFAULT: "Qwen/Qwen-72B-Chat",
            DownloadSource.MODELSCOPE: "qwen/Qwen-72B-Chat",
        },
        "Qwen-1.8B-int8-Chat": {
            DownloadSource.DEFAULT: "Qwen/Qwen-1_8B-Chat-Int8",
            DownloadSource.MODELSCOPE: "qwen/Qwen-1_8B-Chat-Int8",
        },
        "Qwen-1.8B-int4-Chat": {
            DownloadSource.DEFAULT: "Qwen/Qwen-1_8B-Chat-Int4",
            DownloadSource.MODELSCOPE: "qwen/Qwen-1_8B-Chat-Int4",
        },
        "Qwen-7B-int8-Chat": {
            DownloadSource.DEFAULT: "Qwen/Qwen-7B-Chat-Int8",
            DownloadSource.MODELSCOPE: "qwen/Qwen-7B-Chat-Int8",
        },
        "Qwen-7B-int4-Chat": {
            DownloadSource.DEFAULT: "Qwen/Qwen-7B-Chat-Int4",
            DownloadSource.MODELSCOPE: "qwen/Qwen-7B-Chat-Int4",
        },
        "Qwen-14B-int8-Chat": {
            DownloadSource.DEFAULT: "Qwen/Qwen-14B-Chat-Int8",
            DownloadSource.MODELSCOPE: "qwen/Qwen-14B-Chat-Int8",
        },
        "Qwen-14B-int4-Chat": {
            DownloadSource.DEFAULT: "Qwen/Qwen-14B-Chat-Int4",
            DownloadSource.MODELSCOPE: "qwen/Qwen-14B-Chat-Int4",
        },
        "Qwen-72B-int8-Chat": {
            DownloadSource.DEFAULT: "Qwen/Qwen-72B-Chat-Int8",
            DownloadSource.MODELSCOPE: "qwen/Qwen-72B-Chat-Int8",
        },
        "Qwen-72B-int4-Chat": {
            DownloadSource.DEFAULT: "Qwen/Qwen-72B-Chat-Int4",
            DownloadSource.MODELSCOPE: "qwen/Qwen-72B-Chat-Int4",
        },
    },
    module="c_attn",
    template="qwen",
)
# Qwen1.5 group: prefix "Qwen1.5", template "qwen"; unlike the "Qwen" group no
# default module is registered. The "Qwen1.5-Code-*" names point at the
# "CodeQwen1.5" repositories.
register_model_group(
    models={
        "Qwen1.5-0.5B": {
            DownloadSource.DEFAULT: "Qwen/Qwen1.5-0.5B",
            DownloadSource.MODELSCOPE: "qwen/Qwen1.5-0.5B",
        },
        "Qwen1.5-1.8B": {
            DownloadSource.DEFAULT: "Qwen/Qwen1.5-1.8B",
            DownloadSource.MODELSCOPE: "qwen/Qwen1.5-1.8B",
        },
        "Qwen1.5-4B": {
            DownloadSource.DEFAULT: "Qwen/Qwen1.5-4B",
            DownloadSource.MODELSCOPE: "qwen/Qwen1.5-4B",
        },
        "Qwen1.5-7B": {
            DownloadSource.DEFAULT: "Qwen/Qwen1.5-7B",
            DownloadSource.MODELSCOPE: "qwen/Qwen1.5-7B",
        },
        "Qwen1.5-14B": {
            DownloadSource.DEFAULT: "Qwen/Qwen1.5-14B",
            DownloadSource.MODELSCOPE: "qwen/Qwen1.5-14B",
        },
        "Qwen1.5-32B": {
            DownloadSource.DEFAULT: "Qwen/Qwen1.5-32B",
            DownloadSource.MODELSCOPE: "qwen/Qwen1.5-32B",
        },
        "Qwen1.5-72B": {
            DownloadSource.DEFAULT: "Qwen/Qwen1.5-72B",
            DownloadSource.MODELSCOPE: "qwen/Qwen1.5-72B",
        },
        "Qwen1.5-110B": {
            DownloadSource.DEFAULT: "Qwen/Qwen1.5-110B",
            DownloadSource.MODELSCOPE: "qwen/Qwen1.5-110B",
        },
        "Qwen1.5-MoE-A2.7B": {
            DownloadSource.DEFAULT: "Qwen/Qwen1.5-MoE-A2.7B",
            DownloadSource.MODELSCOPE: "qwen/Qwen1.5-MoE-A2.7B",
        },
        "Qwen1.5-Code-7B": {
            DownloadSource.DEFAULT: "Qwen/CodeQwen1.5-7B",
            DownloadSource.MODELSCOPE: "qwen/CodeQwen1.5-7B",
        },
        "Qwen1.5-0.5B-Chat": {
            DownloadSource.DEFAULT: "Qwen/Qwen1.5-0.5B-Chat",
            DownloadSource.MODELSCOPE: "qwen/Qwen1.5-0.5B-Chat",
        },
        "Qwen1.5-1.8B-Chat": {
            DownloadSource.DEFAULT: "Qwen/Qwen1.5-1.8B-Chat",
            DownloadSource.MODELSCOPE: "qwen/Qwen1.5-1.8B-Chat",
        },
        "Qwen1.5-4B-Chat": {
            DownloadSource.DEFAULT: "Qwen/Qwen1.5-4B-Chat",
            DownloadSource.MODELSCOPE: "qwen/Qwen1.5-4B-Chat",
        },
        "Qwen1.5-7B-Chat": {
            DownloadSource.DEFAULT: "Qwen/Qwen1.5-7B-Chat",
            DownloadSource.MODELSCOPE: "qwen/Qwen1.5-7B-Chat",
        },
        "Qwen1.5-14B-Chat": {
            DownloadSource.DEFAULT: "Qwen/Qwen1.5-14B-Chat",
            DownloadSource.MODELSCOPE: "qwen/Qwen1.5-14B-Chat",
        },
        "Qwen1.5-32B-Chat": {
            DownloadSource.DEFAULT: "Qwen/Qwen1.5-32B-Chat",
            DownloadSource.MODELSCOPE: "qwen/Qwen1.5-32B-Chat",
        },
        "Qwen1.5-72B-Chat": {
            DownloadSource.DEFAULT: "Qwen/Qwen1.5-72B-Chat",
            DownloadSource.MODELSCOPE: "qwen/Qwen1.5-72B-Chat",
        },
        "Qwen1.5-110B-Chat": {
            DownloadSource.DEFAULT: "Qwen/Qwen1.5-110B-Chat",
            DownloadSource.MODELSCOPE: "qwen/Qwen1.5-110B-Chat",
        },
        "Qwen1.5-MoE-A2.7B-Chat": {
            DownloadSource.DEFAULT: "Qwen/Qwen1.5-MoE-A2.7B-Chat",
            DownloadSource.MODELSCOPE: "qwen/Qwen1.5-MoE-A2.7B-Chat",
        },
        "Qwen1.5-Code-7B-Chat": {
            DownloadSource.DEFAULT: "Qwen/CodeQwen1.5-7B-Chat",
            DownloadSource.MODELSCOPE: "qwen/CodeQwen1.5-7B-Chat",
        },
        "Qwen1.5-0.5B-int8-Chat": {
            DownloadSource.DEFAULT: "Qwen/Qwen1.5-0.5B-Chat-GPTQ-Int8",
            DownloadSource.MODELSCOPE: "qwen/Qwen1.5-0.5B-Chat-GPTQ-Int8",
        },
        "Qwen1.5-0.5B-int4-Chat": {
            DownloadSource.DEFAULT: "Qwen/Qwen1.5-0.5B-Chat-AWQ",
            DownloadSource.MODELSCOPE: "qwen/Qwen1.5-0.5B-Chat-AWQ",
        },
        "Qwen1.5-1.8B-int8-Chat": {
            DownloadSource.DEFAULT: "Qwen/Qwen1.5-1.8B-Chat-GPTQ-Int8",
            DownloadSource.MODELSCOPE: "qwen/Qwen1.5-1.8B-Chat-GPTQ-Int8",
        },
        "Qwen1.5-1.8B-int4-Chat": {
            DownloadSource.DEFAULT: "Qwen/Qwen1.5-1.8B-Chat-AWQ",
            DownloadSource.MODELSCOPE: "qwen/Qwen1.5-1.8B-Chat-AWQ",
        },
        "Qwen1.5-4B-int8-Chat": {
            DownloadSource.DEFAULT: "Qwen/Qwen1.5-4B-Chat-GPTQ-Int8",
            DownloadSource.MODELSCOPE: "qwen/Qwen1.5-4B-Chat-GPTQ-Int8",
        },
        "Qwen1.5-4B-int4-Chat": {
            DownloadSource.DEFAULT: "Qwen/Qwen1.5-4B-Chat-AWQ",
            DownloadSource.MODELSCOPE: "qwen/Qwen1.5-4B-Chat-AWQ",
        },
        "Qwen1.5-7B-int8-Chat": {
            DownloadSource.DEFAULT: "Qwen/Qwen1.5-7B-Chat-GPTQ-Int8",
            DownloadSource.MODELSCOPE: "qwen/Qwen1.5-7B-Chat-GPTQ-Int8",
        },
        "Qwen1.5-7B-int4-Chat": {
            DownloadSource.DEFAULT: "Qwen/Qwen1.5-7B-Chat-AWQ",
            DownloadSource.MODELSCOPE: "qwen/Qwen1.5-7B-Chat-AWQ",
        },
        "Qwen1.5-14B-int8-Chat": {
            DownloadSource.DEFAULT: "Qwen/Qwen1.5-14B-Chat-GPTQ-Int8",
            DownloadSource.MODELSCOPE: "qwen/Qwen1.5-14B-Chat-GPTQ-Int8",
        },
        "Qwen1.5-14B-int4-Chat": {
            DownloadSource.DEFAULT: "Qwen/Qwen1.5-14B-Chat-AWQ",
            DownloadSource.MODELSCOPE: "qwen/Qwen1.5-14B-Chat-AWQ",
        },
        "Qwen1.5-32B-int4-Chat": {
            DownloadSource.DEFAULT: "Qwen/Qwen1.5-32B-Chat-AWQ",
            DownloadSource.MODELSCOPE: "qwen/Qwen1.5-32B-Chat-AWQ",
        },
        "Qwen1.5-72B-int8-Chat": {
            DownloadSource.DEFAULT: "Qwen/Qwen1.5-72B-Chat-GPTQ-Int8",
            DownloadSource.MODELSCOPE: "qwen/Qwen1.5-72B-Chat-GPTQ-Int8",
        },
        "Qwen1.5-72B-int4-Chat": {
            DownloadSource.DEFAULT: "Qwen/Qwen1.5-72B-Chat-AWQ",
            DownloadSource.MODELSCOPE: "qwen/Qwen1.5-72B-Chat-AWQ",
        },
        "Qwen1.5-110B-int4-Chat": {
            DownloadSource.DEFAULT: "Qwen/Qwen1.5-110B-Chat-AWQ",
            DownloadSource.MODELSCOPE: "qwen/Qwen1.5-110B-Chat-AWQ",
        },
        "Qwen1.5-MoE-A2.7B-int4-Chat": {
            DownloadSource.DEFAULT: "Qwen/Qwen1.5-MoE-A2.7B-Chat-GPTQ-Int4",
            DownloadSource.MODELSCOPE: "qwen/Qwen1.5-MoE-A2.7B-Chat-GPTQ-Int4",
        },
        "Qwen1.5-Code-7B-int4-Chat": {
            DownloadSource.DEFAULT: "Qwen/CodeQwen1.5-7B-Chat-AWQ",
            DownloadSource.MODELSCOPE: "qwen/CodeQwen1.5-7B-Chat-AWQ",
        },
    },
    template="qwen",
)
# SOLAR group: prefix "SOLAR", template "solar". The base entry lists no
# ModelScope id.
register_model_group(
    models={
        "SOLAR-10.7B": {
            DownloadSource.DEFAULT: "upstage/SOLAR-10.7B-v1.0",
        },
        "SOLAR-10.7B-Chat": {
            DownloadSource.DEFAULT: "upstage/SOLAR-10.7B-Instruct-v1.0",
            DownloadSource.MODELSCOPE: "AI-ModelScope/SOLAR-10.7B-Instruct-v1.0",
        },
    },
    template="solar",
)
# Skywork group: prefix "Skywork"; neither a default module nor a template is
# registered.
register_model_group(
    models={
        "Skywork-13B-Base": {
            DownloadSource.DEFAULT: "Skywork/Skywork-13B-base",
            DownloadSource.MODELSCOPE: "skywork/Skywork-13B-base",
        }
    }
)
# StarCoder2 group: prefix "StarCoder2"; neither a default module nor a
# template is registered.
register_model_group(
    models={
        "StarCoder2-3B": {
            DownloadSource.DEFAULT: "bigcode/starcoder2-3b",
            DownloadSource.MODELSCOPE: "AI-ModelScope/starcoder2-3b",
        },
        "StarCoder2-7B": {
            DownloadSource.DEFAULT: "bigcode/starcoder2-7b",
            DownloadSource.MODELSCOPE: "AI-ModelScope/starcoder2-7b",
        },
        "StarCoder2-15B": {
            DownloadSource.DEFAULT: "bigcode/starcoder2-15b",
            DownloadSource.MODELSCOPE: "AI-ModelScope/starcoder2-15b",
        },
    }
)
# Vicuna group: prefix "Vicuna1.5", template "vicuna".
register_model_group(
    models={
        "Vicuna1.5-7B-Chat": {
            DownloadSource.DEFAULT: "lmsys/vicuna-7b-v1.5",
            DownloadSource.MODELSCOPE: "Xorbits/vicuna-7b-v1.5",
        },
        "Vicuna1.5-13B-Chat": {
            DownloadSource.DEFAULT: "lmsys/vicuna-13b-v1.5",
            DownloadSource.MODELSCOPE: "Xorbits/vicuna-13b-v1.5",
        },
    },
    template="vicuna",
)
# XuanYuan group: prefix "XuanYuan", template "xuanyuan". The "XuanYuan-2-*"
# names share this prefix and point at the "XuanYuan2" repositories.
register_model_group(
    models={
        "XuanYuan-6B": {
            DownloadSource.DEFAULT: "Duxiaoman-DI/XuanYuan-6B",
            DownloadSource.MODELSCOPE: "Duxiaoman-DI/XuanYuan-6B",
        },
        "XuanYuan-70B": {
            DownloadSource.DEFAULT: "Duxiaoman-DI/XuanYuan-70B",
            DownloadSource.MODELSCOPE: "Duxiaoman-DI/XuanYuan-70B",
        },
        "XuanYuan-2-70B": {
            DownloadSource.DEFAULT: "Duxiaoman-DI/XuanYuan2-70B",
            DownloadSource.MODELSCOPE: "Duxiaoman-DI/XuanYuan2-70B",
        },
        "XuanYuan-6B-Chat": {
            DownloadSource.DEFAULT: "Duxiaoman-DI/XuanYuan-6B-Chat",
            DownloadSource.MODELSCOPE: "Duxiaoman-DI/XuanYuan-6B-Chat",
        },
        "XuanYuan-70B-Chat": {
            DownloadSource.DEFAULT: "Duxiaoman-DI/XuanYuan-70B-Chat",
            DownloadSource.MODELSCOPE: "Duxiaoman-DI/XuanYuan-70B-Chat",
        },
        "XuanYuan-2-70B-Chat": {
            DownloadSource.DEFAULT: "Duxiaoman-DI/XuanYuan2-70B-Chat",
            DownloadSource.MODELSCOPE: "Duxiaoman-DI/XuanYuan2-70B-Chat",
        },
        "XuanYuan-6B-int8-Chat": {
            DownloadSource.DEFAULT: "Duxiaoman-DI/XuanYuan-6B-Chat-8bit",
            DownloadSource.MODELSCOPE: "Duxiaoman-DI/XuanYuan-6B-Chat-8bit",
        },
        "XuanYuan-6B-int4-Chat": {
            DownloadSource.DEFAULT: "Duxiaoman-DI/XuanYuan-6B-Chat-4bit",
            DownloadSource.MODELSCOPE: "Duxiaoman-DI/XuanYuan-6B-Chat-4bit",
        },
        "XuanYuan-70B-int8-Chat": {
            DownloadSource.DEFAULT: "Duxiaoman-DI/XuanYuan-70B-Chat-8bit",
            DownloadSource.MODELSCOPE: "Duxiaoman-DI/XuanYuan-70B-Chat-8bit",
        },
        "XuanYuan-70B-int4-Chat": {
            DownloadSource.DEFAULT: "Duxiaoman-DI/XuanYuan-70B-Chat-4bit",
            DownloadSource.MODELSCOPE: "Duxiaoman-DI/XuanYuan-70B-Chat-4bit",
        },
        "XuanYuan-2-70B-int8-Chat": {
            DownloadSource.DEFAULT: "Duxiaoman-DI/XuanYuan2-70B-Chat-8bit",
            DownloadSource.MODELSCOPE: "Duxiaoman-DI/XuanYuan2-70B-Chat-8bit",
        },
        "XuanYuan-2-70B-int4-Chat": {
            DownloadSource.DEFAULT: "Duxiaoman-DI/XuanYuan2-70B-Chat-4bit",
            DownloadSource.MODELSCOPE: "Duxiaoman-DI/XuanYuan2-70B-Chat-4bit",
        },
    },
    template="xuanyuan",
)
# XVERSE group, registered with the "xverse" template.
# The repository id is identical for DownloadSource.DEFAULT and
# DownloadSource.MODELSCOPE on every entry, so it is listed once per model.
# Note that the "-int8-"/"-int4-" display names map to "-GPTQ-Int8"/"-GPTQ-Int4"
# repository ids, so names and ids cannot be derived from one another.
register_model_group(
    models={
        display_name: {
            DownloadSource.DEFAULT: repo_id,
            DownloadSource.MODELSCOPE: repo_id,
        }
        for display_name, repo_id in (
            ("XVERSE-7B", "xverse/XVERSE-7B"),
            ("XVERSE-13B", "xverse/XVERSE-13B"),
            ("XVERSE-65B", "xverse/XVERSE-65B"),
            ("XVERSE-65B-2", "xverse/XVERSE-65B-2"),
            ("XVERSE-7B-Chat", "xverse/XVERSE-7B-Chat"),
            ("XVERSE-13B-Chat", "xverse/XVERSE-13B-Chat"),
            ("XVERSE-65B-Chat", "xverse/XVERSE-65B-Chat"),
            ("XVERSE-MoE-A4.2B", "xverse/XVERSE-MoE-A4.2B"),
            ("XVERSE-7B-int8-Chat", "xverse/XVERSE-7B-Chat-GPTQ-Int8"),
            ("XVERSE-7B-int4-Chat", "xverse/XVERSE-7B-Chat-GPTQ-Int4"),
            ("XVERSE-13B-int8-Chat", "xverse/XVERSE-13B-Chat-GPTQ-Int8"),
            ("XVERSE-13B-int4-Chat", "xverse/XVERSE-13B-Chat-GPTQ-Int4"),
            ("XVERSE-65B-int4-Chat", "xverse/XVERSE-65B-Chat-GPTQ-Int4"),
        )
    },
    template="xverse",
)
# Yayi group, registered with the "yayi" template.
# Each row is (display name, DownloadSource.DEFAULT id, DownloadSource.MODELSCOPE id);
# the two sources host these models under different organisations.
register_model_group(
    models={
        display_name: {
            DownloadSource.DEFAULT: default_repo,
            DownloadSource.MODELSCOPE: modelscope_repo,
        }
        for display_name, default_repo, modelscope_repo in (
            ("Yayi-7B", "wenge-research/yayi-7b-llama2", "AI-ModelScope/yayi-7b-llama2"),
            ("Yayi-13B", "wenge-research/yayi-13b-llama2", "AI-ModelScope/yayi-13b-llama2"),
        )
    },
    template="yayi",
)
# Yi group, registered with the "yi" template.
# Each row is (display name, DownloadSource.DEFAULT id, DownloadSource.MODELSCOPE id).
# The organisation is spelled "01-ai" for the default source and "01ai" for
# ModelScope; both ids are kept as full literals so they stay searchable.
register_model_group(
    models={
        display_name: {
            DownloadSource.DEFAULT: default_repo,
            DownloadSource.MODELSCOPE: modelscope_repo,
        }
        for display_name, default_repo, modelscope_repo in (
            ("Yi-6B", "01-ai/Yi-6B", "01ai/Yi-6B"),
            ("Yi-9B", "01-ai/Yi-9B", "01ai/Yi-9B"),
            ("Yi-34B", "01-ai/Yi-34B", "01ai/Yi-34B"),
            ("Yi-6B-Chat", "01-ai/Yi-6B-Chat", "01ai/Yi-6B-Chat"),
            ("Yi-34B-Chat", "01-ai/Yi-34B-Chat", "01ai/Yi-34B-Chat"),
            ("Yi-6B-int8-Chat", "01-ai/Yi-6B-Chat-8bits", "01ai/Yi-6B-Chat-8bits"),
            ("Yi-6B-int4-Chat", "01-ai/Yi-6B-Chat-4bits", "01ai/Yi-6B-Chat-4bits"),
            ("Yi-34B-int8-Chat", "01-ai/Yi-34B-Chat-8bits", "01ai/Yi-34B-Chat-8bits"),
            ("Yi-34B-int4-Chat", "01-ai/Yi-34B-Chat-4bits", "01ai/Yi-34B-Chat-4bits"),
            ("Yi-1.5-6B", "01-ai/Yi-1.5-6B", "01ai/Yi-1.5-6B"),
            ("Yi-1.5-9B", "01-ai/Yi-1.5-9B", "01ai/Yi-1.5-9B"),
            ("Yi-1.5-34B", "01-ai/Yi-1.5-34B", "01ai/Yi-1.5-34B"),
            ("Yi-1.5-6B-Chat", "01-ai/Yi-1.5-6B-Chat", "01ai/Yi-1.5-6B-Chat"),
            ("Yi-1.5-9B-Chat", "01-ai/Yi-1.5-9B-Chat", "01ai/Yi-1.5-9B-Chat"),
            ("Yi-1.5-34B-Chat", "01-ai/Yi-1.5-34B-Chat", "01ai/Yi-1.5-34B-Chat"),
        )
    },
    template="yi",
)
# YiVL group, registered with the "yi_vl" template and vision=True.
# Only a DownloadSource.DEFAULT id is listed for these entries; no
# DownloadSource.MODELSCOPE key is supplied.
register_model_group(
    models={
        display_name: {DownloadSource.DEFAULT: default_repo}
        for display_name, default_repo in (
            ("YiVL-6B-Chat", "BUAADreamer/Yi-VL-6B-hf"),
            ("YiVL-34B-Chat", "BUAADreamer/Yi-VL-34B-hf"),
        )
    },
    template="yi_vl",
    vision=True,
)
# Yuan2 group, registered with the "yuan" template.
# Each row is (display name, DownloadSource.DEFAULT id, DownloadSource.MODELSCOPE id);
# the ModelScope ids use a different organisation and a "Yuan2.0" spelling.
register_model_group(
    models={
        display_name: {
            DownloadSource.DEFAULT: default_repo,
            DownloadSource.MODELSCOPE: modelscope_repo,
        }
        for display_name, default_repo, modelscope_repo in (
            ("Yuan2-2B-Chat", "IEITYuan/Yuan2-2B-hf", "YuanLLM/Yuan2.0-2B-hf"),
            ("Yuan2-51B-Chat", "IEITYuan/Yuan2-51B-hf", "YuanLLM/Yuan2.0-51B-hf"),
            ("Yuan2-102B-Chat", "IEITYuan/Yuan2-102B-hf", "YuanLLM/Yuan2.0-102B-hf"),
        )
    },
    template="yuan",
)
# Zephyr group, registered with the "zephyr" template.
# The two 7B entries carry both a DownloadSource.DEFAULT and a
# DownloadSource.MODELSCOPE id and are expanded from
# (display name, default id, ModelScope id) rows; the 141B entry follows them
# and lists a DownloadSource.DEFAULT id only. Insertion order is unchanged.
register_model_group(
    models={
        **{
            display_name: {
                DownloadSource.DEFAULT: default_repo,
                DownloadSource.MODELSCOPE: modelscope_repo,
            }
            for display_name, default_repo, modelscope_repo in (
                (
                    "Zephyr-7B-Alpha-Chat",
                    "HuggingFaceH4/zephyr-7b-alpha",
                    "AI-ModelScope/zephyr-7b-alpha",
                ),
                (
                    "Zephyr-7B-Beta-Chat",
                    "HuggingFaceH4/zephyr-7b-beta",
                    "modelscope/zephyr-7b-beta",
                ),
            )
        },
        "Zephyr-141B-ORPO-Chat": {
            DownloadSource.DEFAULT: "HuggingFaceH4/zephyr-orpo-141b-A35b-v0.1",
        },
    },
    template="zephyr",
)
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment