from typing import Optional

from transformers import AutoConfig, MptConfig, PretrainedConfig

from vllm.transformers_utils.configs import *  # pylint: disable=wildcard-import

# Maps a config's `model_type` string to the config class that `get_config`
# uses to reload the model's configuration in place of the one returned by
# `AutoConfig`.
# NOTE(review): apart from `MptConfig` (imported from transformers), these
# classes are presumably supplied by the wildcard import from
# `vllm.transformers_utils.configs` -- confirm.
_CONFIG_REGISTRY = {
    "aquila": AquilaConfig,
    "baichuan": BaiChuanConfig,
    "chatglm": ChatGLMConfig,
    "mpt": MptConfig,
    "qwen": QWenConfig,
    "RefinedWeb": RWConfig,  # For tiiuae/falcon-40b(-instruct)
    "RefinedWebModel": RWConfig,  # For tiiuae/falcon-7b(-instruct)
    "yi": YiConfig,
}


def get_config(model: str,
               trust_remote_code: bool,
               revision: Optional[str] = None) -> PretrainedConfig:
    """Load the configuration object for ``model``.

    The config is first loaded through ``AutoConfig.from_pretrained``. If
    its ``model_type`` has an entry in ``_CONFIG_REGISTRY``, the config is
    loaded again with the registered class and that result is returned.

    Args:
        model: Model identifier forwarded to ``from_pretrained``.
        trust_remote_code: Forwarded to ``AutoConfig.from_pretrained``.
        revision: Optional revision forwarded to ``from_pretrained``.

    Returns:
        The loaded configuration.

    Raises:
        RuntimeError: If ``AutoConfig`` raises a ``ValueError`` saying the
            model requires executing its configuration file while
            ``trust_remote_code`` is false.
        ValueError: Any other ``ValueError`` from ``AutoConfig`` is
            propagated unchanged.
    """
    try:
        config = AutoConfig.from_pretrained(
            model, trust_remote_code=trust_remote_code, revision=revision)
    except ValueError as e:
        needs_remote_code = (
            not trust_remote_code and
            "requires you to execute the configuration file" in str(e))
        if not needs_remote_code:
            # Unrelated failure: propagate the original exception as-is.
            raise
        err_msg = (
            "Failed to load the model config. If the model is a custom "
            "model not yet available in the HuggingFace transformers "
            "library, consider setting `trust_remote_code=True` in LLM "
            "or using the `--trust-remote-code` flag in the CLI.")
        raise RuntimeError(err_msg) from e

    # Model types listed in the registry are reloaded with their registered
    # config class; note that `trust_remote_code` is not passed here.
    config_class = _CONFIG_REGISTRY.get(config.model_type)
    if config_class is not None:
        config = config_class.from_pretrained(model, revision=revision)
    return config