# hf_llama_13b.py
from opencompass.models import HuggingFaceCausalLM

# Model configurations exported by this file: a single LLaMA 13B entry,
# written as a plain dict of options keyed by name.
models = [
    # LLaMA 13B
    dict(
        type=HuggingFaceCausalLM,
        abbr='llama-13b-hf',
        # Model weights and tokenizer are both loaded from the same
        # identifier.
        path='huggyllama/llama-13b',
        tokenizer_path='huggyllama/llama-13b',
        # Pad and truncate on the left side; use_fast=False asks for the
        # non-fast tokenizer implementation.
        tokenizer_kwargs=dict(
            padding_side='left',
            truncation_side='left',
            use_fast=False,
        ),
        # NOTE(review): presumably token counts (generation cap and total
        # context length) -- confirm against the model wrapper.
        max_out_len=100,
        max_seq_len=2048,
        batch_size=8,
        model_kwargs=dict(device_map='auto'),
        batch_padding=False,  # if false, inference with for-loop without batch padding
        run_cfg=dict(num_gpus=2, num_procs=1),
    ),
]