"megatron/inference/text_generation_server.py" did not exist on "ee53612329e1fa7e0f55110735a6af24a9beb61a"
# hf_vicuna_7b_v13.py
from opencompass.models import HuggingFaceCausalLM


# Model configurations declared by this file: a single entry for the
# lmsys/vicuna-7b-v1.3 checkpoint, typed as HuggingFaceCausalLM.
models = [
    dict(
        type=HuggingFaceCausalLM,
        abbr='vicuna-7b-v1.3-hf',
        # Weights and tokenizer are both referenced by the same identifier.
        path='lmsys/vicuna-7b-v1.3',
        tokenizer_path='lmsys/vicuna-7b-v1.3',
        tokenizer_kwargs=dict(
            padding_side='left',
            truncation_side='left',
            use_fast=False,
        ),
        max_out_len=100,
        max_seq_len=2048,
        batch_size=8,
        model_kwargs=dict(device_map='auto'),
        # If False, inference runs in a for-loop without batch padding.
        batch_padding=False,
        use_fastchat_template=True,
        run_cfg=dict(num_gpus=1, num_procs=1),
    ),
]