# vllm_internlm2_chat_7b.py
from opencompass.models import VLLMwithChatTemplate

# Model list defined by this config: a single entry for
# 'internlm/internlm2-chat-7b' built on the VLLMwithChatTemplate wrapper.
models = [
    {
        'type': VLLMwithChatTemplate,
        # Short identifier for this entry.
        'abbr': 'internlm2-chat-7b-vllm',
        # NOTE(review): looks like a model hub id rather than a local
        # directory -- confirm against the wrapper's loader.
        'path': 'internlm/internlm2-chat-7b',
        # Kept separate from the wrapper-level options; presumably forwarded
        # to the underlying vLLM engine -- TODO confirm.
        'model_kwargs': {'tensor_parallel_size': 1},
        'max_out_len': 1024,
        # NOTE(review): very large value; presumably batching is left to the
        # inference engine instead of being capped here -- confirm.
        'batch_size': 32768,
        'run_cfg': {'num_gpus': 1},
    },
]