lmdeploy_internlm2_chat_7b.py
from opencompass.models.turbomind import TurboMindModel


# Chat template for internlm2-chat: wrap each turn in <|im_start|>/<|im_end|> markers.
_meta_template = dict(
    round=[
        dict(role='HUMAN', begin='<|im_start|>user\n', end='<|im_end|>\n'),
        dict(role='BOT', begin='<|im_start|>assistant\n', end='<|im_end|>\n', generate=True),
    ],
)

models = [
    dict(
        type=TurboMindModel,
        abbr='internlm2-chat-7b-turbomind',
        path='internlm/internlm2-chat-7b',
        meta_template=_meta_template,
        # Arguments passed to the LMDeploy TurboMind inference engine.
        engine_config=dict(
            session_len=32768,
            max_batch_size=32,
            model_name='internlm2-chat-7b',
            tp=1,
            stop_words=[2, 92542],  # token ids treated as stop words
        ),
        # Sampling parameters used at generation time.
        gen_config=dict(
            top_k=1,
            top_p=0.8,
            temperature=1.0,
            max_new_tokens=2000,
        ),
        max_out_len=2000,
        max_seq_len=32768,
        batch_size=32,
        concurrency=8,
        run_cfg=dict(num_gpus=1, num_procs=1),
    )
]
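
# --- Usage sketch (illustrative, not part of this config) --------------------
# A separate OpenCompass entry config would typically import the `models` list
# defined above together with a dataset config; the module paths below are
# assumptions for illustration, not the exact layout of this repository:
#
#     from mmengine.config import read_base
#
#     with read_base():
#         from .models.hf_internlm.lmdeploy_internlm2_chat_7b import models
#         from .datasets.gsm8k.gsm8k_gen import gsm8k_datasets
#
#     datasets = gsm8k_datasets
#
# The evaluation would then be launched from the OpenCompass root with
# something like: python run.py configs/eval_internlm2_chat_7b_turbomind.py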