"csrc/quantization/mygq/q_gemm.cu" did not exist on "1b7c791d60629453030de1600e756a8ba555455e"
hf_deepseek_moe_16b_chat.py 304 Bytes
Newer Older
1
from opencompass.models import HuggingFacewithChatTemplate
2
3
4

# Model configuration list: a single entry that uses the
# HuggingFacewithChatTemplate wrapper imported from opencompass.models.
# NOTE(review): `path` looks like a Hugging Face Hub model id and `abbr`
# like a short display name for the model — confirm against the
# OpenCompass config documentation.
models = [
    dict(
        type=HuggingFacewithChatTemplate,
        abbr='deepseek-moe-16b-chat-hf',
        path='deepseek-ai/deepseek-moe-16b-chat',
        max_out_len=1024,
        batch_size=8,
        run_cfg=dict(num_gpus=1),
    )
]