add vllm model configs (#938)

120bf8b3 · Mo Li · GitHub · 3e9844ed · 120bf8b3 · 120bf8b3
Unverified Commit 120bf8b3 authored Mar 01, 2024 by Mo Li Committed by GitHub Mar 01, 2024
Showing with 54 additions and 0 deletions

configs/models/others/vllm_orionstar_14b_longchat.py +27 -0

configs/models/qwen/vllm_qwen1_5_14b_chat.py +27 -0

No files found.
--- a/configs/models/others/vllm_orionstar_14b_longchat.py
+++ b/configs/models/others/vllm_orionstar_14b_longchat.py
+from opencompass.models import VLLM
+
+
+_meta_template = dict(  # prompt template: per-role begin/end markers wrapped around each chat turn
+    begin='<s>',  # top-level prefix of the template -- presumably the tokenizer's BOS string; confirm
+    round=[
+        dict(role="HUMAN", begin='Human: ', end='\n'),  # HUMAN turn is wrapped as "Human: " ... "\n"
+        dict(role="BOT", begin="Assistant: ", end='</s>', generate=True),  # BOT turn; generate=True presumably marks the role the model completes -- confirm
+    ],
+    eos_token_id=2  # presumably the id of '</s>' in this model's tokenizer -- TODO confirm
+)
+
+models = [  # list of model entries defined by this config; holds a single VLLM-typed entry
+    dict(
+        abbr='orionstar-14b-longchat-vllm',  # short label for this entry
+        type=VLLM,  # class imported from opencompass.models at the top of this file
+        path='OrionStarAI/Orion-14B-LongChat',  # presumably a Hugging Face Hub repo id -- confirm
+        model_kwargs=dict(tensor_parallel_size=4),  # same value as run_cfg num_gpus below
+        generation_kwargs=dict(temperature=0),  # presumably selects greedy decoding -- confirm against vLLM sampling docs
+        meta_template=_meta_template,  # the template dict defined earlier in this file
+        max_out_len=100,  # presumably a cap on generated tokens -- confirm units
+        max_seq_len=4096,  # presumably a cap on total sequence length in tokens -- confirm
+        batch_size=32,
+        run_cfg=dict(num_gpus=4, num_procs=1),  # num_gpus equals tensor_parallel_size above
+        end_str='<|endoftext|>',  # NOTE(review): differs from the BOT end marker '</s>' in _meta_template -- confirm intended
+    )
+]
--- a/configs/models/qwen/vllm_qwen1_5_14b_chat.py
+++ b/configs/models/qwen/vllm_qwen1_5_14b_chat.py
+from opencompass.models import VLLM
+
+
+_meta_template = dict(  # prompt template: each turn is wrapped in <|im_start|>ROLE\n ... <|im_end|>\n markers
+    round=[
+        dict(role="HUMAN", begin='<|im_start|>user\n', end='<|im_end|>\n'),  # HUMAN turn uses the "user" tag
+        dict(role="BOT", begin="<|im_start|>assistant\n", end='<|im_end|>\n',
+             generate=True),  # BOT turn uses the "assistant" tag; generate=True presumably marks the role the model completes -- confirm
+    ],
+    eos_token_id=151645,  # presumably the id of '<|im_end|>' in this model's tokenizer -- TODO confirm
+)
+
+models = [  # list of model entries defined by this config; holds a single VLLM-typed entry
+    dict(
+        type=VLLM,  # class imported from opencompass.models at the top of this file
+        abbr='qwen1.5-14b-chat-vllm',  # short label for this entry
+        path="Qwen/Qwen1.5-14B-Chat",  # presumably a Hugging Face Hub repo id -- confirm
+        model_kwargs=dict(tensor_parallel_size=2),  # same value as run_cfg num_gpus below
+        meta_template=_meta_template,  # the template dict defined earlier in this file
+        max_out_len=100,  # presumably a cap on generated tokens -- confirm units
+        max_seq_len=2048,  # presumably a cap on total sequence length in tokens -- confirm
+        batch_size=32,
+        generation_kwargs=dict(temperature=0),  # presumably selects greedy decoding -- confirm against vLLM sampling docs
+        end_str='<|im_end|>',  # same marker string the template's round entries end with (minus the trailing newline)
+        run_cfg=dict(num_gpus=2, num_procs=1),  # num_gpus equals tensor_parallel_size above
+    )
+]