Commit 55ce9e74 authored by weishb
Browse files

update README

parent 7f2360be
...@@ -80,8 +80,8 @@ cp /path/of/MiniMax/MiniMax-M2.7/vocab.json /path/of/MiniMax/MiniMax-M2.7-bf16 ...@@ -80,8 +80,8 @@ cp /path/of/MiniMax/MiniMax-M2.7/vocab.json /path/of/MiniMax/MiniMax-M2.7-bf16
vllm serve /path/MiniMax-M2.7-bf16 \ vllm serve /path/MiniMax-M2.7-bf16 \
--trust-remote-code \ --trust-remote-code \
--served-model-name minimax-m2.7 \ --served-model-name minimax-m2.7 \
--gpu-memory-utilization 0.85 \ --gpu-memory-utilization 0.95 \
--max-model-len 32768 \ --max-model-len 4096 \
--dtype bfloat16 \ --dtype bfloat16 \
-tp 8 \ -tp 8 \
--port 8001 \ --port 8001 \
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment