Commit 2a7c435f authored by sunzhq2
Browse files

init

parent 59a0ec90
#!/bin/bash
# Run `evalscope eval` on the math_500 dataset for model id qwen3-8B, pointing
# --use-cache at an existing evalscope data directory and requesting
# --rerun-review.
# NOTE(review): presumably this re-scores predictions already stored in the
# cache directory instead of querying a model — confirm against the evalscope
# documentation.
#
# Disabled variant, kept for reference ("includes inference"): it targets a
# chat-completions endpoint at 0.0.0.0:8000 and reads MATH-500 from a local
# path.
#   evalscope eval \
#     --model 'qwen3-8B' \
#     --api-url 'http://0.0.0.0:8000/v1/chat/completions' \
#     --api-key 'EMPTY' \
#     --datasets 'math_500' \
#     --dataset-args '{"math_500": {"local_path": "/data1/sunzhq/llm-benchmark/MATH-500"}}' \
#     --eval-batch-size 32 \
#     --generation-config '{"batch_size": 32, "temperature": 0.0}' \
#     --timeout 1800 \
#
# Optional extra argument (disabled) that adds a "Level 2" subset_list:
#     --dataset-args '{"math_500": {"local_path": "/data1/sunzhq/llm-benchmark/MATH-500", "subset_list": ["Level 2"]}}' \

# Arguments are collected in an array so each option sits on its own line
# without backslash continuations.
review_args=(
  --use-cache /data1/sunzhq/llm-benchmark/tools/evalscope-data
  --datasets math_500
  --model-id qwen3-8B
  --no-timestamp
  --rerun-review
)

evalscope eval "${review_args[@]}"
\ No newline at end of file
#!/bin/bash
# Recreate the evalscope data directory from scratch and run convert_data.py
# on a saved performance-run result plus the MATH-500 test set.
#
# Steps:
#   1. Delete ${output_dir} entirely, so no stale output survives.
#   2. Run convert_data.py, writing to ${output_dir}/predictions/qwen3-8B.
#
# NOTE(review): convert_data.py is resolved relative to the current working
# directory, so run this script from the directory that contains it.
# NOTE(review): the output directory no longer exists after step 1;
# presumably convert_data.py creates it — confirm.

# Abort on the first failing command, on unset variables, and on pipeline
# failures, so a failed cleanup never leads to converting into a stale tree.
set -euo pipefail

output_dir=/data1/sunzhq/llm-benchmark/tools/evalscope-data

# Quoted, with `--` to end option parsing; `:?` aborts instead of expanding to
# an empty string if the variable is ever unset or emptied by a later edit.
rm -rf -- "${output_dir:?}"

python convert_data.py \
  --perf /data1/sunzhq/llm-benchmark/results-1/performance_results/qwen3_8b_math500_perf.json \
  --test /data1/sunzhq/llm-benchmark/MATH-500/test.jsonl \
  --output "${output_dir}/predictions/qwen3-8B"
This diff is collapsed.
This diff is collapsed.
This diff is collapsed.
# Export the runtime environment and start `vllm serve` for the qwen3-8B
# checkpoint under /data2/models, listening on 0.0.0.0:8000.
# NOTE(review): the exact effect of each variable below is defined by the
# vLLM / NCCL / ROCm builds in use — confirm against their documentation.

# NUMA-related vLLM settings: binding enabled, rank slots 0-3 all set to 0.
export VLLM_NUMA_BIND=1 \
  VLLM_RANK0_NUMA=0 \
  VLLM_RANK1_NUMA=0 \
  VLLM_RANK2_NUMA=0 \
  VLLM_RANK3_NUMA=0

# HSA / NCCL communication settings.
export HSA_FORCE_FINE_GRAIN_PCIE=1 \
  NCCL_MIN_NCHANNELS=16 \
  NCCL_MAX_NCHANNELS=16 \
  NCCL_P2P_LEVEL=SYS \
  NCCL_LAUNCH_MODE=GROUP

# Remaining general vLLM switches.
export ALLREDUCE_STREAM_WITH_COMPUTE=1 \
  VLLM_RPC_TIMEOUT=1800000 \
  VLLM_ZERO_OVERHEAD=1 \
  VLLM_ZERO_OPT_ZEROS=1

# Environment variables required when testing Qwen3-30B-A3B.
export VLLM_USE_FUSED_RMS_ROPE=1 \
  VLLM_USE_MARLIN_W16A16_MOE=1

# Environment variables required when testing Qwen3-Next.
export VLLM_USE_NN=0 \
  TRITON_MOVE_LOAD_TOFRONT_DOT=0

# Two device indices are exposed, matching --tensor-parallel-size 2 below.
export HIP_VISIBLE_DEVICES=6,7

# Server options are staged in the positional parameters (POSIX-compatible,
# since no shebang is visible for this script) and expanded with "$@".
set -- \
  --served-model-name qwen3-8B \
  --host 0.0.0.0 \
  --port 8000 \
  --trust-remote-code \
  --tensor-parallel-size 2

vllm serve /data2/models/qwen3-8B "$@"
\ No newline at end of file
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment