infer_think.sh 529 Bytes
Newer Older
luopl's avatar
luopl committed
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
#!/bin/bash
#
# MMMU Inference Script (Thinking Model)
#
# Runs `run_mmmu.py infer` (resolved relative to the current working
# directory) on the MMMU dataset using vLLM with the thinking-mode sampling
# parameters listed below.
#
# Usage:
#   ./infer_think.sh
#   MODEL_PATH=/models/Qwen3-VL-Thinking DATA_DIR=/data/mmmu ./infer_think.sh
#
# Optional environment overrides (defaults are the values that used to be
# hard-coded in this script, so running it without any of them set passes
# exactly the same flags as before):
#   MODEL_PATH            value passed to --model-path
#   DATA_DIR              value passed to --data-dir
#   DATASET               value passed to --dataset
#   OUTPUT_FILE           value passed to --output-file
#   TENSOR_PARALLEL_SIZE  value passed to --tensor-parallel-size

# Abort on the first failing command, on use of an unset variable, and on a
# failure in any pipeline stage.
set -euo pipefail

model_path=${MODEL_PATH:-/path/to/Qwen3-VL-Thinking}
data_dir=${DATA_DIR:-/path/to/mmmu_data}
dataset=${DATASET:-MMMU_DEV_VAL}
output_file=${OUTPUT_FILE:-results/mmmu_dev_val_predictions_thinking.jsonl}
tensor_parallel_size=${TENSOR_PARALLEL_SIZE:-4}

# Make sure the directory that will hold the predictions exists before the
# run starts. NOTE(review): run_mmmu.py may already create it; `mkdir -p` is a
# no-op in that case.
mkdir -p -- "$(dirname -- "${output_file}")"

# Arguments are kept in an array so values containing spaces survive intact.
infer_args=(
    --model-path "${model_path}"
    --data-dir "${data_dir}"
    --dataset "${dataset}"
    --output-file "${output_file}"
    # Fixed generation/sampling settings for the thinking model.
    --max-new-tokens 40960
    --temperature 1.0
    --top-p 0.95
    --top-k 20
    --repetition-penalty 1.0
    --presence-penalty 0.0
    --tensor-parallel-size "${tensor_parallel_size}"
)

python run_mmmu.py infer "${infer_args[@]}"