#!/usr/bin/env bash
#
# qwen2_5_vl_3b_clevr.sh
#
# Launches `python3 -m verl.trainer.main` with examples/config.yaml as the
# base config, overriding the dataset, prompt format, model path, reward
# function and trainer settings on the command line.
#
# Usage: run from the repository root so that examples/config.yaml resolves.

# -e: stop on the first failing command; -u: treat unset variables as errors;
# -x: echo every command so the exact launch line is visible in the logs.
set -eux

MODEL_PATH=Qwen/Qwen2.5-VL-3B-Instruct  # replace it with your local file path

# Prompt text passed to the trainer as data.format_prompt. Single-quoted so
# the shell never expands anything inside it; the embedded newlines and the
# leading space on each continuation line are part of the value.
FORMAT_PROMPT='A conversation between User and Assistant. The user asks a question, and the Assistant solves it. The assistant
 first thinks about the reasoning process in the mind and then provides the user with the answer. The reasoning
 process and answer are enclosed within <think> </think> and <answer> </answer> tags, respectively, i.e.,
 <think> reasoning process here </think><answer> answer here </answer>'

# Every key=value below is handed to verl.trainer.main as one argument.
# The "@train" / "@test" suffixes presumably select the dataset split --
# confirm against the trainer's data loader.
# MODEL_PATH and FORMAT_PROMPT are quoted so values containing whitespace
# stay a single argument.
python3 -m verl.trainer.main \
    config=examples/config.yaml \
    data.train_files=BUAADreamer/clevr_count_70k@train \
    data.val_files=BUAADreamer/clevr_count_70k@test \
    data.format_prompt="${FORMAT_PROMPT}" \
    worker.actor.model.model_path="${MODEL_PATH}" \
    worker.rollout.tensor_parallel_size=1 \
    worker.reward.score_function=r1v \
    trainer.experiment_name=qwen2_5_vl_3b_clevr \
    trainer.n_gpus_per_node=2