#!/usr/bin/env bash
#
# qwen2_5_7b_math_grpo.sh
#
# Launches `python3 -m verl.trainer.main` for the qwen2_5_7b_math_grpo
# experiment, using examples/config.yaml plus the command-line overrides
# given at the bottom of this script.
#
# Environment:
#   MODEL_PATH  Model identifier or local checkpoint directory passed to the
#               trainer. Defaults to Qwen/Qwen2.5-7B-Instruct.

# Abort on errors, unset variables and failed pipeline stages.
set -euo pipefail
# Trace every command so the fully expanded launch line shows up in the logs.
set -x

# Replace the default with your local file path, or export MODEL_PATH before
# running this script.
MODEL_PATH=${MODEL_PATH:-Qwen/Qwen2.5-7B-Instruct}

# Instruction text handed to the trainer as data.format_prompt.
# Single-quoted so that the backslash in \boxed{} and the <think> tags are
# taken literally; the shell has no triple-quote syntax. The line break and the
# leading space on the second line are part of the prompt text.
FORMAT_PROMPT='You FIRST think about the reasoning process as an internal monologue and then provide the final answer.
 The reasoning process MUST BE enclosed within <think> </think> tags. The final answer MUST BE put in \boxed{}.'

# Start the trainer. The key=value arguments after config= are passed on the
# command line alongside examples/config.yaml (presumably as overrides of the
# values in that file; confirm against verl.trainer.main).
# Both expansions are quoted so that a prompt containing whitespace or a model
# path containing spaces each reach the trainer as a single argument.
python3 -m verl.trainer.main \
    config=examples/config.yaml \
    data.train_files=hiyouga/math12k@train \
    data.val_files=hiyouga/math12k@test \
    data.format_prompt="${FORMAT_PROMPT}" \
    worker.actor.model.model_path="${MODEL_PATH}" \
    trainer.experiment_name=qwen2_5_7b_math_grpo \
    trainer.n_gpus_per_node=8