qwen2_5_vl_32b_geo3k_grpo.sh 675 Bytes
Newer Older
chenych's avatar
chenych committed
1
2
#!/bin/bash

chenych's avatar
chenych committed
3
4
# Enable command tracing: bash prints each command (after expansion) to stderr
# before running it, so the exact launch line ends up in the job log.
set -o xtrace

chenych's avatar
chenych committed
5
6
# Ask Python to leave stdout/stderr unbuffered; exported so that child
# processes started by this script inherit the setting.
PYTHONUNBUFFERED=1
export PYTHONUNBUFFERED

chenych's avatar
chenych committed
7
8
9
10
11
12
13
14
15
16
17
18
19
20
# Model handed to the actor worker via worker.actor.model.model_path.
# Replace it with your local file path if needed.
MODEL_PATH=Qwen/Qwen2.5-VL-32B-Instruct

# Run the verl trainer entry point with examples/config.yaml plus the key=value
# arguments below (presumably applied as overrides on top of that config —
# confirm against verl.trainer.main). Paths are relative, so the script is
# expected to be started from the repository root.
#
# MODEL_PATH is quoted so a local path containing spaces or glob characters
# reaches the trainer as a single, unmodified argument.
#
# NOTE(review): rollout tensor_parallel_size and n_gpus_per_node are both 8,
# i.e. this appears to assume one node with 8 GPUs — adjust together.
python3 -m verl.trainer.main \
    config=examples/config.yaml \
    data.train_files=hiyouga/geometry3k@train \
    data.val_files=hiyouga/geometry3k@test \
    worker.actor.model.model_path="${MODEL_PATH}" \
    worker.actor.micro_batch_size_per_device_for_update=1 \
    worker.actor.micro_batch_size_per_device_for_experience=8 \
    worker.actor.fsdp.torch_dtype=bf16 \
    worker.actor.optim.strategy=adamw_bf16 \
    worker.rollout.tensor_parallel_size=8 \
    trainer.experiment_name=qwen2_5_vl_32b_geo_grpo \
    trainer.n_gpus_per_node=8