#!/bin/bash
#
# Launches `python3 -m verl.trainer.main` using examples/config.yaml as the
# base config, with the key=value overrides listed below, under the
# experiment name qwen2_5_vl_32b_geo_grpo.
#
# Usage: bash <this script>
# Edit MODEL_PATH below to point at a local checkpoint if desired.

# Trace every command to stderr so the fully expanded launch line is logged.
set -x

# Exported so the python3 child process inherits it.
export PYTHONUNBUFFERED=1

MODEL_PATH=Qwen/Qwen2.5-VL-32B-Instruct  # replace it with your local file path

# Each backslash must be the LAST character on its line; anything after it
# (even a space) ends the command early.
# Note: rollout tensor_parallel_size and n_gpus_per_node are both set to 8.
python3 -m verl.trainer.main \
  config=examples/config.yaml \
  data.train_files=hiyouga/geometry3k@train \
  data.val_files=hiyouga/geometry3k@test \
  worker.actor.model.model_path="${MODEL_PATH}" \
  worker.actor.micro_batch_size_per_device_for_update=1 \
  worker.actor.micro_batch_size_per_device_for_experience=8 \
  worker.actor.fsdp.torch_dtype=bf16 \
  worker.actor.optim.strategy=adamw_bf16 \
  worker.rollout.tensor_parallel_size=8 \
  trainer.experiment_name=qwen2_5_vl_32b_geo_grpo \
  trainer.n_gpus_per_node=8