set-xexport VLLM_ATTENTION_BACKEND=XFORMERSMODEL_PATH=Qwen/Qwen2.5-7B-Instruct # replace it with your local file pathpython3 -m verl.trainer.main \config=examples/grpo_example.yaml \ worker.actor.model.model_path=${MODEL_PATH}\ trainer.n_gpus_per_node=4