Commit 8cc3aa85 authored by chenzk's avatar chenzk
Browse files

v1.0.3

parent 99859057
......@@ -19,8 +19,9 @@ vllm:
dtype: auto
# max_model_len: # you may find it useful to set the vLLM model context length if you know this beforehand
rl: grpo # dr_grpo
rl: grpo
trl:
# loss_type: dr_grpo # dapo
use_vllm: true
vllm_server_host: localhost
vllm_server_port: 8000
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment