mirror of
https://github.com/open-thought/reasoning-gym.git
synced 2026-04-23 16:55:05 +00:00
add grpo launch script
This commit is contained in:
parent
2ae21c6548
commit
8e25a4585f
4 changed files with 212 additions and 2 deletions
|
|
@ -6,4 +6,4 @@ export ROLLOUT_TP_SIZE=2
|
|||
export EXPERIMENT_NAME=chain_sum_llama
|
||||
export VLLM_ATTENTION_BACKEND=XFORMERS
|
||||
|
||||
bash ./train.sh
|
||||
bash ./train_grpo.sh
|
||||
|
|
|
|||
Loading…
Add table
Add a link
Reference in a new issue