add grpo launch script

This commit is contained in:
Andreas Koepf 2025-02-17 20:52:03 +00:00
parent 2ae21c6548
commit 8e25a4585f
4 changed files with 212 additions and 2 deletions

View file

@@ -6,4 +6,4 @@ export ROLLOUT_TP_SIZE=2
export EXPERIMENT_NAME=chain_sum_llama
export VLLM_ATTENTION_BACKEND=XFORMERS
-bash ./train.sh
+bash ./train_grpo.sh