mirror of
https://github.com/open-thought/reasoning-gym.git
synced 2026-04-27 17:23:19 +00:00
first bits of veRL example
This commit is contained in:
parent
bb620a1066
commit
e671b97ab4
5 changed files with 562 additions and 0 deletions
9
examples/veRL/launch_on_4gpu.sh
Executable file
9
examples/veRL/launch_on_4gpu.sh
Executable file
|
|
@ -0,0 +1,9 @@
|
|||
#!/bin/bash
#
# Launch the veRL example training run with a fixed 4-GPU configuration.
#
# Exports the settings below into the environment and then runs the train.sh
# that sits next to this script. Exported variables are inherited by that
# child process; how train.sh uses them is not visible from this file
# (presumably it reads each of them -- confirm against train.sh).
#
# Usage: bash launch_on_4gpu.sh   (works from any working directory)
# Exit status: that of train.sh, or non-zero if its directory cannot be
# resolved.

# Number of GPUs for the run (matches the "4gpu" in this script's name).
export N_GPUS=4
# Model identifier for the base model to train.
export BASE_MODEL=meta-llama/Llama-3.2-1B-Instruct
# NOTE(review): presumably the tensor-parallel size used for rollouts --
# confirm against train.sh.
export ROLLOUT_TP_SIZE=2
# Name under which this run is identified.
export EXPERIMENT_NAME=chain_sum_llama
# NOTE(review): presumably read by vLLM to select its attention backend --
# confirm against the vLLM version in use.
export VLLM_ATTENTION_BACKEND=XFORMERS

# Resolve this script's own directory so train.sh is found no matter where
# the launcher is started from.
script_dir=$(cd -- "$(dirname -- "${BASH_SOURCE[0]}")" && pwd) || exit 1

# Run in a subshell so the caller's working directory is left untouched while
# train.sh still sees the launcher's directory as its cwd and is invoked as
# ./train.sh.
(cd -- "${script_dir}" && bash ./train.sh)
|
||||
Loading…
Add table
Add a link
Reference in a new issue