reasoning-gym/examples/veRL
2025-02-01 23:56:11 +00:00
..
config first bits of veRL example 2025-02-01 21:20:36 +00:00
.gitignore first bits of veRL example 2025-02-01 21:20:36 +00:00
launch_on_4gpu.sh first bits of veRL example 2025-02-01 21:20:36 +00:00
main_ppo_custom_reward.py reduce veRL example size 2025-02-01 23:56:11 +00:00
README.md add deps for veRL experiment in README 2025-02-01 21:27:33 +00:00
train.sh first bits of veRL example 2025-02-01 21:20:36 +00:00

Environment setup

conda create --name verl python=3.12 -y
conda activate verl

pip install flash-attn --no-build-isolation
pip install vllm==0.7.0 ray wandb

Clone and install veRL

Tested with veRL at commit a65c9157bc0b85b64cd753de19f94e80a11bd871 (the repository HEAD at the time of writing).

git clone https://github.com/volcengine/verl.git
cd verl
pip install -e .