simplify training setup instructions (#454)

* simplify training setup instructions

* tweaks

* update configs

* readme update

* readme update
This commit is contained in:
Oliver Stanley 2025-06-06 09:51:29 +01:00 committed by GitHub
parent 0ebabf709b
commit 1232a7d1e5
No known key found for this signature in database
GPG key ID: B5690EEEBB952194
13 changed files with 128 additions and 40 deletions

View file

@@ -1,3 +1,11 @@
# Hydra runtime settings: add an extra directory to the config search path.
# NOTE(review): the path is relative (verl/verl/trainer/config), so it
# presumably assumes a verl checkout in the working directory; confirm.
hydra:
  searchpath:
    - file://verl/verl/trainer/config

# Defaults list: `ppo_trainer` is composed first and this file (`_self_`)
# last, so values set in this file override those from the base config.
# `ppo_trainer` is presumably resolved via the search path above; verify.
defaults:
  - ppo_trainer
  - _self_
# Settings grouped under the `reasoning_gym` key.
reasoning_gym:
  # presumably the number of examples to generate; TODO confirm with consumer
  dataset_size: 20000
  # presumably the name of a predefined prompt template; TODO confirm
  developer_prompt: DeepSeekZero