mirror of
https://github.com/open-thought/reasoning-gym.git
synced 2026-04-19 12:58:07 +00:00
simplify training setup instructions (#454)
* simplify training setup instructions
* tweaks
* update cfgs
* readme update
* readme update
This commit is contained in:
parent
0ebabf709b
commit
1232a7d1e5
13 changed files with 128 additions and 40 deletions
|
|
@@ -1,3 +1,11 @@
|
|||
hydra:
|
||||
searchpath:
|
||||
- file://verl/verl/trainer/config
|
||||
|
||||
defaults:
|
||||
- ppo_trainer
|
||||
- _self_
|
||||
|
||||
reasoning_gym:
|
||||
dataset_size: 20000
|
||||
developer_prompt: DeepSeekZero
|
||||
|
|
|
|||
Loading…
Add table
Add a link
Reference in a new issue