mirror of
https://github.com/open-thought/reasoning-gym.git
synced 2026-04-26 17:13:17 +00:00
| .. | ||
| config | ||
| launch_on_2gpu_server.sh | ||
| launch_on_4gpu.sh | ||
| main_ppo_custom_reward.py | ||
| main_ppo_custom_reward_server.py | ||
| train_grpo.sh | ||
| train_grpo_server.sh | ||
| train_ppo.sh | ||