mirror of
https://github.com/open-thought/reasoning-gym.git
synced 2026-04-22 16:49:06 +00:00
| .. | ||
| config | ||
| launch_on_2gpu_server.sh | ||
| launch_on_4gpu.sh | ||
| main_ppo_custom_reward.py | ||
| main_ppo_custom_reward_server.py | ||
| train_grpo.sh | ||
| train_grpo_server.sh | ||
| train_ppo.sh | ||