reasoning-gym/eval/yaml/openai-o3/games.yaml
2025-02-26 08:09:12 +00:00

19 lines
304 B
YAML

---
# Evaluation settings for the "games" category, run against openai/o3-mini.

# Model under evaluation and the provider that serves it.
model: openai/o3-mini
category: games
provider: OpenAI

# Datasets included in this configuration.
# NOTE(review): the puzzle is usually spelled "Futoshiki"; confirm that
# "futoshuki" is the name the consumer of this file expects.
datasets:
  - countdown
  - emoji_mystery
  - futoshuki
  - knight_swap
  - maze
  - mini_sudoku
  - n_queens
  - sokoban
  - sudoku
  - tower_of_hanoi
  - tsumego

# NOTE(review): "openai-03" is written with the digit zero, whereas the model
# name above uses the letter "o" ("o3") - confirm this directory is intended.
eval_dir: results/openai-03

# Presumably the number of examples generated per dataset and the seed used
# to generate them - verify against the code that reads this file.
dataset_size: 50
dataset_seed: 45

# Presumably the message role used for developer/system instructions -
# TODO confirm against the consumer.
developer_role: system