reasoning-gym/eval/yaml/claude-3.5-sonnet.yaml
Andreas Köpf 850c1cf6f4
Eval script consolidation (#238)
The script now supports:
   - YAML and JSON configurations
   - Dataset-specific parameters
   - Overriding configuration via command line
   - Detailed logging and error handling
2025-02-27 17:39:14 +01:00

34 lines
1 KiB
YAML

# Combined configuration for Claude 3.5 Sonnet
#
# Top-level keys hold the model/run settings; `categories` lists the
# dataset groups to evaluate, each with its own nested `datasets` list.

# Model under evaluation and the provider it is requested from.
model: "anthropic/claude-3.5-sonnet"
provider: "Anthropic"

# NOTE(review): presumably a path relative to the working directory of
# the eval script — confirm.
output_dir: "results"

# NOTE(review): presumably the cap on simultaneous requests — confirm
# against the eval script.
max_concurrent: 10

# NOTE(review): presumably the per-dataset sample count and RNG seed
# used when a dataset entry does not set its own — confirm.
default_size: 50
default_seed: 45

categories:
  - category: "algorithmic"
    # `datasets` must be indented under its category entry; at column 0
    # it would become a separate top-level key and the category would
    # end up with no datasets.
    datasets:
      - dataset: "count_primes"
      - dataset: "game_of_life"
      - dataset: "graph_color"
      - dataset: "group_anagrams"
      - dataset: "isomorphic_strings"
      - dataset: "letter_counting"
      - dataset: "letter_jumble"
      - dataset: "manipulate_matrix"
      - dataset: "number_filtering"
      - dataset: "number_sorting"
      - dataset: "palindrome"
      - dataset: "pool_matrix"
      - dataset: "ransom_note"
      - dataset: "rotate_matrix"
      - dataset: "sentence_reordering"
      - dataset: "spell_backward"
      - dataset: "spiral_matrix"
      - dataset: "string_insertion"
      - dataset: "string_manipulation"
      - dataset: "string_synthesis"
      - dataset: "word_ladder"
      - dataset: "word_sequence_reversal"
      - dataset: "word_sorting"