move r1 configs into yaml/r1 subfolder

This commit is contained in:
Andreas Koepf 2025-02-25 16:24:30 +01:00
parent e7ae82a831
commit 878f9bbc76
7 changed files with 6 additions and 7 deletions

13
eval/yaml/r1/algebra.yaml Normal file
View file

@ -0,0 +1,13 @@
# Evaluation config for the "algebra" category, targeting deepseek/deepseek-r1.
# NOTE(review): field semantics below are inferred from key names; confirm
# against the evaluation script that loads this file.
model: deepseek/deepseek-r1
category: algebra
# Dataset names evaluated under this category.
datasets:
- intermediate_integration
- polynomial_equations
- polynomial_multiplication
- simple_equations
- simple_integration
- complex_arithmetic
# presumably the output directory for results — TODO confirm
eval_dir: results/r1
# presumably the number of items per dataset — TODO confirm
dataset_size: 50
# presumably the seed used when generating dataset items — TODO confirm
dataset_seed: 42
# presumably the chat role used for the instruction prompt — TODO confirm
developer_role: system

View file

@ -0,0 +1,24 @@
# Evaluation config for the "algorithmic" category, targeting deepseek/deepseek-r1.
# NOTE(review): field semantics below are inferred from key names; confirm
# against the evaluation script that loads this file.
model: deepseek/deepseek-r1
category: algorithmic
# Dataset names evaluated under this category.
datasets:
- binary_matrix
- caesar_cipher
- group_anagrams
- isomorphic_strings
- letter_counting
- letter_jumble
- number_filtering
- number_sorting
- palindrome
- ransom_note
- rotate_matrix
- sentence_reordering
- spell_backward
- spiral_matrix
- word_ladder
- word_sequence_reversal
- word_sorting
# presumably the output directory for results — TODO confirm
eval_dir: results/r1
# presumably the number of items per dataset — TODO confirm
dataset_size: 50
# presumably the seed used when generating dataset items — TODO confirm
dataset_seed: 42
# presumably the chat role used for the instruction prompt — TODO confirm
developer_role: system

View file

@ -0,0 +1,11 @@
# Evaluation config for the "cognition" category, targeting deepseek/deepseek-r1.
# NOTE(review): field semantics below are inferred from key names; confirm
# against the evaluation script that loads this file.
model: deepseek/deepseek-r1
category: cognition
# Dataset names evaluated under this category.
datasets:
- color_cube_rotation
- figlet_font
- number_sequence
- rubiks_cube
# presumably the output directory for results — TODO confirm
eval_dir: results/r1
# presumably the number of items per dataset — TODO confirm
dataset_size: 50
# presumably the seed used when generating dataset items — TODO confirm
dataset_seed: 42
# presumably the chat role used for the instruction prompt — TODO confirm
developer_role: system

11
eval/yaml/r1/logic.yaml Normal file
View file

@ -0,0 +1,11 @@
# Evaluation config for the "logic" category, targeting deepseek/deepseek-r1.
# NOTE(review): field semantics below are inferred from key names; confirm
# against the evaluation script that loads this file.
model: deepseek/deepseek-r1
category: logic
# Dataset names evaluated under this category.
datasets:
- propositional_logic
- self_reference
- syllogism
- zebra_puzzles
# presumably the output directory for results — TODO confirm
eval_dir: results/r1
# presumably the number of items per dataset — TODO confirm
dataset_size: 50
# presumably the seed used when generating dataset items — TODO confirm
dataset_seed: 42
# presumably the chat role used for the instruction prompt — TODO confirm
developer_role: system

8
eval/yaml/r1/test.yaml Normal file
View file

@ -0,0 +1,8 @@
# Template config for a quick test run against deepseek/deepseek-r1.
# NOTE(review): field semantics below are inferred from key names; confirm
# against the evaluation script that loads this file.
model: deepseek/deepseek-r1
category: test
datasets:
# Placeholder entry: substitute a real dataset name before running.
- YOUR_DATASET_NAME
# presumably the output directory for results — TODO confirm
eval_dir: results/r1
# presumably the number of items per dataset — TODO confirm
dataset_size: 10
# presumably the seed used when generating dataset items — TODO confirm
dataset_seed: 42
# presumably the chat role used for the instruction prompt — TODO confirm
developer_role: system