mirror of
https://github.com/open-thought/reasoning-gym.git
synced 2026-04-19 12:58:07 +00:00
Added R1 evaluation logic
This commit is contained in:
parent
0657222a8f
commit
42e02640a3
6 changed files with 208 additions and 0 deletions
13
eval/r1/yaml/algebra.yaml
Normal file
13
eval/r1/yaml/algebra.yaml
Normal file
|
|
@@ -0,0 +1,13 @@
|
|||
model: deepseek/deepseek-r1
|
||||
category: algebra
|
||||
datasets:
|
||||
- intermediate_integration
|
||||
- polynomial_equations
|
||||
- polynomial_multiplication
|
||||
- simple_equations
|
||||
- simple_integration
|
||||
- complex_arithmetic
|
||||
eval_dir: eval/r1
|
||||
dataset_size: 50
|
||||
dataset_seed: 42
|
||||
developer_role: system
|
||||
Loading…
Add table
Add a link
Reference in a new issue