mirror of
https://github.com/open-thought/reasoning-gym.git
synced 2026-04-22 16:49:06 +00:00
consolidate eval scripts to have single eval.py
This commit is contained in:
parent
bea806fe3c
commit
e7ae82a831
12 changed files with 104 additions and 337 deletions
|
|
@ -1,11 +0,0 @@
|
|||
model: deepseek/deepseek-r1
|
||||
category: logic
|
||||
datasets:
|
||||
- propositional_logic
|
||||
- self_reference
|
||||
- syllogism
|
||||
- zebra_puzzles
|
||||
eval_dir: eval/r1
|
||||
dataset_size: 50
|
||||
dataset_seed: 42
|
||||
developer_role: system
|
||||
Loading…
Add table
Add a link
Reference in a new issue