mirror of
https://github.com/open-thought/reasoning-gym.git
synced 2026-04-19 12:58:07 +00:00
include ranges rather than sampled values in difficulty metadata dicts (#387)
* update difficulty metadata for logic datasets
* update difficulty metadata for graph datasets
* update difficulty metadata for geometry datasets
* update difficulty metadata for games datasets
* update difficulty metadata for cognition datasets
* update difficulty metadata for arithmetic datasets
* update difficulty metadata for arc datasets
* update difficulty metadata for algorithmic datasets
* update difficulty metadata for algebra datasets
* use tuples
* update tests
* update tests
This commit is contained in:
parent
b69c35818a
commit
7475a20700
80 changed files with 304 additions and 126 deletions
|
|
@ -103,7 +103,13 @@ class NeedleHaystackDataset(ProceduralDataset):
|
|||
return {
|
||||
"question": full_text,
|
||||
"answer": stack["needle"][0],
|
||||
"metadata": {"question": question, "difficulty": {"num_statements": num_statements}},
|
||||
"metadata": {
|
||||
"question": question,
|
||||
"num_statements": num_statements,
|
||||
"difficulty": {
|
||||
"num_statements": (self.config.min_num_statements, self.config.max_num_statements),
|
||||
},
|
||||
},
|
||||
}
|
||||
|
||||
def score_answer(self, answer: Optional[str], entry: dict[str, Any]) -> float:
|
||||
|
|
|
|||
Loading…
Add table
Add a link
Reference in a new issue