include ranges rather than sampled values in difficulty metadata dicts (#387)

* update difficulty metadata for logic datasets
* update difficulty metadata for graph datasets
* update difficulty metadata for geometry datasets
* update difficulty metadata for games datasets
* update difficulty metadata for cognition datasets
* update difficulty metadata for arithmetic datasets
* update difficulty metadata for arc datasets
* update difficulty metadata for algorithmic datasets
* update difficulty metadata for algebra datasets
* use tuples
* update tests
* update tests
2026-04-19 12:58:07 +00:00 · 2025-03-20 09:27:03 +00:00 · 2025-03-20 09:27:03 +00:00 · 7475a20700
commit 7475a20700
parent b69c35818a
80 changed files with 304 additions and 126 deletions
--- a/reasoning_gym/algorithmic/sentence_reordering.py
+++ b/reasoning_gym/algorithmic/sentence_reordering.py
@@ -90,7 +90,12 @@ class SentenceReorderingDataset(ProceduralDataset):
        return {
            "question": f"Restore the correct order of words in the following sentence: {question}",
            "answer": solved_sentence,
-            "metadata": {"word_count": word_count, "difficulty": {"words_in_sentence": word_count}},
+            "metadata": {
+                "word_count": word_count,
+                "difficulty": {
+                    "words_in_sentence": (self.config.min_words_in_sentence, self.config.max_words_in_sentence),
+                },
+            },
        }

    def score_answer(self, answer: Optional[str], entry: dict[str, Any]) -> float: