diff --git a/reasoning_gym/algorithmic/cryptarithm.py b/reasoning_gym/algorithmic/cryptarithm.py index 5ec1603a..a7b5236f 100644 --- a/reasoning_gym/algorithmic/cryptarithm.py +++ b/reasoning_gym/algorithmic/cryptarithm.py @@ -236,7 +236,6 @@ class CryptarithmDataset(ProceduralDataset): alphabet, number = pair.split("=") correct_mapping[alphabet] = int(number) - # case 1 : pairs are in a list format and the number of pairs matched up if len(answer.split(",")) != len(correct_mapping): return 0.1 diff --git a/tests/test_cryptarithm.py b/tests/test_cryptarithm.py index 686ba949..b704e3b4 100644 --- a/tests/test_cryptarithm.py +++ b/tests/test_cryptarithm.py @@ -119,7 +119,6 @@ def test_cryptarithm_score_answer(): score = dataset.score_answer(answer=correct_answer_str, answer_str=correct_answer_str) assert score == 1.0, f"Expected 1.0 for perfectly correct answer, got {score}" - # 3) Mismatch number of pairs => score should be 0.1 # For instance, drop the last pair splitted = correct_answer_str.split(",")