diff --git a/reasoning_gym/games/puzzle24.py b/reasoning_gym/games/puzzle24.py index 3cf37c47..8cb84019 100644 --- a/reasoning_gym/games/puzzle24.py +++ b/reasoning_gym/games/puzzle24.py @@ -24,7 +24,7 @@ DATASET_NAME = "puzzle24" class Puzzle24Config: operators: tuple = ("+", "-", "*", "/") min_value: int = 1 - max_value: int = 6 + max_value: int = 10 seed: Optional[int] = None size: int = 500 @@ -116,8 +116,10 @@ class Puzzle24Dataset(ProceduralDataset): try: answer = answer.strip() user_answer = int(parse_expr(answer)) + print(f"User answer: {user_answer}") solved = user_answer == 24 used_numbers = [int(num) for num in re.findall(r"\b\d+\b", answer)] + print(f"Used numbers: {used_numbers}") if len(used_numbers) != 4: reward = 0.01 elif any(num > self.config.max_value or num < self.config.min_value for num in used_numbers):