mirror of
https://github.com/open-thought/reasoning-gym.git
synced 2026-04-19 12:58:07 +00:00
Changed params back in puzzle24
This commit is contained in:
parent
f202e4f7f2
commit
29ec970044
1 changed file with 3 additions and 1 deletion
|
|
@@ -24,7 +24,7 @@ DATASET_NAME = "puzzle24"
|
|||
class Puzzle24Config:
|
||||
operators: tuple = ("+", "-", "*", "/")
|
||||
min_value: int = 1
|
||||
max_value: int = 6
|
||||
max_value: int = 10
|
||||
seed: Optional[int] = None
|
||||
size: int = 500
|
||||
|
||||
|
|
@@ -116,8 +116,10 @@ class Puzzle24Dataset(ProceduralDataset):
|
|||
try:
|
||||
answer = answer.strip()
|
||||
user_answer = int(parse_expr(answer))
|
||||
print(f"User answer: {user_answer}")
|
||||
solved = user_answer == 24
|
||||
used_numbers = [int(num) for num in re.findall(r"\b\d+\b", answer)]
|
||||
print(f"Used numbers: {used_numbers}")
|
||||
if len(used_numbers) != 4:
|
||||
reward = 0.01
|
||||
elif any(num > self.config.max_value or num < self.config.min_value for num in used_numbers):
|
||||
|
|
|
|||
Loading…
Add table
Add a link
Reference in a new issue