mirror of
https://github.com/open-thought/reasoning-gym.git
synced 2026-04-29 17:35:16 +00:00
updated datasets
This commit is contained in:
parent
9f9f816902
commit
37bbd97191
3 changed files with 28 additions and 23 deletions
|
|
@ -72,7 +72,7 @@ class SpellBackwardDataset(ProceduralDataset):
|
|||
expected_answer = expected_answer.lower()
|
||||
answer = answer.lower()
|
||||
if expected_answer == answer:
|
||||
reward = 1.0
|
||||
return 1.0
|
||||
else:
|
||||
answer_len = len(expected_answer)
|
||||
for i in range(len(expected_answer)):
|
||||
|
|
@ -83,7 +83,8 @@ class SpellBackwardDataset(ProceduralDataset):
|
|||
continue
|
||||
else:
|
||||
break
|
||||
|
||||
if reward == 1.0:
|
||||
reward -= 0.2
|
||||
except:
|
||||
reward = 0.0
|
||||
return reward
|
||||
|
|
|
|||
Loading…
Add table
Add a link
Reference in a new issue