mirror of
https://github.com/open-thought/reasoning-gym.git
synced 2026-04-19 12:58:07 +00:00
ensure reward is float
This commit is contained in:
parent
c858d1f236
commit
4c47b7966f
3 changed files with 5 additions and 5 deletions
|
|
@ -93,7 +93,7 @@ class SentenceReorderingDataset(ProceduralDataset):
|
|||
}
|
||||
|
||||
def score_answer(self, answer: Optional[str], entry: Dict[str, Any]) -> float:
|
||||
reward = 0
|
||||
reward = 0.0
|
||||
expected_answer = entry["answer"]
|
||||
if answer is not None:
|
||||
try:
|
||||
|
|
|
|||
Loading…
Add table
Add a link
Reference in a new issue