Revert "rm hardcoded same score check"

This reverts commit f02c24204d.
This commit is contained in:
Partho Das 2026-03-10 01:42:44 +05:30
parent cdc23ba5dc
commit 632ab0161c
22 changed files with 85 additions and 0 deletions

View file

@@ -383,6 +383,10 @@ class MathEnv(BaseEnv):
to_postprocess = await self.score(to_score)
if to_postprocess is None:
return None, to_backlog
if all(
[to_postprocess["scores"][0] == score for score in to_postprocess["scores"]]
):
return None, to_backlog
self.normal_rollouts.append(
(
prompt_format.format(prompt=problem_format.format(problem=item[0])),