mirror of
https://github.com/NousResearch/atropos.git
synced 2026-04-30 17:40:36 +00:00
parent
cdc23ba5dc
commit
632ab0161c
22 changed files with 85 additions and 0 deletions
|
|
@@ -3653,6 +3653,14 @@ class AnswerFormatEnv(BaseEnv):
|
|||
)
|
||||
await self._save_failed_rollouts_to_jsonl()
|
||||
|
||||
# Check if all scores are the same (no learning signal)
|
||||
if all(group_scores[0] == score for score in group_scores):
|
||||
if self.debug_logging:
|
||||
self.logger.debug(
|
||||
"All scores are identical, returning None for learning signal"
|
||||
)
|
||||
return None
|
||||
|
||||
# Track successful groups for equivalent ratio enforcement
|
||||
if self.ensure_equivalent_ratios:
|
||||
# Count this as a successful group if we have any successful examples
|
||||
|
|
|
|||
Loading…
Add table
Add a link
Reference in a new issue