[pre-commit.ci] auto fixes from pre-commit.com hooks

for more information, see https://pre-commit.ci
This commit is contained in:
pre-commit-ci[bot] 2025-11-14 06:55:53 +00:00
parent 76fec8b919
commit aae4432a58

View file

@@ -225,7 +225,9 @@ class RLAIFEnv(BaseEnv):
scores["tokens"].append(tokens)
scores["masks"].append(masks)
scores["inference_logprobs"].append(logprobs)
scores["scores"].append(1.0 if item["finish_reason"] != "length" else -1.0)
scores["scores"].append(
1.0 if item["finish_reason"] != "length" else -1.0
)
return scores
else:
fwd_fmt = RLAIF_user_prompt_format_str.format(