diff --git a/reasoning_gym/code/bf.py b/reasoning_gym/code/bf.py index a8528843..e7def05e 100644 --- a/reasoning_gym/code/bf.py +++ b/reasoning_gym/code/bf.py @@ -127,10 +127,10 @@ int main() {{ if entry["answer"] in answer.splitlines(): # We can be quite confident that the correct answer was given # It was likely just given alongside an explanation - return 0.9 * len(answer) / len(entry["answer"]) + return max(0.9 * len(answer) / len(entry["answer"]), 0.1) if entry["answer"] in answer: # Since answers are English words, some risk of the response coincidentally containing the answer - return 0.5 * len(answer) / len(entry["answer"]) + return max(0.5 * len(answer) / len(entry["answer"]), 0.1) return 0.01 else: return 1.0 # Yay