gsm8k eval example

This commit is contained in:
hjc-puro 2025-07-11 00:22:36 +00:00
parent afe4fc318f
commit e601251893
2 changed files with 6 additions and 1 deletion

View file

@@ -213,7 +213,6 @@ class GSM8kEnv(BaseEnv):
"question": question,
"gold_answer": answer,
"gold_parsed": str(gold_parsed) if gold_parsed else None,
"model_answer": response_content,
"model_parsed": str(answer_parsed) if answer_parsed else None,
"score": int(score),
"correct": bool(score),