mirror of
https://github.com/NousResearch/atropos.git
synced 2026-04-19 12:57:58 +00:00
make the evaluator more discerning
This commit is contained in:
parent
28943206a0
commit
4e83714b44
1 changed files with 1 additions and 1 deletions
|
|
@ -260,7 +260,7 @@ class GSM8kEnv(BaseEnv):
|
|||
scores["scores"] = list()
|
||||
# # random.shuffle(rollout_group_data)
|
||||
for item in rollout_group_data:
|
||||
final_question = list(item["messages"]) + [{'role': 'system', 'content': 'The conversation is over. Say meow if the caretaker did a bad job, or purr if the caretaker did a good job.'}]
|
||||
final_question = list(item["messages"]) + [{'role': 'system', 'content': 'The conversation is over. Say purr if the caretaker did everything perfectly and there was nothing that the caretaker could have done even slightly better. Otherwise, say meow. Make sure it is rare that you rate the caretaker with a purr.'}]
|
||||
caretaker_completions = await self.server.chat_completion(
|
||||
messages=final_question,
|
||||
n=1,
|
||||
|
|
|
|||
Loading…
Add table
Add a link
Reference in a new issue