mirror of
https://github.com/NousResearch/atropos.git
synced 2026-04-23 16:54:56 +00:00
Move to subfolder
This commit is contained in:
parent
a88e3afddf
commit
7eae51cc5c
23 changed files with 0 additions and 0 deletions
14
environments/hack0/DeepSacrifice/server/reward/reward_fn.ts
Normal file
14
environments/hack0/DeepSacrifice/server/reward/reward_fn.ts
Normal file
|
|
@ -0,0 +1,14 @@
|
|||
/**
 * Placeholder reward function for a chess move.
 *
 * The intended design (see TODO below) is to derive the reward from LLM
 * feedback (OpenAI GPT-4o-mini). That is not implemented yet: every argument
 * is currently ignored and the same constant reward is returned for all calls.
 *
 * @param fen - Board position in FEN notation (currently unused).
 * @param moveSAN - The move in SAN notation (currently unused).
 * @param llmScore - Optional score supplied by the LLM (currently unused).
 * @param llmJustification - Optional justification text from the LLM
 *   (currently unused).
 * @returns A promise resolving to the dummy reward `0.5`.
 */
export async function computeReward(
  fen: string,
  moveSAN: string,
  llmScore?: string,
  llmJustification?: string,
): Promise<number> {
  // TODO: Use real LLM feedback to compute reward.
  // Until then, every move receives the same dummy reward.
  const placeholderReward = 0.5;
  return placeholderReward;
}
|
||||
Loading…
Add table
Add a link
Reference in a new issue