BLEUBERI/eval/arena-hard-v2.0
2025-06-04 20:36:43 +00:00
..
config initial commit 2025-06-04 20:36:43 +00:00
data initial commit 2025-06-04 20:36:43 +00:00
utils initial commit 2025-06-04 20:36:43 +00:00
gen_answer.py initial commit 2025-06-04 20:36:43 +00:00
gen_answer_local.py initial commit 2025-06-04 20:36:43 +00:00
gen_judgment.py initial commit 2025-06-04 20:36:43 +00:00
LICENSE initial commit 2025-06-04 20:36:43 +00:00
qa_browser.py initial commit 2025-06-04 20:36:43 +00:00
requirements-optional.txt initial commit 2025-06-04 20:36:43 +00:00
requirements.txt initial commit 2025-06-04 20:36:43 +00:00
run_arenahard_2.0.sh initial commit 2025-06-04 20:36:43 +00:00
show_result.py initial commit 2025-06-04 20:36:43 +00:00