| .. |
|
__init__.py
|
dev - push for submission
|
2025-05-18 17:50:15 -07:00 |
|
conversational_style_dpo_env.py
|
dev - push for submission
|
2025-05-18 17:50:15 -07:00 |
|
gsm8k_dpo_rollouts.jsonl
|
pushing jsonl files
|
2025-05-18 17:56:27 -07:00 |
|
gsm8k_dpo_rollouts_1.html
|
dev - push for submission
|
2025-05-18 17:50:15 -07:00 |
|
gsm8k_dpo_rollouts_1.jsonl
|
pushing jsonl files
|
2025-05-18 17:56:27 -07:00 |
|
gsm8k_dpo_rollouts_2.html
|
dev - push for submission
|
2025-05-18 17:50:15 -07:00 |
|
gsm8k_dpo_rollouts_2.jsonl
|
pushing jsonl files
|
2025-05-18 17:56:27 -07:00 |
|
gsm8k_dpo_rollouts_3.jsonl
|
pushing jsonl files
|
2025-05-18 17:56:27 -07:00 |
|
gsm8k_dpo_rollouts_4.html
|
dev - push for submission
|
2025-05-18 17:50:15 -07:00 |
|
gsm8k_dpo_rollouts_4.jsonl
|
pushing jsonl files
|
2025-05-18 17:56:27 -07:00 |
|
gsm8k_dpo_rollouts_5.jsonl
|
pushing jsonl files
|
2025-05-18 17:56:27 -07:00 |
|
gsm8k_dpo_rollouts_6.html
|
dev - push for submission
|
2025-05-18 17:50:15 -07:00 |
|
gsm8k_dpo_rollouts_6.jsonl
|
pushing jsonl files
|
2025-05-18 17:56:27 -07:00 |
|
gsm8k_dpo_rollouts_7.jsonl
|
pushing jsonl files
|
2025-05-18 17:56:27 -07:00 |
|
gsm8k_dpo_rollouts_8.html
|
dev - push for submission
|
2025-05-18 17:50:15 -07:00 |
|
gsm8k_dpo_rollouts_8.jsonl
|
pushing jsonl files
|
2025-05-18 17:56:27 -07:00 |
|
gsm8k_dpo_rollouts_9.html
|
dev - push for submission
|
2025-05-18 17:50:15 -07:00 |
|
gsm8k_dpo_rollouts_9.jsonl
|
pushing jsonl files
|
2025-05-18 17:56:27 -07:00 |
|
gsm8k_dpo_rollouts_10.jsonl
|
pushing jsonl files
|
2025-05-18 17:56:27 -07:00 |
|
gsm8k_dpo_rollouts_11.jsonl
|
pushing jsonl files
|
2025-05-18 17:56:27 -07:00 |
|
gsm8k_dpo_rollouts_12.jsonl
|
pushing jsonl files
|
2025-05-18 17:56:27 -07:00 |
|
gsm8k_dpo_rollouts_13.jsonl
|
pushing jsonl files
|
2025-05-18 17:56:27 -07:00 |
|
gsm8k_dpo_rollouts_14.jsonl
|
pushing jsonl files
|
2025-05-18 17:56:27 -07:00 |
|
gsm8k_dpo_rollouts_15.html
|
dev - push for submission
|
2025-05-18 17:50:15 -07:00 |
|
gsm8k_dpo_rollouts_15.jsonl
|
pushing jsonl files
|
2025-05-18 17:56:27 -07:00 |
|
gsmk8k_conversational_style_dpo_env.py
|
dev - push for submission
|
2025-05-18 17:50:15 -07:00 |
|
requirements.txt
|
dev - push for submission
|
2025-05-18 17:50:15 -07:00 |
|
train_dpo_conversational.py
|
dev - push for submission
|
2025-05-18 17:50:15 -07:00 |