added updates

2026-04-30 17:40:45 +00:00 · 2025-03-29 08:07:57 +00:00 · 2025-03-29 08:07:57 +00:00 · 9f9f816902
commit 9f9f816902
parent 774d23664d
10 changed files with 461 additions and 503 deletions
--- a/training/configs/eval_spell_backward_no_curr.yaml
+++ b/training/configs/eval_spell_backward_no_curr.yaml
@@ -0,0 +1,25 @@
+# Model configuration
+model_path: utils/qwen2.5b_1.5_step312  # TODO(review): earlier note said "change to the smaller model" — confirm this is the intended checkpoint
+max_tokens: 1024  # Taken from max_response_length in the training config
+temperature: 0.7  # Lower temperature for more focused responses
+top_p: 0.9  # Taken from the rollout top_p
+developer_prompt: DeepSeekZero  # presumably a named prompt template resolved by the eval tool — verify
+developer_role: system  # Standard role for system prompts
+
+# Output configuration
+output_dir: eval_results  # relative path; base directory is not shown here
+save_metadata: true
+save_full_results: true
+eval_repeats: 3  # presumably the number of repeated evaluation runs — confirm
+
+# Categories and datasets to evaluate
+categories:
+  - category: reasoning
+    datasets:
+      - dataset: spell_backward
+        size: 100  # presumably the number of examples to evaluate — confirm
+        seed: 42  # fixed seed; presumably for reproducible sampling — confirm
+        params:
+          min_word_len: 3  # Taken from the training config
+          max_word_len: 10  # NOTE(review): not marked as from the training config — confirm it matches
+          data_file: holdout_words.txt  # name suggests a held-out word list — verify against training data