From 2dff704f0b92b9d2e01bfe801ea5b47e2e10b6fa Mon Sep 17 00:00:00 2001
From: Oliver
Date: Mon, 28 Apr 2025 22:48:45 +0100
Subject: [PATCH] cfg

---
Reviewer notes (this area is ignored by `git am`):
- The hunk adds a `checkpoint` mapping whose `contents` list is
  ['model', 'optimizer', 'extra'], placed between
  `ulysses_sequence_parallel_size` and `optim`.
- NOTE(review): this patch was recovered from a copy in which all line
  breaks and runs of spaces had been collapsed. The leading indentation
  of the hunk lines below is reconstructed (2-space steps, context keys
  assumed one mapping level below `actor_rollout_ref:`) -- TODO confirm
  against the target file. If the context does not match, try
  `git apply --ignore-whitespace`.

 .../external_generalisation/math_curriculum_qwen_7b.yaml | 2 ++
 1 file changed, 2 insertions(+)

diff --git a/training/configs/external_generalisation/math_curriculum_qwen_7b.yaml b/training/configs/external_generalisation/math_curriculum_qwen_7b.yaml
index 0a32a24c..1cc5ee57 100644
--- a/training/configs/external_generalisation/math_curriculum_qwen_7b.yaml
+++ b/training/configs/external_generalisation/math_curriculum_qwen_7b.yaml
@@ -94,6 +94,8 @@ actor_rollout_ref:
     ppo_epochs: 1
     shuffle: False
     ulysses_sequence_parallel_size: 1 # sp size
+    checkpoint:
+      contents: ['model', 'optimizer', 'extra']
     optim:
       lr: 1e-6
       lr_warmup_steps_ratio: 0. # the total steps will be injected during runtime