mirror of
https://github.com/NousResearch/atropos.git
synced 2026-04-23 16:54:56 +00:00
math zero 32k
This commit is contained in:
parent
74d46aaa76
commit
7d96367516
1 changed files with 3 additions and 0 deletions
|
|
@ -250,6 +250,7 @@ CUDA_VISIBLE_DEVICES=$SHARED_GPU python -m example_trainer.grpo \
|
|||
--batch-size $BATCH_SIZE \
|
||||
--training-steps $TRAINING_STEPS \
|
||||
--max-model-len $MAX_MODEL_LEN \
|
||||
--seq-len $MAX_MODEL_LEN \
|
||||
--save-path "$LOG_DIR/checkpoints_shared" \
|
||||
$WANDB_ARGS --wandb-group "shared-vllm" \
|
||||
--benchmark \
|
||||
|
|
@ -281,6 +282,7 @@ CUDA_VISIBLE_DEVICES=$LORA_ONLY_GPU python -m example_trainer.grpo \
|
|||
--batch-size $BATCH_SIZE \
|
||||
--training-steps $TRAINING_STEPS \
|
||||
--max-model-len $MAX_MODEL_LEN \
|
||||
--seq-len $MAX_MODEL_LEN \
|
||||
--lora-r 16 \
|
||||
--lora-alpha 32 \
|
||||
--vllm-restart-interval 5 \
|
||||
|
|
@ -304,6 +306,7 @@ CUDA_VISIBLE_DEVICES=$LORA_RESTART_GPU python -m example_trainer.grpo \
|
|||
--batch-size $BATCH_SIZE \
|
||||
--training-steps $TRAINING_STEPS \
|
||||
--max-model-len $MAX_MODEL_LEN \
|
||||
--seq-len $MAX_MODEL_LEN \
|
||||
--lora-r 16 \
|
||||
--lora-alpha 32 \
|
||||
--vllm-restart-interval 5 \
|
||||
|
|
|
|||
Loading…
Add table
Add a link
Reference in a new issue