math zero ymls

This commit is contained in:
Jai Suphavadeeprasit 2026-02-04 17:52:16 -05:00
parent 19248ed5b4
commit a9ebdc50b8
2 changed files with 42 additions and 0 deletions

View file

@ -0,0 +1,21 @@
env:
tokenizer_name: "Qwen/Qwen3-4B-Instruct-2507"
rollout_server_url: "http://localhost:8001"
max_token_length: 8192
start_tok_length: 8192
group_size: 8
batch_size: 64
total_steps: 120
steps_per_eval: 20
use_wandb: true
wandb_name: "math-zero-shared-env"
eval_limit_ratio: 0.1
max_num_workers_per_node: 24
openai:
base_url: "http://localhost:9001/v1"
model_name: "Qwen/Qwen3-4B-Instruct-2507"
server_type: "vllm"
api_key: "x"
num_requests_for_eval: 256
weight: 1.0