Make eval max_token_length consistent with training config

Instead of hardcoding the value, this follows the pattern used by the other envs.
This commit is contained in:
Partho Das 2026-03-03 18:03:04 +05:30
parent bd98a82bbc
commit 5f52befd38

View file

@ -259,7 +259,7 @@ class MathEnv(BaseEnv):
completion = await managed.completion(
prompt=question,
n=1,
max_tokens=32765,
max_tokens=self.config.max_token_length,
temperature=0.0,
split="eval",
stop=stop_list,