Make preserving think blocks optional

2026-04-19 12:57:58 +00:00 · 2026-03-04 15:44:12 -06:00 · 2026-03-04 15:44:12 -06:00 · f4875c5dc6
commit f4875c5dc6
parent 12d61d197f
3 changed files with 22 additions and 8 deletions
--- a/atroposlib/envs/server_handling/server_manager.py
+++ b/atroposlib/envs/server_handling/server_manager.py
@@ -384,6 +384,7 @@ class ServerManager:
        self,
        tokenizer=None,
        base_url: Optional[str] = None,
+        preserve_think_blocks: bool = False,
    ):
        """
        Context manager that provides a ManagedServer instance.
@@ -397,10 +398,13 @@ class ServerManager:

        Args:
            tokenizer: Optional tokenizer to use. If not provided, will attempt to
-                      extract from server or create from model name.
+                        extract from server or create from model name.
            base_url: Pin the session to a specific backend server by its base_url.
-                     In production, this comes from the atropos API's server allocation.
-
+                        In production, this comes from the atropos API's server allocation.
+            preserve_think_blocks: If True, preserves <think> blocks in assistant messages,
+                        which are sometimes stripped by chat templates. Defaults to False.
+                        Usually not needed, since the chat template should be configured
+                        to preserve thinking blocks until a user message arrives.
        Yields:
            ManagedServer, DummyManagedServer, or ProxyManagedServer instance

@@ -502,6 +506,7 @@ class ServerManager:
                server=selected_server,
                tokenizer=tokenizer,
                tool_parser=self.tool_parser,
+                preserve_think_blocks=preserve_think_blocks,
            )

            try: