diff --git a/atroposlib/cli/inference_node_wandb_watcher.py b/atroposlib/cli/inference_node_wandb_watcher.py index b5f5fc45..2ef77520 100644 --- a/atroposlib/cli/inference_node_wandb_watcher.py +++ b/atroposlib/cli/inference_node_wandb_watcher.py @@ -2,6 +2,7 @@ import argparse import time import requests + import wandb diff --git a/atroposlib/envs/base.py b/atroposlib/envs/base.py index 595a8d83..2e9c9fe6 100644 --- a/atroposlib/envs/base.py +++ b/atroposlib/envs/base.py @@ -16,7 +16,6 @@ from typing import Any, Dict, List, Optional, Tuple, TypedDict, Union import aiohttp import jsonlines import numpy as np -import wandb import yaml from pydantic import BaseModel, Field from pydantic_cli import Cmd, FailedExecutionException, run_and_exit @@ -24,6 +23,7 @@ from rich import print as rprint from tenacity import retry, stop_after_attempt, wait_random_exponential from transformers import AutoTokenizer +import wandb from atroposlib.envs.constants import ENV_NAMESPACE, NAMESPACE_SEP, OPENAI_NAMESPACE from atroposlib.envs.server_handling.openai_server import resolve_openai_configs from atroposlib.frontend.jsonl2html import generate_html diff --git a/environments/community/goofy_math/goofy_math_server.py b/environments/community/goofy_math/goofy_math_server.py index c10073a6..d12086b7 100644 --- a/environments/community/goofy_math/goofy_math_server.py +++ b/environments/community/goofy_math/goofy_math_server.py @@ -2,12 +2,12 @@ import asyncio import random from typing import Dict, List, Optional, Tuple, TypedDict, Union -import wandb from datasets import load_dataset from latex2sympy2_extended import NormalizationConfig from math_verify import LatexExtractionConfig, parse, verify from tqdm.asyncio import tqdm_asyncio +import wandb from atroposlib.envs.base import ( APIServerConfig, BaseEnv, diff --git a/environments/community/lean_proof_env/lean_env.py b/environments/community/lean_proof_env/lean_env.py index f9c5660b..bb6acb55 100644 --- a/environments/community/lean_proof_env/lean_env.py +++ b/environments/community/lean_proof_env/lean_env.py @@ -2,10 +2,10 @@ import asyncio # For async operations if PyPantograph is async import random from typing import Dict, List, Optional, Tuple, TypedDict -import wandb # For wandb.Table from datasets import load_dataset from tqdm.asyncio import tqdm_asyncio # For progress bars in evaluate +import wandb # For wandb.Table from atroposlib.envs.base import ( APIServerConfig, BaseEnv, diff --git a/environments/community/mcp_tool_calling/grpo.py b/environments/community/mcp_tool_calling/grpo.py index 38273153..fa7fca76 100644 --- a/environments/community/mcp_tool_calling/grpo.py +++ b/environments/community/mcp_tool_calling/grpo.py @@ -13,12 +13,13 @@ import numpy as np import requests import torch import torch.nn.functional as F -import wandb # Added for logging from pydantic import BaseModel, Field from tenacity import retry, stop_after_attempt, wait_exponential from torch.optim import AdamW from transformers import AutoModelForCausalLM, AutoTokenizer +import wandb # Added for logging + # Global variable to keep track of the vLLM process vllm_process = None diff --git a/environments/community/mcp_tool_calling/tool_calling_server.py b/environments/community/mcp_tool_calling/tool_calling_server.py index 3c765c72..d705cad6 100644 --- a/environments/community/mcp_tool_calling/tool_calling_server.py +++ b/environments/community/mcp_tool_calling/tool_calling_server.py @@ -3,10 +3,10 @@ import random import re from typing import Dict, List, Optional, Tuple, Union -import wandb from datasets import load_dataset from tqdm.asyncio import tqdm_asyncio +import wandb from atroposlib.envs.base import ( APIServerConfig, BaseEnv, diff --git a/environments/community/meteorology_forecast/meteorology_env.py b/environments/community/meteorology_forecast/meteorology_env.py index 552c86fc..481c59f1 100644 --- a/environments/community/meteorology_forecast/meteorology_env.py +++ b/environments/community/meteorology_forecast/meteorology_env.py @@ -9,9 +9,9 @@ from dataclasses import dataclass from pathlib import Path from typing import Any, Dict, List, Optional, Tuple -import wandb from pydantic import Field +import wandb from atroposlib.envs.base import ( APIServer, APIServerConfig, diff --git a/environments/community/options_iv_prediction/options_iv_prediction.py b/environments/community/options_iv_prediction/options_iv_prediction.py index 16d7b9fe..247c9389 100644 --- a/environments/community/options_iv_prediction/options_iv_prediction.py +++ b/environments/community/options_iv_prediction/options_iv_prediction.py @@ -3,11 +3,11 @@ import re from typing import Dict, List, Optional, Tuple, Union import pandas as pd -import wandb from datasets import Dataset from tqdm.asyncio import tqdm_asyncio from yahooquery import Ticker +import wandb from atroposlib.envs.base import ( APIServerConfig, BaseEnv, diff --git a/environments/community/padres_spatial/spatial_env.py b/environments/community/padres_spatial/spatial_env.py index b098b521..e4e3231d 100644 --- a/environments/community/padres_spatial/spatial_env.py +++ b/environments/community/padres_spatial/spatial_env.py @@ -9,9 +9,10 @@ from typing import Any, Dict, List, Optional import pybullet as p import pybullet_data -import wandb import websockets +import wandb + # LLM Service Import from .llm_services import get_anthropic_completion diff --git a/environments/community/philosophical_rlaif_env.py b/environments/community/philosophical_rlaif_env.py index 04d98266..b07df44d 100644 --- a/environments/community/philosophical_rlaif_env.py +++ b/environments/community/philosophical_rlaif_env.py @@ -3,10 +3,10 @@ import random import re # Added import for regular expressions from typing import Dict, List, Optional, Tuple -import wandb # type: ignore from datasets import load_dataset # type: ignore from pydantic import Field +import wandb # type: ignore from atroposlib.envs.base import BaseEnvConfig # Ensure BaseEnvConfig is imported from atroposlib.envs.base import ( APIServerConfig, diff --git a/environments/community/physical_space_stl/grpo.py b/environments/community/physical_space_stl/grpo.py index 144a9d81..1cf4be39 100644 --- a/environments/community/physical_space_stl/grpo.py +++ b/environments/community/physical_space_stl/grpo.py @@ -15,12 +15,13 @@ import numpy as np import requests import torch import torch.nn.functional as F -import wandb # Added for logging from pydantic import BaseModel, Field from tenacity import retry, stop_after_attempt, wait_exponential from torch.optim import AdamW from transformers import AutoModelForCausalLM, AutoTokenizer +import wandb # Added for logging + # Global variable to keep track of the vLLM process vllm_process = None diff --git a/environments/community/protein_design/protein_env.py b/environments/community/protein_design/protein_env.py index 6897d2b4..2bacd28a 100644 --- a/environments/community/protein_design/protein_env.py +++ b/environments/community/protein_design/protein_env.py @@ -5,12 +5,12 @@ import uuid from pathlib import Path from typing import Any, Dict, List, Optional, Tuple, TypedDict -import wandb import yaml from datasets import Dataset, load_dataset from dotenv import load_dotenv from pydantic import Field +import wandb from atroposlib.envs.base import ( APIServerConfig, BaseEnv, diff --git a/environments/community/wikipedia_research/tool_calling_server.py b/environments/community/wikipedia_research/tool_calling_server.py index e14bc717..752bbc39 100644 --- a/environments/community/wikipedia_research/tool_calling_server.py +++ b/environments/community/wikipedia_research/tool_calling_server.py @@ -3,10 +3,10 @@ import random import re from typing import Dict, List, Optional, Tuple, Union -import wandb from datasets import load_dataset from tqdm.asyncio import tqdm_asyncio +import wandb from atroposlib.envs.base import ( APIServerConfig, BaseEnv, diff --git a/environments/community/wikipedia_research/wikipedia_article_creator.py b/environments/community/wikipedia_research/wikipedia_article_creator.py index 342e62c1..b0a0a34c 100644 --- a/environments/community/wikipedia_research/wikipedia_article_creator.py +++ b/environments/community/wikipedia_research/wikipedia_article_creator.py @@ -25,7 +25,6 @@ except ImportError: ) import wandb - from atroposlib.envs.base import ( APIServerConfig, BaseEnv, diff --git a/environments/fundamental_prediction_environment.py b/environments/fundamental_prediction_environment.py index 7eda4110..c345e6b7 100644 --- a/environments/fundamental_prediction_environment.py +++ b/environments/fundamental_prediction_environment.py @@ -2,10 +2,10 @@ import random import re from typing import Dict, List, Optional, Tuple, Union -import wandb from datasets import load_dataset from tqdm.asyncio import tqdm_asyncio +import wandb from atroposlib.envs.base import ( APIServerConfig, BaseEnv, diff --git a/environments/instruction_following_algorithm_environment.py b/environments/instruction_following_algorithm_environment.py index 8735f3f8..4ee7c981 100644 --- a/environments/instruction_following_algorithm_environment.py +++ b/environments/instruction_following_algorithm_environment.py @@ -3,12 +3,12 @@ import random import re from typing import Dict, List, Optional, Tuple -import wandb from datasets import Dataset, load_dataset from langdetect import LangDetectException, detect from pydantic import Field from tqdm.asyncio import tqdm_asyncio +import wandb from atroposlib.envs.base import ( APIServerConfig, BaseEnv, diff --git a/environments/math_server.py b/environments/math_server.py index 8235f0e5..aafcefc5 100644 --- a/environments/math_server.py +++ b/environments/math_server.py @@ -5,7 +5,6 @@ from concurrent.futures import ProcessPoolExecutor from difflib import SequenceMatcher from typing import Dict, List, Optional, Tuple -import wandb from datasets import load_dataset from latex2sympy2_extended import NormalizationConfig from math_verify import LatexExtractionConfig, parse, verify @@ -13,6 +12,7 @@ from math_verify.errors import TimeoutException from pydantic import Field from tqdm.asyncio import tqdm_asyncio +import wandb from atroposlib.envs.base import ( APIServerConfig, BaseEnv, diff --git a/environments/math_server_zero.py b/environments/math_server_zero.py index bee1c37e..17e81ccf 100644 --- a/environments/math_server_zero.py +++ b/environments/math_server_zero.py @@ -9,7 +9,6 @@ import re from concurrent.futures import ProcessPoolExecutor from typing import Dict, List, Optional, Tuple -import wandb from datasets import load_dataset from latex2sympy2_extended import NormalizationConfig from math_verify import LatexExtractionConfig, parse, verify @@ -17,6 +16,7 @@ from math_verify.errors import TimeoutException from pydantic import Field from tqdm.asyncio import tqdm_asyncio +import wandb from atroposlib.envs.base import ( BaseEnv, BaseEnvConfig, diff --git a/environments/mcp_env.py b/environments/mcp_env.py index a8d621bc..dc2a5055 100644 --- a/environments/mcp_env.py +++ b/environments/mcp_env.py @@ -1,10 +1,10 @@ import json from typing import Dict, List, Optional, Tuple, Union -import wandb from datasets import load_dataset from tqdm.asyncio import tqdm_asyncio +import wandb from atroposlib.envs.base import ( APIServerConfig, BaseEnv, diff --git a/environments/mcqa_thinking_env.py b/environments/mcqa_thinking_env.py index f584f715..1c37a611 100644 --- a/environments/mcqa_thinking_env.py +++ b/environments/mcqa_thinking_env.py @@ -2,10 +2,10 @@ import random import re from typing import Dict, List, Optional, Tuple, Union -import wandb from datasets import load_dataset from tqdm.asyncio import tqdm_asyncio +import wandb from atroposlib.envs.base import ( APIServerConfig, BaseEnv, diff --git a/environments/rlaif_server.py b/environments/rlaif_server.py index c50ad10a..a2aa3647 100644 --- a/environments/rlaif_server.py +++ b/environments/rlaif_server.py @@ -3,9 +3,9 @@ import copy import random from typing import Dict, List, Optional, Tuple -import wandb from datasets import load_dataset +import wandb from atroposlib.envs.base import ( APIServerConfig, BaseEnv, diff --git a/environments/swe_rl_env.py b/environments/swe_rl_env.py index e3331199..b610e18e 100644 --- a/environments/swe_rl_env.py +++ b/environments/swe_rl_env.py @@ -14,11 +14,11 @@ import uuid # Import uuid module from difflib import SequenceMatcher from typing import Dict, List, Optional, Tuple, Union -import wandb from datasets import load_dataset # Ensured import load_dataset is present from pydantic import Field from tqdm.asyncio import tqdm_asyncio +import wandb from atroposlib.envs.base import ( APIServerConfig, BaseEnv, diff --git a/environments/tool_calling_server.py b/environments/tool_calling_server.py index 7de921aa..a6d8633b 100644 --- a/environments/tool_calling_server.py +++ b/environments/tool_calling_server.py @@ -3,10 +3,10 @@ import random import re from typing import Dict, List, Optional, Tuple, Union -import wandb from datasets import load_dataset from tqdm.asyncio import tqdm_asyncio +import wandb from atroposlib.envs.base import ( APIServerConfig, BaseEnv, diff --git a/environments/tool_use_interleaved_thinking.py b/environments/tool_use_interleaved_thinking.py index f4e61d8b..f10a6485 100644 --- a/environments/tool_use_interleaved_thinking.py +++ b/environments/tool_use_interleaved_thinking.py @@ -18,7 +18,6 @@ from __future__ import annotations import asyncio import json import logging -import logging import os import re from typing import Dict, List, Optional, Tuple, Union diff --git a/example_trainer/grpo.py b/example_trainer/grpo.py index 38273153..fa7fca76 100644 --- a/example_trainer/grpo.py +++ b/example_trainer/grpo.py @@ -13,12 +13,13 @@ import numpy as np import requests import torch import torch.nn.functional as F -import wandb # Added for logging from pydantic import BaseModel, Field from tenacity import retry, stop_after_attempt, wait_exponential from torch.optim import AdamW from transformers import AutoModelForCausalLM, AutoTokenizer +import wandb # Added for logging + # Global variable to keep track of the vLLM process vllm_process = None