diff --git a/.gitmodules b/.gitmodules index 94df3e16..59964cff 100644 --- a/.gitmodules +++ b/.gitmodules @@ -7,6 +7,6 @@ [submodule "environments/game_environments/diplomacy_environment/AI_Diplomacy"] path = environments/game_environments/diplomacy_environment/AI_Diplomacy url = https://github.com/GoodStartLabs/AI_Diplomacy.git -[submodule "environments/bleuberi/bleuberi-repo"] - path = environments/bleuberi/bleuberi-repo +[submodule "environments/community/bleuberi/bleuberi-repo"] + path = environments/community/bleuberi/bleuberi-repo url = https://github.com/lilakk/BLEUBERI.git diff --git a/environments/bleuberi/README.md b/environments/community/bleuberi/README.md similarity index 100% rename from environments/bleuberi/README.md rename to environments/community/bleuberi/README.md diff --git a/environments/bleuberi/__init__.py b/environments/community/bleuberi/__init__.py similarity index 100% rename from environments/bleuberi/__init__.py rename to environments/community/bleuberi/__init__.py diff --git a/environments/bleuberi/bleuberi-repo b/environments/community/bleuberi/bleuberi-repo similarity index 100% rename from environments/bleuberi/bleuberi-repo rename to environments/community/bleuberi/bleuberi-repo diff --git a/environments/bleuberi/bleuberi_env.py b/environments/community/bleuberi/bleuberi_env.py similarity index 98% rename from environments/bleuberi/bleuberi_env.py rename to environments/community/bleuberi/bleuberi_env.py index 500d145c..b3536252 100644 --- a/environments/bleuberi/bleuberi_env.py +++ b/environments/community/bleuberi/bleuberi_env.py @@ -169,10 +169,10 @@ class BLEUBERIEnv(BaseEnv): dataset_split="train", reward_funcs=["bleu"], ref_models=["gold"], - max_train_examples=2, - max_test_examples=1, - max_num_workers=2, - max_eval_workers=1, + max_train_examples=20, # 10x increase from 2 to 20 + max_test_examples=10, # 10x increase from 1 to 10 + max_num_workers=4, # Increased workers to handle more examples + max_eval_workers=2, # Increased eval workers data_path_to_save_groups="bleuberi_openai_test.jsonl", ) @@ -182,9 +182,9 @@ class BLEUBERIEnv(BaseEnv): model_name="gpt-4.1-nano", base_url="https://api.openai.com/v1", api_key=api_key, - timeout=60, - num_max_requests_at_once=4, - num_requests_for_eval=4, + timeout=120, # Increased timeout to handle more requests + num_max_requests_at_once=8, # Increased from 4 to 8 for more parallelism + num_requests_for_eval=8, # Increased from 4 to 8 ), ] diff --git a/environments/bleuberi/configs/default.yaml b/environments/community/bleuberi/configs/default.yaml similarity index 100% rename from environments/bleuberi/configs/default.yaml rename to environments/community/bleuberi/configs/default.yaml diff --git a/environments/bleuberi/configs/openai.yaml b/environments/community/bleuberi/configs/openai.yaml similarity index 80% rename from environments/bleuberi/configs/openai.yaml rename to environments/community/bleuberi/configs/openai.yaml index e38bb278..8711169b 100644 --- a/environments/bleuberi/configs/openai.yaml +++ b/environments/community/bleuberi/configs/openai.yaml @@ -8,6 +8,13 @@ env: - "gold" # Use a tokenizer that's compatible with OpenAI models tokenizer_name: "gpt2" + # Process more examples + max_train_examples: 20 + max_test_examples: 10 + group_size: 4 + max_num_workers: 4 + max_eval_workers: 2 + total_steps: 5 server: timeout: 1200 diff --git a/environments/bleuberi/requirements.txt b/environments/community/bleuberi/requirements.txt similarity index 100% rename from environments/bleuberi/requirements.txt rename to environments/community/bleuberi/requirements.txt