atropos/environments/community/bleuberi/configs/openai.yaml
Allan Niemerg 0f6c06bb56 Move BLEUBERI environment to community folder
- Moved environments/bleuberi to environments/community/bleuberi
      - Updated .gitmodules to reflect new submodule path
      - Fixed pre-commit formatting issues
      - Cleaned up test output files
2025-09-08 14:38:43 -05:00

29 lines
760 B
YAML

env:
# Standard environment configuration
wandb_name: bleuberi
dataset_name: "allenai/tulu-3-sft-mixture"
reward_funcs:
- "bleu"
ref_models:
- "gold"
# Use a tokenizer that's compatible with OpenAI models
tokenizer_name: "gpt2"
# Process more examples
max_train_examples: 20
max_test_examples: 10
group_size: 4
max_num_workers: 4
max_eval_workers: 2
total_steps: 5
server:
timeout: 1200
num_max_requests_at_once: 8
num_requests_for_eval: 16
server_type: "openai"
model_name: "gpt-4.1-nano" # Or your preferred model
base_url: "https://api.openai.com/v1" # Or your custom server URL
api_key: "${OPENAI_API_KEY}" # Will be loaded from environment variable
temperature: 0.7
max_tokens: 1024
top_p: 0.95