mirror of
https://github.com/NousResearch/atropos.git
synced 2026-04-19 12:57:58 +00:00
- Moved environments/bleuberi to environments/community/bleuberi
- Updated .gitmodules to reflect new submodule path
- Fixed pre-commit formatting issues
- Cleaned up test output files
29 lines
760 B
YAML
29 lines
760 B
YAML
env:
|
|
# Standard environment configuration
|
|
wandb_name: bleuberi
|
|
dataset_name: "allenai/tulu-3-sft-mixture"
|
|
reward_funcs:
|
|
- "bleu"
|
|
ref_models:
|
|
- "gold"
|
|
# Use a tokenizer that's compatible with OpenAI models
|
|
tokenizer_name: "gpt2"
|
|
# Process more examples
|
|
max_train_examples: 20
|
|
max_test_examples: 10
|
|
group_size: 4
|
|
max_num_workers: 4
|
|
max_eval_workers: 2
|
|
total_steps: 5
|
|
|
|
server:
|
|
timeout: 1200
|
|
num_max_requests_at_once: 8
|
|
num_requests_for_eval: 16
|
|
server_type: "openai"
|
|
model_name: "gpt-4.1-nano" # Or your preferred model
|
|
base_url: "https://api.openai.com/v1" # Or your custom server URL
|
|
api_key: "${OPENAI_API_KEY}" # Will be loaded from environment variable
|
|
temperature: 0.7
|
|
max_tokens: 1024
|
|
top_p: 0.95
|