mirror of
https://github.com/NousResearch/atropos.git
synced 2026-04-19 12:57:58 +00:00
- Trie-based solver, official scoring, normalized rewards - Configurable token limit and detailed README with dictionary download link - Removes large Dictionary.txt from tracking and adds ignore rules - All tests pass and pre-commit hooks are clean
75 lines
1.6 KiB
YAML
75 lines
1.6 KiB
YAML
# Word Hunt Environment Example Configuration
|
|
# Copy this file and modify as needed for your training runs
|
|
|
|
# Environment Configuration
|
|
env_name: "word_hunt_environment"
|
|
env_config:
|
|
# Core Training Parameters
|
|
group_size: 4
|
|
max_token_length: 2048
|
|
steps_per_eval: 100
|
|
boards_per_epoch: 50
|
|
|
|
# Game Parameters
|
|
board_size: 4
|
|
min_word_length: 3
|
|
max_word_length: 16
|
|
max_tokens_per_game: 100
|
|
|
|
# Board Generation
|
|
vowel_weight: 0.4
|
|
common_letter_bias: true
|
|
board_generation_method: "random_weighted"
|
|
|
|
# Scoring
|
|
use_official_scoring: true
|
|
normalize_scores: true
|
|
max_possible_score_estimate: 10000
|
|
|
|
# Validation
|
|
validate_words: true
|
|
validate_board_paths: true
|
|
|
|
# Prompt Configuration
|
|
prompt_style: "grid_visual" # Options: grid_visual, text_description, both
|
|
include_instructions: true
|
|
include_scoring_info: true
|
|
|
|
# Evaluation
|
|
eval_board_count: 10
|
|
eval_metrics: ["accuracy", "total_score", "word_count", "avg_word_length"]
|
|
|
|
# Logging
|
|
debug_mode: false
|
|
use_wandb: true
|
|
wandb_name: "word_hunt_training"
|
|
|
|
# Advanced Options
|
|
shuffle_boards: true
|
|
save_board_images: false
|
|
|
|
# Server Configuration (example)
|
|
server_configs:
|
|
- name: "openai"
|
|
server_type: "openai"
|
|
api_key: "${OPENAI_API_KEY}"
|
|
base_url: "https://api.openai.com/v1"
|
|
model: "gpt-4"
|
|
max_retries: 3
|
|
timeout: 60
|
|
|
|
# Training Parameters
|
|
training:
|
|
total_steps: 10000
|
|
batch_size: 512
|
|
learning_rate: 1e-5
|
|
warmup_steps: 100
|
|
gradient_accumulation_steps: 1
|
|
|
|
# Logging Configuration
|
|
logging:
|
|
log_level: "INFO"
|
|
save_checkpoints: true
|
|
checkpoint_interval: 1000
|
|
save_rollouts: false
|
|
rollout_save_interval: 500
|