mirror of
https://github.com/NousResearch/atropos.git
synced 2026-04-19 12:57:58 +00:00
add this to our pyproject
This commit is contained in:
parent
ce85c7d95e
commit
fb3228f669
2 changed files with 9 additions and 3 deletions
|
|
@@ -8,8 +8,8 @@ A modular training framework for fine-tuning language models with **Group Relati
|
|||
|
||||
```
|
||||
example_trainer/
|
||||
├── grpo.py # CLI entry point (dispatches to 4 training modes)
|
||||
├── run.py # Unified launcher for shared_vllm mode (starts vLLM+trainer)
|
||||
├── grpo.py # CLI entry point (also exposed as `atropos-grpo`)
|
||||
├── run.py # Unified shared_vllm launcher (also exposed as `atropos-grpo-run`)
|
||||
├── config.py # TrainingConfig Pydantic model (all hyperparameters)
|
||||
├── cli.py # CLI argument parsing (modular, single source of truth)
|
||||
├── api.py # Atropos API communication (registration, batch fetching)
|
||||
|
|
@@ -27,6 +27,10 @@ example_trainer/
|
|||
└── math_zero_lora.yaml # Config for math_server_zero.py (lora mode)
|
||||
```
|
||||
|
||||
After `pip install -e .` from the repository root, you can launch with either:
|
||||
- `python -m example_trainer.grpo` or `atropos-grpo`
|
||||
- `python -m example_trainer.run` or `atropos-grpo-run`
|
||||
|
||||
|
||||
## GRPO Training Loop
|
||||
|
||||
|
|
|
|||
|
|
@@ -35,6 +35,8 @@ view-run = "atroposlib.cli.view_run:main"
|
|||
view-run-multimodal = "atroposlib.cli.view_run_multimodal:main"
|
||||
atropos-sft-gen = "atroposlib.cli.sft:main"
|
||||
atropos-dpo-gen = "atroposlib.cli.dpo:main"
|
||||
atropos-grpo = "example_trainer.grpo:main"
|
||||
atropos-grpo-run = "example_trainer.run:main"
|
||||
|
||||
[project.optional-dependencies]
|
||||
all = [
|
||||
|
|
@@ -67,4 +69,4 @@ requires = ["hatchling"]
|
|||
build-backend = "hatchling.build"
|
||||
|
||||
[tool.hatch.build.targets.wheel]
|
||||
packages = ["atroposlib"]
|
||||
packages = ["atroposlib", "example_trainer"]
|
||||
|
|
|
|||
Loading…
Add table
Add a link
Reference in a new issue