remove training code

2026-04-23 16:54:56 +00:00 · 2026-03-13 12:52:52 -04:00 · 2026-03-13 12:52:52 -04:00 · 148a4fd5eb
commit 148a4fd5eb
parent 862cd3667d
6 changed files with 38 additions and 329 deletions
--- a/example_trainer/cli.py
+++ b/example_trainer/cli.py
@@ -163,23 +163,6 @@ def add_grpo_args(parser: argparse.ArgumentParser) -> None:
        default=0.2,
        help="PPO-style clipping epsilon. Clips ratio to [1-eps, 1+eps].",
    )
-    group.add_argument(
-        "--distill-enabled",
-        action="store_true",
-        help="Enable teacher distillation loss (requires distill payload in Atropos batch).",
-    )
-    group.add_argument(
-        "--distill-coef",
-        type=float,
-        default=0.0,
-        help="Coefficient for distillation loss term.",
-    )
-    group.add_argument(
-        "--distill-temperature",
-        type=float,
-        default=1.0,
-        help="Temperature for teacher top-k distribution in distillation loss.",
-    )


 def add_vllm_args(parser: argparse.ArgumentParser) -> None:
@@ -441,9 +424,6 @@ def config_from_args(args: argparse.Namespace) -> TrainingConfig:
        checkpoint_interval=getattr(args, "checkpoint_interval", 3),
        # GRPO/PPO hyperparameters
        clip_eps=getattr(args, "clip_eps", 0.2),
-        distill_enabled=getattr(args, "distill_enabled", False),
-        distill_coef=getattr(args, "distill_coef", 0.0),
-        distill_temperature=getattr(args, "distill_temperature", 1.0),
        adafactor_scale_parameter=getattr(args, "adafactor_scale_parameter", False),
        adafactor_relative_step=getattr(args, "adafactor_relative_step", False),
        # vLLM settings