checkpointing fixes: enable gradient checkpointing in single-copy mode

2026-04-24 17:04:55 +00:00 · 2026-01-29 11:41:24 -05:00 · 2026-01-29 11:41:24 -05:00 · 04652fd97c
commit 04652fd97c
parent b9414e4076
1 changed file with 2 additions and 0 deletions
--- a/example_trainer/model.py
+++ b/example_trainer/model.py
@@ -48,6 +48,8 @@ def load_model_and_tokenizer(
        
        if model is not None:
            print("[Setup] ✓ Single-copy mode active - using vLLM's tensors directly!")
+            # Enable gradient checkpointing to save memory (was missing before!)
+            _setup_gradient_checkpointing(model, config)
            model.train()
            return model, tokenizer
        else: