diff --git a/example_trainer/model.py b/example_trainer/model.py index 1e80788f..b67a4313 100644 --- a/example_trainer/model.py +++ b/example_trainer/model.py @@ -85,7 +85,7 @@ def _load_model_with_attention( # Should never reach here, but just in case raise RuntimeError("Failed to load model with any attention implementation") - + def load_model_and_tokenizer( config: TrainingConfig, single_copy: bool = False, @@ -258,7 +258,7 @@ def _attach_to_vllm_shared_tensors( print("[Setup] Single-copy mode not available (single_copy_enabled=False)") print("[Setup] Make sure vLLM was started with VLLM_ENABLE_SHARED_WEIGHTS=1") return None - # Get the IPC handles. from the bridge config. these are memory pointers to the space in memory that shared weights exist in + # Get IPC handles from bridge config - memory pointers to shared weight tensors ipc_handles_raw = bridge_config.get("ipc_handles", {}) print(f"[Setup] IPC handles count: {len(ipc_handles_raw)}") if not ipc_handles_raw: diff --git a/example_trainer/run.py b/example_trainer/run.py index a16f2bd8..85e30d60 100644 --- a/example_trainer/run.py +++ b/example_trainer/run.py @@ -88,7 +88,7 @@ def main(): # Clean up old bridge config if os.path.exists(bridge_config_path): os.remove(bridge_config_path) - print(f"[Run] Removed old bridge config") + print("[Run] Removed old bridge config") # === Print Configuration === print("\n" + "="*60) @@ -172,7 +172,7 @@ def main(): sys.exit(1) # === Start Trainer === - print(f"\n[Run] Starting GRPO trainer...") + print("\n[Run] Starting GRPO trainer...") # Build config - override some fields for shared_vllm mode config = TrainingConfig(