changes based on torchtitan

2026-04-19 12:57:58 +00:00 · 2025-12-28 12:27:29 -05:00 · 2025-12-28 12:27:29 -05:00 · 53b29472b4
commit 53b29472b4
parent 078dd4a333
7 changed files with 1535 additions and 1977 deletions
--- a/example_trainer/vllm_patching/__init__.py
+++ b/example_trainer/vllm_patching/__init__.py
@@ -0,0 +1,37 @@
+"""
+vLLM Patching Module - Enables shared memory weight updates.
+
+This module patches vLLM's GPUModelRunner to:
+1. Call share_memory_() on model weights after loading
+2. Spawn a daemon process that receives NCCL weight updates from trainers
+3. Enable real-time weight synchronization without restarting vLLM
+
+Usage:
+    # Import this BEFORE importing vllm
+    from example_trainer.vllm_patching import apply_patches
+    apply_patches()
+    
+    # Then import vllm normally
+    from vllm import AsyncLLM
+"""
+
+from .patched_gpu_runner import PatchedGPUModelRunner, apply_patches
+from .weight_updater import weight_updater_process
+from .distributed_utils import (
+    init_process_group,
+    broadcast_object_list,
+    get_inference_urls,
+    get_json_data,
+)
+
+__all__ = [
+    "PatchedGPUModelRunner",
+    "apply_patches",
+    "weight_updater_process",
+    "init_process_group",
+    "broadcast_object_list",
+    "get_inference_urls",
+    "get_json_data",
+]
+
+