This commit is contained in:
Jai Suphavadeeprasit 2026-02-02 22:59:32 -05:00
parent 24b8ab8574
commit c8884348c7
8 changed files with 360 additions and 820 deletions

View file

@@ -92,6 +92,12 @@ class TrainingConfig(BaseModel):
# GPU memory utilization for the vLLM server; the description documents
# the intended range as 0.0-1.0.
vllm_gpu_memory_utilization: float = Field(
    default=0.45,
    description="GPU memory utilization for vLLM server (0.0-1.0)",
)
# Maximum context length for the vLLM server.
max_model_len: int = Field(
    default=4096,
    description="Maximum context length for vLLM server",
)
# Data type for model weights; the description lists bfloat16, float16
# and auto as the expected values.
dtype: str = Field(
    default="bfloat16",
    description="Data type for model weights (bfloat16, float16, auto)",
)
# === Weights & Biases Configuration ===
use_wandb: bool = Field(