python versioning problems

This commit is contained in:
Jai Suphavadeeprasit 2026-02-03 11:23:53 -05:00
parent db5eba8fd2
commit 04f2850980
4 changed files with 5 additions and 105 deletions

View file

@@ -47,10 +47,6 @@ from dataclasses import dataclass, field
from pathlib import Path
from typing import Any, List, Optional
# =============================================================================
# CRITICAL: Set up multiprocessing and vLLM engine BEFORE any CUDA imports
# =============================================================================
# Default to v0 engine to avoid CUDA fork issues with v1 engine
# Users can override with VLLM_USE_V1=1 if needed
os.environ.setdefault("VLLM_USE_V1", "0")
@@ -168,11 +164,6 @@ except ImportError:
logger = init_logger("vllm.entrypoints.api_server")
# =============================================================================
# Global State
# =============================================================================
app = FastAPI()
engine: Optional[AsyncLLM] = None