Add group temps, sample temps, and logprob API params

This commit is contained in:
ropresearch 2025-09-25 16:41:58 -04:00
parent efc6b55f0a
commit c3fc68879c
4 changed files with 65 additions and 12 deletions

View file

@@ -59,6 +59,8 @@ class ScoredDataGroup(TypedDict):
advantages: Optional[List[List[float]]]
ref_logprobs: Optional[List[List[float]]]
messages: Optional[List[List[Message]]]
generation_params: Optional[Dict[str, Any]]
inference_logprobs: Optional[List[List[float]]]
group_overrides: Optional[Dict]
overrides: Optional[List[Dict]]
images: Optional[Any]