mirror of
https://github.com/NousResearch/atropos.git
synced 2026-04-26 17:13:09 +00:00
Merge pull request #253 from NousResearch/rop/gen-params
group temps, sample temps, and logprob api params
This commit is contained in:
commit
36243bd3f4
5 changed files with 84 additions and 13 deletions
|
|
@ -134,6 +134,8 @@ The API documentation (Swagger UI) will be available at `http://<your-server-ip>
|
|||
scores: List[float]
|
||||
advantages: Optional[List[List[float]]] = None
|
||||
ref_logprobs: Optional[List[List[float]]] = None
|
||||
inference_logprobs: Optional[List[List[float]]] = None
|
||||
generation_params: Optional[Dict[str, Any]] = None
|
||||
messages: Optional[List[List[Message]]] = None
|
||||
overrides: Optional[List[dict]] = None # Per-item logging overrides
|
||||
group_overrides: Optional[dict] = None # Group logging overrides
|
||||
|
|
@ -154,7 +156,7 @@ The API documentation (Swagger UI) will be available at `http://<your-server-ip>
|
|||
* Not enough data: `{"batch": null}`
|
||||
* `GET /latest_example`
|
||||
* **Description:** Debug endpoint to retrieve the most recently added `ScoredData` item.
|
||||
* **Response:** The last `ScoredData` dictionary pushed, or empty lists for tokens, masks, scores, advantages, ref_logprobs, messages, and images if none yet.
|
||||
* **Response:** The last `ScoredData` dictionary pushed, or empty lists for tokens, masks, scores, advantages, ref_logprobs, inference_logprobs, generation_params, messages, and images if none yet.
|
||||
|
||||
### Debugging
|
||||
|
||||
|
|
|
|||
|
|
@ -70,6 +70,8 @@ class ScoredData(BaseModel):
|
|||
messages: Optional[List[List[Dict[str, Any]]]] = (
|
||||
None # Changed from Message TypedDict to Dict
|
||||
)
|
||||
generation_params: Optional[Dict[str, Any]] = None
|
||||
inference_logprobs: Optional[List[List[float]]] = None
|
||||
overrides: Optional[List[dict]] = None
|
||||
group_overrides: Optional[dict] = None
|
||||
images: Optional[Any] = None
|
||||
|
|
@ -267,6 +269,8 @@ async def get_latest_example():
|
|||
"scores": [],
|
||||
"advantages": [],
|
||||
"ref_logprobs": [],
|
||||
"generation_params": [],
|
||||
"inference_logprobs": [],
|
||||
"messages": [],
|
||||
"images": [],
|
||||
}
|
||||
|
|
@ -281,6 +285,8 @@ async def scored_data(scored_data: ScoredData):
|
|||
"advantages": scored_data.advantages,
|
||||
"ref_logprobs": scored_data.ref_logprobs,
|
||||
"messages": scored_data.messages,
|
||||
"generation_params": scored_data.generation_params,
|
||||
"inference_logprobs": scored_data.inference_logprobs,
|
||||
"overrides": scored_data.overrides,
|
||||
"group_overrides": scored_data.group_overrides,
|
||||
"images": scored_data.images,
|
||||
|
|
@ -343,6 +349,8 @@ async def scored_data_list(scored_data_list: List[ScoredData]):
|
|||
"ref_logprobs": scored_data.ref_logprobs,
|
||||
"images": scored_data.images,
|
||||
"messages": scored_data.messages,
|
||||
"generation_params": scored_data.generation_params,
|
||||
"inference_logprobs": scored_data.inference_logprobs,
|
||||
"overrides": scored_data.overrides,
|
||||
"group_overrides": scored_data.group_overrides,
|
||||
"env_id": scored_data.env_id,
|
||||
|
|
|
|||
Loading…
Add table
Add a link
Reference in a new issue