mirror of
https://github.com/NousResearch/atropos.git
synced 2026-04-19 12:57:58 +00:00
initial commit
This commit is contained in:
parent
81b2d4daab
commit
cc9b891eba
2 changed files with 234 additions and 0 deletions
|
|
@@ -145,6 +145,9 @@ class ScoredData(BaseModel):
|
|||
group_overrides: Optional[dict] = None
|
||||
images: Optional[Any] = None
|
||||
env_id: Optional[int] = None # ID of the environment that generated this data
|
||||
# On-policy distillation: top-K logprobs from teacher model
|
||||
# Structure: [sequence][position][top_k] = [token_id, logprob]
|
||||
onpolicydistill_logprobs: Optional[List[List[List[List]]]] = None
|
||||
|
||||
@field_validator("messages", mode="before")
|
||||
@classmethod
|
||||
|
|
@@ -182,6 +185,7 @@ def _scored_data_to_dict(scored_data: ScoredData) -> Dict[str, Any]:
|
|||
"group_overrides": scored_data.group_overrides,
|
||||
"images": scored_data.images,
|
||||
"env_id": scored_data.env_id,
|
||||
"onpolicydistill_logprobs": scored_data.onpolicydistill_logprobs,
|
||||
}
|
||||
|
||||
|
||||
|
|
|
|||
Loading…
Add table
Add a link
Reference in a new issue