fix(envs): Add source dataset and index to metadata (#388)

* add source dataset and index to metadata

* fix typo

* fix coach class and its test
This commit is contained in:
Zafir Stojanovski 2025-03-20 12:12:14 +01:00 committed by GitHub
parent c6d01541aa
commit 4c47527130
104 changed files with 549 additions and 146 deletions

View file

@ -9,6 +9,8 @@ from typing import Optional
from ..coaching import BaseCurriculum, RangeAttributeDefinition
from ..factory import ProceduralDataset, register_dataset
DATASET_NAME = "gcd"
@dataclass
class GCDConfig:
@ -62,6 +64,8 @@ class GCDDataset(ProceduralDataset):
"question": f"Find the Greatest Common Divisor (GCD) of these numbers: {numbers_str}. Give only the GCD as your final answer.",
"answer": str(result),
"metadata": {
"source_dataset": DATASET_NAME,
"source_index": idx,
"numbers": numbers,
"result": result,
"num_terms": num_terms,
@ -96,4 +100,4 @@ class GCDCurriculum(BaseCurriculum):
)
register_dataset("gcd", GCDDataset, GCDConfig)
register_dataset(DATASET_NAME, GCDDataset, GCDConfig)