mirror of
https://github.com/NousResearch/atropos.git
synced 2026-04-22 16:48:57 +00:00
fix: correct dataset name to bigcode/humanevalpack
This commit is contained in:
parent
590e8a1ef2
commit
5c2afa8ea7
2 changed files with 6 additions and 6 deletions
|
|
@ -2,7 +2,7 @@
|
|||
Code Debug Environment for Atropos
|
||||
|
||||
Trains LLMs to debug and fix buggy Python functions.
|
||||
Uses the HumanEvalFix dataset with execution-based verification
|
||||
Uses the HumanEvalPack dataset (HumanEvalFix subset) with execution-based verification
|
||||
against ground-truth test cases.
|
||||
|
||||
Environment pattern follows sql_query_env for consistency.
|
||||
|
|
@ -162,11 +162,11 @@ class CodeDebugEnv(BaseEnv):
|
|||
await super().wandb_log(wandb_metrics)
|
||||
|
||||
async def setup(self):
|
||||
"""Load the HumanEvalFix dataset and prepare train/test splits."""
|
||||
"""Load the HumanEvalPack dataset (HumanEvalFix) and prepare train/test splits."""
|
||||
from datasets import load_dataset
|
||||
|
||||
print("Loading HumanEvalFix dataset...")
|
||||
dataset = load_dataset("bigcode/humanevalfix-python", split="test")
|
||||
print("Loading HumanEvalPack (python) dataset...")
|
||||
dataset = load_dataset("bigcode/humanevalpack", "python", split="test")
|
||||
|
||||
all_items: List[CodeDebugItem] = []
|
||||
for row in dataset:
|
||||
|
|
|
|||
Loading…
Add table
Add a link
Reference in a new issue