Add note on code execution to CodeIODataset

This commit is contained in:
Oliver 2025-02-25 22:39:06 +00:00
parent ef2f8d1978
commit 4bdb8c7d6b

View file

@ -63,6 +63,12 @@ class CodeIOConfig:
class CodeIODataset(ProceduralDataset): class CodeIODataset(ProceduralDataset):
"""
Exercise some caution when using this dataset, as it involves executing arbitrary code snippets.
These code snippets are transformed by an LLM from raw code files which have been curated from high-quality sources.
However, there is still a risk that the LLM could have introduced code with harmful or unintended side effects when executed.
"""
_jsonl_data: Optional[list] = None _jsonl_data: Optional[list] = None
def __init__(self, config: CodeIOConfig): def __init__(self, config: CodeIOConfig):