Add note on code execution to CodeIODataset

This commit is contained in:
Oliver 2025-02-25 22:39:06 +00:00
parent ef2f8d1978
commit 4bdb8c7d6b

View file

@@ -63,6 +63,12 @@ class CodeIOConfig:
class CodeIODataset(ProceduralDataset):
"""
Use this dataset with caution: it involves executing arbitrary code snippets.
These snippets were produced by an LLM that transformed raw code files curated from high-quality sources.
Even so, there is still a risk that the LLM introduced code with harmful or unintended side effects.
"""
_jsonl_data: Optional[list] = None
def __init__(self, config: CodeIOConfig):