refactor(data_pipeline): optimize data generation pipeline; add multiple preset configurations for data generation

This commit is contained in:
chenyongkang 2025-08-26 18:40:21 +08:00
parent 1a8477c8d8
commit 8d493b35a0
2160 changed files with 69199 additions and 154 deletions

View file

@ -1,41 +0,0 @@
[
{
"min_n": 8,
"max_n": 30,
"attribute_descriptions": [
"top scorer",
"perfect health",
"satisfied customer",
"damaged goods",
"active lifestyle",
"excessive noise",
"full recovery"
]
},
{
"min_n": 3,
"max_n": 20,
"attribute_descriptions": [
"excellent performance",
"no diseases",
"content with product",
"faulty goods",
"consistent work",
"high pollution",
"successful surgery"
]
},
{
"min_n": 5,
"max_n": 50,
"attribute_descriptions": [
"math score above 90",
"healthy",
"satisfied with facilities",
"defective",
"daily exercise",
"speeding behavior",
"positive response"
]
}
]