refactor(data_pipeline): optimize data generation pipeline; add multiple preset configurations for data generation

This commit is contained in:
chenyongkang 2025-08-26 18:40:21 +08:00
parent 1a8477c8d8
commit 8d493b35a0
2160 changed files with 69199 additions and 154 deletions

View file

@ -0,0 +1,22 @@
[
{
"yes_prob": 0.7,
"case_type": "YES",
"max_n": 100000
},
{
"yes_prob": 0.8,
"case_type": "NO",
"max_n": 200000
},
{
"yes_prob": 0.2,
"case_type": "None",
"max_n": 150000
},
{
"yes_prob": 0.3,
"case_type": "None",
"max_n": 200000
}
]