refactor(data_pipeline): optimize data generation pipeline; add multiple preset configurations for data generation

This commit is contained in:
chenyongkang 2025-08-26 18:40:21 +08:00
parent 1a8477c8d8
commit 8d493b35a0
2160 changed files with 69199 additions and 154 deletions

View file

@ -0,0 +1,32 @@
[
{
"affix_type": "prefix",
"min_segments": 2,
"max_segments": 5
},
{
"affix_type": "prefix",
"min_segments": 2,
"max_segments": 4
},
{
"affix_type": "random",
"min_segments": 4,
"max_segments": 5
},
{
"affix_type": "suffix",
"min_segments": 2,
"max_segments": 4
},
{
"affix_type": "random",
"min_segments": 3,
"max_segments": 5
},
{
"affix_type": "random",
"min_segments": 2,
"max_segments": 3
}
]