mirror of
https://github.com/InternLM/InternBootcamp.git
synced 2026-04-22 16:49:04 +00:00
refactor(data_pipeline): optimize data generation pipeline; add multiple preset configurations for data generation
This commit is contained in:
parent
1a8477c8d8
commit
8d493b35a0
2160 changed files with 69199 additions and 154 deletions
30
examples/pipelines/all_configs/Bzgukistringz_train.json
Normal file
30
examples/pipelines/all_configs/Bzgukistringz_train.json
Normal file
|
|
@ -0,0 +1,30 @@
|
|||
[
|
||||
{
|
||||
"max_b_length": 2,
|
||||
"max_c_length": 3,
|
||||
"max_a_length": 10,
|
||||
"min_length": 1,
|
||||
"max_attempts": 2000
|
||||
},
|
||||
{
|
||||
"max_b_length": 6,
|
||||
"max_c_length": 7,
|
||||
"max_a_length": 25,
|
||||
"min_length": 2,
|
||||
"max_attempts": 1500
|
||||
},
|
||||
{
|
||||
"max_b_length": 3,
|
||||
"max_c_length": 4,
|
||||
"max_a_length": 15,
|
||||
"min_length": 1,
|
||||
"max_attempts": 500
|
||||
},
|
||||
{
|
||||
"max_b_length": 4,
|
||||
"max_c_length": 6,
|
||||
"max_a_length": 18,
|
||||
"min_length": 2,
|
||||
"max_attempts": 800
|
||||
}
|
||||
]
|
||||
Loading…
Add table
Add a link
Reference in a new issue