|
__init__.py
|
initial commit
|
2025-06-04 20:36:43 +00:00 |
|
clean_sharegpt.py
|
initial commit
|
2025-06-04 20:36:43 +00:00 |
|
convert_alpaca.py
|
initial commit
|
2025-06-04 20:36:43 +00:00 |
|
extract_gpt4_only.py
|
initial commit
|
2025-06-04 20:36:43 +00:00 |
|
extract_single_round.py
|
initial commit
|
2025-06-04 20:36:43 +00:00 |
|
filter_wrong_format.py
|
initial commit
|
2025-06-04 20:36:43 +00:00 |
|
get_stats.py
|
initial commit
|
2025-06-04 20:36:43 +00:00 |
|
hardcoded_questions.py
|
initial commit
|
2025-06-04 20:36:43 +00:00 |
|
inspect_data.py
|
initial commit
|
2025-06-04 20:36:43 +00:00 |
|
merge.py
|
initial commit
|
2025-06-04 20:36:43 +00:00 |
|
optional_clean.py
|
initial commit
|
2025-06-04 20:36:43 +00:00 |
|
optional_replace.py
|
initial commit
|
2025-06-04 20:36:43 +00:00 |
|
prepare_all.py
|
initial commit
|
2025-06-04 20:36:43 +00:00 |
|
pretty_json.py
|
initial commit
|
2025-06-04 20:36:43 +00:00 |
|
sample.py
|
initial commit
|
2025-06-04 20:36:43 +00:00 |
|
split_long_conversation.py
|
initial commit
|
2025-06-04 20:36:43 +00:00 |
|
split_train_test.py
|
initial commit
|
2025-06-04 20:36:43 +00:00 |