CHANGES.rst
DESCRIPTION.rst
LICENSE
MANIFEST.in
README.md
setup.py
src/ldc/__init__.py
src/ldc/class_lister.py
src/ldc/core.py
src/ldc/help.py
src/ldc/registry.py
src/ldc/text_utils.py
src/ldc/utils.py
src/ldc/api/__init__.py
src/ldc/api/_downloader.py
src/ldc/api/_filter.py
src/ldc/api/_io.py
src/ldc/api/pretrain.py
src/ldc/api/translation.py
src/ldc/api/supervised/__init__.py
src/ldc/api/supervised/classification.py
src/ldc/api/supervised/pairs.py
src/ldc/downloader/__init__.py
src/ldc/downloader/_huggingface.py
src/ldc/filter/__init__.py
src/ldc/filter/_assemble_sentences.py
src/ldc/filter/_change_case.py
src/ldc/filter/_file_filter.py
src/ldc/filter/_find_substr.py
src/ldc/filter/_inspect.py
src/ldc/filter/_keyword.py
src/ldc/filter/_llama2_to_pairs.py
src/ldc/filter/_max_records.py
src/ldc/filter/_metadata.py
src/ldc/filter/_metadata_from_name.py
src/ldc/filter/_pairs_to_llama2.py
src/ldc/filter/_pairs_to_pretrain.py
src/ldc/filter/_pretrain_sentences_to_classification.py
src/ldc/filter/_pretrain_sentences_to_pairs.py
src/ldc/filter/_randomize_records.py
src/ldc/filter/_record_files.py
src/ldc/filter/_record_window.py
src/ldc/filter/_remove_blocks.py
src/ldc/filter/_remove_empty.py
src/ldc/filter/_remove_patterns.py
src/ldc/filter/_replace_patterns.py
src/ldc/filter/_reset_ids.py
src/ldc/filter/_skip_duplicate_ids.py
src/ldc/filter/_skip_duplicate_text.py
src/ldc/filter/_split_records.py
src/ldc/filter/_tee.py
src/ldc/filter/_text_length.py
src/ldc/filter/_text_stats.py
src/ldc/filter/_to_llama2_format.py
src/ldc/filter/_translation_to_pairs.py
src/ldc/filter/_translation_to_pretrain.py
src/ldc/pretrain/__init__.py
src/ldc/pretrain/_csv.py
src/ldc/pretrain/_jsonlines.py
src/ldc/pretrain/_max_length.py
src/ldc/pretrain/_parquet.py
src/ldc/pretrain/_sentences.py
src/ldc/pretrain/_split.py
src/ldc/pretrain/_txt.py
src/ldc/supervised/__init__.py
src/ldc/supervised/classification/__init__.py
src/ldc/supervised/classification/_classification_label_map.py
src/ldc/supervised/classification/_csv.py
src/ldc/supervised/classification/_jsonlines.py
src/ldc/supervised/classification/_parquet.py
src/ldc/supervised/pairs/__init__.py
src/ldc/supervised/pairs/_alpaca.py
src/ldc/supervised/pairs/_csv.py
src/ldc/supervised/pairs/_jsonlines.py
src/ldc/supervised/pairs/_parquet.py
src/ldc/supervised/pairs/_update_pair_data.py
src/ldc/supervised/pairs/_xtuner.py
src/ldc/tool/__init__.py
src/ldc/tool/append.py
src/ldc/tool/convert.py
src/ldc/tool/download.py
src/ldc/tool/file_encoding.py
src/ldc/tool/find.py
src/ldc/tool/help.py
src/ldc/tool/paste.py
src/ldc/translation/__init__.py
src/ldc/translation/_csv.py
src/ldc/translation/_jsonlines.py
src/ldc/translation/_language.py
src/ldc/translation/_parquet.py
src/ldc/translation/_require_languages.py
src/ldc/translation/_txt.py
src/llm_dataset_converter.egg-info/PKG-INFO
src/llm_dataset_converter.egg-info/SOURCES.txt
src/llm_dataset_converter.egg-info/dependency_links.txt
src/llm_dataset_converter.egg-info/entry_points.txt
src/llm_dataset_converter.egg-info/requires.txt
src/llm_dataset_converter.egg-info/top_level.txt