LICENSE
MANIFEST.in
README.md
parallel_corpus_mnbvc.py
requirements.txt
setup.py
alignment/__init__.py
alignment/batch_detector.py
alignment/batch_sequential_detector.py
alignment/batch_sequential_for_one_file.py
alignment/evaluate_segmentation.py
alignment/rule_based_detector.py
alignment/text_segmenter.py
alignment/utils.py
alignment/script/__init__.py
alignment/script/gpt_helper.py
alignment/script/preprocess.py
download_data/__init__.py
download_data/download_un_corpus.py
download_data/about_sitemap/__init__.py
download_data/about_sitemap/download_after_2000_year_pdf_to_loacl.py
download_data/about_sitemap/download_all_pdf_url.py
download_data/about_sitemap/get_pdf_link_information.py
parallel_corpus_mnbvc.egg-info/PKG-INFO
parallel_corpus_mnbvc.egg-info/SOURCES.txt
parallel_corpus_mnbvc.egg-info/dependency_links.txt
parallel_corpus_mnbvc.egg-info/requires.txt
parallel_corpus_mnbvc.egg-info/top_level.txt