LICENSE
README.md
pyproject.toml
src/intelli3Text.egg-info/PKG-INFO
src/intelli3Text.egg-info/SOURCES.txt
src/intelli3Text.egg-info/dependency_links.txt
src/intelli3Text.egg-info/entry_points.txt
src/intelli3Text.egg-info/requires.txt
src/intelli3Text.egg-info/top_level.txt
src/intelli3text/__init__.py
src/intelli3text/__main__.py
src/intelli3text/builder.py
src/intelli3text/config.py
src/intelli3text/errors.py
src/intelli3text/pipeline.py
src/intelli3text/utils.py
src/intelli3text.egg-info/PKG-INFO
src/intelli3text.egg-info/SOURCES.txt
src/intelli3text.egg-info/dependency_links.txt
src/intelli3text.egg-info/entry_points.txt
src/intelli3text.egg-info/requires.txt
src/intelli3text.egg-info/top_level.txt
src/intelli3text/cleaners/__init__.py
src/intelli3text/cleaners/base.py
src/intelli3text/cleaners/chain.py
src/intelli3text/cleaners/clean_text.py
src/intelli3text/cleaners/pdf_linebreaks.py
src/intelli3text/cleaners/unicode_ftfy.py
src/intelli3text/export/__init__.py
src/intelli3text/export/base.py
src/intelli3text/export/jsonl.py
src/intelli3text/export/pdf_reportlab.py
src/intelli3text/extractors/__init__.py
src/intelli3text/extractors/base.py
src/intelli3text/extractors/file_docx.py
src/intelli3text/extractors/file_pdfminer.py
src/intelli3text/extractors/file_text.py
src/intelli3text/extractors/web_trafilatura.py
src/intelli3text/lid/__init__.py
src/intelli3text/lid/base.py
src/intelli3text/lid/cld3_lid.py
src/intelli3text/lid/fasttext_lid.py
src/intelli3text/nlp/__init__.py
src/intelli3text/nlp/base.py
src/intelli3text/nlp/registry.py
src/intelli3text/nlp/spacy_normalizer.py
tests/test_cleaners.py
tests/test_pipeline_smoke.py