requests
beautifulsoup4
scikit-learn
numpy
click
chardet

[all]
pdfminer.six
python-docx
ebooklib
transformers
tokenizers

[docx]
python-docx

[epub]
ebooklib

[hf]
transformers
tokenizers

[pdf]
pdfminer.six
