requests
chardet
tqdm
scikit-learn
transformers
tokenizers
numpy

[all]
pypdf2
python-docx
ebooklib
beautifulsoup4
