fsspec==2023.3.0
pyarrow<=12.0.0
pandas==2.0.0
datasets==2.11.0
loguru
tabulate
tqdm
jsonargparse[signatures]
matplotlib
emoji==2.2.0
regex
requests
wget
zstandard
lz4
pdfplumber
plotly
python-docx
streamlit
spacy==3.5.0
multiprocess==0.70.12
dill==0.3.4
scipy
boto3
simhash-py
gluonnlp
mxnet
numpy==1.23.1
selectolax
ftfy
nlpaug

[all]
fsspec==2023.3.0
pyarrow<=12.0.0
pandas==2.0.0
datasets==2.11.0
loguru
tabulate
tqdm
jsonargparse[signatures]
matplotlib
emoji==2.2.0
regex
requests
wget
zstandard
lz4
pdfplumber
plotly
python-docx
streamlit
spacy==3.5.0
multiprocess==0.70.12
dill==0.3.4
scipy
boto3
simhash-py
gluonnlp
mxnet
numpy==1.23.1
selectolax
ftfy
nlpaug
fasttext-wheel
kenlm
sentencepiece
nlpcda
nltk
transformers
opencc==1.1.6
imagededup
torch
dlib
spacy-pkuseg==0.0.32
ray
pre-commit
sphinx
sphinx-autobuild
sphinx_rtd_theme
recommonmark
fire
jsonlines
pyspark

[dev]
pre-commit
sphinx
sphinx-autobuild
sphinx_rtd_theme
recommonmark

[dist]
ray

[mini]
fsspec==2023.3.0
pyarrow<=12.0.0
pandas==2.0.0
datasets==2.11.0
loguru
tabulate
tqdm
jsonargparse[signatures]
matplotlib
emoji==2.2.0
regex
requests
wget
zstandard
lz4
pdfplumber
plotly
python-docx
streamlit
spacy==3.5.0
multiprocess==0.70.12
dill==0.3.4
scipy
boto3
simhash-py
gluonnlp
mxnet
numpy==1.23.1
selectolax
ftfy
nlpaug

[sci]
fasttext-wheel
kenlm
sentencepiece
scipy
ftfy
simhash-py
selectolax
nlpaug
nlpcda
nltk
transformers
opencc==1.1.6
imagededup
torch
dlib
spacy-pkuseg==0.0.32

[tools]
fire
jsonlines
pyspark
wget
