pymupdf>=1.23
pdfplumber>=0.10
pdf2docx>=0.5
python-docx>=1.1
python-pptx>=0.6
pandas>=2.1
openpyxl>=3.1
pillow>=10.0
lxml>=5.0
numpy>=1.26
scikit-learn>=1.3
langdetect>=1.0

[all]
openai>=1.0
anthropic>=0.25
pytesseract>=0.3

[dev]
pytest>=8.0
pytest-cov
ruff
mypy
build
twine

[llm]
openai>=1.0
anthropic>=0.25

[ocr]
pytesseract>=0.3

[ocr-paddle]
paddleocr>=2.7
