numpy<2.0.0,>=1.21.0
pandas<3.0.0,>=1.3.0
scipy<2.0.0,>=1.7.0
scikit-learn<2.0.0,>=1.0.0
transformers<5.0.0,>=4.20.0
sentence-transformers<3.0.0,>=2.2.0
torch<3.0.0,>=1.12.0
nltk<4.0.0,>=3.7
spacy<4.0.0,>=3.4.0
rouge-score<1.0.0,>=0.1.0
bert-score<1.0.0,>=0.3.0
openai<2.0.0,>=1.0.0
anthropic<1.0.0,>=0.3.0
langchain<1.0.0,>=0.1.0
langchain-openai<1.0.0,>=0.1.0
langchain-anthropic<1.0.0,>=0.1.0
langsmith<1.0.0,>=0.1.0
aiohttp<4.0.0,>=3.8.0
tenacity<9.0.0,>=8.0.0
statsmodels<1.0.0,>=0.13.0
matplotlib<4.0.0,>=3.5.0
seaborn<1.0.0,>=0.11.0
plotly<6.0.0,>=5.0.0
pydantic<3.0.0,>=2.0.0
typer<1.0.0,>=0.9.0
rich<14.0.0,>=13.0.0
tqdm<5.0.0,>=4.64.0
python-dotenv<2.0.0,>=1.0.0
pyyaml<7.0,>=6.0
jsonschema<5.0.0,>=4.0.0
pillow<11.0.0,>=9.0.0
opencv-python<5.0.0,>=4.5.0
librosa<1.0.0,>=0.9.0
datasets<3.0.0,>=2.0.0
evaluate<1.0.0,>=0.4.0

[all]
evalx[dev,production,research]

[dev]
pytest<8.0.0,>=7.0.0
pytest-asyncio<1.0.0,>=0.21.0
pytest-cov<5.0.0,>=4.0.0
black<25.0.0,>=22.0.0
isort<6.0.0,>=5.10.0
flake8<8.0.0,>=5.0.0
mypy<2.0.0,>=1.0.0
pre-commit<4.0.0,>=2.20.0

[production]
redis<6.0.0,>=4.0.0
celery<6.0.0,>=5.2.0
prometheus-client<1.0.0,>=0.15.0
sentry-sdk<2.0.0,>=1.0.0

[research]
jupyter<2.0.0,>=1.0.0
ipywidgets<9.0.0,>=8.0.0
datasets<3.0.0,>=2.0.0
wandb<1.0.0,>=0.13.0
mlflow<3.0.0,>=2.0.0
