numpy
scipy
soundfile
sounddevice
pydantic>=2
rich
sentence-transformers
litellm>=1.0
python-dotenv
json-repair
torch
scikit-learn
huggingface_hub>=0.20
transformers<5,>=4.57.0
tokenizers>=0.20.0
sentencepiece
laion-clap
torchvision

[expressive]
outlines
instructor

[expressive:platform_machine != "arm64" and sys_platform != "win32"]
llama-cpp-python

[expressive:sys_platform == "darwin" and platform_machine == "arm64"]
mlx
mlx-lm

[expressive:sys_platform == "linux"]
bitsandbytes
