stream2sentence>=0.3.1
pydub>=0.25.1
pyaudio>=0.2.14
resampy==0.4.3

[all]
stream2sentence>=0.3.1
pydub>=0.25.1
pyaudio>=0.2.14
resampy==0.4.3
pyttsx3>=2.99
azure-cognitiveservices-speech>=1.48.2
elevenlabs>=2.39.0
openai>=2.29.0
gtts>=2.5.4
coqui_tts>=0.27.5
edge-tts>=7.2.7
kokoro>=0.9.4
camb-sdk>=1.5.8
requests>=2.32.0
cartesia==2.0.9
typecast-python>=0.2.0
faster-qwen3-tts>=0.2.4
snac>=1.2.1
omnivoice>=0.1.1
chatterbox-tts
sopro>=1.5.0
soprano-tts>=0.2.0
neutts
pocket-tts
torch
torchaudio
numpy
huggingface-hub>=0.36.0
safetensors
vocos
cn2an>=0.5.23
inflect
jieba>=0.42.1
lhotse
librosa
onnxruntime
piper_phonemize
pypinyin>=0.55.0
setuptools<81
tensorboard
transformers<=4.57.6
nltk
munch
PyYAML
phonemizer
transformers
soundfile>=0.13.1

[azure]
stream2sentence>=0.3.1
pydub>=0.25.1
pyaudio>=0.2.14
resampy==0.4.3
azure-cognitiveservices-speech>=1.48.2

[camb]
stream2sentence>=0.3.1
pydub>=0.25.1
pyaudio>=0.2.14
resampy==0.4.3
camb-sdk>=1.5.8

[cartesia]
stream2sentence>=0.3.1
pydub>=0.25.1
pyaudio>=0.2.14
resampy==0.4.3
cartesia==2.0.9

[chatterbox]
stream2sentence>=0.3.1
pydub>=0.25.1
pyaudio>=0.2.14
resampy==0.4.3
chatterbox-tts

[coqui]
stream2sentence>=0.3.1
pydub>=0.25.1
pyaudio>=0.2.14
resampy==0.4.3
coqui_tts>=0.27.5

[edge]
stream2sentence>=0.3.1
pydub>=0.25.1
pyaudio>=0.2.14
resampy==0.4.3
edge-tts>=7.2.7

[elevenlabs]
stream2sentence>=0.3.1
pydub>=0.25.1
pyaudio>=0.2.14
resampy==0.4.3
elevenlabs>=2.39.0

[gtts]
stream2sentence>=0.3.1
pydub>=0.25.1
pyaudio>=0.2.14
resampy==0.4.3
gtts>=2.5.4

[jp]
stream2sentence>=0.3.1
pydub>=0.25.1
pyaudio>=0.2.14
resampy==0.4.3
mecab-python3>=1.0.6
unidic-lite>=1.0.8
cutlet
fugashi>=1.4.0
jaconv>=0.4.0
mojimoji>=0.0.13
pyopenjtalk>=0.4.0

[ko]
stream2sentence>=0.3.1
pydub>=0.25.1
pyaudio>=0.2.14
resampy==0.4.3
hangul_romanize

[kokoro]
stream2sentence>=0.3.1
pydub>=0.25.1
pyaudio>=0.2.14
resampy==0.4.3
kokoro>=0.9.4

[luxtts]
stream2sentence>=0.3.1
pydub>=0.25.1
pyaudio>=0.2.14
resampy==0.4.3
cn2an>=0.5.23
inflect
jieba>=0.42.1
lhotse
librosa
numpy
onnxruntime
piper_phonemize
pypinyin>=0.55.0
safetensors
setuptools<81
tensorboard
torch
torchaudio
transformers<=4.57.6
vocos

[minimal]
stream2sentence>=0.3.1
pydub>=0.25.1
pyaudio>=0.2.14
resampy==0.4.3

[minimax]
stream2sentence>=0.3.1
pydub>=0.25.1
pyaudio>=0.2.14
resampy==0.4.3
requests>=2.32.0

[modelslab]
stream2sentence>=0.3.1
pydub>=0.25.1
pyaudio>=0.2.14
resampy==0.4.3
requests>=2.32.0

[moss]
stream2sentence>=0.3.1
pydub>=0.25.1
pyaudio>=0.2.14
resampy==0.4.3
numpy
soundfile>=0.13.1
torch
torchaudio
onnxruntime
huggingface-hub>=0.36.0
nltk

[moss-tts]
stream2sentence>=0.3.1
pydub>=0.25.1
pyaudio>=0.2.14
resampy==0.4.3
numpy
soundfile>=0.13.1
torch
torchaudio
onnxruntime
huggingface-hub>=0.36.0
nltk

[neutts]
stream2sentence>=0.3.1
pydub>=0.25.1
pyaudio>=0.2.14
resampy==0.4.3
neutts

[neutts-gguf]
stream2sentence>=0.3.1
pydub>=0.25.1
pyaudio>=0.2.14
resampy==0.4.3
neutts[llama,onnx]

[omnivoice]
stream2sentence>=0.3.1
pydub>=0.25.1
pyaudio>=0.2.14
resampy==0.4.3
omnivoice>=0.1.1

[openai]
stream2sentence>=0.3.1
pydub>=0.25.1
pyaudio>=0.2.14
resampy==0.4.3
openai>=2.29.0

[orpheus]
stream2sentence>=0.3.1
pydub>=0.25.1
pyaudio>=0.2.14
resampy==0.4.3
snac>=1.2.1

[parler]
stream2sentence>=0.3.1
pydub>=0.25.1
pyaudio>=0.2.14
resampy==0.4.3
torch
transformers

[piper]
stream2sentence>=0.3.1
pydub>=0.25.1
pyaudio>=0.2.14
resampy==0.4.3

[pocket]
stream2sentence>=0.3.1
pydub>=0.25.1
pyaudio>=0.2.14
resampy==0.4.3
pocket-tts
torch

[pockettts]
stream2sentence>=0.3.1
pydub>=0.25.1
pyaudio>=0.2.14
resampy==0.4.3
pocket-tts
torch

[qwen]
stream2sentence>=0.3.1
pydub>=0.25.1
pyaudio>=0.2.14
resampy==0.4.3
faster-qwen3-tts>=0.2.4

[soprano]
stream2sentence>=0.3.1
pydub>=0.25.1
pyaudio>=0.2.14
resampy==0.4.3
soprano-tts>=0.2.0

[sopro]
stream2sentence>=0.3.1
pydub>=0.25.1
pyaudio>=0.2.14
resampy==0.4.3
sopro>=1.5.0

[style]
stream2sentence>=0.3.1
pydub>=0.25.1
pyaudio>=0.2.14
resampy==0.4.3
torch
torchaudio
numpy
librosa
nltk
munch
PyYAML
phonemizer

[styletts]
stream2sentence>=0.3.1
pydub>=0.25.1
pyaudio>=0.2.14
resampy==0.4.3
torch
torchaudio
numpy
librosa
nltk
munch
PyYAML
phonemizer

[system]
stream2sentence>=0.3.1
pydub>=0.25.1
pyaudio>=0.2.14
resampy==0.4.3
pyttsx3>=2.99

[typecast]
stream2sentence>=0.3.1
pydub>=0.25.1
pyaudio>=0.2.14
resampy==0.4.3
typecast-python>=0.2.0

[zh]
stream2sentence>=0.3.1
pydub>=0.25.1
pyaudio>=0.2.14
resampy==0.4.3
pypinyin>=0.53.0
ordered_set>=4.1.0
jieba>=0.42.1
cn2an>=0.5.23

[zipvoice]
stream2sentence>=0.3.1
pydub>=0.25.1
pyaudio>=0.2.14
resampy==0.4.3
torch
torchaudio
numpy
huggingface-hub>=0.36.0
safetensors
vocos
