# Python dependencies in pip requirements-file format (one requirement per line).
#
# Exact version pins (`==`): pip installs precisely these releases.
# NOTE(review): presumably pinned together for mutual compatibility — confirm
# before bumping any one of them in isolation.
transformers==4.57.6
huggingface_hub==0.36.2
qwen_asr==0.0.6
# nemo_toolkit is requested with its `asr` and `tts` extras; no version
# constraint is given, so the installed release is chosen at install time.
nemo_toolkit[asr,tts]
# Everything below is unconstrained: the installed versions depend on what the
# resolver picks at install time, so environments built on different dates may differ.
# NOTE(review): jiwer / evaluate / Levenshtein / editdistance look like
# transcription-scoring helpers — confirm against the code that imports them.
jiwer
evaluate
Levenshtein
tqdm
editdistance
numpy
# NOTE(review): librosa / soundfile look like the audio loading dependencies — confirm.
librosa
soundfile
