gradio>=5.25.2
nltk>=3.8
librosa>=0.10
ffmpeg-python>=0.2
transformers[audio]>=4.33
torch>=2.1.0
torchaudio>=2.1.0
scipy>=1.11
munch>=2.5
accelerate>=1.2.0
soundfile>=0.13.0
ordered-set>=4.1.0
phonemizer-fork>=3.3.2
nemo_toolkit[asr]
faster-whisper>=1.1.1
chatterbox-tts