# Python dependencies for this project.
# pip requirements format: one requirement specifier per line.
# Install with: pip install -r <this file>
#
# Entries with a version constraint (torch, numpy, moviepy, transformers)
# keep exactly the constraint they had before; all other packages are unpinned.
torch==2.1.0
numpy<2.0.0
audiofile
num2words
huggingface_hub
cached_path
einops
flask
librosa
moviepy==1.0.3
sentencepiece
omegaconf
opencv-python
soundfile
transformers==4.49.0
audresample
srt
nltk
phonemizer
python-docx
uroman