# Audio requirements that are always installed
pydub>=0.25.1
librosa>=0.10.1
# NOTE(review): the PyPI "ffmpeg" distribution is not the ffmpeg binary, and it appears to share the
# top-level `ffmpeg` module name with ffmpeg-python (required later in this file) - confirm both are intended.
ffmpeg>=1.4
yt_dlp>=2024.10.22
wavio>=0.0.8
# Optional: pyrubberband gives the best-quality audio speed-up and slow-down.
# If it is not installed, only speed-up is available, at lower quality.
# pyrubberband>=0.3.0
# Known librosa / pyrubberband conflict, see:
# stackoverflow.com/questions/75813603/python-working-with-sound-librosa-and-pyrubberband-conflict
# Manual shell step (not a requirement line), run before installing the pinned soundfile below:
#   pip uninstall -y pysoundfile soundfile
soundfile==0.12.1
# Optional: only for testing for now
# playsound==1.3.0
# STT from microphone: no package is listed for this (may not be required if ffmpeg installed above)
# For any TTS:
torchaudio
# Same pin as the soundfile entry earlier in this file; repeating a package with a different
# specifier (previously >=0.12.1) is redundant and may be rejected by older pip resolvers.
soundfile==0.12.1
# GPU only: for Coqui XTTS (ensure CUDA_HOME is set and consistent with the postfix added for extra-index).
# Versions are left relaxed to avoid conflicts.
# TTS
# deepspeed
noisereduce
emoji
ffmpeg-python
trainer
pysbd
coqpit
# For Coqui XTTS language helpers (specific versions are probably not required)
cutlet>=0.3.0
langid>=1.1.6
g2pkk>=0.1.2
jamo>=0.4.1
gruut[de,es,fr]>=2.2.3
jieba>=0.42.1
# Disabled exact pin; librosa>=0.10.1 is already required at the top of this file.
# librosa==0.10.1
# For faster-whisper (disabled; uncomment the next line to install it from the Git repository):
# git+https://github.com/SYSTRAN/faster-whisper.git