# Optional audio dependencies: audio loading/conversion, speech-to-text (STT)
# and text-to-speech (TTS).
# pip requires exactly one requirement per line; a "#" starts a comment that
# runs to the end of the line.

# Core audio handling
pydub>=0.25.1
librosa>=0.10.1
ffmpeg>=1.4
yt_dlp>=2024.10.22
wavio>=0.0.8

# Audio speed-up and slowdown (best quality); if not installed, can only speed up, with lower quality
# pyrubberband>=0.3.0
# stackoverflow.com/questions/75813603/python-working-with-sound-librosa-and-pyrubberband-conflict
# pip uninstall -y pysoundfile soundfile
soundfile==0.12.1

# Optional: Only for testing for now
# playsound==1.3.0

# STT from microphone (may not be required if ffmpeg installed above)

# for any TTS:
torchaudio
soundfile>=0.12.1

# GPU Only: for Coqui XTTS (ensure CUDA_HOME set and consistent with added postfix for extra-index):
# relaxed versions to avoid conflicts
# TTS
# deepspeed
noisereduce
emoji
ffmpeg-python
trainer
pysbd
coqpit

# for Coqui XTTS language helpers (specific versions probably not required)
cutlet>=0.3.0
langid>=1.1.6
g2pkk>=0.1.2
jamo>=0.4.1
gruut[de,es,fr]>=2.2.3
jieba>=0.42.1

# librosa==0.10.1

# For faster whisper:
# git+https://github.com/SYSTRAN/faster-whisper.git