# Python dependencies for this project.
# Install with: pip install -r <this file>
# pip's requirements format expects one requirement specifier per line.
librosa==0.8.0
transformers==4.22.2
ffmpeg-python
SpeechRecognition
pydub
gTTS
numpy
# NOTE(review): both OpenCV wheels below are listed. The opencv-python project
# README advises installing only ONE OpenCV variant per environment
# (opencv-contrib-python already ships the main modules). Kept as-is because
# other packages in this list may pull in opencv-python transitively -- confirm
# before removing either entry.
opencv-contrib-python
opencv-python
torchvision
tqdm
numba
basicsr>=1.4.2
facexlib>=0.2.5
lmdb
pyyaml
scipy
tb-nightly
torch>=1.7
yapf
realesrgan