rvc-models

Build error

App Files Files Community

Nix Seymour committed on Jun 2, 2023

Commit

02f3806

1 Parent(s): e710f1c

Update app.py

Browse files

Files changed (1) hide show

app.py +5 -5

app.py CHANGED Viewed

@@ -37,10 +37,10 @@ def create_vc_fn(tgt_sr, net_g, vc, if_f0, file_index, file_big_npy):
                 if tts_text is None or tts_voice is None:
                     return "You need to enter text and select a voice", None
                 asyncio.run(edge_tts.Communicate(tts_text, "-".join(tts_voice.split('-')[:-1])).save("tts.mp3"))
-                audio, sr = librosa.load("tts.mp3", sr=48000, mono=True)
             else:
                 if args.files:
-                    audio, sr = librosa.load(input_audio, sr=48000, mono=True)
                 else:
                     if input_audio is None:
                         return "You need to upload an audio", None
@@ -51,8 +51,8 @@ def create_vc_fn(tgt_sr, net_g, vc, if_f0, file_index, file_big_npy):
                     audio = (audio / np.iinfo(audio.dtype).max).astype(np.float32)
                     if len(audio.shape) > 1:
                         audio = librosa.to_mono(audio.transpose(1, 0))
-                    if sampling_rate != 16000:
-                        audio = librosa.resample(audio, orig_sr=sampling_rate, target_sr=16000)
             times = [0, 0, 0]
             f0_up_key = int(f0_up_key)
             audio_opt = vc.pipeline(
@@ -185,4 +185,4 @@ if __name__ == '__main__':
                             vc_output2 = gr.Audio(label="Output Audio")
                 vc_submit.click(vc_fn, [vc_input, vc_transpose, vc_f0method, vc_index_ratio, tts_mode, tts_text, tts_voice], [vc_output1, vc_output2])
                 tts_mode.change(change_to_tts_mode, [tts_mode], [vc_input, tts_text, tts_voice])
-        app.queue(concurrency_count=1, max_size=20, api_open=args.api, status_update_rate=10).launch(share=args.share)

                 if tts_text is None or tts_voice is None:
                     return "You need to enter text and select a voice", None
                 asyncio.run(edge_tts.Communicate(tts_text, "-".join(tts_voice.split('-')[:-1])).save("tts.mp3"))
+                audio, sr = librosa.load("tts.mp3", sr=24000, mono=True)
             else:
                 if args.files:
+                    audio, sr = librosa.load(input_audio, sr=24000, mono=True)
                 else:
                     if input_audio is None:
                         return "You need to upload an audio", None
                     audio = (audio / np.iinfo(audio.dtype).max).astype(np.float32)
                     if len(audio.shape) > 1:
                         audio = librosa.to_mono(audio.transpose(1, 0))
+                    if sampling_rate != 24000:
+                        audio = librosa.resample(audio, orig_sr=sampling_rate, target_sr=24000)
             times = [0, 0, 0]
             f0_up_key = int(f0_up_key)
             audio_opt = vc.pipeline(
                             vc_output2 = gr.Audio(label="Output Audio")
                 vc_submit.click(vc_fn, [vc_input, vc_transpose, vc_f0method, vc_index_ratio, tts_mode, tts_text, tts_voice], [vc_output1, vc_output2])
                 tts_mode.change(change_to_tts_mode, [tts_mode], [vc_input, tts_text, tts_voice])
+        app.queue(concurrency_count=3, max_size=20, api_open=args.api).launch(share=args.share)