sovits-teio

Running

App Files Community

kenshin20080 committed on Jun 14, 2023

Commit

fafb1c4

1 Parent(s): 95c435a

Update app.py

Browse files

Files changed (1) hide show

app.py +5 -5

app.py CHANGED Viewed

@@ -41,15 +41,15 @@ def create_vc_fn(model, sid):
             soundfile.write(raw_path, audio, 16000, format="wav")
             raw_path.seek(0)
             out_audio, out_sr = model.infer(sid, vc_transform, raw_path,
-                                            auto_predict_f0=auto_f0, F0_mean_pooling=True
                                             )
             return "Success", (44100, out_audio.cpu().numpy())
         if input_audio is None:
             return "You need to upload an audio", None
         sampling_rate, audio = input_audio
         duration = audio.shape[0] / sampling_rate
-        if duration > 60 and limitation:
-            return "Please upload an audio file that is less than 60 seconds. If you need to generate a longer audio file, please use Colab.", None
         audio = (audio / np.iinfo(audio.dtype).max).astype(np.float32)
         if len(audio.shape) > 1:
             audio = librosa.to_mono(audio.transpose(1, 0))
@@ -59,7 +59,7 @@ def create_vc_fn(model, sid):
         soundfile.write(raw_path, audio, 16000, format="wav")
         raw_path.seek(0)
         out_audio, out_sr = model.infer(sid, vc_transform, raw_path,
-                                       auto_predict_f0=auto_f0, F0_mean_pooling=True
                                        )
         return "Success", (44100, out_audio.cpu().numpy())
     return vc_fn
@@ -114,7 +114,7 @@ if __name__ == '__main__':
                         )
                     with gr.Row():
                         with gr.Column():
-                            vc_input = gr.Audio(label="Input audio"+' (less than 20 seconds)' if limitation else '')
                             vc_transform = gr.Number(label="vc_transform", value=0)
                             auto_f0 = gr.Checkbox(label="auto_f0", value=False)
                             tts_mode = gr.Checkbox(label="tts (use edge-tts as input)", value=False)

             soundfile.write(raw_path, audio, 16000, format="wav")
             raw_path.seek(0)
             out_audio, out_sr = model.infer(sid, vc_transform, raw_path,
+                                            auto_predict_f0=auto_f0, F0_mean_pooling=True,
                                             )
             return "Success", (44100, out_audio.cpu().numpy())
         if input_audio is None:
             return "You need to upload an audio", None
         sampling_rate, audio = input_audio
         duration = audio.shape[0] / sampling_rate
+        if duration > 120 and limitation:
+            return "Please upload an audio file that is less than 120 seconds. If you need to generate a longer audio file, please use Colab.", None
         audio = (audio / np.iinfo(audio.dtype).max).astype(np.float32)
         if len(audio.shape) > 1:
             audio = librosa.to_mono(audio.transpose(1, 0))
         soundfile.write(raw_path, audio, 16000, format="wav")
         raw_path.seek(0)
         out_audio, out_sr = model.infer(sid, vc_transform, raw_path,
+                                       auto_predict_f0=auto_f0, F0_mean_pooling=True,
                                        )
         return "Success", (44100, out_audio.cpu().numpy())
     return vc_fn
                         )
                     with gr.Row():
                         with gr.Column():
+                            vc_input = gr.Audio(label="Input audio"+' (less than 120 seconds)' if limitation else '')
                             vc_transform = gr.Number(label="vc_transform", value=0)
                             auto_f0 = gr.Checkbox(label="auto_f0", value=False)
                             tts_mode = gr.Checkbox(label="tts (use edge-tts as input)", value=False)