Spaces:
Sleeping
Sleeping
le quy don
committed on
Update app.py
Browse files
app.py
CHANGED
@@ -199,13 +199,6 @@ def preprocess_audio_robust(audio_path, target_sr=22050, max_duration=30):
|
|
199 |
raise ValueError(f"Failed to process audio: {str(e)}")
|
200 |
|
201 |
with gr.Blocks(title="MegaTTS3 Voice Cloning") as demo:
|
202 |
-
gr.Markdown("# MegaTTS 3 Voice Cloning")
|
203 |
-
gr.Markdown("MegaTTS 3 is a text-to-speech model trained by ByteDance with exceptional voice cloning capabilities. The original authors did not release the WavVAE encoder, so voice cloning was not publicly available; however, thanks to [@ACoderPassBy](https://modelscope.cn/models/ACoderPassBy/MegaTTS-SFT)'s WavVAE encoder, we can now clone voices with MegaTTS 3!")
|
204 |
-
gr.Markdown("This is by no means the best voice cloning solution, but it works pretty well for some specific use-cases. Try out multiple and see which one works best for you.")
|
205 |
-
gr.Markdown("**Please use this Space responsibly and do not abuse it!**")
|
206 |
-
gr.Markdown("h/t to MysteryShack on Discord for the info about the unofficial WavVAE encoder!")
|
207 |
-
gr.Markdown("Upload a reference audio clip and enter text to generate speech with the cloned voice.")
|
208 |
-
|
209 |
with gr.Row():
|
210 |
with gr.Column():
|
211 |
reference_audio = gr.Audio(
|
|
|
199 |
raise ValueError(f"Failed to process audio: {str(e)}")
|
200 |
|
201 |
with gr.Blocks(title="MegaTTS3 Voice Cloning") as demo:
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
202 |
with gr.Row():
|
203 |
with gr.Column():
|
204 |
reference_audio = gr.Audio(
|