mrfakename committed on
Commit
6a1a9b3
·
verified ·
1 Parent(s): 5f635fb

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +3 -1
app.py CHANGED
@@ -40,7 +40,7 @@ def generate_speech(inp_audio, inp_text, infer_timestep, p_w, t_w):
40
  return None
41
 
42
  try:
43
- print(f"Generating speech with: {inp_text[:50]}...")
44
 
45
  # Convert and prepare audio
46
  convert_to_wav(inp_audio)
@@ -65,6 +65,8 @@ def generate_speech(inp_audio, inp_text, infer_timestep, p_w, t_w):
65
  with gr.Blocks(title="MegaTTS3 Voice Cloning") as demo:
66
  gr.Markdown("# MegaTTS 3 Voice Cloning")
67
  gr.Markdown("MegaTTS 3 is a text-to-speech model trained by ByteDance with exceptional voice cloning capabilities. The original authors did not release the WavVAE encoder, so voice cloning was not publicly available; however, thanks to [@ACoderPassBy](https://modelscope.cn/models/ACoderPassBy/MegaTTS-SFT)'s WavVAE encoder, we can now clone voices with MegaTTS 3!")
 
 
68
  gr.Markdown("h/t to MysteryShack on Discord for the info about the unofficial WavVAE encoder!")
69
  gr.Markdown("Upload a reference audio clip and enter text to generate speech with the cloned voice.")
70
 
 
40
  return None
41
 
42
  try:
43
+ print(f"Generating speech with: {inp_text}...")
44
 
45
  # Convert and prepare audio
46
  convert_to_wav(inp_audio)
 
65
  with gr.Blocks(title="MegaTTS3 Voice Cloning") as demo:
66
  gr.Markdown("# MegaTTS 3 Voice Cloning")
67
  gr.Markdown("MegaTTS 3 is a text-to-speech model trained by ByteDance with exceptional voice cloning capabilities. The original authors did not release the WavVAE encoder, so voice cloning was not publicly available; however, thanks to [@ACoderPassBy](https://modelscope.cn/models/ACoderPassBy/MegaTTS-SFT)'s WavVAE encoder, we can now clone voices with MegaTTS 3!")
68
+ gr.Markdown("This is by no means the best voice cloning solution, but it works pretty well for some specific use-cases. Try out multiple and see which one works best for you.")
69
+ gr.Markdown("**Please use this Space responsibly and do not abuse it!**")
70
  gr.Markdown("h/t to MysteryShack on Discord for the info about the unofficial WavVAE encoder!")
71
  gr.Markdown("Upload a reference audio clip and enter text to generate speech with the cloned voice.")
72