Spaces:

AI-trainer1
/

text_to_speech_test1

Build error

Aseem Gupta committed on Jan 13

Commit

d8fe51c

1 Parent(s): 9581ca3

test5

Files changed (3) hide show

.gitignore ADDED Viewed

app.py CHANGED Viewed

@@ -4,38 +4,38 @@ import os
 os.environ["COQUI_TOS_AGREED"] = "1"
-# Load the XTTS-v2 model and set it to use CPU
-tts = TTS(model_name="tts_models/multilingual/multi-dataset/xtts_v2")
-tts.to("cpu")  # Set the model to run on CPU
-# Define the function for voice cloning
 def generate_voice(text, speaker_audio):
     output_path = "output.wav"
     tts.tts_to_file(
         text=text,
-        speaker_wav=speaker_audio.name,
         file_path=output_path,
         language="en"
     )
     return output_path
-# Gradio Interface
 with gr.Blocks() as demo:
     gr.Markdown("# 🗣️ Voice Cloning with Coqui XTTS-v2")
     with gr.Row():
         text_input = gr.Textbox(label="Enter Text", placeholder="Type the text you want to synthesize...")
-        speaker_audio_input = gr.Audio(label="Upload Speaker Audio (WAV)", type="file")
     output_audio = gr.Audio(label="Generated Voice", type="filepath")
     generate_button = gr.Button("Generate Voice")
     generate_button.click(
         fn=generate_voice,
         inputs=[text_input, speaker_audio_input],
         outputs=output_audio
     )
-# Launch the Gradio app
-demo.launch()

 # Set the Coqui terms-of-service flag in the environment before the model is
 # constructed (presumably so the licence prompt is not shown interactively).
 os.environ["COQUI_TOS_AGREED"] = "1"
 # Load the XTTS-v2 model once at import time so every request reuses the same
 # instance. `trust_remote_code` is a Hugging Face `from_pretrained` option,
 # not a parameter of Coqui's TTS constructor, so passing it is rejected as an
 # unexpected keyword argument before the model is ever loaded.
 tts = TTS(model_name="tts_models/multilingual/multi-dataset/xtts_v2")
 tts.to("cpu")  # run inference on CPU
+# Function to synthesize voice
 def generate_voice(text, speaker_audio):
     """Synthesize ``text`` in the voice of the reference recording.

     Args:
         text: The text to speak.
         speaker_audio: Path to the reference speaker audio file; falsy
             (e.g. ``None``) when no file was provided.

     Returns:
         The path of the WAV file that was written (``"output.wav"``).

     Raises:
         ValueError: If ``text`` is empty or only whitespace, or if no
             speaker audio was provided.
     """
     # Validate up front so a missing input produces a clear message instead
     # of an opaque failure from inside the model call.
     if not text or not text.strip():
         raise ValueError("Please enter some text to synthesize.")
     if not speaker_audio:
         raise ValueError("Please upload a speaker audio file.")

     output_path = "output.wav"
     tts.tts_to_file(
         text=text,
         speaker_wav=speaker_audio,
         file_path=output_path,
         language="en",
     )
     return output_path
+# Gradio interface
 # Build the UI: a heading, a row holding the text box and the reference-audio
 # upload, the generated-audio player, and a button that triggers synthesis.
 with gr.Blocks() as demo:
     gr.Markdown("# 🗣️ Voice Cloning with Coqui XTTS-v2")
     with gr.Row():
         text_input = gr.Textbox(label="Enter Text", placeholder="Type the text you want to synthesize...")
         # type="filepath" is expected to hand the callback a path string,
         # which generate_voice forwards unchanged as speaker_wav.
+        speaker_audio_input = gr.Audio(label="Upload Speaker Audio (WAV)", type="filepath")
     output_audio = gr.Audio(label="Generated Voice", type="filepath")
     generate_button = gr.Button("Generate Voice")
     # Wire the button: the two inputs map, in order, to generate_voice's
     # (text, speaker_audio) parameters; its return value feeds output_audio.
     generate_button.click(
         fn=generate_voice,
         inputs=[text_input, speaker_audio_input],
         outputs=output_audio
     )
+# Launch the app
+demo.launch()

requirements.txt CHANGED Viewed

@@ -1,5 +1,4 @@
 gradio
 torch
-transformers
-langdetect
-TTS

 gradio
 torch
+TTS
+soundfile