Spaces:
Build error
Build error
File size: 1,955 Bytes
c636952 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 |
import gradio as gr
import torch
from transformers import pipeline
from langdetect import detect
# Load the Coqui XTTS model
tts = pipeline("text-to-speech", model="coqui/XTTS-v2", device=0 if torch.cuda.is_available() else -1)
# Helper function to clone voice and generate speech
def clone_and_generate(audio, text_prompt, language):
if audio is None or text_prompt.strip() == "":
return "Please provide both audio input and text prompt.", None
# Check if language is supported
supported_languages = {"english": "en", "hindi": "hi"}
if language not in supported_languages:
return f"Language {language} not supported yet.", None
# Convert text to the target language (if needed)
if detect(text_prompt) != supported_languages[language]:
# For now, we assume text is already in the desired language
pass
# Generate speech
try:
result = tts(text=text_prompt, speaker=audio)
return "Speech generated successfully!", result["audio"]
except Exception as e:
return f"Error: {str(e)}", None
# Gradio Interface
with gr.Blocks() as demo:
gr.Markdown("## π€ Voice Cloning & Text-to-Speech with Language Translation")
with gr.Row():
with gr.Column():
audio_input = gr.Audio(source="microphone", type="filepath", label="ποΈ Record or Upload Voice")
text_input = gr.Textbox(label="π Enter Text to Generate Speech")
language_input = gr.Dropdown(choices=["english", "hindi"], value="english", label="π Select Language")
with gr.Column():
output_message = gr.Textbox(label="π’ Status")
output_audio = gr.Audio(label="π Generated Speech")
generate_button = gr.Button("π Generate Speech")
generate_button.click(clone_and_generate, inputs=[audio_input, text_input, language_input], outputs=[output_message, output_audio])
# Launch the app
demo.launch()
|