Podcastking2

Running

File size: 1,946 Bytes

fd43dfa
039f896
fd43dfa
 
 
039f896
fd43dfa
039f896
fd43dfa
 
 
039f896
fd43dfa
 
 
280807d
fd43dfa
 
 
 
 
 
 
 
 
 
 
996224c
fd43dfa

import gradio as gr
import os
import asyncio
from conver import ConversationConfig, URLToAudioConverter
from dotenv import load_dotenv

load_dotenv()

async def synthesize(article_url, text_input, language="en"):
    """Generate a two-voice podcast from pasted text or from an article URL.

    Direct text takes precedence over the URL when both are supplied.
    Leading/trailing whitespace is stripped from both inputs, and a field
    that contains only whitespace is treated as empty.

    Args:
        article_url: URL of the article to convert; may be empty or None.
        text_input: Raw text to convert; may be empty or None.
        language: Key into the voice table ("en" or "es"). Any other value
            falls back to the English voice pair.

    Returns:
        A ``(conversation, output_file)`` tuple built from the converter's
        result on success, or ``("Error: ...", None)`` when no usable input
        was given or the conversion raised.
    """
    # Normalise before validating: a stray space or newline in the text box
    # must neither pass the "something was entered" check nor shadow a
    # valid URL in the branch below.
    article_url = (article_url or "").strip()
    text_input = (text_input or "").strip()

    if not article_url and not text_input:
        return "Error: Ingresa una URL o texto", None

    try:
        config = ConversationConfig()
        converter = URLToAudioConverter(
            config,
            llm_api_key=os.environ.get("TOGETHER_API_KEY"),
        )

        # Voice pair (first speaker, second speaker) for each language.
        voices = {
            "en": ("en-US-AvaMultilingualNeural", "en-US-AndrewMultilingualNeural"),
            "es": ("es-ES-AlvaroNeural", "es-ES-ElviraNeural"),
        }
        voice1, voice2 = voices.get(language, voices["en"])

        if text_input:
            output_file, conversation = await converter.text_to_audio(
                text_input, voice1, voice2
            )
        else:
            output_file, conversation = await converter.url_to_audio(
                article_url, voice1, voice2
            )

        return conversation, output_file
    except Exception as e:
        # UI boundary: report the failure as text in the first output
        # instead of letting the exception propagate to the caller.
        return f"Error: {e}", None

def synthesize_sync(article_url, text_input, language="en"):
    """Blocking wrapper that runs the ``synthesize`` coroutine to completion.

    Uses ``asyncio.run``, which creates a fresh event loop for the call and
    therefore must not be invoked from a thread that already has a running
    event loop.

    Args:
        article_url: URL of the article to convert; may be empty.
        text_input: Raw text to convert; may be empty.
        language: Language key forwarded to ``synthesize``. Defaults to
            "en", matching the default of ``synthesize`` itself.

    Returns:
        Whatever ``synthesize`` returns for the same arguments.
    """
    return asyncio.run(synthesize(article_url, text_input, language))

# Gradio UI definition. Components are created inside nested context
# managers, so the order and nesting of the statements below define the
# page layout; keep them in this order.
with gr.Blocks(theme='gstaff/sketch') as demo:
    gr.Markdown("# 🎙 Podcast Converter (Human Voices)")
    # Input area: optional URL, optional raw text, language choice and the
    # button that starts the conversion.
    with gr.Group():
        text_url = gr.Textbox(label="URL (opcional)", placeholder="https://...")
        text_input = gr.Textbox(label="O texto directo", lines=5)
        language = gr.Dropdown(["en", "es"], label="Idioma", value="en")
        btn = gr.Button("Generar Podcast", variant="primary")
    
    # Output area: both components are read-only (interactive=False).
    with gr.Row():
        conv_display = gr.Textbox(label="Conversación", interactive=False, lines=10)
        aud = gr.Audio(label="Audio Generado", interactive=False)
    
    # On click, call synthesize_sync with (URL, text, language); the two
    # values it returns are written to conv_display and aud, in that order.
    # On failure the first value is an "Error: ..." string and the second
    # is None.
    btn.click(
        synthesize_sync,
        inputs=[text_url, text_input, language],
        outputs=[conv_display, aud]
    )

# Runs whenever this module is executed or imported: there is no
# `if __name__ == "__main__"` guard around the launch call.
demo.launch()