TTS_PT

Sleeping

App Files Community

DHEIVER committed on Jan 12

Commit

0e9d1bc

verified ·

1 Parent(s): bd8bee9

Update app.py

Browse files

Files changed (1) hide show

app.py +32 -63

app.py CHANGED Viewed

@@ -8,7 +8,10 @@ REPO_ID = "mbarnig/lb-de-fr-en-pt-coqui-vits-tts"
 # Configurações da interface
 my_title = "🇵🇹 Sintetizador de Fala em Português com Coqui TTS"
-my_description = "Um sintetizador de fala em português baseado no modelo YourTTS da Coqui.ai. Insira o texto e gere o áudio!"
 # Texto de exemplo com o máximo de tokens (500 tokens)
 max_tokens_text = """
@@ -25,23 +28,9 @@ TTS_VOICES = [
     "Linda"  # Voz feminina
 ]
-# Exemplo de uso
-my_examples = [
-    [max_tokens_text, "Ed"],
-    [max_tokens_text, "Linda"]
-]
-# Artigo com informações adicionais
-my_article = """
-<h3>Guia do Usuário</h3>
-<p>1. Insira o texto em português no campo de entrada (até 500 tokens).</p>
-<p>2. Selecione a voz desejada (masculina ou feminina).</p>
-<p>3. Clique em "Gerar Áudio" para criar o áudio correspondente.</p>
-<p>4. Ouça o áudio gerado ou faça o download diretamente do player.</p>
-"""
 # Função para sintetizar a fala
 def tts(text: str, speaker_idx: str):
     best_model_path = hf_hub_download(repo_id=REPO_ID, filename="best_model.pth")
     config_path = hf_hub_download(repo_id=REPO_ID, filename="config.json")
     speakers_path = hf_hub_download(repo_id=REPO_ID, filename="speakers.pth")
@@ -49,6 +38,7 @@ def tts(text: str, speaker_idx: str):
     speaker_encoder_model_path = hf_hub_download(repo_id=REPO_ID, filename="model_se.pth")
     speaker_encoder_config_path = hf_hub_download(repo_id=REPO_ID, filename="config_se.json")
     synthesizer = Synthesizer(
         best_model_path,
         config_path,
@@ -61,45 +51,26 @@ def tts(text: str, speaker_idx: str):
         False
     )
-    wavs = synthesizer.tts(text, speaker_idx, "Português")
     with tempfile.NamedTemporaryFile(suffix=".wav", delete=False) as fp:
         synthesizer.save_wav(wavs, fp)
     return fp.name
-# Criar a interface Gradio aprimorada
-with gr.Blocks(title=my_title, css="""
-    .gradio-container {
-        max-width: 800px;
-        margin: auto;
-        font-family: 'Arial', sans-serif;
-    }
-    .header {
-        text-align: center;
-        margin-bottom: 20px;
-    }
-    .footer {
-        font-size: 0.85rem;
-        color: gray;
-        text-align: center;
-        margin-top: 30px;
-    }
-""") as demo:
-    # Cabeçalho
-    with gr.Row(variant="compact"):
-        gr.Markdown(f"<h1 class='header'>{my_title}</h1>")
     gr.Markdown(my_description)
-    # Entrada do usuário
     with gr.Row():
         with gr.Column(scale=1):
             text_input = gr.Textbox(
                 lines=10,
                 label="Texto em Português",
-                placeholder="Insira o texto aqui... (até 500 tokens)",
-                max_length=500
             )
-            token_counter = gr.Label(value="Tokens usados: 0 / 500", label="Progresso")
             voice_selector = gr.Radio(
                 label="Voz",
                 choices=TTS_VOICES,
@@ -107,28 +78,26 @@ with gr.Blocks(title=my_title, css="""
             )
             submit_button = gr.Button("Gerar Áudio", variant="primary")
         with gr.Column(scale=1):
-            audio_output = gr.Audio(type="filepath", label="Áudio Gerado", interactive=False)
-            download_button = gr.File(label="Download do Áudio")
-            gr.Markdown(my_article)
-    # Exemplo de uso
-    gr.Examples(
-        examples=my_examples,
-        inputs=[text_input, voice_selector],
-        outputs=[audio_output],
-        cache_examples=True
-    )
-    # Feedback e progresso
     submit_button.click(
         fn=tts,
         inputs=[text_input, voice_selector],
-        outputs=[audio_output],
-        show_progress=True
     )
-    # Rodapé
-    gr.Markdown("<p class='footer'>Desenvolvido com ❤️ usando Gradio e Coqui TTS</p>")
-# Iniciar
-demo.launch(share=True)

 # Configurações da interface
 my_title = "🇵🇹 Sintetizador de Fala em Português com Coqui TTS"
+my_description = """
+Um sintetizador de fala em português baseado no modelo YourTTS da Coqui.ai.
+Insira o texto e gere o áudio com a voz desejada (masculina ou feminina)!
+"""
 # Texto de exemplo com o máximo de tokens (500 tokens)
 max_tokens_text = """
     "Linda"  # Voz feminina
 ]
 # Função para sintetizar a fala
 def tts(text: str, speaker_idx: str):
+    # Baixar os arquivos do modelo
     best_model_path = hf_hub_download(repo_id=REPO_ID, filename="best_model.pth")
     config_path = hf_hub_download(repo_id=REPO_ID, filename="config.json")
     speakers_path = hf_hub_download(repo_id=REPO_ID, filename="speakers.pth")
     speaker_encoder_model_path = hf_hub_download(repo_id=REPO_ID, filename="model_se.pth")
     speaker_encoder_config_path = hf_hub_download(repo_id=REPO_ID, filename="config_se.json")
+    # Inicializar o sintetizador
     synthesizer = Synthesizer(
         best_model_path,
         config_path,
         False
     )
+    # Gerar o áudio
+    wavs = synthesizer.tts(text, speaker_idx, "Português")  # Idioma fixo: Português
+    # Salvar o áudio em um arquivo temporário
     with tempfile.NamedTemporaryFile(suffix=".wav", delete=False) as fp:
         synthesizer.save_wav(wavs, fp)
     return fp.name
+# Criar a interface Gradio
+with gr.Blocks(title=my_title, css=".gradio-container {max-width: 900px; margin: auto;}") as demo:
+    gr.Markdown(f"<h1 style='text-align: center;'>{my_title}</h1>")
     gr.Markdown(my_description)
     with gr.Row():
         with gr.Column(scale=1):
             text_input = gr.Textbox(
                 lines=10,
                 label="Texto em Português",
+                placeholder="Insira o texto aqui... (máximo de 500 tokens)"
             )
             voice_selector = gr.Radio(
                 label="Voz",
                 choices=TTS_VOICES,
             )
             submit_button = gr.Button("Gerar Áudio", variant="primary")
         with gr.Column(scale=1):
+            audio_output = gr.Audio(type="filepath", label="Áudio Gerado")
+            download_button = gr.File(label="Baixar Áudio")
+    gr.Markdown("<hr>")
+    gr.Markdown("""
+        <h3>Guia do Usuário:</h3>
+        <ul>
+            <li>Insira o texto em português no campo de entrada (até 500 tokens).</li>
+            <li>Selecione a voz desejada (masculina ou feminina).</li>
+            <li>Clique em "Gerar Áudio" para gerar o arquivo de áudio.</li>
+            <li>Reproduza ou faça o download do áudio gerado.</li>
+        </ul>
+    """)
+    # Ação do botão
     submit_button.click(
         fn=tts,
         inputs=[text_input, voice_selector],
+        outputs=[audio_output, download_button]
     )
+# Iniciar a interface
+demo.launch()