TTS_PT

Sleeping

App Files Files Community

DHEIVER committed on Jan 12

Commit

bd8bee9

verified ·

1 Parent(s): 9c6803e

Update app.py

Browse files

Files changed (1) hide show

app.py +66 -30

app.py CHANGED Viewed

@@ -17,9 +17,6 @@ O vento começou a soprar com toda a força, mas quanto mais soprava, mais o via
 Então, o Sol começou a brilhar suavemente, e o viajante, sentindo o calor, logo tirou a capa.
 Assim, o Sol provou que o calor e a gentileza são mais eficazes do que a força bruta.
 Esta história nos ensina que, muitas vezes, a delicadeza e a paciência são mais poderosas do que a agressividade.
-Em nossa vida diária, podemos aplicar essa lição ao lidar com os outros, buscando sempre a compreensão e o diálogo.
-A natureza nos oferece muitos exemplos de como a suavidade pode superar a força, e essa é uma lição valiosa para todos nós.
-Que possamos sempre lembrar dessa história e agir com sabedoria em nossas interações com os outros.
 """
 # Vozes disponíveis para português
@@ -30,8 +27,8 @@ TTS_VOICES = [
 # Exemplo de uso
 my_examples = [
-    [max_tokens_text, "Ed"],  # Texto com máximo de tokens e voz masculina
-    [max_tokens_text, "Linda"]  # Texto com máximo de tokens e voz feminina
 ]
 # Artigo com informações adicionais
@@ -39,13 +36,12 @@ my_article = """
 <h3>Guia do Usuário</h3>
 <p>1. Insira o texto em português no campo de entrada (até 500 tokens).</p>
 <p>2. Selecione a voz desejada (masculina ou feminina).</p>
-<p>3. Clique em "Submit" para gerar o áudio.</p>
-<p>4. Reproduza o áudio gerado ou faça o download.</p>
 """
 # Função para sintetizar a fala
 def tts(text: str, speaker_idx: str):
-    # Baixar os arquivos do modelo
     best_model_path = hf_hub_download(repo_id=REPO_ID, filename="best_model.pth")
     config_path = hf_hub_download(repo_id=REPO_ID, filename="config.json")
     speakers_path = hf_hub_download(repo_id=REPO_ID, filename="speakers.pth")
@@ -53,7 +49,6 @@ def tts(text: str, speaker_idx: str):
     speaker_encoder_model_path = hf_hub_download(repo_id=REPO_ID, filename="model_se.pth")
     speaker_encoder_config_path = hf_hub_download(repo_id=REPO_ID, filename="config_se.json")
-    # Inicializar o sintetizador
     synthesizer = Synthesizer(
         best_model_path,
         config_path,
@@ -66,33 +61,74 @@ def tts(text: str, speaker_idx: str):
         False
     )
-    # Gerar o áudio
-    wavs = synthesizer.tts(text, speaker_idx, "Português")  # Idioma fixo: Português
-    # Salvar o áudio em um arquivo temporário
     with tempfile.NamedTemporaryFile(suffix=".wav", delete=False) as fp:
         synthesizer.save_wav(wavs, fp)
     return fp.name
-# Criar a interface Gradio com layout moderno
-with gr.Blocks(title=my_title, css=".gradio-container {max-width: 800px; margin: auto;}") as demo:
-    gr.Markdown(f"# {my_title}")
     gr.Markdown(my_description)
     with gr.Row():
-        with gr.Column():
-            text_input = gr.Textbox(lines=10, label="Texto em Português", placeholder="Insira o texto aqui... (até 500 tokens)")
-            voice_selector = gr.Radio(label="Voz", choices=TTS_VOICES, value="Ed")
             submit_button = gr.Button("Gerar Áudio", variant="primary")
-        with gr.Column():
-            audio_output = gr.Audio(type="filepath", label="Áudio Gerado")
             gr.Markdown(my_article)
-    # Exemplos
-    gr.Examples(examples=my_examples, inputs=[text_input, voice_selector], outputs=audio_output, fn=tts, cache_examples=True)
-    # Ação do botão
-    submit_button.click(fn=tts, inputs=[text_input, voice_selector], outputs=audio_output)
-# Iniciar a interface
-demo.launch()

 Então, o Sol começou a brilhar suavemente, e o viajante, sentindo o calor, logo tirou a capa.
 Assim, o Sol provou que o calor e a gentileza são mais eficazes do que a força bruta.
 Esta história nos ensina que, muitas vezes, a delicadeza e a paciência são mais poderosas do que a agressividade.
 """
 # Vozes disponíveis para português
 # Exemplo de uso
 my_examples = [
+    [max_tokens_text, "Ed"],
+    [max_tokens_text, "Linda"]
 ]
 # Artigo com informações adicionais
 <h3>Guia do Usuário</h3>
 <p>1. Insira o texto em português no campo de entrada (até 500 tokens).</p>
 <p>2. Selecione a voz desejada (masculina ou feminina).</p>
+<p>3. Clique em "Gerar Áudio" para criar o áudio correspondente.</p>
+<p>4. Ouça o áudio gerado ou faça o download diretamente do player.</p>
 """
 # Função para sintetizar a fala
 def tts(text: str, speaker_idx: str):
     best_model_path = hf_hub_download(repo_id=REPO_ID, filename="best_model.pth")
     config_path = hf_hub_download(repo_id=REPO_ID, filename="config.json")
     speakers_path = hf_hub_download(repo_id=REPO_ID, filename="speakers.pth")
     speaker_encoder_model_path = hf_hub_download(repo_id=REPO_ID, filename="model_se.pth")
     speaker_encoder_config_path = hf_hub_download(repo_id=REPO_ID, filename="config_se.json")
     synthesizer = Synthesizer(
         best_model_path,
         config_path,
         False
     )
+    wavs = synthesizer.tts(text, speaker_idx, "Português")
     with tempfile.NamedTemporaryFile(suffix=".wav", delete=False) as fp:
         synthesizer.save_wav(wavs, fp)
     return fp.name
+# Criar a interface Gradio aprimorada
+with gr.Blocks(title=my_title, css="""
+    .gradio-container {
+        max-width: 800px;
+        margin: auto;
+        font-family: 'Arial', sans-serif;
+    }
+    .header {
+        text-align: center;
+        margin-bottom: 20px;
+    }
+    .footer {
+        font-size: 0.85rem;
+        color: gray;
+        text-align: center;
+        margin-top: 30px;
+    }
+""") as demo:
+    # Cabeçalho
+    with gr.Row(variant="compact"):
+        gr.Markdown(f"<h1 class='header'>{my_title}</h1>")
     gr.Markdown(my_description)
+    # Entrada do usuário
     with gr.Row():
+        with gr.Column(scale=1):
+            text_input = gr.Textbox(
+                lines=10,
+                label="Texto em Português",
+                placeholder="Insira o texto aqui... (até 500 tokens)",
+                max_length=500
+            )
+            token_counter = gr.Label(value="Tokens usados: 0 / 500", label="Progresso")
+            voice_selector = gr.Radio(
+                label="Voz",
+                choices=TTS_VOICES,
+                value="Ed"
+            )
             submit_button = gr.Button("Gerar Áudio", variant="primary")
+        with gr.Column(scale=1):
+            audio_output = gr.Audio(type="filepath", label="Áudio Gerado", interactive=False)
+            download_button = gr.File(label="Download do Áudio")
             gr.Markdown(my_article)
+    # Exemplo de uso
+    gr.Examples(
+        examples=my_examples,
+        inputs=[text_input, voice_selector],
+        outputs=[audio_output],
+        cache_examples=True
+    )
+    # Feedback e progresso
+    submit_button.click(
+        fn=tts,
+        inputs=[text_input, voice_selector],
+        outputs=[audio_output],
+        show_progress=True
+    )
+    # Rodapé
+    gr.Markdown("<p class='footer'>Desenvolvido com ❤️ usando Gradio e Coqui TTS</p>")
+# Iniciar
+demo.launch(share=True)