Spaces:

M4xjunior
/

locseed

Running

App Files Community

M4xjunior committed on Dec 2, 2024

Commit

889c030

1 Parent(s): 598bddf

fix

Browse files

Files changed (2) hide show

app.py +22 -33
logs/sentence_analyzer_2024-12-02.log +10 -0

app.py CHANGED Viewed

@@ -66,36 +66,23 @@ last_ema = None
 tts_api = None
 training_process = None  # Adicione esta linha se necessário para o seu contexto
-# Estilos CSS com tema escuro
-custom_css = """
-#sentences-container {
-    border: 1px solid #555;
-    border-radius: 4px;
-    padding: 10px;
-    margin-bottom: 10px;
-}
-.sentence-box {
-    border: 1px solid #333;
-    padding: 5px;
-    margin-bottom: 5px;
-    border-radius: 4px;
-    background-color: #222;
-    color: #eee;
-}
-body {
-    background-color: #111;
-    color: #eee;
-}
-.gradio-container {
-    background-color: #111;
-}
-.dark {
-    background-color: #333;
-    color: #eee;
-}
-"""
-with gr.Blocks(css=custom_css, theme=gr.themes.Default(primary_hue="gray", secondary_hue="gray")) as app:
     with gr.Tabs():
         with gr.Tab("TTS Básico"):
             gr.Markdown("# TTS Básico com F5-TTS")
@@ -153,7 +140,7 @@ with gr.Blocks(css=custom_css, theme=gr.themes.Default(primary_hue="gray", secon
                 seed_input = gr.Number(label="Seed", value=-1, minimum=-1)  # Seed na seção avançada
             analyzer = SentenceAnalyzer()
-            #add
             @gpu_decorator
             def process_chunks(
                 ref_audio_input,
@@ -168,6 +155,7 @@ with gr.Blocks(css=custom_css, theme=gr.themes.Default(primary_hue="gray", secon
             ):
                 # Acessando a instância F5TTS_ema_model diretamente
                 f5tts_model = F5TTS_ema_model
                 # Dividir o texto em sentenças
                 sentences = analyzer.split_into_sentences(gen_text_input)
@@ -223,8 +211,8 @@ with gr.Blocks(css=custom_css, theme=gr.themes.Default(primary_hue="gray", secon
                     speed_slider,
                     nfe_slider,
                     chunk_size_slider,
-                    seed_input,
-                ],  # Removido F5TTS_ema_model da lista de inputs
                 outputs=[
                     audio_output,
                     ref_text_input,
@@ -232,6 +220,7 @@ with gr.Blocks(css=custom_css, theme=gr.themes.Default(primary_hue="gray", secon
                 ],
             )
 # Código para iniciar a aplicação Gradio
     @click.command()
     @click.option("--port", "-p", default=None, type=int, help="Port to run the app on")

 tts_api = None
 training_process = None  # Adicione esta linha se necessário para o seu contexto
+# Modification of the F5TTS class to save the generated audio to a temporary file
+class F5TTS(F5TTS):  # Inherits from the original F5TTS class; NOTE(review): the subclass reuses the base class's name, so it rebinds (shadows) F5TTS from here on
+    def infer(
+        self,
+        # ... your arguments (elided placeholder in this commit)
+    ):
+        # ... (your code to generate the audio - wav, sr, spect); NOTE(review): wav and sr are not assigned anywhere in the lines shown here - confirm they are produced by the elided code
+        # Save the audio to a temporary file
+        with tempfile.NamedTemporaryFile(delete=False, suffix=".wav") as f:
+            sf.write(f.name, wav, sr)
+            audio_file = f.name  # Keep the temporary file's path in audio_file; delete=False leaves the file on disk after the with-block closes it
+        # Return the temporary file's path together with self.device and the seed converted to a string
+        return audio_file, self.device, str(self.seed)
+with gr.Blocks() as app:  # Removido o CSS customizado
     with gr.Tabs():
         with gr.Tab("TTS Básico"):
             gr.Markdown("# TTS Básico com F5-TTS")
                 seed_input = gr.Number(label="Seed", value=-1, minimum=-1)  # Seed na seção avançada
             analyzer = SentenceAnalyzer()
             @gpu_decorator
             def process_chunks(
                 ref_audio_input,
             ):
                 # Acessando a instância F5TTS_ema_model diretamente
                 f5tts_model = F5TTS_ema_model
                 # Dividir o texto em sentenças
                 sentences = analyzer.split_into_sentences(gen_text_input)
                     speed_slider,
                     nfe_slider,
                     chunk_size_slider,
+                    seed_input,
+                ],
                 outputs=[
                     audio_output,
                     ref_text_input,
                 ],
             )
 # Código para iniciar a aplicação Gradio
     @click.command()
     @click.option("--port", "-p", default=None, type=int, help="Port to run the app on")

logs/sentence_analyzer_2024-12-02.log CHANGED Viewed

@@ -56,3 +56,13 @@
 2024-12-02 20:27:51,734 - SentenceAnalyzer - INFO - Split text into 2 sentences after cleanup
 2024-12-02 20:32:57,401 - SentenceAnalyzer - DEBUG - Logger set up successfully
 2024-12-02 20:32:57,401 - SentenceAnalyzer - INFO - SentenceAnalyzer initialized successfully

 2024-12-02 20:27:51,734 - SentenceAnalyzer - INFO - Split text into 2 sentences after cleanup
 2024-12-02 20:32:57,401 - SentenceAnalyzer - DEBUG - Logger set up successfully
 2024-12-02 20:32:57,401 - SentenceAnalyzer - INFO - SentenceAnalyzer initialized successfully
+2024-12-02 20:39:49,009 - SentenceAnalyzer - DEBUG - Logger set up successfully
+2024-12-02 20:39:49,010 - SentenceAnalyzer - INFO - SentenceAnalyzer initialized successfully
+2024-12-02 20:40:49,340 - SentenceAnalyzer - DEBUG - Starting sentence splitting
+2024-12-02 20:40:49,340 - SentenceAnalyzer - DEBUG - Normalized text using NFC
+2024-12-02 20:40:49,341 - SentenceAnalyzer - DEBUG - Removed page numbers and chapter titles
+2024-12-02 20:40:49,341 - SentenceAnalyzer - DEBUG - Replaced hyphenated line breaks
+2024-12-02 20:40:49,341 - SentenceAnalyzer - DEBUG - Replaced multiple newlines with a space
+2024-12-02 20:40:49,341 - SentenceAnalyzer - DEBUG - Normalized whitespace
+2024-12-02 20:40:49,364 - SentenceAnalyzer - DEBUG - Split text into 1 sentences using NLTK
+2024-12-02 20:40:49,364 - SentenceAnalyzer - INFO - Split text into 1 sentences after cleanup