Text_to_Speech

Sleeping

App Files Community

Pranjal12345 committed on Oct 19, 2023

Commit

bd104fa

1 Parent(s): e9c4729

Update app.py

Browse files

Files changed (1) hide show

app.py +17 -25

app.py CHANGED Viewed

@@ -5,8 +5,7 @@ import torchaudio
 import time
 from datetime import datetime
 from tortoise.api import TextToSpeech
-from tortoise.utils.text import split_and_recombine_text
-from tortoise.utils.audio import load_audio, load_voice, load_voices
 VOICE_OPTIONS = [
     "angie",
@@ -17,22 +16,12 @@ VOICE_OPTIONS = [
 def inference(
     text,
-    script,
     voice,
     voice_b,
-    seed,
-    split_by_newline,
 ):
-    if text is None or text.strip() == "":
-        with open(script.name) as f:
-            text = f.read()
-        if text.strip() == "":
-            raise gr.Error("Please provide either text or script file with content.")
-    if split_by_newline == "Yes":
-        texts = list(filter(lambda x: x.strip() != "", text.split("\n")))
-    else:
-        texts = split_and_recombine_text(text)
     voices = [voice]
     if voice_b != "disabled":
@@ -58,9 +47,10 @@ def inference(
 def main():
     title = "Tortoise TTS "
-    label="Text (Provide either text, or upload a newline separated text file below):",
     )
-    script = gr.File(label="Upload a text file")
     voice = gr.Dropdown(
         VOICE_OPTIONS, value="jane_eyre", label="Select voice:", type="value"
@@ -71,24 +61,26 @@ def main():
         label="(Optional) Select second voice:",
         type="value",
     )
-    split_by_newline = gr.Radio(
-        ["Yes", "No"],
-        label="Split by newline (If [No], it will automatically try to find relevant splits):",
-        type="value",
-        value="No",
-    )
     output_audio = gr.Audio(label="streaming audio:", streaming=True, autoplay=True)
     interface = gr.Interface(
         fn=inference,
         inputs=[
             text,
-            script,
             voice,
             voice_b,
-            split_by_newline,
         ],
         title=title,
         outputs=[output_audio],
     )
-    interface.queue().launch()

 import time
 from datetime import datetime
 from tortoise.api import TextToSpeech
+from tortoise.utils.audio import load_voice, load_voices
 VOICE_OPTIONS = [
     "angie",
 def inference(
     text,
     voice,
     voice_b,
 ):
+    # Treat the whole input as a single chunk: no newline or automatic splitting is applied
+    texts = [text]
     voices = [voice]
     if voice_b != "disabled":
 def main():
     title = "Tortoise TTS "
+    text = gr.Textbox(
+        lines=4,
+        label="Text:",
     )
     voice = gr.Dropdown(
         VOICE_OPTIONS, value="jane_eyre", label="Select voice:", type="value"
         label="(Optional) Select second voice:",
         type="value",
     )
     output_audio = gr.Audio(label="streaming audio:", streaming=True, autoplay=True)
     interface = gr.Interface(
         fn=inference,
         inputs=[
             text,
             voice,
             voice_b,
         ],
         title=title,
         outputs=[output_audio],
     )
+    interface.queue().launch()
+if __name__ == "__main__":
+    tts = TextToSpeech(kv_cache=True, use_deepspeed=True, half=True)
+    with open("Tortoise_TTS_Runs_Scripts.log", "a") as f:
+        f.write(
+            f"\n\n-------------------------Tortoise TTS Scripts Logs, {datetime.now()}-------------------------\n"
+        )
+    main()