Text_to_Speech

Sleeping

App Files Community

Pranjal12345 committed on Oct 19, 2023

Commit

deb14ad

1 Parent(s): 97e4faf

Update app.py

Browse files

Files changed (1) hide show

app.py +3 -33

app.py CHANGED Viewed

@@ -15,7 +15,6 @@ VOICE_OPTIONS = [
     "random",  # special option for random voice
 ]
 def inference(
     text,
     script,
@@ -46,7 +45,6 @@ def inference(
     start_time = time.time()
-    # all_parts = []
     for j, text in enumerate(texts):
         for audio_frame in tts.tts_with_preset(
             text,
@@ -55,26 +53,11 @@ def inference(
             preset="ultra_fast",
             k=1
         ):
-            # print("Time taken: ", time.time() - start_time)
-            # all_parts.append(audio_frame)
             yield (24000, audio_frame.cpu().detach().numpy())
-    # wav = torch.cat(all_parts, dim=0).unsqueeze(0)
-    # print(wav.shape)
-    # torchaudio.save("output.wav", wav.cpu(), 24000)
-    # yield (None, gr.make_waveform(audio="output.wav",))
 def main():
-    title = "Tortoise TTS 🐢"
-    description = """
-    A text-to-speech system which powers lot of organizations in Speech synthesis domain.
-    <br/>
-    a model with strong multi-voice capabilities, highly realistic prosody and intonation.
-    <br/>
-    for faster inference, use the 'ultra_fast' preset and duplicate space if you don't want to wait in a queue.
-    <br/>
-    """
-    text = gr.Textbox(
-        lines=4,
         label="Text (Provide either text, or upload a newline separated text file below):",
     )
     script = gr.File(label="Upload a text file")
@@ -96,7 +79,6 @@ def main():
     )
     output_audio = gr.Audio(label="streaming audio:", streaming=True, autoplay=True)
-    # download_audio = gr.Audio(label="dowanload audio:")
     interface = gr.Interface(
         fn=inference,
         inputs=[
@@ -107,18 +89,6 @@ def main():
             split_by_newline,
         ],
         title=title,
-        description=description,
         outputs=[output_audio],
     )
-    interface.queue().launch()
-if __name__ == "__main__":
-    tts = TextToSpeech(kv_cache=True, use_deepspeed=True, half=True)
-    with open("Tortoise_TTS_Runs_Scripts.log", "a") as f:
-        f.write(
-            f"\n\n-------------------------Tortoise TTS Scripts Logs, {datetime.now()}-------------------------\n"
-        )
-    main()

     "random",  # special option for random voice
 ]
 def inference(
     text,
     script,
     start_time = time.time()
     for j, text in enumerate(texts):
         for audio_frame in tts.tts_with_preset(
             text,
             preset="ultra_fast",
             k=1
         ):
             yield (24000, audio_frame.cpu().detach().numpy())
 def main():
+    title = "Tortoise TTS "
         label="Text (Provide either text, or upload a newline separated text file below):",
     )
     script = gr.File(label="Upload a text file")
     )
     output_audio = gr.Audio(label="streaming audio:", streaming=True, autoplay=True)
     interface = gr.Interface(
         fn=inference,
         inputs=[
             split_by_newline,
         ],
         title=title,
         outputs=[output_audio],
     )
+    interface.queue().launch()