OpenAI-TTS-Text-to-Speech

Running

App Files Files Community

Wromo committed on Feb 20

Commit

1040619

verified ·

1 Parent(s): fa1355e

Update app.py new preview with chosen language

Browse files

This update adds a choice of the desired language to the TTS (text-to-speech) app. It can speak in any desired language because AI can! Day by day it exceeds expectations, converting text to speech much more realistically in all languages.
If your desired language is not in the code, you can add it to the language list!

Best!
LG

Files changed (1) hide show

app.py +26 -27

app.py CHANGED Viewed

@@ -3,48 +3,47 @@ import os
 import tempfile
 from openai import OpenAI
-def tts(text, model, voice, api_key):
     if api_key == '':
-        raise gr.Error('Please enter your OpenAI API Key')
     else:
         try:
             client = OpenAI(api_key=api_key)
             response = client.audio.speech.create(
-                model=model, # "tts-1","tts-1-hd"
-                voice=voice, # 'alloy', 'echo', 'fable', 'onyx', 'nova', 'shimmer'
                 input=text,
             )
         except Exception as error:
-            # Handle any exception that occurs
-            raise gr.Error("An error occurred while generating speech. Please check your API key and try again.")
             print(str(error))
-    # Create a temp file to save the audio
-    with tempfile.NamedTemporaryFile(suffix=".mp3", delete=False) as temp_file:
-        temp_file.write(response.content)
-    # Get the file path of the temp file
-    temp_file_path = temp_file.name
-    return temp_file_path
 with gr.Blocks() as demo:
-    gr.Markdown("# <center> OpenAI Text-To-Speech API with Gradio </center>")
-    #gr.HTML("You can also access the Streaming demo for OpenAI TTS by clicking this <a href='https://huggingface.co/spaces/ysharma/OpenAI_TTS_Streaming'>Gradio demo link</a>")
-    with gr.Row(variant='panel'):
-      api_key = gr.Textbox(type='password', label='OpenAI API Key', placeholder='Enter your API key to access the TTS demo')
-      model = gr.Dropdown(choices=['tts-1','tts-1-hd'], label='Model', value='tts-1')
-      voice = gr.Dropdown(choices=['alloy', 'echo', 'fable', 'onyx', 'nova', 'shimmer'], label='Voice Options', value='alloy')
-    text = gr.Textbox(label="Input text", placeholder="Enter your text and then click on the 'Text-To-Speech' button, or simply press the Enter key.")
     btn = gr.Button("Text-To-Speech")
     output_audio = gr.Audio(label="Speech Output")
-    text.submit(fn=tts, inputs=[text, model, voice, api_key], outputs=output_audio, api_name="tts_enter_key", concurrency_limit=None)
-    btn.click(fn=tts, inputs=[text, model, voice, api_key], outputs=output_audio, api_name="tts_button", concurrency_limit=None)
 demo.launch()

 import tempfile
 from openai import OpenAI
+def tts(text, model, voice, language, api_key):
+    """Generate speech for `text` with the OpenAI API and return an MP3 file path.
+
+    Args:
+        text: Text to synthesize.
+        model: TTS model name forwarded to the API.
+        voice: Voice name forwarded to the API.
+        language: Language code selected in the UI. Accepted so existing callers
+            keep working, but NOT forwarded: `client.audio.speech.create` has no
+            `language` parameter, so passing it made every call fail with a
+            TypeError that was then reported as an API-key problem.
+        api_key: OpenAI API key used to build the client.
+
+    Returns:
+        Path of a temporary ".mp3" file containing the generated audio.
+
+    Raises:
+        gr.Error: If `api_key` is empty, or if the request or file write fails.
+    """
     if api_key == '':
+        raise gr.Error('Please enter your API Key')
     else:
         try:
             client = OpenAI(api_key=api_key)
             response = client.audio.speech.create(
+                model=model,
+                voice=voice,
                 input=text,
             )
+            # delete=False keeps the file on disk after the `with` block closes,
+            # so the returned path can still be read by the caller.
+            with tempfile.NamedTemporaryFile(suffix=".mp3", delete=False) as temp_file:
+                temp_file.write(response.content)
+                temp_file_path = temp_file.name
+            return temp_file_path
         except Exception as error:
             print(str(error))
+            # Chain the original exception so the real cause stays in the traceback.
+            raise gr.Error("An error occurred while generating speech. Please check your API key and try again.") from error
 with gr.Blocks() as demo:
+    # Page heading, rendered as centered Markdown.
+    gr.Markdown("# <center> Text-To-Speech API Key </center>")
+    # Settings row: API key plus model, voice and language selectors.
+    with gr.Row(variant='panel'):
+        # type='password' so the key is not shown in clear text while typing.
+        api_key = gr.Textbox(type='password', label='OpenAI API Key', placeholder='Enter your API key to access the TTS')
+        model = gr.Dropdown(choices=['tts-1', 'tts-1-hd'], label='Model', value='tts-1-hd')
+        voice = gr.Dropdown(choices=['alloy', 'ash', 'coral', 'echo', 'fable', 'onyx', 'nova', 'sage', 'shimmer'], label='Voice Options', value='echo')
+        # The selected code is handed to tts() as its `language` argument.
+        # NOTE(review): 'br' is the ISO 639-1 code for Breton; if Brazilian
+        # Portuguese was intended the code would be 'pt' - confirm.
+        language = gr.Dropdown(
+            choices=['en', 'fr', 'es', 'de', 'it', 'ro', 'tr', 'br', 'ru'],
+            label='Choose a language',
+            value='en'
+        )
+    text = gr.Textbox(label="Input text", placeholder="Enter your text and then click the 'Text-To-Speech' button or press Enter.")
     btn = gr.Button("Text-To-Speech")
     output_audio = gr.Audio(label="Speech Output")
+    # Pressing Enter in the textbox and clicking the button both call tts() with
+    # the same inputs and write its result to the audio player; they differ only
+    # in api_name. concurrency_limit=None presumably lifts the per-event
+    # concurrency cap - confirm against the Gradio docs.
+    text.submit(fn=tts, inputs=[text, model, voice, language, api_key], outputs=output_audio, api_name="tts_enter_key", concurrency_limit=None)
+    btn.click(fn=tts, inputs=[text, model, voice, language, api_key], outputs=output_audio, api_name="tts_button", concurrency_limit=None)
 demo.launch()