Spaces:

drengskapur
/

openai-text-to-speech

Running

App Files Files

jonathanagustin committed on Sep 21, 2024

Commit

9813b68

verified ·

1 Parent(s): bc73de2

Upload folder using huggingface_hub

Browse files

Files changed (1) hide show

app.py +31 -21

app.py CHANGED Viewed

@@ -3,6 +3,7 @@ import tempfile
 import openai
 import requests
 def tts(input_text: str, model: str, voice: str, api_key: str) -> str:
     """
     Convert input text to speech using OpenAI's Text-to-Speech API.
@@ -20,7 +21,9 @@ def tts(input_text: str, model: str, voice: str, api_key: str) -> str:
         gr.Error: If input parameters are invalid or API call fails.
     """
     if not api_key.strip():
-        raise gr.Error("API key is required. Get an API key at: https://platform.openai.com/account/api-keys")
     if not input_text.strip():
         raise gr.Error("Input text cannot be empty.")
@@ -28,11 +31,7 @@ def tts(input_text: str, model: str, voice: str, api_key: str) -> str:
     openai.api_key = api_key
     try:
-        response = openai.Audio.create(
-            text=input_text,
-            voice=voice,
-            model=model
-        )
     except openai.OpenAIError as e:
         # Catch-all for OpenAI exceptions
         raise gr.Error(f"An OpenAI error occurred: {e}")
@@ -40,8 +39,10 @@ def tts(input_text: str, model: str, voice: str, api_key: str) -> str:
         # Catch any other exceptions
         raise gr.Error(f"An unexpected error occurred: {e}")
-    if not hasattr(response, 'audio'):
-        raise gr.Error("Invalid response from OpenAI API. The response does not contain audio content.")
     with tempfile.NamedTemporaryFile(suffix=".mp3", delete=False) as temp_file:
         temp_file.write(response.audio)
@@ -49,6 +50,7 @@ def tts(input_text: str, model: str, voice: str, api_key: str) -> str:
     return temp_file_path
 def main():
     """
     Main function to create and launch the Gradio interface.
@@ -58,7 +60,8 @@ def main():
     # Predefine voice previews URLs
     VOICE_PREVIEWS = {
-        voice: f"https://cdn.openai.com/API/docs/audio/{voice}.wav" for voice in VOICE_OPTIONS
     }
     with gr.Blocks() as demo:
@@ -80,27 +83,33 @@ def main():
                 # Add voice previews
                 gr.Markdown("### Voice Previews")
                 for voice in VOICE_OPTIONS:
-                    gr.Markdown(f"**{voice.capitalize()}**")
                     audio_url = VOICE_PREVIEWS[voice]
                     # Fetch the audio data
                     try:
                         response = requests.get(audio_url)
                         response.raise_for_status()
                         audio_data = response.content
-                        gr.Audio(value=audio_data, label=f"{voice.capitalize()}", autoplay=False)
                     except requests.exceptions.RequestException as e:
-                        gr.Markdown(f"Could not load preview for {voice.capitalize()}: {e}")
             with gr.Column(scale=2):
                 input_textbox = gr.Textbox(
-                    label="Input Text",
-                    lines=10,
-                    placeholder="Type your text here..."
-                )
-                submit_button = gr.Button(
-                    "Convert Text to Speech",
-                    variant="primary"
                 )
             with gr.Column(scale=1):
                 output_audio = gr.Audio(label="Output Audio")
@@ -113,11 +122,12 @@ def main():
         submit_button.click(
             fn=on_submit,
             inputs=[input_textbox, model_dropdown, voice_dropdown, api_key_input],
-            outputs=output_audio
         )
     # Launch the Gradio app with error display enabled
     demo.launch(show_error=True)
 if __name__ == "__main__":
-    main()

 import openai
 import requests
 def tts(input_text: str, model: str, voice: str, api_key: str) -> str:
     """
     Convert input text to speech using OpenAI's Text-to-Speech API.
         gr.Error: If input parameters are invalid or API call fails.
     """
     if not api_key.strip():
+        raise gr.Error(
+            "API key is required. Get an API key at: https://platform.openai.com/account/api-keys"
+        )
     if not input_text.strip():
         raise gr.Error("Input text cannot be empty.")
     openai.api_key = api_key
     try:
+        response = openai.Audio.create(text=input_text, voice=voice, model=model)
     except openai.OpenAIError as e:
         # Catch-all for OpenAI exceptions
         raise gr.Error(f"An OpenAI error occurred: {e}")
         # Catch any other exceptions
         raise gr.Error(f"An unexpected error occurred: {e}")
+    if not hasattr(response, "audio"):
+        raise gr.Error(
+            "Invalid response from OpenAI API. The response does not contain audio content."
+        )
     with tempfile.NamedTemporaryFile(suffix=".mp3", delete=False) as temp_file:
         temp_file.write(response.audio)
     return temp_file_path
 def main():
     """
     Main function to create and launch the Gradio interface.
     # Predefine voice previews URLs
     VOICE_PREVIEWS = {
+        voice: f"https://cdn.openai.com/API/docs/audio/{voice}.wav"
+        for voice in VOICE_OPTIONS
     }
     with gr.Blocks() as demo:
                 # Add voice previews
                 gr.Markdown("### Voice Previews")
                 for voice in VOICE_OPTIONS:
                     audio_url = VOICE_PREVIEWS[voice]
                     # Fetch the audio data
                     try:
                         response = requests.get(audio_url)
                         response.raise_for_status()
                         audio_data = response.content
+                        gr.Audio(
+                            value=audio_data,
+                            waveform_options=gr.WaveformOptions(
+                                waveform_color="#01C6FF",
+                                waveform_progress_color="#0066B4",
+                                skip_length=2,
+                                show_controls=False,
+                            ),
+                            label=f"{voice.capitalize()}",
+                            autoplay=False,
+                        )
                     except requests.exceptions.RequestException as e:
+                        gr.Markdown(
+                            f"Could not load preview for {voice.capitalize()}: {e}"
+                        )
             with gr.Column(scale=2):
                 input_textbox = gr.Textbox(
+                    label="Input Text", lines=10, placeholder="Type your text here..."
                 )
+                submit_button = gr.Button("Convert Text to Speech", variant="primary")
             with gr.Column(scale=1):
                 output_audio = gr.Audio(label="Output Audio")
         submit_button.click(
             fn=on_submit,
             inputs=[input_textbox, model_dropdown, voice_dropdown, api_key_input],
+            outputs=output_audio,
         )
     # Launch the Gradio app with error display enabled
     demo.launch(show_error=True)
 if __name__ == "__main__":
+    main()