Spaces:

drengskapur
/

openai-text-to-speech

Running

App Files Files

jonathanagustin committed on Sep 21, 2024

Commit

3a80faa

verified ·

1 Parent(s): 775839f

Upload folder using huggingface_hub

Browse files

Files changed (1) hide show

app.py +55 -23

app.py CHANGED Viewed

@@ -16,19 +16,21 @@ def tts(
     """
     Convert input text to speech using OpenAI's Text-to-Speech API.
-    Parameters:
-        input_text (str): The text to be converted to speech.
-        model (str): The model to use for synthesis (e.g., 'tts-1', 'tts-1-hd').
-        voice (str): The voice profile to use (e.g., 'alloy', 'echo', 'fable', etc.).
-        api_key (str): OpenAI API key.
-        response_format (str): The audio format of the output file (default is 'mp3').
-        speed (float): The speed of the synthesized speech (0.25 to 4.0).
-    Returns:
-        str: File path to the generated audio file.
-    Raises:
-        gr.Error: If input parameters are invalid or API call fails.
     """
     if not api_key.strip():
         raise gr.Error(
@@ -100,8 +102,15 @@ def main():
     with gr.Blocks(title="OpenAI - Text to Speech") as demo:
         with gr.Row():
             with gr.Column(scale=1):
-                # Function to play the selected voice sample
-                def play_voice_sample(voice):
                     return gr.update(
                         value=VOICE_PREVIEW_FILES[voice],
                         label=f"Preview Voice: {voice.capitalize()}",
@@ -109,7 +118,7 @@ def main():
                 preview_audio = gr.Audio(
                     interactive=False,
-                    label="Echo",
                     value=VOICE_PREVIEW_FILES['echo'],
                     visible=True,
                     show_download_button=False,
@@ -162,15 +171,21 @@ def main():
                 )
             with gr.Column(scale=2):
-                # Initialize the input textbox with the desired label
                 input_textbox = gr.Textbox(
                     label="Input Text (0000 / 4096 chars)",
                     lines=10,
                     placeholder="Type your text here...",
                 )
-                # Function to update the label with the character count
-                def update_label(input_text):
                     char_count = len(input_text)
                     new_label = f"Input Text ({char_count:04d} / 4096 chars)"
                     return gr.update(label=new_label)
@@ -190,10 +205,27 @@ def main():
             with gr.Column(scale=1):
                 output_audio = gr.Audio(label="Output Audio")
-        # Define the event handler for the submit button with error handling
         def on_submit(
-            input_text, model, voice, api_key, response_format, speed
-        ):
             audio_file = tts(
                 input_text, model, voice, api_key, response_format, speed
             )
@@ -217,4 +249,4 @@ def main():
     demo.launch(show_error=True)
 if __name__ == "__main__":
-    main()

     """
     Convert input text to speech using OpenAI's Text-to-Speech API.
+    :param input_text: The text to be converted to speech.
+    :type input_text: str
+    :param model: The model to use for synthesis (e.g., 'tts-1', 'tts-1-hd').
+    :type model: str
+    :param voice: The voice profile to use (e.g., 'alloy', 'echo', 'fable', etc.).
+    :type voice: str
+    :param api_key: OpenAI API key.
+    :type api_key: str
+    :param response_format: The audio format of the output file, defaults to 'mp3'.
+    :type response_format: str, optional
+    :param speed: The speed of the synthesized speech (0.25 to 4.0), defaults to 1.0.
+    :type speed: float, optional
+    :return: File path to the generated audio file.
+    :rtype: str
+    :raises gr.Error: If input parameters are invalid or API call fails.
     """
     if not api_key.strip():
         raise gr.Error(
     with gr.Blocks(title="OpenAI - Text to Speech") as demo:
         with gr.Row():
             with gr.Column(scale=1):
+                def play_voice_sample(voice: str):
+                    """
+                    Play the preview audio sample for the selected voice.
+                    :param voice: The name of the voice to preview.
+                    :type voice: str
+                    :return: Gradio update payload that sets the preview audio's value and label.
+                    :rtype: dict
+                    """
                     return gr.update(
                         value=VOICE_PREVIEW_FILES[voice],
                         label=f"Preview Voice: {voice.capitalize()}",
                 preview_audio = gr.Audio(
                     interactive=False,
+                    label="Preview Voice: Echo",
                     value=VOICE_PREVIEW_FILES['echo'],
                     visible=True,
                     show_download_button=False,
                 )
             with gr.Column(scale=2):
                 input_textbox = gr.Textbox(
                     label="Input Text (0000 / 4096 chars)",
                     lines=10,
                     placeholder="Type your text here...",
                 )
+                def update_label(input_text: str):
+                    """
+                    Update the label of the input textbox with the current character count.
+                    :param input_text: The current text in the input textbox.
+                    :type input_text: str
+                    :return: Gradio update payload carrying the new textbox label.
+                    :rtype: dict
+                    """
                     char_count = len(input_text)
                     new_label = f"Input Text ({char_count:04d} / 4096 chars)"
                     return gr.update(label=new_label)
             with gr.Column(scale=1):
                 output_audio = gr.Audio(label="Output Audio")
         def on_submit(
+            input_text: str, model: str, voice: str, api_key: str, response_format: str, speed: float
+        ) -> str:
+            """
+            Event handler for the submit button; converts text to speech using the tts function.
+            :param input_text: The text to convert to speech.
+            :type input_text: str
+            :param model: The TTS model to use (e.g., 'tts-1', 'tts-1-hd').
+            :type model: str
+            :param voice: The voice profile to use (e.g., 'alloy', 'echo', etc.).
+            :type voice: str
+            :param api_key: OpenAI API key.
+            :type api_key: str
+            :param response_format: The audio format of the output file.
+            :type response_format: str
+            :param speed: The speed of the synthesized speech.
+            :type speed: float
+            :return: File path to the generated audio file.
+            :rtype: str
+            """
             audio_file = tts(
                 input_text, model, voice, api_key, response_format, speed
             )
     demo.launch(show_error=True)
 if __name__ == "__main__":
+    main()