Spaces:

capradeepgujaran
/

VoiceOversV3

Sleeping

App Files Files Community

capradeepgujaran committed on Oct 8, 2024

Commit

97482f2

verified ·

1 Parent(s): 4b389b6

Update app.py

Browse files

Files changed (1) hide show

app.py +20 -53

app.py CHANGED Viewed

@@ -1,45 +1,25 @@
 import gradio as gr
 import tempfile
-import os
-from openai import OpenAI
 from gtts import gTTS
 from gtts.lang import tts_langs
-# Initialize OpenAI client
-client = OpenAI(api_key=os.environ.get("OPENAI_API_KEY"))
 # Get available languages for Google TTS
 google_langs = tts_langs()
-# Define voice options for some common languages
 google_voice_options = {
-    "en": ["com.au", "ca", "co.uk", "com", "co.in", "ie", "co.za"],
-    "es": ["com", "es", "com.mx"],
-    "fr": ["fr", "ca"],
-    "de": ["de", "at"],
-    "it": ["it", "com"],
-    "ja": ["jp"],
-    "ko": ["com"],
-    "pt": ["com.br", "pt"],
-    "zh": ["cn", "tw"]
 }
-def openai_tts(text, voice, model):
-    try:
-        response = client.audio.speech.create(
-            model=model,
-            voice=voice,
-            input=text
-        )
-        with tempfile.NamedTemporaryFile(delete=False, suffix=".mp3") as temp_audio:
-            temp_audio.write(response.content)
-            temp_audio_path = temp_audio.name
-        return temp_audio_path, f"Speech generated with OpenAI TTS using {voice} voice and {model} model"
-    except Exception as e:
-        return None, f"Error in OpenAI TTS speech generation: {str(e)}"
 def google_tts(text, lang, tld):
     try:
         tts = gTTS(text=text, lang=lang, tld=tld, slow=False)
@@ -54,43 +34,30 @@ def google_tts(text, lang, tld):
 # Gradio interface
 with gr.Blocks() as iface:
-    gr.Markdown("# OpenAI TTS and Enhanced Google TTS Tool")
     text_input = gr.Textbox(label="Enter text for speech generation")
-    tts_method = gr.Radio(["OpenAI TTS", "Google TTS"], label="TTS Method", value="OpenAI TTS")
-    with gr.Group() as openai_options:
-        openai_voice_input = gr.Dropdown(["alloy", "echo", "fable", "onyx", "nova", "shimmer"], label="Select Voice", value="nova")
-        openai_model_input = gr.Dropdown(["tts-1", "tts-1-hd"], label="Select Model", value="tts-1")
     with gr.Group() as google_options:
         google_lang_input = gr.Dropdown(list(google_langs.keys()), label="Select Language", value="en")
-        google_voice_input = gr.Dropdown(google_voice_options["en"], label="Select Voice Variant", value="com")
     speech_button = gr.Button("Generate Speech")
     speech_output = gr.Audio(label="Generated Speech")
     speech_message = gr.Textbox(label="Message")
-    def generate_speech(text, method, openai_voice, openai_model, google_lang, google_voice):
-        if method == "OpenAI TTS":
-            return openai_tts(text, openai_voice, openai_model)
-        else:
-            return google_tts(text, google_lang, google_voice)
-    def update_visible_options(method):
-        if method == "OpenAI TTS":
-            return gr.Group(visible=True), gr.Group(visible=False)
-        else:
-            return gr.Group(visible=False), gr.Group(visible=True)
     def update_google_voice_options(lang):
-        return gr.Dropdown(choices=google_voice_options.get(lang, ["com"]), value="com")
     speech_button.click(generate_speech,
-                        inputs=[text_input, tts_method, openai_voice_input, openai_model_input, google_lang_input, google_voice_input],
                         outputs=[speech_output, speech_message])
-    tts_method.change(update_visible_options, inputs=[tts_method], outputs=[openai_options, google_options])
     google_lang_input.change(update_google_voice_options, inputs=[google_lang_input], outputs=[google_voice_input])
-iface.launch()

 import gradio as gr
 import tempfile
 from gtts import gTTS
 from gtts.lang import tts_langs
 # Get available languages for Google TTS
 google_langs = tts_langs()
+# Voice variants per language. Each entry is (display name, tld): the display
+# name is what the dropdown shows, the tld is the Google Translate domain that
+# is handed to gTTS to pick a localized accent.
 google_voice_options = {
+    "en": [("Australia", "com.au"), ("Canada", "ca"), ("United Kingdom", "co.uk"),
+           ("United States", "com"), ("India", "co.in"), ("Ireland", "ie"), ("South Africa", "co.za")],
+    # gTTS documents tld "es" as the Spain accent and "com" as the United
+    # States accent, so each label has to follow its domain.
+    "es": [("United States", "com"), ("Spain", "es"), ("Mexico", "com.mx")],
+    "fr": [("France", "fr"), ("Canada", "ca")],
+    "de": [("Germany", "de"), ("Austria", "at")],
+    "it": [("Italy", "it"), ("United States", "com")],
+    "ja": [("Japan", "jp")],
+    "ko": [("Korea", "com")],
+    "pt": [("Brazil", "com.br"), ("Portugal", "pt")],
+    # NOTE(review): gTTS lists Mandarin under "zh-CN" / "zh-TW" - confirm that
+    # "zh" is a code the language dropdown can actually produce.
+    "zh": [("China", "cn"), ("Taiwan", "tw")]
 }
 def google_tts(text, lang, tld):
     try:
         tts = gTTS(text=text, lang=lang, tld=tld, slow=False)
 # Gradio interface
 with gr.Blocks() as iface:
+    gr.Markdown("# Google TTS Tool")
     text_input = gr.Textbox(label="Enter text for speech generation")
     with gr.Group() as google_options:
+        # Every language code reported by tts_langs() is selectable; English is the default.
         google_lang_input = gr.Dropdown(list(google_langs.keys()), label="Select Language", value="en")
+        # Only the descriptive names are shown here; the matching tld is looked up when speech is generated.
+        google_voice_input = gr.Dropdown([x[0] for x in google_voice_options["en"]], label="Select Voice Variant", value="United States")
     speech_button = gr.Button("Generate Speech")
     speech_output = gr.Audio(label="Generated Speech")
     speech_message = gr.Textbox(label="Message")
+    def generate_speech(text, google_lang, google_voice_desc):
+        """Translate the selected voice description into a tld and synthesize speech.
+
+        Args:
+            text: Text to speak.
+            google_lang: Language code chosen in the language dropdown.
+            google_voice_desc: Descriptive variant name chosen in the voice dropdown.
+
+        Returns:
+            Whatever google_tts returns; the click handler routes it to the
+            audio and message outputs.
+        """
+        # Most languages have no curated variant list. Use the same default
+        # that update_google_voice_options offers instead of raising KeyError.
+        variants = dict(google_voice_options.get(google_lang, [("United States", "com")]))
+        google_voice_tld = variants.get(google_voice_desc)
+        if google_voice_tld is None:
+            # The dropdown may still hold a description that does not belong
+            # to this language (for example "United States" while French is
+            # selected); fall back to the language's first variant.
+            google_voice_tld = next(iter(variants.values()), "com")
+        return google_tts(text, google_lang, google_voice_tld)
     def update_google_voice_options(lang):
+        """Rebuild the voice-variant dropdown for the newly selected language.
+
+        Args:
+            lang: Language code chosen in the language dropdown.
+
+        Returns:
+            A gr.Dropdown update carrying the variant names for ``lang`` and a
+            selected value that is guaranteed to be one of those names.
+        """
+        names = [name for name, _tld in google_voice_options.get(lang, [("United States", "com")])]
+        # "United States" stays the preferred preselection, but several
+        # languages (fr, de, ja, ...) do not offer it; selecting a value that
+        # is absent from the choices leaves the dropdown in an invalid state.
+        if "United States" in names:
+            selected = "United States"
+        else:
+            selected = names[0] if names else None
+        return gr.Dropdown(choices=names, value=selected)
+    # Clicking the button runs generate_speech on the text, language and voice
+    # selections; the result is routed to the audio player and the message box.
     speech_button.click(generate_speech,
+                        inputs=[text_input, google_lang_input, google_voice_input],
                         outputs=[speech_output, speech_message])
+    # Changing the language refreshes the choices of the voice-variant dropdown.
     google_lang_input.change(update_google_voice_options, inputs=[google_lang_input], outputs=[google_voice_input])
+iface.launch()