Spaces:

snackshell
/

eng-amh-tts

Running

App Files Community

snackshell committed on Mar 24

Commit

ce98cc8

verified ·

1 Parent(s): 7481e8e

Update app.py

Browse files

Files changed (1) hide show

app.py +39 -80

app.py CHANGED Viewed

@@ -11,17 +11,22 @@ language_dict = {
     "English": {
         "Ryan": "en-GB-RyanNeural",
         "Clara": "en-CA-ClaraNeural"
-    },
-    "Tigrinya": {}  # Empty because we'll use Amharic voices with labels
 }
 async def text_to_speech_edge(text, language, speaker):
     if language == "Tigrinya":
-        clean_speaker = speaker.replace(" (Amharic Voice)", "")
-        voice = language_dict["Amharic"][clean_speaker]
-    else:
-        voice = language_dict[language][speaker]
     try:
         communicate = edge_tts.Communicate(text, voice)
         with tempfile.NamedTemporaryFile(delete=False, suffix=".mp3") as tmp_file:
@@ -31,104 +36,58 @@ async def text_to_speech_edge(text, language, speaker):
     except asyncio.TimeoutError:
         error_msg = ("ስህተት: ጊዜ አልቋል። እባክዎ እንደገና ይሞክሩ።"
-                    if language in ["Amharic", "Tigrinya"]
                     else "Error: Timeout. Please try again.")
         raise gr.Error(error_msg)
     except Exception as e:
         error_msg = (f"ስህተት: {str(e)}"
-                    if language in ["Amharic", "Tigrinya"]
                     else f"Error: {str(e)}")
         raise gr.Error(error_msg)
 def update_speakers(language):
     if language == "Tigrinya":
-        speakers = [f"{name} (Amharic Voice)" for name in language_dict["Amharic"].keys()]
     else:
-        speakers = list(language_dict[language].keys())
-    return gr.Dropdown(
-        choices=speakers,
-        value=speakers[0],
-        label=f"Select Speaker {'(Amharic Voices)' if language == 'Tigrinya' else ''}"
-    )
-with gr.Blocks(title="Amharic, English & Tigrinya TTS", theme=gr.themes.Soft()) as demo:
-    gr.HTML("""
-    <style>
-        h1 {
-            color: #2E86C1;
-            text-align: center;
-            background: linear-gradient(45deg, #FF007F, #2E86C1);
-            -webkit-background-clip: text;
-            -webkit-text-fill-color: transparent;
-            margin-bottom: 20px;
-        }
-        .notice {
-            font-size: 0.9em;
-            color: #666;
-            text-align: center;
-            margin: 10px 0;
-            font-style: italic;
-        }
-        .gradio-button {
-            background: linear-gradient(45deg, #FF007F, #2E86C1) !important;
-            color: white !important;
-        }
-    </style>
-    <center>
-        <h1>Amharic, English & Tigrinya Text-to-Speech</h1>
-        <div class="notice">
-            Note: Tigrinya uses Amharic-accented voices until dedicated models become available
-        </div>
-    </center>
-    """)
     with gr.Row():
-        with gr.Column():
-            language = gr.Dropdown(
-                choices=["Amharic", "English", "Tigrinya"],
-                value="Amharic",
-                label="Select Language / ቋንቋ ይምረጡ"
-            )
-            input_text = gr.Textbox(
-                lines=5,
-                label="Enter Text / ጽሑፍ ያስገቡ",
-                placeholder="Type your text here... / ጽሑፍዎን ይጻፉ..."
-            )
-            speaker = gr.Dropdown(
-                label="Select Speaker / አርቲስት ይምረጡ",
-                interactive=True
-            )
-            run_btn = gr.Button(
-                value="Generate Audio / ድምፅ ፍጠር",
-                variant="primary"
-            )
-        with gr.Column():
-            output_audio = gr.Audio(
-                type="filepath",
-                label="Generated Audio / የተፈጠረ ድምፅ",
-                interactive=False
-            )
-    # Initialize speakers dropdown
     demo.load(
-        fn=lambda: gr.update(choices=list(language_dict["Amharic"].keys())),
         outputs=speaker
     )
-    # Update speakers when language changes
     language.change(
         update_speakers,
         inputs=language,
         outputs=speaker
     )
-    run_btn.click(
         text_to_speech_edge,
         inputs=[input_text, language, speaker],
         outputs=output_audio
     )
 if __name__ == "__main__":
-    demo.launch(server_port=7860, share=False)

     "English": {
         "Ryan": "en-GB-RyanNeural",
         "Clara": "en-CA-ClaraNeural"
+    }
 }
 async def text_to_speech_edge(text, language, speaker):
+    # Handle Tigrinya as Amharic with different label
     if language == "Tigrinya":
+        language = "Amharic"
+    try:
+        voice = language_dict[language][speaker]
+    except KeyError:
+        error_msg = (f"ስህተት: ድምፅ '{speaker}' አልተገኘም።"
+                    if language == "Amharic"
+                    else f"Error: Voice '{speaker}' not found")
+        raise gr.Error(error_msg)
     try:
         communicate = edge_tts.Communicate(text, voice)
         with tempfile.NamedTemporaryFile(delete=False, suffix=".mp3") as tmp_file:
     except asyncio.TimeoutError:
         error_msg = ("ስህተት: ጊዜ አልቋል። እባክዎ እንደገና ይሞክሩ።"
+                    if language == "Amharic"
                     else "Error: Timeout. Please try again.")
         raise gr.Error(error_msg)
     except Exception as e:
         error_msg = (f"ስህተት: {str(e)}"
+                    if language == "Amharic"
                     else f"Error: {str(e)}")
         raise gr.Error(error_msg)
 def update_speakers(language):
     if language == "Tigrinya":
+        speakers = list(language_dict["Amharic"].keys())
     else:
+        speakers = list(language_dict.get(language, []))
+    return gr.Dropdown(choices=speakers, value=speakers[0] if speakers else None)
+with gr.Blocks(title="SelamGPT TTS") as demo:
+    gr.Markdown("## Amharic, English & Tigrinya Text-to-Speech")
     with gr.Row():
+        language = gr.Dropdown(
+            choices=["Amharic", "English", "Tigrinya"],
+            value="Amharic",
+            label="Language"
+        )
+        speaker = gr.Dropdown(
+            label="Speaker",
+            allow_custom_value=False
+        )
+        input_text = gr.Textbox(label="Input Text")
+    generate_btn = gr.Button("Generate Audio")
+    output_audio = gr.Audio(label="Output")
+    # API endpoints
     demo.load(
+        fn=lambda: gr.Dropdown(choices=language_dict["Amharic"].keys()),
         outputs=speaker
     )
     language.change(
         update_speakers,
         inputs=language,
         outputs=speaker
     )
+    generate_btn.click(
         text_to_speech_edge,
         inputs=[input_text, language, speaker],
         outputs=output_audio
     )
 if __name__ == "__main__":
+    demo.launch(server_port=7860)