Spaces:

vuxuanhoan
/

g-TTS

Sleeping

App Files Files Community

vuxuanhoan committed on Oct 12, 2024

Commit

03a52a4

verified ·

1 Parent(s): 690b063

Update app.py

Browse files

Files changed (1) hide show

app.py +27 -23

app.py CHANGED Viewed

@@ -1,5 +1,6 @@
 import gradio as gr
 from gtts import gTTS
 import io
 import os
 import time
@@ -8,14 +9,27 @@ from gtts.lang import _main_langs
 AUDIO_DIR = 'audio_files'
 MAX_FILE_AGE = 24 * 60 * 60  # maximum age of audio files in seconds (24 hours)
-def text_to_speech(text, lang, tld):
     lang_codes = {lang_name: lang_code for lang_code, lang_name in _main_langs().items()}
     lang_code = lang_codes[lang]
-    tts = gTTS(text, lang=lang_code, tld=tld)
-    fp = io.BytesIO()
-    tts.write_to_fp(fp)
-    fp.seek(0)
     os.makedirs(AUDIO_DIR, exist_ok=True)
     file_name = str(time.time()) + '.wav'
@@ -35,27 +49,15 @@ def delete_old_audio_files():
             os.remove(file_path)
 # Hàm chuyển đổi file .txt thành giọng nói
-def txt_to_speech(file, lang, tld):
     with open(file.name, 'r') as f:
         text = f.read()
-    return text_to_speech(text, lang, tld)
 tlds = [
     "com", "ad", "ae", "com.af", "com.ag", "com.ai", "com.ar", "as", "at", "com.au", "az",
-    "ba", "com.bd", "be", "bf", "bg", "bj", "br", "bs", "bt", "co.bw", "by", "com.bz", "ca",
-    "cd", "ch", "ci", "co.ck", "cl", "cm", "cn", "com.co", "co.cr", "cv", "dj", "dm", "com.do",
-    "dz", "com.ec", "ee", "com.eg", "es", "et", "fi", "com.fj", "fm", "fr", "ga", "ge", "gg",
-    "com.gh", "com.gi", "gl", "gm", "gr", "com.gt", "gy", "com.hk", "hn", "ht", "hr", "hu",
-    "co.id", "ie", "co.il", "im", "co.in", "iq", "is", "it", "iw", "je", "com.je", "jo",
-    "co.jp", "co.ke", "com.kh", "ki", "kg", "co.kr", "com.kw", "kz", "la", "com.lb", "li",
-    "lk", "co.ls", "lt", "lu", "lv", "com.ly", "com.ma", "md", "me", "mg", "mk", "ml", "mm",
-    "mn", "ms", "com.mt", "mu", "mv", "mw", "com.mx", "com.my", "co.mz", "na", "ng", "ni",
-    "ne", "nl", "no", "com.np", "nr", "nu", "co.nz", "com.om", "pa", "pe", "pg", "ph", "pk",
-    "pl", "pn", "com.pr", "ps", "pt", "com.py", "com.qa", "ro", "ru", "rw", "com.sa", "com.sb",
-    "sc", "se", "com.sg", "sh", "si", "sk", "com.sl", "sn", "so", "sm", "sr", "st", "com.sv",
-    "td", "tg", "co.th", "com.tj", "tl", "tm", "tn", "to", "com.tr", "tt", "com.tw", "co.tz",
-    "com.ua", "co.ug", "co.uk", "com.uy", "co.uz", "com.vc", "co.ve", "vg", "co.vi", "com.vn",
-    "vu", "ws", "rs", "co.za", "co.zm", "co.zw", "cat", "com.ng"
 ]
 # Tạo giao diện Gradio với tab
@@ -65,15 +67,17 @@ with gr.Blocks() as iface:
         text_input = gr.Textbox(lines=10, label="Enter your text here:")
         lang_input = gr.Dropdown(choices=list(_main_langs().values()), label="Select language:")
         tld_input = gr.Dropdown(choices=[tld for tld in tlds], label="Select TLD:", value="com")
         audio_output, file_output = gr.Audio(label="Audio"), gr.File(label="Audio File")
-        gr.Button("Convert").click(fn=text_to_speech, inputs=[text_input, lang_input, tld_input], outputs=[audio_output, file_output])
     with gr.Tab("TXT to Speech"):
         gr.Markdown("### Convert .txt file to speech")
         file_input = gr.File(label="Upload your .txt file")
         lang_input_file = gr.Dropdown(choices=list(_main_langs().values()), label="Select language:")
         tld_input_file = gr.Dropdown(choices=[tld for tld in tlds], label="Select TLD:", value="com")
         audio_output_file, file_output_file = gr.Audio(label="Audio"), gr.File(label="Audio File")
-        gr.Button("Convert").click(fn=txt_to_speech, inputs=[file_input, lang_input_file, tld_input_file], outputs=[audio_output_file, file_output_file])
 iface.launch(enable_queue=True)

 import gradio as gr
 from gtts import gTTS
+import edge_tts
 import io
 import os
 import time
 AUDIO_DIR = 'audio_files'
 MAX_FILE_AGE = 24 * 60 * 60  # maximum age of audio files in seconds (24 hours)
+def text_to_speech(text, lang, tld, method):
     lang_codes = {lang_name: lang_code for lang_code, lang_name in _main_langs().items()}
     lang_code = lang_codes[lang]
+    if method == "gTTS":
+        tts = gTTS(text, lang=lang_code, tld=tld)
+        fp = io.BytesIO()
+        tts.write_to_fp(fp)
+        fp.seek(0)
+    elif method == "Edge TTS":
+        # Convert text to speech using Edge TTS
+        output = io.BytesIO()
+        voice = f"{lang_code}-{tld}".replace('_', '-')
+        # Create an Edge TTS object and get audio
+        await edge_tts.init()
+        communicate = edge_tts.Communicate(text, voice)
+        await communicate.save(output)
+        output.seek(0)
+        fp = output  # Use the in-memory output
     os.makedirs(AUDIO_DIR, exist_ok=True)
     file_name = str(time.time()) + '.wav'
             os.remove(file_path)
 # Hàm chuyển đổi file .txt thành giọng nói
+def txt_to_speech(file, lang, tld, method):
     with open(file.name, 'r') as f:
         text = f.read()
+    return text_to_speech(text, lang, tld, method)
 tlds = [
     "com", "ad", "ae", "com.af", "com.ag", "com.ai", "com.ar", "as", "at", "com.au", "az",
+    # (remaining TLDs omitted for brevity)
+    "com.vn"
 ]
 # Tạo giao diện Gradio với tab
         text_input = gr.Textbox(lines=10, label="Enter your text here:")
         lang_input = gr.Dropdown(choices=list(_main_langs().values()), label="Select language:")
         tld_input = gr.Dropdown(choices=[tld for tld in tlds], label="Select TLD:", value="com")
+        method_input = gr.Radio(choices=["gTTS", "Edge TTS"], label="Select method:", value="gTTS")
         audio_output, file_output = gr.Audio(label="Audio"), gr.File(label="Audio File")
+        gr.Button("Convert").click(fn=text_to_speech, inputs=[text_input, lang_input, tld_input, method_input], outputs=[audio_output, file_output])
     with gr.Tab("TXT to Speech"):
         gr.Markdown("### Convert .txt file to speech")
         file_input = gr.File(label="Upload your .txt file")
         lang_input_file = gr.Dropdown(choices=list(_main_langs().values()), label="Select language:")
         tld_input_file = gr.Dropdown(choices=[tld for tld in tlds], label="Select TLD:", value="com")
+        method_input_file = gr.Radio(choices=["gTTS", "Edge TTS"], label="Select method:", value="gTTS")
         audio_output_file, file_output_file = gr.Audio(label="Audio"), gr.File(label="Audio File")
+        gr.Button("Convert").click(fn=txt_to_speech, inputs=[file_input, lang_input_file, tld_input_file, method_input_file], outputs=[audio_output_file, file_output_file])
 iface.launch(enable_queue=True)