Spaces:

vuxuanhoan
/

g-TTS

Sleeping

App Files Files Community

vuxuanhoan committed on Oct 12, 2024

Commit

690b063

verified ·

1 Parent(s): b384bc1

Update app.py

Browse files

Files changed (1) hide show

app.py +36 -33

app.py CHANGED Viewed

@@ -9,68 +9,71 @@ AUDIO_DIR = 'audio_files'
 MAX_FILE_AGE = 24 * 60 * 60  # maximum age of audio files in seconds (24 hours)
 def text_to_speech(text, lang, tld):
-    # map the language name to its corresponding code
     lang_codes = {lang_name: lang_code for lang_code, lang_name in _main_langs().items()}
     lang_code = lang_codes[lang]
-    # create the text-to-speech audio
     tts = gTTS(text, lang=lang_code, tld=tld)
     fp = io.BytesIO()
     tts.write_to_fp(fp)
     fp.seek(0)
-    # create the audio directory if it does not exist
     os.makedirs(AUDIO_DIR, exist_ok=True)
-    # generate a unique file name for the audio file
     file_name = str(time.time()) + '.wav'
     file_path = os.path.join(AUDIO_DIR, file_name)
-    # save the audio stream to a file
     with open(file_path, 'wb') as f:
         f.write(fp.read())
-    # delete old audio files
     delete_old_audio_files()
-    # return the file path
-    return file_path, f.name
-def txt_file_to_speech(txt_file, lang, tld):
-    # read text from the uploaded .txt file
-    text = txt_file.read().decode('utf-8')
-    return text_to_speech(text, lang, tld)
 def delete_old_audio_files():
-    # delete audio files older than MAX_FILE_AGE
     now = time.time()
     for file_name in os.listdir(AUDIO_DIR):
         file_path = os.path.join(AUDIO_DIR, file_name)
         if now - os.path.getmtime(file_path) > MAX_FILE_AGE:
             os.remove(file_path)
-# list of supported TLDs
-tlds = ["com", "vn",  # shortened for brevity
 ]
-# Interface with two tabs
 with gr.Blocks() as iface:
     with gr.Tab("Text to Speech"):
         gr.Markdown("### Convert text to speech")
         text_input = gr.Textbox(lines=10, label="Enter your text here:")
-        lang_dropdown = gr.Dropdown(choices=list(_main_langs().values()), value="Vietnamese", label="Select language:")
-        tld_dropdown = gr.Dropdown(choices=[tld for tld in tlds], label="Select TLD:", value="com")
-        audio_output = gr.Audio(label="Audio")
-        file_output = gr.File(label="Audio File")
-        gr.Button("Convert").click(text_to_speech, inputs=[text_input, lang_dropdown, tld_dropdown], outputs=[audio_output, file_output])
-    with gr.Tab("Convert .txt to Speech"):
-        gr.Markdown("### Convert a .txt file to speech")
-        txt_input = gr.File(label="Upload your .txt file", file_types=["text"])
-        lang_dropdown_txt = gr.Dropdown(choices=list(_main_langs().values()), value="Vietnamese", label="Select language:")
-        tld_dropdown_txt = gr.Dropdown(choices=[tld for tld in tlds], label="Select TLD:", value="com")
-        audio_output_txt = gr.Audio(label="Audio")
-        file_output_txt = gr.File(label="Audio File")
-        gr.Button("Convert").click(txt_file_to_speech, inputs=[txt_input, lang_dropdown_txt, tld_dropdown_txt], outputs=[audio_output_txt, file_output_txt])
 iface.launch(enable_queue=True)

 MAX_FILE_AGE = 24 * 60 * 60  # maximum age of audio files in seconds (24 hours)
 def text_to_speech(text, lang, tld):
     """Synthesize *text* with gTTS and store the audio under ``AUDIO_DIR``.

     Args:
         text: The text to speak.
         lang: Human-readable language name, as listed by ``_main_langs()``.
         tld: Top-level domain passed through to ``gTTS`` unchanged.

     Returns:
         A ``(file_path, file_path)`` tuple: the same path twice, one for the
         audio player output and one for the downloadable file output.

     Raises:
         gr.Error: If *text* is empty/blank or *lang* is not a known
             language name (for example when no language was selected).
     """
     # Fail early with a readable message instead of an assertion from gTTS.
     if not text or not text.strip():
         raise gr.Error("Please enter some text to convert.")

     # _main_langs() maps code -> name; invert it to look up the code by name.
     lang_codes = {lang_name: lang_code for lang_code, lang_name in _main_langs().items()}
     lang_code = lang_codes.get(lang)
     if lang_code is None:
         raise gr.Error("Please select a language.")

     tts = gTTS(text, lang=lang_code, tld=tld)
     # Buffer in memory first so a failed request never leaves a partial file.
     fp = io.BytesIO()
     tts.write_to_fp(fp)

     os.makedirs(AUDIO_DIR, exist_ok=True)
     # gTTS produces MP3 data, so the file is named accordingly.
     file_name = str(time.time()) + '.mp3'
     file_path = os.path.join(AUDIO_DIR, file_name)
     with open(file_path, 'wb') as f:
         f.write(fp.getvalue())

     delete_old_audio_files()
     return file_path, file_path
 def delete_old_audio_files():
     """Delete files in ``AUDIO_DIR`` last modified more than ``MAX_FILE_AGE`` seconds ago.

     Best-effort cleanup: a missing directory, sub-directories, and files
     that disappear while the scan is running are skipped rather than raised.
     """
     now = time.time()
     try:
         file_names = os.listdir(AUDIO_DIR)
     except FileNotFoundError:
         # Nothing has been generated yet, so there is nothing to clean up.
         return
     for file_name in file_names:
         file_path = os.path.join(AUDIO_DIR, file_name)
         try:
             # Only regular files are removed; os.remove() fails on directories.
             if os.path.isfile(file_path) and now - os.path.getmtime(file_path) > MAX_FILE_AGE:
                 os.remove(file_path)
         except FileNotFoundError:
             # Another request's cleanup removed the file first.
             continue
def txt_to_speech(file, lang, tld):
    """Convert the contents of an uploaded .txt file to speech.

    Args:
        file: The uploaded file, either an object exposing the file's path
            as ``.name`` or the path itself as a string.
        lang: Human-readable language name, forwarded to ``text_to_speech``.
        tld: Top-level domain, forwarded to ``text_to_speech``.

    Returns:
        Whatever ``text_to_speech`` returns for the file's text.

    Raises:
        gr.Error: If no file was uploaded.
    """
    if file is None:
        raise gr.Error("Please upload a .txt file.")
    # Accept both a path string and an upload object that carries the path.
    path = file if isinstance(file, str) else file.name
    # Decode explicitly instead of relying on the platform default encoding;
    # 'utf-8-sig' reads plain UTF-8 and also drops a leading BOM if present.
    with open(path, 'r', encoding='utf-8-sig') as f:
        text = f.read()
    return text_to_speech(text, lang, tld)
+tlds = [
+    "com", "ad", "ae", "com.af", "com.ag", "com.ai", "com.ar", "as", "at", "com.au", "az",
+    "ba", "com.bd", "be", "bf", "bg", "bj", "br", "bs", "bt", "co.bw", "by", "com.bz", "ca",
+    "cd", "ch", "ci", "co.ck", "cl", "cm", "cn", "com.co", "co.cr", "cv", "dj", "dm", "com.do",
+    "dz", "com.ec", "ee", "com.eg", "es", "et", "fi", "com.fj", "fm", "fr", "ga", "ge", "gg",
+    "com.gh", "com.gi", "gl", "gm", "gr", "com.gt", "gy", "com.hk", "hn", "ht", "hr", "hu",
+    "co.id", "ie", "co.il", "im", "co.in", "iq", "is", "it", "iw", "je", "com.je", "jo",
+    "co.jp", "co.ke", "com.kh", "ki", "kg", "co.kr", "com.kw", "kz", "la", "com.lb", "li",
+    "lk", "co.ls", "lt", "lu", "lv", "com.ly", "com.ma", "md", "me", "mg", "mk", "ml", "mm",
+    "mn", "ms", "com.mt", "mu", "mv", "mw", "com.mx", "com.my", "co.mz", "na", "ng", "ni",
+    "ne", "nl", "no", "com.np", "nr", "nu", "co.nz", "com.om", "pa", "pe", "pg", "ph", "pk",
+    "pl", "pn", "com.pr", "ps", "pt", "com.py", "com.qa", "ro", "ru", "rw", "com.sa", "com.sb",
+    "sc", "se", "com.sg", "sh", "si", "sk", "com.sl", "sn", "so", "sm", "sr", "st", "com.sv",
+    "td", "tg", "co.th", "com.tj", "tl", "tm", "tn", "to", "com.tr", "tt", "com.tw", "co.tz",
+    "com.ua", "co.ug", "co.uk", "com.uy", "co.uz", "com.vc", "co.ve", "vg", "co.vi", "com.vn",
+    "vu", "ws", "rs", "co.za", "co.zm", "co.zw", "cat", "com.ng"
 ]
# Build the Gradio interface: one tab for typed text, one for uploaded .txt files.
with gr.Blocks() as iface:
    with gr.Tab("Text to Speech"):
        gr.Markdown("### Convert text to speech")
        text_input = gr.Textbox(lines=10, label="Enter your text here:")
        lang_input = gr.Dropdown(
            choices=list(_main_langs().values()),
            label="Select language:",
        )
        tld_input = gr.Dropdown(choices=list(tlds), label="Select TLD:", value="com")
        audio_output = gr.Audio(label="Audio")
        file_output = gr.File(label="Audio File")
        # Wire the button to the converter: three inputs in, audio + file out.
        convert_text_button = gr.Button("Convert")
        convert_text_button.click(
            fn=text_to_speech,
            inputs=[text_input, lang_input, tld_input],
            outputs=[audio_output, file_output],
        )
    with gr.Tab("TXT to Speech"):
        gr.Markdown("### Convert .txt file to speech")
        file_input = gr.File(label="Upload your .txt file")
        lang_input_file = gr.Dropdown(
            choices=list(_main_langs().values()),
            label="Select language:",
        )
        tld_input_file = gr.Dropdown(choices=list(tlds), label="Select TLD:", value="com")
        audio_output_file = gr.Audio(label="Audio")
        file_output_file = gr.File(label="Audio File")
        convert_file_button = gr.Button("Convert")
        convert_file_button.click(
            fn=txt_to_speech,
            inputs=[file_input, lang_input_file, tld_input_file],
            outputs=[audio_output_file, file_output_file],
        )

# NOTE(review): confirm the pinned Gradio version still accepts `enable_queue`
# as a launch() argument.
iface.launch(enable_queue=True)