Spaces:

mbarnig
/

MULTI_TTS_for_LOD

Sleeping

App Files Files Community

mbarnig committed on Jul 9, 2024

Commit

e027fad

verified ·

1 Parent(s): e26665f

Create app.py

Browse files

Files changed (1) hide show

app.py +73 -0

app.py ADDED Viewed

	@@ -0,0 +1,73 @@

+import gradio as gr
+import tempfile
+from TTS.utils.synthesizer import Synthesizer
+from huggingface_hub import hf_hub_download
+REPO_ID = "mbarnig/MULTI_LOD_TTS"
+my_title = "🇩🇪 🇫🇷 🇬🇧 🇵🇹 Mir schwätzen wéi e Lëtzebuerger ! 🇱🇺"
+my_description = "Multilingual-Multispeaker Text-to-Speech (TTS) synthesizer speaking the five current languages in Luxembourg. This model is based on VITS, thanks to 🐸 [Coqui.ai](https://coqui.ai/)."
+TTS_VOICES = [
+    Mann,
+    Fra
+]
+TTS_LANGUAGES = [
+  "Deutsch",
+  "English",
+  "Français",
+  "Lëtzebuergesch",
+  "Português"
+]
+my_examples = []
+my_article = "<h3>User guide</h3>"
+my_inputs = [
+  gr.Textbox(lines=5, label="Input Text"),
+  gr.Radio(label="Speaker", choices = TTS_VOICES, value = "Judith"),
+  gr.Radio(label="Language", choices = TTS_LANGUAGES, value = "Lëtzebuergesch"),
+]
+my_outputs = gr.Audio(type="filepath", label="Output Audio")
+def tts(text: str, speaker_idx: str, language_idx: str):
+    best_model_path = hf_hub_download(repo_id=REPO_ID, filename="best_model.pth")
+    config_path = hf_hub_download(repo_id=REPO_ID, filename="config.json")
+    speakers_path = hf_hub_download(repo_id=REPO_ID, filename="speakers.pth")
+    languages_path = hf_hub_download(repo_id=REPO_ID, filename="language_ids.json")
+    speaker_encoder_model_path = hf_hub_download(repo_id=REPO_ID, filename="model_se.pth")
+    speaker_encoder_config_path = hf_hub_download(repo_id=REPO_ID, filename="config_se.json")
+    # init synthesizer
+    synthesizer = Synthesizer(
+        best_model_path,
+        config_path,
+        speakers_path,
+        languages_path,
+        None,
+        None,
+        speaker_encoder_model_path,
+        speaker_encoder_config_path,
+        False
+    )
+    # create audio file
+    wavs = synthesizer.tts(text, speaker_idx, language_idx)
+    with tempfile.NamedTemporaryFile(suffix = ".wav", delete = False) as fp:
+        synthesizer.save_wav(wavs, fp)
+    return fp.name
+iface = gr.Interface(
+    fn=tts,
+    inputs=my_inputs,
+    outputs=my_outputs,
+    title=my_title,
+    description = my_description,
+    article = my_article,
+    examples = my_examples,
+    allow_flagging=False
+)
+iface.launch()