Spaces:

mbazaNLP
/

Kinyarwanda-text-to-speech

Runtime error

File size: 1,658 Bytes

5e334c0
 
 
761c6e2
96dd0a7
4f802fe
5e334c0
 
4f802fe
5e334c0
 
 
 
8e663ab
 
 
 
 
 
 
 
 
 
 
761c6e2
e88cf51
8e663ab
 
 
5e334c0
 
 
 
 
 
 
 
 
e88cf51
 
5e334c0

import tempfile
from typing import Optional
import gradio as gr
from engine import TextToSpeech
import subprocess


MAX_TXT_LEN = 100

def generate_audio(text):
    if len(text) > MAX_TXT_LEN:
        text = text[:MAX_TXT_LEN]
        print(f"Input text was cutoff since it went over the {MAX_TXT_LEN} character limit.")
    # model_path, config_path, model_item = manager.download_model(model_name)
    # vocoder_name: Optional[str] = model_item["default_vocoder"]
    # vocoder_path = None
    # vocoder_config_path = None
    # if vocoder_name is not None:
    #     vocoder_path, vocoder_config_path, _ = manager.download_model(vocoder_name)
    # synthesizer = Synthesizer(
    #     model_path, config_path, None, None, vocoder_path, vocoder_config_path,
    # )
    # if synthesizer is None:
    #     raise NameError("model not found")
    tts_engine= TextToSpeech()
    return tts_engine.run_tts(text)
    # with tempfile.NamedTemporaryFile(suffix=".wav", delete=False) as fp:
    #     synthesizer.save_wav(wav, fp)
    #     return fp.name

iface = gr.Interface(
    fn=generate_audio,
    inputs=[
        gr.inputs.Textbox(
            label="Input Text",
            default="This sentence has been generated by a speech synthesis system.",
        ),
    ],
    outputs=gr.outputs.Audio(type="numpy",label="Output"),
    #outputs=gr.outputs.Textbox(label="Recognized speech from speechbrain model"),
    title="Kinyarwanda tts Demo",
    description="Kinyarwanda tts build with ",
    allow_flagging=False,
    flagging_options=['error', 'bad-quality', 'wrong-pronounciation'],
    layout="vertical",
    live=False
)
iface.launch(share=False)