Has-ai commited on
Commit
b9f5aff
·
1 Parent(s): 13e963e

Create app.py

Browse files
Files changed (1) hide show
  1. app.py +94 -0
app.py ADDED
@@ -0,0 +1,94 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+
2
+
3
+ import logging
4
+ from typing import cast
5
+
6
+ import gradio as gr
7
+ from balacoon_tts import TTS
8
+ from huggingface_hub import hf_hub_download, list_repo_files
9
+
10
+ # global tts module, initialized from a model selected
11
+ tts = None
12
+
13
+
14
+ def main():
15
+ logging.basicConfig(level=logging.INFO)
16
+
17
+ with gr.Blocks() as demo:
18
+ gr.Markdown(
19
+ """
20
+ <h1 align="center">Which voice you like?</h1>
21
+
22
+ 1. Write an utterance to generate,
23
+ 2. Select the model to synthesize with
24
+ 3. Select speaker
25
+ 4. Hit "Generate" and listen to the result!
26
+
27
+ When you select model for the first time,
28
+ it will take a little time to download it.
29
+ You can learn more about models available
30
+ [here](https://huggingface.co/balacoon/tts).
31
+ Visit [Balacoon website](https://balacoon.com/) for more info.
32
+ """
33
+ )
34
+ with gr.Row(variant="panel"):
35
+ text = gr.Textbox(label="Text", placeholder="Type something here...")
36
+
37
+ with gr.Row():
38
+ with gr.Column(variant="panel"):
39
+ repo_files = list_repo_files(repo_id="balacoon/tts")
40
+ model_files = [x for x in repo_files if x.endswith("_cpu.addon")]
41
+ model_name = gr.Dropdown(
42
+ label="Model",
43
+ choices=model_files,
44
+ )
45
+ with gr.Column(variant="panel"):
46
+ speaker = gr.Dropdown(label="Speaker", choices=[])
47
+
48
+ def set_model(model_name_str: str):
49
+ """
50
+ gets value from `model_name`, loads model,
51
+ re-initializes tts object, gets list of
52
+ speakers that model supports and set them to `speaker`
53
+ """
54
+ model_path = hf_hub_download(
55
+ repo_id="balacoon/tts", filename=model_name_str
56
+ )
57
+ global tts
58
+ tts = TTS(model_path)
59
+ speakers = tts.get_speakers()
60
+ value = speakers[-1]
61
+ return gr.Dropdown.update(
62
+ choices=speakers, value=value, visible=True
63
+ )
64
+
65
+ model_name.change(set_model, inputs=model_name, outputs=speaker)
66
+
67
+ with gr.Row(variant="panel"):
68
+ generate = gr.Button("Generate")
69
+ with gr.Row(variant="panel"):
70
+ audio = gr.Audio()
71
+
72
+ def synthesize_audio(text_str: str, speaker_str: str = ""):
73
+ """
74
+ gets utterance to synthesize from `text` Textbox
75
+ and speaker name from `speaker` dropdown list.
76
+ speaker name might be empty for single-speaker models.
77
+ Synthesizes the waveform and updates `audio` with it.
78
+ """
79
+ if not text_str:
80
+ logging.info("text or speaker are not provided")
81
+ return None
82
+ global tts
83
+ if len(text_str) > 1024:
84
+ text_str = text_str[:1024]
85
+ samples = cast(TTS, tts).synthesize(text_str, speaker_str)
86
+ return gr.Audio.update(value=(cast(TTS, tts).get_sampling_rate(), samples))
87
+
88
+ generate.click(synthesize_audio, inputs=[text, speaker], outputs=audio)
89
+
90
+ demo.launch()
91
+
92
+
93
+ if __name__ == "__main__":
94
+ main()