Update demo.py
Browse files
demo.py
CHANGED
@@ -191,15 +191,15 @@ with gr.Blocks() as audio_inf:
|
|
191 |
|
192 |
with gr.Accordion("Advanced Parameters", open=False):
|
193 |
beta = gr.Slider(minimum=0, maximum=1, value=0.4, step=0.1,
|
194 |
-
label="Beta (
|
195 |
info="Diffusion parameter. Higher means LESS like the reference audio. 0 disables diffusion.",
|
196 |
interactive=True)
|
197 |
multispeakersteps = gr.Slider(minimum=3, maximum=15, value=5, step=1,
|
198 |
-
label="Diffusion Steps",
|
199 |
info="More steps can improve quality but increase inference time.",
|
200 |
interactive=True)
|
201 |
embscale = gr.Slider(minimum=1, maximum=5, value=1, step=0.1,
|
202 |
-
label="Embedding Scale (Intensity)",
|
203 |
info="Impacts expressiveness. High values (> 1.5) might cause artifacts.",
|
204 |
interactive=True)
|
205 |
rate_of_speech = gr.Slider(minimum=0.5, maximum=2,
|
@@ -262,15 +262,15 @@ with gr.Blocks() as longform:
|
|
262 |
|
263 |
with gr.Accordion("Advanced Parameters", open=False):
|
264 |
beta_longform = gr.Slider(minimum=0, maximum=1, value=0.4, step=0.1,
|
265 |
-
label="Beta (
|
266 |
info="Diffusion parameter. Higher means LESS like the inferred style from text. 0 disables diffusion.",
|
267 |
interactive=True)
|
268 |
diffusion_steps_longform = gr.Slider(minimum=3, maximum=15, value=5, step=1,
|
269 |
-
label="Diffusion Steps",
|
270 |
info="More steps can improve quality but increase inference time.",
|
271 |
interactive=True)
|
272 |
embedding_scale_longform = gr.Slider(minimum=1, maximum=5, value=1, step=0.1,
|
273 |
-
label="Embedding Scale (Intensity)",
|
274 |
info="Impacts expressiveness. High values (> 1.5) might cause artifacts.",
|
275 |
interactive=True)
|
276 |
rate_of_speech_longform = gr.Slider(minimum=0.5, maximum=2, value=1, step=0.1,
|
|
|
191 |
|
192 |
with gr.Accordion("Advanced Parameters", open=False):
|
193 |
beta = gr.Slider(minimum=0, maximum=1, value=0.4, step=0.1,
|
194 |
+
label="Beta (Diffusion Strength vs. Reference) - Kalliope Only",
|
195 |
info="Diffusion parameter. Higher means LESS like the reference audio. 0 disables diffusion.",
|
196 |
interactive=True)
|
197 |
multispeakersteps = gr.Slider(minimum=3, maximum=15, value=5, step=1,
|
198 |
+
label="Diffusion Steps - Kalliope Only",
|
199 |
info="More steps can improve quality but increase inference time.",
|
200 |
interactive=True)
|
201 |
embscale = gr.Slider(minimum=1, maximum=5, value=1, step=0.1,
|
202 |
+
label="Embedding Scale (Intensity) - Kalliope Only",
|
203 |
info="Impacts expressiveness. High values (> 1.5) might cause artifacts.",
|
204 |
interactive=True)
|
205 |
rate_of_speech = gr.Slider(minimum=0.5, maximum=2,
|
|
|
262 |
|
263 |
with gr.Accordion("Advanced Parameters", open=False):
|
264 |
beta_longform = gr.Slider(minimum=0, maximum=1, value=0.4, step=0.1,
|
265 |
+
label="Beta (Diffusion Strength vs. Semantic Encoder) - Kalliope Only",
|
266 |
info="Diffusion parameter. Higher means LESS like the inferred style from text. 0 disables diffusion.",
|
267 |
interactive=True)
|
268 |
diffusion_steps_longform = gr.Slider(minimum=3, maximum=15, value=5, step=1,
|
269 |
+
label="Diffusion Steps - Kalliope Only",
|
270 |
info="More steps can improve quality but increase inference time.",
|
271 |
interactive=True)
|
272 |
embedding_scale_longform = gr.Slider(minimum=1, maximum=5, value=1, step=0.1,
|
273 |
+
label="Embedding Scale (Intensity) - Kalliope Only",
|
274 |
info="Impacts expressiveness. High values (> 1.5) might cause artifacts.",
|
275 |
interactive=True)
|
276 |
rate_of_speech_longform = gr.Slider(minimum=0.5, maximum=2, value=1, step=0.1,
|