Respair committed on
Commit
2817151
·
verified ·
1 Parent(s): d359296

Update demo.py

Browse files
Files changed (1) hide show
  1. demo.py +6 -6
demo.py CHANGED
@@ -191,15 +191,15 @@ with gr.Blocks() as audio_inf:
191
 
192
  with gr.Accordion("Advanced Parameters", open=False):
193
  beta = gr.Slider(minimum=0, maximum=1, value=0.4, step=0.1,
194
- label="Beta (Style Strength vs. Reference)",
195
  info="Diffusion parameter. Higher means LESS like the reference audio. 0 disables diffusion.",
196
  interactive=True)
197
  multispeakersteps = gr.Slider(minimum=3, maximum=15, value=5, step=1,
198
- label="Diffusion Steps",
199
  info="More steps can improve quality but increase inference time.",
200
  interactive=True)
201
  embscale = gr.Slider(minimum=1, maximum=5, value=1, step=0.1,
202
- label="Embedding Scale (Intensity)",
203
  info="Impacts expressiveness. High values (> 1.5) might cause artifacts.",
204
  interactive=True)
205
  rate_of_speech = gr.Slider(minimum=0.5, maximum=2,
@@ -262,15 +262,15 @@ with gr.Blocks() as longform:
262
 
263
  with gr.Accordion("Advanced Parameters", open=False):
264
  beta_longform = gr.Slider(minimum=0, maximum=1, value=0.4, step=0.1,
265
- label="Beta (Style Strength vs. Semantic Prompt)",
266
  info="Diffusion parameter. Higher means LESS like the inferred style from text. 0 disables diffusion.",
267
  interactive=True)
268
  diffusion_steps_longform = gr.Slider(minimum=3, maximum=15, value=5, step=1,
269
- label="Diffusion Steps",
270
  info="More steps can improve quality but increase inference time.",
271
  interactive=True)
272
  embedding_scale_longform = gr.Slider(minimum=1, maximum=5, value=1, step=0.1,
273
- label="Embedding Scale (Intensity)",
274
  info="Impacts expressiveness. High values (> 1.5) might cause artifacts.",
275
  interactive=True)
276
  rate_of_speech_longform = gr.Slider(minimum=0.5, maximum=2, value=1, step=0.1,
 
191
 
192
  with gr.Accordion("Advanced Parameters", open=False):
193
  beta = gr.Slider(minimum=0, maximum=1, value=0.4, step=0.1,
194
+ label="Beta (Diffusion Strength vs. Reference) - Kalliope Only",
195
  info="Diffusion parameter. Higher means LESS like the reference audio. 0 disables diffusion.",
196
  interactive=True)
197
  multispeakersteps = gr.Slider(minimum=3, maximum=15, value=5, step=1,
198
+ label="Diffusion Steps - Kalliope Only",
199
  info="More steps can improve quality but increase inference time.",
200
  interactive=True)
201
  embscale = gr.Slider(minimum=1, maximum=5, value=1, step=0.1,
202
+ label="Embedding Scale (Intensity) - Kalliope Only",
203
  info="Impacts expressiveness. High values (> 1.5) might cause artifacts.",
204
  interactive=True)
205
  rate_of_speech = gr.Slider(minimum=0.5, maximum=2,
 
262
 
263
  with gr.Accordion("Advanced Parameters", open=False):
264
  beta_longform = gr.Slider(minimum=0, maximum=1, value=0.4, step=0.1,
265
+ label="Beta (Diffusion Strength vs. Semantic Encoder) - Kalliope Only",
266
  info="Diffusion parameter. Higher means LESS like the inferred style from text. 0 disables diffusion.",
267
  interactive=True)
268
  diffusion_steps_longform = gr.Slider(minimum=3, maximum=15, value=5, step=1,
269
+ label="Diffusion Steps - Kalliope Only",
270
  info="More steps can improve quality but increase inference time.",
271
  interactive=True)
272
  embedding_scale_longform = gr.Slider(minimum=1, maximum=5, value=1, step=0.1,
273
+ label="Embedding Scale (Intensity) - Kalliope Only",
274
  info="Impacts expressiveness. High values (> 1.5) might cause artifacts.",
275
  interactive=True)
276
  rate_of_speech_longform = gr.Slider(minimum=0.5, maximum=2, value=1, step=0.1,