Spaces:
Runtime error
Runtime error
soujanyaporia
committed on
Commit
•
298880e
1
Parent(s):
aa617a2
Update app.py
Browse files
app.py
CHANGED
@@ -102,7 +102,14 @@ def gradio_generate(prompt, steps, guidance):
|
|
102 |
# Using this ChatGPT-generated description of the sound, TANGO provides superior results.
|
103 |
# <p/>
|
104 |
# """
|
105 |
-
description_text = ""
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
106 |
# Gradio input and output components
|
107 |
input_text = gr.Textbox(lines=2, label="Prompt")
|
108 |
output_audio = gr.Audio(label="Generated Audio", type="filepath")
|
@@ -114,7 +121,7 @@ gr_interface = gr.Interface(
|
|
114 |
fn=gradio_generate,
|
115 |
inputs=[input_text, denoising_steps, guidance_scale],
|
116 |
outputs=[output_audio],
|
117 |
-
title="
|
118 |
description=description_text,
|
119 |
allow_flagging=False,
|
120 |
examples=[
|
|
|
102 |
# Using this ChatGPT-generated description of the sound, TANGO provides superior results.
|
103 |
# <p/>
|
104 |
# """
|
105 |
+
description_text = """
|
106 |
+
<p><a href="https://huggingface.co/spaces/declare-lab/tango2/blob/main/app.py?duplicate=true"> <img style="margin-top: 0em; margin-bottom: 0em" src="https://bit.ly/3gLdBN6" alt="Duplicate Space"></a> For faster inference without waiting in the queue, you may duplicate the space and upgrade to a GPU in the settings. <br/><br/>
|
107 |
+
Generate audio using Tango2 by providing a text prompt. Tango2 was built from Tango and was trained on <a href="https://huggingface.co/datasets/declare-lab/audio-alpaca">Audio-alpaca</a>.
|
108 |
+
<br/><br/> This is the demo for Tango2 for text to audio generation: <a href="https://arxiv.org/abs/2404.09956">Read our paper.</a>
|
109 |
+
<br>
|
110 |
+
This version is trained on an extended version of Audio-alpaca and produces better results.
|
111 |
+
</p>
|
112 |
+
"""
|
113 |
# Gradio input and output components
|
114 |
input_text = gr.Textbox(lines=2, label="Prompt")
|
115 |
output_audio = gr.Audio(label="Generated Audio", type="filepath")
|
|
|
121 |
fn=gradio_generate,
|
122 |
inputs=[input_text, denoising_steps, guidance_scale],
|
123 |
outputs=[output_audio],
|
124 |
+
title="Tango 2: Aligning Diffusion-based Text-to-Audio Generations through Direct Preference Optimization",
|
125 |
description=description_text,
|
126 |
allow_flagging=False,
|
127 |
examples=[
|