soujanyaporia committed on
Commit
298880e
1 Parent(s): aa617a2

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +9 -2
app.py CHANGED
@@ -102,7 +102,14 @@ def gradio_generate(prompt, steps, guidance):
102
  # Using this ChatGPT-generated description of the sound, TANGO provides superior results.
103
  # <p/>
104
  # """
105
- description_text = ""
 
 
 
 
 
 
 
106
  # Gradio input and output components
107
  input_text = gr.Textbox(lines=2, label="Prompt")
108
  output_audio = gr.Audio(label="Generated Audio", type="filepath")
@@ -114,7 +121,7 @@ gr_interface = gr.Interface(
114
  fn=gradio_generate,
115
  inputs=[input_text, denoising_steps, guidance_scale],
116
  outputs=[output_audio],
117
- title="TANGO2: Aligning Diffusion-based Text-to-Audio Generative Models through Direct Preference Optimization",
118
  description=description_text,
119
  allow_flagging=False,
120
  examples=[
 
102
  # Using this ChatGPT-generated description of the sound, TANGO provides superior results.
103
  # <p/>
104
  # """
105
+ description_text = """
106
+ <p><a href="https://huggingface.co/spaces/declare-lab/tango2/blob/main/app.py?duplicate=true"> <img style="margin-top: 0em; margin-bottom: 0em" src="https://bit.ly/3gLdBN6" alt="Duplicate Space"></a> For faster inference without waiting in queue, you may duplicate the space and upgrade to a GPU in the settings. <br/><br/>
107
+ Generate audio using Tango2 by providing a text prompt. Tango2 was built from Tango and was trained on <a href="https://huggingface.co/datasets/declare-lab/audio-alpaca">Audio-alpaca</a>
108
+ <br/><br/> This is the demo for Tango2 for text to audio generation: <a href="https://arxiv.org/abs/2404.09956">Read our paper.</a>
109
+ <br>
110
+ This version is trained on an extended version of Audio-alpaca and results are better.
111
+ <p/>
112
+ """
113
  # Gradio input and output components
114
  input_text = gr.Textbox(lines=2, label="Prompt")
115
  output_audio = gr.Audio(label="Generated Audio", type="filepath")
 
121
  fn=gradio_generate,
122
  inputs=[input_text, denoising_steps, guidance_scale],
123
  outputs=[output_audio],
124
+ title="Tango 2: Aligning Diffusion-based Text-to-Audio Generations through Direct Preference Optimization",
125
  description=description_text,
126
  allow_flagging=False,
127
  examples=[