fantaxy committed on
Commit
82736c5
·
verified ·
1 Parent(s): 9982ba2

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +1 -36
app.py CHANGED
@@ -216,33 +216,8 @@ controller = FoleyController()
216
  device = "cuda" if torch.cuda.is_available() else "cpu"
217
 
218
  with gr.Blocks(css=css) as demo:
219
- gr.HTML(
220
- '<h1 style="height: 136px; display: flex; align-items: center; justify-content: space-around;"><span style="height: 100%; width:136px;"><img src="file/foleycrafter.png" alt="logo" style="height: 100%; width:auto; object-fit: contain; margin: 0px 0px; padding: 0px 0px;"></span><strong style="font-size: 36px;">FoleyCrafter: Bring Silent Videos to Life with Lifelike and Synchronized Sounds</strong></h1>'
221
- )
222
- gr.HTML(
223
- '<p id="authors" style="text-align:center; font-size:24px;"> \
224
- <a href="https://github.com/ymzhang0319">Yiming Zhang</a><sup>1</sup>,&nbsp \
225
- <a href="https://github.com/VocodexElysium">Yicheng Gu</a><sup>2</sup>,&nbsp \
226
- <a href="https://zengyh1900.github.io/">Yanhong Zeng</a><sup>1 †</sup>,&nbsp \
227
- <a href="https://github.com/LeoXing1996/">Zhening Xing</a><sup>1</sup>,&nbsp \
228
- <a href="https://github.com/HeCheng0625">Yuancheng Wang</a><sup>2</sup>,&nbsp \
229
- <a href="https://drwuz.com/">Zhizheng Wu</a><sup>2</sup>,&nbsp \
230
- <a href="https://chenkai.site/">Kai Chen</a><sup>1 †</sup>\
231
- <br>\
232
- <span>\
233
- <sup>1</sup>Shanghai AI Laboratory &nbsp;&nbsp;&nbsp;\
234
- <sup>2</sup>Chinese University of Hong Kong, Shenzhen &nbsp;&nbsp;&nbsp;\
235
- †Corresponding author\
236
- </span>\
237
- </p>'
238
- )
239
  with gr.Row():
240
- gr.Markdown(
241
- "<div align='center'><font size='5'><a href='https://foleycrafter.github.io/'>Project Page</a> &ensp;" # noqa
242
- "<a href='https://arxiv.org/abs/2407.01494/'>Paper</a> &ensp;"
243
- "<a href='https://github.com/open-mmlab/foleycrafter'>Code</a> &ensp;"
244
- "<a href='https://huggingface.co/spaces/ymzhang319/FoleyCrafter'>Demo</a> </font></div>"
245
- )
246
 
247
  with gr.Column(variant="panel"):
248
  with gr.Row(equal_height=False):
@@ -280,16 +255,6 @@ with gr.Blocks(css=css) as demo:
280
  with gr.Column():
281
  result_video = gr.Video(label="Generated Audio", interactive=False)
282
  with gr.Row():
283
- gr.Markdown(
284
- "<div style='word-spacing: 6px;'><font size='5'><b>Tips</b>: <br> \
285
- 1. With strong temporal visual cues in input video, you can scale up the <b>Temporal Align Scale</b>. <br>\
286
- 2. <b>Visual content scale</b> is the level of semantic alignment with visual content.</font></div> \
287
- ")
288
- # gr.HTML(
289
- # '<p style="font-size: 16px;">**Tips**: <br> \
290
- # 1. With strong temporal visual cues in input video, you can scale up the **Temporal Align Scale**. <br>\
291
- # 2. **Visual content scale** is the level of semantic alignment with visual content.</p> \
292
- # ')
293
 
294
  generate_button.click(
295
  fn=controller.foley,
 
216
  device = "cuda" if torch.cuda.is_available() else "cpu"
217
 
218
  with gr.Blocks(css=css) as demo:
219
+
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
220
  with gr.Row():
 
 
 
 
 
 
221
 
222
  with gr.Column(variant="panel"):
223
  with gr.Row(equal_height=False):
 
255
  with gr.Column():
256
  result_video = gr.Video(label="Generated Audio", interactive=False)
257
  with gr.Row():
 
 
 
 
 
 
 
 
 
 
258
 
259
  generate_button.click(
260
  fn=controller.foley,