mshukor HF staff committed on
Commit
48d1b07
·
1 Parent(s): 25e062c

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +2 -2
app.py CHANGED
@@ -480,11 +480,11 @@ def inference(image, audio, video, task_type, instruction):
480
  else:
481
  return None, tokens
482
 
483
- inputs = [gr.inputs.Image(type='pil'), gr.Audio(source="upload", type="filepath"), gr.Video(source="upload", type="filepath"), gr.inputs.Radio(choices=['Image Captioning', 'Visual Question Answering', 'Video Captioning', 'Audio Captioning', "Visual Grounding", "General", "General Video"], type="value", default="Image Captioning", label="Task"), gr.inputs.Textbox(lines=1, label="Instruction")]
484
  outputs = [gr.outputs.Image(type='pil'), 'text']
485
  examples = [
486
  ['examples/images/soccer.jpg', None, None, 'Image Captioning', None],
487
- ['examples/images/woman_inblack.jpg', None, None, 'Visual Question Answering', 'what does the woman wearing black do?'],
488
  ['examples/images/banana.jpg', None, None, 'Visual Grounding', 'the detached banana'],
489
  ['examples/images/skateboard.jpg', None, None, 'General', 'which region does the text " a yellow bird " describe?'],
490
  ['examples/images/baseball.jpg', None, None, 'General', 'what is this sport?'],
 
480
  else:
481
  return None, tokens
482
 
483
+ inputs = [gr.inputs.Image(type='pil'), gr.Audio(source="upload", type="filepath"), gr.Video(source="upload", type="filepath"), gr.inputs.Radio(choices=['Image Captioning', 'Video Captioning', 'Audio Captioning', "Visual Grounding", "General", "General Video"], type="value", default="Image Captioning", label="Task"), gr.inputs.Textbox(lines=1, label="Instruction")]
484
  outputs = [gr.outputs.Image(type='pil'), 'text']
485
  examples = [
486
  ['examples/images/soccer.jpg', None, None, 'Image Captioning', None],
487
+ # ['examples/images/woman_inblack.jpg', None, None, 'Visual Question Answering', 'what does the woman wearing black do?'],
488
  ['examples/images/banana.jpg', None, None, 'Visual Grounding', 'the detached banana'],
489
  ['examples/images/skateboard.jpg', None, None, 'General', 'which region does the text " a yellow bird " describe?'],
490
  ['examples/images/baseball.jpg', None, None, 'General', 'what is this sport?'],