csuhan committed on
Commit
373528e
·
1 Parent(s): a66a8c1

Upload folder using huggingface_hub

Browse files
.gitattributes CHANGED
@@ -32,3 +32,8 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
32
  *.zip filter=lfs diff=lfs merge=lfs -text
33
  *.zst filter=lfs diff=lfs merge=lfs -text
34
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
 
32
  *.zip filter=lfs diff=lfs merge=lfs -text
33
  *.zst filter=lfs diff=lfs merge=lfs -text
34
  *tfevents* filter=lfs diff=lfs merge=lfs -text
35
+ examples/animal.png filter=lfs diff=lfs merge=lfs -text
36
+ examples/bell_ring.wav filter=lfs diff=lfs merge=lfs -text
37
+ examples/caixukun.mp4 filter=lfs diff=lfs merge=lfs -text
38
+ examples/flower.mp4 filter=lfs diff=lfs merge=lfs -text
39
+ examples/food_menu.png filter=lfs diff=lfs merge=lfs -text
app.py CHANGED
@@ -200,19 +200,35 @@ def gradio_worker(
200
  with gr.Blocks(css=CSS, theme=gr.themes.Base()) as demo:
201
  gr.Markdown("## OneLLM: One Framework to Align All Modalities with Language")
202
  with gr.Row(equal_height=True):
203
- # with gr.Column(scale=1):
204
- # img_path = gr.Image(label='Image Input', type='filepath')
205
- # video_path = gr.Video(label='Video Input')
206
- # audio_path = gr.Audio(label='Audio Input', type='filepath', sources=['upload'])
207
- # modality = gr.Radio(choices=['image', 'audio', 'video'], value='image', interactive=True, label='Input Modalities', visible=False)
208
  modality = gr.Textbox(value='image', visible=False)
209
  with gr.Column(scale=1):
210
  with gr.Tab('Image') as img_tab:
211
  img_path = gr.Image(label='Image Input', type='filepath')
 
 
 
 
 
 
 
212
  with gr.Tab('Video') as video_tab:
213
  video_path = gr.Video(label='Video Input')
 
 
 
 
 
 
 
214
  with gr.Tab('Audio') as audio_tab:
215
  audio_path = gr.Audio(label='Audio Input', type='filepath', sources=['upload'])
 
 
 
 
 
 
 
216
 
217
  with gr.Column(scale=2):
218
  chatbot = gr.Chatbot(elem_id="chatbot")
 
200
  with gr.Blocks(css=CSS, theme=gr.themes.Base()) as demo:
201
  gr.Markdown("## OneLLM: One Framework to Align All Modalities with Language")
202
  with gr.Row(equal_height=True):
 
 
 
 
 
203
  modality = gr.Textbox(value='image', visible=False)
204
  with gr.Column(scale=1):
205
  with gr.Tab('Image') as img_tab:
206
  img_path = gr.Image(label='Image Input', type='filepath')
207
+ gr.Examples(
208
+ examples=[
209
+ ["examples/animal.png", "Why this image is funny?"],
210
+ ["examples/food_menu.png", "Introduce me the poster."],
211
+ ],
212
+ inputs=[img_path, msg],
213
+ )
214
  with gr.Tab('Video') as video_tab:
215
  video_path = gr.Video(label='Video Input')
216
+ gr.Examples(
217
+ examples=[
218
+ ["examples/flower.mp4", "What process does this video record?"],
219
+ ["examples/caixukun.mp4", "Describe the video in detail."],
220
+ ],
221
+ inputs=[video_path, msg],
222
+ )
223
  with gr.Tab('Audio') as audio_tab:
224
  audio_path = gr.Audio(label='Audio Input', type='filepath', sources=['upload'])
225
+ gr.Examples(
226
+ examples=[
227
+ ["examples/bell_ring.wav", "What can you hear in the audio?"],
228
+ ["examples/bird_audio.wav", "Describe the audio."],
229
+ ],
230
+ inputs=[audio_path, msg],
231
+ )
232
 
233
  with gr.Column(scale=2):
234
  chatbot = gr.Chatbot(elem_id="chatbot")
examples/animal.png ADDED

Git LFS Details

  • SHA256: 0ba055ca9485f77c577433701193d03267dce9e6d08916c44d7f3435287dca96
  • Pointer size: 132 Bytes
  • Size of remote file: 1.08 MB
examples/bell_ring.wav ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:415b5406175cafa874396f89811121fb306c17084db8ec20753ab5666b4fdcca
3
+ size 3630044
examples/bird_audio.wav ADDED
Binary file (882 kB). View file
 
examples/caixukun.mp4 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5762ad0ae954da8fbc33d524e90969b9fc56745f2ce513724e2ff40da3f1ac16
3
+ size 14008046
examples/flower.mp4 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:04f27dd2ae6f1a5cb836030983c9b423e182e6bf7de3e2138c97bf698c6f29ba
3
+ size 3139496
examples/food_menu.png ADDED

Git LFS Details

  • SHA256: bc0f838ea2a4acae6cd06a07266490ea27b7db0676f83b89ec7223c554068178
  • Pointer size: 132 Bytes
  • Size of remote file: 1.27 MB