Spaces:
Running
on
Zero
Running
on
Zero
disc
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- app.py +1 -2
- examples/barsik.jpg +0 -0
- examples/barsik.json +0 -7
- examples/biennale.jpg +0 -0
- examples/biennale.json +0 -7
- examples/billard1.jpg +0 -0
- examples/billard1.json +0 -7
- examples/billard2.jpg +0 -0
- examples/billard2.json +0 -7
- examples/bowie.jpg +0 -0
- examples/bowie.json +0 -7
- examples/branch.jpg +0 -0
- examples/branch.json +0 -7
- examples/cc_fox.jpg +0 -0
- examples/cc_fox.json +0 -7
- examples/cc_landscape.jpg +0 -0
- examples/cc_landscape.json +0 -7
- examples/cc_puffin.jpg +0 -0
- examples/cc_puffin.json +0 -7
- examples/couch.jpg +0 -0
- examples/couch.json +0 -7
- examples/couch_.json +0 -7
- examples/cups.jpg +0 -0
- examples/cups.json +0 -7
- examples/dice.jpg +0 -0
- examples/dice.json +0 -7
- examples/emu.jpg +0 -0
- examples/emu.json +0 -7
- examples/fridge.jpg +0 -0
- examples/fridge.json +0 -7
- examples/givt.jpg +0 -0
- examples/givt.json +0 -7
- examples/greenlake.jpg +0 -0
- examples/greenlake.json +0 -7
- examples/howto.jpg +0 -0
- examples/howto.json +0 -7
- examples/markers.jpg +0 -0
- examples/markers.json +0 -7
- examples/mcair.jpg +0 -0
- examples/mcair.json +0 -7
- examples/mcair_.json +0 -7
- examples/minergie.jpg +0 -0
- examples/minergie.json +0 -7
- examples/morel.jpg +0 -0
- examples/morel.json +0 -7
- examples/motorcyclists.jpg +0 -0
- examples/motorcyclists.json +0 -7
- examples/parking.jpg +0 -0
- examples/parking.json +0 -7
- examples/password.jpg +0 -0
app.py
CHANGED
@@ -58,7 +58,7 @@ def parse_segmentation(input_image, input_text):
|
|
58 |
######## Demo
|
59 |
|
60 |
INTRO_TEXT = """## PaliGemma WaveUI\n\n
|
61 |
-
|
62 |
"""
|
63 |
|
64 |
|
@@ -71,7 +71,6 @@ with gr.Blocks(css="style.css") as demo:
|
|
71 |
annotated_image = gr.AnnotatedImage(label="Output")
|
72 |
|
73 |
examples = [["./airbnb.jpg", "detect 'Amazing pools' button"]]
|
74 |
-
gr.Markdown("Example images are licensed CC0 by [akolesnikoff@](https://github.com/akolesnikoff), [mbosnjak@](https://github.com/mbosnjak), [maximneumann@](https://github.com/maximneumann) and [merve](https://huggingface.co/merve).")
|
75 |
gr.Examples(
|
76 |
examples=examples,
|
77 |
inputs=[image, seg_input],
|
|
|
58 |
######## Demo
|
59 |
|
60 |
INTRO_TEXT = """## PaliGemma WaveUI\n\n
|
61 |
+
PaliGemma 448 fine-tuned on WaveUI dataset for UI element detection
|
62 |
"""
|
63 |
|
64 |
|
|
|
71 |
annotated_image = gr.AnnotatedImage(label="Output")
|
72 |
|
73 |
examples = [["./airbnb.jpg", "detect 'Amazing pools' button"]]
|
|
|
74 |
gr.Examples(
|
75 |
examples=examples,
|
76 |
inputs=[image, seg_input],
|
examples/barsik.jpg
DELETED
Binary file (88.6 kB)
|
|
examples/barsik.json
DELETED
@@ -1,7 +0,0 @@
|
|
1 |
-
{
|
2 |
-
"name": "barsik",
|
3 |
-
"comment": "",
|
4 |
-
"model": "paligemma-3b-mix-224",
|
5 |
-
"prompt": "segment cat",
|
6 |
-
"license": "CC0 by [maximneumann@](https://github.com/maximneumann)"
|
7 |
-
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
examples/biennale.jpg
DELETED
Binary file (56.9 kB)
|
|
examples/biennale.json
DELETED
@@ -1,7 +0,0 @@
|
|
1 |
-
{
|
2 |
-
"name": "biennale",
|
3 |
-
"comment": "",
|
4 |
-
"model": "paligemma-3b-mix-224",
|
5 |
-
"prompt": "In which city is this?",
|
6 |
-
"license": "CC0 by [andsteing@](https://huggingface.co/andsteing)"
|
7 |
-
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
examples/billard1.jpg
DELETED
Binary file (91.1 kB)
|
|
examples/billard1.json
DELETED
@@ -1,7 +0,0 @@
|
|
1 |
-
{
|
2 |
-
"name": "billard1",
|
3 |
-
"comment": "",
|
4 |
-
"model": "paligemma-3b-mix-224",
|
5 |
-
"prompt": "How many red balls are there?",
|
6 |
-
"license": "CC0 by [mbosnjak@](https://github.com/mbosnjak)"
|
7 |
-
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
examples/billard2.jpg
DELETED
Binary file (86.7 kB)
|
|
examples/billard2.json
DELETED
@@ -1,7 +0,0 @@
|
|
1 |
-
{
|
2 |
-
"name": "billard2",
|
3 |
-
"comment": "",
|
4 |
-
"model": "paligemma-3b-mix-224",
|
5 |
-
"prompt": "How many balls are there?",
|
6 |
-
"license": "CC0 by [mbosnjak@](https://github.com/mbosnjak)"
|
7 |
-
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
examples/bowie.jpg
DELETED
Binary file (78.4 kB)
|
|
examples/bowie.json
DELETED
@@ -1,7 +0,0 @@
|
|
1 |
-
{
|
2 |
-
"name": "bowie",
|
3 |
-
"comment": "",
|
4 |
-
"model": "paligemma-3b-mix-224",
|
5 |
-
"prompt": "Who is this?",
|
6 |
-
"license": "CC0 by [akolesnikoff@](https://github.com/akolesnikoff)"
|
7 |
-
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
examples/branch.jpg
DELETED
Binary file (183 kB)
|
|
examples/branch.json
DELETED
@@ -1,7 +0,0 @@
|
|
1 |
-
{
|
2 |
-
"name": "branch",
|
3 |
-
"comment": "",
|
4 |
-
"model": "paligemma-3b-mix-224",
|
5 |
-
"prompt": "What caused this?",
|
6 |
-
"license": "CC0 by [andsteing@](https://huggingface.co/andsteing)"
|
7 |
-
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
examples/cc_fox.jpg
DELETED
Binary file (628 kB)
|
|
examples/cc_fox.json
DELETED
@@ -1,7 +0,0 @@
|
|
1 |
-
{
|
2 |
-
"name": "cc_fox",
|
3 |
-
"comment": "",
|
4 |
-
"model": "paligemma-3b-mix-448",
|
5 |
-
"prompt": "Which breed is this fox?",
|
6 |
-
"license": "CC0 by [XiaohuaZhai@](https://sites.google.com/view/xzhai)"
|
7 |
-
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
examples/cc_landscape.jpg
DELETED
Binary file (476 kB)
|
|
examples/cc_landscape.json
DELETED
@@ -1,7 +0,0 @@
|
|
1 |
-
{
|
2 |
-
"name": "cc_landscape",
|
3 |
-
"comment": "",
|
4 |
-
"model": "paligemma-3b-mix-448",
|
5 |
-
"prompt": "What does the image show?",
|
6 |
-
"license": "CC0 by [XiaohuaZhai@](https://sites.google.com/view/xzhai)"
|
7 |
-
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
examples/cc_puffin.jpg
DELETED
Binary file (676 kB)
|
|
examples/cc_puffin.json
DELETED
@@ -1,7 +0,0 @@
|
|
1 |
-
{
|
2 |
-
"name": "cc_puffin",
|
3 |
-
"comment": "",
|
4 |
-
"model": "paligemma-3b-mix-448",
|
5 |
-
"prompt": "detect puffin in the back; puffin in front",
|
6 |
-
"license": "CC0 by [XiaohuaZhai@](https://sites.google.com/view/xzhai)"
|
7 |
-
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
examples/couch.jpg
DELETED
Binary file (91 kB)
|
|
examples/couch.json
DELETED
@@ -1,7 +0,0 @@
|
|
1 |
-
{
|
2 |
-
"name": "couch",
|
3 |
-
"comment": "",
|
4 |
-
"model": "paligemma-3b-mix-224",
|
5 |
-
"prompt": "How many yellow cushions are on the couch?",
|
6 |
-
"license": "CC0"
|
7 |
-
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
examples/couch_.json
DELETED
@@ -1,7 +0,0 @@
|
|
1 |
-
{
|
2 |
-
"name": "couch",
|
3 |
-
"comment": "",
|
4 |
-
"model": "paligemma-3b-mix-224",
|
5 |
-
"prompt": "How many painting do you see in the image?",
|
6 |
-
"license": "CC0"
|
7 |
-
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
examples/cups.jpg
DELETED
Binary file (59.2 kB)
|
|
examples/cups.json
DELETED
@@ -1,7 +0,0 @@
|
|
1 |
-
{
|
2 |
-
"name": "cups",
|
3 |
-
"comment": "",
|
4 |
-
"model": "paligemma-3b-mix-224",
|
5 |
-
"prompt": "how many cups?",
|
6 |
-
"license": "CC0 by [mbosnjak@](https://github.com/mbosnjak)"
|
7 |
-
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
examples/dice.jpg
DELETED
Binary file (118 kB)
|
|
examples/dice.json
DELETED
@@ -1,7 +0,0 @@
|
|
1 |
-
{
|
2 |
-
"name": "dice",
|
3 |
-
"comment": "",
|
4 |
-
"model": "paligemma-3b-mix-224",
|
5 |
-
"prompt": "segment dice ; dice",
|
6 |
-
"license": "CC0 by [andresusanopinto@](https://github.com/andresusanopinto)"
|
7 |
-
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
examples/emu.jpg
DELETED
Binary file (212 kB)
|
|
examples/emu.json
DELETED
@@ -1,7 +0,0 @@
|
|
1 |
-
{
|
2 |
-
"name": "emu",
|
3 |
-
"comment": "",
|
4 |
-
"model": "paligemma-3b-mix-224",
|
5 |
-
"prompt": "What animal is this?",
|
6 |
-
"license": "CC0 by [akolesnikoff@](https://github.com/akolesnikoff)"
|
7 |
-
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
examples/fridge.jpg
DELETED
Binary file (37 kB)
|
|
examples/fridge.json
DELETED
@@ -1,7 +0,0 @@
|
|
1 |
-
{
|
2 |
-
"name": "fridge",
|
3 |
-
"comment": "",
|
4 |
-
"model": "paligemma-3b-mix-224",
|
5 |
-
"prompt": "Describe the image.",
|
6 |
-
"license": "CC0 by [andresusanopinto@](https://github.com/andresusanopinto)"
|
7 |
-
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
examples/givt.jpg
DELETED
Binary file (35.7 kB)
|
|
examples/givt.json
DELETED
@@ -1,7 +0,0 @@
|
|
1 |
-
{
|
2 |
-
"name": "givt",
|
3 |
-
"comment": "",
|
4 |
-
"model": "paligemma-3b-mix-224",
|
5 |
-
"prompt": "What does the image show?",
|
6 |
-
"license": "CC-BY [GIVT paper](https://arxiv.org/abs/2312.02116)"
|
7 |
-
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
examples/greenlake.jpg
DELETED
Binary file (153 kB)
|
|
examples/greenlake.json
DELETED
@@ -1,7 +0,0 @@
|
|
1 |
-
{
|
2 |
-
"name": "greenlake",
|
3 |
-
"comment": "",
|
4 |
-
"model": "paligemma-3b-mix-224",
|
5 |
-
"prompt": "Describe the image.",
|
6 |
-
"license": "CC0 by [akolesnikoff@](https://github.com/akolesnikoff)"
|
7 |
-
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
examples/howto.jpg
DELETED
Binary file (45.8 kB)
|
|
examples/howto.json
DELETED
@@ -1,7 +0,0 @@
|
|
1 |
-
{
|
2 |
-
"name": "howto",
|
3 |
-
"comment": "",
|
4 |
-
"model": "paligemma-3b-mix-224",
|
5 |
-
"prompt": "What does this image show?",
|
6 |
-
"license": "CC-BY [How to train your ViT?](https://arxiv.org/abs/2106.10270)"
|
7 |
-
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
examples/markers.jpg
DELETED
Binary file (89.4 kB)
|
|
examples/markers.json
DELETED
@@ -1,7 +0,0 @@
|
|
1 |
-
{
|
2 |
-
"name": "markers",
|
3 |
-
"comment": "answer en How many cups are there?",
|
4 |
-
"model": "paligemma-3b-mix-224",
|
5 |
-
"prompt": "How many cups are there?",
|
6 |
-
"license": "CC0"
|
7 |
-
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
examples/mcair.jpg
DELETED
Binary file (67.3 kB)
|
|
examples/mcair.json
DELETED
@@ -1,7 +0,0 @@
|
|
1 |
-
{
|
2 |
-
"name": "mcair",
|
3 |
-
"comment": "",
|
4 |
-
"model": "paligemma-3b-mix-224",
|
5 |
-
"prompt": "Can you board this airplane?",
|
6 |
-
"license": "CC0 by [akolesnikoff@](https://github.com/akolesnikoff)"
|
7 |
-
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
examples/mcair_.json
DELETED
@@ -1,7 +0,0 @@
|
|
1 |
-
{
|
2 |
-
"name": "mcair",
|
3 |
-
"comment": "",
|
4 |
-
"model": "paligemma-3b-mix-224",
|
5 |
-
"prompt": "Is this a restaurant?",
|
6 |
-
"license": "CC0 by [akolesnikoff@](https://github.com/akolesnikoff)"
|
7 |
-
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
examples/minergie.jpg
DELETED
Binary file (163 kB)
|
|
examples/minergie.json
DELETED
@@ -1,7 +0,0 @@
|
|
1 |
-
{
|
2 |
-
"name": "minergie",
|
3 |
-
"comment": "",
|
4 |
-
"model": "paligemma-3b-mix-224",
|
5 |
-
"prompt": "ocr",
|
6 |
-
"license": "CC0 by [andsteing@](https://huggingface.co/andsteing)"
|
7 |
-
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
examples/morel.jpg
DELETED
Binary file (151 kB)
|
|
examples/morel.json
DELETED
@@ -1,7 +0,0 @@
|
|
1 |
-
{
|
2 |
-
"name": "morel",
|
3 |
-
"comment": "",
|
4 |
-
"model": "paligemma-3b-mix-224",
|
5 |
-
"prompt": "detect morel",
|
6 |
-
"license": "CC0 by [andsteing@](https://huggingface.co/andsteing)"
|
7 |
-
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
examples/motorcyclists.jpg
DELETED
Binary file (105 kB)
|
|
examples/motorcyclists.json
DELETED
@@ -1,7 +0,0 @@
|
|
1 |
-
{
|
2 |
-
"name": "motorcyclists",
|
3 |
-
"comment": "",
|
4 |
-
"model": "paligemma-3b-mix-224",
|
5 |
-
"prompt": "What does the image show?",
|
6 |
-
"license": "CC0 by [akolesnikoff@](https://github.com/akolesnikoff)"
|
7 |
-
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
examples/parking.jpg
DELETED
Binary file (52.7 kB)
|
|
examples/parking.json
DELETED
@@ -1,7 +0,0 @@
|
|
1 |
-
{
|
2 |
-
"name": "parking",
|
3 |
-
"comment": "",
|
4 |
-
"model": "paligemma-3b-mix-224",
|
5 |
-
"prompt": "Describe the image.",
|
6 |
-
"license": "CC0 by [xiaohuazhai@](https://huggingface.co/xiaohuazhai)"
|
7 |
-
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
examples/password.jpg
DELETED
Binary file (66.4 kB)
|
|