Spaces:

mrdbourke
/

trashify_demo_v1

Running

App Files Files Community

mrdbourke committed on Nov 16, 2024

Commit

675f436

verified ·

1 Parent(s): 2d1114b

Uploading Trashify box detection model app.py

Browse files

Files changed (8) hide show

.gitattributes +1 -0
.gradio/cached_examples/18/Image Output/66ec734ca428ae2384f6/image.webp +0 -0
.gradio/cached_examples/18/Image Output/92cc1241b9494671fc05/image.webp +0 -0
.gradio/cached_examples/18/log.csv +3 -0
app.py +74 -16
examples/trashify_example_1.jpeg +0 -0
examples/trashify_example_2.jpeg +3 -0
requirements.txt +1 -1

.gitattributes CHANGED Viewed

@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text

 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text
+examples/trashify_example_2.jpeg filter=lfs diff=lfs merge=lfs -text

.gradio/cached_examples/18/Image Output/66ec734ca428ae2384f6/image.webp ADDED Viewed

.gradio/cached_examples/18/Image Output/92cc1241b9494671fc05/image.webp ADDED Viewed

.gradio/cached_examples/18/log.csv ADDED Viewed

	@@ -0,0 +1,3 @@

+Image Output,Text Output,timestamp
+"{""path"": "".gradio/cached_examples/18/Image Output/92cc1241b9494671fc05/image.webp"", ""url"": ""/gradio_api/file=/tmp/gradio/a00bd5b7c75100f6f600a22625949c9350d2827637ab3e454535b4f44376dde0/image.webp"", ""size"": null, ""orig_name"": ""image.webp"", ""mime_type"": null, ""is_stream"": false, ""meta"": {""_type"": ""gradio.FileData""}}","'+1! Found the following items: ['trash', 'bin', 'hand', 'not_trash', 'bin'], thank you for cleaning up the area!",2024-11-16 13:55:27.991471
+"{""path"": "".gradio/cached_examples/18/Image Output/66ec734ca428ae2384f6/image.webp"", ""url"": ""/gradio_api/file=/tmp/gradio/b83f3584e66d5d7a6d26f3988d3b8c6cb39d94dd8433f94788676e9ec8c21327/image.webp"", ""size"": null, ""orig_name"": ""image.webp"", ""mime_type"": null, ""is_stream"": false, ""meta"": {""_type"": ""gradio.FileData""}}","'+1! Found the following items: ['bin', 'trash', 'hand', 'not_trash', 'not_trash'], thank you for cleaning up the area!",2024-11-16 13:55:28.113367

app.py CHANGED Viewed

@@ -1,29 +1,44 @@
 import gradio as gr
 import torch
-from PIL import Image, ImageDraw
 from transformers import AutoImageProcessor
 from transformers import AutoModelForObjectDetection
-from PIL import Image
 model_save_path = "mrdbourke/detr_finetuned_trashify_box_detector"
 image_processor = AutoImageProcessor.from_pretrained(model_save_path)
 model = AutoModelForObjectDetection.from_pretrained(model_save_path)
 id2label = model.config.id2label
-color_dict = {
-    "not_trash": "red",
     "bin": "green",
     "trash": "blue",
-    "hand": "purple"
 }
-device = "cuda" if torch.cuda.is_available() else "cpu"
-model = model.to(device)
-def predict_on_image(image, conf_threshold=0.25):
     with torch.no_grad():
         inputs = image_processor(images=[image], return_tensors="pt")
         outputs = model(**inputs.to(device))
@@ -43,6 +58,12 @@ def predict_on_image(image, conf_threshold=0.25):
     # Can return results as plotted on a PIL image (then display the image)
     draw = ImageDraw.Draw(image)
     for box, score, label in zip(results["boxes"], results["scores"], results["labels"]):
         # Create coordinates
         x, y, x2, y2 = tuple(box.tolist())
@@ -50,6 +71,7 @@ def predict_on_image(image, conf_threshold=0.25):
         # Get label_name
         label_name = id2label[label.item()]
         targ_color = color_dict[label_name]
         # Draw the rectangle
         draw.rectangle(xy=(x, y, x2, y2),
@@ -62,23 +84,59 @@ def predict_on_image(image, conf_threshold=0.25):
         # Draw the text on the image
         draw.text(xy=(x, y),
                   text=text_string_to_show,
-                  fill="white")
     # Remove the draw each time
     del draw
-    return image
 demo = gr.Interface(
     fn=predict_on_image,
     inputs=[
-        gr.Image(type="pil", label="Upload Target Image"),
         gr.Slider(minimum=0, maximum=1, value=0.25, label="Confidence Threshold")
     ],
-    outputs=gr.Image(type="pil"),
     title="🚮 Trashify Object Detection Demo",
-    description="Upload an image to detect whether there's a bin, a hand or trash in it."
 )
-if __name__ == "__main__":
-    demo.launch()

 import gradio as gr
 import torch
+from PIL import Image, ImageDraw, ImageFont
 from transformers import AutoImageProcessor
 from transformers import AutoModelForObjectDetection
+# Note: model_save_path can point at a Hugging Face Hub repo or at a local path
 model_save_path = "mrdbourke/detr_finetuned_trashify_box_detector"
+# Load the model and its matching image preprocessor from model_save_path
 image_processor = AutoImageProcessor.from_pretrained(model_save_path)
 model = AutoModelForObjectDetection.from_pretrained(model_save_path)
+# Use the GPU when torch reports one is available, otherwise fall back to the CPU
+device = "cuda" if torch.cuda.is_available() else "cpu"
+model = model.to(device)
+# Get the id2label dictionary from the model (maps predicted class ids to label names)
 id2label = model.config.id2label
+# Set up a colour dictionary for plotting boxes with different colours
+# Keys are label names; predict_on_image looks labels up with color_dict[label_name],
+# so any label name produced via id2label that is missing here raises a KeyError
+color_dict = {
     "bin": "green",
     "trash": "blue",
+    "hand": "purple",
+    "trash_arm": "yellow",
+    "not_trash": "red",
+    "not_bin": "red",
+    "not_hand": "red",
 }
+# Create helper functions for seeing if items from one list are in another
+def any_in_list(list_a, list_b):
+    """Return True if at least one item of list_a is also in list_b, otherwise False.
+
+    An empty list_a gives False, because any() of an empty iterable is False.
+    """
+    return any(item in list_b for item in list_a)
+def all_in_list(list_a, list_b):
+    """Return True if every item of list_a is also in list_b, otherwise False.
+
+    An empty list_a gives True, because all() of an empty iterable is True.
+    """
+    return all(item in list_b for item in list_a)
+def predict_on_image(image, conf_threshold):
+    """Detect objects in an image, draw them on it and return a status message.
+
+    Runs the module-level image_processor and model on the image without
+    tracking gradients, draws a box and a text label for every detection
+    onto the passed-in image via ImageDraw.Draw(image), and builds a message
+    saying whether all of "trash", "bin" and "hand" were detected.
+
+    NOTE(review): this diff view omits unchanged lines, including where
+    `results` and `text_string_to_show` are defined and the remaining
+    arguments of draw.rectangle. Presumably conf_threshold is applied in the
+    omitted post-processing step -- confirm against the full file.
+
+    Args:
+        image: Image to run detection on. The Gradio input is declared with
+            type="pil", so this is expected to be a PIL image.
+        conf_threshold: Confidence threshold chosen in the UI. In the lines
+            shown here it is only used inside the "nothing detected" message.
+
+    Returns:
+        A tuple (image, return_string): the same image object with the
+        detections drawn on it, and the message describing the result.
+
+    Raises:
+        KeyError: If a detected label name has no entry in color_dict.
+    """
     with torch.no_grad():
         inputs = image_processor(images=[image], return_tensors="pt")
         outputs = model(**inputs.to(device))
     # Can return results as plotted on a PIL image (then display the image)
     draw = ImageDraw.Draw(image)
+    # Get a font from ImageFont
+    # NOTE(review): the size argument is only accepted by recent Pillow releases -- confirm the installed version
+    font = ImageFont.load_default(size=20)
+    # Collect the label name of every detection so they can be listed in the returned message
+    class_name_text_labels = []
     for box, score, label in zip(results["boxes"], results["scores"], results["labels"]):
         # Create coordinates
         x, y, x2, y2 = tuple(box.tolist())
         # Get label_name
         label_name = id2label[label.item()]
         targ_color = color_dict[label_name]
+        class_name_text_labels.append(label_name)
         # Draw the rectangle
         draw.rectangle(xy=(x, y, x2, y2),
         # Draw the text on the image
         draw.text(xy=(x, y),
                   text=text_string_to_show,
+                  fill="white",
+                  font=font)
     # Remove the draw each time
     del draw
+    # Setup blank string to print out
+    return_string = ""
+    # Setup list of target items to discover
+    target_items = ["trash", "bin", "hand"]
+    # If nothing was detected, or none of trash/bin/hand is among the detections, return early with a notification
+    if (len(class_name_text_labels) == 0) or not (any_in_list(list_a=target_items, list_b=class_name_text_labels)):
+        return_string = f"No trash, bin or hand detected at confidence threshold {conf_threshold}. Try another image or lowering the confidence threshold."
+        return image, return_string
+    # If only some of the target items were detected, report which ones are missing
+    elif not all_in_list(list_a=target_items, list_b=class_name_text_labels):
+        missing_items = []
+        for item in target_items:
+            if item not in class_name_text_labels:
+                missing_items.append(item)
+        return_string = f"Detected the following items: {class_name_text_labels}. But missing the following in order to get +1: {missing_items}. If this is an error, try altering the confidence threshold."
+    # If all three target items (trash, bin, hand) were detected, award +1
+    # (this check and the elif branch above cannot both be true for the same detections)
+    if all_in_list(list_a=target_items, list_b=class_name_text_labels):
+        return_string = f"+1! Found the following items: {class_name_text_labels}, thank you for cleaning up the area!"
+    print(return_string)
+    return image, return_string
+# Create the interface
+# The two inputs (image, confidence threshold) are passed to predict_on_image in order,
+# and the two outputs receive its returned (image, return_string) tuple
 demo = gr.Interface(
     fn=predict_on_image,
     inputs=[
+        gr.Image(type="pil", label="Target Image"),
         gr.Slider(minimum=0, maximum=1, value=0.25, label="Confidence Threshold")
     ],
+    outputs=[
+        gr.Image(type="pil", label="Image Output"),
+        gr.Text(label="Text Output")
+    ],
     title="🚮 Trashify Object Detection Demo",
+    description="Help clean up your local area! Upload an image and get +1 if there is all of the following items detected: trash, bin, hand.",
+    # Examples come in the form of a list of lists, where each inner list contains elements to prefill the `inputs` parameter with
+    examples=[
+        ["examples/trashify_example_1.jpeg", 0.25],
+        ["examples/trashify_example_2.jpeg", 0.25]
+    ],
+    # NOTE(review): presumably this is what produced the .gradio/cached_examples files added in this commit -- confirm
+    cache_examples=True
 )
+# Launch the demo
+# Note: this now runs at module level; the previous version only launched under `if __name__ == "__main__":`
+demo.launch()

examples/trashify_example_1.jpeg ADDED Viewed

examples/trashify_example_2.jpeg ADDED Viewed

Git LFS Details

SHA256: 89ed8acec03b7890e5d2e6fa509c7e842e70a6dd9f6ad4e37d5d1431a1081be7
Pointer size: 132 Bytes
Size of remote file: 1.07 MB

requirements.txt CHANGED Viewed

@@ -1,4 +1,4 @@
 gradio
 torch
 transformers
-timm

+timm
 gradio
 torch
 transformers