d22cs051 committed
Commit
aa1f5e1
·
1 Parent(s): d779e14

base app upload

.gitattributes CHANGED
@@ -32,3 +32,6 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
  *.zip filter=lfs diff=lfs merge=lfs -text
  *.zst filter=lfs diff=lfs merge=lfs -text
  *tfevents* filter=lfs diff=lfs merge=lfs -text
+ examples/IMG_6093.JPG filter=lfs diff=lfs merge=lfs -text
+ examples/IMG_6111.JPG filter=lfs diff=lfs merge=lfs -text
+ examples/IMG_7047.JPG filter=lfs diff=lfs merge=lfs -text
app.py ADDED
@@ -0,0 +1,135 @@
+ ### 1. Imports and class names setup ###
+ import gradio as gr
+ import os
+ import torch
+ from PIL import Image
+ from matplotlib import pyplot as plt
+
+ from timeit import default_timer as timer
+ from typing import Tuple
+
+ from models import get_detr, get_maskformer
+
+ # Set device
+ device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
+
+
+ ### 2. Model and transforms preparation ###
+
+ # Map each model name to the factory function that builds it
+ model_name_to_fn = {
+     "detr": get_detr,
+     "maskformer": get_maskformer,
+ }
+
+
+ ### 3. Predict function ###
+
+
+ # Create predict function
+ def predict(image, model_name: str = "detr") -> Tuple[Image.Image, float]:
+     """
+     Desc: Performs a panoptic segmentation prediction on an image and returns the prediction and the time taken.
+     Args:
+         image (PIL.Image): Image to perform prediction on.
+         model_name (str): Name of the model to use for prediction.
+     Returns:
+         Tuple[PIL.Image, float]: Tuple containing the predicted panoptic segmentation map and the time taken to perform the prediction.
+     """
+     # Start the timer
+     start_time = timer()
+
+     # Get the model function based on the model name
+     model_fn = model_name_to_fn[model_name]
+
+     # Create the model and load its weights
+     model, processor = model_fn()
+     model = model.to(device)
+
+     # Put model into evaluation mode
+     model.eval()
+
+     if model_name == "detr":
+         inputs = processor(images=image, return_tensors="pt")
+         inputs = inputs.to(device)
+         # Forward pass with inference mode on (no gradients)
+         with torch.inference_mode():
+             outputs = model(**inputs)
+         print("Output Generated!")
+
+         # Use the `post_process_panoptic_segmentation` method of the processor to retrieve
+         # post-processed panoptic segmentation maps; results are returned as a list of
+         # dictionaries, one per input image
+         result = processor.post_process_panoptic_segmentation(outputs, target_sizes=[(image.height, image.width)])
+         print("Output Post Processing Done!")
+
+         # A tensor of shape (height, width) where each value denotes a segment id,
+         # filled with -1 where no segment is found
+         panoptic_seg = result[0]["segmentation"]
+         # Save the segment-id map as a colormapped PNG, then reload it as a PIL image
+         plt.imsave("predicted_panoptic_map.png", panoptic_seg.cpu().numpy(), cmap="viridis")
+         output = Image.open("predicted_panoptic_map.png")
+
+     elif model_name == "maskformer":
+         inputs = processor(images=image, return_tensors="pt")
+         inputs = inputs.to(device)
+         with torch.inference_mode():
+             outputs = model(**inputs)
+         # The model predicts class_queries_logits of shape `(batch_size, num_queries)`
+         # and masks_queries_logits of shape `(batch_size, num_queries, height, width)`
+         class_queries_logits = outputs.class_queries_logits
+         masks_queries_logits = outputs.masks_queries_logits
+
+         # Pass the raw outputs to the processor for postprocessing
+         result = processor.post_process_panoptic_segmentation(outputs, target_sizes=[image.size[::-1]])[0]
+         # See the demo notebooks for visualization (the "Resources" section in the MaskFormer docs)
+         predicted_panoptic_map = result["segmentation"]
+         plt.imsave("predicted_panoptic_map.png", predicted_panoptic_map.cpu().numpy(), cmap="viridis")
+         output = Image.open("predicted_panoptic_map.png")
+
+     # Calculate the prediction time
+     pred_time = round(timer() - start_time, 5)
+
+     # Return the predicted map and prediction time
+     print("Returning Results!")
+     return output, pred_time
+
+
+ ### 4. Gradio app ###
+
+ # Create title, description and article strings
+ title = "Segmentation Demo"
+ description = "A multi-model panoptic segmentation demo"
+ article = ""
+
+ # Create examples list from the "examples/" directory
+ example_list = [["examples/" + example] for example in os.listdir("examples")]
+
+ # Create the Gradio demo
+ model_selection_dropdown = gr.components.Dropdown(
+     choices=list(model_name_to_fn.keys()),
+     label="Select a model",
+     value="detr",
+ )
+
+ demo = gr.Interface(
+     fn=predict,  # mapping function from inputs to outputs
+     inputs=[gr.Image(type="pil"), model_selection_dropdown],  # what are the inputs?
+     outputs=[
+         gr.Image(label="Mask"),  # what are the outputs?
+         gr.Number(label="Prediction time (s)"),
+     ],  # our fn has two outputs, therefore we have two outputs
+     examples=example_list,
+     title=title,
+     description=description,
+     article=article,
+ )
+
+ # Launch the demo!
+ demo.launch(
+     debug=True,
+     server_port=7860,
+     server_name="0.0.0.0",
+ )
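
A quick way to sanity-check the DETR path without launching the Gradio UI is a short script along the lines of the sketch below. It is a minimal sketch, assuming the dependencies from requirements.txt are installed, Hub access for the pretrained weights, and that the examples/ directory from this commit is present:

import torch
from PIL import Image

from models import get_detr

# Load the pretrained DETR panoptic model and its matching processor
model, processor = get_detr()
model.eval()

image = Image.open("examples/IMG_6093.JPG")
inputs = processor(images=image, return_tensors="pt")
with torch.inference_mode():
    outputs = model(**inputs)

# One result dict per input image; "segmentation" is a (height, width) tensor of segment ids
result = processor.post_process_panoptic_segmentation(
    outputs, target_sizes=[(image.height, image.width)]
)[0]
print(result["segmentation"].shape)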
examples/IMG_6093.JPG ADDED

Git LFS Details

  • SHA256: 687e914608784ba79e086ee0c91829b4a68c9e78506023d5cb11cc44d2fdfc5f
  • Pointer size: 133 Bytes
  • Size of remote file: 14.1 MB
examples/IMG_6111.JPG ADDED

Git LFS Details

  • SHA256: d94681e7fa8e6463431f25c4822ca2d1786a96e4316a92dbabee70fb42b906ab
  • Pointer size: 133 Bytes
  • Size of remote file: 18.1 MB
examples/IMG_7047.JPG ADDED

Git LFS Details

  • SHA256: f8e13549ae21af65a833de0aa690be82481ab50b529091def3dddde95170b27c
  • Pointer size: 133 Bytes
  • Size of remote file: 12.6 MB
models.py ADDED
@@ -0,0 +1,14 @@
+ from transformers import AutoImageProcessor, DetrForSegmentation
+ from transformers import MaskFormerFeatureExtractor, MaskFormerForInstanceSegmentation
+
+
+ def get_detr():
+     # DETR panoptic-segmentation checkpoint and its matching image processor
+     image_processor = AutoImageProcessor.from_pretrained("facebook/detr-resnet-50-panoptic")
+     model = DetrForSegmentation.from_pretrained("facebook/detr-resnet-50-panoptic")
+     return model, image_processor
+
+
+ def get_maskformer():
+     # MaskFormer (Swin-small, COCO) checkpoint and its feature extractor
+     feature_extractor = MaskFormerFeatureExtractor.from_pretrained("facebook/maskformer-swin-small-coco")
+     model = MaskFormerForInstanceSegmentation.from_pretrained("facebook/maskformer-swin-small-coco")
+     return model, feature_extractor
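
Both factories return a (model, processor) pair so app.py can treat them interchangeably. A minimal sketch of exercising that contract, assuming Hub access for the pretrained weights:

from models import get_detr, get_maskformer

# Verify both factories load and return the expected pair
for name, factory in [("detr", get_detr), ("maskformer", get_maskformer)]:
    model, processor = factory()
    print(name, type(model).__name__, type(processor).__name__)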
requirements.txt ADDED
@@ -0,0 +1,4 @@
+ torch
+ torchvision
+ gradio
+ transformers[torch]