# IMPORTS
import torch
import numpy as np
from PIL import Image
from lang_sam import LangSAM
import gradio as gr
def run_lang_sam(input_image, text_prompt, model):
image = input_image.convert("RGB").resize((512, 512))
masks, _, _, _ = model.predict(
image,
text_prompt
)
masks_int = masks.to(torch.uint8)
masks_max, _ = masks_int.max(dim=0, keepdim=True)
unified_mask = masks_max.squeeze(0).to(torch.bool)
return Image.fromarray(
(unified_mask[..., None].numpy() * np.array(image)).astype(np.uint8)
)
def setup_gradio_interface(model):
block = gr.Blocks()
with block:
gr.Markdown("
Lang SAM")
with gr.Row():
with gr.Column():
input_image = gr.Image(type="pil", label="Input Image")
text_prompt = gr.Textbox(label="Enter what you want to segment")
run_button = gr.Button(value="Run")
with gr.Column():
output_mask = gr.Image(type="numpy", label="Segmentation Mask")
run_button.click(
fn=lambda image, prompt: run_lang_sam(
image, prompt, model,
),
inputs=[input_image, text_prompt],
outputs=[output_mask],
)
gr.Examples(
examples=[["bw-image.jpeg", "road"]],
inputs=[input_image, text_prompt],
outputs=[output_mask],
fn=lambda image, prompt: run_lang_sam(
image, prompt, model,
),
cache_examples=True,
label="Try this example input!",
)
return block
if __name__ == "__main__":
model = LangSAM()
gradio_interface = setup_gradio_interface(model)
gradio_interface.launch(share=False, show_api=False, show_error=True)