Spaces:

sakshee05
/

langSAM

Sleeping

App Files Files Community

sakshee05 commited on Feb 24

Commit

70ae50f

verified ·

1 Parent(s): 1085ce5

add sam2 endpoint

Browse files

Files changed (1) hide show

main.py +69 -4

main.py CHANGED Viewed

@@ -14,6 +14,10 @@ import io
 import numpy as np
 from lang_sam import LangSAM
 import supervision as sv
 app = FastAPI()
@@ -30,13 +34,36 @@ app.add_middleware(
 os.makedirs("/tmp/huggingface", exist_ok=True)
 os.makedirs("/tmp/torch", exist_ok=True)
-# Load the segmentation model
-model = LangSAM()
 @app.get("/")
 async def root():
     return {"message": "LangSAM API is running!"}
 def draw_image(image_rgb, masks, xyxy, probs, labels):
     mask_annotator = sv.MaskAnnotator()
     # Create class_id for each unique label
@@ -54,13 +81,51 @@ def draw_image(image_rgb, masks, xyxy, probs, labels):
     annotated_image = mask_annotator.annotate(scene=image_rgb.copy(), detections=detections)
     return annotated_image
-@app.post("/segment/")
 async def segment_image(file: UploadFile = File(...), text_prompt: str = Form(...)):
     image_bytes = await file.read()
     image_pil = Image.open(io.BytesIO(image_bytes)).convert("RGB")
     # Run segmentation
-    results = model.predict([image_pil], [text_prompt])
     # Convert to NumPy array
     image_array = np.asarray(image_pil)

 import numpy as np
 from lang_sam import LangSAM
 import supervision as sv
+from sam2.build_sam import build_sam2
+from sam2.sam2_image_predictor import SAM2ImagePredictor
+import torch
+import cv2
 app = FastAPI()
 os.makedirs("/tmp/huggingface", exist_ok=True)
 os.makedirs("/tmp/torch", exist_ok=True)
+# Load the langSAM model
+langsam_model = LangSAM()
+# Load SAM2 Model
+sam2_checkpoint = "sam2.1_hiera_small.pt"
+model_cfg = "configs/sam2.1/sam2.1_hiera_s.yaml"
+device = torch.device("cpu")
+sam2_model = build_sam2(model_cfg, sam2_checkpoint, device=device)
+predictor = SAM2ImagePredictor(sam2_model)
 @app.get("/")
 async def root():
     return {"message": "LangSAM API is running!"}
+def apply_mask(image, mask):
+    """Overlay mask on image."""
+    mask = mask.astype(np.uint8) * 255  # Convert mask to 0-255 scale
+    mask_colored = np.zeros((*mask.shape, 3), dtype=np.uint8)
+    mask_colored[mask > 0] = [30, 144, 255]  # Blue color for the mask
+    # Add contour
+    contours, _ = cv2.findContours(mask, cv2.RETR_EXTERNAL, cv2.CHAIN_APPROX_SIMPLE)
+    cv2.drawContours(mask_colored, contours, -1, (255, 255, 255), thickness=2)
+    # Blend with original image
+    overlay = cv2.addWeighted(image, 0.7, mask_colored, 0.3, 0)
+    return overlay
 def draw_image(image_rgb, masks, xyxy, probs, labels):
     mask_annotator = sv.MaskAnnotator()
     # Create class_id for each unique label
     annotated_image = mask_annotator.annotate(scene=image_rgb.copy(), detections=detections)
     return annotated_image
+@app.post("/segment/sam2")
+async def segment_image(
+    file: UploadFile = File(...),
+    x: int = Form(...),
+    y: int = Form(...)
+):
+    """Segment image using SAM2 with a single input point."""
+    image_bytes = await file.read()
+    image_pil = Image.open(io.BytesIO(image_bytes)).convert("RGB")
+    image_array = np.array(image_pil)
+    predictor.set_image(image_array)
+    input_point = np.array([[x, y]])
+    input_label = np.array([1])  # Foreground point
+    # Run SAM2 model
+    masks, scores, logits = predictor.predict(
+        point_coords=input_point,
+        point_labels=input_label,
+        multimask_output=True,
+    )
+    # Get top mask
+    top_mask = masks[np.argmax(scores)]
+    # Apply mask overlay
+    output_image = apply_mask(image_array, top_mask)
+    # Convert to PNG
+    output_pil = Image.fromarray(output_image)
+    img_io = io.BytesIO()
+    output_pil.save(img_io, format="PNG")
+    img_io.seek(0)
+    return Response(content=img_io.getvalue(), media_type="image/png")
+@app.post("/segment/langsam")
 async def segment_image(file: UploadFile = File(...), text_prompt: str = Form(...)):
     image_bytes = await file.read()
     image_pil = Image.open(io.BytesIO(image_bytes)).convert("RGB")
     # Run segmentation
+    results = langsam_model.predict([image_pil], [text_prompt])
     # Convert to NumPy array
     image_array = np.asarray(image_pil)