Update app.py
app.py CHANGED
@@ -2,21 +2,19 @@ import streamlit as st
 import cv2
 import numpy as np
 import torch
-from torchvision import transforms,
+from torchvision import transforms, models
 from PIL import Image
 from TranSalNet_Res import TranSalNet
 from tqdm import tqdm
 import torch.nn as nn
 from utils.data_process import preprocess_img, postprocess_img

-# Load the model and set the device
 device = torch.device('cpu')
 model = TranSalNet()
 model.load_state_dict(torch.load('pretrained_models/TranSalNet_Res.pth', map_location=torch.device('cpu')))
 model.to(device)
 model.eval()

-# Define Streamlit app
 st.title('Saliency Detection App')
 st.write('Upload an image for saliency detection:')
 uploaded_image = st.file_uploader("Choose an image...", type=["jpg", "jpeg", "png"])
@@ -25,60 +23,59 @@ if uploaded_image:
     image = Image.open(uploaded_image)
     st.image(image, caption='Uploaded Image', use_column_width=True)

-    # Check if the user clicks a button
     if st.button('Detect Saliency'):
-        # Create a blue background image with the same dimensions as the original image
-        blue_background = np.zeros_like(np.array(image))
-        blue_background[:] = (255, 0, 0)  # Set the background to blue (in BGR format)
-
-        # Preprocess the image
         img = image.resize((384, 288))
-        img = np.array(img) /
+        img = np.array(img) / 100.
         img = np.expand_dims(np.transpose(img, (2, 0, 1)), axis=0)
         img = torch.from_numpy(img)
         img = img.type(torch.FloatTensor).to(device)

-        # Get saliency prediction
         pred_saliency = model(img)

-        # Convert the result back to a PIL image
         toPIL = transforms.ToPILImage()
         pic = toPIL(pred_saliency.squeeze())

-
-        colorized_img = cv2.applyColorMap(np.uint8(pic), cv2.COLORMAP_JET)
+        colorized_img = cv2.applyColorMap(np.uint8(pic), cv2.COLORMAP_OCEAN)

-        # Ensure the colorized image has the same dimensions as the original image
         original_img = np.array(image)
         colorized_img = cv2.resize(colorized_img, (original_img.shape[1], original_img.shape[0]))

-
-
-
-
-
-
-
-        #
+        alpha = 0.7
+        blended_img = cv2.addWeighted(original_img, 1 - alpha, colorized_img, alpha, 0)
+
+        # Find all contours
+        contours, _ = cv2.findContours(np.uint8(pred_saliency.squeeze().detach().numpy() * 255), cv2.RETR_EXTERNAL, cv2.CHAIN_APPROX_SIMPLE)
+        saliency_8bit = np.uint8(pred_saliency.squeeze().detach().numpy() * 255)
+
+        # Apply dilation
+        kernel = np.ones((5,5),np.uint8)
+        dilated = cv2.dilate(saliency_8bit, kernel, iterations = 1)
+
+        # Find contours on dilated image
+        contours, _ = cv2.findContours(dilated, cv2.RETR_EXTERNAL, cv2.CHAIN_APPROX_SIMPLE)
+
         font = cv2.FONT_HERSHEY_SIMPLEX
-
-        for
-
-
-
-
-
-
+        label = 1
+        for contour in contours:
+            # Get bounding box for contour
+            x, y, w, h = cv2.boundingRect(contour)
+
+            # Calculate center of bounding box
+            center_x = x + w // 2
+            center_y = y + h // 2
+
+            # Find point on contour closest to center of bounding box
+            distances = np.sqrt((contour[:,0,0] - center_x)**2 + (contour[:,0,1] - center_y)**2)
+            min_index = np.argmin(distances)
+            closest_point = tuple(contour[min_index][0])
+
+            # Place label at closest point on contour
+            cv2.putText(blended_img, str(label), closest_point, font, 1, (0, 0, 255), 3, cv2.LINE_AA)
+
+            label += 1

-        # Blend the colorized image with the blue background
-        alpha = 0.3  # Adjust the alpha value to control blending strength
-        blended_img = cv2.addWeighted(blue_background, 1 - alpha, colorized_img, alpha, 0)

-        # Display the final result
         st.image(blended_img, caption='Blended Image with Labels', use_column_width=True)

-        # Save the final result
         cv2.imwrite('example/result15.png', blended_img, [int(cv2.IMWRITE_JPEG_QUALITY), 200])
-        st.success('Saliency detection complete. Result saved as "example/result15.png"')
-
-        st.write('Finished, check the result at: example/result15.png')
+        st.success('Saliency detection complete. Result saved as "example/result15.png".')
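For reference, the preprocessing path in this commit can be checked in isolation. A minimal sketch with a stand-in image (the image size and the print statements are illustrative only, not part of the app); PIL's resize takes a (width, height) tuple, so (384, 288) yields a 288 x 384 x 3 array before the transpose:

import numpy as np
import torch
from PIL import Image

image = Image.new('RGB', (640, 480))        # stand-in for the uploaded image
img = image.resize((384, 288))              # PIL resize takes (width, height)
img = np.array(img) / 100.                  # same scaling as the committed code
print(img.shape)                            # (288, 384, 3)  ->  H x W x C
img = np.expand_dims(np.transpose(img, (2, 0, 1)), axis=0)
img = torch.from_numpy(img).type(torch.FloatTensor)
print(img.shape, img.dtype)                 # torch.Size([1, 3, 288, 384]) torch.float32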
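The colormap-and-blend step works the same way outside the app. A rough, self-contained sketch with a synthetic saliency blob (the sizes, the blob, and the variable names are made up for illustration); cv2.addWeighted computes (1 - alpha) * original + alpha * heatmap per pixel, so alpha = 0.7 weights the heatmap more heavily than the photo:

import cv2
import numpy as np

original_img = np.full((480, 640, 3), 128, dtype=np.uint8)    # stand-in photo
saliency_8bit = np.zeros((288, 384), dtype=np.uint8)
cv2.circle(saliency_8bit, (192, 144), 60, 255, -1)            # fake salient blob

heat = cv2.applyColorMap(saliency_8bit, cv2.COLORMAP_OCEAN)   # 3-channel BGR heatmap
heat = cv2.resize(heat, (original_img.shape[1], original_img.shape[0]))

alpha = 0.7
blended = cv2.addWeighted(original_img, 1 - alpha, heat, alpha, 0)
print(blended.shape, blended.dtype)                           # (480, 640, 3) uint8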
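The labeling loop added in this commit boils down to: dilate the 8-bit saliency map, take its external contours, and write an index at the contour vertex nearest each bounding-box center. A standalone sketch on a synthetic mask (assumes OpenCV 4.x, where findContours returns two values; the mask and the output filename are invented for the example):

import cv2
import numpy as np

mask = np.zeros((240, 320), dtype=np.uint8)
cv2.rectangle(mask, (40, 40), (120, 120), 255, -1)     # fake salient region 1
cv2.circle(mask, (230, 160), 40, 255, -1)              # fake salient region 2

kernel = np.ones((5, 5), np.uint8)
dilated = cv2.dilate(mask, kernel, iterations=1)
contours, _ = cv2.findContours(dilated, cv2.RETR_EXTERNAL, cv2.CHAIN_APPROX_SIMPLE)

canvas = cv2.cvtColor(mask, cv2.COLOR_GRAY2BGR)
font = cv2.FONT_HERSHEY_SIMPLEX
for label, contour in enumerate(contours, start=1):
    x, y, w, h = cv2.boundingRect(contour)
    center_x, center_y = x + w // 2, y + h // 2
    # contour has shape (N, 1, 2); pick the vertex closest to the box center
    distances = np.sqrt((contour[:, 0, 0] - center_x) ** 2 + (contour[:, 0, 1] - center_y) ** 2)
    px, py = contour[np.argmin(distances)][0]
    cv2.putText(canvas, str(label), (int(px), int(py)), font, 1, (0, 0, 255), 2, cv2.LINE_AA)

cv2.imwrite('labeled_regions_demo.png', canvas)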