phonghaitran committed
Commit 721557d · 1 Parent(s): 310c1ed

yolov5 design with unet, split into radio buttons for choosing the model

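The commit message refers to the model picker added at the bottom of app.py: the page now shows a radio button for choosing between the UNet and YOLO interfaces and only renders the confirmed choice. A minimal standalone sketch of that Streamlit pattern (run_unet/run_yolo are placeholders standing in for the real yolo()/unet() pages in this commit):

import streamlit as st

def run_unet():
    st.write("UNet segmentation interface")  # placeholder for the real unet() page

def run_yolo():
    st.write("YOLO detection interface")  # placeholder for the real yolo() page

# Remember the confirmed choice across Streamlit reruns
if 'model_selected' not in st.session_state:
    st.session_state.model_selected = None

option = st.radio("Select Model:", ("Unet", "YOLO"))  # radio button for model selection
if st.button("Choose"):                               # confirm the selection
    st.session_state.model_selected = option

# Render only the interface that was confirmed
if st.session_state.model_selected == "Unet":
    run_unet()
elif st.session_state.model_selected == "YOLO":
    run_yolo()
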
.DS_Store CHANGED
Binary files a/.DS_Store and b/.DS_Store differ
 
app.py CHANGED
@@ -1,327 +1,437 @@
 import streamlit as st
 import torch
 import pathlib
-from PIL import Image
 import io
-import numpy as np
 import cv2
 import tempfile
-import pandas as pd

 # Adjust Path for Local Repository
 pathlib.WindowsPath = pathlib.PosixPath

 st.title("YOLO Object Detection Web App")

-# Define the available labels
-default_sub_classes = [
-    "container",
-    "waste-paper",
-    "plant",
-    "transportation",
-    "kitchenware",
-    "rubbish bag",
-    "chair",
-    "wood",
-    "electronics good",
-    "sofa",
-    "scrap metal",
-    "carton",
-    "bag",
-    "tarpaulin",
-    "accessory",
-    "rubble",
-    "table",
-    "board",
-    "mattress",
-    "beverage",
-    "tyre",
-    "nylon",
-    "rack",
-    "styrofoam",
-    "clothes",
-    "toy",
-    "furniture",
-    "trolley",
-    "carpet",
-    "plastic cup"
-]
-
-# Initialize session state for video processing
-if 'video_processed' not in st.session_state:
-    st.session_state.video_processed = False
-    st.session_state.output_video_path = None
-    st.session_state.detections_summary = None
-
-# Cache the model loading to prevent repeated loads
-@st.cache_resource
-def load_model():
-    model = torch.hub.load('./yolov5', 'custom', path='./yolo/best.pt', source='local', force_reload=False)
-    return model

-model = load_model()
-
-# Retrieve model class names
-model_class_names = model.names # Dictionary {index: class_name}
-
-# Function to map class names to indices (case-insensitive)
-def get_class_indices(class_list):
-    indices = []
-    not_found = []
-    for cls in class_list:
-        found = False
-        for index, name in model_class_names.items():
-            if name.lower() == cls.lower():
-                indices.append(index)
-                found = True
-                break
-        if not found:
-            not_found.append(cls)
-    return indices, not_found
-
-# Function to annotate images
-def annotate_image(frame, results):
-    results.render() # Updates results.ims with the annotated images
-    annotated_frame = results.ims[0] # Get the first (and only) image
-    return annotated_frame
-
-# Inform the user about the available labels
-st.markdown("### Available Classes:")
-st.markdown("**" + ", ".join(default_sub_classes + ["rubbish"]) + "**")
-
-# Inform the user about the default detection
-st.info("By default, the application will detect **rubbish** only.")
-
-# User input for classes, separated by commas (optional)
-custom_classes_input = st.text_input(
-    "Enter classes (comma-separated) or type 'all' to detect everything:",
-    ""
-)
-
-# Retrieve all model classes
-all_model_classes = list(model_class_names.values())
-
-# Determine classes to use based on user input
-if custom_classes_input.strip() == "":
-    # No input provided; use only 'rubbish'
-    selected_classes = ['rubbish']
-    st.info("No classes entered. Using default class: **rubbish**.")
-elif custom_classes_input.strip().lower() == "all":
-    # User chose to detect all classes
-    selected_classes = all_model_classes
-    st.info("Detecting **all** available classes.")
-else:
-    # User provided specific classes
-    # Split the input string into a list of classes and remove any extra whitespace
-    input_classes = [cls.strip() for cls in custom_classes_input.split(",") if cls.strip()]
-    # Ensure 'rubbish' is included
-    if 'rubbish' not in [cls.lower() for cls in input_classes]:
-        selected_classes = input_classes + ['rubbish']
-        st.info(f"Detecting the following classes: **{', '.join(selected_classes)}** (Including **rubbish**)")
    else:
-        selected_classes = input_classes
-        st.info(f"Detecting the following classes: **{', '.join(selected_classes)}**")

-# Map selected class names to their indices
-selected_class_indices, not_found_classes = get_class_indices(selected_classes)

-if not_found_classes:
-    st.warning(f"The following classes were not found in the model and will be ignored: **{', '.join(not_found_classes)}**")

-# Proceed only if there are valid classes to detect
-if selected_class_indices:
-    # Set the classes for the model
-    model.classes = selected_class_indices

-    # --------------------- Image Upload and Processing ---------------------
-    st.header("Image Object Detection")

-    uploaded_file = st.file_uploader("Choose an image...", type=["jpg", "jpeg", "png"], key="image_upload")

-    if uploaded_file is not None:
-        try:
-            # Convert the file to a PIL image
-            image = Image.open(uploaded_file).convert('RGB')
-            st.image(image, caption="Uploaded Image", use_column_width=True)
-            st.write("Processing...")

-            # Perform inference
-            results = model(image)
-
-            # Extract DataFrame from results
-            results_df = results.pandas().xyxy[0]
-
-            # Filter results to include only selected classes
-            filtered_results = results_df[results_df['name'].str.lower().isin([cls.lower() for cls in selected_classes])]
-
-            if filtered_results.empty:
-                st.warning("No objects detected for the selected classes.")
-            else:
-                # Display filtered results
-                st.write("### Detection Results")
-                st.dataframe(filtered_results)
-
-                # Annotate the image
-                annotated_image = annotate_image(np.array(image), results)
-
-                # Convert annotated image back to PIL format
-                annotated_pil = Image.fromarray(annotated_image)
-
-                # Display annotated image
-                st.image(annotated_pil, caption="Annotated Image", use_column_width=True)
-
-                # Convert annotated image to bytes
-                img_byte_arr = io.BytesIO()
-                annotated_pil.save(img_byte_arr, format='PNG')
-                img_byte_arr = img_byte_arr.getvalue()
-
-                # Add download button
-                st.download_button(
-                    label="Download Annotated Image",
-                    data=img_byte_arr,
-                    file_name='annotated_image.png',
-                    mime='image/png'
-                )
-        except Exception as e:
-            st.error(f"An error occurred during image processing: {e}")
-
-    # --------------------- Video Upload and Processing ---------------------
-    st.header("Video Object Detection")
-
-    uploaded_video = st.file_uploader("Choose a video...", type=["mp4", "avi", "mov"], key="video_upload")
-
-    if uploaded_video is not None:
-        # Check if the uploaded video is different from the previously processed one
-        # Check if the uploaded video first time
-        if st.session_state.get("uploaded_video_name") is None:
-            st.session_state.uploaded_video_name = uploaded_video.name
-            print("First time uploaded video" +st.session_state.uploaded_video_name)
-        elif st.session_state.uploaded_video_name != uploaded_video.name:
-            st.session_state.uploaded_video_name = uploaded_video.name
-            print("Another time uploaded video" +st.session_state.uploaded_video_name)
            st.session_state.video_processed = False
            st.session_state.output_video_path = None
            st.session_state.detections_summary = None
-            print("New uploaded video")
-
-    # Reset session state if video upload is removed
-    if uploaded_video is None and st.session_state.video_processed:
-        st.session_state.video_processed = False
-        st.session_state.output_video_path = None
-        st.session_state.detections_summary = None
-        st.warning("Video upload has been cleared. You can upload a new video for processing.")

-    if uploaded_video:
-        if not st.session_state.video_processed:
-            try:
-                with st.spinner("Processing video..."):
-                    # Save uploaded video to a temporary file
-                    tfile = tempfile.NamedTemporaryFile(delete=False)
-                    tfile.write(uploaded_video.read())
-                    tfile.close()

-                    # Open the video file
-                    video_cap = cv2.VideoCapture(tfile.name)
-                    stframe = st.empty() # Placeholder for displaying video frames

-                    # Initialize VideoWriter for saving the output video
-                    fourcc = cv2.VideoWriter_fourcc(*'mp4v')
-                    fps = video_cap.get(cv2.CAP_PROP_FPS)
-                    width = int(video_cap.get(cv2.CAP_PROP_FRAME_WIDTH))
-                    height = int(video_cap.get(cv2.CAP_PROP_FRAME_HEIGHT))
-                    output_video_path = tempfile.NamedTemporaryFile(delete=False, suffix='.mp4').name
-                    out = cv2.VideoWriter(output_video_path, fourcc, fps, (width, height))

-                    frame_count = int(video_cap.get(cv2.CAP_PROP_FRAME_COUNT))
-                    progress_bar = st.progress(0)

-                    # Initialize list to collect all detections
-                    all_detections = []

-                    for frame_num in range(frame_count):
-                        ret, frame = video_cap.read() # Read a frame from the video
-                        if not ret:
-                            break

-                        # Convert frame to RGB
-                        frame_rgb = cv2.cvtColor(frame, cv2.COLOR_BGR2RGB)

-                        # Perform inference
-                        results = model(frame_rgb)

-                        # Extract DataFrame from results
-                        results_df = results.pandas().xyxy[0]
-                        results_df['frame_num'] = frame_num # Optional: Add frame number for reference

-                        # Append detections to the list
-                        if not results_df.empty:
-                            all_detections.append(results_df)

-                        # Annotate the frame with detections
-                        annotated_frame = annotate_image(frame_rgb, results)

-                        # Convert annotated frame back to BGR for VideoWriter
-                        annotated_bgr = cv2.cvtColor(annotated_frame, cv2.COLOR_RGB2BGR)

-                        # Write the annotated frame to the output video
-                        out.write(annotated_bgr)

-                        # Display the annotated frame in Streamlit
-                        stframe.image(annotated_frame, channels="RGB", use_column_width=True)

-                        # Update progress bar
-                        progress_percent = (frame_num + 1) / frame_count
-                        progress_bar.progress(progress_percent)

-                    video_cap.release() # Release the video capture object
-                    out.release() # Release the VideoWriter object

-                    # Save processed video path and detections summary to session state
-                    st.session_state.output_video_path = output_video_path

-                    if all_detections:
-                        # Concatenate all detections into a single DataFrame
-                        detections_df = pd.concat(all_detections, ignore_index=True)

-                        # Optional: Group by class name and count detections
-                        detections_summary = detections_df.groupby('name').size().reset_index(name='counts')
-                        st.session_state.detections_summary = detections_summary
-                    else:
-                        st.session_state.detections_summary = None

-                    # Mark video as processed
-                    st.session_state.video_processed = True

-                    # st.session_state.uploaded_video_name = uploaded_video.name

-                    st.success("Video processing complete!")

            except Exception as e:
-                st.error(f"An error occurred during video processing: {e}")

-        # Display download button and detection summary if processed
-        if st.session_state.video_processed:
-            try:
-                # Create a download button for the annotated video
-                with open(st.session_state.output_video_path, "rb") as video_file:
-                    st.download_button(
-                        label="Download Annotated Video",
-                        data=video_file,
-                        file_name="annotated_video.mp4",
-                        mime="video/mp4"
-                    )

-                # Display detection table if there are detections
-                if st.session_state.detections_summary is not None:
-                    detections_summary = st.session_state.detections_summary

-                    st.write("### Detection Summary")
-                    st.dataframe(detections_summary)
-                else:
-                    st.warning("No objects detected in the video for the selected classes.")
-            except Exception as e:
-                st.error(f"An error occurred while preparing the download: {e}")

-# Optionally, display all available classes when 'all' is selected
-if custom_classes_input.strip().lower() == "all":
-    st.info(f"The model is set to detect **all** available classes: {', '.join(all_model_classes)}")

+from PIL import Image, ImageDraw
+
+# Import the model components from unet directory
+from unet.unet_model import UNet
+
 import streamlit as st
+import plotly.express as px
+import pandas as pd
+import numpy as np
+import torchvision.transforms as T
+
 import torch
 import pathlib
 import io
 import cv2
 import tempfile

 # Adjust Path for Local Repository
 pathlib.WindowsPath = pathlib.PosixPath

 st.title("YOLO Object Detection Web App")

+def yolo():
+    st.markdown(
+        "<h1 style='text-align: center; font-size: 36px;'>Smart city rubbish detection</h1>",
+        unsafe_allow_html=True
+    )
+    st.markdown(
+        "<h2 style='text-align: center; font-size: 30px;'>Presented by team 2</h2>",
+        unsafe_allow_html=True
+    )
+
+    # Define the available labels
+    default_sub_classes = [
+        "container",
+        "waste-paper",
+        "plant",
+        "transportation",
+        "kitchenware",
+        "rubbish bag",
+        "chair",
+        "wood",
+        "electronics good",
+        "sofa",
+        "scrap metal",
+        "carton",
+        "bag",
+        "tarpaulin",
+        "accessory",
+        "rubble",
+        "table",
+        "board",
+        "mattress",
+        "beverage",
+        "tyre",
+        "nylon",
+        "rack",
+        "styrofoam",
+        "clothes",
+        "toy",
+        "furniture",
+        "trolley",
+        "carpet",
+        "plastic cup"
+    ]
+
+    # Initialize session state for video processing
+    if 'video_processed' not in st.session_state:
+        st.session_state.video_processed = False
+        st.session_state.output_video_path = None
+        st.session_state.detections_summary = None

+    # Cache the model loading to prevent repeated loads
+    @st.cache_resource
+    def load_model():
+        model = torch.hub.load('./yolov5', 'custom', path='./model/yolo/best.pt', source='local', force_reload=False)
+        return model
+
+    model = load_model()
+
+    # Retrieve model class names
+    model_class_names = model.names # Dictionary {index: class_name}
+
+    # Function to map class names to indices (case-insensitive)
+    def get_class_indices(class_list):
+        indices = []
+        not_found = []
+        for cls in class_list:
+            found = False
+            for index, name in model_class_names.items():
+                if name.lower() == cls.lower():
+                    indices.append(index)
+                    found = True
+                    break
+            if not found:
+                not_found.append(cls)
+        return indices, not_found
+
+    # Function to annotate images
+    def annotate_image(frame, results):
+        results.render() # Updates results.ims with the annotated images
+        annotated_frame = results.ims[0] # Get the first (and only) image
+        return annotated_frame
+
+    # Inform the user about the available labels
+    st.markdown("### Available Classes:")
+    st.markdown("**" + ", ".join(default_sub_classes + ["rubbish"]) + "**")
+
+    # Inform the user about the default detection
+    st.info("By default, the application will detect **rubbish** only.")
+
+    # User input for classes, separated by commas (optional)
+    custom_classes_input = st.text_input(
+        "Enter classes (comma-separated) or type 'all' to detect everything:",
+        ""
+    )
+
+    # Retrieve all model classes
+    all_model_classes = list(model_class_names.values())
+
+    # Determine classes to use based on user input
+    if custom_classes_input.strip() == "":
+        # No input provided; use only 'rubbish'
+        selected_classes = ['rubbish']
+        st.info("No classes entered. Using default class: **rubbish**.")
+    elif custom_classes_input.strip().lower() == "all":
+        # User chose to detect all classes
+        selected_classes = all_model_classes
+        st.info("Detecting **all** available classes.")
    else:
+        # User provided specific classes
+        # Split the input string into a list of classes and remove any extra whitespace
+        input_classes = [cls.strip() for cls in custom_classes_input.split(",") if cls.strip()]
+        # Ensure 'rubbish' is included
+        if 'rubbish' not in [cls.lower() for cls in input_classes]:
+            selected_classes = input_classes + ['rubbish']
+            st.info(f"Detecting the following classes: **{', '.join(selected_classes)}** (Including **rubbish**)")
+        else:
+            selected_classes = input_classes
+            st.info(f"Detecting the following classes: **{', '.join(selected_classes)}**")
+
+    # Map selected class names to their indices
+    selected_class_indices, not_found_classes = get_class_indices(selected_classes)
+
+    if not_found_classes:
+        st.warning(f"The following classes were not found in the model and will be ignored: **{', '.join(not_found_classes)}**")
+
+    # Proceed only if there are valid classes to detect
+    if selected_class_indices:
+        # Set the classes for the model
+        model.classes = selected_class_indices
+
+        # --------------------- Image Upload and Processing ---------------------
+        st.header("Image Object Detection")
+
+        uploaded_file = st.file_uploader("Choose an image...", type=["jpg", "jpeg", "png"], key="image_upload")
+
+        if uploaded_file is not None:
+            try:
+                # Convert the file to a PIL image
+                image = Image.open(uploaded_file).convert('RGB')
+                st.image(image, caption="Uploaded Image", use_column_width=True)
+                st.write("Processing...")
+
+                # Perform inference
+                results = model(image)

+                # Extract DataFrame from results
+                results_df = results.pandas().xyxy[0]

+                # Filter results to include only selected classes
+                filtered_results = results_df[results_df['name'].str.lower().isin([cls.lower() for cls in selected_classes])]

+                if filtered_results.empty:
+                    st.warning("No objects detected for the selected classes.")
+                else:
+                    # Display filtered results
+                    st.write("### Detection Results")
+                    st.dataframe(filtered_results)

+                    # Annotate the image
+                    annotated_image = annotate_image(np.array(image), results)

+                    # Convert annotated image back to PIL format
+                    annotated_pil = Image.fromarray(annotated_image)

+                    # Display annotated image
+                    st.image(annotated_pil, caption="Annotated Image", use_column_width=True)

+                    # Convert annotated image to bytes
+                    img_byte_arr = io.BytesIO()
+                    annotated_pil.save(img_byte_arr, format='PNG')
+                    img_byte_arr = img_byte_arr.getvalue()
+
+                    # Add download button
+                    st.download_button(
+                        label="Download Annotated Image",
+                        data=img_byte_arr,
+                        file_name='annotated_image.png',
+                        mime='image/png'
+                    )
+            except Exception as e:
+                st.error(f"An error occurred during image processing: {e}")
+
+        # --------------------- Video Upload and Processing ---------------------
+        st.header("Video Object Detection")
+
+        uploaded_video = st.file_uploader("Choose a video...", type=["mp4", "avi", "mov"], key="video_upload")
+
+        if uploaded_video is not None:
+            # Check if the uploaded video is different from the previously processed one
+            # Check if the uploaded video first time
+            if st.session_state.get("uploaded_video_name") is None:
+                st.session_state.uploaded_video_name = uploaded_video.name
+                print("First time uploaded video" +st.session_state.uploaded_video_name)
+            elif st.session_state.uploaded_video_name != uploaded_video.name:
+                st.session_state.uploaded_video_name = uploaded_video.name
+                print("Another time uploaded video" +st.session_state.uploaded_video_name)
+                st.session_state.video_processed = False
+                st.session_state.output_video_path = None
+                st.session_state.detections_summary = None
+                print("New uploaded video")
+
+        # Reset session state if video upload is removed
+        if uploaded_video is None and st.session_state.video_processed:
            st.session_state.video_processed = False
            st.session_state.output_video_path = None
            st.session_state.detections_summary = None
+            st.warning("Video upload has been cleared. You can upload a new video for processing.")

+        if uploaded_video:
+            if not st.session_state.video_processed:
+                try:
+                    with st.spinner("Processing video..."):
+                        # Save uploaded video to a temporary file
+                        tfile = tempfile.NamedTemporaryFile(delete=False)
+                        tfile.write(uploaded_video.read())
+                        tfile.close()

+                        # Open the video file
+                        video_cap = cv2.VideoCapture(tfile.name)
+                        stframe = st.empty() # Placeholder for displaying video frames

+                        # Initialize VideoWriter for saving the output video
+                        fourcc = cv2.VideoWriter_fourcc(*'mp4v')
+                        fps = video_cap.get(cv2.CAP_PROP_FPS)
+                        width = int(video_cap.get(cv2.CAP_PROP_FRAME_WIDTH))
+                        height = int(video_cap.get(cv2.CAP_PROP_FRAME_HEIGHT))
+                        output_video_path = tempfile.NamedTemporaryFile(delete=False, suffix='.mp4').name
+                        out = cv2.VideoWriter(output_video_path, fourcc, fps, (width, height))

+                        frame_count = int(video_cap.get(cv2.CAP_PROP_FRAME_COUNT))
+                        progress_bar = st.progress(0)

+                        # Initialize list to collect all detections
+                        all_detections = []

+                        for frame_num in range(frame_count):
+                            ret, frame = video_cap.read() # Read a frame from the video
+                            if not ret:
+                                break

+                            # Convert frame to RGB
+                            frame_rgb = cv2.cvtColor(frame, cv2.COLOR_BGR2RGB)

+                            # Perform inference
+                            results = model(frame_rgb)

+                            # Extract DataFrame from results
+                            results_df = results.pandas().xyxy[0]
+                            results_df['frame_num'] = frame_num # Optional: Add frame number for reference

+                            # Append detections to the list
+                            if not results_df.empty:
+                                all_detections.append(results_df)

+                            # Annotate the frame with detections
+                            annotated_frame = annotate_image(frame_rgb, results)

+                            # Convert annotated frame back to BGR for VideoWriter
+                            annotated_bgr = cv2.cvtColor(annotated_frame, cv2.COLOR_RGB2BGR)

+                            # Write the annotated frame to the output video
+                            out.write(annotated_bgr)

+                            # Display the annotated frame in Streamlit
+                            stframe.image(annotated_frame, channels="RGB", use_column_width=True)

+                            # Update progress bar
+                            progress_percent = (frame_num + 1) / frame_count
+                            progress_bar.progress(progress_percent)

+                        video_cap.release() # Release the video capture object
+                        out.release() # Release the VideoWriter object

+                        # Save processed video path and detections summary to session state
+                        st.session_state.output_video_path = output_video_path

+                        if all_detections:
+                            # Concatenate all detections into a single DataFrame
+                            detections_df = pd.concat(all_detections, ignore_index=True)

+                            # Optional: Group by class name and count detections
+                            detections_summary = detections_df.groupby('name').size().reset_index(name='counts')
+                            st.session_state.detections_summary = detections_summary
+                        else:
+                            st.session_state.detections_summary = None
+
+                        # Mark video as processed
+                        st.session_state.video_processed = True

+                        # st.session_state.uploaded_video_name = uploaded_video.name

+                        st.success("Video processing complete!")

+                except Exception as e:
+                    st.error(f"An error occurred during video processing: {e}")

+            # Display download button and detection summary if processed
+            if st.session_state.video_processed:
+                try:
+                    # Create a download button for the annotated video
+                    with open(st.session_state.output_video_path, "rb") as video_file:
+                        st.download_button(
+                            label="Download Annotated Video",
+                            data=video_file,
+                            file_name="annotated_video.mp4",
+                            mime="video/mp4"
+                        )
+
+                    # Display detection table if there are detections
+                    if st.session_state.detections_summary is not None:
+                        detections_summary = st.session_state.detections_summary
+
+                        st.write("### Detection Summary")
+                        st.dataframe(detections_summary)
+                    else:
+                        st.warning("No objects detected in the video for the selected classes.")
                except Exception as e:
+                    st.error(f"An error occurred while preparing the download: {e}")

+    # Optionally, display all available classes when 'all' is selected
+    if custom_classes_input.strip().lower() == "all":
+        st.info(f"The model is set to detect **all** available classes: {', '.join(all_model_classes)}")
+
+# Unet model training configuration
+
+# Constants
+IMG_SIZE = 128 # Resize dimension for the input image
+
+# Load model function
+@st.cache_resource
+def load_model():
+    model = UNet(n_channels=3, n_classes=32) # Adjust according to your model setup
+    model.load_state_dict(torch.load("/Users/phongporter/Documents/GITHUB/cos40007-team/streamlit_unet/model/unet/checkpoint_epoch5.pth", map_location="cpu", weights_only=True), strict=False)
+    model.eval()
+    return model

+# Function to preprocess the image
+def preprocess_image(image):
+    transform = T.Compose([
+        T.Resize((IMG_SIZE, IMG_SIZE)), # Resize to match model input size
+        T.ToTensor(), # Convert to tensor
+    ])
+    image_tensor = transform(image).unsqueeze(0) # Add batch dimension
+    return image_tensor
+
+# Function to postprocess the model output for display
+def postprocess_mask(mask):
+    # Convert mask to a numpy array and scale to 0-255
+    mask_np = mask.squeeze().cpu().numpy() # Remove batch and channel dimensions
+    mask_np = (mask_np > 0.5).astype(np.uint8) * 255 # Binarize and scale to 0-255
+    return mask_np
+
+def unet():
+    try:
+        # Load the model
+        model = load_model()
+
+        st.markdown(
+            "<h1 style='text-align: center; font-size: 36px;'>Smart city rubbish detection</h1>",
+            unsafe_allow_html=True
+        )
+        st.markdown(
+            "<h2 style='text-align: center; font-size: 30px;'>Presented by team 2</h2>",
+            unsafe_allow_html=True
+        )
+
+        # Display the file upload widget
+        uploaded_file = st.file_uploader("Choose an image...", type=["jpg", "jpeg", "png"])
+        if uploaded_file is not None:
+            # Open and display the uploaded image
+            image = Image.open(uploaded_file).convert("RGB")
+            st.image(image, caption="Uploaded Image", use_column_width=True)

+            # Preprocess the image
+            input_tensor = preprocess_image(image)

+            # Perform inference
+            with torch.no_grad(): # Disable gradient calculation for inference
+                output = model(input_tensor)
+                prediction = torch.sigmoid(output) # Apply sigmoid to get probabilities
+
+            # Post-process the mask for display
+            mask = postprocess_mask(prediction[0, 0]) # Get the mask from the first batch item
+
+            # Display the segmentation mask
+            st.image(mask, caption="Segmentation Mask", use_column_width=True)
+    except Exception as e:
+        st.error(f"An error occurred in Unet: {e}")
+
+# Main page
+if 'model_selected' not in st.session_state:
+    st.session_state.model_selected = None
+
+def main():
+    st.markdown(
+        "<h1 style='text-align: center; font-size: 36px;'>Unet </h1>",
+        unsafe_allow_html=True
+    )
+
+    # Radio button for model selection with consistent casing
+    option = st.radio("Select Model:", ("Unet", "YOLO"))
+
+    # Submit button to confirm selection
+    if st.button("Choose"):
+        st.session_state.model_selected = option
+        st.success(f"Selected Model: {st.session_state.model_selected}")
+
+    # Render the selected model's interface based on session state
+    if st.session_state.model_selected == "Unet":
+        unet()
+    elif st.session_state.model_selected == "YOLO":
+        yolo()
+
+if __name__ == "__main__":
+    main()
model/.DS_Store ADDED
Binary file (6.15 kB).
 
{unet → model/unet}/checkpoint_epoch5.pth RENAMED
File without changes
{yolo → model/yolo}/best.pt RENAMED
File without changes
unet/__init__.py ADDED
@@ -0,0 +1 @@
+from .unet_model import UNet
unet/__pycache__/__init__.cpython-312.pyc ADDED
Binary file (220 Bytes).
 
unet/__pycache__/unet_model.cpython-312.pyc ADDED
Binary file (2.21 kB).
 
unet/__pycache__/unet_parts.cpython-312.pyc ADDED
Binary file (4.46 kB).
 
unet/unet_model.py ADDED
@@ -0,0 +1,36 @@
+""" Full assembly of the parts to form the complete network """
+
+from .unet_parts import *
+
+
+class UNet(nn.Module):
+    def __init__(self, n_channels, n_classes, bilinear=False):
+        super(UNet, self).__init__()
+        self.n_channels = n_channels
+        self.n_classes = n_classes
+        self.bilinear = bilinear
+
+        self.inc = DoubleConv(n_channels, 64)
+        self.down1 = Down(64, 128)
+        self.down2 = Down(128, 256)
+        self.down3 = Down(256, 512)
+        factor = 2 if bilinear else 1
+        self.down4 = Down(512, 1024 // factor)
+        self.up1 = Up(1024, 512 // factor, bilinear)
+        self.up2 = Up(512, 256 // factor, bilinear)
+        self.up3 = Up(256, 128 // factor, bilinear)
+        self.up4 = Up(128, 64, bilinear)
+        self.outc = OutConv(64, n_classes)
+
+    def forward(self, x):
+        x1 = self.inc(x)
+        x2 = self.down1(x1)
+        x3 = self.down2(x2)
+        x4 = self.down3(x3)
+        x5 = self.down4(x4)
+        x = self.up1(x5, x4)
+        x = self.up2(x, x3)
+        x = self.up3(x, x2)
+        x = self.up4(x, x1)
+        logits = self.outc(x)
+        return logits
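For reference, the assembled network above can be exercised on its own. A minimal sketch (assuming the unet package is importable, and reusing the 3-channel, 32-class configuration and 128-pixel input size that app.py uses):

import torch
from unet.unet_model import UNet

net = UNet(n_channels=3, n_classes=32)   # same configuration as load_model() in app.py
net.eval()
with torch.no_grad():
    dummy = torch.randn(1, 3, 128, 128)  # IMG_SIZE = 128, as in preprocess_image()
    logits = net(dummy)
print(logits.shape)                      # expected: torch.Size([1, 32, 128, 128])

Because the final layer is a plain 1x1 convolution with no activation, the output is raw per-class logits at the input resolution; app.py applies torch.sigmoid before thresholding the mask.
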
unet/unet_parts.py ADDED
@@ -0,0 +1,77 @@
+""" Parts of the U-Net model """
+
+import torch
+import torch.nn as nn
+import torch.nn.functional as F
+
+
+class DoubleConv(nn.Module):
+    """(convolution => [BN] => ReLU) * 2"""
+
+    def __init__(self, in_channels, out_channels, mid_channels=None):
+        super().__init__()
+        if not mid_channels:
+            mid_channels = out_channels
+        self.double_conv = nn.Sequential(
+            nn.Conv2d(in_channels, mid_channels, kernel_size=3, padding=1, bias=False),
+            nn.BatchNorm2d(mid_channels),
+            nn.ReLU(inplace=True),
+            nn.Conv2d(mid_channels, out_channels, kernel_size=3, padding=1, bias=False),
+            nn.BatchNorm2d(out_channels),
+            nn.ReLU(inplace=True)
+        )
+
+    def forward(self, x):
+        return self.double_conv(x)
+
+
+class Down(nn.Module):
+    """Downscaling with maxpool then double conv"""
+
+    def __init__(self, in_channels, out_channels):
+        super().__init__()
+        self.maxpool_conv = nn.Sequential(
+            nn.MaxPool2d(2),
+            DoubleConv(in_channels, out_channels)
+        )
+
+    def forward(self, x):
+        return self.maxpool_conv(x)
+
+
+class Up(nn.Module):
+    """Upscaling then double conv"""
+
+    def __init__(self, in_channels, out_channels, bilinear=True):
+        super().__init__()
+
+        # if bilinear, use the normal convolutions to reduce the number of channels
+        if bilinear:
+            self.up = nn.Upsample(scale_factor=2, mode='bilinear', align_corners=True)
+            self.conv = DoubleConv(in_channels, out_channels, in_channels // 2)
+        else:
+            self.up = nn.ConvTranspose2d(in_channels, in_channels // 2, kernel_size=2, stride=2)
+            self.conv = DoubleConv(in_channels, out_channels)
+
+    def forward(self, x1, x2):
+        x1 = self.up(x1)
+        # input is CHW
+        diffY = x2.size()[2] - x1.size()[2]
+        diffX = x2.size()[3] - x1.size()[3]
+
+        x1 = F.pad(x1, [diffX // 2, diffX - diffX // 2,
+                        diffY // 2, diffY - diffY // 2])
+        # if you have padding issues, see
+        # https://github.com/HaiyongJiang/U-Net-Pytorch-Unstructured-Buggy/commit/0e854509c2cea854e247a9c615f175f76fbb2e3a
+        # https://github.com/xiaopeng-liao/Pytorch-UNet/commit/8ebac70e633bac59fc22bb5195e513d5832fb3bd
+        x = torch.cat([x2, x1], dim=1)
+        return self.conv(x)
+
+
+class OutConv(nn.Module):
+    def __init__(self, in_channels, out_channels):
+        super(OutConv, self).__init__()
+        self.conv = nn.Conv2d(in_channels, out_channels, kernel_size=1)
+
+    def forward(self, x):
+        return self.conv(x)