Spaces:

MLBench
/

ImageRecognition

Running

App Files Files Community

fatima02 committed on Feb 21

Commit

fd7db55

verified ·

1 Parent(s): 2c09e8c

Upload 4 files

Browse files

Files changed (4) hide show

gradio_app.py +267 -0
image_classifier.py +139 -0
pyrightconfig.json +4 -0
requirements.txt +8 -0

gradio_app.py ADDED Viewed

	@@ -0,0 +1,267 @@

+import gradio as gr
+import numpy as np
+import cv2
+from tensorflow.keras.applications import ResNet50
+from tensorflow.keras.applications.resnet50 import preprocess_input
+from tensorflow.keras.preprocessing import image
+from skimage.metrics import structural_similarity as ssim
+import os
+import tempfile
+from PIL import Image
+class ImageCharacterClassifier:
+    def __init__(self, similarity_threshold=0.5):
+        # Initialize ResNet50 model without top classification layer
+        self.model = ResNet50(weights='imagenet', include_top=False, pooling='avg')
+        self.similarity_threshold = similarity_threshold
+    def load_and_preprocess_image(self, image_path, target_size=(224, 224)):
+        # Load and preprocess image for ResNet50
+        img = image.load_img(image_path, target_size=target_size)
+        img_array = image.img_to_array(img)
+        img_array = np.expand_dims(img_array, axis=0)
+        img_array = preprocess_input(img_array)
+        return img_array
+    def extract_features(self, image_path):
+        # Extract deep features using ResNet50
+        preprocessed_img = self.load_and_preprocess_image(image_path)
+        features = self.model.predict(preprocessed_img)
+        return features
+    def calculate_ssim(self, img1_path, img2_path):
+        # Calculate SSIM between two images
+        img1 = cv2.imread(img1_path)
+        img2 = cv2.imread(img2_path)
+        if img1 is None or img2 is None:
+            return 0.0
+        # Convert to grayscale if images are in color
+        if len(img1.shape) == 3:
+            img1 = cv2.cvtColor(img1, cv2.COLOR_BGR2GRAY)
+        if len(img2.shape) == 3:
+            img2 = cv2.cvtColor(img2, cv2.COLOR_BGR2GRAY)
+        # Resize images to same dimensions
+        img2 = cv2.resize(img2, (img1.shape[1], img1.shape[0]))
+        score = ssim(img1, img2)
+        return score
+def process_images(reference_image, comparison_images, similarity_threshold):
+    try:
+        if reference_image is None:
+            return "Please upload a reference image.", []
+        if not comparison_images:
+            return "Please upload comparison images.", []
+        # Create temporary directory for saving uploaded files
+        with tempfile.TemporaryDirectory() as temp_dir:
+            # Initialize classifier with the threshold
+            classifier = ImageCharacterClassifier(similarity_threshold=similarity_threshold)
+            # Save reference image
+            ref_path = os.path.join(temp_dir, "reference.jpg")
+            cv2.imwrite(ref_path, cv2.cvtColor(reference_image, cv2.COLOR_RGB2BGR))
+            results = []
+            html_output = """
+            <div style='text-align: center; margin-bottom: 20px;'>
+                <h2 style='color: #2c3e50;'>Results</h2>
+                <p style='color: #7f8c8d;'>Reference image compared with uploaded images</p>
+            </div>
+            """
+            # Extract reference features once
+            ref_features = classifier.extract_features(ref_path)
+            # Process each comparison image
+            for i, comp_image in enumerate(comparison_images):
+                try:
+                    # Save comparison image
+                    comp_path = os.path.join(temp_dir, f"comparison_{i}.jpg")
+                    try:
+                        # First attempt: Try using PIL
+                        with Image.open(comp_image.name) as img:
+                            img = img.convert('RGB')
+                            img_array = np.array(img)
+                            cv2.imwrite(comp_path, cv2.cvtColor(img_array, cv2.COLOR_RGB2BGR))
+                    except Exception as e1:
+                        print(f"PIL failed: {str(e1)}")
+                        # Second attempt: Try using OpenCV directly
+                        img = cv2.imread(comp_image.name)
+                        if img is not None:
+                            cv2.imwrite(comp_path, img)
+                        else:
+                            raise ValueError(f"Could not read image: {comp_image.name}")
+                    # Calculate SSIM for structural similarity
+                    ssim_score = classifier.calculate_ssim(ref_path, comp_path)
+                    # Extract features for physical feature comparison
+                    comp_features = classifier.extract_features(comp_path)
+                    # Calculate feature differences for physical features
+                    feature_diff = np.abs(ref_features - comp_features)
+                    # Calculate different aspects of similarity
+                    avg_feature_diff = np.mean(feature_diff)
+                    max_feature_diff = np.max(feature_diff)
+                    feature_similarity = np.dot(ref_features.flatten(),
+                                           comp_features.flatten()) / (
+                        np.linalg.norm(ref_features) * np.linalg.norm(comp_features))
+                    # Stricter similarity criteria
+                    is_similar = True  # Start with assumption of similarity
+                    reason = "Images are similar"
+                    # First check for major physical feature differences (like misplaced eyes)
+                    if max_feature_diff > 0.85 or avg_feature_diff > 0.5:
+                        is_similar = False
+                        reason = "Major physical differences detected (missing or misplaced features)"
+                    # Then check for overall structural similarity
+                    elif ssim_score < 0.4:  # Lowered SSIM threshold
+                        is_similar = False
+                        reason = "Overall structure is too different"
+                    # Finally check for feature similarity
+                    elif feature_similarity < 0.5:
+                        is_similar = False
+                        reason = "Features don't match well enough"
+                    # Debug information
+                    print(f"\nDebug for {os.path.basename(comp_image.name)}:")
+                    print(f"SSIM Score: {ssim_score:.3f}")
+                    print(f"Max Feature Difference: {max_feature_diff:.3f}")
+                    print(f"Average Feature Difference: {avg_feature_diff:.3f}")
+                    print(f"Feature Similarity: {feature_similarity:.3f}")
+                    # Create HTML output with improved styling and reason
+                    status_color = "#27ae60" if is_similar else "#c0392b"  # Green or Red
+                    status_text = "SIMILAR" if is_similar else "NOT SIMILAR"
+                    status_icon = "✓" if is_similar else "✗"
+                    html_output += f"""
+                    <div style='
+                        margin: 15px 0;
+                        padding: 15px;
+                        border-radius: 8px;
+                        background-color: {status_color}1a;
+                        border: 2px solid {status_color};
+                        display: flex;
+                        align-items: center;
+                        justify-content: space-between;
+                    '>
+                        <div style='display: flex; align-items: center;'>
+                            <span style='
+                                font-size: 24px;
+                                margin-right: 10px;
+                                color: {status_color};
+                            '>{status_icon}</span>
+                            <div>
+                                <span style='color: #2c3e50; font-weight: bold; display: block;'>
+                                    {os.path.basename(comp_image.name)}
+                                </span>
+                                <span style='color: {status_color}; font-size: 12px;'>
+                                    {reason}
+                                </span>
+                            </div>
+                        </div>
+                        <div style='
+                            color: {status_color};
+                            font-weight: bold;
+                            font-size: 16px;
+                        '>{status_text}</div>
+                    </div>
+                    """
+                    # Read the processed image back for display
+                    display_img = cv2.imread(comp_path)
+                    if display_img is not None:
+                        display_img = cv2.cvtColor(display_img, cv2.COLOR_BGR2RGB)
+                        results.append(display_img)
+                except Exception as e:
+                    print(f"Error processing {comp_image.name}: {str(e)}")
+                    html_output += f"""
+                    <div style='
+                        margin: 15px 0;
+                        padding: 15px;
+                        border-radius: 8px;
+                        background-color: #e74c3c1a;
+                        border: 2px solid #e74c3c;
+                    '>
+                        <h3 style='color: #e74c3c; margin: 0;'>
+                            Error processing: {os.path.basename(comp_image.name)}
+                        </h3>
+                        <p style='color: #e74c3c; margin: 5px 0 0 0;'>{str(e)}</p>
+                    </div>
+                    """
+            return html_output, results
+    except Exception as e:
+        print(f"Main error: {str(e)}")
+        return f"""
+        <div style='
+            padding: 15px;
+            border-radius: 8px;
+            background-color: #e74c3c1a;
+            border: 2px solid #e74c3c;
+        '>
+            <h3 style='color: #e74c3c; margin: 0;'>Error</h3>
+            <p style='color: #e74c3c; margin: 5px 0 0 0;'>{str(e)}</p>
+        </div>
+        """, []
+# Update the interface creation
+def create_interface():
+    with gr.Blocks() as interface:
+        gr.Markdown("# Image Similarity Classifier")
+        gr.Markdown("Upload a reference image and up to 10 comparison images to check similarity.")
+        with gr.Row():
+            with gr.Column():
+                reference_input = gr.Image(
+                    label="Reference Image",
+                    type="numpy",
+                    image_mode="RGB"
+                )
+                comparison_input = gr.File(
+                    label="Comparison Images (Upload up to 10)",
+                    file_count="multiple",
+                    file_types=["image"],
+                    maximum=10
+                )
+                threshold_slider = gr.Slider(
+                    minimum=0.0,
+                    maximum=1.0,
+                    value=0.5,
+                    step=0.05,
+                    label="Similarity Threshold"
+                )
+                submit_button = gr.Button("Compare Images", variant="primary")
+            with gr.Column():
+                output_html = gr.HTML(label="Results")
+                output_gallery = gr.Gallery(
+                    label="Processed Images",
+                    columns=5,
+                    show_label=True,
+                    height="auto"
+                )
+        submit_button.click(
+            fn=process_images,
+            inputs=[reference_input, comparison_input, threshold_slider],
+            outputs=[output_html, output_gallery]
+        )
+    return interface
+# Launch the app: when this file is executed as a script, build the Blocks UI
+# and start the Gradio server. share=True is forwarded to launch(), which asks
+# Gradio for a public share link (see the Gradio launch() documentation).
+if __name__ == "__main__":
+    interface = create_interface()
+    interface.launch(share=True)

image_classifier.py ADDED Viewed

	@@ -0,0 +1,139 @@

+import numpy as np
+import cv2
+from tensorflow.keras.applications import ResNet50
+from tensorflow.keras.applications.resnet50 import preprocess_input
+from tensorflow.keras.preprocessing import image
+from skimage.metrics import structural_similarity as ssim
+import os
+import argparse
+class ImageCharacterClassifier:
+    def __init__(self, similarity_threshold=0.7):
+        # Initialize ResNet50 model without top classification layer
+        self.model = ResNet50(weights='imagenet', include_top=False, pooling='avg')
+        self.similarity_threshold = similarity_threshold
+    def load_and_preprocess_image(self, image_path, target_size=(224, 224)):
+        # Load and preprocess image for ResNet50
+        img = image.load_img(image_path, target_size=target_size)
+        img_array = image.img_to_array(img)
+        img_array = np.expand_dims(img_array, axis=0)
+        img_array = preprocess_input(img_array)
+        return img_array
+    def extract_features(self, image_path):
+        # Extract deep features using ResNet50
+        preprocessed_img = self.load_and_preprocess_image(image_path)
+        features = self.model.predict(preprocessed_img)
+        return features
+    def calculate_ssim(self, img1_path, img2_path):
+        # Calculate SSIM between two images
+        img1 = cv2.imread(img1_path)
+        img2 = cv2.imread(img2_path)
+        # Convert to grayscale if images are in color
+        if len(img1.shape) == 3:
+            img1 = cv2.cvtColor(img1, cv2.COLOR_BGR2GRAY)
+        if len(img2.shape) == 3:
+            img2 = cv2.cvtColor(img2, cv2.COLOR_BGR2GRAY)
+        # Resize images to same dimensions
+        img2 = cv2.resize(img2, (img1.shape[1], img1.shape[0]))
+        score = ssim(img1, img2)
+        return score
+    def classify_images(self, reference_image_path, image_folder_path):
+        # Extract features from reference image
+        reference_features = self.extract_features(reference_image_path)
+        results = []
+        # Process each image in the folder
+        for image_name in os.listdir(image_folder_path):
+            if image_name.lower().endswith(('.png', '.jpg', '.jpeg')):
+                image_path = os.path.join(image_folder_path, image_name)
+                try:
+                    # Calculate SSIM
+                    ssim_score = self.calculate_ssim(reference_image_path, image_path)
+                    # Extract features and calculate similarity
+                    image_features = self.extract_features(image_path)
+                    # Calculate cosine similarity
+                    feature_similarity = np.dot(reference_features.flatten(),
+                                             image_features.flatten()) / (
+                        np.linalg.norm(reference_features) * np.linalg.norm(image_features))
+                    # Give more weight to feature similarity
+                    combined_similarity = (0.3 * ssim_score + 0.7 * feature_similarity)
+                    # Classify based on similarity threshold
+                    is_similar = combined_similarity >= self.similarity_threshold
+                    results.append({
+                        'image_name': image_name,
+                        'ssim_score': ssim_score,
+                        'feature_similarity': feature_similarity,
+                        'combined_similarity': combined_similarity,
+                        'is_similar': is_similar
+                    })
+                except Exception as e:
+                    print(f"Error processing {image_name}: {str(e)}")
+                    continue
+        return results
+def main():
+    # Create argument parser
+    parser = argparse.ArgumentParser(description='Image Character Classification')
+    parser.add_argument('--reference', '-r',
+                       type=str,
+                       required=True,
+                       help='Path to reference image')
+    parser.add_argument('--folder', '-f',
+                       type=str,
+                       required=True,
+                       help='Path to folder containing images to compare')
+    parser.add_argument('--threshold', '-t',
+                       type=float,
+                       default=0.5,  # Lowered the default threshold
+                       help='Similarity threshold (default: 0.5)')
+    # Parse arguments
+    args = parser.parse_args()
+    # Initialize classifier
+    classifier = ImageCharacterClassifier(similarity_threshold=args.threshold)
+    # Check if paths exist
+    if not os.path.exists(args.reference):
+        print(f"Error: Reference image not found at {args.reference}")
+        return
+    if not os.path.exists(args.folder):
+        print(f"Error: Image folder not found at {args.folder}")
+        return
+    # Perform classification
+    results = classifier.classify_images(args.reference, args.folder)
+    # Sort results by similarity score
+    results.sort(key=lambda x: x['combined_similarity'], reverse=True)
+    # Print results
+    print("\nResults sorted by similarity (highest to lowest):")
+    print("-" * 50)
+    for result in results:
+        print(f"\nImage: {result['image_name']}")
+        print(f"SSIM Score: {result['ssim_score']:.3f}")
+        print(f"Feature Similarity: {result['feature_similarity']:.3f}")
+        print(f"Combined Similarity: {result['combined_similarity']:.3f}")
+        print(f"Is Similar: {result['is_similar']}")
+        print("-" * 30)
+# Run the command-line interface only when this file is executed as a script.
+if __name__ == "__main__":
+    main()

pyrightconfig.json ADDED Viewed

	@@ -0,0 +1,4 @@

+{
+    "reportMissingImports": false,
+    "reportGeneralTypeIssues": false
+}

requirements.txt ADDED Viewed

	@@ -0,0 +1,8 @@

+tensorflow==2.10.0
+tensorflow-gpu==2.10.0
+keras==2.10.0
+numpy==1.23.5
+opencv-python==4.7.0.72
+scikit-image==0.19.3
+Pillow==9.3.0
+gradio==3.50.2