multiview-incontext

Runtime error

App Files Files Community

multimodalart HF Staff commited on Nov 20, 2024

Commit

ce1bf6b

verified ·

1 Parent(s): 6c51e38

Update app.py

Browse files

Files changed (1) hide show

app.py +137 -51

app.py CHANGED Viewed

@@ -3,7 +3,10 @@ import torch
 import spaces
 from diffusers import FluxInpaintPipeline
 from PIL import Image, ImageFile
 ImageFile.LOAD_TRUNCATED_IMAGES = True
 # Initialize the pipeline
@@ -17,60 +20,134 @@ pipe.load_lora_weights(
     weight_name="visual-identity-design.safetensors"
 )
 def square_center_crop(img, target_size=768):
-    if img.mode in ('RGBA', 'P'):
-        img = img.convert('RGB')
-    width, height = img.size
-    crop_size = min(width, height)
-    left = (width - crop_size) // 2
-    top = (height - crop_size) // 2
-    right = left + crop_size
-    bottom = top + crop_size
-    img_cropped = img.crop((left, top, right, bottom))
-    return img_cropped.resize((target_size, target_size), Image.Resampling.LANCZOS)
 def duplicate_horizontally(img):
-    width, height = img.size
-    if width != height:
-        raise ValueError(f"Input image must be square, got {width}x{height}")
-    new_image = Image.new('RGB', (width * 2, height))
-    new_image.paste(img, (0, 0))
-    new_image.paste(img, (width, 0))
-    return new_image
-# Load the mask image
-mask = Image.open("mask_square.png")
 @spaces.GPU
 def generate(image, prompt_user, progress=gr.Progress(track_tqdm=True)):
-    prompt_structure = "The two-panel image showcases the logo of a brand, [LEFT] the left panel is showing the logo [RIGHT] the right panel has this logo applied to "
-    prompt = prompt_structure + prompt_user
-    cropped_image = square_center_crop(image)
-    logo_dupli = duplicate_horizontally(cropped_image)
-    out = pipe(
-        prompt=prompt,
-        image=logo_dupli,
-        mask_image=mask,
-        guidance_scale=6,
-        height=768,
-        width=1536,
-        num_inference_steps=28,
-        max_sequence_length=256,
-        strength=1
-    ).images[0]
-    yield None, out
-    width, height = out.size
-    half_width = width // 2
-    image_2 = out.crop((half_width, 0, width, height))
-    yield image_2, out
 with gr.Blocks() as demo:
     gr.Markdown("# Logo in Context")
     gr.Markdown("### In-Context LoRA + Image-to-Image, apply your logo to anything")
@@ -80,7 +157,8 @@ with gr.Blocks() as demo:
             input_image = gr.Image(
                 label="Upload Logo Image",
                 type="pil",
-                height=384
             )
             prompt_input = gr.Textbox(
                 label="Where should the logo be applied?",
@@ -90,8 +168,15 @@ with gr.Blocks() as demo:
             generate_btn = gr.Button("Generate Application", variant="primary")
         with gr.Column():
-            output_image = gr.Image(label="Generated Application")
-            output_side = gr.Image(label="Side by side")
     with gr.Row():
         gr.Markdown("""
         ### Instructions:
@@ -102,11 +187,12 @@ with gr.Blocks() as demo:
         Note: The generation process might take a few moments.
         """)
-    # Set up the click event
     generate_btn.click(
         fn=generate,
         inputs=[input_image, prompt_input],
-        outputs=[output_image, output_side]
     )
 # Launch the interface

 import spaces
 from diffusers import FluxInpaintPipeline
 from PIL import Image, ImageFile
+import io
+import numpy as np
+# Enable loading of truncated images
 ImageFile.LOAD_TRUNCATED_IMAGES = True
 # Initialize the pipeline
     weight_name="visual-identity-design.safetensors"
 )
+def safe_open_image(image):
+    """Safely open and validate image"""
+    try:
+        if isinstance(image, np.ndarray):
+            # Convert numpy array to PIL Image
+            image = Image.fromarray(image)
+        elif isinstance(image, bytes):
+            # Handle bytes input
+            image = Image.open(io.BytesIO(image))
+        # Ensure the image is in RGB mode
+        if image.mode != 'RGB':
+            image = image.convert('RGB')
+        return image
+    except Exception as e:
+        raise ValueError(f"Error processing input image: {str(e)}")
 def square_center_crop(img, target_size=768):
+    """Improved center crop with additional validation"""
+    try:
+        img = safe_open_image(img)
+        # Ensure minimum size
+        if img.size[0] < 64 or img.size[1] < 64:
+            raise ValueError("Image is too small. Minimum size is 64x64 pixels.")
+        width, height = img.size
+        crop_size = min(width, height)
+        # Calculate crop coordinates
+        left = max(0, (width - crop_size) // 2)
+        top = max(0, (height - crop_size) // 2)
+        right = min(width, left + crop_size)
+        bottom = min(height, top + crop_size)
+        img_cropped = img.crop((left, top, right, bottom))
+        # Use high-quality resizing
+        return img_cropped.resize(
+            (target_size, target_size),
+            Image.Resampling.LANCZOS,
+            reducing_gap=3.0
+        )
+    except Exception as e:
+        raise ValueError(f"Error during image cropping: {str(e)}")
 def duplicate_horizontally(img):
+    """Improved horizontal duplication with validation"""
+    try:
+        width, height = img.size
+        if width != height:
+            raise ValueError(f"Input image must be square, got {width}x{height}")
+        # Create new image with RGB mode explicitly
+        new_image = Image.new('RGB', (width * 2, height))
+        # Ensure the source image is in RGB mode
+        if img.mode != 'RGB':
+            img = img.convert('RGB')
+        new_image.paste(img, (0, 0))
+        new_image.paste(img, (width, 0))
+        return new_image
+    except Exception as e:
+        raise ValueError(f"Error during image duplication: {str(e)}")
+def safe_crop_output(img):
+    """Safely crop the output image"""
+    try:
+        width, height = img.size
+        half_width = width // 2
+        return img.crop((half_width, 0, width, height))
+    except Exception as e:
+        raise ValueError(f"Error cropping output image: {str(e)}")
+# Load the mask image with error handling
+try:
+    mask = Image.open("mask_square.png")
+    if mask.mode != 'RGB':
+        mask = mask.convert('RGB')
+except Exception as e:
+    raise RuntimeError(f"Error loading mask image: {str(e)}")
 @spaces.GPU
 def generate(image, prompt_user, progress=gr.Progress(track_tqdm=True)):
+    """Improved generation function with proper error handling"""
+    try:
+        if image is None:
+            raise ValueError("No input image provided")
+        if not prompt_user or prompt_user.strip() == "":
+            raise ValueError("Please provide a prompt")
+        prompt_structure = "The two-panel image showcases the logo of a brand, [LEFT] the left panel is showing the logo [RIGHT] the right panel has this logo applied to "
+        prompt = prompt_structure + prompt_user
+        # Process input image
+        cropped_image = square_center_crop(image)
+        logo_dupli = duplicate_horizontally(cropped_image)
+        # Generate output
+        out = pipe(
+            prompt=prompt,
+            image=logo_dupli,
+            mask_image=mask,
+            guidance_scale=6,
+            height=768,
+            width=1536,
+            num_inference_steps=28,
+            max_sequence_length=256,
+            strength=1
+        ).images[0]
+        # First yield for progress
+        yield None, out
+        # Process and return final output
+        image_2 = safe_crop_output(out)
+        yield image_2, out
+    except Exception as e:
+        error_message = f"Error during generation: {str(e)}"
+        print(error_message)  # For logging
+        raise gr.Error(error_message)
+# Create the Gradio interface
 with gr.Blocks() as demo:
     gr.Markdown("# Logo in Context")
     gr.Markdown("### In-Context LoRA + Image-to-Image, apply your logo to anything")
             input_image = gr.Image(
                 label="Upload Logo Image",
                 type="pil",
+                height=384,
+                tool=None  # Disable editing tools to prevent corruption
             )
             prompt_input = gr.Textbox(
                 label="Where should the logo be applied?",
             generate_btn = gr.Button("Generate Application", variant="primary")
         with gr.Column():
+            output_image = gr.Image(
+                label="Generated Application",
+                type="pil"
+            )
+            output_side = gr.Image(
+                label="Side by side",
+                type="pil"
+            )
     with gr.Row():
         gr.Markdown("""
         ### Instructions:
         Note: The generation process might take a few moments.
         """)
+    # Set up the click event with error handling
     generate_btn.click(
         fn=generate,
         inputs=[input_image, prompt_input],
+        outputs=[output_image, output_side],
+        api_name="generate"
     )
 # Launch the interface