alexander-lazarin committed on
Commit
b11f8f0
·
1 Parent(s): 1b0da9b
Files changed (1) hide show
  1. app.py +40 -14
app.py CHANGED
@@ -63,12 +63,13 @@ def get_additional_images(id_product_money: str, marketplace: str) -> List[str]:
63
  with db_conn.connect() as connection:
64
  result = connection.execute(query, {"id_product_money": id_product_money}).first()
65
  if result and result.more_images:
 
66
  paths = json.loads(result.more_images)
67
  return [f"https://a.lmcdn.ru/product{path}" for path in paths]
68
 
69
  elif marketplace == 'wildberries':
70
  query = text("""
71
- select features->'images' as more_images
72
  from public.wb_chrc
73
  where id_product_money = :id_product_money
74
  limit 1
@@ -76,7 +77,17 @@ def get_additional_images(id_product_money: str, marketplace: str) -> List[str]:
76
  with db_conn.connect() as connection:
77
  result = connection.execute(query, {"id_product_money": id_product_money}).first()
78
  if result and result.more_images:
79
- return json.loads(result.more_images)
 
 
 
 
 
 
 
 
 
 
80
 
81
  return []
82
 
@@ -101,7 +112,15 @@ def get_gemini_response(model_name: str, encoded_images: List[Dict], prompt: str
101
  """Get response from a Gemini model."""
102
  try:
103
  model = genai.GenerativeModel(model_name)
104
- response = model.generate_content(encoded_images + [prompt])
 
 
 
 
 
 
 
 
105
  return response.text
106
  except Exception as e:
107
  return f"Error with {model_name}: {str(e)}"
@@ -109,28 +128,35 @@ def get_gemini_response(model_name: str, encoded_images: List[Dict], prompt: str
109
  def process_input(id_product_money: str, prompt: str) -> Tuple[List[str], str, str]:
110
  """Main processing function."""
111
  try:
112
- # Get marketplace and main image
113
  marketplace, main_image = get_marketplace_and_main_image(id_product_money)
 
 
114
 
115
- # Get additional images
116
  additional_images = get_additional_images(id_product_money, marketplace)
 
117
 
118
  # Combine all images
119
  all_image_urls = [main_image] + additional_images
 
120
 
121
- # Download and encode images
122
  encoded_images = download_and_encode_images(all_image_urls)
 
123
 
124
  if not encoded_images:
125
  raise ValueError("No images could be downloaded")
126
 
 
127
  # Get responses from both models
128
- gemini_1_5_response = get_gemini_response("gemini-1.5-pro", encoded_images, prompt)
129
- gemini_2_0_response = get_gemini_response("gemini-pro-vision", encoded_images, prompt)
130
 
131
  return all_image_urls, gemini_1_5_response, gemini_2_0_response
132
 
133
  except Exception as e:
 
134
  return [], f"Error: {str(e)}", f"Error: {str(e)}"
135
 
136
  # Create Gradio interface
@@ -139,20 +165,20 @@ with gr.Blocks() as demo:
139
 
140
  with gr.Row():
141
  id_input = gr.Textbox(label="Product ID (id_product_money)")
142
- prompt_input = gr.Textbox(label="Prompt for VLMs")
143
 
144
  submit_btn = gr.Button("Analyze")
145
 
146
  with gr.Row():
147
- image_gallery = gr.Gallery(label="Product Images")
148
 
149
  with gr.Row():
150
  with gr.Column():
151
- gr.Markdown("### Gemini 1.5 Pro Response")
152
- gemini_1_5_output = gr.Textbox(label="")
153
  with gr.Column():
154
- gr.Markdown("### Gemini Pro Vision Response")
155
- gemini_2_0_output = gr.Textbox(label="")
156
 
157
  submit_btn.click(
158
  fn=process_input,
 
63
  with db_conn.connect() as connection:
64
  result = connection.execute(query, {"id_product_money": id_product_money}).first()
65
  if result and result.more_images:
66
+ print(f"Lamoda raw more_images: {result.more_images}")
67
  paths = json.loads(result.more_images)
68
  return [f"https://a.lmcdn.ru/product{path}" for path in paths]
69
 
70
  elif marketplace == 'wildberries':
71
  query = text("""
72
+ select features->>'images' as more_images
73
  from public.wb_chrc
74
  where id_product_money = :id_product_money
75
  limit 1
 
77
  with db_conn.connect() as connection:
78
  result = connection.execute(query, {"id_product_money": id_product_money}).first()
79
  if result and result.more_images:
80
+ print(f"Wildberries raw more_images: {result.more_images}")
81
+ try:
82
+ urls = json.loads(result.more_images)
83
+ if isinstance(urls, list) and len(urls) > 0:
84
+ # Split the URLs by semicolons
85
+ return urls[0].split(';')
86
+ return []
87
+ except Exception as e:
88
+ print(f"Error parsing JSON: {str(e)}")
89
+ print(f"Type of more_images: {type(result.more_images)}")
90
+ return []
91
 
92
  return []
93
 
 
112
  """Get response from a Gemini model."""
113
  try:
114
  model = genai.GenerativeModel(model_name)
115
+ # Create a list of content parts
116
+ content = []
117
+ # Add each image as a separate content part
118
+ for img in encoded_images:
119
+ content.append(img)
120
+ # Add the prompt as the final content part
121
+ content.append(prompt)
122
+ # Generate response
123
+ response = model.generate_content(content)
124
  return response.text
125
  except Exception as e:
126
  return f"Error with {model_name}: {str(e)}"
 
128
  def process_input(id_product_money: str, prompt: str) -> Tuple[List[str], str, str]:
129
  """Main processing function."""
130
  try:
131
+ print("Getting marketplace and main image...")
132
  marketplace, main_image = get_marketplace_and_main_image(id_product_money)
133
+ print(f"Marketplace: {marketplace}")
134
+ print(f"Main image: {main_image}")
135
 
136
+ print("\nGetting additional images...")
137
  additional_images = get_additional_images(id_product_money, marketplace)
138
+ print(f"Additional images: {additional_images}")
139
 
140
  # Combine all images
141
  all_image_urls = [main_image] + additional_images
142
+ print(f"\nAll image URLs: {all_image_urls}")
143
 
144
+ print("\nDownloading and encoding images...")
145
  encoded_images = download_and_encode_images(all_image_urls)
146
+ print(f"Number of encoded images: {len(encoded_images)}")
147
 
148
  if not encoded_images:
149
  raise ValueError("No images could be downloaded")
150
 
151
+ print("\nGetting Gemini responses...")
152
  # Get responses from both models
153
+ gemini_1_5_response = get_gemini_response("gemini-1.5-flash", encoded_images, prompt)
154
+ gemini_2_0_response = get_gemini_response("gemini-2.0-flash-exp", encoded_images, prompt)
155
 
156
  return all_image_urls, gemini_1_5_response, gemini_2_0_response
157
 
158
  except Exception as e:
159
+ print(f"\nError in process_input: {str(e)}")
160
  return [], f"Error: {str(e)}", f"Error: {str(e)}"
161
 
162
  # Create Gradio interface
 
165
 
166
  with gr.Row():
167
  id_input = gr.Textbox(label="Product ID (id_product_money)")
168
+ prompt_input = gr.Textbox(label="Prompt for VLMs", value="What is this?")
169
 
170
  submit_btn = gr.Button("Analyze")
171
 
172
  with gr.Row():
173
+ image_gallery = gr.Gallery(label="Product Images", show_label=True)
174
 
175
  with gr.Row():
176
  with gr.Column():
177
+ gr.Markdown("### Gemini 1.5 Flash Response")
178
+ gemini_1_5_output = gr.Textbox(label="", show_copy_button=True)
179
  with gr.Column():
180
+ gr.Markdown("### Gemini 2.0 Flash Exp Response")
181
+ gemini_2_0_output = gr.Textbox(label="", show_copy_button=True)
182
 
183
  submit_btn.click(
184
  fn=process_input,