Spaces:

victorgg
/

gemini_2.0_image_gen

Running

App Files Community

victorgg committed on Mar 27

Commit

b2c166c

verified ·

1 Parent(s): 852ed6c

Update app.py

Browse files

Files changed (1) hide show

app.py +14 -31

app.py CHANGED Viewed

@@ -25,8 +25,8 @@ def save_binary_file(file_name, data):
     logger.debug(f"File saved successfully: {file_name}")
-def generate(text, file_name, api_key, model="gemini-2.0-flash-exp-image-generation"):
-    logger.debug(f"Starting generate function with text: '{text}', file_name: '{file_name}', model: '{model}'")
     try:
         # Initialize client
@@ -41,20 +41,10 @@ def generate(text, file_name, api_key, model="gemini-2.0-flash-exp-image-generat
         logger.debug("Gemini client initialized.")
-        files = [
-            client.files.upload(file=file_name),
-        ]
-        logger.debug(f"File uploaded. URI: {files[0].uri}, MIME Type: {files[0].mime_type}")
         contents = [
             types.Content(
                 role="user",
                 parts=[
-                    types.Part.from_uri(
-                        file_uri=files[0].uri,
-                        mime_type=files[0].mime_type,
-                    ),
                     types.Part.from_text(text=text),
                 ],
             ),
@@ -110,23 +100,18 @@ def generate(text, file_name, api_key, model="gemini-2.0-flash-exp-image-generat
         return None # Return None when error happens
-def process_image_and_prompt(composite_pil, prompt, gemini_api_key):
-    logger.debug(f"Starting process_image_and_prompt with prompt: '{prompt}'")
     try:
-        with tempfile.NamedTemporaryFile(suffix=".png", delete=False) as tmp:
-            composite_path = tmp.name
-            composite_pil.save(composite_path)
-            logger.debug(f"Composite image saved to: {composite_path}")
-        file_name = composite_path
         input_text = prompt
         model = "gemini-2.0-flash-exp-image-generation"  #  Consider changing this to "gemini-pro-vision"
-        gemma_edited_image_path = generate(text=input_text, file_name=file_name, api_key=gemini_api_key, model=model)
-        if gemma_edited_image_path: # Check none or not
-            logger.debug(f"Image generated at path: {gemma_edited_image_path}")
-            result_img = Image.open(gemma_edited_image_path)
             if result_img.mode == "RGBA":
                 result_img = result_img.convert("RGB")
             return [result_img]
@@ -135,10 +120,9 @@ def process_image_and_prompt(composite_pil, prompt, gemini_api_key):
             return []  # Return empty when error
     except Exception as e:
-        logger.exception("Error occurred in process_image_and_prompt")
         return []  # Return empty when error
 # --- Gradio Interface ---
 with gr.Blocks() as demo:
     gr.HTML(
@@ -149,17 +133,16 @@ with gr.Blocks() as demo:
         </div>
         <div>
             <h1></h1>
-            <p>ပုံရိပ်တည်းဖြတ်ရန် Gemini</p>
             <p>API Key ကို <a href="https://aistudio.google.com/apikey">ဤနေရာ</a> တွင် ဖန်တီးပါ</p>
         </div>
         </div>
         """
     )
-    gr.Markdown("ပုံတစ်ပုံ တင်ပြီး ပုံကိုတည်းဖြတ်ရန် သင်လိုချင်တာကို ရိုက်ထည့်ပါ။")
     with gr.Row():
         with gr.Column():
-            image_input = gr.Image(type="pil", label="ပုံတင်ရန်", image_mode="RGBA")
             gemini_api_key = gr.Textbox(
                 lines=1,
                 placeholder="Gemini API Key ထည့်ပါ",
@@ -176,8 +159,8 @@ with gr.Blocks() as demo:
             output_gallery = gr.Gallery(label="ထုတ်လုပ်ပြီးရလဒ်များ")
     submit_btn.click(
-        fn=process_image_and_prompt,
-        inputs=[image_input, prompt_input, gemini_api_key],
         outputs=output_gallery,
     )
@@ -185,5 +168,5 @@ try:
     demo.launch(share=True)
 except Exception as e:
     logger.error(f"Failed to launch Gradio app: {e}")
-    print(f"Failed to launch Gradio app: {e}") #Print for debuging in console.

     logger.debug(f"File saved successfully: {file_name}")
+def generate(text, api_key, model="gemini-2.0-flash-exp-image-generation"):
+    logger.debug(f"Starting generate function with text: '{text}', model: '{model}'")
     try:
         # Initialize client
         logger.debug("Gemini client initialized.")
         contents = [
             types.Content(
                 role="user",
                 parts=[
                     types.Part.from_text(text=text),
                 ],
             ),
         return None # Return None when error happens
+def generate_image_from_prompt(prompt, gemini_api_key):
+    logger.debug(f"Starting generate_image_from_prompt with prompt: '{prompt}'")
     try:
         input_text = prompt
         model = "gemini-2.0-flash-exp-image-generation"  #  Consider changing this to "gemini-pro-vision"
+        gemma_generated_image_path = generate(text=input_text, api_key=gemini_api_key, model=model)
+        if gemma_generated_image_path: # Check none or not
+            logger.debug(f"Image generated at path: {gemma_generated_image_path}")
+            result_img = Image.open(gemma_generated_image_path)
             if result_img.mode == "RGBA":
                 result_img = result_img.convert("RGB")
             return [result_img]
             return []  # Return empty when error
     except Exception as e:
+        logger.exception("Error occurred in generate_image_from_prompt")
         return []  # Return empty when error
 # --- Gradio Interface ---
 with gr.Blocks() as demo:
     gr.HTML(
         </div>
         <div>
             <h1></h1>
+            <p>စာသားမှပုံသို့ပြောင်းပါ</p>
             <p>API Key ကို <a href="https://aistudio.google.com/apikey">ဤနေရာ</a> တွင် ဖန်တီးပါ</p>
         </div>
         </div>
         """
     )
+    gr.Markdown("သင်လိုချင်တဲ့ပုံအတွက် စာသား prompt ကိုထည့်ပါ။")
     with gr.Row():
         with gr.Column():
             gemini_api_key = gr.Textbox(
                 lines=1,
                 placeholder="Gemini API Key ထည့်ပါ",
             output_gallery = gr.Gallery(label="ထုတ်လုပ်ပြီးရလဒ်များ")
     submit_btn.click(
+        fn=generate_image_from_prompt,
+        inputs=[prompt_input, gemini_api_key],
         outputs=output_gallery,
     )
     demo.launch(share=True)
 except Exception as e:
     logger.error(f"Failed to launch Gradio app: {e}")
+    print(f"Failed to launch Gradio app: {e}")